diff options
author | Al Viro <viro@zeniv.linux.org.uk> | 2014-11-01 10:57:28 -0400 |
---|---|---|
committer | Al Viro <viro@zeniv.linux.org.uk> | 2014-12-10 21:30:20 -0500 |
commit | e149ed2b805fefdccf7ccdfc19eca22fdd4514ac (patch) | |
tree | 8c9cd88deff8c7309ca2acb8d4cb475aaca47b14 /fs/proc | |
parent | f77c80142e1afe6d5c16975ca5d7d1fc324b16f9 (diff) |
take the targets of /proc/*/ns/* symlinks to separate fs
New pseudo-filesystem: nsfs. Targets of /proc/*/ns/* live there now.
It's not mountable (not even registered, so it's not in /proc/filesystems,
etc.). Files on it *are* bindable - we explicitly permit that in do_loopback().
This stuff lives in fs/nsfs.c now; proc_ns_fget() moved there as well.
get_proc_ns() is a macro now (it simply returns ->i_private; it would
have been an inline function, if not for a header-ordering headache).
proc_ns_inode() is an ex-parrot. The interface used in procfs is
ns_get_path(path, task, ops) and ns_get_name(buf, size, task, ops).
Dentries and inodes are never hashed; a non-counting reference to the dentry
is stashed in ns_common (removed by ->d_prune()) and reused by ns_get_path()
if present. See ns_get_path()/ns_prune_dentry()/nsfs_evict() for details
of that mechanism.
As a result, proc_ns_follow_link() has stopped poking in nd->path.mnt;
it does nd_jump_link() on a consistent <vfsmount,dentry> pair it gets
from ns_get_path().
Signed-off-by: Al Viro <viro@zeniv.linux.org.uk>
Diffstat (limited to 'fs/proc')
-rw-r--r-- | fs/proc/inode.c | 5 | ||||
-rw-r--r-- | fs/proc/namespaces.c | 152 |
2 files changed, 13 insertions, 144 deletions
diff --git a/fs/proc/inode.c b/fs/proc/inode.c index a212996e0987..57a9be9a6668 100644 --- a/fs/proc/inode.c +++ b/fs/proc/inode.c | |||
@@ -32,7 +32,6 @@ static void proc_evict_inode(struct inode *inode) | |||
32 | { | 32 | { |
33 | struct proc_dir_entry *de; | 33 | struct proc_dir_entry *de; |
34 | struct ctl_table_header *head; | 34 | struct ctl_table_header *head; |
35 | struct ns_common *ns; | ||
36 | 35 | ||
37 | truncate_inode_pages_final(&inode->i_data); | 36 | truncate_inode_pages_final(&inode->i_data); |
38 | clear_inode(inode); | 37 | clear_inode(inode); |
@@ -49,10 +48,6 @@ static void proc_evict_inode(struct inode *inode) | |||
49 | RCU_INIT_POINTER(PROC_I(inode)->sysctl, NULL); | 48 | RCU_INIT_POINTER(PROC_I(inode)->sysctl, NULL); |
50 | sysctl_head_put(head); | 49 | sysctl_head_put(head); |
51 | } | 50 | } |
52 | /* Release any associated namespace */ | ||
53 | ns = PROC_I(inode)->ns.ns; | ||
54 | if (ns && ns->ops) | ||
55 | ns->ops->put(ns); | ||
56 | } | 51 | } |
57 | 52 | ||
58 | static struct kmem_cache * proc_inode_cachep; | 53 | static struct kmem_cache * proc_inode_cachep; |
diff --git a/fs/proc/namespaces.c b/fs/proc/namespaces.c index 18fc1cf899de..aaaac77abad0 100644 --- a/fs/proc/namespaces.c +++ b/fs/proc/namespaces.c | |||
@@ -1,10 +1,6 @@ | |||
1 | #include <linux/proc_fs.h> | 1 | #include <linux/proc_fs.h> |
2 | #include <linux/nsproxy.h> | 2 | #include <linux/nsproxy.h> |
3 | #include <linux/sched.h> | ||
4 | #include <linux/ptrace.h> | 3 | #include <linux/ptrace.h> |
5 | #include <linux/fs_struct.h> | ||
6 | #include <linux/mount.h> | ||
7 | #include <linux/path.h> | ||
8 | #include <linux/namei.h> | 4 | #include <linux/namei.h> |
9 | #include <linux/file.h> | 5 | #include <linux/file.h> |
10 | #include <linux/utsname.h> | 6 | #include <linux/utsname.h> |
@@ -34,139 +30,45 @@ static const struct proc_ns_operations *ns_entries[] = { | |||
34 | &mntns_operations, | 30 | &mntns_operations, |
35 | }; | 31 | }; |
36 | 32 | ||
37 | static const struct file_operations ns_file_operations = { | ||
38 | .llseek = no_llseek, | ||
39 | }; | ||
40 | |||
41 | static const struct inode_operations ns_inode_operations = { | ||
42 | .setattr = proc_setattr, | ||
43 | }; | ||
44 | |||
45 | static char *ns_dname(struct dentry *dentry, char *buffer, int buflen) | ||
46 | { | ||
47 | struct inode *inode = dentry->d_inode; | ||
48 | const struct proc_ns_operations *ns_ops = dentry->d_fsdata; | ||
49 | |||
50 | return dynamic_dname(dentry, buffer, buflen, "%s:[%lu]", | ||
51 | ns_ops->name, inode->i_ino); | ||
52 | } | ||
53 | |||
54 | const struct dentry_operations ns_dentry_operations = | ||
55 | { | ||
56 | .d_delete = always_delete_dentry, | ||
57 | .d_dname = ns_dname, | ||
58 | }; | ||
59 | |||
60 | static struct dentry *proc_ns_get_dentry(struct super_block *sb, | ||
61 | struct task_struct *task, const struct proc_ns_operations *ns_ops) | ||
62 | { | ||
63 | struct dentry *dentry, *result; | ||
64 | struct inode *inode; | ||
65 | struct proc_inode *ei; | ||
66 | struct qstr qname = { .name = "", }; | ||
67 | struct ns_common *ns; | ||
68 | |||
69 | ns = ns_ops->get(task); | ||
70 | if (!ns) | ||
71 | return ERR_PTR(-ENOENT); | ||
72 | |||
73 | dentry = d_alloc_pseudo(sb, &qname); | ||
74 | if (!dentry) { | ||
75 | ns_ops->put(ns); | ||
76 | return ERR_PTR(-ENOMEM); | ||
77 | } | ||
78 | dentry->d_fsdata = (void *)ns_ops; | ||
79 | |||
80 | inode = iget_locked(sb, ns->inum); | ||
81 | if (!inode) { | ||
82 | dput(dentry); | ||
83 | ns_ops->put(ns); | ||
84 | return ERR_PTR(-ENOMEM); | ||
85 | } | ||
86 | |||
87 | ei = PROC_I(inode); | ||
88 | if (inode->i_state & I_NEW) { | ||
89 | inode->i_mtime = inode->i_atime = inode->i_ctime = CURRENT_TIME; | ||
90 | inode->i_op = &ns_inode_operations; | ||
91 | inode->i_mode = S_IFREG | S_IRUGO; | ||
92 | inode->i_fop = &ns_file_operations; | ||
93 | ei->ns.ns_ops = ns_ops; | ||
94 | ei->ns.ns = ns; | ||
95 | unlock_new_inode(inode); | ||
96 | } else { | ||
97 | ns_ops->put(ns); | ||
98 | } | ||
99 | |||
100 | d_set_d_op(dentry, &ns_dentry_operations); | ||
101 | result = d_instantiate_unique(dentry, inode); | ||
102 | if (result) { | ||
103 | dput(dentry); | ||
104 | dentry = result; | ||
105 | } | ||
106 | |||
107 | return dentry; | ||
108 | } | ||
109 | |||
110 | static void *proc_ns_follow_link(struct dentry *dentry, struct nameidata *nd) | 33 | static void *proc_ns_follow_link(struct dentry *dentry, struct nameidata *nd) |
111 | { | 34 | { |
112 | struct inode *inode = dentry->d_inode; | 35 | struct inode *inode = dentry->d_inode; |
113 | struct super_block *sb = inode->i_sb; | 36 | const struct proc_ns_operations *ns_ops = PROC_I(inode)->ns.ns_ops; |
114 | struct proc_inode *ei = PROC_I(inode); | ||
115 | struct task_struct *task; | 37 | struct task_struct *task; |
116 | struct path ns_path; | 38 | struct path ns_path; |
117 | void *error = ERR_PTR(-EACCES); | 39 | void *error = ERR_PTR(-EACCES); |
118 | 40 | ||
119 | task = get_proc_task(inode); | 41 | task = get_proc_task(inode); |
120 | if (!task) | 42 | if (!task) |
121 | goto out; | 43 | return error; |
122 | 44 | ||
123 | if (!ptrace_may_access(task, PTRACE_MODE_READ)) | 45 | if (ptrace_may_access(task, PTRACE_MODE_READ)) { |
124 | goto out_put_task; | 46 | error = ns_get_path(&ns_path, task, ns_ops); |
125 | 47 | if (!error) | |
126 | ns_path.dentry = proc_ns_get_dentry(sb, task, ei->ns.ns_ops); | 48 | nd_jump_link(nd, &ns_path); |
127 | if (IS_ERR(ns_path.dentry)) { | ||
128 | error = ERR_CAST(ns_path.dentry); | ||
129 | goto out_put_task; | ||
130 | } | 49 | } |
131 | |||
132 | ns_path.mnt = mntget(nd->path.mnt); | ||
133 | nd_jump_link(nd, &ns_path); | ||
134 | error = NULL; | ||
135 | |||
136 | out_put_task: | ||
137 | put_task_struct(task); | 50 | put_task_struct(task); |
138 | out: | ||
139 | return error; | 51 | return error; |
140 | } | 52 | } |
141 | 53 | ||
142 | static int proc_ns_readlink(struct dentry *dentry, char __user *buffer, int buflen) | 54 | static int proc_ns_readlink(struct dentry *dentry, char __user *buffer, int buflen) |
143 | { | 55 | { |
144 | struct inode *inode = dentry->d_inode; | 56 | struct inode *inode = dentry->d_inode; |
145 | struct proc_inode *ei = PROC_I(inode); | 57 | const struct proc_ns_operations *ns_ops = PROC_I(inode)->ns.ns_ops; |
146 | const struct proc_ns_operations *ns_ops = ei->ns.ns_ops; | ||
147 | struct task_struct *task; | 58 | struct task_struct *task; |
148 | struct ns_common *ns; | ||
149 | char name[50]; | 59 | char name[50]; |
150 | int res = -EACCES; | 60 | int res = -EACCES; |
151 | 61 | ||
152 | task = get_proc_task(inode); | 62 | task = get_proc_task(inode); |
153 | if (!task) | 63 | if (!task) |
154 | goto out; | 64 | return res; |
155 | |||
156 | if (!ptrace_may_access(task, PTRACE_MODE_READ)) | ||
157 | goto out_put_task; | ||
158 | 65 | ||
159 | res = -ENOENT; | 66 | if (ptrace_may_access(task, PTRACE_MODE_READ)) { |
160 | ns = ns_ops->get(task); | 67 | res = ns_get_name(name, sizeof(name), task, ns_ops); |
161 | if (!ns) | 68 | if (res >= 0) |
162 | goto out_put_task; | 69 | res = readlink_copy(buffer, buflen, name); |
163 | 70 | } | |
164 | snprintf(name, sizeof(name), "%s:[%u]", ns_ops->name, ns->inum); | ||
165 | res = readlink_copy(buffer, buflen, name); | ||
166 | ns_ops->put(ns); | ||
167 | out_put_task: | ||
168 | put_task_struct(task); | 71 | put_task_struct(task); |
169 | out: | ||
170 | return res; | 72 | return res; |
171 | } | 73 | } |
172 | 74 | ||
@@ -268,31 +170,3 @@ const struct inode_operations proc_ns_dir_inode_operations = { | |||
268 | .getattr = pid_getattr, | 170 | .getattr = pid_getattr, |
269 | .setattr = proc_setattr, | 171 | .setattr = proc_setattr, |
270 | }; | 172 | }; |
271 | |||
272 | struct file *proc_ns_fget(int fd) | ||
273 | { | ||
274 | struct file *file; | ||
275 | |||
276 | file = fget(fd); | ||
277 | if (!file) | ||
278 | return ERR_PTR(-EBADF); | ||
279 | |||
280 | if (file->f_op != &ns_file_operations) | ||
281 | goto out_invalid; | ||
282 | |||
283 | return file; | ||
284 | |||
285 | out_invalid: | ||
286 | fput(file); | ||
287 | return ERR_PTR(-EINVAL); | ||
288 | } | ||
289 | |||
290 | struct ns_common *get_proc_ns(struct inode *inode) | ||
291 | { | ||
292 | return PROC_I(inode)->ns.ns; | ||
293 | } | ||
294 | |||
295 | bool proc_ns_inode(struct inode *inode) | ||
296 | { | ||
297 | return inode->i_fop == &ns_file_operations; | ||
298 | } | ||