diff options
author | Linus Torvalds <torvalds@linux-foundation.org> | 2011-05-25 21:10:16 -0400 |
---|---|---|
committer | Linus Torvalds <torvalds@linux-foundation.org> | 2011-05-25 21:10:16 -0400 |
commit | 14d74e0cab7a7779a7ff0c3863c04c8a8e507106 (patch) | |
tree | 5e27d7495f8f7ce178b637d588ec42bd7b4173d8 | |
parent | 49a78d085fa6b44d6ed791923c7172a6433589c2 (diff) | |
parent | 956c920786694f51601a0ef7ee12956fd6aa216e (diff) |
Merge git://git.kernel.org/pub/scm/linux/kernel/git/ebiederm/linux-2.6-nsfd
* git://git.kernel.org/pub/scm/linux/kernel/git/ebiederm/linux-2.6-nsfd:
net: fix get_net_ns_by_fd for !CONFIG_NET_NS
ns proc: Return -ENOENT for a nonexistent /proc/self/ns/ entry.
ns: Declare sys_setns in syscalls.h
net: Allow setting the network namespace by fd
ns proc: Add support for the ipc namespace
ns proc: Add support for the uts namespace
ns proc: Add support for the network namespace.
ns: Introduce the setns syscall
ns: proc files for namespace naming policy.
-rw-r--r-- | fs/proc/Makefile | 1 | ||||
-rw-r--r-- | fs/proc/base.c | 20 | ||||
-rw-r--r-- | fs/proc/inode.c | 7 | ||||
-rw-r--r-- | fs/proc/internal.h | 18 | ||||
-rw-r--r-- | fs/proc/namespaces.c | 198 | ||||
-rw-r--r-- | include/linux/if_link.h | 1 | ||||
-rw-r--r-- | include/linux/proc_fs.h | 21 | ||||
-rw-r--r-- | include/linux/syscalls.h | 1 | ||||
-rw-r--r-- | include/net/net_namespace.h | 1 | ||||
-rw-r--r-- | ipc/namespace.c | 37 | ||||
-rw-r--r-- | kernel/nsproxy.c | 42 | ||||
-rw-r--r-- | kernel/utsname.c | 39 | ||||
-rw-r--r-- | net/core/net_namespace.c | 65 | ||||
-rw-r--r-- | net/core/rtnetlink.c | 5 |
14 files changed, 444 insertions, 12 deletions
diff --git a/fs/proc/Makefile b/fs/proc/Makefile index df434c5f28fb..c1c729335924 100644 --- a/fs/proc/Makefile +++ b/fs/proc/Makefile | |||
@@ -20,6 +20,7 @@ proc-y += stat.o | |||
20 | proc-y += uptime.o | 20 | proc-y += uptime.o |
21 | proc-y += version.o | 21 | proc-y += version.o |
22 | proc-y += softirqs.o | 22 | proc-y += softirqs.o |
23 | proc-y += namespaces.o | ||
23 | proc-$(CONFIG_PROC_SYSCTL) += proc_sysctl.o | 24 | proc-$(CONFIG_PROC_SYSCTL) += proc_sysctl.o |
24 | proc-$(CONFIG_NET) += proc_net.o | 25 | proc-$(CONFIG_NET) += proc_net.o |
25 | proc-$(CONFIG_PROC_KCORE) += kcore.o | 26 | proc-$(CONFIG_PROC_KCORE) += kcore.o |
diff --git a/fs/proc/base.c b/fs/proc/base.c index dfa532730e55..dc8bca72b002 100644 --- a/fs/proc/base.c +++ b/fs/proc/base.c | |||
@@ -600,7 +600,7 @@ static int proc_fd_access_allowed(struct inode *inode) | |||
600 | return allowed; | 600 | return allowed; |
601 | } | 601 | } |
602 | 602 | ||
603 | static int proc_setattr(struct dentry *dentry, struct iattr *attr) | 603 | int proc_setattr(struct dentry *dentry, struct iattr *attr) |
604 | { | 604 | { |
605 | int error; | 605 | int error; |
606 | struct inode *inode = dentry->d_inode; | 606 | struct inode *inode = dentry->d_inode; |
@@ -1736,8 +1736,7 @@ static int task_dumpable(struct task_struct *task) | |||
1736 | return 0; | 1736 | return 0; |
1737 | } | 1737 | } |
1738 | 1738 | ||
1739 | 1739 | struct inode *proc_pid_make_inode(struct super_block * sb, struct task_struct *task) | |
1740 | static struct inode *proc_pid_make_inode(struct super_block * sb, struct task_struct *task) | ||
1741 | { | 1740 | { |
1742 | struct inode * inode; | 1741 | struct inode * inode; |
1743 | struct proc_inode *ei; | 1742 | struct proc_inode *ei; |
@@ -1779,7 +1778,7 @@ out_unlock: | |||
1779 | return NULL; | 1778 | return NULL; |
1780 | } | 1779 | } |
1781 | 1780 | ||
1782 | static int pid_getattr(struct vfsmount *mnt, struct dentry *dentry, struct kstat *stat) | 1781 | int pid_getattr(struct vfsmount *mnt, struct dentry *dentry, struct kstat *stat) |
1783 | { | 1782 | { |
1784 | struct inode *inode = dentry->d_inode; | 1783 | struct inode *inode = dentry->d_inode; |
1785 | struct task_struct *task; | 1784 | struct task_struct *task; |
@@ -1820,7 +1819,7 @@ static int pid_getattr(struct vfsmount *mnt, struct dentry *dentry, struct kstat | |||
1820 | * made this apply to all per process world readable and executable | 1819 | * made this apply to all per process world readable and executable |
1821 | * directories. | 1820 | * directories. |
1822 | */ | 1821 | */ |
1823 | static int pid_revalidate(struct dentry *dentry, struct nameidata *nd) | 1822 | int pid_revalidate(struct dentry *dentry, struct nameidata *nd) |
1824 | { | 1823 | { |
1825 | struct inode *inode; | 1824 | struct inode *inode; |
1826 | struct task_struct *task; | 1825 | struct task_struct *task; |
@@ -1862,7 +1861,7 @@ static int pid_delete_dentry(const struct dentry * dentry) | |||
1862 | return !proc_pid(dentry->d_inode)->tasks[PIDTYPE_PID].first; | 1861 | return !proc_pid(dentry->d_inode)->tasks[PIDTYPE_PID].first; |
1863 | } | 1862 | } |
1864 | 1863 | ||
1865 | static const struct dentry_operations pid_dentry_operations = | 1864 | const struct dentry_operations pid_dentry_operations = |
1866 | { | 1865 | { |
1867 | .d_revalidate = pid_revalidate, | 1866 | .d_revalidate = pid_revalidate, |
1868 | .d_delete = pid_delete_dentry, | 1867 | .d_delete = pid_delete_dentry, |
@@ -1870,9 +1869,6 @@ static const struct dentry_operations pid_dentry_operations = | |||
1870 | 1869 | ||
1871 | /* Lookups */ | 1870 | /* Lookups */ |
1872 | 1871 | ||
1873 | typedef struct dentry *instantiate_t(struct inode *, struct dentry *, | ||
1874 | struct task_struct *, const void *); | ||
1875 | |||
1876 | /* | 1872 | /* |
1877 | * Fill a directory entry. | 1873 | * Fill a directory entry. |
1878 | * | 1874 | * |
@@ -1885,8 +1881,8 @@ typedef struct dentry *instantiate_t(struct inode *, struct dentry *, | |||
1885 | * reported by readdir in sync with the inode numbers reported | 1881 | * reported by readdir in sync with the inode numbers reported |
1886 | * by stat. | 1882 | * by stat. |
1887 | */ | 1883 | */ |
1888 | static int proc_fill_cache(struct file *filp, void *dirent, filldir_t filldir, | 1884 | int proc_fill_cache(struct file *filp, void *dirent, filldir_t filldir, |
1889 | char *name, int len, | 1885 | const char *name, int len, |
1890 | instantiate_t instantiate, struct task_struct *task, const void *ptr) | 1886 | instantiate_t instantiate, struct task_struct *task, const void *ptr) |
1891 | { | 1887 | { |
1892 | struct dentry *child, *dir = filp->f_path.dentry; | 1888 | struct dentry *child, *dir = filp->f_path.dentry; |
@@ -2820,6 +2816,7 @@ static const struct pid_entry tgid_base_stuff[] = { | |||
2820 | DIR("task", S_IRUGO|S_IXUGO, proc_task_inode_operations, proc_task_operations), | 2816 | DIR("task", S_IRUGO|S_IXUGO, proc_task_inode_operations, proc_task_operations), |
2821 | DIR("fd", S_IRUSR|S_IXUSR, proc_fd_inode_operations, proc_fd_operations), | 2817 | DIR("fd", S_IRUSR|S_IXUSR, proc_fd_inode_operations, proc_fd_operations), |
2822 | DIR("fdinfo", S_IRUSR|S_IXUSR, proc_fdinfo_inode_operations, proc_fdinfo_operations), | 2818 | DIR("fdinfo", S_IRUSR|S_IXUSR, proc_fdinfo_inode_operations, proc_fdinfo_operations), |
2819 | DIR("ns", S_IRUSR|S_IXUGO, proc_ns_dir_inode_operations, proc_ns_dir_operations), | ||
2823 | #ifdef CONFIG_NET | 2820 | #ifdef CONFIG_NET |
2824 | DIR("net", S_IRUGO|S_IXUGO, proc_net_inode_operations, proc_net_operations), | 2821 | DIR("net", S_IRUGO|S_IXUGO, proc_net_inode_operations, proc_net_operations), |
2825 | #endif | 2822 | #endif |
@@ -3168,6 +3165,7 @@ out_no_task: | |||
3168 | static const struct pid_entry tid_base_stuff[] = { | 3165 | static const struct pid_entry tid_base_stuff[] = { |
3169 | DIR("fd", S_IRUSR|S_IXUSR, proc_fd_inode_operations, proc_fd_operations), | 3166 | DIR("fd", S_IRUSR|S_IXUSR, proc_fd_inode_operations, proc_fd_operations), |
3170 | DIR("fdinfo", S_IRUSR|S_IXUSR, proc_fdinfo_inode_operations, proc_fdinfo_operations), | 3167 | DIR("fdinfo", S_IRUSR|S_IXUSR, proc_fdinfo_inode_operations, proc_fdinfo_operations), |
3168 | DIR("ns", S_IRUSR|S_IXUGO, proc_ns_dir_inode_operations, proc_ns_dir_operations), | ||
3171 | REG("environ", S_IRUSR, proc_environ_operations), | 3169 | REG("environ", S_IRUSR, proc_environ_operations), |
3172 | INF("auxv", S_IRUSR, proc_pid_auxv), | 3170 | INF("auxv", S_IRUSR, proc_pid_auxv), |
3173 | ONE("status", S_IRUGO, proc_pid_status), | 3171 | ONE("status", S_IRUGO, proc_pid_status), |
diff --git a/fs/proc/inode.c b/fs/proc/inode.c index d15aa1b1cc8f..74b48cfa1bb2 100644 --- a/fs/proc/inode.c +++ b/fs/proc/inode.c | |||
@@ -28,6 +28,7 @@ static void proc_evict_inode(struct inode *inode) | |||
28 | { | 28 | { |
29 | struct proc_dir_entry *de; | 29 | struct proc_dir_entry *de; |
30 | struct ctl_table_header *head; | 30 | struct ctl_table_header *head; |
31 | const struct proc_ns_operations *ns_ops; | ||
31 | 32 | ||
32 | truncate_inode_pages(&inode->i_data, 0); | 33 | truncate_inode_pages(&inode->i_data, 0); |
33 | end_writeback(inode); | 34 | end_writeback(inode); |
@@ -44,6 +45,10 @@ static void proc_evict_inode(struct inode *inode) | |||
44 | rcu_assign_pointer(PROC_I(inode)->sysctl, NULL); | 45 | rcu_assign_pointer(PROC_I(inode)->sysctl, NULL); |
45 | sysctl_head_put(head); | 46 | sysctl_head_put(head); |
46 | } | 47 | } |
48 | /* Release any associated namespace */ | ||
49 | ns_ops = PROC_I(inode)->ns_ops; | ||
50 | if (ns_ops && ns_ops->put) | ||
51 | ns_ops->put(PROC_I(inode)->ns); | ||
47 | } | 52 | } |
48 | 53 | ||
49 | static struct kmem_cache * proc_inode_cachep; | 54 | static struct kmem_cache * proc_inode_cachep; |
@@ -62,6 +67,8 @@ static struct inode *proc_alloc_inode(struct super_block *sb) | |||
62 | ei->pde = NULL; | 67 | ei->pde = NULL; |
63 | ei->sysctl = NULL; | 68 | ei->sysctl = NULL; |
64 | ei->sysctl_entry = NULL; | 69 | ei->sysctl_entry = NULL; |
70 | ei->ns = NULL; | ||
71 | ei->ns_ops = NULL; | ||
65 | inode = &ei->vfs_inode; | 72 | inode = &ei->vfs_inode; |
66 | inode->i_mtime = inode->i_atime = inode->i_ctime = CURRENT_TIME; | 73 | inode->i_mtime = inode->i_atime = inode->i_ctime = CURRENT_TIME; |
67 | return inode; | 74 | return inode; |
diff --git a/fs/proc/internal.h b/fs/proc/internal.h index 3763b436e69d..7838e5cfec14 100644 --- a/fs/proc/internal.h +++ b/fs/proc/internal.h | |||
@@ -127,3 +127,21 @@ struct inode *proc_get_inode(struct super_block *, struct proc_dir_entry *); | |||
127 | */ | 127 | */ |
128 | int proc_readdir(struct file *, void *, filldir_t); | 128 | int proc_readdir(struct file *, void *, filldir_t); |
129 | struct dentry *proc_lookup(struct inode *, struct dentry *, struct nameidata *); | 129 | struct dentry *proc_lookup(struct inode *, struct dentry *, struct nameidata *); |
130 | |||
131 | |||
132 | |||
133 | /* Lookups */ | ||
134 | typedef struct dentry *instantiate_t(struct inode *, struct dentry *, | ||
135 | struct task_struct *, const void *); | ||
136 | int proc_fill_cache(struct file *filp, void *dirent, filldir_t filldir, | ||
137 | const char *name, int len, | ||
138 | instantiate_t instantiate, struct task_struct *task, const void *ptr); | ||
139 | int pid_revalidate(struct dentry *dentry, struct nameidata *nd); | ||
140 | struct inode *proc_pid_make_inode(struct super_block * sb, struct task_struct *task); | ||
141 | extern const struct dentry_operations pid_dentry_operations; | ||
142 | int pid_getattr(struct vfsmount *mnt, struct dentry *dentry, struct kstat *stat); | ||
143 | int proc_setattr(struct dentry *dentry, struct iattr *attr); | ||
144 | |||
145 | extern const struct inode_operations proc_ns_dir_inode_operations; | ||
146 | extern const struct file_operations proc_ns_dir_operations; | ||
147 | |||
diff --git a/fs/proc/namespaces.c b/fs/proc/namespaces.c new file mode 100644 index 000000000000..781dec5bd682 --- /dev/null +++ b/fs/proc/namespaces.c | |||
@@ -0,0 +1,198 @@ | |||
1 | #include <linux/proc_fs.h> | ||
2 | #include <linux/nsproxy.h> | ||
3 | #include <linux/sched.h> | ||
4 | #include <linux/ptrace.h> | ||
5 | #include <linux/fs_struct.h> | ||
6 | #include <linux/mount.h> | ||
7 | #include <linux/path.h> | ||
8 | #include <linux/namei.h> | ||
9 | #include <linux/file.h> | ||
10 | #include <linux/utsname.h> | ||
11 | #include <net/net_namespace.h> | ||
12 | #include <linux/mnt_namespace.h> | ||
13 | #include <linux/ipc_namespace.h> | ||
14 | #include <linux/pid_namespace.h> | ||
15 | #include "internal.h" | ||
16 | |||
17 | |||
18 | static const struct proc_ns_operations *ns_entries[] = { | ||
19 | #ifdef CONFIG_NET_NS | ||
20 | &netns_operations, | ||
21 | #endif | ||
22 | #ifdef CONFIG_UTS_NS | ||
23 | &utsns_operations, | ||
24 | #endif | ||
25 | #ifdef CONFIG_IPC_NS | ||
26 | &ipcns_operations, | ||
27 | #endif | ||
28 | }; | ||
29 | |||
30 | static const struct file_operations ns_file_operations = { | ||
31 | .llseek = no_llseek, | ||
32 | }; | ||
33 | |||
34 | static struct dentry *proc_ns_instantiate(struct inode *dir, | ||
35 | struct dentry *dentry, struct task_struct *task, const void *ptr) | ||
36 | { | ||
37 | const struct proc_ns_operations *ns_ops = ptr; | ||
38 | struct inode *inode; | ||
39 | struct proc_inode *ei; | ||
40 | struct dentry *error = ERR_PTR(-ENOENT); | ||
41 | |||
42 | inode = proc_pid_make_inode(dir->i_sb, task); | ||
43 | if (!inode) | ||
44 | goto out; | ||
45 | |||
46 | ei = PROC_I(inode); | ||
47 | inode->i_mode = S_IFREG|S_IRUSR; | ||
48 | inode->i_fop = &ns_file_operations; | ||
49 | ei->ns_ops = ns_ops; | ||
50 | ei->ns = ns_ops->get(task); | ||
51 | if (!ei->ns) | ||
52 | goto out_iput; | ||
53 | |||
54 | dentry->d_op = &pid_dentry_operations; | ||
55 | d_add(dentry, inode); | ||
56 | /* Close the race of the process dying before we return the dentry */ | ||
57 | if (pid_revalidate(dentry, NULL)) | ||
58 | error = NULL; | ||
59 | out: | ||
60 | return error; | ||
61 | out_iput: | ||
62 | iput(inode); | ||
63 | goto out; | ||
64 | } | ||
65 | |||
66 | static int proc_ns_fill_cache(struct file *filp, void *dirent, | ||
67 | filldir_t filldir, struct task_struct *task, | ||
68 | const struct proc_ns_operations *ops) | ||
69 | { | ||
70 | return proc_fill_cache(filp, dirent, filldir, | ||
71 | ops->name, strlen(ops->name), | ||
72 | proc_ns_instantiate, task, ops); | ||
73 | } | ||
74 | |||
75 | static int proc_ns_dir_readdir(struct file *filp, void *dirent, | ||
76 | filldir_t filldir) | ||
77 | { | ||
78 | int i; | ||
79 | struct dentry *dentry = filp->f_path.dentry; | ||
80 | struct inode *inode = dentry->d_inode; | ||
81 | struct task_struct *task = get_proc_task(inode); | ||
82 | const struct proc_ns_operations **entry, **last; | ||
83 | ino_t ino; | ||
84 | int ret; | ||
85 | |||
86 | ret = -ENOENT; | ||
87 | if (!task) | ||
88 | goto out_no_task; | ||
89 | |||
90 | ret = -EPERM; | ||
91 | if (!ptrace_may_access(task, PTRACE_MODE_READ)) | ||
92 | goto out; | ||
93 | |||
94 | ret = 0; | ||
95 | i = filp->f_pos; | ||
96 | switch (i) { | ||
97 | case 0: | ||
98 | ino = inode->i_ino; | ||
99 | if (filldir(dirent, ".", 1, i, ino, DT_DIR) < 0) | ||
100 | goto out; | ||
101 | i++; | ||
102 | filp->f_pos++; | ||
103 | /* fall through */ | ||
104 | case 1: | ||
105 | ino = parent_ino(dentry); | ||
106 | if (filldir(dirent, "..", 2, i, ino, DT_DIR) < 0) | ||
107 | goto out; | ||
108 | i++; | ||
109 | filp->f_pos++; | ||
110 | /* fall through */ | ||
111 | default: | ||
112 | i -= 2; | ||
113 | if (i >= ARRAY_SIZE(ns_entries)) { | ||
114 | ret = 1; | ||
115 | goto out; | ||
116 | } | ||
117 | entry = ns_entries + i; | ||
118 | last = &ns_entries[ARRAY_SIZE(ns_entries) - 1]; | ||
119 | while (entry <= last) { | ||
120 | if (proc_ns_fill_cache(filp, dirent, filldir, | ||
121 | task, *entry) < 0) | ||
122 | goto out; | ||
123 | filp->f_pos++; | ||
124 | entry++; | ||
125 | } | ||
126 | } | ||
127 | |||
128 | ret = 1; | ||
129 | out: | ||
130 | put_task_struct(task); | ||
131 | out_no_task: | ||
132 | return ret; | ||
133 | } | ||
134 | |||
135 | const struct file_operations proc_ns_dir_operations = { | ||
136 | .read = generic_read_dir, | ||
137 | .readdir = proc_ns_dir_readdir, | ||
138 | }; | ||
139 | |||
140 | static struct dentry *proc_ns_dir_lookup(struct inode *dir, | ||
141 | struct dentry *dentry, struct nameidata *nd) | ||
142 | { | ||
143 | struct dentry *error; | ||
144 | struct task_struct *task = get_proc_task(dir); | ||
145 | const struct proc_ns_operations **entry, **last; | ||
146 | unsigned int len = dentry->d_name.len; | ||
147 | |||
148 | error = ERR_PTR(-ENOENT); | ||
149 | |||
150 | if (!task) | ||
151 | goto out_no_task; | ||
152 | |||
153 | error = ERR_PTR(-EPERM); | ||
154 | if (!ptrace_may_access(task, PTRACE_MODE_READ)) | ||
155 | goto out; | ||
156 | |||
157 | last = &ns_entries[ARRAY_SIZE(ns_entries) - 1]; | ||
158 | for (entry = ns_entries; entry <= last; entry++) { | ||
159 | if (strlen((*entry)->name) != len) | ||
160 | continue; | ||
161 | if (!memcmp(dentry->d_name.name, (*entry)->name, len)) | ||
162 | break; | ||
163 | } | ||
164 | error = ERR_PTR(-ENOENT); | ||
165 | if (entry > last) | ||
166 | goto out; | ||
167 | |||
168 | error = proc_ns_instantiate(dir, dentry, task, *entry); | ||
169 | out: | ||
170 | put_task_struct(task); | ||
171 | out_no_task: | ||
172 | return error; | ||
173 | } | ||
174 | |||
175 | const struct inode_operations proc_ns_dir_inode_operations = { | ||
176 | .lookup = proc_ns_dir_lookup, | ||
177 | .getattr = pid_getattr, | ||
178 | .setattr = proc_setattr, | ||
179 | }; | ||
180 | |||
181 | struct file *proc_ns_fget(int fd) | ||
182 | { | ||
183 | struct file *file; | ||
184 | |||
185 | file = fget(fd); | ||
186 | if (!file) | ||
187 | return ERR_PTR(-EBADF); | ||
188 | |||
189 | if (file->f_op != &ns_file_operations) | ||
190 | goto out_invalid; | ||
191 | |||
192 | return file; | ||
193 | |||
194 | out_invalid: | ||
195 | fput(file); | ||
196 | return ERR_PTR(-EINVAL); | ||
197 | } | ||
198 | |||
diff --git a/include/linux/if_link.h b/include/linux/if_link.h index f4a2e6b1b864..0ee969a5593d 100644 --- a/include/linux/if_link.h +++ b/include/linux/if_link.h | |||
@@ -136,6 +136,7 @@ enum { | |||
136 | IFLA_PORT_SELF, | 136 | IFLA_PORT_SELF, |
137 | IFLA_AF_SPEC, | 137 | IFLA_AF_SPEC, |
138 | IFLA_GROUP, /* Group the device belongs to */ | 138 | IFLA_GROUP, /* Group the device belongs to */ |
139 | IFLA_NET_NS_FD, | ||
139 | __IFLA_MAX | 140 | __IFLA_MAX |
140 | }; | 141 | }; |
141 | 142 | ||
diff --git a/include/linux/proc_fs.h b/include/linux/proc_fs.h index 3686cd6c9aca..648c9c58add7 100644 --- a/include/linux/proc_fs.h +++ b/include/linux/proc_fs.h | |||
@@ -179,6 +179,8 @@ extern void set_mm_exe_file(struct mm_struct *mm, struct file *new_exe_file); | |||
179 | extern struct file *get_mm_exe_file(struct mm_struct *mm); | 179 | extern struct file *get_mm_exe_file(struct mm_struct *mm); |
180 | extern void dup_mm_exe_file(struct mm_struct *oldmm, struct mm_struct *newmm); | 180 | extern void dup_mm_exe_file(struct mm_struct *oldmm, struct mm_struct *newmm); |
181 | 181 | ||
182 | extern struct file *proc_ns_fget(int fd); | ||
183 | |||
182 | #else | 184 | #else |
183 | 185 | ||
184 | #define proc_net_fops_create(net, name, mode, fops) ({ (void)(mode), NULL; }) | 186 | #define proc_net_fops_create(net, name, mode, fops) ({ (void)(mode), NULL; }) |
@@ -241,6 +243,11 @@ static inline void dup_mm_exe_file(struct mm_struct *oldmm, | |||
241 | struct mm_struct *newmm) | 243 | struct mm_struct *newmm) |
242 | {} | 244 | {} |
243 | 245 | ||
246 | static inline struct file *proc_ns_fget(int fd) | ||
247 | { | ||
248 | return ERR_PTR(-EINVAL); | ||
249 | } | ||
250 | |||
244 | #endif /* CONFIG_PROC_FS */ | 251 | #endif /* CONFIG_PROC_FS */ |
245 | 252 | ||
246 | #if !defined(CONFIG_PROC_KCORE) | 253 | #if !defined(CONFIG_PROC_KCORE) |
@@ -252,6 +259,18 @@ kclist_add(struct kcore_list *new, void *addr, size_t size, int type) | |||
252 | extern void kclist_add(struct kcore_list *, void *, size_t, int type); | 259 | extern void kclist_add(struct kcore_list *, void *, size_t, int type); |
253 | #endif | 260 | #endif |
254 | 261 | ||
262 | struct nsproxy; | ||
263 | struct proc_ns_operations { | ||
264 | const char *name; | ||
265 | int type; | ||
266 | void *(*get)(struct task_struct *task); | ||
267 | void (*put)(void *ns); | ||
268 | int (*install)(struct nsproxy *nsproxy, void *ns); | ||
269 | }; | ||
270 | extern const struct proc_ns_operations netns_operations; | ||
271 | extern const struct proc_ns_operations utsns_operations; | ||
272 | extern const struct proc_ns_operations ipcns_operations; | ||
273 | |||
255 | union proc_op { | 274 | union proc_op { |
256 | int (*proc_get_link)(struct inode *, struct path *); | 275 | int (*proc_get_link)(struct inode *, struct path *); |
257 | int (*proc_read)(struct task_struct *task, char *page); | 276 | int (*proc_read)(struct task_struct *task, char *page); |
@@ -270,6 +289,8 @@ struct proc_inode { | |||
270 | struct proc_dir_entry *pde; | 289 | struct proc_dir_entry *pde; |
271 | struct ctl_table_header *sysctl; | 290 | struct ctl_table_header *sysctl; |
272 | struct ctl_table *sysctl_entry; | 291 | struct ctl_table *sysctl_entry; |
292 | void *ns; | ||
293 | const struct proc_ns_operations *ns_ops; | ||
273 | struct inode vfs_inode; | 294 | struct inode vfs_inode; |
274 | }; | 295 | }; |
275 | 296 | ||
diff --git a/include/linux/syscalls.h b/include/linux/syscalls.h index ab71447d0c5a..8c03b98df5f9 100644 --- a/include/linux/syscalls.h +++ b/include/linux/syscalls.h | |||
@@ -846,4 +846,5 @@ asmlinkage long sys_name_to_handle_at(int dfd, const char __user *name, | |||
846 | asmlinkage long sys_open_by_handle_at(int mountdirfd, | 846 | asmlinkage long sys_open_by_handle_at(int mountdirfd, |
847 | struct file_handle __user *handle, | 847 | struct file_handle __user *handle, |
848 | int flags); | 848 | int flags); |
849 | asmlinkage long sys_setns(int fd, int nstype); | ||
849 | #endif | 850 | #endif |
diff --git a/include/net/net_namespace.h b/include/net/net_namespace.h index 3ae491932bc8..dcc8f5749d3f 100644 --- a/include/net/net_namespace.h +++ b/include/net/net_namespace.h | |||
@@ -119,6 +119,7 @@ static inline struct net *copy_net_ns(unsigned long flags, struct net *net_ns) | |||
119 | extern struct list_head net_namespace_list; | 119 | extern struct list_head net_namespace_list; |
120 | 120 | ||
121 | extern struct net *get_net_ns_by_pid(pid_t pid); | 121 | extern struct net *get_net_ns_by_pid(pid_t pid); |
122 | extern struct net *get_net_ns_by_fd(int pid); | ||
122 | 123 | ||
123 | #ifdef CONFIG_NET_NS | 124 | #ifdef CONFIG_NET_NS |
124 | extern void __put_net(struct net *net); | 125 | extern void __put_net(struct net *net); |
diff --git a/ipc/namespace.c b/ipc/namespace.c index 8054c8e5faf1..ce0a647869b1 100644 --- a/ipc/namespace.c +++ b/ipc/namespace.c | |||
@@ -12,6 +12,7 @@ | |||
12 | #include <linux/fs.h> | 12 | #include <linux/fs.h> |
13 | #include <linux/mount.h> | 13 | #include <linux/mount.h> |
14 | #include <linux/user_namespace.h> | 14 | #include <linux/user_namespace.h> |
15 | #include <linux/proc_fs.h> | ||
15 | 16 | ||
16 | #include "util.h" | 17 | #include "util.h" |
17 | 18 | ||
@@ -140,3 +141,39 @@ void put_ipc_ns(struct ipc_namespace *ns) | |||
140 | free_ipc_ns(ns); | 141 | free_ipc_ns(ns); |
141 | } | 142 | } |
142 | } | 143 | } |
144 | |||
145 | static void *ipcns_get(struct task_struct *task) | ||
146 | { | ||
147 | struct ipc_namespace *ns = NULL; | ||
148 | struct nsproxy *nsproxy; | ||
149 | |||
150 | rcu_read_lock(); | ||
151 | nsproxy = task_nsproxy(task); | ||
152 | if (nsproxy) | ||
153 | ns = get_ipc_ns(nsproxy->ipc_ns); | ||
154 | rcu_read_unlock(); | ||
155 | |||
156 | return ns; | ||
157 | } | ||
158 | |||
159 | static void ipcns_put(void *ns) | ||
160 | { | ||
161 | return put_ipc_ns(ns); | ||
162 | } | ||
163 | |||
164 | static int ipcns_install(struct nsproxy *nsproxy, void *ns) | ||
165 | { | ||
166 | /* Ditch state from the old ipc namespace */ | ||
167 | exit_sem(current); | ||
168 | put_ipc_ns(nsproxy->ipc_ns); | ||
169 | nsproxy->ipc_ns = get_ipc_ns(ns); | ||
170 | return 0; | ||
171 | } | ||
172 | |||
173 | const struct proc_ns_operations ipcns_operations = { | ||
174 | .name = "ipc", | ||
175 | .type = CLONE_NEWIPC, | ||
176 | .get = ipcns_get, | ||
177 | .put = ipcns_put, | ||
178 | .install = ipcns_install, | ||
179 | }; | ||
diff --git a/kernel/nsproxy.c b/kernel/nsproxy.c index a05d191ffdd9..5424e37673ed 100644 --- a/kernel/nsproxy.c +++ b/kernel/nsproxy.c | |||
@@ -22,6 +22,9 @@ | |||
22 | #include <linux/pid_namespace.h> | 22 | #include <linux/pid_namespace.h> |
23 | #include <net/net_namespace.h> | 23 | #include <net/net_namespace.h> |
24 | #include <linux/ipc_namespace.h> | 24 | #include <linux/ipc_namespace.h> |
25 | #include <linux/proc_fs.h> | ||
26 | #include <linux/file.h> | ||
27 | #include <linux/syscalls.h> | ||
25 | 28 | ||
26 | static struct kmem_cache *nsproxy_cachep; | 29 | static struct kmem_cache *nsproxy_cachep; |
27 | 30 | ||
@@ -233,6 +236,45 @@ void exit_task_namespaces(struct task_struct *p) | |||
233 | switch_task_namespaces(p, NULL); | 236 | switch_task_namespaces(p, NULL); |
234 | } | 237 | } |
235 | 238 | ||
239 | SYSCALL_DEFINE2(setns, int, fd, int, nstype) | ||
240 | { | ||
241 | const struct proc_ns_operations *ops; | ||
242 | struct task_struct *tsk = current; | ||
243 | struct nsproxy *new_nsproxy; | ||
244 | struct proc_inode *ei; | ||
245 | struct file *file; | ||
246 | int err; | ||
247 | |||
248 | if (!capable(CAP_SYS_ADMIN)) | ||
249 | return -EPERM; | ||
250 | |||
251 | file = proc_ns_fget(fd); | ||
252 | if (IS_ERR(file)) | ||
253 | return PTR_ERR(file); | ||
254 | |||
255 | err = -EINVAL; | ||
256 | ei = PROC_I(file->f_dentry->d_inode); | ||
257 | ops = ei->ns_ops; | ||
258 | if (nstype && (ops->type != nstype)) | ||
259 | goto out; | ||
260 | |||
261 | new_nsproxy = create_new_namespaces(0, tsk, tsk->fs); | ||
262 | if (IS_ERR(new_nsproxy)) { | ||
263 | err = PTR_ERR(new_nsproxy); | ||
264 | goto out; | ||
265 | } | ||
266 | |||
267 | err = ops->install(new_nsproxy, ei->ns); | ||
268 | if (err) { | ||
269 | free_nsproxy(new_nsproxy); | ||
270 | goto out; | ||
271 | } | ||
272 | switch_task_namespaces(tsk, new_nsproxy); | ||
273 | out: | ||
274 | fput(file); | ||
275 | return err; | ||
276 | } | ||
277 | |||
236 | static int __init nsproxy_cache_init(void) | 278 | static int __init nsproxy_cache_init(void) |
237 | { | 279 | { |
238 | nsproxy_cachep = KMEM_CACHE(nsproxy, SLAB_PANIC); | 280 | nsproxy_cachep = KMEM_CACHE(nsproxy, SLAB_PANIC); |
diff --git a/kernel/utsname.c b/kernel/utsname.c index 44646179eaba..bff131b9510a 100644 --- a/kernel/utsname.c +++ b/kernel/utsname.c | |||
@@ -15,6 +15,7 @@ | |||
15 | #include <linux/err.h> | 15 | #include <linux/err.h> |
16 | #include <linux/slab.h> | 16 | #include <linux/slab.h> |
17 | #include <linux/user_namespace.h> | 17 | #include <linux/user_namespace.h> |
18 | #include <linux/proc_fs.h> | ||
18 | 19 | ||
19 | static struct uts_namespace *create_uts_ns(void) | 20 | static struct uts_namespace *create_uts_ns(void) |
20 | { | 21 | { |
@@ -79,3 +80,41 @@ void free_uts_ns(struct kref *kref) | |||
79 | put_user_ns(ns->user_ns); | 80 | put_user_ns(ns->user_ns); |
80 | kfree(ns); | 81 | kfree(ns); |
81 | } | 82 | } |
83 | |||
84 | static void *utsns_get(struct task_struct *task) | ||
85 | { | ||
86 | struct uts_namespace *ns = NULL; | ||
87 | struct nsproxy *nsproxy; | ||
88 | |||
89 | rcu_read_lock(); | ||
90 | nsproxy = task_nsproxy(task); | ||
91 | if (nsproxy) { | ||
92 | ns = nsproxy->uts_ns; | ||
93 | get_uts_ns(ns); | ||
94 | } | ||
95 | rcu_read_unlock(); | ||
96 | |||
97 | return ns; | ||
98 | } | ||
99 | |||
100 | static void utsns_put(void *ns) | ||
101 | { | ||
102 | put_uts_ns(ns); | ||
103 | } | ||
104 | |||
105 | static int utsns_install(struct nsproxy *nsproxy, void *ns) | ||
106 | { | ||
107 | get_uts_ns(ns); | ||
108 | put_uts_ns(nsproxy->uts_ns); | ||
109 | nsproxy->uts_ns = ns; | ||
110 | return 0; | ||
111 | } | ||
112 | |||
113 | const struct proc_ns_operations utsns_operations = { | ||
114 | .name = "uts", | ||
115 | .type = CLONE_NEWUTS, | ||
116 | .get = utsns_get, | ||
117 | .put = utsns_put, | ||
118 | .install = utsns_install, | ||
119 | }; | ||
120 | |||
diff --git a/net/core/net_namespace.c b/net/core/net_namespace.c index 2e2dce6583e1..6c6b86d0da15 100644 --- a/net/core/net_namespace.c +++ b/net/core/net_namespace.c | |||
@@ -8,6 +8,8 @@ | |||
8 | #include <linux/idr.h> | 8 | #include <linux/idr.h> |
9 | #include <linux/rculist.h> | 9 | #include <linux/rculist.h> |
10 | #include <linux/nsproxy.h> | 10 | #include <linux/nsproxy.h> |
11 | #include <linux/proc_fs.h> | ||
12 | #include <linux/file.h> | ||
11 | #include <net/net_namespace.h> | 13 | #include <net/net_namespace.h> |
12 | #include <net/netns/generic.h> | 14 | #include <net/netns/generic.h> |
13 | 15 | ||
@@ -302,6 +304,28 @@ void __put_net(struct net *net) | |||
302 | } | 304 | } |
303 | EXPORT_SYMBOL_GPL(__put_net); | 305 | EXPORT_SYMBOL_GPL(__put_net); |
304 | 306 | ||
307 | struct net *get_net_ns_by_fd(int fd) | ||
308 | { | ||
309 | struct proc_inode *ei; | ||
310 | struct file *file; | ||
311 | struct net *net; | ||
312 | |||
313 | net = ERR_PTR(-EINVAL); | ||
314 | file = proc_ns_fget(fd); | ||
315 | if (!file) | ||
316 | goto out; | ||
317 | |||
318 | ei = PROC_I(file->f_dentry->d_inode); | ||
319 | if (ei->ns_ops != &netns_operations) | ||
320 | goto out; | ||
321 | |||
322 | net = get_net(ei->ns); | ||
323 | out: | ||
324 | if (file) | ||
325 | fput(file); | ||
326 | return net; | ||
327 | } | ||
328 | |||
305 | #else | 329 | #else |
306 | struct net *copy_net_ns(unsigned long flags, struct net *old_net) | 330 | struct net *copy_net_ns(unsigned long flags, struct net *old_net) |
307 | { | 331 | { |
@@ -309,6 +333,11 @@ struct net *copy_net_ns(unsigned long flags, struct net *old_net) | |||
309 | return ERR_PTR(-EINVAL); | 333 | return ERR_PTR(-EINVAL); |
310 | return old_net; | 334 | return old_net; |
311 | } | 335 | } |
336 | |||
337 | struct net *get_net_ns_by_fd(int fd) | ||
338 | { | ||
339 | return ERR_PTR(-EINVAL); | ||
340 | } | ||
312 | #endif | 341 | #endif |
313 | 342 | ||
314 | struct net *get_net_ns_by_pid(pid_t pid) | 343 | struct net *get_net_ns_by_pid(pid_t pid) |
@@ -561,3 +590,39 @@ void unregister_pernet_device(struct pernet_operations *ops) | |||
561 | mutex_unlock(&net_mutex); | 590 | mutex_unlock(&net_mutex); |
562 | } | 591 | } |
563 | EXPORT_SYMBOL_GPL(unregister_pernet_device); | 592 | EXPORT_SYMBOL_GPL(unregister_pernet_device); |
593 | |||
594 | #ifdef CONFIG_NET_NS | ||
595 | static void *netns_get(struct task_struct *task) | ||
596 | { | ||
597 | struct net *net = NULL; | ||
598 | struct nsproxy *nsproxy; | ||
599 | |||
600 | rcu_read_lock(); | ||
601 | nsproxy = task_nsproxy(task); | ||
602 | if (nsproxy) | ||
603 | net = get_net(nsproxy->net_ns); | ||
604 | rcu_read_unlock(); | ||
605 | |||
606 | return net; | ||
607 | } | ||
608 | |||
609 | static void netns_put(void *ns) | ||
610 | { | ||
611 | put_net(ns); | ||
612 | } | ||
613 | |||
614 | static int netns_install(struct nsproxy *nsproxy, void *ns) | ||
615 | { | ||
616 | put_net(nsproxy->net_ns); | ||
617 | nsproxy->net_ns = get_net(ns); | ||
618 | return 0; | ||
619 | } | ||
620 | |||
621 | const struct proc_ns_operations netns_operations = { | ||
622 | .name = "net", | ||
623 | .type = CLONE_NEWNET, | ||
624 | .get = netns_get, | ||
625 | .put = netns_put, | ||
626 | .install = netns_install, | ||
627 | }; | ||
628 | #endif | ||
diff --git a/net/core/rtnetlink.c b/net/core/rtnetlink.c index 2d56cb9b0b94..abd936d8a716 100644 --- a/net/core/rtnetlink.c +++ b/net/core/rtnetlink.c | |||
@@ -1046,6 +1046,7 @@ const struct nla_policy ifla_policy[IFLA_MAX+1] = { | |||
1046 | [IFLA_LINKMODE] = { .type = NLA_U8 }, | 1046 | [IFLA_LINKMODE] = { .type = NLA_U8 }, |
1047 | [IFLA_LINKINFO] = { .type = NLA_NESTED }, | 1047 | [IFLA_LINKINFO] = { .type = NLA_NESTED }, |
1048 | [IFLA_NET_NS_PID] = { .type = NLA_U32 }, | 1048 | [IFLA_NET_NS_PID] = { .type = NLA_U32 }, |
1049 | [IFLA_NET_NS_FD] = { .type = NLA_U32 }, | ||
1049 | [IFLA_IFALIAS] = { .type = NLA_STRING, .len = IFALIASZ-1 }, | 1050 | [IFLA_IFALIAS] = { .type = NLA_STRING, .len = IFALIASZ-1 }, |
1050 | [IFLA_VFINFO_LIST] = {. type = NLA_NESTED }, | 1051 | [IFLA_VFINFO_LIST] = {. type = NLA_NESTED }, |
1051 | [IFLA_VF_PORTS] = { .type = NLA_NESTED }, | 1052 | [IFLA_VF_PORTS] = { .type = NLA_NESTED }, |
@@ -1094,6 +1095,8 @@ struct net *rtnl_link_get_net(struct net *src_net, struct nlattr *tb[]) | |||
1094 | */ | 1095 | */ |
1095 | if (tb[IFLA_NET_NS_PID]) | 1096 | if (tb[IFLA_NET_NS_PID]) |
1096 | net = get_net_ns_by_pid(nla_get_u32(tb[IFLA_NET_NS_PID])); | 1097 | net = get_net_ns_by_pid(nla_get_u32(tb[IFLA_NET_NS_PID])); |
1098 | else if (tb[IFLA_NET_NS_FD]) | ||
1099 | net = get_net_ns_by_fd(nla_get_u32(tb[IFLA_NET_NS_FD])); | ||
1097 | else | 1100 | else |
1098 | net = get_net(src_net); | 1101 | net = get_net(src_net); |
1099 | return net; | 1102 | return net; |
@@ -1224,7 +1227,7 @@ static int do_setlink(struct net_device *dev, struct ifinfomsg *ifm, | |||
1224 | int send_addr_notify = 0; | 1227 | int send_addr_notify = 0; |
1225 | int err; | 1228 | int err; |
1226 | 1229 | ||
1227 | if (tb[IFLA_NET_NS_PID]) { | 1230 | if (tb[IFLA_NET_NS_PID] || tb[IFLA_NET_NS_FD]) { |
1228 | struct net *net = rtnl_link_get_net(dev_net(dev), tb); | 1231 | struct net *net = rtnl_link_get_net(dev_net(dev), tb); |
1229 | if (IS_ERR(net)) { | 1232 | if (IS_ERR(net)) { |
1230 | err = PTR_ERR(net); | 1233 | err = PTR_ERR(net); |