diff options
-rw-r--r-- | include/linux/init_task.h | 2 | ||||
-rw-r--r-- | include/linux/nsproxy.h | 1 | ||||
-rw-r--r-- | include/linux/sched.h | 3 | ||||
-rw-r--r-- | include/linux/user_namespace.h | 57 | ||||
-rw-r--r-- | init/Kconfig | 9 | ||||
-rw-r--r-- | kernel/Makefile | 2 | ||||
-rw-r--r-- | kernel/fork.c | 2 | ||||
-rw-r--r-- | kernel/nsproxy.c | 9 | ||||
-rw-r--r-- | kernel/sys.c | 5 | ||||
-rw-r--r-- | kernel/user.c | 18 | ||||
-rw-r--r-- | kernel/user_namespace.c | 43 |
11 files changed, 137 insertions, 14 deletions
diff --git a/include/linux/init_task.h b/include/linux/init_task.h index 276ccaa2670c..cab741c2d603 100644 --- a/include/linux/init_task.h +++ b/include/linux/init_task.h | |||
@@ -8,6 +8,7 @@ | |||
8 | #include <linux/lockdep.h> | 8 | #include <linux/lockdep.h> |
9 | #include <linux/ipc.h> | 9 | #include <linux/ipc.h> |
10 | #include <linux/pid_namespace.h> | 10 | #include <linux/pid_namespace.h> |
11 | #include <linux/user_namespace.h> | ||
11 | 12 | ||
12 | #define INIT_FDTABLE \ | 13 | #define INIT_FDTABLE \ |
13 | { \ | 14 | { \ |
@@ -78,6 +79,7 @@ extern struct nsproxy init_nsproxy; | |||
78 | .uts_ns = &init_uts_ns, \ | 79 | .uts_ns = &init_uts_ns, \ |
79 | .mnt_ns = NULL, \ | 80 | .mnt_ns = NULL, \ |
80 | INIT_IPC_NS(ipc_ns) \ | 81 | INIT_IPC_NS(ipc_ns) \ |
82 | .user_ns = &init_user_ns, \ | ||
81 | } | 83 | } |
82 | 84 | ||
83 | #define INIT_SIGHAND(sighand) { \ | 85 | #define INIT_SIGHAND(sighand) { \ |
diff --git a/include/linux/nsproxy.h b/include/linux/nsproxy.h index 189e0dc993ab..6d179a397bfb 100644 --- a/include/linux/nsproxy.h +++ b/include/linux/nsproxy.h | |||
@@ -28,6 +28,7 @@ struct nsproxy { | |||
28 | struct ipc_namespace *ipc_ns; | 28 | struct ipc_namespace *ipc_ns; |
29 | struct mnt_namespace *mnt_ns; | 29 | struct mnt_namespace *mnt_ns; |
30 | struct pid_namespace *pid_ns; | 30 | struct pid_namespace *pid_ns; |
31 | struct user_namespace *user_ns; | ||
31 | }; | 32 | }; |
32 | extern struct nsproxy init_nsproxy; | 33 | extern struct nsproxy init_nsproxy; |
33 | 34 | ||
diff --git a/include/linux/sched.h b/include/linux/sched.h index b579624477f4..c667255d70db 100644 --- a/include/linux/sched.h +++ b/include/linux/sched.h | |||
@@ -287,6 +287,7 @@ extern signed long schedule_timeout_uninterruptible(signed long timeout); | |||
287 | asmlinkage void schedule(void); | 287 | asmlinkage void schedule(void); |
288 | 288 | ||
289 | struct nsproxy; | 289 | struct nsproxy; |
290 | struct user_namespace; | ||
290 | 291 | ||
291 | /* Maximum number of active map areas.. This is a random (large) number */ | 292 | /* Maximum number of active map areas.. This is a random (large) number */ |
292 | #define DEFAULT_MAX_MAP_COUNT 65536 | 293 | #define DEFAULT_MAX_MAP_COUNT 65536 |
@@ -1408,7 +1409,7 @@ extern struct task_struct *find_task_by_pid_type(int type, int pid); | |||
1408 | extern void __set_special_pids(pid_t session, pid_t pgrp); | 1409 | extern void __set_special_pids(pid_t session, pid_t pgrp); |
1409 | 1410 | ||
1410 | /* per-UID process charging. */ | 1411 | /* per-UID process charging. */ |
1411 | extern struct user_struct * alloc_uid(uid_t); | 1412 | extern struct user_struct * alloc_uid(struct user_namespace *, uid_t); |
1412 | static inline struct user_struct *get_uid(struct user_struct *u) | 1413 | static inline struct user_struct *get_uid(struct user_struct *u) |
1413 | { | 1414 | { |
1414 | atomic_inc(&u->__count); | 1415 | atomic_inc(&u->__count); |
diff --git a/include/linux/user_namespace.h b/include/linux/user_namespace.h new file mode 100644 index 000000000000..92a45867ecfb --- /dev/null +++ b/include/linux/user_namespace.h | |||
@@ -0,0 +1,57 @@ | |||
1 | #ifndef _LINUX_USER_NAMESPACE_H | ||
2 | #define _LINUX_USER_NAMESPACE_H | ||
3 | |||
4 | #include <linux/kref.h> | ||
5 | #include <linux/nsproxy.h> | ||
6 | #include <linux/sched.h> | ||
7 | |||
8 | #define UIDHASH_BITS (CONFIG_BASE_SMALL ? 3 : 8) | ||
9 | #define UIDHASH_SZ (1 << UIDHASH_BITS) | ||
10 | |||
11 | struct user_namespace { | ||
12 | struct kref kref; | ||
13 | struct list_head uidhash_table[UIDHASH_SZ]; | ||
14 | struct user_struct *root_user; | ||
15 | }; | ||
16 | |||
17 | extern struct user_namespace init_user_ns; | ||
18 | |||
19 | #ifdef CONFIG_USER_NS | ||
20 | |||
21 | static inline struct user_namespace *get_user_ns(struct user_namespace *ns) | ||
22 | { | ||
23 | if (ns) | ||
24 | kref_get(&ns->kref); | ||
25 | return ns; | ||
26 | } | ||
27 | |||
28 | extern struct user_namespace *copy_user_ns(int flags, | ||
29 | struct user_namespace *old_ns); | ||
30 | extern void free_user_ns(struct kref *kref); | ||
31 | |||
32 | static inline void put_user_ns(struct user_namespace *ns) | ||
33 | { | ||
34 | if (ns) | ||
35 | kref_put(&ns->kref, free_user_ns); | ||
36 | } | ||
37 | |||
38 | #else | ||
39 | |||
40 | static inline struct user_namespace *get_user_ns(struct user_namespace *ns) | ||
41 | { | ||
42 | return &init_user_ns; | ||
43 | } | ||
44 | |||
45 | static inline struct user_namespace *copy_user_ns(int flags, | ||
46 | struct user_namespace *old_ns) | ||
47 | { | ||
48 | return NULL; | ||
49 | } | ||
50 | |||
51 | static inline void put_user_ns(struct user_namespace *ns) | ||
52 | { | ||
53 | } | ||
54 | |||
55 | #endif | ||
56 | |||
57 | #endif /* _LINUX_USER_H */ | ||
diff --git a/init/Kconfig b/init/Kconfig index 1e198b8c6936..0b0e29ed82d1 100644 --- a/init/Kconfig +++ b/init/Kconfig | |||
@@ -209,6 +209,15 @@ config TASK_IO_ACCOUNTING | |||
209 | 209 | ||
210 | Say N if unsure. | 210 | Say N if unsure. |
211 | 211 | ||
212 | config USER_NS | ||
213 | bool "User Namespaces (EXPERIMENTAL)" | ||
214 | default n | ||
215 | depends on EXPERIMENTAL | ||
216 | help | ||
217 | Support user namespaces. This allows containers, i.e. | ||
218 | vservers, to use user namespaces to provide different | ||
219 | user info for different servers. If unsure, say N. | ||
220 | |||
212 | config AUDIT | 221 | config AUDIT |
213 | bool "Auditing support" | 222 | bool "Auditing support" |
214 | depends on NET | 223 | depends on NET |
diff --git a/kernel/Makefile b/kernel/Makefile index fa8efd437afb..2a999836ca18 100644 --- a/kernel/Makefile +++ b/kernel/Makefile | |||
@@ -4,7 +4,7 @@ | |||
4 | 4 | ||
5 | obj-y = sched.o fork.o exec_domain.o panic.o printk.o profile.o \ | 5 | obj-y = sched.o fork.o exec_domain.o panic.o printk.o profile.o \ |
6 | exit.o itimer.o time.o softirq.o resource.o \ | 6 | exit.o itimer.o time.o softirq.o resource.o \ |
7 | sysctl.o capability.o ptrace.o timer.o user.o \ | 7 | sysctl.o capability.o ptrace.o timer.o user.o user_namespace.o \ |
8 | signal.o sys.o kmod.o workqueue.o pid.o \ | 8 | signal.o sys.o kmod.o workqueue.o pid.o \ |
9 | rcupdate.o extable.o params.o posix-timers.o \ | 9 | rcupdate.o extable.o params.o posix-timers.o \ |
10 | kthread.o wait.o kfifo.o sys_ni.o posix-cpu-timers.o mutex.o \ | 10 | kthread.o wait.o kfifo.o sys_ni.o posix-cpu-timers.o mutex.o \ |
diff --git a/kernel/fork.c b/kernel/fork.c index 4015912aaac2..13cf0978780a 100644 --- a/kernel/fork.c +++ b/kernel/fork.c | |||
@@ -1002,7 +1002,7 @@ static struct task_struct *copy_process(unsigned long clone_flags, | |||
1002 | if (atomic_read(&p->user->processes) >= | 1002 | if (atomic_read(&p->user->processes) >= |
1003 | p->signal->rlim[RLIMIT_NPROC].rlim_cur) { | 1003 | p->signal->rlim[RLIMIT_NPROC].rlim_cur) { |
1004 | if (!capable(CAP_SYS_ADMIN) && !capable(CAP_SYS_RESOURCE) && | 1004 | if (!capable(CAP_SYS_ADMIN) && !capable(CAP_SYS_RESOURCE) && |
1005 | p->user != &root_user) | 1005 | p->user != current->nsproxy->user_ns->root_user) |
1006 | goto bad_fork_free; | 1006 | goto bad_fork_free; |
1007 | } | 1007 | } |
1008 | 1008 | ||
diff --git a/kernel/nsproxy.c b/kernel/nsproxy.c index e38bed75367d..895e3a3f2044 100644 --- a/kernel/nsproxy.c +++ b/kernel/nsproxy.c | |||
@@ -79,8 +79,15 @@ static struct nsproxy *create_new_namespaces(int flags, struct task_struct *tsk, | |||
79 | if (IS_ERR(new_nsp->pid_ns)) | 79 | if (IS_ERR(new_nsp->pid_ns)) |
80 | goto out_pid; | 80 | goto out_pid; |
81 | 81 | ||
82 | new_nsp->user_ns = copy_user_ns(flags, tsk->nsproxy->user_ns); | ||
83 | if (IS_ERR(new_nsp->user_ns)) | ||
84 | goto out_user; | ||
85 | |||
82 | return new_nsp; | 86 | return new_nsp; |
83 | 87 | ||
88 | out_user: | ||
89 | if (new_nsp->pid_ns) | ||
90 | put_pid_ns(new_nsp->pid_ns); | ||
84 | out_pid: | 91 | out_pid: |
85 | if (new_nsp->ipc_ns) | 92 | if (new_nsp->ipc_ns) |
86 | put_ipc_ns(new_nsp->ipc_ns); | 93 | put_ipc_ns(new_nsp->ipc_ns); |
@@ -140,6 +147,8 @@ void free_nsproxy(struct nsproxy *ns) | |||
140 | put_ipc_ns(ns->ipc_ns); | 147 | put_ipc_ns(ns->ipc_ns); |
141 | if (ns->pid_ns) | 148 | if (ns->pid_ns) |
142 | put_pid_ns(ns->pid_ns); | 149 | put_pid_ns(ns->pid_ns); |
150 | if (ns->user_ns) | ||
151 | put_user_ns(ns->user_ns); | ||
143 | kfree(ns); | 152 | kfree(ns); |
144 | } | 153 | } |
145 | 154 | ||
diff --git a/kernel/sys.c b/kernel/sys.c index 872271ccc384..ed92e2f03342 100644 --- a/kernel/sys.c +++ b/kernel/sys.c | |||
@@ -35,6 +35,7 @@ | |||
35 | #include <linux/compat.h> | 35 | #include <linux/compat.h> |
36 | #include <linux/syscalls.h> | 36 | #include <linux/syscalls.h> |
37 | #include <linux/kprobes.h> | 37 | #include <linux/kprobes.h> |
38 | #include <linux/user_namespace.h> | ||
38 | 39 | ||
39 | #include <asm/uaccess.h> | 40 | #include <asm/uaccess.h> |
40 | #include <asm/io.h> | 41 | #include <asm/io.h> |
@@ -1078,13 +1079,13 @@ static int set_user(uid_t new_ruid, int dumpclear) | |||
1078 | { | 1079 | { |
1079 | struct user_struct *new_user; | 1080 | struct user_struct *new_user; |
1080 | 1081 | ||
1081 | new_user = alloc_uid(new_ruid); | 1082 | new_user = alloc_uid(current->nsproxy->user_ns, new_ruid); |
1082 | if (!new_user) | 1083 | if (!new_user) |
1083 | return -EAGAIN; | 1084 | return -EAGAIN; |
1084 | 1085 | ||
1085 | if (atomic_read(&new_user->processes) >= | 1086 | if (atomic_read(&new_user->processes) >= |
1086 | current->signal->rlim[RLIMIT_NPROC].rlim_cur && | 1087 | current->signal->rlim[RLIMIT_NPROC].rlim_cur && |
1087 | new_user != &root_user) { | 1088 | new_user != current->nsproxy->user_ns->root_user) { |
1088 | free_uid(new_user); | 1089 | free_uid(new_user); |
1089 | return -EAGAIN; | 1090 | return -EAGAIN; |
1090 | } | 1091 | } |
diff --git a/kernel/user.c b/kernel/user.c index 4869563080e9..98b82507797a 100644 --- a/kernel/user.c +++ b/kernel/user.c | |||
@@ -14,20 +14,19 @@ | |||
14 | #include <linux/bitops.h> | 14 | #include <linux/bitops.h> |
15 | #include <linux/key.h> | 15 | #include <linux/key.h> |
16 | #include <linux/interrupt.h> | 16 | #include <linux/interrupt.h> |
17 | #include <linux/module.h> | ||
18 | #include <linux/user_namespace.h> | ||
17 | 19 | ||
18 | /* | 20 | /* |
19 | * UID task count cache, to get fast user lookup in "alloc_uid" | 21 | * UID task count cache, to get fast user lookup in "alloc_uid" |
20 | * when changing user ID's (ie setuid() and friends). | 22 | * when changing user ID's (ie setuid() and friends). |
21 | */ | 23 | */ |
22 | 24 | ||
23 | #define UIDHASH_BITS (CONFIG_BASE_SMALL ? 3 : 8) | ||
24 | #define UIDHASH_SZ (1 << UIDHASH_BITS) | ||
25 | #define UIDHASH_MASK (UIDHASH_SZ - 1) | 25 | #define UIDHASH_MASK (UIDHASH_SZ - 1) |
26 | #define __uidhashfn(uid) (((uid >> UIDHASH_BITS) + uid) & UIDHASH_MASK) | 26 | #define __uidhashfn(uid) (((uid >> UIDHASH_BITS) + uid) & UIDHASH_MASK) |
27 | #define uidhashentry(uid) (uidhash_table + __uidhashfn((uid))) | 27 | #define uidhashentry(ns, uid) ((ns)->uidhash_table + __uidhashfn((uid))) |
28 | 28 | ||
29 | static struct kmem_cache *uid_cachep; | 29 | static struct kmem_cache *uid_cachep; |
30 | static struct list_head uidhash_table[UIDHASH_SZ]; | ||
31 | 30 | ||
32 | /* | 31 | /* |
33 | * The uidhash_lock is mostly taken from process context, but it is | 32 | * The uidhash_lock is mostly taken from process context, but it is |
@@ -94,9 +93,10 @@ struct user_struct *find_user(uid_t uid) | |||
94 | { | 93 | { |
95 | struct user_struct *ret; | 94 | struct user_struct *ret; |
96 | unsigned long flags; | 95 | unsigned long flags; |
96 | struct user_namespace *ns = current->nsproxy->user_ns; | ||
97 | 97 | ||
98 | spin_lock_irqsave(&uidhash_lock, flags); | 98 | spin_lock_irqsave(&uidhash_lock, flags); |
99 | ret = uid_hash_find(uid, uidhashentry(uid)); | 99 | ret = uid_hash_find(uid, uidhashentry(ns, uid)); |
100 | spin_unlock_irqrestore(&uidhash_lock, flags); | 100 | spin_unlock_irqrestore(&uidhash_lock, flags); |
101 | return ret; | 101 | return ret; |
102 | } | 102 | } |
@@ -120,9 +120,9 @@ void free_uid(struct user_struct *up) | |||
120 | } | 120 | } |
121 | } | 121 | } |
122 | 122 | ||
123 | struct user_struct * alloc_uid(uid_t uid) | 123 | struct user_struct * alloc_uid(struct user_namespace *ns, uid_t uid) |
124 | { | 124 | { |
125 | struct list_head *hashent = uidhashentry(uid); | 125 | struct list_head *hashent = uidhashentry(ns, uid); |
126 | struct user_struct *up; | 126 | struct user_struct *up; |
127 | 127 | ||
128 | spin_lock_irq(&uidhash_lock); | 128 | spin_lock_irq(&uidhash_lock); |
@@ -211,11 +211,11 @@ static int __init uid_cache_init(void) | |||
211 | 0, SLAB_HWCACHE_ALIGN|SLAB_PANIC, NULL, NULL); | 211 | 0, SLAB_HWCACHE_ALIGN|SLAB_PANIC, NULL, NULL); |
212 | 212 | ||
213 | for(n = 0; n < UIDHASH_SZ; ++n) | 213 | for(n = 0; n < UIDHASH_SZ; ++n) |
214 | INIT_LIST_HEAD(uidhash_table + n); | 214 | INIT_LIST_HEAD(init_user_ns.uidhash_table + n); |
215 | 215 | ||
216 | /* Insert the root user immediately (init already runs as root) */ | 216 | /* Insert the root user immediately (init already runs as root) */ |
217 | spin_lock_irq(&uidhash_lock); | 217 | spin_lock_irq(&uidhash_lock); |
218 | uid_hash_insert(&root_user, uidhashentry(0)); | 218 | uid_hash_insert(&root_user, uidhashentry(&init_user_ns, 0)); |
219 | spin_unlock_irq(&uidhash_lock); | 219 | spin_unlock_irq(&uidhash_lock); |
220 | 220 | ||
221 | return 0; | 221 | return 0; |
diff --git a/kernel/user_namespace.c b/kernel/user_namespace.c new file mode 100644 index 000000000000..3d7964209774 --- /dev/null +++ b/kernel/user_namespace.c | |||
@@ -0,0 +1,43 @@ | |||
1 | /* | ||
2 | * This program is free software; you can redistribute it and/or | ||
3 | * modify it under the terms of the GNU General Public License as | ||
4 | * published by the Free Software Foundation, version 2 of the | ||
5 | * License. | ||
6 | */ | ||
7 | |||
8 | #include <linux/module.h> | ||
9 | #include <linux/version.h> | ||
10 | #include <linux/nsproxy.h> | ||
11 | #include <linux/user_namespace.h> | ||
12 | |||
13 | struct user_namespace init_user_ns = { | ||
14 | .kref = { | ||
15 | .refcount = ATOMIC_INIT(2), | ||
16 | }, | ||
17 | .root_user = &root_user, | ||
18 | }; | ||
19 | |||
20 | EXPORT_SYMBOL_GPL(init_user_ns); | ||
21 | |||
22 | #ifdef CONFIG_USER_NS | ||
23 | |||
24 | struct user_namespace * copy_user_ns(int flags, struct user_namespace *old_ns) | ||
25 | { | ||
26 | struct user_namespace *new_ns; | ||
27 | |||
28 | BUG_ON(!old_ns); | ||
29 | get_user_ns(old_ns); | ||
30 | |||
31 | new_ns = old_ns; | ||
32 | return new_ns; | ||
33 | } | ||
34 | |||
35 | void free_user_ns(struct kref *kref) | ||
36 | { | ||
37 | struct user_namespace *ns; | ||
38 | |||
39 | ns = container_of(kref, struct user_namespace, kref); | ||
40 | kfree(ns); | ||
41 | } | ||
42 | |||
43 | #endif /* CONFIG_USER_NS */ | ||