Commit | Line | Data |
---|---|---|
b2441318 | 1 | // SPDX-License-Identifier: GPL-2.0 |
ae5e1b22 PE |
2 | /* |
3 | * linux/ipc/namespace.c | |
4 | * Copyright (C) 2006 Pavel Emelyanov <xemul@openvz.org> OpenVZ, SWsoft Inc. | |
5 | */ | |
6 | ||
7 | #include <linux/ipc.h> | |
8 | #include <linux/msg.h> | |
9 | #include <linux/ipc_namespace.h> | |
10 | #include <linux/rcupdate.h> | |
11 | #include <linux/nsproxy.h> | |
12 | #include <linux/slab.h> | |
5b825c3a | 13 | #include <linux/cred.h> |
7eafd7c7 SH |
14 | #include <linux/fs.h> |
15 | #include <linux/mount.h> | |
b515498f | 16 | #include <linux/user_namespace.h> |
0bb80f24 | 17 | #include <linux/proc_ns.h> |
f719ff9b | 18 | #include <linux/sched/task.h> |
ae5e1b22 PE |
19 | |
20 | #include "util.h" | |
21 | ||
aba35661 EB |
22 | static struct ucounts *inc_ipc_namespaces(struct user_namespace *ns) |
23 | { | |
24 | return inc_ucount(ns, current_euid(), UCOUNT_IPC_NAMESPACES); | |
25 | } | |
26 | ||
27 | static void dec_ipc_namespaces(struct ucounts *ucounts) | |
28 | { | |
29 | dec_ucount(ucounts, UCOUNT_IPC_NAMESPACES); | |
30 | } | |
31 | ||
bcf58e72 | 32 | static struct ipc_namespace *create_ipc_ns(struct user_namespace *user_ns, |
b0e77598 | 33 | struct ipc_namespace *old_ns) |
ae5e1b22 | 34 | { |
ae5e1b22 | 35 | struct ipc_namespace *ns; |
aba35661 | 36 | struct ucounts *ucounts; |
7eafd7c7 | 37 | int err; |
ae5e1b22 | 38 | |
df75e774 | 39 | err = -ENOSPC; |
aba35661 EB |
40 | ucounts = inc_ipc_namespaces(user_ns); |
41 | if (!ucounts) | |
42 | goto fail; | |
43 | ||
44 | err = -ENOMEM; | |
30acd0bd | 45 | ns = kzalloc(sizeof(struct ipc_namespace), GFP_KERNEL_ACCOUNT); |
ae5e1b22 | 46 | if (ns == NULL) |
aba35661 | 47 | goto fail_dec; |
ae5e1b22 | 48 | |
6344c433 | 49 | err = ns_alloc_inum(&ns->ns); |
aba35661 EB |
50 | if (err) |
51 | goto fail_free; | |
33c42940 | 52 | ns->ns.ops = &ipcns_operations; |
98f842e6 | 53 | |
137ec390 | 54 | refcount_set(&ns->ns.count, 1); |
b236017a | 55 | ns->user_ns = get_user_ns(user_ns); |
aba35661 | 56 | ns->ucounts = ucounts; |
b236017a | 57 | |
eae04d25 | 58 | err = mq_init_ns(ns); |
aba35661 EB |
59 | if (err) |
60 | goto fail_put; | |
4d89dc6a | 61 | |
dc55e35f AG |
62 | err = -ENOMEM; |
63 | if (!setup_mq_sysctls(ns)) | |
64 | goto fail_put; | |
65 | ||
eae04d25 DB |
66 | sem_init_ns(ns); |
67 | msg_init_ns(ns); | |
68 | shm_init_ns(ns); | |
ae5e1b22 | 69 | |
ae5e1b22 | 70 | return ns; |
aba35661 EB |
71 | |
72 | fail_put: | |
73 | put_user_ns(ns->user_ns); | |
74 | ns_free_inum(&ns->ns); | |
75 | fail_free: | |
76 | kfree(ns); | |
77 | fail_dec: | |
78 | dec_ipc_namespaces(ucounts); | |
79 | fail: | |
80 | return ERR_PTR(err); | |
ae5e1b22 PE |
81 | } |
82 | ||
b0e77598 | 83 | struct ipc_namespace *copy_ipcs(unsigned long flags, |
bcf58e72 | 84 | struct user_namespace *user_ns, struct ipc_namespace *ns) |
ae5e1b22 | 85 | { |
ae5e1b22 | 86 | if (!(flags & CLONE_NEWIPC)) |
64424289 | 87 | return get_ipc_ns(ns); |
bcf58e72 | 88 | return create_ipc_ns(user_ns, ns); |
ae5e1b22 PE |
89 | } |
90 | ||
01b8b07a PP |
91 | /* |
92 | * free_ipcs - free all ipcs of one type | |
93 | * @ns: the namespace to remove the ipcs from | |
94 | * @ids: the table of ipcs to free | |
95 | * @free: the function called to free each individual ipc | |
96 | * | |
97 | * Called for each kind of ipc when an ipc_namespace exits. | |
98 | */ | |
99 | void free_ipcs(struct ipc_namespace *ns, struct ipc_ids *ids, | |
100 | void (*free)(struct ipc_namespace *, struct kern_ipc_perm *)) | |
101 | { | |
102 | struct kern_ipc_perm *perm; | |
103 | int next_id; | |
104 | int total, in_use; | |
105 | ||
d9a605e4 | 106 | down_write(&ids->rwsem); |
01b8b07a PP |
107 | |
108 | in_use = ids->in_use; | |
109 | ||
110 | for (total = 0, next_id = 0; total < in_use; next_id++) { | |
111 | perm = idr_find(&ids->ipcs_idr, next_id); | |
112 | if (perm == NULL) | |
113 | continue; | |
32a27500 DB |
114 | rcu_read_lock(); |
115 | ipc_lock_object(perm); | |
01b8b07a PP |
116 | free(ns, perm); |
117 | total++; | |
118 | } | |
d9a605e4 | 119 | up_write(&ids->rwsem); |
01b8b07a PP |
120 | } |
121 | ||
b4188def AD |
122 | static void free_ipc_ns(struct ipc_namespace *ns) |
123 | { | |
e1eb26fa GS |
124 | /* mq_put_mnt() waits for a grace period as kern_unmount() |
125 | * uses synchronize_rcu(). | |
126 | */ | |
127 | mq_put_mnt(ns); | |
b4188def AD |
128 | sem_exit_ns(ns); |
129 | msg_exit_ns(ns); | |
130 | shm_exit_ns(ns); | |
b4188def | 131 | |
dc55e35f AG |
132 | retire_mq_sysctls(ns); |
133 | ||
aba35661 | 134 | dec_ipc_namespaces(ns->ucounts); |
b515498f | 135 | put_user_ns(ns->user_ns); |
6344c433 | 136 | ns_free_inum(&ns->ns); |
be4d250a | 137 | kfree(ns); |
b4188def AD |
138 | } |
139 | ||
e1eb26fa GS |
140 | static LLIST_HEAD(free_ipc_list); |
141 | static void free_ipc(struct work_struct *unused) | |
142 | { | |
143 | struct llist_node *node = llist_del_all(&free_ipc_list); | |
144 | struct ipc_namespace *n, *t; | |
145 | ||
146 | llist_for_each_entry_safe(n, t, node, mnt_llist) | |
147 | free_ipc_ns(n); | |
148 | } | |
149 | ||
150 | /* | |
151 | * The work queue is used to avoid the cost of synchronize_rcu in kern_unmount. | |
152 | */ | |
153 | static DECLARE_WORK(free_ipc_work, free_ipc); | |
154 | ||
7eafd7c7 SH |
155 | /* |
156 | * put_ipc_ns - drop a reference to an ipc namespace. | |
157 | * @ns: the namespace to put | |
158 | * | |
159 | * If this is the last task in the namespace exiting, and | |
160 | * it is dropping the refcount to 0, then it can race with | |
161 | * a task in another ipc namespace but in a mounts namespace | |
162 | * which has this ipcns's mqueuefs mounted, doing some action | |
163 | * with one of the mqueuefs files. That can raise the refcount. | |
164 | * So dropping the refcount, and raising the refcount when | |
165 | * accessing it through the VFS, are protected with mq_lock. | |
166 | * | |
167 | * (Clearly, a task raising the refcount on its own ipc_ns | |
168 | * needn't take mq_lock since it can't race with the last task | |
169 | * in the ipcns exiting). | |
170 | */ | |
171 | void put_ipc_ns(struct ipc_namespace *ns) | |
ae5e1b22 | 172 | { |
137ec390 | 173 | if (refcount_dec_and_lock(&ns->ns.count, &mq_lock)) { |
7eafd7c7 SH |
174 | mq_clear_sbinfo(ns); |
175 | spin_unlock(&mq_lock); | |
e1eb26fa GS |
176 | |
177 | if (llist_add(&ns->mnt_llist, &free_ipc_list)) | |
178 | schedule_work(&free_ipc_work); | |
7eafd7c7 SH |
179 | } |
180 | } | |
a00eaf11 | 181 | |
3c041184 AV |
182 | static inline struct ipc_namespace *to_ipc_ns(struct ns_common *ns) |
183 | { | |
184 | return container_of(ns, struct ipc_namespace, ns); | |
185 | } | |
186 | ||
64964528 | 187 | static struct ns_common *ipcns_get(struct task_struct *task) |
a00eaf11 EB |
188 | { |
189 | struct ipc_namespace *ns = NULL; | |
190 | struct nsproxy *nsproxy; | |
191 | ||
728dba3a EB |
192 | task_lock(task); |
193 | nsproxy = task->nsproxy; | |
a00eaf11 EB |
194 | if (nsproxy) |
195 | ns = get_ipc_ns(nsproxy->ipc_ns); | |
728dba3a | 196 | task_unlock(task); |
a00eaf11 | 197 | |
3c041184 | 198 | return ns ? &ns->ns : NULL; |
a00eaf11 EB |
199 | } |
200 | ||
/*
 * proc_ns_operations ->put hook: drop the reference on the ipc namespace
 * that embeds @ns.
 */
static void ipcns_put(struct ns_common *ns)
{
	/*
	 * put_ipc_ns() returns void; call it as a plain statement rather
	 * than "return <void expression>", which ISO C does not permit in
	 * a void function.
	 */
	put_ipc_ns(to_ipc_ns(ns));
}
205 | ||
f2a8d52e | 206 | static int ipcns_install(struct nsset *nsset, struct ns_common *new) |
a00eaf11 | 207 | { |
f2a8d52e | 208 | struct nsproxy *nsproxy = nsset->nsproxy; |
3c041184 | 209 | struct ipc_namespace *ns = to_ipc_ns(new); |
5e4a0847 | 210 | if (!ns_capable(ns->user_ns, CAP_SYS_ADMIN) || |
f2a8d52e | 211 | !ns_capable(nsset->cred->user_ns, CAP_SYS_ADMIN)) |
142e1d1d EB |
212 | return -EPERM; |
213 | ||
a00eaf11 EB |
214 | put_ipc_ns(nsproxy->ipc_ns); |
215 | nsproxy->ipc_ns = get_ipc_ns(ns); | |
216 | return 0; | |
217 | } | |
218 | ||
bcac25a5 AV |
219 | static struct user_namespace *ipcns_owner(struct ns_common *ns) |
220 | { | |
221 | return to_ipc_ns(ns)->user_ns; | |
222 | } | |
223 | ||
a00eaf11 EB |
224 | const struct proc_ns_operations ipcns_operations = { |
225 | .name = "ipc", | |
226 | .type = CLONE_NEWIPC, | |
227 | .get = ipcns_get, | |
228 | .put = ipcns_put, | |
229 | .install = ipcns_install, | |
bcac25a5 | 230 | .owner = ipcns_owner, |
a00eaf11 | 231 | }; |