blob: 6ecc30effd3ec6e875b1db39e85b6be76e5a0186 [file] [log] [blame]
Greg Kroah-Hartmanb2441312017-11-01 15:07:57 +01001// SPDX-License-Identifier: GPL-2.0
Pavel Emelyanovae5e1b22008-02-08 04:18:22 -08002/*
3 * linux/ipc/namespace.c
4 * Copyright (C) 2006 Pavel Emelyanov <xemul@openvz.org> OpenVZ, SWsoft Inc.
5 */
6
7#include <linux/ipc.h>
8#include <linux/msg.h>
9#include <linux/ipc_namespace.h>
10#include <linux/rcupdate.h>
11#include <linux/nsproxy.h>
12#include <linux/slab.h>
Ingo Molnar5b825c32017-02-02 17:54:15 +010013#include <linux/cred.h>
Serge E. Hallyn7eafd7c2009-04-06 19:01:10 -070014#include <linux/fs.h>
15#include <linux/mount.h>
Serge E. Hallynb5154982011-03-23 16:43:23 -070016#include <linux/user_namespace.h>
David Howells0bb80f22013-04-12 01:50:06 +010017#include <linux/proc_ns.h>
Ingo Molnarf719ff9b2017-02-06 10:57:33 +010018#include <linux/sched/task.h>
Pavel Emelyanovae5e1b22008-02-08 04:18:22 -080019
20#include "util.h"
21
/*
 * Dead IPC namespaces are torn down from a work item rather than inline,
 * to avoid paying the cost of synchronize_rcu in kern_unmount on every
 * namespace release.  free_ipc_work runs free_ipc().
 */
static void free_ipc(struct work_struct *unused);
static DECLARE_WORK(free_ipc_work, free_ipc);
27
Eric W. Biedermanaba35662016-08-08 14:20:23 -050028static struct ucounts *inc_ipc_namespaces(struct user_namespace *ns)
29{
30 return inc_ucount(ns, current_euid(), UCOUNT_IPC_NAMESPACES);
31}
32
33static void dec_ipc_namespaces(struct ucounts *ucounts)
34{
35 dec_ucount(ucounts, UCOUNT_IPC_NAMESPACES);
36}
37
Eric W. Biedermanbcf58e72012-07-26 04:02:49 -070038static struct ipc_namespace *create_ipc_ns(struct user_namespace *user_ns,
Serge E. Hallynb0e77592011-03-23 16:43:24 -070039 struct ipc_namespace *old_ns)
Pavel Emelyanovae5e1b22008-02-08 04:18:22 -080040{
Pavel Emelyanovae5e1b22008-02-08 04:18:22 -080041 struct ipc_namespace *ns;
Eric W. Biedermanaba35662016-08-08 14:20:23 -050042 struct ucounts *ucounts;
Serge E. Hallyn7eafd7c2009-04-06 19:01:10 -070043 int err;
Pavel Emelyanovae5e1b22008-02-08 04:18:22 -080044
Eric W. Biedermandf75e772016-09-22 13:08:36 -050045 err = -ENOSPC;
Rik van Riela80c4ad2023-01-27 13:46:50 -050046 again:
Eric W. Biedermanaba35662016-08-08 14:20:23 -050047 ucounts = inc_ipc_namespaces(user_ns);
Rik van Riela80c4ad2023-01-27 13:46:50 -050048 if (!ucounts) {
49 /*
50 * IPC namespaces are freed asynchronously, by free_ipc_work.
51 * If frees were pending, flush_work will wait, and
52 * return true. Fail the allocation if no frees are pending.
53 */
54 if (flush_work(&free_ipc_work))
55 goto again;
Eric W. Biedermanaba35662016-08-08 14:20:23 -050056 goto fail;
Rik van Riela80c4ad2023-01-27 13:46:50 -050057 }
Eric W. Biedermanaba35662016-08-08 14:20:23 -050058
59 err = -ENOMEM;
Vasily Averin30acd0b2021-09-02 14:55:27 -070060 ns = kzalloc(sizeof(struct ipc_namespace), GFP_KERNEL_ACCOUNT);
Pavel Emelyanovae5e1b22008-02-08 04:18:22 -080061 if (ns == NULL)
Eric W. Biedermanaba35662016-08-08 14:20:23 -050062 goto fail_dec;
Pavel Emelyanovae5e1b22008-02-08 04:18:22 -080063
Al Viro6344c432014-11-01 00:45:45 -040064 err = ns_alloc_inum(&ns->ns);
Eric W. Biedermanaba35662016-08-08 14:20:23 -050065 if (err)
66 goto fail_free;
Al Viro33c42942014-11-01 02:32:53 -040067 ns->ns.ops = &ipcns_operations;
Eric W. Biederman98f842e2011-06-15 10:21:48 -070068
Kirill Tkhai137ec392020-08-03 13:16:27 +030069 refcount_set(&ns->ns.count, 1);
Eric W. Biedermanb2360172016-05-31 12:26:41 -050070 ns->user_ns = get_user_ns(user_ns);
Eric W. Biedermanaba35662016-08-08 14:20:23 -050071 ns->ucounts = ucounts;
Eric W. Biedermanb2360172016-05-31 12:26:41 -050072
Guillaume Knispel0cfb6ae2017-09-08 16:17:55 -070073 err = mq_init_ns(ns);
74 if (err)
Davidlohr Buesoeae04d22018-08-21 22:01:56 -070075 goto fail_put;
76
Alexey Gladkovdc55e352022-02-14 19:18:14 +010077 err = -ENOMEM;
78 if (!setup_mq_sysctls(ns))
79 goto fail_put;
80
Alexey Gladkov1f5c1352022-02-14 19:18:15 +010081 if (!setup_ipc_sysctls(ns))
Alexey Gladkovdb7cfc32022-06-22 22:07:29 +020082 goto fail_mq;
Alexey Gladkov1f5c1352022-02-14 19:18:15 +010083
Jiebin Sun72d1e612022-09-14 03:25:38 +080084 err = msg_init_ns(ns);
85 if (err)
86 goto fail_put;
87
Davidlohr Buesoeae04d22018-08-21 22:01:56 -070088 sem_init_ns(ns);
Davidlohr Buesoeae04d22018-08-21 22:01:56 -070089 shm_init_ns(ns);
Pavel Emelyanovae5e1b22008-02-08 04:18:22 -080090
Pavel Emelyanovae5e1b22008-02-08 04:18:22 -080091 return ns;
Eric W. Biedermanaba35662016-08-08 14:20:23 -050092
Alexey Gladkovdb7cfc32022-06-22 22:07:29 +020093fail_mq:
94 retire_mq_sysctls(ns);
95
Eric W. Biedermanaba35662016-08-08 14:20:23 -050096fail_put:
97 put_user_ns(ns->user_ns);
98 ns_free_inum(&ns->ns);
99fail_free:
100 kfree(ns);
101fail_dec:
102 dec_ipc_namespaces(ucounts);
103fail:
104 return ERR_PTR(err);
Pavel Emelyanovae5e1b22008-02-08 04:18:22 -0800105}
106
Serge E. Hallynb0e77592011-03-23 16:43:24 -0700107struct ipc_namespace *copy_ipcs(unsigned long flags,
Eric W. Biedermanbcf58e72012-07-26 04:02:49 -0700108 struct user_namespace *user_ns, struct ipc_namespace *ns)
Pavel Emelyanovae5e1b22008-02-08 04:18:22 -0800109{
Pavel Emelyanovae5e1b22008-02-08 04:18:22 -0800110 if (!(flags & CLONE_NEWIPC))
Alexey Dobriyan64424282009-06-17 16:27:54 -0700111 return get_ipc_ns(ns);
Eric W. Biedermanbcf58e72012-07-26 04:02:49 -0700112 return create_ipc_ns(user_ns, ns);
Pavel Emelyanovae5e1b22008-02-08 04:18:22 -0800113}
114
Pierre Peiffer01b8b072008-02-08 04:18:57 -0800115/*
116 * free_ipcs - free all ipcs of one type
117 * @ns: the namespace to remove the ipcs from
118 * @ids: the table of ipcs to free
119 * @free: the function called to free each individual ipc
120 *
121 * Called for each kind of ipc when an ipc_namespace exits.
122 */
123void free_ipcs(struct ipc_namespace *ns, struct ipc_ids *ids,
124 void (*free)(struct ipc_namespace *, struct kern_ipc_perm *))
125{
126 struct kern_ipc_perm *perm;
127 int next_id;
128 int total, in_use;
129
Davidlohr Buesod9a605e2013-09-11 14:26:24 -0700130 down_write(&ids->rwsem);
Pierre Peiffer01b8b072008-02-08 04:18:57 -0800131
132 in_use = ids->in_use;
133
134 for (total = 0, next_id = 0; total < in_use; next_id++) {
135 perm = idr_find(&ids->ipcs_idr, next_id);
136 if (perm == NULL)
137 continue;
Davidlohr Bueso32a27502013-09-11 14:26:29 -0700138 rcu_read_lock();
139 ipc_lock_object(perm);
Pierre Peiffer01b8b072008-02-08 04:18:57 -0800140 free(ns, perm);
141 total++;
142 }
Davidlohr Buesod9a605e2013-09-11 14:26:24 -0700143 up_write(&ids->rwsem);
Pierre Peiffer01b8b072008-02-08 04:18:57 -0800144}
145
Alexey Dobriyanb4188de2009-06-17 16:27:56 -0700146static void free_ipc_ns(struct ipc_namespace *ns)
147{
Rik van Rielda27f792023-01-27 13:46:51 -0500148 /*
149 * Caller needs to wait for an RCU grace period to have passed
150 * after making the mount point inaccessible to new accesses.
Giuseppe Scrivanoe1eb26f2020-06-07 21:40:10 -0700151 */
Rik van Rielda27f792023-01-27 13:46:51 -0500152 mntput(ns->mq_mnt);
Alexey Dobriyanb4188de2009-06-17 16:27:56 -0700153 sem_exit_ns(ns);
154 msg_exit_ns(ns);
155 shm_exit_ns(ns);
Alexey Dobriyanb4188de2009-06-17 16:27:56 -0700156
Alexey Gladkovdc55e352022-02-14 19:18:14 +0100157 retire_mq_sysctls(ns);
Alexey Gladkov1f5c1352022-02-14 19:18:15 +0100158 retire_ipc_sysctls(ns);
Alexey Gladkovdc55e352022-02-14 19:18:14 +0100159
Eric W. Biedermanaba35662016-08-08 14:20:23 -0500160 dec_ipc_namespaces(ns->ucounts);
Serge E. Hallynb5154982011-03-23 16:43:23 -0700161 put_user_ns(ns->user_ns);
Al Viro6344c432014-11-01 00:45:45 -0400162 ns_free_inum(&ns->ns);
Xiaotian Fengbe4d2502011-03-25 01:57:01 -0700163 kfree(ns);
Alexey Dobriyanb4188de2009-06-17 16:27:56 -0700164}
165
Giuseppe Scrivanoe1eb26f2020-06-07 21:40:10 -0700166static LLIST_HEAD(free_ipc_list);
167static void free_ipc(struct work_struct *unused)
168{
169 struct llist_node *node = llist_del_all(&free_ipc_list);
170 struct ipc_namespace *n, *t;
171
172 llist_for_each_entry_safe(n, t, node, mnt_llist)
Rik van Rielda27f792023-01-27 13:46:51 -0500173 mnt_make_shortterm(n->mq_mnt);
174
175 /* Wait for any last users to have gone away. */
176 synchronize_rcu();
177
178 llist_for_each_entry_safe(n, t, node, mnt_llist)
Giuseppe Scrivanoe1eb26f2020-06-07 21:40:10 -0700179 free_ipc_ns(n);
180}
181
182/*
Serge E. Hallyn7eafd7c2009-04-06 19:01:10 -0700183 * put_ipc_ns - drop a reference to an ipc namespace.
184 * @ns: the namespace to put
185 *
186 * If this is the last task in the namespace exiting, and
187 * it is dropping the refcount to 0, then it can race with
188 * a task in another ipc namespace but in a mounts namespace
189 * which has this ipcns's mqueuefs mounted, doing some action
190 * with one of the mqueuefs files. That can raise the refcount.
191 * So dropping the refcount, and raising the refcount when
192 * accessing it through the VFS, are protected with mq_lock.
193 *
194 * (Clearly, a task raising the refcount on its own ipc_ns
195 * needn't take mq_lock since it can't race with the last task
196 * in the ipcns exiting).
197 */
198void put_ipc_ns(struct ipc_namespace *ns)
Pavel Emelyanovae5e1b22008-02-08 04:18:22 -0800199{
Kirill Tkhai137ec392020-08-03 13:16:27 +0300200 if (refcount_dec_and_lock(&ns->ns.count, &mq_lock)) {
Serge E. Hallyn7eafd7c2009-04-06 19:01:10 -0700201 mq_clear_sbinfo(ns);
202 spin_unlock(&mq_lock);
Giuseppe Scrivanoe1eb26f2020-06-07 21:40:10 -0700203
204 if (llist_add(&ns->mnt_llist, &free_ipc_list))
205 schedule_work(&free_ipc_work);
Serge E. Hallyn7eafd7c2009-04-06 19:01:10 -0700206 }
207}
Eric W. Biedermana00eaf12010-03-07 18:48:39 -0800208
Al Viro3c041182014-11-01 00:25:30 -0400209static inline struct ipc_namespace *to_ipc_ns(struct ns_common *ns)
210{
211 return container_of(ns, struct ipc_namespace, ns);
212}
213
Al Viro64964522014-11-01 00:37:32 -0400214static struct ns_common *ipcns_get(struct task_struct *task)
Eric W. Biedermana00eaf12010-03-07 18:48:39 -0800215{
216 struct ipc_namespace *ns = NULL;
217 struct nsproxy *nsproxy;
218
Eric W. Biederman728dba32014-02-03 19:13:49 -0800219 task_lock(task);
220 nsproxy = task->nsproxy;
Eric W. Biedermana00eaf12010-03-07 18:48:39 -0800221 if (nsproxy)
222 ns = get_ipc_ns(nsproxy->ipc_ns);
Eric W. Biederman728dba32014-02-03 19:13:49 -0800223 task_unlock(task);
Eric W. Biedermana00eaf12010-03-07 18:48:39 -0800224
Al Viro3c041182014-11-01 00:25:30 -0400225 return ns ? &ns->ns : NULL;
Eric W. Biedermana00eaf12010-03-07 18:48:39 -0800226}
227
/*
 * proc_ns "put" hook: drop the reference obtained through ipcns_get().
 */
static void ipcns_put(struct ns_common *ns)
{
	/* No "return <expr>;" here: ISO C forbids it in a void function. */
	put_ipc_ns(to_ipc_ns(ns));
}
232
Christian Braunerf2a8d522020-05-05 16:04:30 +0200233static int ipcns_install(struct nsset *nsset, struct ns_common *new)
Eric W. Biedermana00eaf12010-03-07 18:48:39 -0800234{
Christian Braunerf2a8d522020-05-05 16:04:30 +0200235 struct nsproxy *nsproxy = nsset->nsproxy;
Al Viro3c041182014-11-01 00:25:30 -0400236 struct ipc_namespace *ns = to_ipc_ns(new);
Eric W. Biederman5e4a0842012-12-14 07:55:36 -0800237 if (!ns_capable(ns->user_ns, CAP_SYS_ADMIN) ||
Christian Braunerf2a8d522020-05-05 16:04:30 +0200238 !ns_capable(nsset->cred->user_ns, CAP_SYS_ADMIN))
Eric W. Biederman142e1d12012-07-26 01:13:20 -0700239 return -EPERM;
240
Eric W. Biedermana00eaf12010-03-07 18:48:39 -0800241 put_ipc_ns(nsproxy->ipc_ns);
242 nsproxy->ipc_ns = get_ipc_ns(ns);
243 return 0;
244}
245
Andrey Vaginbcac25a2016-09-06 00:47:13 -0700246static struct user_namespace *ipcns_owner(struct ns_common *ns)
247{
248 return to_ipc_ns(ns)->user_ns;
249}
250
Eric W. Biedermana00eaf12010-03-07 18:48:39 -0800251const struct proc_ns_operations ipcns_operations = {
252 .name = "ipc",
253 .type = CLONE_NEWIPC,
254 .get = ipcns_get,
255 .put = ipcns_put,
256 .install = ipcns_install,
Andrey Vaginbcac25a2016-09-06 00:47:13 -0700257 .owner = ipcns_owner,
Eric W. Biedermana00eaf12010-03-07 18:48:39 -0800258};