blob: 24e7b45320f724be853fe15be748229f7732beb3 [file] [log] [blame]
Greg Kroah-Hartmanb2441312017-11-01 15:07:57 +01001// SPDX-License-Identifier: GPL-2.0
Pavel Emelyanovae5e1b22008-02-08 04:18:22 -08002/*
3 * linux/ipc/namespace.c
4 * Copyright (C) 2006 Pavel Emelyanov <xemul@openvz.org> OpenVZ, SWsoft Inc.
5 */
6
7#include <linux/ipc.h>
8#include <linux/msg.h>
9#include <linux/ipc_namespace.h>
10#include <linux/rcupdate.h>
11#include <linux/nsproxy.h>
12#include <linux/slab.h>
Ingo Molnar5b825c32017-02-02 17:54:15 +010013#include <linux/cred.h>
Serge E. Hallyn7eafd7c2009-04-06 19:01:10 -070014#include <linux/fs.h>
15#include <linux/mount.h>
Serge E. Hallynb5154982011-03-23 16:43:23 -070016#include <linux/user_namespace.h>
David Howells0bb80f22013-04-12 01:50:06 +010017#include <linux/proc_ns.h>
Ingo Molnarf719ff9b2017-02-06 10:57:33 +010018#include <linux/sched/task.h>
Pavel Emelyanovae5e1b22008-02-08 04:18:22 -080019
20#include "util.h"
21
Eric W. Biedermanaba35662016-08-08 14:20:23 -050022static struct ucounts *inc_ipc_namespaces(struct user_namespace *ns)
23{
24 return inc_ucount(ns, current_euid(), UCOUNT_IPC_NAMESPACES);
25}
26
27static void dec_ipc_namespaces(struct ucounts *ucounts)
28{
29 dec_ucount(ucounts, UCOUNT_IPC_NAMESPACES);
30}
31
Eric W. Biedermanbcf58e72012-07-26 04:02:49 -070032static struct ipc_namespace *create_ipc_ns(struct user_namespace *user_ns,
Serge E. Hallynb0e77592011-03-23 16:43:24 -070033 struct ipc_namespace *old_ns)
Pavel Emelyanovae5e1b22008-02-08 04:18:22 -080034{
Pavel Emelyanovae5e1b22008-02-08 04:18:22 -080035 struct ipc_namespace *ns;
Eric W. Biedermanaba35662016-08-08 14:20:23 -050036 struct ucounts *ucounts;
Serge E. Hallyn7eafd7c2009-04-06 19:01:10 -070037 int err;
Pavel Emelyanovae5e1b22008-02-08 04:18:22 -080038
Eric W. Biedermandf75e772016-09-22 13:08:36 -050039 err = -ENOSPC;
Eric W. Biedermanaba35662016-08-08 14:20:23 -050040 ucounts = inc_ipc_namespaces(user_ns);
41 if (!ucounts)
42 goto fail;
43
44 err = -ENOMEM;
David Howells935c69122018-11-01 23:07:25 +000045 ns = kzalloc(sizeof(struct ipc_namespace), GFP_KERNEL);
Pavel Emelyanovae5e1b22008-02-08 04:18:22 -080046 if (ns == NULL)
Eric W. Biedermanaba35662016-08-08 14:20:23 -050047 goto fail_dec;
Pavel Emelyanovae5e1b22008-02-08 04:18:22 -080048
Al Viro6344c432014-11-01 00:45:45 -040049 err = ns_alloc_inum(&ns->ns);
Eric W. Biedermanaba35662016-08-08 14:20:23 -050050 if (err)
51 goto fail_free;
Al Viro33c42942014-11-01 02:32:53 -040052 ns->ns.ops = &ipcns_operations;
Eric W. Biederman98f842e2011-06-15 10:21:48 -070053
Elena Reshetovaa2e06022017-09-08 16:17:38 -070054 refcount_set(&ns->count, 1);
Eric W. Biedermanb2360172016-05-31 12:26:41 -050055 ns->user_ns = get_user_ns(user_ns);
Eric W. Biedermanaba35662016-08-08 14:20:23 -050056 ns->ucounts = ucounts;
Eric W. Biedermanb2360172016-05-31 12:26:41 -050057
Guillaume Knispel0cfb6ae2017-09-08 16:17:55 -070058 err = mq_init_ns(ns);
59 if (err)
Davidlohr Buesoeae04d22018-08-21 22:01:56 -070060 goto fail_put;
61
62 sem_init_ns(ns);
63 msg_init_ns(ns);
64 shm_init_ns(ns);
Pavel Emelyanovae5e1b22008-02-08 04:18:22 -080065
Pavel Emelyanovae5e1b22008-02-08 04:18:22 -080066 return ns;
Eric W. Biedermanaba35662016-08-08 14:20:23 -050067
68fail_put:
69 put_user_ns(ns->user_ns);
70 ns_free_inum(&ns->ns);
71fail_free:
72 kfree(ns);
73fail_dec:
74 dec_ipc_namespaces(ucounts);
75fail:
76 return ERR_PTR(err);
Pavel Emelyanovae5e1b22008-02-08 04:18:22 -080077}
78
Serge E. Hallynb0e77592011-03-23 16:43:24 -070079struct ipc_namespace *copy_ipcs(unsigned long flags,
Eric W. Biedermanbcf58e72012-07-26 04:02:49 -070080 struct user_namespace *user_ns, struct ipc_namespace *ns)
Pavel Emelyanovae5e1b22008-02-08 04:18:22 -080081{
Pavel Emelyanovae5e1b22008-02-08 04:18:22 -080082 if (!(flags & CLONE_NEWIPC))
Alexey Dobriyan64424282009-06-17 16:27:54 -070083 return get_ipc_ns(ns);
Eric W. Biedermanbcf58e72012-07-26 04:02:49 -070084 return create_ipc_ns(user_ns, ns);
Pavel Emelyanovae5e1b22008-02-08 04:18:22 -080085}
86
Pierre Peiffer01b8b072008-02-08 04:18:57 -080087/*
88 * free_ipcs - free all ipcs of one type
89 * @ns: the namespace to remove the ipcs from
90 * @ids: the table of ipcs to free
91 * @free: the function called to free each individual ipc
92 *
93 * Called for each kind of ipc when an ipc_namespace exits.
94 */
95void free_ipcs(struct ipc_namespace *ns, struct ipc_ids *ids,
96 void (*free)(struct ipc_namespace *, struct kern_ipc_perm *))
97{
98 struct kern_ipc_perm *perm;
99 int next_id;
100 int total, in_use;
101
Davidlohr Buesod9a605e2013-09-11 14:26:24 -0700102 down_write(&ids->rwsem);
Pierre Peiffer01b8b072008-02-08 04:18:57 -0800103
104 in_use = ids->in_use;
105
106 for (total = 0, next_id = 0; total < in_use; next_id++) {
107 perm = idr_find(&ids->ipcs_idr, next_id);
108 if (perm == NULL)
109 continue;
Davidlohr Bueso32a27502013-09-11 14:26:29 -0700110 rcu_read_lock();
111 ipc_lock_object(perm);
Pierre Peiffer01b8b072008-02-08 04:18:57 -0800112 free(ns, perm);
113 total++;
114 }
Davidlohr Buesod9a605e2013-09-11 14:26:24 -0700115 up_write(&ids->rwsem);
Pierre Peiffer01b8b072008-02-08 04:18:57 -0800116}
117
Alexey Dobriyanb4188de2009-06-17 16:27:56 -0700118static void free_ipc_ns(struct ipc_namespace *ns)
119{
Giuseppe Scrivanoe1eb26f2020-06-07 21:40:10 -0700120 /* mq_put_mnt() waits for a grace period as kern_unmount()
121 * uses synchronize_rcu().
122 */
123 mq_put_mnt(ns);
Alexey Dobriyanb4188de2009-06-17 16:27:56 -0700124 sem_exit_ns(ns);
125 msg_exit_ns(ns);
126 shm_exit_ns(ns);
Alexey Dobriyanb4188de2009-06-17 16:27:56 -0700127
Eric W. Biedermanaba35662016-08-08 14:20:23 -0500128 dec_ipc_namespaces(ns->ucounts);
Serge E. Hallynb5154982011-03-23 16:43:23 -0700129 put_user_ns(ns->user_ns);
Al Viro6344c432014-11-01 00:45:45 -0400130 ns_free_inum(&ns->ns);
Xiaotian Fengbe4d2502011-03-25 01:57:01 -0700131 kfree(ns);
Alexey Dobriyanb4188de2009-06-17 16:27:56 -0700132}
133
Giuseppe Scrivanoe1eb26f2020-06-07 21:40:10 -0700134static LLIST_HEAD(free_ipc_list);
135static void free_ipc(struct work_struct *unused)
136{
137 struct llist_node *node = llist_del_all(&free_ipc_list);
138 struct ipc_namespace *n, *t;
139
140 llist_for_each_entry_safe(n, t, node, mnt_llist)
141 free_ipc_ns(n);
142}
143
144/*
145 * The work queue is used to avoid the cost of synchronize_rcu in kern_unmount.
146 */
147static DECLARE_WORK(free_ipc_work, free_ipc);
148
Serge E. Hallyn7eafd7c2009-04-06 19:01:10 -0700149/*
150 * put_ipc_ns - drop a reference to an ipc namespace.
151 * @ns: the namespace to put
152 *
153 * If this is the last task in the namespace exiting, and
154 * it is dropping the refcount to 0, then it can race with
155 * a task in another ipc namespace but in a mounts namespace
156 * which has this ipcns's mqueuefs mounted, doing some action
157 * with one of the mqueuefs files. That can raise the refcount.
158 * So dropping the refcount, and raising the refcount when
159 * accessing it through the VFS, are protected with mq_lock.
160 *
161 * (Clearly, a task raising the refcount on its own ipc_ns
162 * needn't take mq_lock since it can't race with the last task
163 * in the ipcns exiting).
164 */
165void put_ipc_ns(struct ipc_namespace *ns)
Pavel Emelyanovae5e1b22008-02-08 04:18:22 -0800166{
Elena Reshetovaa2e06022017-09-08 16:17:38 -0700167 if (refcount_dec_and_lock(&ns->count, &mq_lock)) {
Serge E. Hallyn7eafd7c2009-04-06 19:01:10 -0700168 mq_clear_sbinfo(ns);
169 spin_unlock(&mq_lock);
Giuseppe Scrivanoe1eb26f2020-06-07 21:40:10 -0700170
171 if (llist_add(&ns->mnt_llist, &free_ipc_list))
172 schedule_work(&free_ipc_work);
Serge E. Hallyn7eafd7c2009-04-06 19:01:10 -0700173 }
174}
Eric W. Biedermana00eaf12010-03-07 18:48:39 -0800175
Al Viro3c041182014-11-01 00:25:30 -0400176static inline struct ipc_namespace *to_ipc_ns(struct ns_common *ns)
177{
178 return container_of(ns, struct ipc_namespace, ns);
179}
180
Al Viro64964522014-11-01 00:37:32 -0400181static struct ns_common *ipcns_get(struct task_struct *task)
Eric W. Biedermana00eaf12010-03-07 18:48:39 -0800182{
183 struct ipc_namespace *ns = NULL;
184 struct nsproxy *nsproxy;
185
Eric W. Biederman728dba32014-02-03 19:13:49 -0800186 task_lock(task);
187 nsproxy = task->nsproxy;
Eric W. Biedermana00eaf12010-03-07 18:48:39 -0800188 if (nsproxy)
189 ns = get_ipc_ns(nsproxy->ipc_ns);
Eric W. Biederman728dba32014-02-03 19:13:49 -0800190 task_unlock(task);
Eric W. Biedermana00eaf12010-03-07 18:48:39 -0800191
Al Viro3c041182014-11-01 00:25:30 -0400192 return ns ? &ns->ns : NULL;
Eric W. Biedermana00eaf12010-03-07 18:48:39 -0800193}
194
/*
 * proc_ns "put" hook: drop the reference on the ipc namespace that
 * embeds @ns.
 */
static void ipcns_put(struct ns_common *ns)
{
	/*
	 * Plain call, no "return": returning an expression from a void
	 * function is not valid ISO C, even when the expression is void.
	 */
	put_ipc_ns(to_ipc_ns(ns));
}
199
Christian Braunerf2a8d522020-05-05 16:04:30 +0200200static int ipcns_install(struct nsset *nsset, struct ns_common *new)
Eric W. Biedermana00eaf12010-03-07 18:48:39 -0800201{
Christian Braunerf2a8d522020-05-05 16:04:30 +0200202 struct nsproxy *nsproxy = nsset->nsproxy;
Al Viro3c041182014-11-01 00:25:30 -0400203 struct ipc_namespace *ns = to_ipc_ns(new);
Eric W. Biederman5e4a0842012-12-14 07:55:36 -0800204 if (!ns_capable(ns->user_ns, CAP_SYS_ADMIN) ||
Christian Braunerf2a8d522020-05-05 16:04:30 +0200205 !ns_capable(nsset->cred->user_ns, CAP_SYS_ADMIN))
Eric W. Biederman142e1d12012-07-26 01:13:20 -0700206 return -EPERM;
207
Eric W. Biedermana00eaf12010-03-07 18:48:39 -0800208 put_ipc_ns(nsproxy->ipc_ns);
209 nsproxy->ipc_ns = get_ipc_ns(ns);
210 return 0;
211}
212
Andrey Vaginbcac25a2016-09-06 00:47:13 -0700213static struct user_namespace *ipcns_owner(struct ns_common *ns)
214{
215 return to_ipc_ns(ns)->user_ns;
216}
217
Eric W. Biedermana00eaf12010-03-07 18:48:39 -0800218const struct proc_ns_operations ipcns_operations = {
219 .name = "ipc",
220 .type = CLONE_NEWIPC,
221 .get = ipcns_get,
222 .put = ipcns_put,
223 .install = ipcns_install,
Andrey Vaginbcac25a2016-09-06 00:47:13 -0700224 .owner = ipcns_owner,
Eric W. Biedermana00eaf12010-03-07 18:48:39 -0800225};