/*
 * linux/ipc/namespace.c
 * Copyright (C) 2006 Pavel Emelyanov <xemul@openvz.org> OpenVZ, SWsoft Inc.
 */

#include <linux/ipc.h>
#include <linux/msg.h>
#include <linux/ipc_namespace.h>
#include <linux/rcupdate.h>
#include <linux/nsproxy.h>
#include <linux/slab.h>
12 13
#include <linux/fs.h>
#include <linux/mount.h>
14
#include <linux/user_namespace.h>
15
#include <linux/proc_ns.h>
16 17 18

#include "util.h"

19
static struct ipc_namespace *create_ipc_ns(struct user_namespace *user_ns,
20
					   struct ipc_namespace *old_ns)
21 22
{
	struct ipc_namespace *ns;
23
	int err;
24 25 26

	ns = kmalloc(sizeof(struct ipc_namespace), GFP_KERNEL);
	if (ns == NULL)
27
		return ERR_PTR(-ENOMEM);
28

A
Al Viro 已提交
29
	err = ns_alloc_inum(&ns->ns);
30 31 32 33 34
	if (err) {
		kfree(ns);
		return ERR_PTR(err);
	}

35 36 37
	atomic_set(&ns->count, 1);
	err = mq_init_ns(ns);
	if (err) {
A
Al Viro 已提交
38
		ns_free_inum(&ns->ns);
39 40 41
		kfree(ns);
		return ERR_PTR(err);
	}
42 43
	atomic_inc(&nr_ipc_ns);

44 45 46
	sem_init_ns(ns);
	msg_init_ns(ns);
	shm_init_ns(ns);
47

48 49 50 51 52 53
	/*
	 * msgmni has already been computed for the new ipc ns.
	 * Thus, do the ipcns creation notification before registering that
	 * new ipcns in the chain.
	 */
	ipcns_notify(IPCNS_CREATED);
54 55
	register_ipcns_notifier(ns);

56
	ns->user_ns = get_user_ns(user_ns);
57

58 59 60
	return ns;
}

61
struct ipc_namespace *copy_ipcs(unsigned long flags,
62
	struct user_namespace *user_ns, struct ipc_namespace *ns)
63 64
{
	if (!(flags & CLONE_NEWIPC))
65
		return get_ipc_ns(ns);
66
	return create_ipc_ns(user_ns, ns);
67 68
}

69 70 71 72 73 74 75 76 77 78 79 80 81 82 83
/*
 * free_ipcs - free all ipcs of one type
 * @ns:   the namespace the ipcs are removed from
 * @ids:  the table holding the ipcs to free
 * @free: callback invoked once for every ipc found in @ids
 *
 * Called for each kind of ipc when an ipc_namespace exits.  The table is
 * walked by ascending id, with ids->rwsem held for writing, until as many
 * entries have been handed to @free as ids->in_use reported on entry.
 */
void free_ipcs(struct ipc_namespace *ns, struct ipc_ids *ids,
	       void (*free)(struct ipc_namespace *, struct kern_ipc_perm *))
{
	struct kern_ipc_perm *ipcp;
	int remaining;
	int id;

	down_write(&ids->rwsem);

	/* Snapshot the number of live entries; the loop counts it down. */
	remaining = ids->in_use;

	for (id = 0; remaining > 0; id++) {
		ipcp = idr_find(&ids->ipcs_idr, id);
		if (ipcp != NULL) {
			/*
			 * The RCU read lock and the object lock are taken
			 * here and not released in this function; presumably
			 * @free drops both - confirm against the callbacks.
			 */
			rcu_read_lock();
			ipc_lock_object(ipcp);
			free(ns, ipcp);
			remaining--;
		}
	}

	up_write(&ids->rwsem);
}

100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120
static void free_ipc_ns(struct ipc_namespace *ns)
{
	/*
	 * Unregistering the hotplug notifier at the beginning guarantees
	 * that the ipc namespace won't be freed while we are inside the
	 * callback routine. Since the blocking_notifier_chain_XXX routines
	 * hold a rw lock on the notifier list, unregister_ipcns_notifier()
	 * won't take the rw lock before blocking_notifier_call_chain() has
	 * released the rd lock.
	 */
	unregister_ipcns_notifier(ns);
	sem_exit_ns(ns);
	msg_exit_ns(ns);
	shm_exit_ns(ns);
	atomic_dec(&nr_ipc_ns);

	/*
	 * Do the ipcns removal notification after decrementing nr_ipc_ns in
	 * order to have a correct value when recomputing msgmni.
	 */
	ipcns_notify(IPCNS_REMOVED);
121
	put_user_ns(ns->user_ns);
A
Al Viro 已提交
122
	ns_free_inum(&ns->ns);
123
	kfree(ns);
124 125
}

126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142
/*
 * put_ipc_ns - drop a reference to an ipc namespace.
 * @ns: the namespace to put
 *
 * If this is the last task in the namespace exiting, and
 * it is dropping the refcount to 0, then it can race with
 * a task in another ipc namespace but in a mounts namespace
 * which has this ipcns's mqueuefs mounted, doing some action
 * with one of the mqueuefs files.  That can raise the refcount.
 * So dropping the refcount, and raising the refcount when
 * accessing it through the VFS, are protected with mq_lock.
 *
 * (Clearly, a task raising the refcount on its own ipc_ns
 * needn't take mq_lock since it can't race with the last task
 * in the ipcns exiting).
 */
void put_ipc_ns(struct ipc_namespace *ns)
143
{
144 145 146 147 148 149 150
	if (atomic_dec_and_lock(&ns->count, &mq_lock)) {
		mq_clear_sbinfo(ns);
		spin_unlock(&mq_lock);
		mq_put_mnt(ns);
		free_ipc_ns(ns);
	}
}
151

152 153 154 155 156
/* Map an embedded ns_common back to the ipc_namespace that contains it. */
static inline struct ipc_namespace *to_ipc_ns(struct ns_common *ns)
{
	struct ipc_namespace *ipc_ns;

	ipc_ns = container_of(ns, struct ipc_namespace, ns);
	return ipc_ns;
}

157
static struct ns_common *ipcns_get(struct task_struct *task)
158 159 160 161
{
	struct ipc_namespace *ns = NULL;
	struct nsproxy *nsproxy;

162 163
	task_lock(task);
	nsproxy = task->nsproxy;
164 165
	if (nsproxy)
		ns = get_ipc_ns(nsproxy->ipc_ns);
166
	task_unlock(task);
167

168
	return ns ? &ns->ns : NULL;
169 170
}

171
/*
 * ipcns_put - .put hook of ipcns_operations
 * @ns: ns_common embedded in the ipc namespace to release
 *
 * Passes the containing ipc namespace to put_ipc_ns().
 */
static void ipcns_put(struct ns_common *ns)
{
	/* No "return expr;" here: ISO C does not allow it in a void function. */
	put_ipc_ns(to_ipc_ns(ns));
}

176
static int ipcns_install(struct nsproxy *nsproxy, struct ns_common *new)
177
{
178
	struct ipc_namespace *ns = to_ipc_ns(new);
179
	if (!ns_capable(ns->user_ns, CAP_SYS_ADMIN) ||
180
	    !ns_capable(current_user_ns(), CAP_SYS_ADMIN))
181 182
		return -EPERM;

183 184 185 186 187 188 189 190 191 192 193 194 195 196
	/* Ditch state from the old ipc namespace */
	exit_sem(current);
	put_ipc_ns(nsproxy->ipc_ns);
	nsproxy->ipc_ns = get_ipc_ns(ns);
	return 0;
}

/* proc_ns_operations table for the "ipc" namespace type (CLONE_NEWIPC). */
const struct proc_ns_operations ipcns_operations = {
	.name = "ipc",
	.type = CLONE_NEWIPC,
	.get = ipcns_get,
	.put = ipcns_put,
	.install = ipcns_install,
};