genetlink.c 25.6 KB
Newer Older
T
Thomas Graf 已提交
1 2 3 4 5
/*
 * NETLINK      Generic Netlink Family
 *
 * 		Authors:	Jamal Hadi Salim
 * 				Thomas Graf <tgraf@suug.ch>
 *				Johannes Berg <johannes@sipsolutions.net>
 */

#include <linux/module.h>
#include <linux/kernel.h>
11
#include <linux/slab.h>
T
Thomas Graf 已提交
12 13 14 15 16
#include <linux/errno.h>
#include <linux/types.h>
#include <linux/socket.h>
#include <linux/string.h>
#include <linux/skbuff.h>
17
#include <linux/mutex.h>
18
#include <linux/bitmap.h>
19
#include <linux/rwsem.h>
T
Thomas Graf 已提交
20 21 22
#include <net/sock.h>
#include <net/genetlink.h>

23
static DEFINE_MUTEX(genl_mutex); /* serialization of message processing */
24
static DECLARE_RWSEM(cb_lock);
T
Thomas Graf 已提交
25

26 27 28
atomic_t genl_sk_destructing_cnt = ATOMIC_INIT(0);
DECLARE_WAIT_QUEUE_HEAD(genl_sk_destructing_waitq);

29
void genl_lock(void)
T
Thomas Graf 已提交
30
{
31
	mutex_lock(&genl_mutex);
T
Thomas Graf 已提交
32
}
33
EXPORT_SYMBOL(genl_lock);
T
Thomas Graf 已提交
34

35
void genl_unlock(void)
T
Thomas Graf 已提交
36
{
37
	mutex_unlock(&genl_mutex);
T
Thomas Graf 已提交
38
}
39
EXPORT_SYMBOL(genl_unlock);
T
Thomas Graf 已提交
40

41
#ifdef CONFIG_LOCKDEP
42
bool lockdep_genl_is_held(void)
43 44 45 46 47 48
{
	return lockdep_is_held(&genl_mutex);
}
EXPORT_SYMBOL(lockdep_genl_is_held);
#endif

49 50 51 52 53 54 55 56 57 58 59 60
/*
 * Take both locks: cb_lock for writing first, then genl_mutex.
 * genl_unlock_all() releases them in the reverse order.
 */
static void genl_lock_all(void)
{
	down_write(&cb_lock);
	genl_lock();
}

/*
 * Drop the locks taken by genl_lock_all(): genl_mutex first, then the
 * write side of cb_lock.
 */
static void genl_unlock_all(void)
{
	genl_unlock();
	up_write(&cb_lock);
}

T
Thomas Graf 已提交
61 62 63 64
#define GENL_FAM_TAB_SIZE	16
#define GENL_FAM_TAB_MASK	(GENL_FAM_TAB_SIZE - 1)

static struct list_head family_ht[GENL_FAM_TAB_SIZE];
65 66 67 68 69 70
/*
 * Bitmap of multicast groups that are currently in use.
 *
 * To avoid an allocation at boot of just one unsigned long,
 * declare it global instead.
 * Bit 0 is marked as already used since group 0 is invalid.
 * Bit 1 is marked as already used since the drop-monitor code
 * abuses the API and thinks it can statically use group 1.
 * That group will typically conflict with other groups that
 * any proper users use.
 * Bit 16 is marked as used since it's used for generic netlink
 * and the code no longer marks pre-reserved IDs as used.
 * Bit 17 is marked as already used since the VFS quota code
 * also abused this API and relied on family == group ID, we
 * cater to that by giving it a static family and group ID.
 * Bit 18 is marked as already used since the PMCRAID driver
 * did the same thing as the VFS quota code (maybe copied?)
 */
83
static unsigned long mc_group_start = 0x3 | BIT(GENL_ID_CTRL) |
84 85
				      BIT(GENL_ID_VFS_DQUOT) |
				      BIT(GENL_ID_PMCRAID);
86 87
static unsigned long *mc_groups = &mc_group_start;
static unsigned long mc_groups_longs = 1;
T
Thomas Graf 已提交
88

89
static int genl_ctrl_event(int event, struct genl_family *family,
90 91
			   const struct genl_multicast_group *grp,
			   int grp_id);
T
Thomas Graf 已提交
92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126

/* Map a family id to its bucket index in family_ht. */
static inline unsigned int genl_family_hash(unsigned int id)
{
	unsigned int bucket = id & GENL_FAM_TAB_MASK;

	return bucket;
}

/* Return the hash chain (list head) that a family with @id lives on. */
static inline struct list_head *genl_family_chain(unsigned int id)
{
	unsigned int bucket = genl_family_hash(id);

	return &family_ht[bucket];
}

static struct genl_family *genl_family_find_byid(unsigned int id)
{
	struct genl_family *f;

	list_for_each_entry(f, genl_family_chain(id), family_list)
		if (f->id == id)
			return f;

	return NULL;
}

static struct genl_family *genl_family_find_byname(char *name)
{
	struct genl_family *f;
	int i;

	for (i = 0; i < GENL_FAM_TAB_SIZE; i++)
		list_for_each_entry(f, genl_family_chain(i), family_list)
			if (strcmp(f->name, name) == 0)
				return f;

	return NULL;
}

J
Johannes Berg 已提交
127
/*
 * Find the operation of @family that handles command @cmd.
 *
 * Returns a pointer into family->ops, or NULL if none of the
 * family->n_ops entries has a matching cmd.
 */
static const struct genl_ops *genl_get_cmd(u8 cmd, struct genl_family *family)
{
	int idx;

	for (idx = 0; idx < family->n_ops; idx++) {
		const struct genl_ops *op = &family->ops[idx];

		if (op->cmd == cmd)
			return op;
	}

	return NULL;
}

/* Of course we are going to have problems once we hit
 * 2^16 alive types, but that can only happen by year 2K
*/
141
static u16 genl_generate_id(void)
T
Thomas Graf 已提交
142
{
143 144
	static u16 id_gen_idx = GENL_MIN_ID;
	int i;
T
Thomas Graf 已提交
145

146
	for (i = 0; i <= GENL_MAX_ID - GENL_MIN_ID; i++) {
147
		if (id_gen_idx != GENL_ID_VFS_DQUOT &&
148
		    id_gen_idx != GENL_ID_PMCRAID &&
149
		    !genl_family_find_byid(id_gen_idx))
150 151
			return id_gen_idx;
		if (++id_gen_idx > GENL_MAX_ID)
T
Thomas Graf 已提交
152
			id_gen_idx = GENL_MIN_ID;
153
	}
T
Thomas Graf 已提交
154

155
	return 0;
T
Thomas Graf 已提交
156 157
}

158
static int genl_allocate_reserve_groups(int n_groups, int *first_id)
159 160
{
	unsigned long *new_groups;
161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186
	int start = 0;
	int i;
	int id;
	bool fits;

	do {
		if (start == 0)
			id = find_first_zero_bit(mc_groups,
						 mc_groups_longs *
						 BITS_PER_LONG);
		else
			id = find_next_zero_bit(mc_groups,
						mc_groups_longs * BITS_PER_LONG,
						start);

		fits = true;
		for (i = id;
		     i < min_t(int, id + n_groups,
			       mc_groups_longs * BITS_PER_LONG);
		     i++) {
			if (test_bit(i, mc_groups)) {
				start = i;
				fits = false;
				break;
			}
		}
187

188
		if (id + n_groups > mc_groups_longs * BITS_PER_LONG) {
189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210
			unsigned long new_longs = mc_groups_longs +
						  BITS_TO_LONGS(n_groups);
			size_t nlen = new_longs * sizeof(unsigned long);

			if (mc_groups == &mc_group_start) {
				new_groups = kzalloc(nlen, GFP_KERNEL);
				if (!new_groups)
					return -ENOMEM;
				mc_groups = new_groups;
				*mc_groups = mc_group_start;
			} else {
				new_groups = krealloc(mc_groups, nlen,
						      GFP_KERNEL);
				if (!new_groups)
					return -ENOMEM;
				mc_groups = new_groups;
				for (i = 0; i < BITS_TO_LONGS(n_groups); i++)
					mc_groups[mc_groups_longs + i] = 0;
			}
			mc_groups_longs = new_longs;
		}
	} while (!fits);
211

212 213 214 215 216 217 218 219 220 221 222 223
	for (i = id; i < id + n_groups; i++)
		set_bit(i, mc_groups);
	*first_id = id;
	return 0;
}

static struct genl_family genl_ctrl;

static int genl_validate_assign_mc_groups(struct genl_family *family)
{
	int first_id;
	int n_groups = family->n_mcgrps;
224
	int err = 0, i;
225 226 227 228 229 230 231 232 233 234 235 236 237
	bool groups_allocated = false;

	if (!n_groups)
		return 0;

	for (i = 0; i < n_groups; i++) {
		const struct genl_multicast_group *grp = &family->mcgrps[i];

		if (WARN_ON(grp->name[0] == '\0'))
			return -EINVAL;
		if (WARN_ON(memchr(grp->name, '\0', GENL_NAMSIZ) == NULL))
			return -EINVAL;
	}
238

239
	/* special-case our own group and hacks */
240 241 242 243 244 245
	if (family == &genl_ctrl) {
		first_id = GENL_ID_CTRL;
		BUG_ON(n_groups != 1);
	} else if (strcmp(family->name, "NET_DM") == 0) {
		first_id = 1;
		BUG_ON(n_groups != 1);
246
	} else if (family->id == GENL_ID_VFS_DQUOT) {
247 248
		first_id = GENL_ID_VFS_DQUOT;
		BUG_ON(n_groups != 1);
249 250 251
	} else if (family->id == GENL_ID_PMCRAID) {
		first_id = GENL_ID_PMCRAID;
		BUG_ON(n_groups != 1);
252 253 254 255 256
	} else {
		groups_allocated = true;
		err = genl_allocate_reserve_groups(n_groups, &first_id);
		if (err)
			return err;
257 258
	}

259 260 261 262 263 264
	family->mcgrp_offset = first_id;

	/* if still initializing, can't and don't need to to realloc bitmaps */
	if (!init_net.genl_sock)
		return 0;

J
Johannes Berg 已提交
265 266 267
	if (family->netnsok) {
		struct net *net;

268
		netlink_table_grab();
J
Johannes Berg 已提交
269 270
		rcu_read_lock();
		for_each_net_rcu(net) {
271
			err = __netlink_change_ngroups(net->genl_sock,
J
Johannes Berg 已提交
272 273 274 275 276 277 278 279
					mc_groups_longs * BITS_PER_LONG);
			if (err) {
				/*
				 * No need to roll back, can only fail if
				 * memory allocation fails and then the
				 * number of _possible_ groups has been
				 * increased on some sockets which is ok.
				 */
280
				break;
J
Johannes Berg 已提交
281 282 283
			}
		}
		rcu_read_unlock();
284
		netlink_table_ungrab();
J
Johannes Berg 已提交
285 286 287 288
	} else {
		err = netlink_change_ngroups(init_net.genl_sock,
					     mc_groups_longs * BITS_PER_LONG);
	}
289

290 291 292 293
	if (groups_allocated && err) {
		for (i = 0; i < family->n_mcgrps; i++)
			clear_bit(family->mcgrp_offset + i, mc_groups);
	}
294

295
	return err;
296 297
}

298
static void genl_unregister_mc_groups(struct genl_family *family)
299
{
J
Johannes Berg 已提交
300
	struct net *net;
301
	int i;
J
Johannes Berg 已提交
302

303
	netlink_table_grab();
J
Johannes Berg 已提交
304
	rcu_read_lock();
305 306 307 308 309
	for_each_net_rcu(net) {
		for (i = 0; i < family->n_mcgrps; i++)
			__netlink_clear_multicast_users(
				net->genl_sock, family->mcgrp_offset + i);
	}
J
Johannes Berg 已提交
310
	rcu_read_unlock();
311
	netlink_table_ungrab();
J
Johannes Berg 已提交
312

313 314
	for (i = 0; i < family->n_mcgrps; i++) {
		int grp_id = family->mcgrp_offset + i;
315

316 317 318 319 320
		if (grp_id != 1)
			clear_bit(grp_id, mc_groups);
		genl_ctrl_event(CTRL_CMD_DELMCAST_GRP, family,
				&family->mcgrps[i], grp_id);
	}
321 322
}

323
static int genl_validate_ops(const struct genl_family *family)
T
Thomas Graf 已提交
324
{
325 326
	const struct genl_ops *ops = family->ops;
	unsigned int n_ops = family->n_ops;
327 328
	int i, j;

329 330 331 332 333 334
	if (WARN_ON(n_ops && !ops))
		return -EINVAL;

	if (!n_ops)
		return 0;

335 336 337 338 339 340
	for (i = 0; i < n_ops; i++) {
		if (ops[i].dumpit == NULL && ops[i].doit == NULL)
			return -EINVAL;
		for (j = i + 1; j < n_ops; j++)
			if (ops[i].cmd == ops[j].cmd)
				return -EINVAL;
T
Thomas Graf 已提交
341 342
	}

343
	return 0;
T
Thomas Graf 已提交
344 345 346
}

/**
347
 * __genl_register_family - register a generic netlink family
T
Thomas Graf 已提交
348 349 350 351 352 353 354
 * @family: generic netlink family
 *
 * Registers the specified family after validating it first. Only one
 * family may be registered with the same family name or identifier.
 * The family id may equal GENL_ID_GENERATE causing an unique id to
 * be automatically generated and assigned.
 *
355 356 357
 * The family's ops array must already be assigned, you can use the
 * genl_register_family_with_ops() helper function.
 *
T
Thomas Graf 已提交
358 359
 * Return 0 on success or a negative error code.
 */
360
int __genl_register_family(struct genl_family *family)
T
Thomas Graf 已提交
361
{
362
	int err = -EINVAL, i;
T
Thomas Graf 已提交
363 364 365 366 367 368 369

	if (family->id && family->id < GENL_MIN_ID)
		goto errout;

	if (family->id > GENL_MAX_ID)
		goto errout;

370 371 372 373
	err = genl_validate_ops(family);
	if (err)
		return err;

374
	genl_lock_all();
T
Thomas Graf 已提交
375 376 377 378 379 380 381 382 383 384 385 386 387 388 389

	if (genl_family_find_byname(family->name)) {
		err = -EEXIST;
		goto errout_locked;
	}

	if (family->id == GENL_ID_GENERATE) {
		u16 newid = genl_generate_id();

		if (!newid) {
			err = -ENOMEM;
			goto errout_locked;
		}

		family->id = newid;
390 391 392
	} else if (genl_family_find_byid(family->id)) {
		err = -EEXIST;
		goto errout_locked;
T
Thomas Graf 已提交
393 394
	}

395
	if (family->maxattr && !family->parallel_ops) {
T
Thomas Graf 已提交
396 397 398 399
		family->attrbuf = kmalloc((family->maxattr+1) *
					sizeof(struct nlattr *), GFP_KERNEL);
		if (family->attrbuf == NULL) {
			err = -ENOMEM;
400
			goto errout_locked;
T
Thomas Graf 已提交
401 402 403 404
		}
	} else
		family->attrbuf = NULL;

405 406 407 408
	err = genl_validate_assign_mc_groups(family);
	if (err)
		goto errout_locked;

T
Thomas Graf 已提交
409
	list_add_tail(&family->family_list, genl_family_chain(family->id));
410
	genl_unlock_all();
T
Thomas Graf 已提交
411

412 413 414 415 416
	/* send all events */
	genl_ctrl_event(CTRL_CMD_NEWFAMILY, family, NULL, 0);
	for (i = 0; i < family->n_mcgrps; i++)
		genl_ctrl_event(CTRL_CMD_NEWMCAST_GRP, family,
				&family->mcgrps[i], family->mcgrp_offset + i);
T
Thomas Graf 已提交
417 418 419 420

	return 0;

errout_locked:
421
	genl_unlock_all();
T
Thomas Graf 已提交
422 423 424
errout:
	return err;
}
425
EXPORT_SYMBOL(__genl_register_family);
T
Thomas Graf 已提交
426 427 428 429 430 431 432 433 434 435 436 437 438

/**
 * genl_unregister_family - unregister generic netlink family
 * @family: generic netlink family
 *
 * Unregisters the specified family.
 *
 * Returns 0 on success or a negative error code.
 */
int genl_unregister_family(struct genl_family *family)
{
	struct genl_family *rc;

439
	genl_lock_all();
T
Thomas Graf 已提交
440 441 442 443 444

	list_for_each_entry(rc, genl_family_chain(family->id), family_list) {
		if (family->id != rc->id || strcmp(rc->name, family->name))
			continue;

445 446
		genl_unregister_mc_groups(family);

T
Thomas Graf 已提交
447
		list_del(&rc->family_list);
448
		family->n_ops = 0;
449 450 451 452
		up_write(&cb_lock);
		wait_event(genl_sk_destructing_waitq,
			   atomic_read(&genl_sk_destructing_cnt) == 0);
		genl_unlock();
T
Thomas Graf 已提交
453 454

		kfree(family->attrbuf);
455
		genl_ctrl_event(CTRL_CMD_DELFAMILY, family, NULL, 0);
T
Thomas Graf 已提交
456 457 458
		return 0;
	}

459
	genl_unlock_all();
T
Thomas Graf 已提交
460 461 462

	return -ENOENT;
}
463
EXPORT_SYMBOL(genl_unregister_family);
T
Thomas Graf 已提交
464

465 466 467
/**
 * genlmsg_put - Add generic netlink header to netlink message
 * @skb: socket buffer holding the message
468
 * @portid: netlink portid the message is addressed to
469 470
 * @seq: sequence number (usually the one of the sender)
 * @family: generic netlink family
471
 * @flags: netlink message flags
472 473 474 475
 * @cmd: generic netlink command
 *
 * Returns pointer to user specific header
 */
476
void *genlmsg_put(struct sk_buff *skb, u32 portid, u32 seq,
477 478 479 480 481
				struct genl_family *family, int flags, u8 cmd)
{
	struct nlmsghdr *nlh;
	struct genlmsghdr *hdr;

482
	nlh = nlmsg_put(skb, portid, seq, family->id, GENL_HDRLEN +
483 484 485 486 487 488 489 490 491 492 493 494 495
			family->hdrsize, flags);
	if (nlh == NULL)
		return NULL;

	hdr = nlmsg_data(nlh);
	hdr->cmd = cmd;
	hdr->version = family->version;
	hdr->reserved = 0;

	return (char *) hdr + GENL_HDRLEN;
}
EXPORT_SYMBOL(genlmsg_put);

496 497 498 499 500 501 502 503 504 505 506 507 508 509
/*
 * Dump ->start wrapper: runs the operation's start callback, if it has
 * one, with genl_mutex held.  Returns the callback's result, or 0 when
 * there is no start callback.
 */
static int genl_lock_start(struct netlink_callback *cb)
{
	/* our ops are always const - netlink API doesn't propagate that */
	const struct genl_ops *ops = cb->data;
	int rc;

	if (!ops->start)
		return 0;

	genl_lock();
	rc = ops->start(cb);
	genl_unlock();

	return rc;
}

510 511
static int genl_lock_dumpit(struct sk_buff *skb, struct netlink_callback *cb)
{
J
Johannes Berg 已提交
512 513
	/* our ops are always const - netlink API doesn't propagate that */
	const struct genl_ops *ops = cb->data;
514 515 516 517 518 519 520 521 522 523
	int rc;

	genl_lock();
	rc = ops->dumpit(skb, cb);
	genl_unlock();
	return rc;
}

static int genl_lock_done(struct netlink_callback *cb)
{
J
Johannes Berg 已提交
524 525
	/* our ops are always const - netlink API doesn't propagate that */
	const struct genl_ops *ops = cb->data;
526 527 528 529 530 531 532 533 534 535
	int rc = 0;

	if (ops->done) {
		genl_lock();
		rc = ops->done(cb);
		genl_unlock();
	}
	return rc;
}

536 537 538
static int genl_family_rcv_msg(struct genl_family *family,
			       struct sk_buff *skb,
			       struct nlmsghdr *nlh)
T
Thomas Graf 已提交
539
{
J
Johannes Berg 已提交
540
	const struct genl_ops *ops;
J
Johannes Berg 已提交
541
	struct net *net = sock_net(skb->sk);
T
Thomas Graf 已提交
542 543
	struct genl_info info;
	struct genlmsghdr *hdr = nlmsg_data(nlh);
544
	struct nlattr **attrbuf;
545
	int hdrlen, err;
T
Thomas Graf 已提交
546

J
Johannes Berg 已提交
547 548 549 550
	/* this family doesn't exist in this netns */
	if (!family->netnsok && !net_eq(net, &init_net))
		return -ENOENT;

T
Thomas Graf 已提交
551 552
	hdrlen = GENL_HDRLEN + family->hdrsize;
	if (nlh->nlmsg_len < nlmsg_msg_size(hdrlen))
553
		return -EINVAL;
T
Thomas Graf 已提交
554 555

	ops = genl_get_cmd(hdr->cmd, family);
556 557
	if (ops == NULL)
		return -EOPNOTSUPP;
T
Thomas Graf 已提交
558

559
	if ((ops->flags & GENL_ADMIN_PERM) &&
560
	    !netlink_capable(skb, CAP_NET_ADMIN))
561
		return -EPERM;
T
Thomas Graf 已提交
562

563 564 565 566
	if ((ops->flags & GENL_UNS_ADMIN_PERM) &&
	    !netlink_ns_capable(skb, net->user_ns, CAP_NET_ADMIN))
		return -EPERM;

567
	if ((nlh->nlmsg_flags & NLM_F_DUMP) == NLM_F_DUMP) {
568
		int rc;
569

570 571
		if (ops->dumpit == NULL)
			return -EOPNOTSUPP;
T
Thomas Graf 已提交
572

573 574
		if (!family->parallel_ops) {
			struct netlink_dump_control c = {
575
				.module = family->module,
J
Johannes Berg 已提交
576 577
				/* we have const, but the netlink API doesn't */
				.data = (void *)ops,
578
				.start = genl_lock_start,
579 580 581 582 583
				.dump = genl_lock_dumpit,
				.done = genl_lock_done,
			};

			genl_unlock();
584
			rc = __netlink_dump_start(net->genl_sock, skb, nlh, &c);
585 586 587 588
			genl_lock();

		} else {
			struct netlink_dump_control c = {
589
				.module = family->module,
590
				.start = ops->start,
591 592 593 594
				.dump = ops->dumpit,
				.done = ops->done,
			};

595
			rc = __netlink_dump_start(net->genl_sock, skb, nlh, &c);
596 597 598
		}

		return rc;
T
Thomas Graf 已提交
599 600
	}

601 602
	if (ops->doit == NULL)
		return -EOPNOTSUPP;
T
Thomas Graf 已提交
603

604 605 606 607 608 609 610 611 612 613
	if (family->maxattr && family->parallel_ops) {
		attrbuf = kmalloc((family->maxattr+1) *
					sizeof(struct nlattr *), GFP_KERNEL);
		if (attrbuf == NULL)
			return -ENOMEM;
	} else
		attrbuf = family->attrbuf;

	if (attrbuf) {
		err = nlmsg_parse(nlh, hdrlen, attrbuf, family->maxattr,
T
Thomas Graf 已提交
614 615
				  ops->policy);
		if (err < 0)
616
			goto out;
T
Thomas Graf 已提交
617 618 619
	}

	info.snd_seq = nlh->nlmsg_seq;
620
	info.snd_portid = NETLINK_CB(skb).portid;
T
Thomas Graf 已提交
621 622 623
	info.nlhdr = nlh;
	info.genlhdr = nlmsg_data(nlh);
	info.userhdr = nlmsg_data(nlh) + GENL_HDRLEN;
624
	info.attrs = attrbuf;
J
Johannes Berg 已提交
625
	genl_info_net_set(&info, net);
626
	memset(&info.user_ptr, 0, sizeof(info.user_ptr));
T
Thomas Graf 已提交
627

628 629 630
	if (family->pre_doit) {
		err = family->pre_doit(ops, skb, &info);
		if (err)
631
			goto out;
632 633 634 635 636 637 638
	}

	err = ops->doit(skb, &info);

	if (family->post_doit)
		family->post_doit(ops, skb, &info);

639
out:
640 641 642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660 661 662
	if (family->parallel_ops)
		kfree(attrbuf);

	return err;
}

/*
 * Per-message receive callback: look the family up by the netlink
 * message type and let it process the message.  Families that are not
 * parallel_ops are processed with genl_mutex held.  Returns -ENOENT for
 * an unknown family id, otherwise the family handler's result.
 */
static int genl_rcv_msg(struct sk_buff *skb, struct nlmsghdr *nlh)
{
	struct genl_family *fam = genl_family_find_byid(nlh->nlmsg_type);
	int ret;

	if (!fam)
		return -ENOENT;

	if (!fam->parallel_ops)
		genl_lock();

	ret = genl_family_rcv_msg(fam, skb, nlh);

	if (!fam->parallel_ops)
		genl_unlock();

	return ret;
}

666
static void genl_rcv(struct sk_buff *skb)
T
Thomas Graf 已提交
667
{
668
	down_read(&cb_lock);
669
	netlink_rcv_skb(skb, &genl_rcv_msg);
670
	up_read(&cb_lock);
T
Thomas Graf 已提交
671 672 673 674 675 676
}

/**************************************************************************
 * Controller
 **************************************************************************/

677 678 679
static struct genl_family genl_ctrl = {
	.id = GENL_ID_CTRL,
	.name = "nlctrl",
680
	.version = 0x2,
681
	.maxattr = CTRL_ATTR_MAX,
J
Johannes Berg 已提交
682
	.netnsok = true,
683 684
};

685
/*
 * Append a controller message describing @family to @skb.
 *
 * The message carries the family name, id, version, header size and
 * maxattr, followed by a nested CTRL_ATTR_OPS list (one entry per
 * operation with its id and capability flags) if the family has
 * operations, and a nested CTRL_ATTR_MCAST_GROUPS list (id and name of
 * each group) if it has multicast groups.
 *
 * Returns 0 on success or -EMSGSIZE if the message does not fit into
 * @skb; on an attribute failure the partially built message is
 * cancelled.
 */
static int ctrl_fill_info(struct genl_family *family, u32 portid, u32 seq,
			  u32 flags, struct sk_buff *skb, u8 cmd)
{
	void *hdr;

	hdr = genlmsg_put(skb, portid, seq, &genl_ctrl, flags, cmd);
	if (hdr == NULL)
		return -EMSGSIZE;	/* a bare -1 would read as -EPERM */

	if (nla_put_string(skb, CTRL_ATTR_FAMILY_NAME, family->name) ||
	    nla_put_u16(skb, CTRL_ATTR_FAMILY_ID, family->id) ||
	    nla_put_u32(skb, CTRL_ATTR_VERSION, family->version) ||
	    nla_put_u32(skb, CTRL_ATTR_HDRSIZE, family->hdrsize) ||
	    nla_put_u32(skb, CTRL_ATTR_MAXATTR, family->maxattr))
		goto nla_put_failure;

	if (family->n_ops) {
		struct nlattr *nla_ops;
		int i;

		nla_ops = nla_nest_start(skb, CTRL_ATTR_OPS);
		if (nla_ops == NULL)
			goto nla_put_failure;

		for (i = 0; i < family->n_ops; i++) {
			struct nlattr *nest;
			const struct genl_ops *ops = &family->ops[i];
			u32 op_flags = ops->flags;

			/* advertise which handlers the operation provides */
			if (ops->dumpit)
				op_flags |= GENL_CMD_CAP_DUMP;
			if (ops->doit)
				op_flags |= GENL_CMD_CAP_DO;
			if (ops->policy)
				op_flags |= GENL_CMD_CAP_HASPOL;

			/* nested entries are numbered starting at 1 */
			nest = nla_nest_start(skb, i + 1);
			if (nest == NULL)
				goto nla_put_failure;

			if (nla_put_u32(skb, CTRL_ATTR_OP_ID, ops->cmd) ||
			    nla_put_u32(skb, CTRL_ATTR_OP_FLAGS, op_flags))
				goto nla_put_failure;

			nla_nest_end(skb, nest);
		}

		nla_nest_end(skb, nla_ops);
	}

	if (family->n_mcgrps) {
		struct nlattr *nla_grps;
		int i;

		nla_grps = nla_nest_start(skb, CTRL_ATTR_MCAST_GROUPS);
		if (nla_grps == NULL)
			goto nla_put_failure;

		for (i = 0; i < family->n_mcgrps; i++) {
			struct nlattr *nest;
			const struct genl_multicast_group *grp;

			grp = &family->mcgrps[i];

			nest = nla_nest_start(skb, i + 1);
			if (nest == NULL)
				goto nla_put_failure;

			if (nla_put_u32(skb, CTRL_ATTR_MCAST_GRP_ID,
					family->mcgrp_offset + i) ||
			    nla_put_string(skb, CTRL_ATTR_MCAST_GRP_NAME,
					   grp->name))
				goto nla_put_failure;

			nla_nest_end(skb, nest);
		}
		nla_nest_end(skb, nla_grps);
	}

	genlmsg_end(skb, hdr);
	return 0;

nla_put_failure:
	genlmsg_cancel(skb, hdr);
	return -EMSGSIZE;
}

772
/*
 * Append a controller message describing a single multicast group to
 * @skb: the owning family's name and id, plus a CTRL_ATTR_MCAST_GROUPS
 * nest holding one entry with the group's id (@grp_id) and name.
 *
 * Returns 0 on success or -EMSGSIZE if the message does not fit into
 * @skb; on an attribute failure the partially built message is
 * cancelled.
 */
static int ctrl_fill_mcgrp_info(struct genl_family *family,
				const struct genl_multicast_group *grp,
				int grp_id, u32 portid, u32 seq, u32 flags,
				struct sk_buff *skb, u8 cmd)
{
	void *hdr;
	struct nlattr *nla_grps;
	struct nlattr *nest;

	hdr = genlmsg_put(skb, portid, seq, &genl_ctrl, flags, cmd);
	if (hdr == NULL)
		return -EMSGSIZE;	/* a bare -1 would read as -EPERM */

	if (nla_put_string(skb, CTRL_ATTR_FAMILY_NAME, family->name) ||
	    nla_put_u16(skb, CTRL_ATTR_FAMILY_ID, family->id))
		goto nla_put_failure;

	nla_grps = nla_nest_start(skb, CTRL_ATTR_MCAST_GROUPS);
	if (nla_grps == NULL)
		goto nla_put_failure;

	nest = nla_nest_start(skb, 1);
	if (nest == NULL)
		goto nla_put_failure;

	if (nla_put_u32(skb, CTRL_ATTR_MCAST_GRP_ID, grp_id) ||
	    nla_put_string(skb, CTRL_ATTR_MCAST_GRP_NAME,
			   grp->name))
		goto nla_put_failure;

	nla_nest_end(skb, nest);
	nla_nest_end(skb, nla_grps);

	genlmsg_end(skb, hdr);
	return 0;

nla_put_failure:
	genlmsg_cancel(skb, hdr);
	return -EMSGSIZE;
}

static int ctrl_dumpfamily(struct sk_buff *skb, struct netlink_callback *cb)
{

	int i, n = 0;
	struct genl_family *rt;
J
Johannes Berg 已提交
818
	struct net *net = sock_net(skb->sk);
T
Thomas Graf 已提交
819 820 821
	int chains_to_skip = cb->args[0];
	int fams_to_skip = cb->args[1];

822
	for (i = chains_to_skip; i < GENL_FAM_TAB_SIZE; i++) {
T
Thomas Graf 已提交
823 824
		n = 0;
		list_for_each_entry(rt, genl_family_chain(i), family_list) {
J
Johannes Berg 已提交
825 826
			if (!rt->netnsok && !net_eq(net, &init_net))
				continue;
T
Thomas Graf 已提交
827 828
			if (++n < fams_to_skip)
				continue;
829
			if (ctrl_fill_info(rt, NETLINK_CB(cb->skb).portid,
T
Thomas Graf 已提交
830 831 832 833 834 835 836 837 838 839 840 841 842 843 844
					   cb->nlh->nlmsg_seq, NLM_F_MULTI,
					   skb, CTRL_CMD_NEWFAMILY) < 0)
				goto errout;
		}

		fams_to_skip = 0;
	}

errout:
	cb->args[0] = i;
	cb->args[1] = n;

	return skb->len;
}

845
static struct sk_buff *ctrl_build_family_msg(struct genl_family *family,
846
					     u32 portid, int seq, u8 cmd)
T
Thomas Graf 已提交
847 848 849 850
{
	struct sk_buff *skb;
	int err;

851
	skb = nlmsg_new(NLMSG_DEFAULT_SIZE, GFP_KERNEL);
T
Thomas Graf 已提交
852 853 854
	if (skb == NULL)
		return ERR_PTR(-ENOBUFS);

855
	err = ctrl_fill_info(family, portid, seq, 0, skb, cmd);
T
Thomas Graf 已提交
856 857 858 859 860 861 862 863
	if (err < 0) {
		nlmsg_free(skb);
		return ERR_PTR(err);
	}

	return skb;
}

864 865 866 867
/*
 * Allocate a new message and fill it with the description of one
 * multicast group of @family.
 *
 * Returns the skb, ERR_PTR(-ENOBUFS) if allocation fails, or an
 * ERR_PTR() carrying ctrl_fill_mcgrp_info()'s error (the skb is freed
 * then).
 */
static struct sk_buff *
ctrl_build_mcgrp_msg(struct genl_family *family,
		     const struct genl_multicast_group *grp,
		     int grp_id, u32 portid, int seq, u8 cmd)
{
	struct sk_buff *msg = nlmsg_new(NLMSG_DEFAULT_SIZE, GFP_KERNEL);
	int ret;

	if (!msg)
		return ERR_PTR(-ENOBUFS);

	ret = ctrl_fill_mcgrp_info(family, grp, grp_id, portid,
				   seq, 0, msg, cmd);
	if (ret >= 0)
		return msg;

	nlmsg_free(msg);
	return ERR_PTR(ret);
}

886
static const struct nla_policy ctrl_policy[CTRL_ATTR_MAX+1] = {
T
Thomas Graf 已提交
887
	[CTRL_ATTR_FAMILY_ID]	= { .type = NLA_U16 },
888 889
	[CTRL_ATTR_FAMILY_NAME]	= { .type = NLA_NUL_STRING,
				    .len = GENL_NAMSIZ - 1 },
T
Thomas Graf 已提交
890 891 892 893 894 895 896 897 898 899 900
};

static int ctrl_getfamily(struct sk_buff *skb, struct genl_info *info)
{
	struct sk_buff *msg;
	struct genl_family *res = NULL;
	int err = -EINVAL;

	if (info->attrs[CTRL_ATTR_FAMILY_ID]) {
		u16 id = nla_get_u16(info->attrs[CTRL_ATTR_FAMILY_ID]);
		res = genl_family_find_byid(id);
J
Johannes Berg 已提交
901
		err = -ENOENT;
T
Thomas Graf 已提交
902 903 904
	}

	if (info->attrs[CTRL_ATTR_FAMILY_NAME]) {
905
		char *name;
T
Thomas Graf 已提交
906

907
		name = nla_data(info->attrs[CTRL_ATTR_FAMILY_NAME]);
T
Thomas Graf 已提交
908
		res = genl_family_find_byname(name);
909 910 911
#ifdef CONFIG_MODULES
		if (res == NULL) {
			genl_unlock();
912
			up_read(&cb_lock);
913
			request_module("net-pf-%d-proto-%d-family-%s",
914
				       PF_NETLINK, NETLINK_GENERIC, name);
915
			down_read(&cb_lock);
916 917 918 919
			genl_lock();
			res = genl_family_find_byname(name);
		}
#endif
J
Johannes Berg 已提交
920
		err = -ENOENT;
T
Thomas Graf 已提交
921 922
	}

J
Johannes Berg 已提交
923 924 925 926 927 928
	if (res == NULL)
		return err;

	if (!res->netnsok && !net_eq(genl_info_net(info), &init_net)) {
		/* family doesn't exist here */
		return -ENOENT;
T
Thomas Graf 已提交
929 930
	}

931
	msg = ctrl_build_family_msg(res, info->snd_portid, info->snd_seq,
932
				    CTRL_CMD_NEWFAMILY);
J
Johannes Berg 已提交
933 934
	if (IS_ERR(msg))
		return PTR_ERR(msg);
T
Thomas Graf 已提交
935

J
Johannes Berg 已提交
936
	return genlmsg_reply(msg, info);
T
Thomas Graf 已提交
937 938
}

939
static int genl_ctrl_event(int event, struct genl_family *family,
940 941
			   const struct genl_multicast_group *grp,
			   int grp_id)
T
Thomas Graf 已提交
942 943 944
{
	struct sk_buff *msg;

J
Johannes Berg 已提交
945 946
	/* genl is still initialising */
	if (!init_net.genl_sock)
T
Thomas Graf 已提交
947 948 949 950 951
		return 0;

	switch (event) {
	case CTRL_CMD_NEWFAMILY:
	case CTRL_CMD_DELFAMILY:
952
		WARN_ON(grp);
J
Johannes Berg 已提交
953
		msg = ctrl_build_family_msg(family, 0, 0, event);
954 955 956
		break;
	case CTRL_CMD_NEWMCAST_GRP:
	case CTRL_CMD_DELMCAST_GRP:
957
		BUG_ON(!grp);
958
		msg = ctrl_build_mcgrp_msg(family, grp, grp_id, 0, 0, event);
T
Thomas Graf 已提交
959
		break;
J
Johannes Berg 已提交
960 961 962 963 964 965 966 967
	default:
		return -EINVAL;
	}

	if (IS_ERR(msg))
		return PTR_ERR(msg);

	if (!family->netnsok) {
968
		genlmsg_multicast_netns(&genl_ctrl, &init_net, msg, 0,
969
					0, GFP_KERNEL);
J
Johannes Berg 已提交
970 971
	} else {
		rcu_read_lock();
972
		genlmsg_multicast_allns(&genl_ctrl, msg, 0,
973
					0, GFP_ATOMIC);
J
Johannes Berg 已提交
974
		rcu_read_unlock();
T
Thomas Graf 已提交
975 976 977 978 979
	}

	return 0;
}

980 981 982 983 984 985 986
/* Operations of the controller family: a single GETFAMILY command. */
static struct genl_ops genl_ctrl_ops[] = {
	{
		.cmd	= CTRL_CMD_GETFAMILY,
		.doit	= ctrl_getfamily,
		.dumpit	= ctrl_dumpfamily,
		.policy	= ctrl_policy,
	},
};

989 990
/* Multicast groups of the controller family: just "notify". */
static struct genl_multicast_group genl_ctrl_groups[] = {
	{
		.name = "notify",
	},
};

993
static int genl_bind(struct net *net, int group)
994
{
995
	int i, err = -ENOENT;
996 997 998 999 1000 1001 1002 1003 1004 1005

	down_read(&cb_lock);
	for (i = 0; i < GENL_FAM_TAB_SIZE; i++) {
		struct genl_family *f;

		list_for_each_entry(f, genl_family_chain(i), family_list) {
			if (group >= f->mcgrp_offset &&
			    group < f->mcgrp_offset + f->n_mcgrps) {
				int fam_grp = group - f->mcgrp_offset;

1006 1007 1008 1009
				if (!f->netnsok && net != &init_net)
					err = -ENOENT;
				else if (f->mcast_bind)
					err = f->mcast_bind(net, fam_grp);
1010 1011 1012 1013 1014 1015 1016 1017 1018 1019 1020
				else
					err = 0;
				break;
			}
		}
	}
	up_read(&cb_lock);

	return err;
}

1021
static void genl_unbind(struct net *net, int group)
1022 1023 1024 1025 1026 1027 1028 1029 1030 1031 1032 1033 1034
{
	int i;

	down_read(&cb_lock);
	for (i = 0; i < GENL_FAM_TAB_SIZE; i++) {
		struct genl_family *f;

		list_for_each_entry(f, genl_family_chain(i), family_list) {
			if (group >= f->mcgrp_offset &&
			    group < f->mcgrp_offset + f->n_mcgrps) {
				int fam_grp = group - f->mcgrp_offset;

				if (f->mcast_unbind)
1035
					f->mcast_unbind(net, fam_grp);
1036 1037 1038 1039 1040 1041 1042
				break;
			}
		}
	}
	up_read(&cb_lock);
}

J
Johannes Berg 已提交
1043 1044
/*
 * Per-namespace init: create the NETLINK_GENERIC kernel socket for @net.
 * Failing to create it for init_net is fatal (panic); for any other
 * namespace -ENOMEM is returned.
 */
static int __net_init genl_pernet_init(struct net *net)
{
	struct netlink_kernel_cfg cfg = {
		.input		= genl_rcv,
		.flags		= NL_CFG_F_NONROOT_RECV,
		.bind		= genl_bind,
		.unbind		= genl_unbind,
	};

	/* we'll bump the group number right afterwards */
	net->genl_sock = netlink_kernel_create(net, NETLINK_GENERIC, &cfg);
	if (net->genl_sock)
		return 0;

	if (net_eq(net, &init_net))
		panic("GENL: Cannot initialize generic netlink\n");

	return -ENOMEM;
}

/* Per-namespace exit: release the namespace's generic netlink socket. */
static void __net_exit genl_pernet_exit(struct net *net)
{
	struct sock *sk = net->genl_sock;

	netlink_kernel_release(sk);
	net->genl_sock = NULL;
}

/* Hooks run for every network namespace that is created or destroyed. */
static struct pernet_operations genl_pernet_ops = {
	.init	= genl_pernet_init,
	.exit	= genl_pernet_exit,
};

T
Thomas Graf 已提交
1075 1076 1077 1078 1079 1080 1081
/*
 * Subsystem init: set up the family hash table, register the controller
 * family with its ops and groups, then register the per-namespace
 * operations.  Any failure is fatal (panic).
 */
static int __init genl_init(void)
{
	int bucket, err;

	for (bucket = 0; bucket < GENL_FAM_TAB_SIZE; bucket++)
		INIT_LIST_HEAD(&family_ht[bucket]);

	err = genl_register_family_with_ops_groups(&genl_ctrl, genl_ctrl_ops,
						   genl_ctrl_groups);
	if (err < 0)
		goto problem;

	err = register_pernet_subsys(&genl_pernet_ops);
	if (!err)
		return 0;

problem:
	panic("GENL: Cannot register controller: %d\n", err);
}

subsys_initcall(genl_init);

1099
static int genlmsg_mcast(struct sk_buff *skb, u32 portid, unsigned long group,
J
Johannes Berg 已提交
1100 1101 1102 1103 1104 1105 1106 1107 1108 1109 1110 1111 1112 1113
			 gfp_t flags)
{
	struct sk_buff *tmp;
	struct net *net, *prev = NULL;
	int err;

	for_each_net_rcu(net) {
		if (prev) {
			tmp = skb_clone(skb, flags);
			if (!tmp) {
				err = -ENOMEM;
				goto error;
			}
			err = nlmsg_multicast(prev->genl_sock, tmp,
1114
					      portid, group, flags);
J
Johannes Berg 已提交
1115 1116 1117 1118 1119 1120 1121
			if (err)
				goto error;
		}

		prev = net;
	}

1122
	return nlmsg_multicast(prev->genl_sock, skb, portid, group, flags);
J
Johannes Berg 已提交
1123 1124 1125 1126 1127
 error:
	kfree_skb(skb);
	return err;
}

1128 1129
/*
 * Multicast @skb to a group of @family in all network namespaces.
 *
 * @group is the family-relative group index; it is converted to the
 * global group id by adding family->mcgrp_offset.  An index outside the
 * family's groups triggers a one-time warning and -EINVAL.
 */
int genlmsg_multicast_allns(struct genl_family *family, struct sk_buff *skb,
			    u32 portid, unsigned int group, gfp_t flags)
{
	if (WARN_ON_ONCE(group >= family->n_mcgrps))
		return -EINVAL;

	group += family->mcgrp_offset;

	return genlmsg_mcast(skb, portid, group, flags);
}
EXPORT_SYMBOL(genlmsg_multicast_allns);
P
Pravin B Shelar 已提交
1137

J
Jiri Benc 已提交
1138 1139
/*
 * Send the notification @skb for a group of @family via nlmsg_notify()
 * on the generic netlink socket of the namespace recorded in @info.
 *
 * @group is the family-relative group index; an index outside the
 * family's groups triggers a one-time warning and nothing is sent.
 * The report flag is taken from the request header when @info has one,
 * and is 0 otherwise.
 */
void genl_notify(struct genl_family *family, struct sk_buff *skb,
		 struct genl_info *info, u32 group, gfp_t flags)
{
	struct net *net = genl_info_net(info);
	struct sock *sk = net->genl_sock;
	int report = info->nlhdr ? nlmsg_report(info->nlhdr) : 0;

	if (WARN_ON_ONCE(group >= family->n_mcgrps))
		return;

	group += family->mcgrp_offset;
	nlmsg_notify(sk, skb, info->snd_portid, group, report, flags);
}
EXPORT_SYMBOL(genl_notify);