/*
 * NETLINK      Generic Netlink Family
 *
 * 		Authors:	Jamal Hadi Salim
 * 				Thomas Graf <tgraf@suug.ch>
 *				Johannes Berg <johannes@sipsolutions.net>
 */

#include <linux/module.h>
#include <linux/kernel.h>
11
#include <linux/slab.h>
T
Thomas Graf 已提交
12 13 14 15 16
#include <linux/errno.h>
#include <linux/types.h>
#include <linux/socket.h>
#include <linux/string.h>
#include <linux/skbuff.h>
17
#include <linux/mutex.h>
18
#include <linux/bitmap.h>
19
#include <linux/rwsem.h>
T
Thomas Graf 已提交
20 21 22
#include <net/sock.h>
#include <net/genetlink.h>

23
static DEFINE_MUTEX(genl_mutex); /* serialization of message processing */
24
static DECLARE_RWSEM(cb_lock);
T
Thomas Graf 已提交
25

26 27 28
atomic_t genl_sk_destructing_cnt = ATOMIC_INIT(0);
DECLARE_WAIT_QUEUE_HEAD(genl_sk_destructing_waitq);

29
void genl_lock(void)
T
Thomas Graf 已提交
30
{
31
	mutex_lock(&genl_mutex);
T
Thomas Graf 已提交
32
}
33
EXPORT_SYMBOL(genl_lock);
T
Thomas Graf 已提交
34

35
void genl_unlock(void)
T
Thomas Graf 已提交
36
{
37
	mutex_unlock(&genl_mutex);
T
Thomas Graf 已提交
38
}
39
EXPORT_SYMBOL(genl_unlock);
T
Thomas Graf 已提交
40

41
#ifdef CONFIG_LOCKDEP
/* Lockdep helper: reports whether genl_mutex is currently held. */
bool lockdep_genl_is_held(void)
{
	return lockdep_is_held(&genl_mutex);
}
EXPORT_SYMBOL(lockdep_genl_is_held);
#endif

49 50 51 52 53 54 55 56 57 58 59 60
/*
 * Take both locks: cb_lock for writing first, then the genl mutex.
 * genl_unlock_all() releases them in the opposite order.
 */
static void genl_lock_all(void)
{
	down_write(&cb_lock);
	genl_lock();
}

/* Undo genl_lock_all(): drop the genl mutex, then the cb_lock write side. */
static void genl_unlock_all(void)
{
	genl_unlock();
	up_write(&cb_lock);
}

T
Thomas Graf 已提交
61 62 63 64
/*
 * Number of chains in the family hash table.  The hash is computed by
 * masking the family id with GENL_FAM_TAB_MASK (size - 1), which only
 * reaches every chain when the size is a power of two.
 */
#define GENL_FAM_TAB_SIZE	16
#define GENL_FAM_TAB_MASK	(GENL_FAM_TAB_SIZE - 1)

/* Registered families, chained by hashed family id. */
static struct list_head family_ht[GENL_FAM_TAB_SIZE];
65 66 67 68 69 70
/*
 * Bitmap of multicast groups that are currently in use.
 *
 * To avoid an allocation at boot of just one unsigned long,
 * declare it global instead.
 * Bit 0 is marked as already used since group 0 is invalid.
71 72 73 74
 * Bit 1 is marked as already used since the drop-monitor code
 * abuses the API and thinks it can statically use group 1.
 * That group will typically conflict with other groups that
 * any proper users use.
75 76
 * Bit 16 is marked as used since it's used for generic netlink
 * and the code no longer marks pre-reserved IDs as used.
77 78 79
 * Bit 17 is marked as already used since the VFS quota code
 * also abused this API and relied on family == group ID, we
 * cater to that by giving it a static family and group ID.
80 81
 * Bit 18 is marked as already used since the PMCRAID driver
 * did the same thing as the VFS quota code (maybe copied?)
82
 */
83
static unsigned long mc_group_start = 0x3 | BIT(GENL_ID_CTRL) |
84 85
				      BIT(GENL_ID_VFS_DQUOT) |
				      BIT(GENL_ID_PMCRAID);
86 87
static unsigned long *mc_groups = &mc_group_start;
static unsigned long mc_groups_longs = 1;
T
Thomas Graf 已提交
88

89
/* Forward declaration: the (un)registration code below emits controller events. */
static int genl_ctrl_event(int event, struct genl_family *family,
			   const struct genl_multicast_group *grp,
			   int grp_id);
T
Thomas Graf 已提交
92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126

/* Reduce a family id to the index of its hash chain. */
static inline unsigned int genl_family_hash(unsigned int id)
{
	unsigned int bucket = id & GENL_FAM_TAB_MASK;

	return bucket;
}

/* Return the head of the hash chain that holds families with the given id. */
static inline struct list_head *genl_family_chain(unsigned int id)
{
	return family_ht + genl_family_hash(id);
}

static struct genl_family *genl_family_find_byid(unsigned int id)
{
	struct genl_family *f;

	list_for_each_entry(f, genl_family_chain(id), family_list)
		if (f->id == id)
			return f;

	return NULL;
}

static struct genl_family *genl_family_find_byname(char *name)
{
	struct genl_family *f;
	int i;

	for (i = 0; i < GENL_FAM_TAB_SIZE; i++)
		list_for_each_entry(f, genl_family_chain(i), family_list)
			if (strcmp(f->name, name) == 0)
				return f;

	return NULL;
}

J
Johannes Berg 已提交
127
/*
 * Find the operation descriptor that handles @cmd in @family.
 * Returns NULL when the family has no operation for that command.
 */
static const struct genl_ops *genl_get_cmd(u8 cmd, struct genl_family *family)
{
	int idx;

	for (idx = 0; idx < family->n_ops; idx++) {
		const struct genl_ops *op = &family->ops[idx];

		if (op->cmd == cmd)
			return op;
	}

	return NULL;
}

/* Of course we are going to have problems once we hit
 * 2^16 alive types, but that can only happen by year 2K
*/
141
static u16 genl_generate_id(void)
T
Thomas Graf 已提交
142
{
143 144
	static u16 id_gen_idx = GENL_MIN_ID;
	int i;
T
Thomas Graf 已提交
145

146
	for (i = 0; i <= GENL_MAX_ID - GENL_MIN_ID; i++) {
147
		if (id_gen_idx != GENL_ID_VFS_DQUOT &&
148
		    id_gen_idx != GENL_ID_PMCRAID &&
149
		    !genl_family_find_byid(id_gen_idx))
150 151
			return id_gen_idx;
		if (++id_gen_idx > GENL_MAX_ID)
T
Thomas Graf 已提交
152
			id_gen_idx = GENL_MIN_ID;
153
	}
T
Thomas Graf 已提交
154

155
	return 0;
T
Thomas Graf 已提交
156 157
}

158
static int genl_allocate_reserve_groups(int n_groups, int *first_id)
159 160
{
	unsigned long *new_groups;
161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186
	int start = 0;
	int i;
	int id;
	bool fits;

	do {
		if (start == 0)
			id = find_first_zero_bit(mc_groups,
						 mc_groups_longs *
						 BITS_PER_LONG);
		else
			id = find_next_zero_bit(mc_groups,
						mc_groups_longs * BITS_PER_LONG,
						start);

		fits = true;
		for (i = id;
		     i < min_t(int, id + n_groups,
			       mc_groups_longs * BITS_PER_LONG);
		     i++) {
			if (test_bit(i, mc_groups)) {
				start = i;
				fits = false;
				break;
			}
		}
187

188
		if (id + n_groups >= mc_groups_longs * BITS_PER_LONG) {
189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210
			unsigned long new_longs = mc_groups_longs +
						  BITS_TO_LONGS(n_groups);
			size_t nlen = new_longs * sizeof(unsigned long);

			if (mc_groups == &mc_group_start) {
				new_groups = kzalloc(nlen, GFP_KERNEL);
				if (!new_groups)
					return -ENOMEM;
				mc_groups = new_groups;
				*mc_groups = mc_group_start;
			} else {
				new_groups = krealloc(mc_groups, nlen,
						      GFP_KERNEL);
				if (!new_groups)
					return -ENOMEM;
				mc_groups = new_groups;
				for (i = 0; i < BITS_TO_LONGS(n_groups); i++)
					mc_groups[mc_groups_longs + i] = 0;
			}
			mc_groups_longs = new_longs;
		}
	} while (!fits);
211

212 213 214 215 216 217 218 219 220 221 222 223
	for (i = id; i < id + n_groups; i++)
		set_bit(i, mc_groups);
	*first_id = id;
	return 0;
}

/* Tentative definition of the controller family; it is initialized further down. */
static struct genl_family genl_ctrl;

static int genl_validate_assign_mc_groups(struct genl_family *family)
{
	int first_id;
	int n_groups = family->n_mcgrps;
224
	int err = 0, i;
225 226 227 228 229 230 231 232 233 234 235 236 237
	bool groups_allocated = false;

	if (!n_groups)
		return 0;

	for (i = 0; i < n_groups; i++) {
		const struct genl_multicast_group *grp = &family->mcgrps[i];

		if (WARN_ON(grp->name[0] == '\0'))
			return -EINVAL;
		if (WARN_ON(memchr(grp->name, '\0', GENL_NAMSIZ) == NULL))
			return -EINVAL;
	}
238

239
	/* special-case our own group and hacks */
240 241 242 243 244 245
	if (family == &genl_ctrl) {
		first_id = GENL_ID_CTRL;
		BUG_ON(n_groups != 1);
	} else if (strcmp(family->name, "NET_DM") == 0) {
		first_id = 1;
		BUG_ON(n_groups != 1);
246
	} else if (family->id == GENL_ID_VFS_DQUOT) {
247 248
		first_id = GENL_ID_VFS_DQUOT;
		BUG_ON(n_groups != 1);
249 250 251
	} else if (family->id == GENL_ID_PMCRAID) {
		first_id = GENL_ID_PMCRAID;
		BUG_ON(n_groups != 1);
252 253 254 255 256
	} else {
		groups_allocated = true;
		err = genl_allocate_reserve_groups(n_groups, &first_id);
		if (err)
			return err;
257 258
	}

259 260 261 262 263 264
	family->mcgrp_offset = first_id;

	/* if still initializing, can't and don't need to to realloc bitmaps */
	if (!init_net.genl_sock)
		return 0;

J
Johannes Berg 已提交
265 266 267
	if (family->netnsok) {
		struct net *net;

268
		netlink_table_grab();
J
Johannes Berg 已提交
269 270
		rcu_read_lock();
		for_each_net_rcu(net) {
271
			err = __netlink_change_ngroups(net->genl_sock,
J
Johannes Berg 已提交
272 273 274 275 276 277 278 279
					mc_groups_longs * BITS_PER_LONG);
			if (err) {
				/*
				 * No need to roll back, can only fail if
				 * memory allocation fails and then the
				 * number of _possible_ groups has been
				 * increased on some sockets which is ok.
				 */
280
				break;
J
Johannes Berg 已提交
281 282 283
			}
		}
		rcu_read_unlock();
284
		netlink_table_ungrab();
J
Johannes Berg 已提交
285 286 287 288
	} else {
		err = netlink_change_ngroups(init_net.genl_sock,
					     mc_groups_longs * BITS_PER_LONG);
	}
289

290 291 292 293
	if (groups_allocated && err) {
		for (i = 0; i < family->n_mcgrps; i++)
			clear_bit(family->mcgrp_offset + i, mc_groups);
	}
294

295
	return err;
296 297
}

298
static void genl_unregister_mc_groups(struct genl_family *family)
299
{
J
Johannes Berg 已提交
300
	struct net *net;
301
	int i;
J
Johannes Berg 已提交
302

303
	netlink_table_grab();
J
Johannes Berg 已提交
304
	rcu_read_lock();
305 306 307 308 309
	for_each_net_rcu(net) {
		for (i = 0; i < family->n_mcgrps; i++)
			__netlink_clear_multicast_users(
				net->genl_sock, family->mcgrp_offset + i);
	}
J
Johannes Berg 已提交
310
	rcu_read_unlock();
311
	netlink_table_ungrab();
J
Johannes Berg 已提交
312

313 314
	for (i = 0; i < family->n_mcgrps; i++) {
		int grp_id = family->mcgrp_offset + i;
315

316 317 318 319 320
		if (grp_id != 1)
			clear_bit(grp_id, mc_groups);
		genl_ctrl_event(CTRL_CMD_DELMCAST_GRP, family,
				&family->mcgrps[i], grp_id);
	}
321 322
}

323
static int genl_validate_ops(const struct genl_family *family)
T
Thomas Graf 已提交
324
{
325 326
	const struct genl_ops *ops = family->ops;
	unsigned int n_ops = family->n_ops;
327 328
	int i, j;

329 330 331 332 333 334
	if (WARN_ON(n_ops && !ops))
		return -EINVAL;

	if (!n_ops)
		return 0;

335 336 337 338 339 340
	for (i = 0; i < n_ops; i++) {
		if (ops[i].dumpit == NULL && ops[i].doit == NULL)
			return -EINVAL;
		for (j = i + 1; j < n_ops; j++)
			if (ops[i].cmd == ops[j].cmd)
				return -EINVAL;
T
Thomas Graf 已提交
341 342
	}

343
	return 0;
T
Thomas Graf 已提交
344 345 346
}

/**
347
 * __genl_register_family - register a generic netlink family
T
Thomas Graf 已提交
348 349 350 351 352 353 354
 * @family: generic netlink family
 *
 * Registers the specified family after validating it first. Only one
 * family may be registered with the same family name or identifier.
 * The family id may equal GENL_ID_GENERATE causing an unique id to
 * be automatically generated and assigned.
 *
355 356 357
 * The family's ops array must already be assigned, you can use the
 * genl_register_family_with_ops() helper function.
 *
T
Thomas Graf 已提交
358 359
 * Return 0 on success or a negative error code.
 */
360
int __genl_register_family(struct genl_family *family)
T
Thomas Graf 已提交
361
{
362
	int err = -EINVAL, i;
T
Thomas Graf 已提交
363 364 365 366 367 368 369

	if (family->id && family->id < GENL_MIN_ID)
		goto errout;

	if (family->id > GENL_MAX_ID)
		goto errout;

370 371 372 373
	err = genl_validate_ops(family);
	if (err)
		return err;

374
	genl_lock_all();
T
Thomas Graf 已提交
375 376 377 378 379 380 381 382 383 384 385 386 387 388 389

	if (genl_family_find_byname(family->name)) {
		err = -EEXIST;
		goto errout_locked;
	}

	if (family->id == GENL_ID_GENERATE) {
		u16 newid = genl_generate_id();

		if (!newid) {
			err = -ENOMEM;
			goto errout_locked;
		}

		family->id = newid;
390 391 392
	} else if (genl_family_find_byid(family->id)) {
		err = -EEXIST;
		goto errout_locked;
T
Thomas Graf 已提交
393 394
	}

395
	if (family->maxattr && !family->parallel_ops) {
T
Thomas Graf 已提交
396 397 398 399
		family->attrbuf = kmalloc((family->maxattr+1) *
					sizeof(struct nlattr *), GFP_KERNEL);
		if (family->attrbuf == NULL) {
			err = -ENOMEM;
400
			goto errout_locked;
T
Thomas Graf 已提交
401 402 403 404
		}
	} else
		family->attrbuf = NULL;

405 406 407 408
	err = genl_validate_assign_mc_groups(family);
	if (err)
		goto errout_locked;

T
Thomas Graf 已提交
409
	list_add_tail(&family->family_list, genl_family_chain(family->id));
410
	genl_unlock_all();
T
Thomas Graf 已提交
411

412 413 414 415 416
	/* send all events */
	genl_ctrl_event(CTRL_CMD_NEWFAMILY, family, NULL, 0);
	for (i = 0; i < family->n_mcgrps; i++)
		genl_ctrl_event(CTRL_CMD_NEWMCAST_GRP, family,
				&family->mcgrps[i], family->mcgrp_offset + i);
T
Thomas Graf 已提交
417 418 419 420

	return 0;

errout_locked:
421
	genl_unlock_all();
T
Thomas Graf 已提交
422 423 424
errout:
	return err;
}
425
EXPORT_SYMBOL(__genl_register_family);
T
Thomas Graf 已提交
426 427 428 429 430 431 432 433 434 435 436 437 438

/**
 * genl_unregister_family - unregister generic netlink family
 * @family: generic netlink family
 *
 * Unregisters the specified family.
 *
 * Returns 0 on success or a negative error code.
 */
int genl_unregister_family(struct genl_family *family)
{
	struct genl_family *rc;

439
	genl_lock_all();
T
Thomas Graf 已提交
440 441 442 443 444

	list_for_each_entry(rc, genl_family_chain(family->id), family_list) {
		if (family->id != rc->id || strcmp(rc->name, family->name))
			continue;

445 446
		genl_unregister_mc_groups(family);

T
Thomas Graf 已提交
447
		list_del(&rc->family_list);
448
		family->n_ops = 0;
449 450 451 452
		up_write(&cb_lock);
		wait_event(genl_sk_destructing_waitq,
			   atomic_read(&genl_sk_destructing_cnt) == 0);
		genl_unlock();
T
Thomas Graf 已提交
453 454

		kfree(family->attrbuf);
455
		genl_ctrl_event(CTRL_CMD_DELFAMILY, family, NULL, 0);
T
Thomas Graf 已提交
456 457 458
		return 0;
	}

459
	genl_unlock_all();
T
Thomas Graf 已提交
460 461 462

	return -ENOENT;
}
463
EXPORT_SYMBOL(genl_unregister_family);
T
Thomas Graf 已提交
464

465 466 467 468 469 470 471 472 473 474 475 476 477 478 479 480 481 482 483 484
/**
 * genlmsg_new_unicast - Allocate generic netlink message for unicast
 * @payload: size of the message payload
 * @info: information on destination
 * @flags: the type of memory to allocate
 *
 * Allocates a new sk_buff large enough to cover the specified payload
 * plus required Netlink headers. Will check receiving socket for
 * memory mapped i/o capability and use it if enabled. Will fall back
 * to non-mapped skb if message size exceeds the frame size of the ring.
 */
struct sk_buff *genlmsg_new_unicast(size_t payload, struct genl_info *info,
				    gfp_t flags)
{
	/* payload plus the generic netlink and netlink headers */
	size_t total = nlmsg_total_size(genlmsg_total_size(payload));
	struct sock *dst = info->dst_sk;

	return netlink_alloc_skb(dst, total, info->snd_portid, flags);
}
EXPORT_SYMBOL_GPL(genlmsg_new_unicast);

485 486 487
/**
 * genlmsg_put - Add generic netlink header to netlink message
 * @skb: socket buffer holding the message
488
 * @portid: netlink portid the message is addressed to
489 490
 * @seq: sequence number (usually the one of the sender)
 * @family: generic netlink family
491
 * @flags: netlink message flags
492 493 494 495
 * @cmd: generic netlink command
 *
 * Returns pointer to user specific header
 */
496
void *genlmsg_put(struct sk_buff *skb, u32 portid, u32 seq,
497 498 499 500 501
				struct genl_family *family, int flags, u8 cmd)
{
	struct nlmsghdr *nlh;
	struct genlmsghdr *hdr;

502
	nlh = nlmsg_put(skb, portid, seq, family->id, GENL_HDRLEN +
503 504 505 506 507 508 509 510 511 512 513 514 515
			family->hdrsize, flags);
	if (nlh == NULL)
		return NULL;

	hdr = nlmsg_data(nlh);
	hdr->cmd = cmd;
	hdr->version = family->version;
	hdr->reserved = 0;

	return (char *) hdr + GENL_HDRLEN;
}
EXPORT_SYMBOL(genlmsg_put);

516 517 518 519 520 521 522 523 524 525 526 527 528 529
/*
 * Dump "start" trampoline for families without parallel_ops: runs the
 * operation's optional start callback with the genl mutex held.
 * Returns the callback's result, or 0 when there is no callback.
 */
static int genl_lock_start(struct netlink_callback *cb)
{
	/* our ops are always const - netlink API doesn't propagate that */
	const struct genl_ops *ops = cb->data;
	int rc;

	if (!ops->start)
		return 0;

	genl_lock();
	rc = ops->start(cb);
	genl_unlock();

	return rc;
}

530 531
static int genl_lock_dumpit(struct sk_buff *skb, struct netlink_callback *cb)
{
J
Johannes Berg 已提交
532 533
	/* our ops are always const - netlink API doesn't propagate that */
	const struct genl_ops *ops = cb->data;
534 535 536 537 538 539 540 541 542 543
	int rc;

	genl_lock();
	rc = ops->dumpit(skb, cb);
	genl_unlock();
	return rc;
}

static int genl_lock_done(struct netlink_callback *cb)
{
J
Johannes Berg 已提交
544 545
	/* our ops are always const - netlink API doesn't propagate that */
	const struct genl_ops *ops = cb->data;
546 547 548 549 550 551 552 553 554 555
	int rc = 0;

	if (ops->done) {
		genl_lock();
		rc = ops->done(cb);
		genl_unlock();
	}
	return rc;
}

556 557 558
static int genl_family_rcv_msg(struct genl_family *family,
			       struct sk_buff *skb,
			       struct nlmsghdr *nlh)
T
Thomas Graf 已提交
559
{
J
Johannes Berg 已提交
560
	const struct genl_ops *ops;
J
Johannes Berg 已提交
561
	struct net *net = sock_net(skb->sk);
T
Thomas Graf 已提交
562 563
	struct genl_info info;
	struct genlmsghdr *hdr = nlmsg_data(nlh);
564
	struct nlattr **attrbuf;
565
	int hdrlen, err;
T
Thomas Graf 已提交
566

J
Johannes Berg 已提交
567 568 569 570
	/* this family doesn't exist in this netns */
	if (!family->netnsok && !net_eq(net, &init_net))
		return -ENOENT;

T
Thomas Graf 已提交
571 572
	hdrlen = GENL_HDRLEN + family->hdrsize;
	if (nlh->nlmsg_len < nlmsg_msg_size(hdrlen))
573
		return -EINVAL;
T
Thomas Graf 已提交
574 575

	ops = genl_get_cmd(hdr->cmd, family);
576 577
	if (ops == NULL)
		return -EOPNOTSUPP;
T
Thomas Graf 已提交
578

579
	if ((ops->flags & GENL_ADMIN_PERM) &&
580
	    !netlink_capable(skb, CAP_NET_ADMIN))
581
		return -EPERM;
T
Thomas Graf 已提交
582

583
	if ((nlh->nlmsg_flags & NLM_F_DUMP) == NLM_F_DUMP) {
584
		int rc;
585

586 587
		if (ops->dumpit == NULL)
			return -EOPNOTSUPP;
T
Thomas Graf 已提交
588

589 590
		if (!family->parallel_ops) {
			struct netlink_dump_control c = {
591
				.module = family->module,
J
Johannes Berg 已提交
592 593
				/* we have const, but the netlink API doesn't */
				.data = (void *)ops,
594
				.start = genl_lock_start,
595 596 597 598 599
				.dump = genl_lock_dumpit,
				.done = genl_lock_done,
			};

			genl_unlock();
600
			rc = __netlink_dump_start(net->genl_sock, skb, nlh, &c);
601 602 603 604
			genl_lock();

		} else {
			struct netlink_dump_control c = {
605
				.module = family->module,
606
				.start = ops->start,
607 608 609 610
				.dump = ops->dumpit,
				.done = ops->done,
			};

611
			rc = __netlink_dump_start(net->genl_sock, skb, nlh, &c);
612 613 614
		}

		return rc;
T
Thomas Graf 已提交
615 616
	}

617 618
	if (ops->doit == NULL)
		return -EOPNOTSUPP;
T
Thomas Graf 已提交
619

620 621 622 623 624 625 626 627 628 629
	if (family->maxattr && family->parallel_ops) {
		attrbuf = kmalloc((family->maxattr+1) *
					sizeof(struct nlattr *), GFP_KERNEL);
		if (attrbuf == NULL)
			return -ENOMEM;
	} else
		attrbuf = family->attrbuf;

	if (attrbuf) {
		err = nlmsg_parse(nlh, hdrlen, attrbuf, family->maxattr,
T
Thomas Graf 已提交
630 631
				  ops->policy);
		if (err < 0)
632
			goto out;
T
Thomas Graf 已提交
633 634 635
	}

	info.snd_seq = nlh->nlmsg_seq;
636
	info.snd_portid = NETLINK_CB(skb).portid;
T
Thomas Graf 已提交
637 638 639
	info.nlhdr = nlh;
	info.genlhdr = nlmsg_data(nlh);
	info.userhdr = nlmsg_data(nlh) + GENL_HDRLEN;
640
	info.attrs = attrbuf;
641
	info.dst_sk = skb->sk;
J
Johannes Berg 已提交
642
	genl_info_net_set(&info, net);
643
	memset(&info.user_ptr, 0, sizeof(info.user_ptr));
T
Thomas Graf 已提交
644

645 646 647
	if (family->pre_doit) {
		err = family->pre_doit(ops, skb, &info);
		if (err)
648
			goto out;
649 650 651 652 653 654 655
	}

	err = ops->doit(skb, &info);

	if (family->post_doit)
		family->post_doit(ops, skb, &info);

656
out:
657 658 659 660 661 662 663 664 665 666 667 668 669 670 671 672 673 674 675 676 677 678 679
	if (family->parallel_ops)
		kfree(attrbuf);

	return err;
}

/*
 * Per-message callback handed to netlink_rcv_skb(): looks up the family
 * named by the message type and dispatches to it.  The genl mutex is
 * held around the dispatch unless the family sets parallel_ops.
 *
 * Returns -ENOENT for an unknown family, otherwise the handler's result.
 */
static int genl_rcv_msg(struct sk_buff *skb, struct nlmsghdr *nlh)
{
	struct genl_family *family = genl_family_find_byid(nlh->nlmsg_type);
	int err;

	if (!family)
		return -ENOENT;

	if (family->parallel_ops)
		return genl_family_rcv_msg(family, skb, nlh);

	genl_lock();
	err = genl_family_rcv_msg(family, skb, nlh);
	genl_unlock();

	return err;
}

683
static void genl_rcv(struct sk_buff *skb)
T
Thomas Graf 已提交
684
{
685
	down_read(&cb_lock);
686
	netlink_rcv_skb(skb, &genl_rcv_msg);
687
	up_read(&cb_lock);
T
Thomas Graf 已提交
688 689 690 691 692 693
}

/**************************************************************************
 * Controller
 **************************************************************************/

694 695 696
static struct genl_family genl_ctrl = {
	.id = GENL_ID_CTRL,
	.name = "nlctrl",
697
	.version = 0x2,
698
	.maxattr = CTRL_ATTR_MAX,
J
Johannes Berg 已提交
699
	.netnsok = true,
700 701
};

702
/*
 * Append a controller message describing @family to @skb.
 *
 * The message carries the family name, id, version, header size and
 * maximum attribute number, followed by a nested list of operations
 * (command id and capability flags) and a nested list of multicast
 * groups (group id and name) when the family has any.
 *
 * Returns 0 on success or -EMSGSIZE when the message does not fit into
 * @skb, including the case where not even the header fits; a partially
 * written message is cancelled.
 */
static int ctrl_fill_info(struct genl_family *family, u32 portid, u32 seq,
			  u32 flags, struct sk_buff *skb, u8 cmd)
{
	void *hdr;

	hdr = genlmsg_put(skb, portid, seq, &genl_ctrl, flags, cmd);
	if (hdr == NULL)
		return -EMSGSIZE;

	if (nla_put_string(skb, CTRL_ATTR_FAMILY_NAME, family->name) ||
	    nla_put_u16(skb, CTRL_ATTR_FAMILY_ID, family->id) ||
	    nla_put_u32(skb, CTRL_ATTR_VERSION, family->version) ||
	    nla_put_u32(skb, CTRL_ATTR_HDRSIZE, family->hdrsize) ||
	    nla_put_u32(skb, CTRL_ATTR_MAXATTR, family->maxattr))
		goto nla_put_failure;

	if (family->n_ops) {
		struct nlattr *nla_ops;
		int i;

		nla_ops = nla_nest_start(skb, CTRL_ATTR_OPS);
		if (nla_ops == NULL)
			goto nla_put_failure;

		for (i = 0; i < family->n_ops; i++) {
			struct nlattr *nest;
			const struct genl_ops *ops = &family->ops[i];
			u32 op_flags = ops->flags;

			/* advertise what the operation is able to do */
			if (ops->dumpit)
				op_flags |= GENL_CMD_CAP_DUMP;
			if (ops->doit)
				op_flags |= GENL_CMD_CAP_DO;
			if (ops->policy)
				op_flags |= GENL_CMD_CAP_HASPOL;

			/* nested entries are numbered from 1 */
			nest = nla_nest_start(skb, i + 1);
			if (nest == NULL)
				goto nla_put_failure;

			if (nla_put_u32(skb, CTRL_ATTR_OP_ID, ops->cmd) ||
			    nla_put_u32(skb, CTRL_ATTR_OP_FLAGS, op_flags))
				goto nla_put_failure;

			nla_nest_end(skb, nest);
		}

		nla_nest_end(skb, nla_ops);
	}

	if (family->n_mcgrps) {
		struct nlattr *nla_grps;
		int i;

		nla_grps = nla_nest_start(skb, CTRL_ATTR_MCAST_GROUPS);
		if (nla_grps == NULL)
			goto nla_put_failure;

		for (i = 0; i < family->n_mcgrps; i++) {
			struct nlattr *nest;
			const struct genl_multicast_group *grp;

			grp = &family->mcgrps[i];

			nest = nla_nest_start(skb, i + 1);
			if (nest == NULL)
				goto nla_put_failure;

			if (nla_put_u32(skb, CTRL_ATTR_MCAST_GRP_ID,
					family->mcgrp_offset + i) ||
			    nla_put_string(skb, CTRL_ATTR_MCAST_GRP_NAME,
					   grp->name))
				goto nla_put_failure;

			nla_nest_end(skb, nest);
		}
		nla_nest_end(skb, nla_grps);
	}

	genlmsg_end(skb, hdr);
	return 0;

nla_put_failure:
	genlmsg_cancel(skb, hdr);
	return -EMSGSIZE;
}

789
/*
 * Append a controller message describing one multicast group to @skb.
 *
 * The message carries the owning family's name and id plus a nested
 * group list with a single entry holding @grp_id and the group name.
 *
 * Returns 0 on success or -EMSGSIZE when the message does not fit into
 * @skb, including the case where not even the header fits; a partially
 * written message is cancelled.
 */
static int ctrl_fill_mcgrp_info(struct genl_family *family,
				const struct genl_multicast_group *grp,
				int grp_id, u32 portid, u32 seq, u32 flags,
				struct sk_buff *skb, u8 cmd)
{
	void *hdr;
	struct nlattr *nla_grps;
	struct nlattr *nest;

	hdr = genlmsg_put(skb, portid, seq, &genl_ctrl, flags, cmd);
	if (hdr == NULL)
		return -EMSGSIZE;

	if (nla_put_string(skb, CTRL_ATTR_FAMILY_NAME, family->name) ||
	    nla_put_u16(skb, CTRL_ATTR_FAMILY_ID, family->id))
		goto nla_put_failure;

	nla_grps = nla_nest_start(skb, CTRL_ATTR_MCAST_GROUPS);
	if (nla_grps == NULL)
		goto nla_put_failure;

	/* single entry, numbered 1 */
	nest = nla_nest_start(skb, 1);
	if (nest == NULL)
		goto nla_put_failure;

	if (nla_put_u32(skb, CTRL_ATTR_MCAST_GRP_ID, grp_id) ||
	    nla_put_string(skb, CTRL_ATTR_MCAST_GRP_NAME,
			   grp->name))
		goto nla_put_failure;

	nla_nest_end(skb, nest);
	nla_nest_end(skb, nla_grps);

	genlmsg_end(skb, hdr);
	return 0;

nla_put_failure:
	genlmsg_cancel(skb, hdr);
	return -EMSGSIZE;
}

static int ctrl_dumpfamily(struct sk_buff *skb, struct netlink_callback *cb)
{

	int i, n = 0;
	struct genl_family *rt;
J
Johannes Berg 已提交
835
	struct net *net = sock_net(skb->sk);
T
Thomas Graf 已提交
836 837 838
	int chains_to_skip = cb->args[0];
	int fams_to_skip = cb->args[1];

839
	for (i = chains_to_skip; i < GENL_FAM_TAB_SIZE; i++) {
T
Thomas Graf 已提交
840 841
		n = 0;
		list_for_each_entry(rt, genl_family_chain(i), family_list) {
J
Johannes Berg 已提交
842 843
			if (!rt->netnsok && !net_eq(net, &init_net))
				continue;
T
Thomas Graf 已提交
844 845
			if (++n < fams_to_skip)
				continue;
846
			if (ctrl_fill_info(rt, NETLINK_CB(cb->skb).portid,
T
Thomas Graf 已提交
847 848 849 850 851 852 853 854 855 856 857 858 859 860 861
					   cb->nlh->nlmsg_seq, NLM_F_MULTI,
					   skb, CTRL_CMD_NEWFAMILY) < 0)
				goto errout;
		}

		fams_to_skip = 0;
	}

errout:
	cb->args[0] = i;
	cb->args[1] = n;

	return skb->len;
}

862
static struct sk_buff *ctrl_build_family_msg(struct genl_family *family,
863
					     u32 portid, int seq, u8 cmd)
T
Thomas Graf 已提交
864 865 866 867
{
	struct sk_buff *skb;
	int err;

868
	skb = nlmsg_new(NLMSG_DEFAULT_SIZE, GFP_KERNEL);
T
Thomas Graf 已提交
869 870 871
	if (skb == NULL)
		return ERR_PTR(-ENOBUFS);

872
	err = ctrl_fill_info(family, portid, seq, 0, skb, cmd);
T
Thomas Graf 已提交
873 874 875 876 877 878 879 880
	if (err < 0) {
		nlmsg_free(skb);
		return ERR_PTR(err);
	}

	return skb;
}

881 882 883 884
/*
 * Allocate an skb and fill it with a controller message describing the
 * multicast group @grp of @family.  Returns the skb, ERR_PTR(-ENOBUFS)
 * when the allocation fails, or the ctrl_fill_mcgrp_info() error wrapped
 * in ERR_PTR().
 */
static struct sk_buff *
ctrl_build_mcgrp_msg(struct genl_family *family,
		     const struct genl_multicast_group *grp,
		     int grp_id, u32 portid, int seq, u8 cmd)
{
	struct sk_buff *msg = nlmsg_new(NLMSG_DEFAULT_SIZE, GFP_KERNEL);
	int err;

	if (!msg)
		return ERR_PTR(-ENOBUFS);

	err = ctrl_fill_mcgrp_info(family, grp, grp_id, portid,
				   seq, 0, msg, cmd);
	if (err >= 0)
		return msg;

	nlmsg_free(msg);
	return ERR_PTR(err);
}

903
static const struct nla_policy ctrl_policy[CTRL_ATTR_MAX+1] = {
T
Thomas Graf 已提交
904
	[CTRL_ATTR_FAMILY_ID]	= { .type = NLA_U16 },
905 906
	[CTRL_ATTR_FAMILY_NAME]	= { .type = NLA_NUL_STRING,
				    .len = GENL_NAMSIZ - 1 },
T
Thomas Graf 已提交
907 908 909 910 911 912 913 914 915 916 917
};

static int ctrl_getfamily(struct sk_buff *skb, struct genl_info *info)
{
	struct sk_buff *msg;
	struct genl_family *res = NULL;
	int err = -EINVAL;

	if (info->attrs[CTRL_ATTR_FAMILY_ID]) {
		u16 id = nla_get_u16(info->attrs[CTRL_ATTR_FAMILY_ID]);
		res = genl_family_find_byid(id);
J
Johannes Berg 已提交
918
		err = -ENOENT;
T
Thomas Graf 已提交
919 920 921
	}

	if (info->attrs[CTRL_ATTR_FAMILY_NAME]) {
922
		char *name;
T
Thomas Graf 已提交
923

924
		name = nla_data(info->attrs[CTRL_ATTR_FAMILY_NAME]);
T
Thomas Graf 已提交
925
		res = genl_family_find_byname(name);
926 927 928
#ifdef CONFIG_MODULES
		if (res == NULL) {
			genl_unlock();
929
			up_read(&cb_lock);
930
			request_module("net-pf-%d-proto-%d-family-%s",
931
				       PF_NETLINK, NETLINK_GENERIC, name);
932
			down_read(&cb_lock);
933 934 935 936
			genl_lock();
			res = genl_family_find_byname(name);
		}
#endif
J
Johannes Berg 已提交
937
		err = -ENOENT;
T
Thomas Graf 已提交
938 939
	}

J
Johannes Berg 已提交
940 941 942 943 944 945
	if (res == NULL)
		return err;

	if (!res->netnsok && !net_eq(genl_info_net(info), &init_net)) {
		/* family doesn't exist here */
		return -ENOENT;
T
Thomas Graf 已提交
946 947
	}

948
	msg = ctrl_build_family_msg(res, info->snd_portid, info->snd_seq,
949
				    CTRL_CMD_NEWFAMILY);
J
Johannes Berg 已提交
950 951
	if (IS_ERR(msg))
		return PTR_ERR(msg);
T
Thomas Graf 已提交
952

J
Johannes Berg 已提交
953
	return genlmsg_reply(msg, info);
T
Thomas Graf 已提交
954 955
}

956
static int genl_ctrl_event(int event, struct genl_family *family,
957 958
			   const struct genl_multicast_group *grp,
			   int grp_id)
T
Thomas Graf 已提交
959 960 961
{
	struct sk_buff *msg;

J
Johannes Berg 已提交
962 963
	/* genl is still initialising */
	if (!init_net.genl_sock)
T
Thomas Graf 已提交
964 965 966 967 968
		return 0;

	switch (event) {
	case CTRL_CMD_NEWFAMILY:
	case CTRL_CMD_DELFAMILY:
969
		WARN_ON(grp);
J
Johannes Berg 已提交
970
		msg = ctrl_build_family_msg(family, 0, 0, event);
971 972 973
		break;
	case CTRL_CMD_NEWMCAST_GRP:
	case CTRL_CMD_DELMCAST_GRP:
974
		BUG_ON(!grp);
975
		msg = ctrl_build_mcgrp_msg(family, grp, grp_id, 0, 0, event);
T
Thomas Graf 已提交
976
		break;
J
Johannes Berg 已提交
977 978 979 980 981 982 983 984
	default:
		return -EINVAL;
	}

	if (IS_ERR(msg))
		return PTR_ERR(msg);

	if (!family->netnsok) {
985
		genlmsg_multicast_netns(&genl_ctrl, &init_net, msg, 0,
986
					0, GFP_KERNEL);
J
Johannes Berg 已提交
987 988
	} else {
		rcu_read_lock();
989
		genlmsg_multicast_allns(&genl_ctrl, msg, 0,
990
					0, GFP_ATOMIC);
J
Johannes Berg 已提交
991
		rcu_read_unlock();
T
Thomas Graf 已提交
992 993 994 995 996
	}

	return 0;
}

997 998 999 1000 1001 1002 1003
/* Operations of the controller family: a single GETFAMILY command. */
static struct genl_ops genl_ctrl_ops[] = {
	{
		.cmd		= CTRL_CMD_GETFAMILY,
		.doit		= ctrl_getfamily,
		.dumpit		= ctrl_dumpfamily,
		.policy		= ctrl_policy,
	},
};

1006 1007
/* Multicast groups of the controller family; genl_ctrl_event() sends to index 0. */
static struct genl_multicast_group genl_ctrl_groups[] = {
	{ .name = "notify", },
};

1010
static int genl_bind(struct net *net, int group)
1011
{
1012
	int i, err = -ENOENT;
1013 1014 1015 1016 1017 1018 1019 1020 1021 1022

	down_read(&cb_lock);
	for (i = 0; i < GENL_FAM_TAB_SIZE; i++) {
		struct genl_family *f;

		list_for_each_entry(f, genl_family_chain(i), family_list) {
			if (group >= f->mcgrp_offset &&
			    group < f->mcgrp_offset + f->n_mcgrps) {
				int fam_grp = group - f->mcgrp_offset;

1023 1024 1025 1026
				if (!f->netnsok && net != &init_net)
					err = -ENOENT;
				else if (f->mcast_bind)
					err = f->mcast_bind(net, fam_grp);
1027 1028 1029 1030 1031 1032 1033 1034 1035 1036 1037
				else
					err = 0;
				break;
			}
		}
	}
	up_read(&cb_lock);

	return err;
}

1038
static void genl_unbind(struct net *net, int group)
1039 1040 1041 1042 1043 1044 1045 1046 1047 1048 1049 1050 1051
{
	int i;

	down_read(&cb_lock);
	for (i = 0; i < GENL_FAM_TAB_SIZE; i++) {
		struct genl_family *f;

		list_for_each_entry(f, genl_family_chain(i), family_list) {
			if (group >= f->mcgrp_offset &&
			    group < f->mcgrp_offset + f->n_mcgrps) {
				int fam_grp = group - f->mcgrp_offset;

				if (f->mcast_unbind)
1052
					f->mcast_unbind(net, fam_grp);
1053 1054 1055 1056 1057 1058 1059
				break;
			}
		}
	}
	up_read(&cb_lock);
}

J
Johannes Berg 已提交
1060 1061
/*
 * Per-namespace init: create the generic netlink kernel socket for @net.
 * Failing to create it for init_net is fatal (panic); for any other
 * namespace -ENOMEM is returned.
 */
static int __net_init genl_pernet_init(struct net *net)
{
	struct netlink_kernel_cfg cfg = {
		.input		= genl_rcv,
		.flags		= NL_CFG_F_NONROOT_RECV,
		.bind		= genl_bind,
		.unbind		= genl_unbind,
	};

	/* we'll bump the group number right afterwards */
	net->genl_sock = netlink_kernel_create(net, NETLINK_GENERIC, &cfg);
	if (net->genl_sock)
		return 0;

	if (net_eq(net, &init_net))
		panic("GENL: Cannot initialize generic netlink\n");

	return -ENOMEM;
}

/* Per-namespace exit: release the generic netlink socket of @net. */
static void __net_exit genl_pernet_exit(struct net *net)
{
	struct sock *sk = net->genl_sock;

	netlink_kernel_release(sk);
	net->genl_sock = NULL;
}

/* Hooks that create and destroy the per-namespace generic netlink socket. */
static struct pernet_operations genl_pernet_ops = {
	.init = genl_pernet_init,
	.exit = genl_pernet_exit,
};

T
Thomas Graf 已提交
1092 1093 1094 1095 1096 1097 1098
/*
 * Subsystem init: set up the family hash table, register the controller
 * family, then register the per-namespace socket hooks.  Any failure is
 * fatal (panic).
 */
static int __init genl_init(void)
{
	int bucket, err;

	for (bucket = 0; bucket < GENL_FAM_TAB_SIZE; bucket++)
		INIT_LIST_HEAD(&family_ht[bucket]);

	err = genl_register_family_with_ops_groups(&genl_ctrl, genl_ctrl_ops,
						   genl_ctrl_groups);
	/* only go on to the pernet hooks when the controller registered */
	if (err >= 0)
		err = register_pernet_subsys(&genl_pernet_ops);

	if (err)
		panic("GENL: Cannot register controller: %d\n", err);

	return 0;
}

subsys_initcall(genl_init);

1116
static int genlmsg_mcast(struct sk_buff *skb, u32 portid, unsigned long group,
J
Johannes Berg 已提交
1117 1118 1119 1120 1121 1122 1123 1124 1125 1126 1127 1128 1129 1130
			 gfp_t flags)
{
	struct sk_buff *tmp;
	struct net *net, *prev = NULL;
	int err;

	for_each_net_rcu(net) {
		if (prev) {
			tmp = skb_clone(skb, flags);
			if (!tmp) {
				err = -ENOMEM;
				goto error;
			}
			err = nlmsg_multicast(prev->genl_sock, tmp,
1131
					      portid, group, flags);
J
Johannes Berg 已提交
1132 1133 1134 1135 1136 1137 1138
			if (err)
				goto error;
		}

		prev = net;
	}

1139
	return nlmsg_multicast(prev->genl_sock, skb, portid, group, flags);
J
Johannes Berg 已提交
1140 1141 1142 1143 1144
 error:
	kfree_skb(skb);
	return err;
}

1145 1146
/*
 * Multicast @skb to multicast group number @group of @family in every
 * network namespace.  @group is an index into the family's own groups
 * and is translated to the global group id here.
 *
 * Returns -EINVAL (with a one-time warning) when @group is not a valid
 * index for @family, otherwise the result of genlmsg_mcast().
 */
int genlmsg_multicast_allns(struct genl_family *family, struct sk_buff *skb,
			    u32 portid, unsigned int group, gfp_t flags)
{
	unsigned int global_grp;

	if (WARN_ON_ONCE(group >= family->n_mcgrps))
		return -EINVAL;

	global_grp = family->mcgrp_offset + group;

	return genlmsg_mcast(skb, portid, global_grp, flags);
}
EXPORT_SYMBOL(genlmsg_multicast_allns);
P
Pravin B Shelar 已提交
1154

J
Jiri Benc 已提交
1155 1156
/*
 * Send @skb as a notification to multicast group number @group of
 * @family through the generic netlink socket of the namespace recorded
 * in @info.  @group is an index into the family's own groups.  The
 * report flag passed on is taken from the request header in @info when
 * there is one, and is 0 otherwise.
 *
 * An out-of-range @group triggers a one-time warning and nothing is sent.
 */
void genl_notify(struct genl_family *family, struct sk_buff *skb,
		 struct genl_info *info, u32 group, gfp_t flags)
{
	struct net *net = genl_info_net(info);
	struct sock *sk = net->genl_sock;
	int report = info->nlhdr ? nlmsg_report(info->nlhdr) : 0;

	if (WARN_ON_ONCE(group >= family->n_mcgrps))
		return;

	nlmsg_notify(sk, skb, info->snd_portid,
		     family->mcgrp_offset + group, report, flags);
}
EXPORT_SYMBOL(genl_notify);