/*
 * NETLINK      Generic Netlink Family
 *
 * 		Authors:	Jamal Hadi Salim
 * 				Thomas Graf <tgraf@suug.ch>
 *				Johannes Berg <johannes@sipsolutions.net>
 */

#include <linux/module.h>
#include <linux/kernel.h>
11
#include <linux/slab.h>
T
Thomas Graf 已提交
12 13 14 15 16
#include <linux/errno.h>
#include <linux/types.h>
#include <linux/socket.h>
#include <linux/string.h>
#include <linux/skbuff.h>
17
#include <linux/mutex.h>
18
#include <linux/bitmap.h>
19
#include <linux/rwsem.h>
T
Thomas Graf 已提交
20 21 22
#include <net/sock.h>
#include <net/genetlink.h>

23
/* serialization of message processing */
static DEFINE_MUTEX(genl_mutex);
/* read-held around message reception and (un)bind, write-held by genl_lock_all() */
static DECLARE_RWSEM(cb_lock);
T
Thomas Graf 已提交
25

26
void genl_lock(void)
T
Thomas Graf 已提交
27
{
28
	mutex_lock(&genl_mutex);
T
Thomas Graf 已提交
29
}
30
EXPORT_SYMBOL(genl_lock);
T
Thomas Graf 已提交
31

32
void genl_unlock(void)
T
Thomas Graf 已提交
33
{
34
	mutex_unlock(&genl_mutex);
T
Thomas Graf 已提交
35
}
36
EXPORT_SYMBOL(genl_unlock);
T
Thomas Graf 已提交
37

38
#ifdef CONFIG_LOCKDEP
39 40 41 42 43 44 45
/* Lockdep helper: report whether genl_mutex is currently held. */
int lockdep_genl_is_held(void)
{
	int held = lockdep_is_held(&genl_mutex);

	return held;
}
EXPORT_SYMBOL(lockdep_genl_is_held);
#endif

46 47 48 49 50 51 52 53 54 55 56 57
/*
 * Take both genetlink locks: cb_lock for writing first, then genl_mutex.
 * Must be paired with genl_unlock_all(), which releases in reverse order.
 */
static void genl_lock_all(void)
{
	down_write(&cb_lock);
	genl_lock();
}

/*
 * Release the locks taken by genl_lock_all(): genl_mutex first, then the
 * write side of cb_lock.
 */
static void genl_unlock_all(void)
{
	genl_unlock();
	up_write(&cb_lock);
}

T
Thomas Graf 已提交
58 59 60 61
/* Number of hash buckets for registered families; the mask below relies on
 * this being a power of two.
 */
#define GENL_FAM_TAB_SIZE	16
#define GENL_FAM_TAB_MASK	(GENL_FAM_TAB_SIZE - 1)

/* Hash table of registered families, bucketed by family id. */
static struct list_head family_ht[GENL_FAM_TAB_SIZE];
62 63 64 65 66 67
/*
 * Bitmap of multicast groups that are currently in use.
 *
 * To avoid an allocation at boot of just one unsigned long,
 * declare it global instead.
 * Bit 0 is marked as already used since group 0 is invalid.
 * Bit 1 is marked as already used since the drop-monitor code
 * abuses the API and thinks it can statically use group 1.
 * That group will typically conflict with other groups that
 * any proper users use.
 * Bit 16 is marked as used since it's used for generic netlink
 * and the code no longer marks pre-reserved IDs as used.
 * Bit 17 is marked as already used since the VFS quota code
 * also abused this API and relied on family == group ID, we
 * cater to that by giving it a static family and group ID.
 * Bit 18 is marked as already used since the PMCRAID driver
 * did the same thing as the VFS quota code (maybe copied?)
 */
80
static unsigned long mc_group_start = 0x3 | BIT(GENL_ID_CTRL) |
81 82
				      BIT(GENL_ID_VFS_DQUOT) |
				      BIT(GENL_ID_PMCRAID);
83 84
static unsigned long *mc_groups = &mc_group_start;
static unsigned long mc_groups_longs = 1;
T
Thomas Graf 已提交
85

86
static int genl_ctrl_event(int event, struct genl_family *family,
87 88
			   const struct genl_multicast_group *grp,
			   int grp_id);
T
Thomas Graf 已提交
89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123

/* Map a family id to its bucket index in family_ht. */
static inline unsigned int genl_family_hash(unsigned int id)
{
	unsigned int bucket = id & GENL_FAM_TAB_MASK;

	return bucket;
}

/* Return the hash chain (list head) that family @id belongs to. */
static inline struct list_head *genl_family_chain(unsigned int id)
{
	return family_ht + genl_family_hash(id);
}

static struct genl_family *genl_family_find_byid(unsigned int id)
{
	struct genl_family *f;

	list_for_each_entry(f, genl_family_chain(id), family_list)
		if (f->id == id)
			return f;

	return NULL;
}

static struct genl_family *genl_family_find_byname(char *name)
{
	struct genl_family *f;
	int i;

	for (i = 0; i < GENL_FAM_TAB_SIZE; i++)
		list_for_each_entry(f, genl_family_chain(i), family_list)
			if (strcmp(f->name, name) == 0)
				return f;

	return NULL;
}

J
Johannes Berg 已提交
124
/*
 * Find the operation of @family that handles command @cmd.
 * Returns NULL if the family has no such operation.
 */
static const struct genl_ops *genl_get_cmd(u8 cmd, struct genl_family *family)
{
	int idx;

	for (idx = 0; idx < family->n_ops; idx++) {
		const struct genl_ops *op = &family->ops[idx];

		if (op->cmd == cmd)
			return op;
	}

	return NULL;
}

/* Of course we are going to have problems once we hit
 * 2^16 alive types, but that can only happen by year 2K
*/
138
static u16 genl_generate_id(void)
T
Thomas Graf 已提交
139
{
140 141
	static u16 id_gen_idx = GENL_MIN_ID;
	int i;
T
Thomas Graf 已提交
142

143
	for (i = 0; i <= GENL_MAX_ID - GENL_MIN_ID; i++) {
144
		if (id_gen_idx != GENL_ID_VFS_DQUOT &&
145
		    id_gen_idx != GENL_ID_PMCRAID &&
146
		    !genl_family_find_byid(id_gen_idx))
147 148
			return id_gen_idx;
		if (++id_gen_idx > GENL_MAX_ID)
T
Thomas Graf 已提交
149
			id_gen_idx = GENL_MIN_ID;
150
	}
T
Thomas Graf 已提交
151

152
	return 0;
T
Thomas Graf 已提交
153 154
}

155
static int genl_allocate_reserve_groups(int n_groups, int *first_id)
156 157
{
	unsigned long *new_groups;
158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183
	int start = 0;
	int i;
	int id;
	bool fits;

	do {
		if (start == 0)
			id = find_first_zero_bit(mc_groups,
						 mc_groups_longs *
						 BITS_PER_LONG);
		else
			id = find_next_zero_bit(mc_groups,
						mc_groups_longs * BITS_PER_LONG,
						start);

		fits = true;
		for (i = id;
		     i < min_t(int, id + n_groups,
			       mc_groups_longs * BITS_PER_LONG);
		     i++) {
			if (test_bit(i, mc_groups)) {
				start = i;
				fits = false;
				break;
			}
		}
184

185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207
		if (id >= mc_groups_longs * BITS_PER_LONG) {
			unsigned long new_longs = mc_groups_longs +
						  BITS_TO_LONGS(n_groups);
			size_t nlen = new_longs * sizeof(unsigned long);

			if (mc_groups == &mc_group_start) {
				new_groups = kzalloc(nlen, GFP_KERNEL);
				if (!new_groups)
					return -ENOMEM;
				mc_groups = new_groups;
				*mc_groups = mc_group_start;
			} else {
				new_groups = krealloc(mc_groups, nlen,
						      GFP_KERNEL);
				if (!new_groups)
					return -ENOMEM;
				mc_groups = new_groups;
				for (i = 0; i < BITS_TO_LONGS(n_groups); i++)
					mc_groups[mc_groups_longs + i] = 0;
			}
			mc_groups_longs = new_longs;
		}
	} while (!fits);
208

209 210 211 212 213 214 215 216 217 218 219 220
	for (i = id; i < id + n_groups; i++)
		set_bit(i, mc_groups);
	*first_id = id;
	return 0;
}

static struct genl_family genl_ctrl;

static int genl_validate_assign_mc_groups(struct genl_family *family)
{
	int first_id;
	int n_groups = family->n_mcgrps;
221
	int err = 0, i;
222 223 224 225 226 227 228 229 230 231 232 233 234
	bool groups_allocated = false;

	if (!n_groups)
		return 0;

	for (i = 0; i < n_groups; i++) {
		const struct genl_multicast_group *grp = &family->mcgrps[i];

		if (WARN_ON(grp->name[0] == '\0'))
			return -EINVAL;
		if (WARN_ON(memchr(grp->name, '\0', GENL_NAMSIZ) == NULL))
			return -EINVAL;
	}
235

236
	/* special-case our own group and hacks */
237 238 239 240 241 242
	if (family == &genl_ctrl) {
		first_id = GENL_ID_CTRL;
		BUG_ON(n_groups != 1);
	} else if (strcmp(family->name, "NET_DM") == 0) {
		first_id = 1;
		BUG_ON(n_groups != 1);
243
	} else if (family->id == GENL_ID_VFS_DQUOT) {
244 245
		first_id = GENL_ID_VFS_DQUOT;
		BUG_ON(n_groups != 1);
246 247 248
	} else if (family->id == GENL_ID_PMCRAID) {
		first_id = GENL_ID_PMCRAID;
		BUG_ON(n_groups != 1);
249 250 251 252 253
	} else {
		groups_allocated = true;
		err = genl_allocate_reserve_groups(n_groups, &first_id);
		if (err)
			return err;
254 255
	}

256 257 258 259 260 261
	family->mcgrp_offset = first_id;

	/* if still initializing, can't and don't need to to realloc bitmaps */
	if (!init_net.genl_sock)
		return 0;

J
Johannes Berg 已提交
262 263 264
	if (family->netnsok) {
		struct net *net;

265
		netlink_table_grab();
J
Johannes Berg 已提交
266 267
		rcu_read_lock();
		for_each_net_rcu(net) {
268
			err = __netlink_change_ngroups(net->genl_sock,
J
Johannes Berg 已提交
269 270 271 272 273 274 275 276
					mc_groups_longs * BITS_PER_LONG);
			if (err) {
				/*
				 * No need to roll back, can only fail if
				 * memory allocation fails and then the
				 * number of _possible_ groups has been
				 * increased on some sockets which is ok.
				 */
277
				break;
J
Johannes Berg 已提交
278 279 280
			}
		}
		rcu_read_unlock();
281
		netlink_table_ungrab();
J
Johannes Berg 已提交
282 283 284 285
	} else {
		err = netlink_change_ngroups(init_net.genl_sock,
					     mc_groups_longs * BITS_PER_LONG);
	}
286

287 288 289 290
	if (groups_allocated && err) {
		for (i = 0; i < family->n_mcgrps; i++)
			clear_bit(family->mcgrp_offset + i, mc_groups);
	}
291

292
	return err;
293 294
}

295
static void genl_unregister_mc_groups(struct genl_family *family)
296
{
J
Johannes Berg 已提交
297
	struct net *net;
298
	int i;
J
Johannes Berg 已提交
299

300
	netlink_table_grab();
J
Johannes Berg 已提交
301
	rcu_read_lock();
302 303 304 305 306
	for_each_net_rcu(net) {
		for (i = 0; i < family->n_mcgrps; i++)
			__netlink_clear_multicast_users(
				net->genl_sock, family->mcgrp_offset + i);
	}
J
Johannes Berg 已提交
307
	rcu_read_unlock();
308
	netlink_table_ungrab();
J
Johannes Berg 已提交
309

310 311
	for (i = 0; i < family->n_mcgrps; i++) {
		int grp_id = family->mcgrp_offset + i;
312

313 314 315 316 317
		if (grp_id != 1)
			clear_bit(grp_id, mc_groups);
		genl_ctrl_event(CTRL_CMD_DELMCAST_GRP, family,
				&family->mcgrps[i], grp_id);
	}
318 319
}

320
static int genl_validate_ops(const struct genl_family *family)
T
Thomas Graf 已提交
321
{
322 323
	const struct genl_ops *ops = family->ops;
	unsigned int n_ops = family->n_ops;
324 325
	int i, j;

326 327 328 329 330 331
	if (WARN_ON(n_ops && !ops))
		return -EINVAL;

	if (!n_ops)
		return 0;

332 333 334 335 336 337
	for (i = 0; i < n_ops; i++) {
		if (ops[i].dumpit == NULL && ops[i].doit == NULL)
			return -EINVAL;
		for (j = i + 1; j < n_ops; j++)
			if (ops[i].cmd == ops[j].cmd)
				return -EINVAL;
T
Thomas Graf 已提交
338 339
	}

340
	return 0;
T
Thomas Graf 已提交
341 342 343
}

/**
344
 * __genl_register_family - register a generic netlink family
T
Thomas Graf 已提交
345 346 347 348 349 350 351
 * @family: generic netlink family
 *
 * Registers the specified family after validating it first. Only one
 * family may be registered with the same family name or identifier.
 * The family id may equal GENL_ID_GENERATE causing an unique id to
 * be automatically generated and assigned.
 *
352 353 354
 * The family's ops array must already be assigned, you can use the
 * genl_register_family_with_ops() helper function.
 *
T
Thomas Graf 已提交
355 356
 * Return 0 on success or a negative error code.
 */
357
int __genl_register_family(struct genl_family *family)
T
Thomas Graf 已提交
358
{
359
	int err = -EINVAL, i;
T
Thomas Graf 已提交
360 361 362 363 364 365 366

	if (family->id && family->id < GENL_MIN_ID)
		goto errout;

	if (family->id > GENL_MAX_ID)
		goto errout;

367 368 369 370
	err = genl_validate_ops(family);
	if (err)
		return err;

371
	genl_lock_all();
T
Thomas Graf 已提交
372 373 374 375 376 377 378 379 380 381 382 383 384 385 386

	if (genl_family_find_byname(family->name)) {
		err = -EEXIST;
		goto errout_locked;
	}

	if (family->id == GENL_ID_GENERATE) {
		u16 newid = genl_generate_id();

		if (!newid) {
			err = -ENOMEM;
			goto errout_locked;
		}

		family->id = newid;
387 388 389
	} else if (genl_family_find_byid(family->id)) {
		err = -EEXIST;
		goto errout_locked;
T
Thomas Graf 已提交
390 391
	}

392
	if (family->maxattr && !family->parallel_ops) {
T
Thomas Graf 已提交
393 394 395 396
		family->attrbuf = kmalloc((family->maxattr+1) *
					sizeof(struct nlattr *), GFP_KERNEL);
		if (family->attrbuf == NULL) {
			err = -ENOMEM;
397
			goto errout_locked;
T
Thomas Graf 已提交
398 399 400 401
		}
	} else
		family->attrbuf = NULL;

402 403 404 405
	err = genl_validate_assign_mc_groups(family);
	if (err)
		goto errout_locked;

T
Thomas Graf 已提交
406
	list_add_tail(&family->family_list, genl_family_chain(family->id));
407
	genl_unlock_all();
T
Thomas Graf 已提交
408

409 410 411 412 413
	/* send all events */
	genl_ctrl_event(CTRL_CMD_NEWFAMILY, family, NULL, 0);
	for (i = 0; i < family->n_mcgrps; i++)
		genl_ctrl_event(CTRL_CMD_NEWMCAST_GRP, family,
				&family->mcgrps[i], family->mcgrp_offset + i);
T
Thomas Graf 已提交
414 415 416 417

	return 0;

errout_locked:
418
	genl_unlock_all();
T
Thomas Graf 已提交
419 420 421
errout:
	return err;
}
422
EXPORT_SYMBOL(__genl_register_family);
T
Thomas Graf 已提交
423 424 425 426 427 428 429 430 431 432 433 434 435

/**
 * genl_unregister_family - unregister generic netlink family
 * @family: generic netlink family
 *
 * Unregisters the specified family.
 *
 * Returns 0 on success or a negative error code.
 */
int genl_unregister_family(struct genl_family *family)
{
	struct genl_family *rc;

436
	genl_lock_all();
T
Thomas Graf 已提交
437

438 439
	genl_unregister_mc_groups(family);

T
Thomas Graf 已提交
440 441 442 443 444
	list_for_each_entry(rc, genl_family_chain(family->id), family_list) {
		if (family->id != rc->id || strcmp(rc->name, family->name))
			continue;

		list_del(&rc->family_list);
445
		family->n_ops = 0;
446
		genl_unlock_all();
T
Thomas Graf 已提交
447 448

		kfree(family->attrbuf);
449
		genl_ctrl_event(CTRL_CMD_DELFAMILY, family, NULL, 0);
T
Thomas Graf 已提交
450 451 452
		return 0;
	}

453
	genl_unlock_all();
T
Thomas Graf 已提交
454 455 456

	return -ENOENT;
}
457
EXPORT_SYMBOL(genl_unregister_family);
T
Thomas Graf 已提交
458

459 460 461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476 477 478
/**
 * genlmsg_new_unicast - Allocate generic netlink message for unicast
 * @payload: size of the message payload
 * @info: information on destination
 * @flags: the type of memory to allocate
 *
 * Allocates a new sk_buff large enough to cover the specified payload
 * plus required Netlink headers. Will check receiving socket for
 * memory mapped i/o capability and use it if enabled. Will fall back
 * to non-mapped skb if message size exceeds the frame size of the ring.
 */
struct sk_buff *genlmsg_new_unicast(size_t payload, struct genl_info *info,
				    gfp_t flags)
{
	/* payload + genetlink header, then wrapped in a netlink header */
	size_t genl_len = genlmsg_total_size(payload);
	size_t len = nlmsg_total_size(genl_len);

	return netlink_alloc_skb(info->dst_sk, len, info->snd_portid, flags);
}
EXPORT_SYMBOL_GPL(genlmsg_new_unicast);

479 480 481
/**
 * genlmsg_put - Add generic netlink header to netlink message
 * @skb: socket buffer holding the message
482
 * @portid: netlink portid the message is addressed to
483 484
 * @seq: sequence number (usually the one of the sender)
 * @family: generic netlink family
485
 * @flags: netlink message flags
486 487 488 489
 * @cmd: generic netlink command
 *
 * Returns pointer to user specific header
 */
490
void *genlmsg_put(struct sk_buff *skb, u32 portid, u32 seq,
491 492 493 494 495
				struct genl_family *family, int flags, u8 cmd)
{
	struct nlmsghdr *nlh;
	struct genlmsghdr *hdr;

496
	nlh = nlmsg_put(skb, portid, seq, family->id, GENL_HDRLEN +
497 498 499 500 501 502 503 504 505 506 507 508 509
			family->hdrsize, flags);
	if (nlh == NULL)
		return NULL;

	hdr = nlmsg_data(nlh);
	hdr->cmd = cmd;
	hdr->version = family->version;
	hdr->reserved = 0;

	return (char *) hdr + GENL_HDRLEN;
}
EXPORT_SYMBOL(genlmsg_put);

510 511
static int genl_lock_dumpit(struct sk_buff *skb, struct netlink_callback *cb)
{
J
Johannes Berg 已提交
512 513
	/* our ops are always const - netlink API doesn't propagate that */
	const struct genl_ops *ops = cb->data;
514 515 516 517 518 519 520 521 522 523
	int rc;

	genl_lock();
	rc = ops->dumpit(skb, cb);
	genl_unlock();
	return rc;
}

static int genl_lock_done(struct netlink_callback *cb)
{
J
Johannes Berg 已提交
524 525
	/* our ops are always const - netlink API doesn't propagate that */
	const struct genl_ops *ops = cb->data;
526 527 528 529 530 531 532 533 534 535
	int rc = 0;

	if (ops->done) {
		genl_lock();
		rc = ops->done(cb);
		genl_unlock();
	}
	return rc;
}

536 537 538
static int genl_family_rcv_msg(struct genl_family *family,
			       struct sk_buff *skb,
			       struct nlmsghdr *nlh)
T
Thomas Graf 已提交
539
{
J
Johannes Berg 已提交
540
	const struct genl_ops *ops;
J
Johannes Berg 已提交
541
	struct net *net = sock_net(skb->sk);
T
Thomas Graf 已提交
542 543
	struct genl_info info;
	struct genlmsghdr *hdr = nlmsg_data(nlh);
544
	struct nlattr **attrbuf;
545
	int hdrlen, err;
T
Thomas Graf 已提交
546

J
Johannes Berg 已提交
547 548 549 550
	/* this family doesn't exist in this netns */
	if (!family->netnsok && !net_eq(net, &init_net))
		return -ENOENT;

T
Thomas Graf 已提交
551 552
	hdrlen = GENL_HDRLEN + family->hdrsize;
	if (nlh->nlmsg_len < nlmsg_msg_size(hdrlen))
553
		return -EINVAL;
T
Thomas Graf 已提交
554 555

	ops = genl_get_cmd(hdr->cmd, family);
556 557
	if (ops == NULL)
		return -EOPNOTSUPP;
T
Thomas Graf 已提交
558

559
	if ((ops->flags & GENL_ADMIN_PERM) &&
560
	    !netlink_capable(skb, CAP_NET_ADMIN))
561
		return -EPERM;
T
Thomas Graf 已提交
562

563
	if ((nlh->nlmsg_flags & NLM_F_DUMP) == NLM_F_DUMP) {
564
		int rc;
565

566 567
		if (ops->dumpit == NULL)
			return -EOPNOTSUPP;
T
Thomas Graf 已提交
568

569 570
		if (!family->parallel_ops) {
			struct netlink_dump_control c = {
571
				.module = family->module,
J
Johannes Berg 已提交
572 573
				/* we have const, but the netlink API doesn't */
				.data = (void *)ops,
574 575 576 577 578
				.dump = genl_lock_dumpit,
				.done = genl_lock_done,
			};

			genl_unlock();
579
			rc = __netlink_dump_start(net->genl_sock, skb, nlh, &c);
580 581 582 583
			genl_lock();

		} else {
			struct netlink_dump_control c = {
584
				.module = family->module,
585 586 587 588
				.dump = ops->dumpit,
				.done = ops->done,
			};

589
			rc = __netlink_dump_start(net->genl_sock, skb, nlh, &c);
590 591 592
		}

		return rc;
T
Thomas Graf 已提交
593 594
	}

595 596
	if (ops->doit == NULL)
		return -EOPNOTSUPP;
T
Thomas Graf 已提交
597

598 599 600 601 602 603 604 605 606 607
	if (family->maxattr && family->parallel_ops) {
		attrbuf = kmalloc((family->maxattr+1) *
					sizeof(struct nlattr *), GFP_KERNEL);
		if (attrbuf == NULL)
			return -ENOMEM;
	} else
		attrbuf = family->attrbuf;

	if (attrbuf) {
		err = nlmsg_parse(nlh, hdrlen, attrbuf, family->maxattr,
T
Thomas Graf 已提交
608 609
				  ops->policy);
		if (err < 0)
610
			goto out;
T
Thomas Graf 已提交
611 612 613
	}

	info.snd_seq = nlh->nlmsg_seq;
614
	info.snd_portid = NETLINK_CB(skb).portid;
T
Thomas Graf 已提交
615 616 617
	info.nlhdr = nlh;
	info.genlhdr = nlmsg_data(nlh);
	info.userhdr = nlmsg_data(nlh) + GENL_HDRLEN;
618
	info.attrs = attrbuf;
619
	info.dst_sk = skb->sk;
J
Johannes Berg 已提交
620
	genl_info_net_set(&info, net);
621
	memset(&info.user_ptr, 0, sizeof(info.user_ptr));
T
Thomas Graf 已提交
622

623 624 625
	if (family->pre_doit) {
		err = family->pre_doit(ops, skb, &info);
		if (err)
626
			goto out;
627 628 629 630 631 632 633
	}

	err = ops->doit(skb, &info);

	if (family->post_doit)
		family->post_doit(ops, skb, &info);

634
out:
635 636 637 638 639 640 641 642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657
	if (family->parallel_ops)
		kfree(attrbuf);

	return err;
}

/*
 * Per-message receive callback: find the family addressed by the message
 * type and hand the message to it, holding genl_mutex unless the family
 * declared parallel_ops.  Returns -ENOENT for an unknown family id.
 */
static int genl_rcv_msg(struct sk_buff *skb, struct nlmsghdr *nlh)
{
	struct genl_family *family = genl_family_find_byid(nlh->nlmsg_type);
	int err;

	if (!family)
		return -ENOENT;

	if (family->parallel_ops)
		return genl_family_rcv_msg(family, skb, nlh);

	genl_lock();
	err = genl_family_rcv_msg(family, skb, nlh);
	genl_unlock();

	return err;
}

661
static void genl_rcv(struct sk_buff *skb)
T
Thomas Graf 已提交
662
{
663
	down_read(&cb_lock);
664
	netlink_rcv_skb(skb, &genl_rcv_msg);
665
	up_read(&cb_lock);
T
Thomas Graf 已提交
666 667 668 669 670 671
}

/**************************************************************************
 * Controller
 **************************************************************************/

672 673 674
static struct genl_family genl_ctrl = {
	.id = GENL_ID_CTRL,
	.name = "nlctrl",
675
	.version = 0x2,
676
	.maxattr = CTRL_ATTR_MAX,
J
Johannes Berg 已提交
677
	.netnsok = true,
678 679
};

680
static int ctrl_fill_info(struct genl_family *family, u32 portid, u32 seq,
T
Thomas Graf 已提交
681 682 683 684
			  u32 flags, struct sk_buff *skb, u8 cmd)
{
	void *hdr;

685
	hdr = genlmsg_put(skb, portid, seq, &genl_ctrl, flags, cmd);
T
Thomas Graf 已提交
686 687 688
	if (hdr == NULL)
		return -1;

689 690 691 692 693 694
	if (nla_put_string(skb, CTRL_ATTR_FAMILY_NAME, family->name) ||
	    nla_put_u16(skb, CTRL_ATTR_FAMILY_ID, family->id) ||
	    nla_put_u32(skb, CTRL_ATTR_VERSION, family->version) ||
	    nla_put_u32(skb, CTRL_ATTR_HDRSIZE, family->hdrsize) ||
	    nla_put_u32(skb, CTRL_ATTR_MAXATTR, family->maxattr))
		goto nla_put_failure;
695

696
	if (family->n_ops) {
697
		struct nlattr *nla_ops;
698
		int i;
699

700 701
		nla_ops = nla_nest_start(skb, CTRL_ATTR_OPS);
		if (nla_ops == NULL)
702 703
			goto nla_put_failure;

704
		for (i = 0; i < family->n_ops; i++) {
705
			struct nlattr *nest;
J
Johannes Berg 已提交
706
			const struct genl_ops *ops = &family->ops[i];
707
			u32 op_flags = ops->flags;
J
Johannes Berg 已提交
708 709

			if (ops->dumpit)
710
				op_flags |= GENL_CMD_CAP_DUMP;
J
Johannes Berg 已提交
711
			if (ops->doit)
712
				op_flags |= GENL_CMD_CAP_DO;
J
Johannes Berg 已提交
713
			if (ops->policy)
714
				op_flags |= GENL_CMD_CAP_HASPOL;
715

716
			nest = nla_nest_start(skb, i + 1);
717 718
			if (nest == NULL)
				goto nla_put_failure;
719

720
			if (nla_put_u32(skb, CTRL_ATTR_OP_ID, ops->cmd) ||
721
			    nla_put_u32(skb, CTRL_ATTR_OP_FLAGS, op_flags))
722
				goto nla_put_failure;
723

724 725 726 727 728
			nla_nest_end(skb, nest);
		}

		nla_nest_end(skb, nla_ops);
	}
T
Thomas Graf 已提交
729

730
	if (family->n_mcgrps) {
731
		struct nlattr *nla_grps;
732
		int i;
733 734 735 736 737

		nla_grps = nla_nest_start(skb, CTRL_ATTR_MCAST_GROUPS);
		if (nla_grps == NULL)
			goto nla_put_failure;

738
		for (i = 0; i < family->n_mcgrps; i++) {
739
			struct nlattr *nest;
740
			const struct genl_multicast_group *grp;
741

742 743 744
			grp = &family->mcgrps[i];

			nest = nla_nest_start(skb, i + 1);
745 746 747
			if (nest == NULL)
				goto nla_put_failure;

748 749
			if (nla_put_u32(skb, CTRL_ATTR_MCAST_GRP_ID,
					family->mcgrp_offset + i) ||
750 751 752
			    nla_put_string(skb, CTRL_ATTR_MCAST_GRP_NAME,
					   grp->name))
				goto nla_put_failure;
753 754 755 756 757 758 759 760 761

			nla_nest_end(skb, nest);
		}
		nla_nest_end(skb, nla_grps);
	}

	return genlmsg_end(skb, hdr);

nla_put_failure:
762 763
	genlmsg_cancel(skb, hdr);
	return -EMSGSIZE;
764 765
}

766
/*
 * Build a controller message of type @cmd about a single multicast group
 * into @skb: the owning family's name and id plus a one-entry
 * CTRL_ATTR_MCAST_GROUPS nest holding @grp_id and the group name.
 *
 * Returns the result of genlmsg_end() on success, -1 if the header could
 * not be added, or -EMSGSIZE (after cancelling the message) if an
 * attribute did not fit.
 */
static int ctrl_fill_mcgrp_info(struct genl_family *family,
				const struct genl_multicast_group *grp,
				int grp_id, u32 portid, u32 seq, u32 flags,
				struct sk_buff *skb, u8 cmd)
{
	struct nlattr *groups, *entry;
	void *hdr;

	hdr = genlmsg_put(skb, portid, seq, &genl_ctrl, flags, cmd);
	if (!hdr)
		return -1;

	if (nla_put_string(skb, CTRL_ATTR_FAMILY_NAME, family->name) ||
	    nla_put_u16(skb, CTRL_ATTR_FAMILY_ID, family->id))
		goto nla_put_failure;

	groups = nla_nest_start(skb, CTRL_ATTR_MCAST_GROUPS);
	if (!groups)
		goto nla_put_failure;

	entry = nla_nest_start(skb, 1);
	if (!entry)
		goto nla_put_failure;

	if (nla_put_u32(skb, CTRL_ATTR_MCAST_GRP_ID, grp_id) ||
	    nla_put_string(skb, CTRL_ATTR_MCAST_GRP_NAME,
			   grp->name))
		goto nla_put_failure;

	nla_nest_end(skb, entry);
	nla_nest_end(skb, groups);

	return genlmsg_end(skb, hdr);

nla_put_failure:
	genlmsg_cancel(skb, hdr);
	return -EMSGSIZE;
}

static int ctrl_dumpfamily(struct sk_buff *skb, struct netlink_callback *cb)
{

	int i, n = 0;
	struct genl_family *rt;
J
Johannes Berg 已提交
811
	struct net *net = sock_net(skb->sk);
T
Thomas Graf 已提交
812 813 814
	int chains_to_skip = cb->args[0];
	int fams_to_skip = cb->args[1];

815
	for (i = chains_to_skip; i < GENL_FAM_TAB_SIZE; i++) {
T
Thomas Graf 已提交
816 817
		n = 0;
		list_for_each_entry(rt, genl_family_chain(i), family_list) {
J
Johannes Berg 已提交
818 819
			if (!rt->netnsok && !net_eq(net, &init_net))
				continue;
T
Thomas Graf 已提交
820 821
			if (++n < fams_to_skip)
				continue;
822
			if (ctrl_fill_info(rt, NETLINK_CB(cb->skb).portid,
T
Thomas Graf 已提交
823 824 825 826 827 828 829 830 831 832 833 834 835 836 837
					   cb->nlh->nlmsg_seq, NLM_F_MULTI,
					   skb, CTRL_CMD_NEWFAMILY) < 0)
				goto errout;
		}

		fams_to_skip = 0;
	}

errout:
	cb->args[0] = i;
	cb->args[1] = n;

	return skb->len;
}

838
static struct sk_buff *ctrl_build_family_msg(struct genl_family *family,
839
					     u32 portid, int seq, u8 cmd)
T
Thomas Graf 已提交
840 841 842 843
{
	struct sk_buff *skb;
	int err;

844
	skb = nlmsg_new(NLMSG_DEFAULT_SIZE, GFP_KERNEL);
T
Thomas Graf 已提交
845 846 847
	if (skb == NULL)
		return ERR_PTR(-ENOBUFS);

848
	err = ctrl_fill_info(family, portid, seq, 0, skb, cmd);
T
Thomas Graf 已提交
849 850 851 852 853 854 855 856
	if (err < 0) {
		nlmsg_free(skb);
		return ERR_PTR(err);
	}

	return skb;
}

857 858 859 860
/*
 * Allocate a message and fill it with the description of one multicast
 * group of @family.  Returns the new skb, ERR_PTR(-ENOBUFS) if allocation
 * failed, or an ERR_PTR carrying the ctrl_fill_mcgrp_info() error.
 */
static struct sk_buff *
ctrl_build_mcgrp_msg(struct genl_family *family,
		     const struct genl_multicast_group *grp,
		     int grp_id, u32 portid, int seq, u8 cmd)
{
	struct sk_buff *msg = nlmsg_new(NLMSG_DEFAULT_SIZE, GFP_KERNEL);
	int ret;

	if (!msg)
		return ERR_PTR(-ENOBUFS);

	ret = ctrl_fill_mcgrp_info(family, grp, grp_id, portid,
				   seq, 0, msg, cmd);
	if (ret >= 0)
		return msg;

	nlmsg_free(msg);
	return ERR_PTR(ret);
}

879
static const struct nla_policy ctrl_policy[CTRL_ATTR_MAX+1] = {
T
Thomas Graf 已提交
880
	[CTRL_ATTR_FAMILY_ID]	= { .type = NLA_U16 },
881 882
	[CTRL_ATTR_FAMILY_NAME]	= { .type = NLA_NUL_STRING,
				    .len = GENL_NAMSIZ - 1 },
T
Thomas Graf 已提交
883 884 885 886 887 888 889 890 891 892 893
};

static int ctrl_getfamily(struct sk_buff *skb, struct genl_info *info)
{
	struct sk_buff *msg;
	struct genl_family *res = NULL;
	int err = -EINVAL;

	if (info->attrs[CTRL_ATTR_FAMILY_ID]) {
		u16 id = nla_get_u16(info->attrs[CTRL_ATTR_FAMILY_ID]);
		res = genl_family_find_byid(id);
J
Johannes Berg 已提交
894
		err = -ENOENT;
T
Thomas Graf 已提交
895 896 897
	}

	if (info->attrs[CTRL_ATTR_FAMILY_NAME]) {
898
		char *name;
T
Thomas Graf 已提交
899

900
		name = nla_data(info->attrs[CTRL_ATTR_FAMILY_NAME]);
T
Thomas Graf 已提交
901
		res = genl_family_find_byname(name);
902 903 904
#ifdef CONFIG_MODULES
		if (res == NULL) {
			genl_unlock();
905
			up_read(&cb_lock);
906
			request_module("net-pf-%d-proto-%d-family-%s",
907
				       PF_NETLINK, NETLINK_GENERIC, name);
908
			down_read(&cb_lock);
909 910 911 912
			genl_lock();
			res = genl_family_find_byname(name);
		}
#endif
J
Johannes Berg 已提交
913
		err = -ENOENT;
T
Thomas Graf 已提交
914 915
	}

J
Johannes Berg 已提交
916 917 918 919 920 921
	if (res == NULL)
		return err;

	if (!res->netnsok && !net_eq(genl_info_net(info), &init_net)) {
		/* family doesn't exist here */
		return -ENOENT;
T
Thomas Graf 已提交
922 923
	}

924
	msg = ctrl_build_family_msg(res, info->snd_portid, info->snd_seq,
925
				    CTRL_CMD_NEWFAMILY);
J
Johannes Berg 已提交
926 927
	if (IS_ERR(msg))
		return PTR_ERR(msg);
T
Thomas Graf 已提交
928

J
Johannes Berg 已提交
929
	return genlmsg_reply(msg, info);
T
Thomas Graf 已提交
930 931
}

932
static int genl_ctrl_event(int event, struct genl_family *family,
933 934
			   const struct genl_multicast_group *grp,
			   int grp_id)
T
Thomas Graf 已提交
935 936 937
{
	struct sk_buff *msg;

J
Johannes Berg 已提交
938 939
	/* genl is still initialising */
	if (!init_net.genl_sock)
T
Thomas Graf 已提交
940 941 942 943 944
		return 0;

	switch (event) {
	case CTRL_CMD_NEWFAMILY:
	case CTRL_CMD_DELFAMILY:
945
		WARN_ON(grp);
J
Johannes Berg 已提交
946
		msg = ctrl_build_family_msg(family, 0, 0, event);
947 948 949
		break;
	case CTRL_CMD_NEWMCAST_GRP:
	case CTRL_CMD_DELMCAST_GRP:
950
		BUG_ON(!grp);
951
		msg = ctrl_build_mcgrp_msg(family, grp, grp_id, 0, 0, event);
T
Thomas Graf 已提交
952
		break;
J
Johannes Berg 已提交
953 954 955 956 957 958 959 960
	default:
		return -EINVAL;
	}

	if (IS_ERR(msg))
		return PTR_ERR(msg);

	if (!family->netnsok) {
961
		genlmsg_multicast_netns(&genl_ctrl, &init_net, msg, 0,
962
					0, GFP_KERNEL);
J
Johannes Berg 已提交
963 964
	} else {
		rcu_read_lock();
965
		genlmsg_multicast_allns(&genl_ctrl, msg, 0,
966
					0, GFP_ATOMIC);
J
Johannes Berg 已提交
967
		rcu_read_unlock();
T
Thomas Graf 已提交
968 969 970 971 972
	}

	return 0;
}

973 974 975 976 977 978 979
/* Operations of the controller family: only CTRL_CMD_GETFAMILY. */
static struct genl_ops genl_ctrl_ops[] = {
	{
		.cmd = CTRL_CMD_GETFAMILY,
		.policy = ctrl_policy,
		.doit = ctrl_getfamily,
		.dumpit = ctrl_dumpfamily,
	},
};

982 983
/* Multicast groups of the controller family: the single "notify" group. */
static struct genl_multicast_group genl_ctrl_groups[] = {
	{
		.name = "notify",
	},
};

986
static int genl_bind(struct net *net, int group)
987
{
988
	int i, err = -ENOENT;
989 990 991 992 993 994 995 996 997 998

	down_read(&cb_lock);
	for (i = 0; i < GENL_FAM_TAB_SIZE; i++) {
		struct genl_family *f;

		list_for_each_entry(f, genl_family_chain(i), family_list) {
			if (group >= f->mcgrp_offset &&
			    group < f->mcgrp_offset + f->n_mcgrps) {
				int fam_grp = group - f->mcgrp_offset;

999 1000 1001 1002
				if (!f->netnsok && net != &init_net)
					err = -ENOENT;
				else if (f->mcast_bind)
					err = f->mcast_bind(net, fam_grp);
1003 1004 1005 1006 1007 1008 1009 1010 1011 1012 1013
				else
					err = 0;
				break;
			}
		}
	}
	up_read(&cb_lock);

	return err;
}

1014
static void genl_unbind(struct net *net, int group)
1015 1016 1017 1018 1019 1020 1021 1022 1023 1024 1025 1026 1027 1028
{
	int i;
	bool found = false;

	down_read(&cb_lock);
	for (i = 0; i < GENL_FAM_TAB_SIZE; i++) {
		struct genl_family *f;

		list_for_each_entry(f, genl_family_chain(i), family_list) {
			if (group >= f->mcgrp_offset &&
			    group < f->mcgrp_offset + f->n_mcgrps) {
				int fam_grp = group - f->mcgrp_offset;

				if (f->mcast_unbind)
1029
					f->mcast_unbind(net, fam_grp);
1030 1031 1032 1033 1034 1035 1036 1037 1038 1039
				found = true;
				break;
			}
		}
	}
	up_read(&cb_lock);

	WARN_ON(!found);
}

J
Johannes Berg 已提交
1040 1041
/*
 * Per-namespace init: create the NETLINK_GENERIC kernel socket for @net.
 * Failing to do so for init_net is fatal; for any other namespace it
 * yields -ENOMEM.
 */
static int __net_init genl_pernet_init(struct net *net)
{
	struct netlink_kernel_cfg cfg = {
		.input		= genl_rcv,
		.flags		= NL_CFG_F_NONROOT_RECV,
		.bind		= genl_bind,
		.unbind		= genl_unbind,
	};

	/* we'll bump the group number right afterwards */
	net->genl_sock = netlink_kernel_create(net, NETLINK_GENERIC, &cfg);
	if (net->genl_sock)
		return 0;

	if (net_eq(net, &init_net))
		panic("GENL: Cannot initialize generic netlink\n");

	return -ENOMEM;
}

/* Per-namespace exit: release the genetlink socket and clear the pointer. */
static void __net_exit genl_pernet_exit(struct net *net)
{
	struct sock *sk = net->genl_sock;

	netlink_kernel_release(sk);
	net->genl_sock = NULL;
}

/* Hooks creating/releasing the genetlink socket of each network namespace. */
static struct pernet_operations genl_pernet_ops = {
	.init	= genl_pernet_init,
	.exit	= genl_pernet_exit,
};

T
Thomas Graf 已提交
1072 1073 1074 1075 1076 1077 1078
/*
 * Subsystem init: set up the family hash table, register the controller
 * family with its ops and groups, then register the per-namespace hooks.
 * Any failure is fatal.
 */
static int __init genl_init(void)
{
	int bucket, err;

	for (bucket = 0; bucket < GENL_FAM_TAB_SIZE; bucket++)
		INIT_LIST_HEAD(&family_ht[bucket]);

	err = genl_register_family_with_ops_groups(&genl_ctrl, genl_ctrl_ops,
						   genl_ctrl_groups);
	if (err >= 0) {
		err = register_pernet_subsys(&genl_pernet_ops);
		if (!err)
			return 0;
	}

	panic("GENL: Cannot register controller: %d\n", err);
}

subsys_initcall(genl_init);

1096
static int genlmsg_mcast(struct sk_buff *skb, u32 portid, unsigned long group,
J
Johannes Berg 已提交
1097 1098 1099 1100 1101 1102 1103 1104 1105 1106 1107 1108 1109 1110
			 gfp_t flags)
{
	struct sk_buff *tmp;
	struct net *net, *prev = NULL;
	int err;

	for_each_net_rcu(net) {
		if (prev) {
			tmp = skb_clone(skb, flags);
			if (!tmp) {
				err = -ENOMEM;
				goto error;
			}
			err = nlmsg_multicast(prev->genl_sock, tmp,
1111
					      portid, group, flags);
J
Johannes Berg 已提交
1112 1113 1114 1115 1116 1117 1118
			if (err)
				goto error;
		}

		prev = net;
	}

1119
	return nlmsg_multicast(prev->genl_sock, skb, portid, group, flags);
J
Johannes Berg 已提交
1120 1121 1122 1123 1124
 error:
	kfree_skb(skb);
	return err;
}

1125 1126
/*
 * Multicast @skb to the family-relative multicast group @group of @family
 * in all network namespaces.
 *
 * Warns once and returns -EINVAL if @group is not a valid group index of
 * the family; otherwise returns the result of genlmsg_mcast().
 */
int genlmsg_multicast_allns(struct genl_family *family, struct sk_buff *skb,
			    u32 portid, unsigned int group, gfp_t flags)
{
	if (WARN_ON_ONCE(group >= family->n_mcgrps))
		return -EINVAL;

	/* convert the family-relative index to the global group id */
	return genlmsg_mcast(skb, portid, family->mcgrp_offset + group, flags);
}
EXPORT_SYMBOL(genlmsg_multicast_allns);
P
Pravin B Shelar 已提交
1134

1135 1136
/*
 * Send notification @skb to the family-relative multicast group @group of
 * @family on the genetlink socket of @net, via nlmsg_notify().
 *
 * The report flag is taken from @nlh when one is given, else it is 0.
 * Warns once and does nothing if @group is not a valid group index of
 * the family.
 */
void genl_notify(struct genl_family *family,
		 struct sk_buff *skb, struct net *net, u32 portid, u32 group,
		 struct nlmsghdr *nlh, gfp_t flags)
{
	struct sock *sk = net->genl_sock;
	int report = nlh ? nlmsg_report(nlh) : 0;

	if (WARN_ON_ONCE(group >= family->n_mcgrps))
		return;

	/* convert the family-relative index to the global group id */
	group += family->mcgrp_offset;
	nlmsg_notify(sk, skb, portid, group, report, flags);
}
EXPORT_SYMBOL(genl_notify);