x_tables.c 30.3 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14
/*
 * x_tables core - Backend for {ip,ip6,arp}_tables
 *
 * Copyright (C) 2006-2006 Harald Welte <laforge@netfilter.org>
 *
 * Based on existing ip_tables code which is
 *   Copyright (C) 1999 Paul `Rusty' Russell & Michael J. Neuling
 *   Copyright (C) 2000-2005 Netfilter Core Team <coreteam@netfilter.org>
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License version 2 as
 * published by the Free Software Foundation.
 *
 */
15
#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
16 17 18 19 20 21 22
#include <linux/kernel.h>
#include <linux/socket.h>
#include <linux/net.h>
#include <linux/proc_fs.h>
#include <linux/seq_file.h>
#include <linux/string.h>
#include <linux/vmalloc.h>
I
Ingo Molnar 已提交
23
#include <linux/mutex.h>
A
Al Viro 已提交
24
#include <linux/mm.h>
25
#include <net/net_namespace.h>
26 27 28

#include <linux/netfilter/x_tables.h>
#include <linux/netfilter_arp.h>
29 30 31
#include <linux/netfilter_ipv4/ip_tables.h>
#include <linux/netfilter_ipv6/ip6_tables.h>
#include <linux/netfilter_arp/arp_tables.h>
I
Ingo Molnar 已提交
32

33 34
MODULE_LICENSE("GPL");
MODULE_AUTHOR("Harald Welte <laforge@netfilter.org>");
35
MODULE_DESCRIPTION("{ip,ip6,arp,eb}_tables backend module");
36 37 38

#define SMP_ALIGN(x) (((x) + SMP_CACHE_BYTES-1) & ~(SMP_CACHE_BYTES-1))

39 40 41
/*
 * Node of the singly linked, per-family list of compat size adjustments
 * built by xt_compat_add_offset() and summed by xt_compat_calc_jump().
 */
struct compat_delta {
	struct compat_delta *next;	/* following node; NULL ends the list */
	unsigned int offset;		/* offset this adjustment was recorded for */
	int delta;			/* amount added up by xt_compat_calc_jump() */
};

45
struct xt_af {
I
Ingo Molnar 已提交
46
	struct mutex mutex;
47 48
	struct list_head match;
	struct list_head target;
49
#ifdef CONFIG_COMPAT
50
	struct mutex compat_mutex;
51 52
	struct compat_delta *compat_offsets;
#endif
53 54 55 56
};

/* Array of per-family state, indexed by family number throughout this file. */
static struct xt_af *xt;

57 58 59 60 61 62
/*
 * Family number -> name prefix.  Used in the "%s_tables" log messages and
 * in the "%st_%s" module names requested by xt_request_find_{match,target}().
 * Families not listed here are left as NULL.
 */
static const char *const xt_prefix[NFPROTO_NUMPROTO] = {
	[NFPROTO_UNSPEC] = "x",
	[NFPROTO_IPV4]   = "ip",
	[NFPROTO_ARP]    = "arp",
	[NFPROTO_BRIDGE] = "eb",
	[NFPROTO_IPV6]   = "ip6",
};

65 66
/* Registration hooks for targets. */
int
67
xt_register_target(struct xt_target *target)
68
{
69 70
	u_int8_t af = target->family;
	int ret;
71

I
Ingo Molnar 已提交
72
	ret = mutex_lock_interruptible(&xt[af].mutex);
73 74 75
	if (ret != 0)
		return ret;
	list_add(&target->list, &xt[af].target);
I
Ingo Molnar 已提交
76
	mutex_unlock(&xt[af].mutex);
77 78 79 80 81
	return ret;
}
EXPORT_SYMBOL(xt_register_target);

void
82
xt_unregister_target(struct xt_target *target)
83
{
84
	u_int8_t af = target->family;
85

I
Ingo Molnar 已提交
86
	mutex_lock(&xt[af].mutex);
P
Patrick McHardy 已提交
87
	list_del(&target->list);
I
Ingo Molnar 已提交
88
	mutex_unlock(&xt[af].mutex);
89 90 91
}
EXPORT_SYMBOL(xt_unregister_target);

92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121
/*
 * Register the @n targets of the array @target, in order.
 *
 * On the first failure the entries registered so far are unregistered again
 * and the error from xt_register_target() is returned.  Returns 0 if every
 * entry was registered (including the n == 0 case).
 */
int
xt_register_targets(struct xt_target *target, unsigned int n)
{
	unsigned int done;
	int ret;

	for (done = 0; done < n; done++) {
		ret = xt_register_target(&target[done]);
		if (ret == 0)
			continue;

		/* Roll back target[0 .. done-1]; target[done] was never added. */
		if (done > 0)
			xt_unregister_targets(target, done);
		return ret;
	}

	return 0;
}
EXPORT_SYMBOL(xt_register_targets);

void
xt_unregister_targets(struct xt_target *target, unsigned int n)
{
	unsigned int i;

	for (i = 0; i < n; i++)
		xt_unregister_target(&target[i]);
}
EXPORT_SYMBOL(xt_unregister_targets);

122
int
123
xt_register_match(struct xt_match *match)
124
{
125 126
	u_int8_t af = match->family;
	int ret;
127

I
Ingo Molnar 已提交
128
	ret = mutex_lock_interruptible(&xt[af].mutex);
129 130 131 132
	if (ret != 0)
		return ret;

	list_add(&match->list, &xt[af].match);
I
Ingo Molnar 已提交
133
	mutex_unlock(&xt[af].mutex);
134 135 136 137 138 139

	return ret;
}
EXPORT_SYMBOL(xt_register_match);

void
140
xt_unregister_match(struct xt_match *match)
141
{
142
	u_int8_t af = match->family;
143

I
Ingo Molnar 已提交
144
	mutex_lock(&xt[af].mutex);
P
Patrick McHardy 已提交
145
	list_del(&match->list);
I
Ingo Molnar 已提交
146
	mutex_unlock(&xt[af].mutex);
147 148 149
}
EXPORT_SYMBOL(xt_unregister_match);

150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179
/*
 * Register the @n matches of the array @match, in order.
 *
 * On the first failure the entries registered so far are unregistered again
 * and the error from xt_register_match() is returned.  Returns 0 if every
 * entry was registered (including the n == 0 case).
 */
int
xt_register_matches(struct xt_match *match, unsigned int n)
{
	unsigned int done;
	int ret;

	for (done = 0; done < n; done++) {
		ret = xt_register_match(&match[done]);
		if (ret == 0)
			continue;

		/* Roll back match[0 .. done-1]; match[done] was never added. */
		if (done > 0)
			xt_unregister_matches(match, done);
		return ret;
	}

	return 0;
}
EXPORT_SYMBOL(xt_register_matches);

void
xt_unregister_matches(struct xt_match *match, unsigned int n)
{
	unsigned int i;

	for (i = 0; i < n; i++)
		xt_unregister_match(&match[i]);
}
EXPORT_SYMBOL(xt_unregister_matches);

180 181 182 183 184 185 186 187

/*
 * These are weird, but module loading must not be done with mutex
 * held (since they will register), and we have to have a single
 * function to use try_then_request_module().
 */

/* Find match, grabs ref.  Returns ERR_PTR() on error. */
188
struct xt_match *xt_find_match(u8 af, const char *name, u8 revision)
189 190 191 192
{
	struct xt_match *m;
	int err = 0;

I
Ingo Molnar 已提交
193
	if (mutex_lock_interruptible(&xt[af].mutex) != 0)
194 195 196 197 198 199
		return ERR_PTR(-EINTR);

	list_for_each_entry(m, &xt[af].match, list) {
		if (strcmp(m->name, name) == 0) {
			if (m->revision == revision) {
				if (try_module_get(m->me)) {
I
Ingo Molnar 已提交
200
					mutex_unlock(&xt[af].mutex);
201 202 203 204 205 206
					return m;
				}
			} else
				err = -EPROTOTYPE; /* Found something. */
		}
	}
I
Ingo Molnar 已提交
207
	mutex_unlock(&xt[af].mutex);
208 209 210 211 212

	if (af != NFPROTO_UNSPEC)
		/* Try searching again in the family-independent list */
		return xt_find_match(NFPROTO_UNSPEC, name, revision);

213 214 215 216
	return ERR_PTR(err);
}
EXPORT_SYMBOL(xt_find_match);

217 218 219 220 221 222 223 224 225 226 227
/*
 * Like xt_find_match(), but goes through try_then_request_module() with the
 * module name "<prefix>t_<name>", and turns a NULL result into
 * ERR_PTR(-ENOENT).
 */
struct xt_match *
xt_request_find_match(uint8_t nfproto, const char *name, uint8_t revision)
{
	struct xt_match *found;

	found = try_then_request_module(xt_find_match(nfproto, name, revision),
					"%st_%s", xt_prefix[nfproto], name);
	if (found == NULL)
		return ERR_PTR(-ENOENT);
	return found;
}
EXPORT_SYMBOL_GPL(xt_request_find_match);

228
/* Find target, grabs ref.  Returns ERR_PTR() on error. */
229
struct xt_target *xt_find_target(u8 af, const char *name, u8 revision)
230 231 232 233
{
	struct xt_target *t;
	int err = 0;

I
Ingo Molnar 已提交
234
	if (mutex_lock_interruptible(&xt[af].mutex) != 0)
235 236 237 238 239 240
		return ERR_PTR(-EINTR);

	list_for_each_entry(t, &xt[af].target, list) {
		if (strcmp(t->name, name) == 0) {
			if (t->revision == revision) {
				if (try_module_get(t->me)) {
I
Ingo Molnar 已提交
241
					mutex_unlock(&xt[af].mutex);
242 243 244 245 246 247
					return t;
				}
			} else
				err = -EPROTOTYPE; /* Found something. */
		}
	}
I
Ingo Molnar 已提交
248
	mutex_unlock(&xt[af].mutex);
249 250 251 252 253

	if (af != NFPROTO_UNSPEC)
		/* Try searching again in the family-independent list */
		return xt_find_target(NFPROTO_UNSPEC, name, revision);

254 255 256 257
	return ERR_PTR(err);
}
EXPORT_SYMBOL(xt_find_target);

258
/*
 * Like xt_find_target(), but goes through try_then_request_module() with the
 * module name "<prefix>t_<name>", and turns a NULL result into
 * ERR_PTR(-ENOENT).
 */
struct xt_target *xt_request_find_target(u8 af, const char *name, u8 revision)
{
	struct xt_target *found;

	found = try_then_request_module(xt_find_target(af, name, revision),
					"%st_%s", xt_prefix[af], name);
	if (found == NULL)
		return ERR_PTR(-ENOENT);
	return found;
}
EXPORT_SYMBOL_GPL(xt_request_find_target);

268
/*
 * Scan the match list of @af for entries called @name.  *@bestp is raised to
 * the highest revision seen, and the return value tells whether @revision
 * itself is registered.  When @af has no exact hit the NFPROTO_UNSPEC list
 * is scanned as well.
 *
 * Each list is walked under the mutex of the family it belongs to.  The
 * mutex of @af is released before the NFPROTO_UNSPEC list is entered, so at
 * most one family mutex is held at any time.
 */
static int match_revfn(u8 af, const char *name, u8 revision, int *bestp)
{
	const struct xt_match *m;
	int have_rev = 0;

	mutex_lock(&xt[af].mutex);
	list_for_each_entry(m, &xt[af].match, list) {
		if (strcmp(m->name, name) == 0) {
			if (m->revision > *bestp)
				*bestp = m->revision;
			if (m->revision == revision)
				have_rev = 1;
		}
	}
	mutex_unlock(&xt[af].mutex);

	if (af != NFPROTO_UNSPEC && !have_rev)
		return match_revfn(NFPROTO_UNSPEC, name, revision, bestp);

	return have_rev;
}

/*
 * Target counterpart of match_revfn(): same contract and same locking,
 * applied to the target lists.
 */
static int target_revfn(u8 af, const char *name, u8 revision, int *bestp)
{
	const struct xt_target *t;
	int have_rev = 0;

	mutex_lock(&xt[af].mutex);
	list_for_each_entry(t, &xt[af].target, list) {
		if (strcmp(t->name, name) == 0) {
			if (t->revision > *bestp)
				*bestp = t->revision;
			if (t->revision == revision)
				have_rev = 1;
		}
	}
	mutex_unlock(&xt[af].mutex);

	if (af != NFPROTO_UNSPEC && !have_rev)
		return target_revfn(NFPROTO_UNSPEC, name, revision, bestp);

	return have_rev;
}

/*
 * Returns true or false (if no such extension at all).
 *
 * @target selects the target lists when it is 1, the match lists otherwise.
 * On return *@err holds:
 *   -ENOENT           nothing called @name is registered (return value 0,
 *                     so the caller may try loading a module);
 *   -EPROTONOSUPPORT  @name exists, but not in @revision (return value 1);
 *   best revision     @name exists in @revision; the highest registered
 *                     revision is reported (return value 1).
 *
 * The family mutexes are taken inside the *_revfn() helpers rather than
 * here: the helpers fall back to the NFPROTO_UNSPEC lists, and holding only
 * xt[af].mutex around them would leave that second walk unprotected.
 */
int xt_find_revision(u8 af, const char *name, u8 revision, int target,
		     int *err)
{
	int have_rev, best = -1;

	if (target == 1)
		have_rev = target_revfn(af, name, revision, &best);
	else
		have_rev = match_revfn(af, name, revision, &best);

	/* Nothing at all?  Return 0 to try loading module. */
	if (best == -1) {
		*err = -ENOENT;
		return 0;
	}

	*err = best;
	if (!have_rev)
		*err = -EPROTONOSUPPORT;
	return 1;
}
EXPORT_SYMBOL_GPL(xt_find_revision);

337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362
/*
 * textify_hooks - render a hook bitmask as "NAME/NAME/..." text
 * @buf:  destination buffer
 * @size: capacity of @buf in bytes
 * @mask: bit i set selects names[i]
 *
 * Returns @buf.  When @size is non-zero the result is always
 * NUL-terminated; if the selected names do not fit, the text is cut off at
 * the end of the buffer and no further names are appended.  With @size == 0
 * the buffer is not touched.
 */
static char *textify_hooks(char *buf, size_t size, unsigned int mask)
{
	static const char *const names[] = {
		"PREROUTING", "INPUT", "FORWARD",
		"OUTPUT", "POSTROUTING", "BROUTING",
	};
	unsigned int i;
	char *p = buf;
	bool np = false;
	int res;

	if (size == 0)
		return buf;

	*p = '\0';
	for (i = 0; i < ARRAY_SIZE(names); ++i) {
		if (!(mask & (1U << i)))
			continue;
		res = snprintf(p, size, "%s%s", np ? "/" : "", names[i]);
		/*
		 * snprintf() reports the length it wanted to write, which on
		 * truncation is >= the space left.  Advancing by it would
		 * wrap "size" around and move "p" past the buffer, so stop.
		 */
		if (res < 0 || (size_t)res >= size)
			break;
		size -= res;
		p += res;
		np = true;
	}

	return buf;
}

363
/*
 * xt_check_match - validate a match against the rule it is used in
 * @par:       check parameters; par->match is the extension being checked
 * @size:      size of the match data as supplied by the caller
 * @proto:     protocol of the rule
 * @inv_proto: true if the rule's protocol test is inverted
 *
 * Checks, in order: data size, table restriction, hook restriction and
 * protocol restriction, then calls the extension's own checkentry() hook if
 * it has one.  Returns 0 if everything passed, -EINVAL for a failed generic
 * check, a negative checkentry() result unchanged, or -EIO if checkentry()
 * returned a positive value.
 */
int xt_check_match(struct xt_mtchk_param *par,
		   unsigned int size, u_int8_t proto, bool inv_proto)
{
	const struct xt_match *match = par->match;
	int ret;

	/*
	 * ebt_among is exempt from centralized matchsize checking
	 * because it uses a dynamic-size data set.
	 */
	if (match->matchsize != -1 && XT_ALIGN(match->matchsize) != size) {
		pr_err("%s_tables: %s.%u match: invalid size "
		       "%u (kernel) != (user) %u\n",
		       xt_prefix[par->family], match->name, match->revision,
		       XT_ALIGN(match->matchsize), size);
		return -EINVAL;
	}

	if (match->table != NULL && strcmp(match->table, par->table) != 0) {
		pr_err("%s_tables: %s match: only valid in %s table, not %s\n",
		       xt_prefix[par->family], match->name,
		       match->table, par->table);
		return -EINVAL;
	}

	if (match->hooks && (par->hook_mask & ~match->hooks) != 0) {
		char used[64], allow[64];

		pr_err("%s_tables: %s match: used from hooks %s, but only "
		       "valid from %s\n",
		       xt_prefix[par->family], match->name,
		       textify_hooks(used, sizeof(used), par->hook_mask),
		       textify_hooks(allow, sizeof(allow), match->hooks));
		return -EINVAL;
	}

	if (match->proto && (match->proto != proto || inv_proto)) {
		pr_err("%s_tables: %s match: only valid for protocol %u\n",
		       xt_prefix[par->family], match->name, match->proto);
		return -EINVAL;
	}

	if (match->checkentry == NULL)
		return 0;

	ret = match->checkentry(par);
	if (ret > 0)
		/* Flag up potential errors. */
		return -EIO;
	return ret;
}
EXPORT_SYMBOL_GPL(xt_check_match);

416
#ifdef CONFIG_COMPAT
417
/*
 * Record a compat adjustment of @delta for @offset in family @af.
 *
 * The new node becomes the head if the list is empty, otherwise it is
 * inserted right behind the current head.  Returns 0, or -ENOMEM if the
 * node could not be allocated.
 */
int xt_compat_add_offset(u_int8_t af, unsigned int offset, short delta)
{
	struct compat_delta **head = &xt[af].compat_offsets;
	struct compat_delta *node;

	node = kmalloc(sizeof(struct compat_delta), GFP_KERNEL);
	if (node == NULL)
		return -ENOMEM;

	node->offset = offset;
	node->delta = delta;

	if (*head == NULL) {
		node->next = NULL;
		*head = node;
	} else {
		node->next = (*head)->next;
		(*head)->next = node;
	}
	return 0;
}
EXPORT_SYMBOL_GPL(xt_compat_add_offset);

439
/* Free every compat_delta node of family @af and reset the list to empty. */
void xt_compat_flush_offsets(u_int8_t af)
{
	struct compat_delta *cur = xt[af].compat_offsets;

	if (cur == NULL)
		return;

	while (cur != NULL) {
		struct compat_delta *following = cur->next;

		kfree(cur);
		cur = following;
	}
	xt[af].compat_offsets = NULL;
}
EXPORT_SYMBOL_GPL(xt_compat_flush_offsets);

453
/*
 * Return the sum of the deltas of all entries recorded for family @af whose
 * offset is strictly below @offset (0 if there are none).
 */
int xt_compat_calc_jump(u_int8_t af, unsigned int offset)
{
	const struct compat_delta *node = xt[af].compat_offsets;
	int total = 0;

	while (node != NULL) {
		if (node->offset < offset)
			total += node->delta;
		node = node->next;
	}
	return total;
}
EXPORT_SYMBOL_GPL(xt_compat_calc_jump);

465
int xt_compat_match_offset(const struct xt_match *match)
466
{
467 468 469 470 471
	u_int16_t csize = match->compatsize ? : match->matchsize;
	return XT_ALIGN(match->matchsize) - COMPAT_XT_ALIGN(csize);
}
EXPORT_SYMBOL_GPL(xt_compat_match_offset);

472
int xt_compat_match_from_user(struct xt_entry_match *m, void **dstptr,
473
			      unsigned int *size)
474
{
475
	const struct xt_match *match = m->u.kernel.match;
476 477 478 479 480 481 482 483 484 485 486 487 488 489 490 491 492 493 494
	struct compat_xt_entry_match *cm = (struct compat_xt_entry_match *)m;
	int pad, off = xt_compat_match_offset(match);
	u_int16_t msize = cm->u.user.match_size;

	m = *dstptr;
	memcpy(m, cm, sizeof(*cm));
	if (match->compat_from_user)
		match->compat_from_user(m->data, cm->data);
	else
		memcpy(m->data, cm->data, msize - sizeof(*cm));
	pad = XT_ALIGN(match->matchsize) - match->matchsize;
	if (pad > 0)
		memset(m->data + match->matchsize, 0, pad);

	msize += off;
	m->u.user.match_size = msize;

	*size += off;
	*dstptr += msize;
495
	return 0;
496 497 498
}
EXPORT_SYMBOL_GPL(xt_compat_match_from_user);

499 500
/*
 * Write the native match entry @m to userspace at *@dstptr in compat layout.
 *
 * The header is copied, match_size is replaced by the compat size, the name
 * field is overwritten with the extension's name, and the payload is
 * converted by compat_to_user() (or copied verbatim if there is no hook).
 * On success *@size shrinks by the compat offset, *@dstptr is advanced past
 * the entry and 0 is returned; any failed user copy yields -EFAULT.
 */
int xt_compat_match_to_user(const struct xt_entry_match *m,
			    void __user **dstptr, unsigned int *size)
{
	const struct xt_match *match = m->u.kernel.match;
	struct compat_xt_entry_match __user *cm = *dstptr;
	int off = xt_compat_match_offset(match);
	u_int16_t msize = m->u.user.match_size - off;

	if (copy_to_user(cm, m, sizeof(*cm)))
		return -EFAULT;
	if (put_user(msize, &cm->u.user.match_size))
		return -EFAULT;
	if (copy_to_user(cm->u.user.name, match->name,
			 strlen(match->name) + 1))
		return -EFAULT;

	if (match->compat_to_user) {
		if (match->compat_to_user((void __user *)cm->data, m->data))
			return -EFAULT;
	} else if (copy_to_user(cm->data, m->data, msize - sizeof(*cm))) {
		return -EFAULT;
	}

	*size -= off;
	*dstptr += msize;
	return 0;
}
EXPORT_SYMBOL_GPL(xt_compat_match_to_user);
#endif /* CONFIG_COMPAT */
527

528
/*
 * xt_check_target - validate a target against the rule it is used in
 * @par:       check parameters; par->target is the extension being checked
 * @size:      size of the target data as supplied by the caller
 * @proto:     protocol of the rule
 * @inv_proto: true if the rule's protocol test is inverted
 *
 * Checks, in order: data size, table restriction, hook restriction and
 * protocol restriction, then calls the extension's own checkentry() hook if
 * it has one.  Returns 0 if everything passed and -EINVAL otherwise
 * (including when checkentry() returns zero/false).
 */
int xt_check_target(struct xt_tgchk_param *par,
		    unsigned int size, u_int8_t proto, bool inv_proto)
{
	const struct xt_target *target = par->target;

	if (XT_ALIGN(target->targetsize) != size) {
		pr_err("%s_tables: %s.%u target: invalid size "
		       "%u (kernel) != (user) %u\n",
		       xt_prefix[par->family], target->name, target->revision,
		       XT_ALIGN(target->targetsize), size);
		return -EINVAL;
	}

	if (target->table != NULL && strcmp(target->table, par->table) != 0) {
		pr_err("%s_tables: %s target: only valid in %s table, not %s\n",
		       xt_prefix[par->family], target->name,
		       target->table, par->table);
		return -EINVAL;
	}

	if (target->hooks && (par->hook_mask & ~target->hooks) != 0) {
		char used[64], allow[64];

		pr_err("%s_tables: %s target: used from hooks %s, but only "
		       "usable from %s\n",
		       xt_prefix[par->family], target->name,
		       textify_hooks(used, sizeof(used), par->hook_mask),
		       textify_hooks(allow, sizeof(allow), target->hooks));
		return -EINVAL;
	}

	if (target->proto && (target->proto != proto || inv_proto)) {
		pr_err("%s_tables: %s target: only valid for protocol %u\n",
		       xt_prefix[par->family], target->name, target->proto);
		return -EINVAL;
	}

	if (target->checkentry == NULL)
		return 0;
	if (!target->checkentry(par))
		return -EINVAL;
	return 0;
}
EXPORT_SYMBOL_GPL(xt_check_target);

568
#ifdef CONFIG_COMPAT
569
int xt_compat_target_offset(const struct xt_target *target)
570
{
571 572 573 574 575 576
	u_int16_t csize = target->compatsize ? : target->targetsize;
	return XT_ALIGN(target->targetsize) - COMPAT_XT_ALIGN(csize);
}
EXPORT_SYMBOL_GPL(xt_compat_target_offset);

void xt_compat_target_from_user(struct xt_entry_target *t, void **dstptr,
577
				unsigned int *size)
578
{
579
	const struct xt_target *target = t->u.kernel.target;
580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601
	struct compat_xt_entry_target *ct = (struct compat_xt_entry_target *)t;
	int pad, off = xt_compat_target_offset(target);
	u_int16_t tsize = ct->u.user.target_size;

	t = *dstptr;
	memcpy(t, ct, sizeof(*ct));
	if (target->compat_from_user)
		target->compat_from_user(t->data, ct->data);
	else
		memcpy(t->data, ct->data, tsize - sizeof(*ct));
	pad = XT_ALIGN(target->targetsize) - target->targetsize;
	if (pad > 0)
		memset(t->data + target->targetsize, 0, pad);

	tsize += off;
	t->u.user.target_size = tsize;

	*size += off;
	*dstptr += tsize;
}
EXPORT_SYMBOL_GPL(xt_compat_target_from_user);

602 603
/*
 * Write the native target entry @t to userspace at *@dstptr in compat
 * layout.
 *
 * The header is copied, target_size is replaced by the compat size, the
 * name field is overwritten with the extension's name, and the payload is
 * converted by compat_to_user() (or copied verbatim if there is no hook).
 * On success *@size shrinks by the compat offset, *@dstptr is advanced past
 * the entry and 0 is returned; any failed user copy yields -EFAULT.
 */
int xt_compat_target_to_user(const struct xt_entry_target *t,
			     void __user **dstptr, unsigned int *size)
{
	const struct xt_target *target = t->u.kernel.target;
	struct compat_xt_entry_target __user *ct = *dstptr;
	int off = xt_compat_target_offset(target);
	u_int16_t tsize = t->u.user.target_size - off;

	if (copy_to_user(ct, t, sizeof(*ct)))
		return -EFAULT;
	if (put_user(tsize, &ct->u.user.target_size))
		return -EFAULT;
	if (copy_to_user(ct->u.user.name, target->name,
			 strlen(target->name) + 1))
		return -EFAULT;

	if (target->compat_to_user) {
		if (target->compat_to_user((void __user *)ct->data, t->data))
			return -EFAULT;
	} else if (copy_to_user(ct->data, t->data, tsize - sizeof(*ct))) {
		return -EFAULT;
	}

	*size -= off;
	*dstptr += tsize;
	return 0;
}
EXPORT_SYMBOL_GPL(xt_compat_target_to_user);
629 630
#endif

631 632 633 634 635 636
struct xt_table_info *xt_alloc_table_info(unsigned int size)
{
	struct xt_table_info *newinfo;
	int cpu;

	/* Pedantry: prevent them from hitting BUG() in vmalloc.c --RR */
637
	if ((SMP_ALIGN(size) >> PAGE_SHIFT) + 2 > totalram_pages)
638 639
		return NULL;

640
	newinfo = kzalloc(XT_TABLE_INFO_SZ, GFP_KERNEL);
641 642 643 644 645
	if (!newinfo)
		return NULL;

	newinfo->size = size;

646
	for_each_possible_cpu(cpu) {
647 648 649 650 651 652 653 654 655 656 657 658 659 660 661 662 663 664 665 666 667 668
		if (size <= PAGE_SIZE)
			newinfo->entries[cpu] = kmalloc_node(size,
							GFP_KERNEL,
							cpu_to_node(cpu));
		else
			newinfo->entries[cpu] = vmalloc_node(size,
							cpu_to_node(cpu));

		if (newinfo->entries[cpu] == NULL) {
			xt_free_table_info(newinfo);
			return NULL;
		}
	}

	return newinfo;
}
EXPORT_SYMBOL(xt_alloc_table_info);

void xt_free_table_info(struct xt_table_info *info)
{
	int cpu;

669
	for_each_possible_cpu(cpu) {
670 671 672 673 674 675 676 677 678 679
		if (info->size <= PAGE_SIZE)
			kfree(info->entries[cpu]);
		else
			vfree(info->entries[cpu]);
	}
	kfree(info);
}
EXPORT_SYMBOL(xt_free_table_info);

/* Find table by name, grabs mutex & ref.  Returns ERR_PTR() on error. */
680 681
struct xt_table *xt_find_table_lock(struct net *net, u_int8_t af,
				    const char *name)
682 683 684
{
	struct xt_table *t;

I
Ingo Molnar 已提交
685
	if (mutex_lock_interruptible(&xt[af].mutex) != 0)
686 687
		return ERR_PTR(-EINTR);

688
	list_for_each_entry(t, &net->xt.tables[af], list)
689 690
		if (strcmp(t->name, name) == 0 && try_module_get(t->me))
			return t;
I
Ingo Molnar 已提交
691
	mutex_unlock(&xt[af].mutex);
692 693 694 695 696 697
	return NULL;
}
EXPORT_SYMBOL_GPL(xt_find_table_lock);

void xt_table_unlock(struct xt_table *table)
{
I
Ingo Molnar 已提交
698
	mutex_unlock(&xt[table->af].mutex);
699 700 701
}
EXPORT_SYMBOL_GPL(xt_table_unlock);

702
#ifdef CONFIG_COMPAT
703
/* Take the compat mutex of family @af. */
void xt_compat_lock(u_int8_t af)
{
	struct xt_af *fam = &xt[af];

	mutex_lock(&fam->compat_mutex);
}
EXPORT_SYMBOL_GPL(xt_compat_lock);

709
/* Release the compat mutex of family @af. */
void xt_compat_unlock(u_int8_t af)
{
	struct xt_af *fam = &xt[af];

	mutex_unlock(&fam->compat_mutex);
}
EXPORT_SYMBOL_GPL(xt_compat_unlock);
#endif
715

716 717 718 719
/*
 * One struct xt_info_lock per CPU, exported for GPL modules.  It is not
 * referenced anywhere else in the visible part of this file.
 */
DEFINE_PER_CPU(struct xt_info_lock, xt_info_locks);
EXPORT_PER_CPU_SYMBOL_GPL(xt_info_locks);


720 721 722 723 724 725
struct xt_table_info *
xt_replace_table(struct xt_table *table,
	      unsigned int num_counters,
	      struct xt_table_info *newinfo,
	      int *error)
{
726
	struct xt_table_info *private;
727 728

	/* Do the substitution. */
729
	local_bh_disable();
730
	private = table->private;
731

732 733
	/* Check inside lock: is the old number correct? */
	if (num_counters != private->number) {
734
		pr_debug("num_counters != table->private->number (%u/%u)\n",
735
			 num_counters, private->number);
736
		local_bh_enable();
737 738 739 740
		*error = -EAGAIN;
		return NULL;
	}

741 742 743 744 745 746 747 748 749 750 751 752
	table->private = newinfo;
	newinfo->initial_entries = private->initial_entries;

	/*
	 * Even though table entries have now been swapped, other CPU's
	 * may still be using the old entries. This is okay, because
	 * resynchronization happens because of the locking done
	 * during the get_counters() routine.
	 */
	local_bh_enable();

	return private;
753 754 755
}
EXPORT_SYMBOL_GPL(xt_replace_table);

756 757
struct xt_table *xt_register_table(struct net *net,
				   const struct xt_table *input_table,
758 759
				   struct xt_table_info *bootstrap,
				   struct xt_table_info *newinfo)
760 761 762
{
	int ret;
	struct xt_table_info *private;
763
	struct xt_table *t, *table;
764

765
	/* Don't add one object to multiple lists. */
766
	table = kmemdup(input_table, sizeof(struct xt_table), GFP_KERNEL);
767 768 769 770 771
	if (!table) {
		ret = -ENOMEM;
		goto out;
	}

I
Ingo Molnar 已提交
772
	ret = mutex_lock_interruptible(&xt[table->af].mutex);
773
	if (ret != 0)
774
		goto out_free;
775 776

	/* Don't autoload: we'd eat our tail... */
777
	list_for_each_entry(t, &net->xt.tables[table->af], list) {
P
Patrick McHardy 已提交
778 779 780 781
		if (strcmp(t->name, table->name) == 0) {
			ret = -EEXIST;
			goto unlock;
		}
782 783 784 785
	}

	/* Simplifies replace_table code. */
	table->private = bootstrap;
786

787 788 789 790
	if (!xt_replace_table(table, 0, newinfo, &ret))
		goto unlock;

	private = table->private;
791
	pr_debug("table->private->number = %u\n", private->number);
792 793 794 795

	/* save number of initial entries */
	private->initial_entries = private->number;

796
	list_add(&table->list, &net->xt.tables[table->af]);
797 798
	mutex_unlock(&xt[table->af].mutex);
	return table;
799 800

 unlock:
I
Ingo Molnar 已提交
801
	mutex_unlock(&xt[table->af].mutex);
802 803
out_free:
	kfree(table);
804 805
out:
	return ERR_PTR(ret);
806 807 808 809 810 811 812
}
EXPORT_SYMBOL_GPL(xt_register_table);

void *xt_unregister_table(struct xt_table *table)
{
	struct xt_table_info *private;

I
Ingo Molnar 已提交
813
	mutex_lock(&xt[table->af].mutex);
814
	private = table->private;
P
Patrick McHardy 已提交
815
	list_del(&table->list);
I
Ingo Molnar 已提交
816
	mutex_unlock(&xt[table->af].mutex);
817
	kfree(table);
818 819 820 821 822 823

	return private;
}
EXPORT_SYMBOL_GPL(xt_unregister_table);

#ifdef CONFIG_PROC_FS
824 825
struct xt_names_priv {
	struct seq_net_private p;
826
	u_int8_t af;
827
};
828
/*
 * seq_file ->start: take the family mutex and position on element *@pos of
 * the namespace's table list.  The mutex is dropped in xt_table_seq_stop().
 */
static void *xt_table_seq_start(struct seq_file *seq, loff_t *pos)
{
	const struct xt_names_priv *priv = seq->private;
	struct net *net = seq_file_net(seq);
	const u_int8_t af = priv->af;

	mutex_lock(&xt[af].mutex);

	return seq_list_start(&net->xt.tables[af], *pos);
}
837

838 839
/* seq_file ->next: step to the element after @v in the table list. */
static void *xt_table_seq_next(struct seq_file *seq, void *v, loff_t *pos)
{
	const struct xt_names_priv *priv = seq->private;
	struct net *net = seq_file_net(seq);
	struct list_head *tables = &net->xt.tables[priv->af];

	return seq_list_next(v, tables, pos);
}

847
static void xt_table_seq_stop(struct seq_file *seq, void *v)
848
{
849
	struct xt_names_priv *priv = seq->private;
850
	u_int8_t af = priv->af;
851

852 853
	mutex_unlock(&xt[af].mutex);
}
854

855 856 857
static int xt_table_seq_show(struct seq_file *seq, void *v)
{
	struct xt_table *table = list_entry(v, struct xt_table, list);
858

859 860 861 862 863
	if (strlen(table->name))
		return seq_printf(seq, "%s\n", table->name);
	else
		return 0;
}
864

865 866 867 868 869 870 871 872 873 874
/*
 * Iterator for the table-name listing.  ->start takes the family mutex and
 * ->stop releases it.
 */
static const struct seq_operations xt_table_seq_ops = {
	.start	= xt_table_seq_start,
	.next	= xt_table_seq_next,
	.stop	= xt_table_seq_stop,
	.show	= xt_table_seq_show,
};

static int xt_table_open(struct inode *inode, struct file *file)
{
	int ret;
875
	struct xt_names_priv *priv;
876

877 878
	ret = seq_open_net(inode, file, &xt_table_seq_ops,
			   sizeof(struct xt_names_priv));
879
	if (!ret) {
880 881
		priv = ((struct seq_file *)file->private_data)->private;
		priv->af = (unsigned long)PDE(inode)->data;
882 883
	}
	return ret;
884 885
}

886 887 888 889 890
static const struct file_operations xt_table_ops = {
	.owner	 = THIS_MODULE,
	.open	 = xt_table_open,
	.read	 = seq_read,
	.llseek	 = seq_lseek,
891
	.release = seq_release_net,
892 893
};

894 895 896 897 898 899 900 901 902 903 904 905 906 907 908 909 910 911
/*
 * Traversal state for the match and target listings.  A listing walks the
 * NFPROTO_UNSPEC list first and the list of one specific family afterwards;
 * this state lets the seq_file iterator cross from the first family's mutex
 * to the second's.
 */
struct nf_mttg_trav {
	/* head: list being walked; curr: current position (== head before the first element) */
	struct list_head *head, *curr;
	/* class: one of the MTTG_TRAV_* values; nfproto: the specific family to list */
	uint8_t class, nfproto;
};

/* Values of nf_mttg_trav.class: where the traversal currently stands. */
enum {
	MTTG_TRAV_INIT,		/* nothing walked or locked yet */
	MTTG_TRAV_NFP_UNSPEC,	/* on the NFPROTO_UNSPEC list, its mutex held */
	MTTG_TRAV_NFP_SPEC,	/* on the trav->nfproto list, its mutex held */
	MTTG_TRAV_DONE,		/* end marker */
};

/*
 * Advance the match/target traversal by one step.
 *
 * @is_target selects the target lists (true) or the match lists (false).
 * @v is unused.  *@ppos is incremented on a successful step unless @ppos is
 * NULL.
 *
 * From MTTG_TRAV_INIT the step locks the NFPROTO_UNSPEC mutex and parks on
 * that list's head.  When the UNSPEC list is exhausted, its mutex is dropped,
 * the mutex of trav->nfproto is taken and the traversal parks on that list's
 * head.  Returns the traversal state, or NULL once the family list is
 * exhausted (or for any other class); in that case no lock is changed here.
 */
static void *xt_mttg_seq_next(struct seq_file *seq, void *v, loff_t *ppos,
    bool is_target)
{
	struct nf_mttg_trav *trav = seq->private;
	struct xt_af *fam;

	switch (trav->class) {
	case MTTG_TRAV_INIT:
		fam = &xt[NFPROTO_UNSPEC];
		trav->class = MTTG_TRAV_NFP_UNSPEC;
		mutex_lock(&fam->mutex);
		trav->head = is_target ? &fam->target : &fam->match;
		trav->curr = trav->head;
		break;
	case MTTG_TRAV_NFP_UNSPEC:
		trav->curr = trav->curr->next;
		if (trav->curr != trav->head)
			break;
		/* UNSPEC list done: swap mutexes, continue with the family. */
		mutex_unlock(&xt[NFPROTO_UNSPEC].mutex);
		fam = &xt[trav->nfproto];
		mutex_lock(&fam->mutex);
		trav->head = is_target ? &fam->target : &fam->match;
		trav->curr = trav->head;
		trav->class = MTTG_TRAV_NFP_SPEC;
		break;
	case MTTG_TRAV_NFP_SPEC:
		trav->curr = trav->curr->next;
		if (trav->curr != trav->head)
			break;
		/* fallthru, _stop will unlock */
	default:
		return NULL;
	}

	if (ppos != NULL)
		++*ppos;
	return trav;
}
949

950 951
/*
 * Restart the traversal from MTTG_TRAV_INIT and replay *@pos steps.
 * Returns the traversal state, or NULL if the lists end before *@pos steps
 * were taken.
 */
static void *xt_mttg_seq_start(struct seq_file *seq, loff_t *pos,
    bool is_target)
{
	struct nf_mttg_trav *trav = seq->private;
	unsigned int steps = 0;

	trav->class = MTTG_TRAV_INIT;
	while (steps < *pos) {
		if (xt_mttg_seq_next(seq, NULL, NULL, is_target) == NULL)
			return NULL;
		++steps;
	}
	return trav;
}

963
static void xt_mttg_seq_stop(struct seq_file *seq, void *v)
964
{
965 966 967 968 969 970 971 972 973 974 975
	struct nf_mttg_trav *trav = seq->private;

	switch (trav->class) {
	case MTTG_TRAV_NFP_UNSPEC:
		mutex_unlock(&xt[NFPROTO_UNSPEC].mutex);
		break;
	case MTTG_TRAV_NFP_SPEC:
		mutex_unlock(&xt[trav->nfproto].mutex);
		break;
	}
}
976

977 978 979
/* seq_file ->start for the match listing. */
static void *xt_match_seq_start(struct seq_file *seq, loff_t *pos)
{
	const bool is_target = false;

	return xt_mttg_seq_start(seq, pos, is_target);
}

982
/* seq_file ->next for the match listing. */
static void *xt_match_seq_next(struct seq_file *seq, void *v, loff_t *ppos)
{
	const bool is_target = false;

	return xt_mttg_seq_next(seq, v, ppos, is_target);
}
986

987 988 989 990 991 992 993 994 995 996 997 998 999 1000 1001
/*
 * seq_file ->show for the match listing: print the name of the match at the
 * current position.  Nothing is printed while the traversal is parked on a
 * list head, for an empty name, or when no list is being walked.
 */
static int xt_match_seq_show(struct seq_file *seq, void *v)
{
	const struct nf_mttg_trav *trav = seq->private;
	const struct xt_match *match;

	if (trav->class != MTTG_TRAV_NFP_UNSPEC &&
	    trav->class != MTTG_TRAV_NFP_SPEC)
		return 0;
	if (trav->curr == trav->head)
		return 0;

	match = list_entry(trav->curr, struct xt_match, list);
	if (*match->name == '\0')
		return 0;
	return seq_printf(seq, "%s\n", match->name);
}

1004 1005 1006
static const struct seq_operations xt_match_seq_ops = {
	.start	= xt_match_seq_start,
	.next	= xt_match_seq_next,
1007
	.stop	= xt_mttg_seq_stop,
1008
	.show	= xt_match_seq_show,
1009 1010
};

1011
static int xt_match_open(struct inode *inode, struct file *file)
1012
{
1013 1014
	struct seq_file *seq;
	struct nf_mttg_trav *trav;
1015 1016
	int ret;

1017 1018 1019
	trav = kmalloc(sizeof(*trav), GFP_KERNEL);
	if (trav == NULL)
		return -ENOMEM;
1020

1021 1022 1023 1024
	ret = seq_open(file, &xt_match_seq_ops);
	if (ret < 0) {
		kfree(trav);
		return ret;
1025
	}
1026 1027 1028 1029 1030

	seq = file->private_data;
	seq->private = trav;
	trav->nfproto = (unsigned long)PDE(inode)->data;
	return 0;
1031 1032 1033 1034 1035 1036 1037
}

static const struct file_operations xt_match_ops = {
	.owner	 = THIS_MODULE,
	.open	 = xt_match_open,
	.read	 = seq_read,
	.llseek	 = seq_lseek,
1038
	.release = seq_release_private,
1039
};
1040

1041 1042
/* seq_file ->start for the target listing. */
static void *xt_target_seq_start(struct seq_file *seq, loff_t *pos)
{
	const bool is_target = true;

	return xt_mttg_seq_start(seq, pos, is_target);
}

1046
/* seq_file ->next for the target listing. */
static void *xt_target_seq_next(struct seq_file *seq, void *v, loff_t *ppos)
{
	const bool is_target = true;

	return xt_mttg_seq_next(seq, v, ppos, is_target);
}

static int xt_target_seq_show(struct seq_file *seq, void *v)
{
1053 1054 1055 1056 1057 1058 1059 1060 1061 1062 1063 1064 1065
	const struct nf_mttg_trav *trav = seq->private;
	const struct xt_target *target;

	switch (trav->class) {
	case MTTG_TRAV_NFP_UNSPEC:
	case MTTG_TRAV_NFP_SPEC:
		if (trav->curr == trav->head)
			return 0;
		target = list_entry(trav->curr, struct xt_target, list);
		return (*target->name == '\0') ? 0 :
		       seq_printf(seq, "%s\n", target->name);
	}
	return 0;
1066 1067 1068 1069 1070
}

static const struct seq_operations xt_target_seq_ops = {
	.start	= xt_target_seq_start,
	.next	= xt_target_seq_next,
1071
	.stop	= xt_mttg_seq_stop,
1072 1073 1074 1075 1076
	.show	= xt_target_seq_show,
};

static int xt_target_open(struct inode *inode, struct file *file)
{
1077 1078
	struct seq_file *seq;
	struct nf_mttg_trav *trav;
1079 1080
	int ret;

1081 1082 1083
	trav = kmalloc(sizeof(*trav), GFP_KERNEL);
	if (trav == NULL)
		return -ENOMEM;
1084

1085 1086 1087 1088
	ret = seq_open(file, &xt_target_seq_ops);
	if (ret < 0) {
		kfree(trav);
		return ret;
1089
	}
1090 1091 1092 1093 1094

	seq = file->private_data;
	seq->private = trav;
	trav->nfproto = (unsigned long)PDE(inode)->data;
	return 0;
1095 1096
}

1097
static const struct file_operations xt_target_ops = {
1098
	.owner	 = THIS_MODULE,
1099
	.open	 = xt_target_open,
1100 1101
	.read	 = seq_read,
	.llseek	 = seq_lseek,
1102
	.release = seq_release_private,
1103 1104 1105 1106 1107 1108 1109 1110
};

/*
 * Name suffixes for the three listings (tables, matches, targets).
 * NOTE(review): presumably appended to an xt_prefix[] entry to form the
 * proc file names -- the code that uses them is not visible here; confirm.
 */
#define FORMAT_TABLES	"_tables_names"
#define	FORMAT_MATCHES	"_tables_matches"
#define FORMAT_TARGETS 	"_tables_targets"

#endif /* CONFIG_PROC_FS */

1111 1112 1113 1114 1115 1116 1117 1118 1119 1120 1121 1122 1123 1124 1125 1126 1127 1128 1129 1130 1131 1132 1133 1134 1135 1136 1137 1138 1139 1140 1141 1142 1143 1144 1145 1146 1147 1148 1149 1150 1151 1152 1153 1154 1155 1156 1157 1158 1159 1160 1161 1162 1163 1164
/**
 * xt_hook_link - set up hooks for a new table
 * @table:	table with metadata needed to set up hooks
 * @fn:		Hook function
 *
 * This function will take care of creating and registering the necessary
 * Netfilter hooks for XT tables.  One nf_hook_ops entry is built for every
 * bit set in @table->valid_hooks; the bit position becomes the hook number,
 * and owner, protocol family and priority are copied from @table.
 *
 * Returns the nf_hook_ops array on success.  On failure an ERR_PTR() is
 * returned: -ENOMEM if the array cannot be allocated, otherwise the error
 * from nf_register_hooks().  A successfully returned array is torn down
 * with xt_hook_unlink().
 */
struct nf_hook_ops *xt_hook_link(const struct xt_table *table, nf_hookfn *fn)
{
	unsigned int hook_mask = table->valid_hooks;
	uint8_t i, num_hooks = hweight32(hook_mask);
	uint8_t hooknum;
	struct nf_hook_ops *ops;
	int ret;

	/*
	 * Zero the array: only a subset of nf_hook_ops members is assigned
	 * below, and the rest must not carry stale heap contents.  kcalloc()
	 * also checks the count * size multiplication for overflow.
	 */
	ops = kcalloc(num_hooks, sizeof(*ops), GFP_KERNEL);
	if (ops == NULL)
		return ERR_PTR(-ENOMEM);

	/* Walk the mask bit by bit; i counts entries filled so far. */
	for (i = 0, hooknum = 0; i < num_hooks && hook_mask != 0;
	     hook_mask >>= 1, ++hooknum) {
		if (!(hook_mask & 1))
			continue;
		ops[i].hook     = fn;
		ops[i].owner    = table->me;
		ops[i].pf       = table->af;
		ops[i].hooknum  = hooknum;
		ops[i].priority = table->priority;
		++i;
	}

	ret = nf_register_hooks(ops, num_hooks);
	if (ret < 0) {
		kfree(ops);
		return ERR_PTR(ret);
	}

	return ops;
}
EXPORT_SYMBOL_GPL(xt_hook_link);

/**
 * xt_hook_unlink - remove hooks for a table
 * @table:	table whose valid_hooks mask gives the number of entries in @ops
 * @ops:	nf_hook_ops array as returned by xt_hook_link
 *
 * Unregisters hweight32(@table->valid_hooks) hooks starting at @ops and
 * then frees the array.
 */
void xt_hook_unlink(const struct xt_table *table, struct nf_hook_ops *ops)
{
	nf_unregister_hooks(ops, hweight32(table->valid_hooks));
	kfree(ops);
}
EXPORT_SYMBOL_GPL(xt_hook_unlink);

1165
/**
 * xt_proto_init - create the proc entries for one protocol family
 * @net:	network namespace whose proc_net directory receives the entries
 * @af:		protocol family; used as index into xt_prefix[]
 *
 * With CONFIG_PROC_FS, creates three entries (mode 0440) named
 * "<prefix>_tables_names", "<prefix>_tables_matches" and
 * "<prefix>_tables_targets", each carrying @af as its data pointer.
 * If a later entry cannot be created, the ones created before it are
 * removed again.  Without CONFIG_PROC_FS only @af is range-checked.
 *
 * Returns 0 on success, -EINVAL if @af has no usable xt_prefix[] slot,
 * or -ENOMEM if a proc entry could not be created.
 */
int xt_proto_init(struct net *net, u_int8_t af)
{
#ifdef CONFIG_PROC_FS
	char buf[XT_FUNCTION_MAXNAMELEN];
	struct proc_dir_entry *proc;
#endif

	if (af >= ARRAY_SIZE(xt_prefix))
		return -EINVAL;


#ifdef CONFIG_PROC_FS
	/*
	 * xt_prefix[] is filled with designated initialisers, so a family
	 * without an entry has a NULL slot; do not hand that to strlcpy().
	 */
	if (xt_prefix[af] == NULL)
		return -EINVAL;

	strlcpy(buf, xt_prefix[af], sizeof(buf));
	strlcat(buf, FORMAT_TABLES, sizeof(buf));
	proc = proc_create_data(buf, 0440, net->proc_net, &xt_table_ops,
				(void *)(unsigned long)af);
	if (!proc)
		goto out;

	strlcpy(buf, xt_prefix[af], sizeof(buf));
	strlcat(buf, FORMAT_MATCHES, sizeof(buf));
	proc = proc_create_data(buf, 0440, net->proc_net, &xt_match_ops,
				(void *)(unsigned long)af);
	if (!proc)
		goto out_remove_tables;

	strlcpy(buf, xt_prefix[af], sizeof(buf));
	strlcat(buf, FORMAT_TARGETS, sizeof(buf));
	proc = proc_create_data(buf, 0440, net->proc_net, &xt_target_ops,
				(void *)(unsigned long)af);
	if (!proc)
		goto out_remove_matches;
#endif

	return 0;

#ifdef CONFIG_PROC_FS
	/* Unwind in reverse order of creation. */
out_remove_matches:
	strlcpy(buf, xt_prefix[af], sizeof(buf));
	strlcat(buf, FORMAT_MATCHES, sizeof(buf));
	proc_net_remove(net, buf);

out_remove_tables:
	strlcpy(buf, xt_prefix[af], sizeof(buf));
	strlcat(buf, FORMAT_TABLES, sizeof(buf));
	proc_net_remove(net, buf);
out:
	/* Report a real errno rather than a bare -1. */
	return -ENOMEM;
#endif
}
EXPORT_SYMBOL_GPL(xt_proto_init);

1217
/*
 * Remove the three proc entries of protocol family @af from @net.
 *
 * The entry names are rebuilt as xt_prefix[af] followed by the FORMAT_*
 * suffix and removed in the order tables, targets, matches.  Without
 * CONFIG_PROC_FS this function does nothing.
 */
void xt_proto_fini(struct net *net, u_int8_t af)
{
#ifdef CONFIG_PROC_FS
	static const char *const suffixes[] = {
		FORMAT_TABLES,
		FORMAT_TARGETS,
		FORMAT_MATCHES,
	};
	char name[XT_FUNCTION_MAXNAMELEN];
	unsigned int n;

	for (n = 0; n < ARRAY_SIZE(suffixes); n++) {
		strlcpy(name, xt_prefix[af], sizeof(name));
		strlcat(name, suffixes[n], sizeof(name));
		proc_net_remove(net, name);
	}
#endif /*CONFIG_PROC_FS*/
}
EXPORT_SYMBOL_GPL(xt_proto_fini);

1237 1238 1239 1240
/*
 * Per-namespace init hook (see xt_net_ops): sets every per-protocol
 * table list in net->xt.tables[] to an empty list.  Always returns 0.
 */
static int __net_init xt_net_init(struct net *net)
{
	int proto = 0;

	while (proto < NFPROTO_NUMPROTO) {
		INIT_LIST_HEAD(&net->xt.tables[proto]);
		proto++;
	}

	return 0;
}

/*
 * Per-network-namespace operations registered by xt_init(); only an init
 * hook is supplied.
 */
static struct pernet_operations xt_net_ops = {
	.init = xt_net_init,
};
1249 1250 1251

/*
 * Module init.
 *
 * 1. Initialise the xt_info_locks entry of every possible CPU.
 * 2. Allocate the global xt[] array with one struct xt_af per protocol
 *    family, and initialise its mutexes and match/target lists.
 * 3. Register the per-namespace operations.
 *
 * Returns 0 on success, -ENOMEM if xt[] cannot be allocated, or the error
 * from register_pernet_subsys() (in which case xt[] is freed again).
 */
static int __init xt_init(void)
{
	unsigned int i;
	int err;

	for_each_possible_cpu(i) {
		struct xt_info_lock *lock = &per_cpu(xt_info_locks, i);

		spin_lock_init(&lock->lock);
		lock->readers = 0;
	}

	xt = kmalloc(sizeof(*xt) * NFPROTO_NUMPROTO, GFP_KERNEL);
	if (xt == NULL)
		return -ENOMEM;

	/* kmalloc() does not zero: every member is set explicitly here. */
	for (i = 0; i < NFPROTO_NUMPROTO; i++) {
		mutex_init(&xt[i].mutex);
#ifdef CONFIG_COMPAT
		mutex_init(&xt[i].compat_mutex);
		xt[i].compat_offsets = NULL;
#endif
		INIT_LIST_HEAD(&xt[i].target);
		INIT_LIST_HEAD(&xt[i].match);
	}

	err = register_pernet_subsys(&xt_net_ops);
	if (err >= 0)
		return err;

	kfree(xt);
	return err;
}

/*
 * Module exit: undo xt_init() in reverse order by unregistering the
 * per-namespace operations and then freeing the global xt[] array.
 */
static void __exit xt_fini(void)
{
	unregister_pernet_subsys(&xt_net_ops);

	kfree(xt);
}

/* Hook xt_init()/xt_fini() up as the module's init and exit routines. */
module_init(xt_init);
module_exit(xt_fini);