x_tables.h 15.9 KB
Newer Older
1 2 3
#ifndef _X_TABLES_H
#define _X_TABLES_H

4 5
#include <linux/types.h>

6 7 8
/*
 * Extension (match/target) name budget: the structures in this header use
 * name[XT_FUNCTION_MAXNAMELEN-1] immediately followed by a one-byte revision.
 */
#define XT_FUNCTION_MAXNAMELEN 30
/* Size of the table name buffers used in this header. */
#define XT_TABLE_MAXNAMELEN 32

E
Eric Dumazet 已提交
9
struct xt_entry_match {
10 11
	union {
		struct {
12
			__u16 match_size;
13 14 15 16

			/* Used by userspace */
			char name[XT_FUNCTION_MAXNAMELEN-1];

17
			__u8 revision;
18 19
		} user;
		struct {
20
			__u16 match_size;
21 22 23 24 25 26

			/* Used inside the kernel */
			struct xt_match *match;
		} kernel;

		/* Total length */
27
		__u16 match_size;
28 29 30 31 32
	} u;

	unsigned char data[0];
};

E
Eric Dumazet 已提交
33
struct xt_entry_target {
34 35
	union {
		struct {
36
			__u16 target_size;
37 38 39 40

			/* Used by userspace */
			char name[XT_FUNCTION_MAXNAMELEN-1];

41
			__u8 revision;
42 43
		} user;
		struct {
44
			__u16 target_size;
45 46 47 48 49 50

			/* Used inside the kernel */
			struct xt_target *target;
		} kernel;

		/* Total length */
51
		__u16 target_size;
52 53 54 55 56
	} u;

	unsigned char data[0];
};

57 58 59 60 61 62 63 64
/*
 * Brace initializer for an object whose member `target' is a
 * struct xt_entry_target: sets the userspace view's target_size to
 * XT_ALIGN(size) and its name to the given string.  All other members are
 * left to default (zero) initialization.
 */
#define XT_TARGET_INIT(tname, tsize)					\
{									\
	.target = {							\
		.u = {							\
			.user = {					\
				.target_size = XT_ALIGN(tsize),		\
				.name = tname,				\
			},						\
		},							\
	},								\
}

E
Eric Dumazet 已提交
65
struct xt_standard_target {
66 67 68 69
	struct xt_entry_target target;
	int verdict;
};

70 71
/* The argument to IPT_SO_GET_REVISION_*.  Returns highest revision
 * kernel supports, if >= revision. */
E
Eric Dumazet 已提交
72
struct xt_get_revision {
73 74
	char name[XT_FUNCTION_MAXNAMELEN-1];

75
	__u8 revision;
76 77 78 79 80 81 82 83
};

/* CONTINUE verdict for targets (all 32 bits set) */
#define XT_CONTINUE 0xFFFFFFFF

/* For standard target.  NF_REPEAT is expected to come from another header. */
#define XT_RETURN (-NF_REPEAT - 1)

84 85 86 87 88
/* this is a dummy structure to find out the alignment requirement for a struct
 * containing all the fundamental data types that are used in ipt_entry,
 * ip6t_entry and arpt_entry.  This sucks, and it is a hack.  It will be my
 * personal pleasure to remove it -HW
 */
E
Eric Dumazet 已提交
89
struct _xt_align {
90 91 92 93
	__u8 u8;
	__u16 u16;
	__u32 u32;
	__u64 u64;
94 95 96 97
};

/*
 * Round s up to the next multiple of the alignment of struct _xt_align.
 * s is evaluated exactly once.
 */
#define XT_ALIGN(s)						\
	(((s) + (__alignof__(struct _xt_align) - 1)) &		\
	 ~(__alignof__(struct _xt_align) - 1))
98 99 100 101 102 103 104 105 106

/* Standard return verdict, or do jump.  The name is the empty string. */
#define XT_STANDARD_TARGET ""
/* Error verdict. */
#define XT_ERROR_TARGET "ERROR"

/* Overwrite counter c: byte count becomes b, packet count becomes p. */
#define SET_COUNTER(c,b,p)		\
	do {				\
		(c).bcnt = (b);		\
		(c).pcnt = (p);		\
	} while(0)
/* Accumulate into counter c: add b to the byte count and p to the packet count. */
#define ADD_COUNTER(c,b,p)		\
	do {				\
		(c).bcnt += (b);	\
		(c).pcnt += (p);	\
	} while(0)

E
Eric Dumazet 已提交
107
struct xt_counters {
108
	__u64 pcnt, bcnt;			/* Packet and byte counters */
109 110 111
};

/* The argument to IPT_SO_ADD_COUNTERS. */
E
Eric Dumazet 已提交
112
struct xt_counters_info {
113 114 115 116 117 118 119 120 121 122 123
	/* Which table. */
	char name[XT_TABLE_MAXNAMELEN];

	unsigned int num_counters;

	/* The counters (actually `number' of these). */
	struct xt_counters counters[0];
};

/* Flag bit requesting inverted protocol matching. */
#define XT_INV_PROTO		0x40	/* Invert the sense of PROTO. */

124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166
/*
 * Walk the struct xt_entry_match records stored inside rule entry e.
 *
 * The walk starts sizeof(type) bytes into e and advances by each record's
 * u.match_size until the offset reaches (e)->target_offset.  fn is invoked
 * as fn(match, args...) for every record.
 *
 * fn returns 0 to continue iteration; any other value stops the walk and
 * becomes the value of the whole expression (0 when the walk completes).
 *
 * e is fully parenthesized at each use, so it may be an arbitrary pointer
 * expression (e.g. a conditional), not just a plain identifier.
 */
#define XT_MATCH_ITERATE(type, e, fn, args...)			\
({								\
	unsigned int __i;					\
	int __ret = 0;						\
	struct xt_entry_match *__m;				\
								\
	for (__i = sizeof(type);				\
	     __i < (e)->target_offset;				\
	     __i += __m->u.match_size) {			\
		__m = (void *)(e) + __i;			\
								\
		__ret = fn(__m , ## args);			\
		if (__ret != 0)					\
			break;					\
	}							\
	__ret;							\
})

/*
 * Walk the entries packed back to back in the blob at entries, which is
 * size bytes long.  Each entry is a `type' whose next_offset member gives
 * the distance to the following entry.  The first n entries are stepped
 * over without calling fn; for every later entry fn(entry, args...) is
 * invoked.
 *
 * fn returns 0 to continue iteration; any other value stops the walk and
 * becomes the value of the whole expression (0 when the walk completes).
 *
 * n is parenthesized in the comparison so that an expression argument
 * (for instance a conditional) is compared as a whole.
 */
#define XT_ENTRY_ITERATE_CONTINUE(type, entries, size, n, fn, args...) \
({								\
	unsigned int __i, __n;					\
	int __ret = 0;						\
	type *__entry;						\
								\
	for (__i = 0, __n = 0; __i < (size);			\
	     __i += __entry->next_offset, __n++) {		\
		__entry = (void *)(entries) + __i;		\
		if (__n < (n))					\
			continue;				\
								\
		__ret = fn(__entry , ## args);			\
		if (__ret != 0)					\
			break;					\
	}							\
	__ret;							\
})

/*
 * Visit every entry of the blob: expands to XT_ENTRY_ITERATE_CONTINUE()
 * with a skip count of 0.  fn returns 0 to continue iteration.
 */
#define XT_ENTRY_ITERATE(type, entries, size, fn, args...)		\
	XT_ENTRY_ITERATE_CONTINUE(type, entries, size, 0, fn, args)

167 168 169 170
#ifdef __KERNEL__

#include <linux/netdevice.h>

171 172 173 174 175 176 177 178 179
/**
 * struct xt_match_param - parameters for match extensions' match functions
 *
 * @in:		input netdevice
 * @out:	output netdevice
 * @match:	struct xt_match through which this function was invoked
 * @matchinfo:	per-match data
 * @fragoff:	packet is a fragment, this is the data offset
 * @thoff:	position of transport header relative to skb->data
180
 * @hook:	hook number given packet came from
181 182
 * @family:	Actual NFPROTO_* through which the function is invoked
 * 		(helpful when match->family == NFPROTO_UNSPEC)
183
 * @hotdrop:	drop packet if we had inspection problems
184 185 186 187 188 189 190
 */
struct xt_match_param {
	const struct net_device *in, *out;
	const struct xt_match *match;
	const void *matchinfo;
	int fragoff;
	unsigned int thoff;
191
	unsigned int hooknum;
192
	u_int8_t family;
193
	bool *hotdrop;
194 195
};

196 197 198 199 200 201 202 203 204 205 206 207
/**
 * struct xt_mtchk_param - parameters for match extensions'
 * checkentry functions
 *
 * @table:	table the rule is tried to be inserted into
 * @entryinfo:	the family-specific rule data
 * 		(struct ipt_ip, ip6t_ip, ebt_entry)
 * @match:	struct xt_match through which this function was invoked
 * @matchinfo:	per-match data
 * @hook_mask:	via which hooks the new rule is reachable
 */
struct xt_mtchk_param {
208
	struct net *net;
209 210 211 212 213
	const char *table;
	const void *entryinfo;
	const struct xt_match *match;
	void *matchinfo;
	unsigned int hook_mask;
214
	u_int8_t family;
215 216
};

217 218
/* Match destructor parameters */
struct xt_mtdtor_param {
219
	struct net *net;
220 221
	const struct xt_match *match;
	void *matchinfo;
222
	u_int8_t family;
223 224
};

225 226 227 228 229 230 231 232 233 234 235 236 237
/**
 * struct xt_target_param - parameters for target extensions' target functions
 *
 * @hooknum:	hook through which this target was invoked
 * @target:	struct xt_target through which this function was invoked
 * @targinfo:	per-target data
 *
 * Other fields see above.
 */
struct xt_target_param {
	const struct net_device *in, *out;
	const struct xt_target *target;
	const void *targinfo;
238
	unsigned int hooknum;
239
	u_int8_t family;
240 241
};

242 243 244 245 246 247 248 249 250 251 252
/**
 * struct xt_tgchk_param - parameters for target extensions'
 * checkentry functions
 *
 * @entryinfo:	the family-specific rule data
 * 		(struct ipt_entry, ip6t_entry, arpt_entry, ebt_entry)
 *
 * Other fields see above.
 */
struct xt_tgchk_param {
	const char *table;
253
	const void *entryinfo;
254 255 256
	const struct xt_target *target;
	void *targinfo;
	unsigned int hook_mask;
257
	u_int8_t family;
258 259
};

260 261 262 263
/* Target destructor parameters */
struct xt_tgdtor_param {
	const struct xt_target *target;
	void *targinfo;
264
	u_int8_t family;
265 266
};

E
Eric Dumazet 已提交
267
struct xt_match {
268 269 270
	struct list_head list;

	const char name[XT_FUNCTION_MAXNAMELEN-1];
271
	u_int8_t revision;
272 273 274 275 276 277

	/* Return true or false: return FALSE and set *hotdrop = 1 to
           force immediate packet drop. */
	/* Arguments changed since 2.6.9, as this must now handle
	   non-linear skb, using skb_header_pointer and
	   skb_ip_make_writable. */
278
	bool (*match)(const struct sk_buff *skb,
279
		      const struct xt_match_param *);
280 281

	/* Called when user tries to insert an entry of this type. */
282
	bool (*checkentry)(const struct xt_mtchk_param *);
283 284

	/* Called when entry of this type deleted. */
285
	void (*destroy)(const struct xt_mtdtor_param *);
286

287
	/* Called when userspace align differs from kernel space one */
288 289
	void (*compat_from_user)(void *dst, void *src);
	int (*compat_to_user)(void __user *dst, void *src);
290

291 292
	/* Set this to THIS_MODULE if you are a module, otherwise NULL */
	struct module *me;
293

294 295 296
	/* Free to use by each match */
	unsigned long data;

297
	const char *table;
298
	unsigned int matchsize;
299
	unsigned int compatsize;
300 301
	unsigned int hooks;
	unsigned short proto;
302 303

	unsigned short family;
304 305 306
};

/* Registration hooks for targets. */
E
Eric Dumazet 已提交
307
struct xt_target {
308 309 310 311 312 313 314
	struct list_head list;

	const char name[XT_FUNCTION_MAXNAMELEN-1];

	/* Returns verdict. Argument order changed since 2.6.9, as this
	   must now handle non-linear skbs, using skb_copy_bits and
	   skb_ip_make_writable. */
315
	unsigned int (*target)(struct sk_buff *skb,
316
			       const struct xt_target_param *);
317 318 319 320 321

	/* Called when user tries to insert an entry of this type:
           hook_mask is a bitmask of hooks from which it can be
           called. */
	/* Should return true or false. */
322
	bool (*checkentry)(const struct xt_tgchk_param *);
323 324

	/* Called when entry of this type deleted. */
325
	void (*destroy)(const struct xt_tgdtor_param *);
326

327
	/* Called when userspace align differs from kernel space one */
328 329
	void (*compat_from_user)(void *dst, void *src);
	int (*compat_to_user)(void __user *dst, void *src);
330

331 332
	/* Set this to THIS_MODULE if you are a module, otherwise NULL */
	struct module *me;
333

334
	const char *table;
335
	unsigned int targetsize;
336
	unsigned int compatsize;
337 338
	unsigned int hooks;
	unsigned short proto;
339 340

	unsigned short family;
341
	u_int8_t revision;
342 343 344
};

/* Furniture shopping... */
E
Eric Dumazet 已提交
345
struct xt_table {
346 347 348 349 350 351
	struct list_head list;

	/* What hooks you will enter on */
	unsigned int valid_hooks;

	/* Man behind the curtain... */
352
	struct xt_table_info *private;
353 354 355 356

	/* Set this to THIS_MODULE if you are a module, otherwise NULL */
	struct module *me;

357
	u_int8_t af;		/* address/protocol family */
358 359 360

	/* A unique name... */
	const char name[XT_TABLE_MAXNAMELEN];
361 362 363 364 365
};

#include <linux/netfilter_ipv4.h>

/* The table itself */
E
Eric Dumazet 已提交
366
struct xt_table_info {
367 368 369 370 371 372 373 374
	/* Size per table */
	unsigned int size;
	/* Number of entries: FIXME. --RR */
	unsigned int number;
	/* Initial number of entries. Needed for module usage count */
	unsigned int initial_entries;

	/* Entry points and underflows */
375 376
	unsigned int hook_entry[NF_INET_NUMHOOKS];
	unsigned int underflow[NF_INET_NUMHOOKS];
377 378

	/* ipt_entry tables: one per CPU */
379
	/* Note : this field MUST be the last one, see XT_TABLE_INFO_SZ */
380
	void *entries[1];
381 382
};

383 384
/*
 * Byte size of a struct xt_table_info whose trailing entries[] array holds
 * nr_cpu_ids pointers: everything up to entries, plus one pointer slot per
 * possible CPU id.
 */
#define XT_TABLE_INFO_SZ					\
	(offsetof(struct xt_table_info, entries) +		\
	 nr_cpu_ids * sizeof(char *))
385 386
extern int xt_register_target(struct xt_target *target);
extern void xt_unregister_target(struct xt_target *target);
387 388 389
extern int xt_register_targets(struct xt_target *target, unsigned int n);
extern void xt_unregister_targets(struct xt_target *target, unsigned int n);

390 391
extern int xt_register_match(struct xt_match *target);
extern void xt_unregister_match(struct xt_match *target);
392 393
extern int xt_register_matches(struct xt_match *match, unsigned int n);
extern void xt_unregister_matches(struct xt_match *match, unsigned int n);
394

395
extern int xt_check_match(struct xt_mtchk_param *,
396
			  unsigned int size, u_int8_t proto, bool inv_proto);
397
extern int xt_check_target(struct xt_tgchk_param *,
398
			   unsigned int size, u_int8_t proto, bool inv_proto);
399

400
extern struct xt_table *xt_register_table(struct net *net,
401
					  const struct xt_table *table,
402 403
					  struct xt_table_info *bootstrap,
					  struct xt_table_info *newinfo);
404 405 406 407 408 409 410
extern void *xt_unregister_table(struct xt_table *table);

extern struct xt_table_info *xt_replace_table(struct xt_table *table,
					      unsigned int num_counters,
					      struct xt_table_info *newinfo,
					      int *error);

411 412 413
extern struct xt_match *xt_find_match(u8 af, const char *name, u8 revision);
extern struct xt_target *xt_find_target(u8 af, const char *name, u8 revision);
extern struct xt_target *xt_request_find_target(u8 af, const char *name,
414
						u8 revision);
415 416
extern int xt_find_revision(u8 af, const char *name, u8 revision,
			    int target, int *err);
417

418
extern struct xt_table *xt_find_table_lock(struct net *net, u_int8_t af,
419
					   const char *name);
420 421
extern void xt_table_unlock(struct xt_table *t);

422 423
extern int xt_proto_init(struct net *net, u_int8_t af);
extern void xt_proto_fini(struct net *net, u_int8_t af);
424 425 426

extern struct xt_table_info *xt_alloc_table_info(unsigned int size);
extern void xt_free_table_info(struct xt_table_info *info);
427 428 429 430 431 432 433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465 466 467

/*
 * Per-CPU spinlock associated with per-cpu table entries, and
 * with a counter for the "reading" side that allows a recursive
 * reader to avoid taking the lock and deadlocking.
 *
 * "reading" is used by ip/arp/ip6 tables rule processing which runs per-cpu.
 * It needs to ensure that the rules are not being changed while the packet
 * is being processed. In some cases, the read lock will be acquired
 * twice on the same CPU; this is okay because of the count.
 *
 * "writing" is used when reading counters.
 *  During replace any readers that are using the old tables have to complete
 *  before freeing the old table. This is handled by the write locking
 *  necessary for reading the counters.
 */
struct xt_info_lock {
	/* Taken by the outermost reader on this CPU and by writers. */
	spinlock_t lock;
	/* Read-side nesting depth on this CPU; the lock is held while non-zero. */
	unsigned char readers;
};
/* One xt_info_lock instance per CPU. */
DECLARE_PER_CPU(struct xt_info_lock, xt_info_locks);

/*
 * Note: we need to ensure that preemption is disabled before acquiring
 * the per-cpu-variable, so we do it as a two step process rather than
 * using "spin_lock_bh()".
 *
 * We _also_ need to disable bottom half processing before updating our
 * nesting count, to make sure that the only kind of re-entrancy is this
 * code being called by itself: since the count+lock is not an atomic
 * operation, we can allow no races.
 *
 * _Only_ that special combination of being per-cpu and never getting
 * re-entered asynchronously means that the count is safe.
 */
static inline void xt_info_rdlock_bh(void)
{
	struct xt_info_lock *lock;

	local_bh_disable();
	lock = &__get_cpu_var(xt_info_locks);
468
	if (likely(!lock->readers++))
469 470 471 472 473 474 475
		spin_lock(&lock->lock);
}

static inline void xt_info_rdunlock_bh(void)
{
	struct xt_info_lock *lock = &__get_cpu_var(xt_info_locks);

476
	if (likely(!--lock->readers))
477 478 479 480 481 482 483 484 485 486 487 488 489 490 491 492 493 494
		spin_unlock(&lock->lock);
	local_bh_enable();
}

/*
 * The "writer" side needs to get exclusive access to the lock,
 * regardless of readers.  This must be called with bottom half
 * processing (and thus also preemption) disabled.
 */
static inline void xt_info_wrlock(unsigned int cpu)
{
	spin_lock(&per_cpu(xt_info_locks, cpu).lock);
}

static inline void xt_info_wrunlock(unsigned int cpu)
{
	spin_unlock(&per_cpu(xt_info_locks, cpu).lock);
}
495

496 497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515 516 517 518
/*
 * Masked comparison of two interface-name buffers, one unsigned long at a
 * time.  Returns 0 when every bit selected by _mask is equal in _a and _b
 * over the words that cover IFNAMSIZ bytes, non-zero otherwise.
 *
 * The buffers are read through unsigned long pointers, so they are assumed
 * to be suitably aligned and at least IFNAMSIZ bytes long.
 *
 * This helper is performance critical and must be inlined
 */
static inline unsigned long ifname_compare_aligned(const char *_a,
						   const char *_b,
						   const char *_mask)
{
	const unsigned long *lhs = (const unsigned long *)_a;
	const unsigned long *rhs = (const unsigned long *)_b;
	const unsigned long *msk = (const unsigned long *)_mask;
	unsigned long diff = (lhs[0] ^ rhs[0]) & msk[0];

	/* The word tests below are compile-time constants; at most 4 words. */
	BUILD_BUG_ON(IFNAMSIZ > 4 * sizeof(unsigned long));

	if (IFNAMSIZ > sizeof(unsigned long))
		diff |= (lhs[1] ^ rhs[1]) & msk[1];
	if (IFNAMSIZ > 2 * sizeof(unsigned long))
		diff |= (lhs[2] ^ rhs[2]) & msk[2];
	if (IFNAMSIZ > 3 * sizeof(unsigned long))
		diff |= (lhs[3] ^ rhs[3]) & msk[3];

	return diff;
}

519 520 521
#ifdef CONFIG_COMPAT
#include <net/compat.h>

E
Eric Dumazet 已提交
522
struct compat_xt_entry_match {
523 524 525 526 527 528
	union {
		struct {
			u_int16_t match_size;
			char name[XT_FUNCTION_MAXNAMELEN - 1];
			u_int8_t revision;
		} user;
529 530 531 532
		struct {
			u_int16_t match_size;
			compat_uptr_t match;
		} kernel;
533 534 535 536 537
		u_int16_t match_size;
	} u;
	unsigned char data[0];
};

E
Eric Dumazet 已提交
538
struct compat_xt_entry_target {
539 540 541 542 543 544
	union {
		struct {
			u_int16_t target_size;
			char name[XT_FUNCTION_MAXNAMELEN - 1];
			u_int8_t revision;
		} user;
545 546 547 548
		struct {
			u_int16_t target_size;
			compat_uptr_t target;
		} kernel;
549 550 551 552 553 554 555 556 557
		u_int16_t target_size;
	} u;
	unsigned char data[0];
};

/* FIXME: this works only on 32 bit tasks
 * need to change whole approach in order to calculate align as function of
 * current task alignment */

E
Eric Dumazet 已提交
558
struct compat_xt_counters {
559
#if defined(CONFIG_X86_64) || defined(CONFIG_IA64)
560
	u_int32_t cnt[4];
561 562 563
#else
	u_int64_t cnt[2];
#endif
564 565
};

E
Eric Dumazet 已提交
566
struct compat_xt_counters_info {
567 568 569 570 571 572 573 574
	char name[XT_TABLE_MAXNAMELEN];
	compat_uint_t num_counters;
	struct compat_xt_counters counters[0];
};

/*
 * Round s up to the next multiple of the alignment of
 * struct compat_xt_counters.  s is evaluated exactly once.
 */
#define COMPAT_XT_ALIGN(s)						\
	(((s) + (__alignof__(struct compat_xt_counters) - 1)) &	\
	 ~(__alignof__(struct compat_xt_counters) - 1))

575 576
extern void xt_compat_lock(u_int8_t af);
extern void xt_compat_unlock(u_int8_t af);
577

578 579 580
extern int xt_compat_add_offset(u_int8_t af, unsigned int offset, short delta);
extern void xt_compat_flush_offsets(u_int8_t af);
extern short xt_compat_calc_jump(u_int8_t af, unsigned int offset);
581

582
extern int xt_compat_match_offset(const struct xt_match *match);
583
extern int xt_compat_match_from_user(struct xt_entry_match *m,
584
				     void **dstptr, unsigned int *size);
585
extern int xt_compat_match_to_user(struct xt_entry_match *m,
586
				   void __user **dstptr, unsigned int *size);
587

588
extern int xt_compat_target_offset(const struct xt_target *target);
589
extern void xt_compat_target_from_user(struct xt_entry_target *t,
590
				       void **dstptr, unsigned int *size);
591
extern int xt_compat_target_to_user(struct xt_entry_target *t,
592
				    void __user **dstptr, unsigned int *size);
593 594

#endif /* CONFIG_COMPAT */
595 596 597
#endif /* __KERNEL__ */

#endif /* _X_TABLES_H */