cls_u32.c 27.7 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33
/*
 * net/sched/cls_u32.c	Ugly (or Universal) 32bit key Packet Classifier.
 *
 *		This program is free software; you can redistribute it and/or
 *		modify it under the terms of the GNU General Public License
 *		as published by the Free Software Foundation; either version
 *		2 of the License, or (at your option) any later version.
 *
 * Authors:	Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
 *
 *	The filters are packed to hash tables of key nodes
 *	with a set of 32bit key/mask pairs at every node.
 *	Nodes reference next level hash tables etc.
 *
 *	This scheme is the best universal classifier I managed to
 *	invent; it is not super-fast, but it is not slow (provided you
 *	program it correctly), and general enough.  And its relative
 *	speed grows as the number of rules becomes larger.
 *
 *	It seems that it represents the best middle point between
 *	speed and manageability both by human and by machine.
 *
 *	It is especially useful for link sharing combined with QoS;
 *	pure RSVP doesn't need such a general approach and can use
 *	much simpler (and faster) schemes, sort of cls_rsvp.c.
 *
 *	JHS: We should remove the CONFIG_NET_CLS_IND from here
 *	eventually when the meta match extension is made available
 *
 *	nfmark match added by Catalin(ux aka Dino) BOIE <catab at umbrella.ro>
 */

#include <linux/module.h>
34
#include <linux/slab.h>
L
Linus Torvalds 已提交
35 36 37 38
#include <linux/types.h>
#include <linux/kernel.h>
#include <linux/string.h>
#include <linux/errno.h>
39
#include <linux/percpu.h>
L
Linus Torvalds 已提交
40 41
#include <linux/rtnetlink.h>
#include <linux/skbuff.h>
42
#include <linux/bitmap.h>
43
#include <net/netlink.h>
L
Linus Torvalds 已提交
44 45
#include <net/act_api.h>
#include <net/pkt_cls.h>
46
#include <linux/netdevice.h>
L
Linus Torvalds 已提交
47

E
Eric Dumazet 已提交
48
struct tc_u_knode {
49
	struct tc_u_knode __rcu	*next;
L
Linus Torvalds 已提交
50
	u32			handle;
51
	struct tc_u_hnode __rcu	*ht_up;
L
Linus Torvalds 已提交
52 53
	struct tcf_exts		exts;
#ifdef CONFIG_NET_CLS_IND
54
	int			ifindex;
L
Linus Torvalds 已提交
55 56 57
#endif
	u8			fshift;
	struct tcf_result	res;
58
	struct tc_u_hnode __rcu	*ht_down;
L
Linus Torvalds 已提交
59
#ifdef CONFIG_CLS_U32_PERF
60
	struct tc_u32_pcnt __percpu *pf;
L
Linus Torvalds 已提交
61
#endif
62
	u32			flags;
L
Linus Torvalds 已提交
63
#ifdef CONFIG_CLS_U32_MARK
64 65 66
	u32			val;
	u32			mask;
	u32 __percpu		*pcpu_success;
L
Linus Torvalds 已提交
67
#endif
68 69
	struct tcf_proto	*tp;
	struct rcu_head		rcu;
70 71 72 73
	/* The 'sel' field MUST be the last field in structure to allow for
	 * tc_u32_keys allocated at end of structure.
	 */
	struct tc_u32_sel	sel;
L
Linus Torvalds 已提交
74 75
};

E
Eric Dumazet 已提交
76
struct tc_u_hnode {
77
	struct tc_u_hnode __rcu	*next;
L
Linus Torvalds 已提交
78 79 80 81
	u32			handle;
	u32			prio;
	struct tc_u_common	*tp_c;
	int			refcnt;
E
Eric Dumazet 已提交
82
	unsigned int		divisor;
83
	struct rcu_head		rcu;
84 85 86 87
	/* The 'ht' field MUST be the last field in structure to allow for
	 * more entries allocated at end of structure.
	 */
	struct tc_u_knode __rcu	*ht[1];
L
Linus Torvalds 已提交
88 89
};

E
Eric Dumazet 已提交
90
struct tc_u_common {
91
	struct tc_u_hnode __rcu	*hlist;
L
Linus Torvalds 已提交
92 93 94
	struct Qdisc		*q;
	int			refcnt;
	u32			hgenerator;
95
	struct rcu_head		rcu;
L
Linus Torvalds 已提交
96 97
};

E
Eric Dumazet 已提交
98 99 100
static inline unsigned int u32_hash_fold(__be32 key,
					 const struct tc_u32_sel *sel,
					 u8 fshift)
L
Linus Torvalds 已提交
101
{
E
Eric Dumazet 已提交
102
	unsigned int h = ntohl(key & sel->hmask) >> fshift;
L
Linus Torvalds 已提交
103 104 105 106

	return h;
}

J
Jamal Hadi Salim 已提交
107 108
static int u32_classify(struct sk_buff *skb, const struct tcf_proto *tp,
			struct tcf_result *res)
L
Linus Torvalds 已提交
109 110 111
{
	struct {
		struct tc_u_knode *knode;
112
		unsigned int	  off;
L
Linus Torvalds 已提交
113 114
	} stack[TC_U32_MAXDEPTH];

115
	struct tc_u_hnode *ht = rcu_dereference_bh(tp->root);
116
	unsigned int off = skb_network_offset(skb);
L
Linus Torvalds 已提交
117 118 119 120 121 122 123 124 125 126
	struct tc_u_knode *n;
	int sdepth = 0;
	int off2 = 0;
	int sel = 0;
#ifdef CONFIG_CLS_U32_PERF
	int j;
#endif
	int i, r;

next_ht:
127
	n = rcu_dereference_bh(ht->ht[sel]);
L
Linus Torvalds 已提交
128 129 130 131 132 133

next_knode:
	if (n) {
		struct tc_u32_key *key = n->sel.keys;

#ifdef CONFIG_CLS_U32_PERF
134
		__this_cpu_inc(n->pf->rcnt);
L
Linus Torvalds 已提交
135 136 137
		j = 0;
#endif

138 139 140 141 142
		if (tc_skip_sw(n->flags)) {
			n = rcu_dereference_bh(n->next);
			goto next_knode;
		}

L
Linus Torvalds 已提交
143
#ifdef CONFIG_CLS_U32_MARK
144
		if ((skb->mark & n->mask) != n->val) {
145
			n = rcu_dereference_bh(n->next);
L
Linus Torvalds 已提交
146 147
			goto next_knode;
		} else {
148
			__this_cpu_inc(*n->pcpu_success);
L
Linus Torvalds 已提交
149 150 151
		}
#endif

E
Eric Dumazet 已提交
152
		for (i = n->sel.nkeys; i > 0; i--, key++) {
S
stephen hemminger 已提交
153
			int toff = off + key->off + (off2 & key->offmask);
S
stephen hemminger 已提交
154
			__be32 *data, hdata;
155

D
Dan Carpenter 已提交
156
			if (skb_headroom(skb) + toff > INT_MAX)
S
stephen hemminger 已提交
157 158
				goto out;

S
stephen hemminger 已提交
159
			data = skb_header_pointer(skb, toff, 4, &hdata);
160 161 162
			if (!data)
				goto out;
			if ((*data ^ key->val) & key->mask) {
163
				n = rcu_dereference_bh(n->next);
L
Linus Torvalds 已提交
164 165 166
				goto next_knode;
			}
#ifdef CONFIG_CLS_U32_PERF
167
			__this_cpu_inc(n->pf->kcnts[j]);
L
Linus Torvalds 已提交
168 169 170
			j++;
#endif
		}
171 172 173

		ht = rcu_dereference_bh(n->ht_down);
		if (!ht) {
L
Linus Torvalds 已提交
174
check_terminal:
E
Eric Dumazet 已提交
175
			if (n->sel.flags & TC_U32_TERMINAL) {
L
Linus Torvalds 已提交
176 177 178

				*res = n->res;
#ifdef CONFIG_NET_CLS_IND
179
				if (!tcf_match_indev(skb, n->ifindex)) {
180
					n = rcu_dereference_bh(n->next);
L
Linus Torvalds 已提交
181 182 183 184
					goto next_knode;
				}
#endif
#ifdef CONFIG_CLS_U32_PERF
185
				__this_cpu_inc(n->pf->rhit);
L
Linus Torvalds 已提交
186 187 188
#endif
				r = tcf_exts_exec(skb, &n->exts, res);
				if (r < 0) {
189
					n = rcu_dereference_bh(n->next);
L
Linus Torvalds 已提交
190 191 192 193 194
					goto next_knode;
				}

				return r;
			}
195
			n = rcu_dereference_bh(n->next);
L
Linus Torvalds 已提交
196 197 198 199 200 201 202
			goto next_knode;
		}

		/* PUSH */
		if (sdepth >= TC_U32_MAXDEPTH)
			goto deadloop;
		stack[sdepth].knode = n;
203
		stack[sdepth].off = off;
L
Linus Torvalds 已提交
204 205
		sdepth++;

206
		ht = rcu_dereference_bh(n->ht_down);
L
Linus Torvalds 已提交
207
		sel = 0;
208
		if (ht->divisor) {
S
stephen hemminger 已提交
209
			__be32 *data, hdata;
210 211

			data = skb_header_pointer(skb, off + n->sel.hoff, 4,
S
stephen hemminger 已提交
212
						  &hdata);
213 214 215 216 217
			if (!data)
				goto out;
			sel = ht->divisor & u32_hash_fold(*data, &n->sel,
							  n->fshift);
		}
E
Eric Dumazet 已提交
218
		if (!(n->sel.flags & (TC_U32_VAROFFSET | TC_U32_OFFSET | TC_U32_EAT)))
L
Linus Torvalds 已提交
219 220
			goto next_ht;

E
Eric Dumazet 已提交
221
		if (n->sel.flags & (TC_U32_OFFSET | TC_U32_VAROFFSET)) {
L
Linus Torvalds 已提交
222
			off2 = n->sel.off + 3;
223
			if (n->sel.flags & TC_U32_VAROFFSET) {
S
stephen hemminger 已提交
224
				__be16 *data, hdata;
225 226 227

				data = skb_header_pointer(skb,
							  off + n->sel.offoff,
S
stephen hemminger 已提交
228
							  2, &hdata);
229 230 231 232 233
				if (!data)
					goto out;
				off2 += ntohs(n->sel.offmask & *data) >>
					n->sel.offshift;
			}
L
Linus Torvalds 已提交
234 235
			off2 &= ~3;
		}
E
Eric Dumazet 已提交
236
		if (n->sel.flags & TC_U32_EAT) {
237
			off += off2;
L
Linus Torvalds 已提交
238 239 240
			off2 = 0;
		}

241
		if (off < skb->len)
L
Linus Torvalds 已提交
242 243 244 245 246 247
			goto next_ht;
	}

	/* POP */
	if (sdepth--) {
		n = stack[sdepth].knode;
248
		ht = rcu_dereference_bh(n->ht_up);
249
		off = stack[sdepth].off;
L
Linus Torvalds 已提交
250 251
		goto check_terminal;
	}
252
out:
L
Linus Torvalds 已提交
253 254 255
	return -1;

deadloop:
256
	net_warn_ratelimited("cls_u32: dead loop\n");
L
Linus Torvalds 已提交
257 258 259
	return -1;
}

J
Jamal Hadi Salim 已提交
260
static struct tc_u_hnode *u32_lookup_ht(struct tc_u_common *tp_c, u32 handle)
L
Linus Torvalds 已提交
261 262 263
{
	struct tc_u_hnode *ht;

264 265 266
	for (ht = rtnl_dereference(tp_c->hlist);
	     ht;
	     ht = rtnl_dereference(ht->next))
L
Linus Torvalds 已提交
267 268 269 270 271 272
		if (ht->handle == handle)
			break;

	return ht;
}

J
Jamal Hadi Salim 已提交
273
static struct tc_u_knode *u32_lookup_key(struct tc_u_hnode *ht, u32 handle)
L
Linus Torvalds 已提交
274
{
E
Eric Dumazet 已提交
275
	unsigned int sel;
L
Linus Torvalds 已提交
276 277 278 279 280 281
	struct tc_u_knode *n = NULL;

	sel = TC_U32_HASH(handle);
	if (sel > ht->divisor)
		goto out;

282 283 284
	for (n = rtnl_dereference(ht->ht[sel]);
	     n;
	     n = rtnl_dereference(n->next))
L
Linus Torvalds 已提交
285 286 287 288 289 290 291 292 293 294 295 296 297
		if (n->handle == handle)
			break;
out:
	return n;
}


static unsigned long u32_get(struct tcf_proto *tp, u32 handle)
{
	struct tc_u_hnode *ht;
	struct tc_u_common *tp_c = tp->data;

	if (TC_U32_HTID(handle) == TC_U32_ROOT)
298
		ht = rtnl_dereference(tp->root);
L
Linus Torvalds 已提交
299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314
	else
		ht = u32_lookup_ht(tp_c, TC_U32_HTID(handle));

	if (!ht)
		return 0;

	if (TC_U32_KEY(handle) == 0)
		return (unsigned long)ht;

	return (unsigned long)u32_lookup_key(ht, handle);
}

static u32 gen_new_htid(struct tc_u_common *tp_c)
{
	int i = 0x800;

315 316 317
	/* hgenerator only used inside rtnl lock it is safe to increment
	 * without read _copy_ update semantics
	 */
L
Linus Torvalds 已提交
318 319 320
	do {
		if (++tp_c->hgenerator == 0x7FF)
			tp_c->hgenerator = 1;
E
Eric Dumazet 已提交
321
	} while (--i > 0 && u32_lookup_ht(tp_c, (tp_c->hgenerator|0x800)<<20));
L
Linus Torvalds 已提交
322 323 324 325 326 327 328 329 330

	return i > 0 ? (tp_c->hgenerator|0x800)<<20 : 0;
}

static int u32_init(struct tcf_proto *tp)
{
	struct tc_u_hnode *root_ht;
	struct tc_u_common *tp_c;

331
	tp_c = tp->q->u32_node;
L
Linus Torvalds 已提交
332

333
	root_ht = kzalloc(sizeof(*root_ht), GFP_KERNEL);
L
Linus Torvalds 已提交
334 335 336 337 338 339 340 341
	if (root_ht == NULL)
		return -ENOBUFS;

	root_ht->refcnt++;
	root_ht->handle = tp_c ? gen_new_htid(tp_c) : 0x80000000;
	root_ht->prio = tp->prio;

	if (tp_c == NULL) {
342
		tp_c = kzalloc(sizeof(*tp_c), GFP_KERNEL);
L
Linus Torvalds 已提交
343 344 345 346 347
		if (tp_c == NULL) {
			kfree(root_ht);
			return -ENOBUFS;
		}
		tp_c->q = tp->q;
348
		tp->q->u32_node = tp_c;
L
Linus Torvalds 已提交
349 350 351
	}

	tp_c->refcnt++;
352 353
	RCU_INIT_POINTER(root_ht->next, tp_c->hlist);
	rcu_assign_pointer(tp_c->hlist, root_ht);
L
Linus Torvalds 已提交
354 355
	root_ht->tp_c = tp_c;

356
	rcu_assign_pointer(tp->root, root_ht);
L
Linus Torvalds 已提交
357 358 359 360
	tp->data = tp_c;
	return 0;
}

J
Jamal Hadi Salim 已提交
361
static int u32_destroy_key(struct tcf_proto *tp, struct tc_u_knode *n,
362
			   bool free_pf)
L
Linus Torvalds 已提交
363
{
364
	tcf_exts_destroy(&n->exts);
L
Linus Torvalds 已提交
365 366 367
	if (n->ht_down)
		n->ht_down->refcnt--;
#ifdef CONFIG_CLS_U32_PERF
368 369
	if (free_pf)
		free_percpu(n->pf);
370 371
#endif
#ifdef CONFIG_CLS_U32_MARK
372 373
	if (free_pf)
		free_percpu(n->pcpu_success);
L
Linus Torvalds 已提交
374 375 376 377 378
#endif
	kfree(n);
	return 0;
}

379 380 381 382 383 384 385 386
/* u32_delete_key_rcu should be called when free'ing a copied
 * version of a tc_u_knode obtained from u32_init_knode(). When
 * copies are obtained from u32_init_knode() the statistics are
 * shared between the old and new copies to allow readers to
 * continue to update the statistics during the copy. To support
 * this the u32_delete_key_rcu variant does not free the percpu
 * statistics.
 */
387 388 389 390
static void u32_delete_key_rcu(struct rcu_head *rcu)
{
	struct tc_u_knode *key = container_of(rcu, struct tc_u_knode, rcu);

391 392 393 394 395 396 397 398 399 400 401 402 403 404 405
	u32_destroy_key(key->tp, key, false);
}

/* u32_delete_key_freepf_rcu is the rcu callback variant
 * that free's the entire structure including the statistics
 * percpu variables. Only use this if the key is not a copy
 * returned by u32_init_knode(). See u32_delete_key_rcu()
 * for the variant that should be used with keys return from
 * u32_init_knode()
 */
static void u32_delete_key_freepf_rcu(struct rcu_head *rcu)
{
	struct tc_u_knode *key = container_of(rcu, struct tc_u_knode, rcu);

	u32_destroy_key(key->tp, key, true);
406 407
}

408
static int u32_delete_key(struct tcf_proto *tp, struct tc_u_knode *key)
L
Linus Torvalds 已提交
409
{
410 411
	struct tc_u_knode __rcu **kp;
	struct tc_u_knode *pkp;
412
	struct tc_u_hnode *ht = rtnl_dereference(key->ht_up);
L
Linus Torvalds 已提交
413 414

	if (ht) {
415 416 417 418 419
		kp = &ht->ht[TC_U32_HASH(key->handle)];
		for (pkp = rtnl_dereference(*kp); pkp;
		     kp = &pkp->next, pkp = rtnl_dereference(*kp)) {
			if (pkp == key) {
				RCU_INIT_POINTER(*kp, key->next);
L
Linus Torvalds 已提交
420

421
				tcf_unbind_filter(tp, &key->res);
422
				call_rcu(&key->rcu, u32_delete_key_freepf_rcu);
L
Linus Torvalds 已提交
423 424 425 426
				return 0;
			}
		}
	}
427
	WARN_ON(1);
L
Linus Torvalds 已提交
428 429 430
	return 0;
}

431 432 433 434 435 436 437 438 439
static void u32_remove_hw_knode(struct tcf_proto *tp, u32 handle)
{
	struct net_device *dev = tp->q->dev_queue->dev;
	struct tc_cls_u32_offload u32_offload = {0};
	struct tc_to_netdev offload;

	offload.type = TC_SETUP_CLSU32;
	offload.cls_u32 = &u32_offload;

440
	if (tc_should_offload(dev, tp, 0)) {
441 442 443 444 445 446 447
		offload.cls_u32->command = TC_CLSU32_DELETE_KNODE;
		offload.cls_u32->knode.handle = handle;
		dev->netdev_ops->ndo_setup_tc(dev, tp->q->handle,
					      tp->protocol, &offload);
	}
}

J
Jamal Hadi Salim 已提交
448 449
static int u32_replace_hw_hnode(struct tcf_proto *tp, struct tc_u_hnode *h,
				u32 flags)
450 451 452 453
{
	struct net_device *dev = tp->q->dev_queue->dev;
	struct tc_cls_u32_offload u32_offload = {0};
	struct tc_to_netdev offload;
454
	int err;
455

456
	if (!tc_should_offload(dev, tp, flags))
457 458
		return tc_skip_sw(flags) ? -EINVAL : 0;

459 460 461
	offload.type = TC_SETUP_CLSU32;
	offload.cls_u32 = &u32_offload;

462 463 464 465
	offload.cls_u32->command = TC_CLSU32_NEW_HNODE;
	offload.cls_u32->hnode.divisor = h->divisor;
	offload.cls_u32->hnode.handle = h->handle;
	offload.cls_u32->hnode.prio = h->prio;
466

467 468 469 470
	err = dev->netdev_ops->ndo_setup_tc(dev, tp->q->handle,
					    tp->protocol, &offload);
	if (tc_skip_sw(flags))
		return err;
471 472

	return 0;
473 474 475 476 477 478 479 480 481 482 483
}

static void u32_clear_hw_hnode(struct tcf_proto *tp, struct tc_u_hnode *h)
{
	struct net_device *dev = tp->q->dev_queue->dev;
	struct tc_cls_u32_offload u32_offload = {0};
	struct tc_to_netdev offload;

	offload.type = TC_SETUP_CLSU32;
	offload.cls_u32 = &u32_offload;

484
	if (tc_should_offload(dev, tp, 0)) {
485 486 487 488 489 490 491 492 493 494
		offload.cls_u32->command = TC_CLSU32_DELETE_HNODE;
		offload.cls_u32->hnode.divisor = h->divisor;
		offload.cls_u32->hnode.handle = h->handle;
		offload.cls_u32->hnode.prio = h->prio;

		dev->netdev_ops->ndo_setup_tc(dev, tp->q->handle,
					      tp->protocol, &offload);
	}
}

J
Jamal Hadi Salim 已提交
495 496
static int u32_replace_hw_knode(struct tcf_proto *tp, struct tc_u_knode *n,
				u32 flags)
497 498 499 500
{
	struct net_device *dev = tp->q->dev_queue->dev;
	struct tc_cls_u32_offload u32_offload = {0};
	struct tc_to_netdev offload;
501
	int err;
502 503 504 505

	offload.type = TC_SETUP_CLSU32;
	offload.cls_u32 = &u32_offload;

506 507 508 509 510 511
	if (!tc_should_offload(dev, tp, flags))
		return tc_skip_sw(flags) ? -EINVAL : 0;

	offload.cls_u32->command = TC_CLSU32_REPLACE_KNODE;
	offload.cls_u32->knode.handle = n->handle;
	offload.cls_u32->knode.fshift = n->fshift;
512
#ifdef CONFIG_CLS_U32_MARK
513 514
	offload.cls_u32->knode.val = n->val;
	offload.cls_u32->knode.mask = n->mask;
515
#else
516 517
	offload.cls_u32->knode.val = 0;
	offload.cls_u32->knode.mask = 0;
518
#endif
519 520 521 522 523 524 525 526 527
	offload.cls_u32->knode.sel = &n->sel;
	offload.cls_u32->knode.exts = &n->exts;
	if (n->ht_down)
		offload.cls_u32->knode.link_handle = n->ht_down->handle;

	err = dev->netdev_ops->ndo_setup_tc(dev, tp->q->handle,
					    tp->protocol, &offload);
	if (tc_skip_sw(flags))
		return err;
528 529

	return 0;
530 531
}

532
static void u32_clear_hnode(struct tcf_proto *tp, struct tc_u_hnode *ht)
L
Linus Torvalds 已提交
533 534
{
	struct tc_u_knode *n;
E
Eric Dumazet 已提交
535
	unsigned int h;
L
Linus Torvalds 已提交
536

E
Eric Dumazet 已提交
537
	for (h = 0; h <= ht->divisor; h++) {
538 539 540
		while ((n = rtnl_dereference(ht->ht[h])) != NULL) {
			RCU_INIT_POINTER(ht->ht[h],
					 rtnl_dereference(n->next));
541
			tcf_unbind_filter(tp, &n->res);
542
			u32_remove_hw_knode(tp, n->handle);
543
			call_rcu(&n->rcu, u32_delete_key_freepf_rcu);
L
Linus Torvalds 已提交
544 545 546 547 548 549 550
		}
	}
}

static int u32_destroy_hnode(struct tcf_proto *tp, struct tc_u_hnode *ht)
{
	struct tc_u_common *tp_c = tp->data;
551 552
	struct tc_u_hnode __rcu **hn;
	struct tc_u_hnode *phn;
L
Linus Torvalds 已提交
553

554
	WARN_ON(ht->refcnt);
L
Linus Torvalds 已提交
555

556
	u32_clear_hnode(tp, ht);
L
Linus Torvalds 已提交
557

558 559 560 561 562
	hn = &tp_c->hlist;
	for (phn = rtnl_dereference(*hn);
	     phn;
	     hn = &phn->next, phn = rtnl_dereference(*hn)) {
		if (phn == ht) {
563
			u32_clear_hw_hnode(tp, ht);
564 565
			RCU_INIT_POINTER(*hn, ht->next);
			kfree_rcu(ht, rcu);
L
Linus Torvalds 已提交
566 567 568 569 570 571 572
			return 0;
		}
	}

	return -ENOENT;
}

573 574 575 576 577 578 579 580 581 582 583 584
static bool ht_empty(struct tc_u_hnode *ht)
{
	unsigned int h;

	for (h = 0; h <= ht->divisor; h++)
		if (rcu_access_pointer(ht->ht[h]))
			return false;

	return true;
}

static bool u32_destroy(struct tcf_proto *tp, bool force)
L
Linus Torvalds 已提交
585 586
{
	struct tc_u_common *tp_c = tp->data;
587
	struct tc_u_hnode *root_ht = rtnl_dereference(tp->root);
L
Linus Torvalds 已提交
588

589
	WARN_ON(root_ht == NULL);
L
Linus Torvalds 已提交
590

591 592 593 594 595 596 597 598 599
	if (!force) {
		if (root_ht) {
			if (root_ht->refcnt > 1)
				return false;
			if (root_ht->refcnt == 1) {
				if (!ht_empty(root_ht))
					return false;
			}
		}
600 601 602 603 604 605 606 607 608 609 610 611 612

		if (tp_c->refcnt > 1)
			return false;

		if (tp_c->refcnt == 1) {
			struct tc_u_hnode *ht;

			for (ht = rtnl_dereference(tp_c->hlist);
			     ht;
			     ht = rtnl_dereference(ht->next))
				if (!ht_empty(ht))
					return false;
		}
613 614
	}

L
Linus Torvalds 已提交
615 616 617 618 619 620
	if (root_ht && --root_ht->refcnt == 0)
		u32_destroy_hnode(tp, root_ht);

	if (--tp_c->refcnt == 0) {
		struct tc_u_hnode *ht;

621
		tp->q->u32_node = NULL;
L
Linus Torvalds 已提交
622

623 624 625
		for (ht = rtnl_dereference(tp_c->hlist);
		     ht;
		     ht = rtnl_dereference(ht->next)) {
626
			ht->refcnt--;
627
			u32_clear_hnode(tp, ht);
628
		}
L
Linus Torvalds 已提交
629

630 631 632
		while ((ht = rtnl_dereference(tp_c->hlist)) != NULL) {
			RCU_INIT_POINTER(tp_c->hlist, ht->next);
			kfree_rcu(ht, rcu);
633
		}
L
Linus Torvalds 已提交
634 635 636 637 638

		kfree(tp_c);
	}

	tp->data = NULL;
639
	return true;
L
Linus Torvalds 已提交
640 641 642 643
}

static int u32_delete(struct tcf_proto *tp, unsigned long arg)
{
E
Eric Dumazet 已提交
644
	struct tc_u_hnode *ht = (struct tc_u_hnode *)arg;
645
	struct tc_u_hnode *root_ht = rtnl_dereference(tp->root);
L
Linus Torvalds 已提交
646 647 648 649

	if (ht == NULL)
		return 0;

650 651
	if (TC_U32_KEY(ht->handle)) {
		u32_remove_hw_knode(tp, ht->handle);
E
Eric Dumazet 已提交
652
		return u32_delete_key(tp, (struct tc_u_knode *)ht);
653
	}
L
Linus Torvalds 已提交
654

655
	if (root_ht == ht)
L
Linus Torvalds 已提交
656 657
		return -EINVAL;

658 659
	if (ht->refcnt == 1) {
		ht->refcnt--;
L
Linus Torvalds 已提交
660
		u32_destroy_hnode(tp, ht);
661 662 663
	} else {
		return -EBUSY;
	}
L
Linus Torvalds 已提交
664 665 666 667

	return 0;
}

668
#define NR_U32_NODE (1<<12)
L
Linus Torvalds 已提交
669 670 671
static u32 gen_new_kid(struct tc_u_hnode *ht, u32 handle)
{
	struct tc_u_knode *n;
672 673 674 675 676
	unsigned long i;
	unsigned long *bitmap = kzalloc(BITS_TO_LONGS(NR_U32_NODE) * sizeof(unsigned long),
					GFP_KERNEL);
	if (!bitmap)
		return handle | 0xFFF;
L
Linus Torvalds 已提交
677

678 679 680
	for (n = rtnl_dereference(ht->ht[TC_U32_HASH(handle)]);
	     n;
	     n = rtnl_dereference(n->next))
681
		set_bit(TC_U32_NODE(n->handle), bitmap);
L
Linus Torvalds 已提交
682

683 684 685 686 687 688
	i = find_next_zero_bit(bitmap, NR_U32_NODE, 0x800);
	if (i >= NR_U32_NODE)
		i = find_next_zero_bit(bitmap, NR_U32_NODE, 1);

	kfree(bitmap);
	return handle | (i >= NR_U32_NODE ? 0xFFF : i);
L
Linus Torvalds 已提交
689 690
}

691 692 693 694 695 696 697 698
static const struct nla_policy u32_policy[TCA_U32_MAX + 1] = {
	[TCA_U32_CLASSID]	= { .type = NLA_U32 },
	[TCA_U32_HASH]		= { .type = NLA_U32 },
	[TCA_U32_LINK]		= { .type = NLA_U32 },
	[TCA_U32_DIVISOR]	= { .type = NLA_U32 },
	[TCA_U32_SEL]		= { .len = sizeof(struct tc_u32_sel) },
	[TCA_U32_INDEV]		= { .type = NLA_STRING, .len = IFNAMSIZ },
	[TCA_U32_MARK]		= { .len = sizeof(struct tc_u32_mark) },
699
	[TCA_U32_FLAGS]		= { .type = NLA_U32 },
700 701
};

702 703
static int u32_set_parms(struct net *net, struct tcf_proto *tp,
			 unsigned long base, struct tc_u_hnode *ht,
704
			 struct tc_u_knode *n, struct nlattr **tb,
705
			 struct nlattr *est, bool ovr)
L
Linus Torvalds 已提交
706 707
{
	struct tcf_exts e;
708
	int err;
L
Linus Torvalds 已提交
709

710
	err = tcf_exts_init(&e, TCA_U32_ACT, TCA_U32_POLICE);
L
Linus Torvalds 已提交
711 712
	if (err < 0)
		return err;
713 714 715
	err = tcf_exts_validate(net, tp, tb, est, &e, ovr);
	if (err < 0)
		goto errout;
L
Linus Torvalds 已提交
716 717

	err = -EINVAL;
718
	if (tb[TCA_U32_LINK]) {
719
		u32 handle = nla_get_u32(tb[TCA_U32_LINK]);
720
		struct tc_u_hnode *ht_down = NULL, *ht_old;
L
Linus Torvalds 已提交
721 722 723 724 725 726 727 728 729 730 731 732

		if (TC_U32_KEY(handle))
			goto errout;

		if (handle) {
			ht_down = u32_lookup_ht(ht->tp_c, handle);

			if (ht_down == NULL)
				goto errout;
			ht_down->refcnt++;
		}

733 734
		ht_old = rtnl_dereference(n->ht_down);
		rcu_assign_pointer(n->ht_down, ht_down);
L
Linus Torvalds 已提交
735

736 737
		if (ht_old)
			ht_old->refcnt--;
L
Linus Torvalds 已提交
738
	}
739
	if (tb[TCA_U32_CLASSID]) {
740
		n->res.classid = nla_get_u32(tb[TCA_U32_CLASSID]);
L
Linus Torvalds 已提交
741 742 743 744
		tcf_bind_filter(tp, &n->res, base);
	}

#ifdef CONFIG_NET_CLS_IND
745
	if (tb[TCA_U32_INDEV]) {
746 747 748
		int ret;
		ret = tcf_change_indev(net, tb[TCA_U32_INDEV]);
		if (ret < 0)
L
Linus Torvalds 已提交
749
			goto errout;
750
		n->ifindex = ret;
L
Linus Torvalds 已提交
751 752 753 754 755 756
	}
#endif
	tcf_exts_change(tp, &n->exts, &e);

	return 0;
errout:
757
	tcf_exts_destroy(&e);
L
Linus Torvalds 已提交
758 759 760
	return err;
}

J
Jamal Hadi Salim 已提交
761
static void u32_replace_knode(struct tcf_proto *tp, struct tc_u_common *tp_c,
762 763 764 765 766 767 768 769 770 771 772 773 774 775 776 777 778 779 780 781 782 783 784 785 786 787 788 789 790 791 792 793 794 795 796 797 798 799 800 801 802 803 804 805 806 807
			      struct tc_u_knode *n)
{
	struct tc_u_knode __rcu **ins;
	struct tc_u_knode *pins;
	struct tc_u_hnode *ht;

	if (TC_U32_HTID(n->handle) == TC_U32_ROOT)
		ht = rtnl_dereference(tp->root);
	else
		ht = u32_lookup_ht(tp_c, TC_U32_HTID(n->handle));

	ins = &ht->ht[TC_U32_HASH(n->handle)];

	/* The node must always exist for it to be replaced if this is not the
	 * case then something went very wrong elsewhere.
	 */
	for (pins = rtnl_dereference(*ins); ;
	     ins = &pins->next, pins = rtnl_dereference(*ins))
		if (pins->handle == n->handle)
			break;

	RCU_INIT_POINTER(n->next, pins->next);
	rcu_assign_pointer(*ins, n);
}

static struct tc_u_knode *u32_init_knode(struct tcf_proto *tp,
					 struct tc_u_knode *n)
{
	struct tc_u_knode *new;
	struct tc_u32_sel *s = &n->sel;

	new = kzalloc(sizeof(*n) + s->nkeys*sizeof(struct tc_u32_key),
		      GFP_KERNEL);

	if (!new)
		return NULL;

	RCU_INIT_POINTER(new->next, n->next);
	new->handle = n->handle;
	RCU_INIT_POINTER(new->ht_up, n->ht_up);

#ifdef CONFIG_NET_CLS_IND
	new->ifindex = n->ifindex;
#endif
	new->fshift = n->fshift;
	new->res = n->res;
808
	new->flags = n->flags;
809 810 811 812 813 814 815 816 817 818 819 820 821 822 823 824 825 826 827 828 829 830 831
	RCU_INIT_POINTER(new->ht_down, n->ht_down);

	/* bump reference count as long as we hold pointer to structure */
	if (new->ht_down)
		new->ht_down->refcnt++;

#ifdef CONFIG_CLS_U32_PERF
	/* Statistics may be incremented by readers during update
	 * so we must keep them in tact. When the node is later destroyed
	 * a special destroy call must be made to not free the pf memory.
	 */
	new->pf = n->pf;
#endif

#ifdef CONFIG_CLS_U32_MARK
	new->val = n->val;
	new->mask = n->mask;
	/* Similarly success statistics must be moved as pointers */
	new->pcpu_success = n->pcpu_success;
#endif
	new->tp = tp;
	memcpy(&new->sel, s, sizeof(*s) + s->nkeys*sizeof(struct tc_u32_key));

832 833 834 835
	if (tcf_exts_init(&new->exts, TCA_U32_ACT, TCA_U32_POLICE)) {
		kfree(new);
		return NULL;
	}
836 837 838 839

	return new;
}

840
static int u32_change(struct net *net, struct sk_buff *in_skb,
841
		      struct tcf_proto *tp, unsigned long base, u32 handle,
J
Jamal Hadi Salim 已提交
842
		      struct nlattr **tca, unsigned long *arg, bool ovr)
L
Linus Torvalds 已提交
843 844 845 846 847
{
	struct tc_u_common *tp_c = tp->data;
	struct tc_u_hnode *ht;
	struct tc_u_knode *n;
	struct tc_u32_sel *s;
848 849
	struct nlattr *opt = tca[TCA_OPTIONS];
	struct nlattr *tb[TCA_U32_MAX + 1];
850
	u32 htid, flags = 0;
L
Linus Torvalds 已提交
851
	int err;
852 853 854
#ifdef CONFIG_CLS_U32_PERF
	size_t size;
#endif
L
Linus Torvalds 已提交
855 856 857 858

	if (opt == NULL)
		return handle ? -EINVAL : 0;

859
	err = nla_parse_nested(tb, TCA_U32_MAX, opt, u32_policy);
860 861
	if (err < 0)
		return err;
L
Linus Torvalds 已提交
862

863
	if (tb[TCA_U32_FLAGS]) {
864
		flags = nla_get_u32(tb[TCA_U32_FLAGS]);
865
		if (!tc_flags_valid(flags))
866
			return -EINVAL;
867
	}
868

E
Eric Dumazet 已提交
869 870
	n = (struct tc_u_knode *)*arg;
	if (n) {
871 872
		struct tc_u_knode *new;

L
Linus Torvalds 已提交
873 874 875
		if (TC_U32_KEY(n->handle) == 0)
			return -EINVAL;

876 877 878
		if (n->flags != flags)
			return -EINVAL;

879 880 881 882 883 884 885 886 887 888 889 890 891
		new = u32_init_knode(tp, n);
		if (!new)
			return -ENOMEM;

		err = u32_set_parms(net, tp, base,
				    rtnl_dereference(n->ht_up), new, tb,
				    tca[TCA_RATE], ovr);

		if (err) {
			u32_destroy_key(tp, new, false);
			return err;
		}

892 893 894 895 896 897
		err = u32_replace_hw_knode(tp, new, flags);
		if (err) {
			u32_destroy_key(tp, new, false);
			return err;
		}

898
		u32_replace_knode(tp, tp_c, new);
899
		tcf_unbind_filter(tp, &n->res);
900 901
		call_rcu(&n->rcu, u32_delete_key_rcu);
		return 0;
L
Linus Torvalds 已提交
902 903
	}

904
	if (tb[TCA_U32_DIVISOR]) {
E
Eric Dumazet 已提交
905
		unsigned int divisor = nla_get_u32(tb[TCA_U32_DIVISOR]);
L
Linus Torvalds 已提交
906 907 908 909 910 911 912 913 914 915

		if (--divisor > 0x100)
			return -EINVAL;
		if (TC_U32_KEY(handle))
			return -EINVAL;
		if (handle == 0) {
			handle = gen_new_htid(tp->data);
			if (handle == 0)
				return -ENOMEM;
		}
E
Eric Dumazet 已提交
916
		ht = kzalloc(sizeof(*ht) + divisor*sizeof(void *), GFP_KERNEL);
L
Linus Torvalds 已提交
917 918 919
		if (ht == NULL)
			return -ENOBUFS;
		ht->tp_c = tp_c;
920
		ht->refcnt = 1;
L
Linus Torvalds 已提交
921 922 923
		ht->divisor = divisor;
		ht->handle = handle;
		ht->prio = tp->prio;
924 925 926 927 928 929 930

		err = u32_replace_hw_hnode(tp, ht, flags);
		if (err) {
			kfree(ht);
			return err;
		}

931 932
		RCU_INIT_POINTER(ht->next, tp_c->hlist);
		rcu_assign_pointer(tp_c->hlist, ht);
L
Linus Torvalds 已提交
933
		*arg = (unsigned long)ht;
934

L
Linus Torvalds 已提交
935 936 937
		return 0;
	}

938
	if (tb[TCA_U32_HASH]) {
939
		htid = nla_get_u32(tb[TCA_U32_HASH]);
L
Linus Torvalds 已提交
940
		if (TC_U32_HTID(htid) == TC_U32_ROOT) {
941
			ht = rtnl_dereference(tp->root);
L
Linus Torvalds 已提交
942 943 944 945 946 947 948
			htid = ht->handle;
		} else {
			ht = u32_lookup_ht(tp->data, TC_U32_HTID(htid));
			if (ht == NULL)
				return -EINVAL;
		}
	} else {
949
		ht = rtnl_dereference(tp->root);
L
Linus Torvalds 已提交
950 951 952 953 954 955 956 957 958 959 960 961 962
		htid = ht->handle;
	}

	if (ht->divisor < TC_U32_HASH(htid))
		return -EINVAL;

	if (handle) {
		if (TC_U32_HTID(handle) && TC_U32_HTID(handle^htid))
			return -EINVAL;
		handle = htid | TC_U32_NODE(handle);
	} else
		handle = gen_new_kid(ht, htid);

963
	if (tb[TCA_U32_SEL] == NULL)
L
Linus Torvalds 已提交
964 965
		return -EINVAL;

966
	s = nla_data(tb[TCA_U32_SEL]);
L
Linus Torvalds 已提交
967

968
	n = kzalloc(sizeof(*n) + s->nkeys*sizeof(struct tc_u32_key), GFP_KERNEL);
L
Linus Torvalds 已提交
969 970 971 972
	if (n == NULL)
		return -ENOBUFS;

#ifdef CONFIG_CLS_U32_PERF
973 974 975
	size = sizeof(struct tc_u32_pcnt) + s->nkeys * sizeof(u64);
	n->pf = __alloc_percpu(size, __alignof__(struct tc_u32_pcnt));
	if (!n->pf) {
L
Linus Torvalds 已提交
976 977 978 979 980 981
		kfree(n);
		return -ENOBUFS;
	}
#endif

	memcpy(&n->sel, s, sizeof(*s) + s->nkeys*sizeof(struct tc_u32_key));
982
	RCU_INIT_POINTER(n->ht_up, ht);
L
Linus Torvalds 已提交
983
	n->handle = handle;
984
	n->fshift = s->hmask ? ffs(ntohl(s->hmask)) - 1 : 0;
985
	n->flags = flags;
986
	n->tp = tp;
L
Linus Torvalds 已提交
987

988 989 990 991
	err = tcf_exts_init(&n->exts, TCA_U32_ACT, TCA_U32_POLICE);
	if (err < 0)
		goto errout;

L
Linus Torvalds 已提交
992
#ifdef CONFIG_CLS_U32_MARK
993
	n->pcpu_success = alloc_percpu(u32);
994 995 996 997
	if (!n->pcpu_success) {
		err = -ENOMEM;
		goto errout;
	}
998

999
	if (tb[TCA_U32_MARK]) {
L
Linus Torvalds 已提交
1000 1001
		struct tc_u32_mark *mark;

1002
		mark = nla_data(tb[TCA_U32_MARK]);
1003 1004
		n->val = mark->val;
		n->mask = mark->mask;
L
Linus Torvalds 已提交
1005 1006 1007
	}
#endif

1008
	err = u32_set_parms(net, tp, base, ht, n, tb, tca[TCA_RATE], ovr);
L
Linus Torvalds 已提交
1009
	if (err == 0) {
1010 1011 1012
		struct tc_u_knode __rcu **ins;
		struct tc_u_knode *pins;

1013 1014 1015 1016
		err = u32_replace_hw_knode(tp, n, flags);
		if (err)
			goto errhw;

1017 1018 1019 1020
		ins = &ht->ht[TC_U32_HASH(handle)];
		for (pins = rtnl_dereference(*ins); pins;
		     ins = &pins->next, pins = rtnl_dereference(*ins))
			if (TC_U32_NODE(handle) < TC_U32_NODE(pins->handle))
L
Linus Torvalds 已提交
1021 1022
				break;

1023 1024
		RCU_INIT_POINTER(n->next, pins);
		rcu_assign_pointer(*ins, n);
L
Linus Torvalds 已提交
1025 1026 1027
		*arg = (unsigned long)n;
		return 0;
	}
1028

1029
errhw:
1030 1031 1032 1033
#ifdef CONFIG_CLS_U32_MARK
	free_percpu(n->pcpu_success);
#endif

1034 1035
errout:
	tcf_exts_destroy(&n->exts);
L
Linus Torvalds 已提交
1036
#ifdef CONFIG_CLS_U32_PERF
1037
	free_percpu(n->pf);
L
Linus Torvalds 已提交
1038 1039 1040 1041 1042 1043 1044 1045 1046 1047
#endif
	kfree(n);
	return err;
}

static void u32_walk(struct tcf_proto *tp, struct tcf_walker *arg)
{
	struct tc_u_common *tp_c = tp->data;
	struct tc_u_hnode *ht;
	struct tc_u_knode *n;
E
Eric Dumazet 已提交
1048
	unsigned int h;
L
Linus Torvalds 已提交
1049 1050 1051 1052

	if (arg->stop)
		return;

1053 1054 1055
	for (ht = rtnl_dereference(tp_c->hlist);
	     ht;
	     ht = rtnl_dereference(ht->next)) {
L
Linus Torvalds 已提交
1056 1057 1058 1059 1060 1061 1062 1063 1064 1065
		if (ht->prio != tp->prio)
			continue;
		if (arg->count >= arg->skip) {
			if (arg->fn(tp, (unsigned long)ht, arg) < 0) {
				arg->stop = 1;
				return;
			}
		}
		arg->count++;
		for (h = 0; h <= ht->divisor; h++) {
1066 1067 1068
			for (n = rtnl_dereference(ht->ht[h]);
			     n;
			     n = rtnl_dereference(n->next)) {
L
Linus Torvalds 已提交
1069 1070 1071 1072 1073 1074 1075 1076 1077 1078 1079 1080 1081 1082
				if (arg->count < arg->skip) {
					arg->count++;
					continue;
				}
				if (arg->fn(tp, (unsigned long)n, arg) < 0) {
					arg->stop = 1;
					return;
				}
				arg->count++;
			}
		}
	}
}

1083
static int u32_dump(struct net *net, struct tcf_proto *tp, unsigned long fh,
J
Jamal Hadi Salim 已提交
1084
		    struct sk_buff *skb, struct tcmsg *t)
L
Linus Torvalds 已提交
1085
{
E
Eric Dumazet 已提交
1086
	struct tc_u_knode *n = (struct tc_u_knode *)fh;
1087
	struct tc_u_hnode *ht_up, *ht_down;
1088
	struct nlattr *nest;
L
Linus Torvalds 已提交
1089 1090 1091 1092 1093 1094

	if (n == NULL)
		return skb->len;

	t->tcm_handle = n->handle;

1095 1096 1097
	nest = nla_nest_start(skb, TCA_OPTIONS);
	if (nest == NULL)
		goto nla_put_failure;
L
Linus Torvalds 已提交
1098 1099

	if (TC_U32_KEY(n->handle) == 0) {
E
Eric Dumazet 已提交
1100 1101 1102
		struct tc_u_hnode *ht = (struct tc_u_hnode *)fh;
		u32 divisor = ht->divisor + 1;

1103 1104
		if (nla_put_u32(skb, TCA_U32_DIVISOR, divisor))
			goto nla_put_failure;
L
Linus Torvalds 已提交
1105
	} else {
1106 1107 1108
#ifdef CONFIG_CLS_U32_PERF
		struct tc_u32_pcnt *gpf;
		int cpu;
1109
#endif
1110

1111 1112 1113 1114
		if (nla_put(skb, TCA_U32_SEL,
			    sizeof(n->sel) + n->sel.nkeys*sizeof(struct tc_u32_key),
			    &n->sel))
			goto nla_put_failure;
1115 1116 1117

		ht_up = rtnl_dereference(n->ht_up);
		if (ht_up) {
L
Linus Torvalds 已提交
1118
			u32 htid = n->handle & 0xFFFFF000;
1119 1120
			if (nla_put_u32(skb, TCA_U32_HASH, htid))
				goto nla_put_failure;
L
Linus Torvalds 已提交
1121
		}
1122 1123 1124
		if (n->res.classid &&
		    nla_put_u32(skb, TCA_U32_CLASSID, n->res.classid))
			goto nla_put_failure;
1125 1126 1127 1128

		ht_down = rtnl_dereference(n->ht_down);
		if (ht_down &&
		    nla_put_u32(skb, TCA_U32_LINK, ht_down->handle))
1129
			goto nla_put_failure;
L
Linus Torvalds 已提交
1130

1131 1132 1133
		if (n->flags && nla_put_u32(skb, TCA_U32_FLAGS, n->flags))
			goto nla_put_failure;

L
Linus Torvalds 已提交
1134
#ifdef CONFIG_CLS_U32_MARK
1135 1136 1137 1138
		if ((n->val || n->mask)) {
			struct tc_u32_mark mark = {.val = n->val,
						   .mask = n->mask,
						   .success = 0};
1139
			int cpum;
1140

1141 1142
			for_each_possible_cpu(cpum) {
				__u32 cnt = *per_cpu_ptr(n->pcpu_success, cpum);
1143 1144 1145 1146 1147 1148 1149

				mark.success += cnt;
			}

			if (nla_put(skb, TCA_U32_MARK, sizeof(mark), &mark))
				goto nla_put_failure;
		}
L
Linus Torvalds 已提交
1150 1151
#endif

1152
		if (tcf_exts_dump(skb, &n->exts) < 0)
1153
			goto nla_put_failure;
L
Linus Torvalds 已提交
1154 1155

#ifdef CONFIG_NET_CLS_IND
1156 1157 1158 1159 1160 1161
		if (n->ifindex) {
			struct net_device *dev;
			dev = __dev_get_by_index(net, n->ifindex);
			if (dev && nla_put_string(skb, TCA_U32_INDEV, dev->name))
				goto nla_put_failure;
		}
L
Linus Torvalds 已提交
1162 1163
#endif
#ifdef CONFIG_CLS_U32_PERF
1164 1165 1166 1167 1168 1169 1170 1171 1172 1173 1174 1175 1176 1177 1178 1179
		gpf = kzalloc(sizeof(struct tc_u32_pcnt) +
			      n->sel.nkeys * sizeof(u64),
			      GFP_KERNEL);
		if (!gpf)
			goto nla_put_failure;

		for_each_possible_cpu(cpu) {
			int i;
			struct tc_u32_pcnt *pf = per_cpu_ptr(n->pf, cpu);

			gpf->rcnt += pf->rcnt;
			gpf->rhit += pf->rhit;
			for (i = 0; i < n->sel.nkeys; i++)
				gpf->kcnts[i] += pf->kcnts[i];
		}

1180 1181 1182 1183
		if (nla_put_64bit(skb, TCA_U32_PCNT,
				  sizeof(struct tc_u32_pcnt) +
				  n->sel.nkeys * sizeof(u64),
				  gpf, TCA_U32_PAD)) {
1184
			kfree(gpf);
1185
			goto nla_put_failure;
1186 1187
		}
		kfree(gpf);
L
Linus Torvalds 已提交
1188 1189 1190
#endif
	}

1191 1192
	nla_nest_end(skb, nest);

L
Linus Torvalds 已提交
1193
	if (TC_U32_KEY(n->handle))
1194
		if (tcf_exts_dump_stats(skb, &n->exts) < 0)
1195
			goto nla_put_failure;
L
Linus Torvalds 已提交
1196 1197
	return skb->len;

1198
nla_put_failure:
1199
	nla_nest_cancel(skb, nest);
L
Linus Torvalds 已提交
1200 1201 1202
	return -1;
}

1203
static struct tcf_proto_ops cls_u32_ops __read_mostly = {
L
Linus Torvalds 已提交
1204 1205 1206 1207 1208 1209 1210 1211 1212 1213 1214 1215 1216 1217
	.kind		=	"u32",
	.classify	=	u32_classify,
	.init		=	u32_init,
	.destroy	=	u32_destroy,
	.get		=	u32_get,
	.change		=	u32_change,
	.delete		=	u32_delete,
	.walk		=	u32_walk,
	.dump		=	u32_dump,
	.owner		=	THIS_MODULE,
};

static int __init init_u32(void)
{
1218
	pr_info("u32 classifier\n");
L
Linus Torvalds 已提交
1219
#ifdef CONFIG_CLS_U32_PERF
1220
	pr_info("    Performance counters on\n");
L
Linus Torvalds 已提交
1221 1222
#endif
#ifdef CONFIG_NET_CLS_IND
1223
	pr_info("    input device check on\n");
L
Linus Torvalds 已提交
1224 1225
#endif
#ifdef CONFIG_NET_CLS_ACT
1226
	pr_info("    Actions configured\n");
L
Linus Torvalds 已提交
1227 1228 1229 1230
#endif
	return register_tcf_proto_ops(&cls_u32_ops);
}

1231
static void __exit exit_u32(void)
L
Linus Torvalds 已提交
1232 1233 1234 1235 1236 1237 1238
{
	unregister_tcf_proto_ops(&cls_u32_ops);
}

module_init(init_u32)
module_exit(exit_u32)
MODULE_LICENSE("GPL");