br_fdb.c 25.5 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
/*
 *	Forwarding database
 *	Linux ethernet bridge
 *
 *	Authors:
 *	Lennert Buytenhek		<buytenh@gnu.org>
 *
 *	This program is free software; you can redistribute it and/or
 *	modify it under the terms of the GNU General Public License
 *	as published by the Free Software Foundation; either version
 *	2 of the License, or (at your option) any later version.
 */

#include <linux/kernel.h>
#include <linux/init.h>
16
#include <linux/rculist.h>
L
Linus Torvalds 已提交
17 18 19 20 21
#include <linux/spinlock.h>
#include <linux/times.h>
#include <linux/netdevice.h>
#include <linux/etherdevice.h>
#include <linux/jhash.h>
22
#include <linux/random.h>
23
#include <linux/slab.h>
A
Arun Sharma 已提交
24
#include <linux/atomic.h>
25
#include <asm/unaligned.h>
26
#include <linux/if_vlan.h>
27
#include <net/switchdev.h>
L
Linus Torvalds 已提交
28 29
#include "br_private.h"

30
static struct kmem_cache *br_fdb_cache __read_mostly;
31 32 33
static struct net_bridge_fdb_entry *fdb_find(struct hlist_head *head,
					     const unsigned char *addr,
					     __u16 vid);
L
Linus Torvalds 已提交
34
static int fdb_insert(struct net_bridge *br, struct net_bridge_port *source,
35
		      const unsigned char *addr, u16 vid);
36 37
static void fdb_notify(struct net_bridge *br,
		       const struct net_bridge_fdb_entry *, int);
L
Linus Torvalds 已提交
38

39 40
static u32 fdb_salt __read_mostly;

41
int __init br_fdb_init(void)
L
Linus Torvalds 已提交
42 43 44 45
{
	br_fdb_cache = kmem_cache_create("bridge_fdb_cache",
					 sizeof(struct net_bridge_fdb_entry),
					 0,
46
					 SLAB_HWCACHE_ALIGN, NULL);
47 48 49
	if (!br_fdb_cache)
		return -ENOMEM;

50
	get_random_bytes(&fdb_salt, sizeof(fdb_salt));
51
	return 0;
L
Linus Torvalds 已提交
52 53
}

A
Andrew Morton 已提交
54
void br_fdb_fini(void)
L
Linus Torvalds 已提交
55 56 57 58 59 60 61 62
{
	kmem_cache_destroy(br_fdb_cache);
}


/* if topology_changing then use forward_delay (default 15 sec)
 * otherwise keep longer (default 5 minutes)
 */
63
static inline unsigned long hold_time(const struct net_bridge *br)
L
Linus Torvalds 已提交
64 65 66 67
{
	return br->topology_change ? br->forward_delay : br->ageing_time;
}

68
static inline int has_expired(const struct net_bridge *br,
L
Linus Torvalds 已提交
69 70
				  const struct net_bridge_fdb_entry *fdb)
{
71
	return !fdb->is_static &&
72
		time_before_eq(fdb->updated + hold_time(br), jiffies);
L
Linus Torvalds 已提交
73 74
}

75
static inline int br_mac_hash(const unsigned char *mac, __u16 vid)
L
Linus Torvalds 已提交
76
{
77
	/* use 1 byte of OUI and 3 bytes of NIC */
78
	u32 key = get_unaligned((u32 *)(mac + 2));
79
	return jhash_2words(key, vid, fdb_salt) & (BR_HASH_SIZE - 1);
L
Linus Torvalds 已提交
80 81
}

82 83 84 85 86 87 88
static void fdb_rcu_free(struct rcu_head *head)
{
	struct net_bridge_fdb_entry *ent
		= container_of(head, struct net_bridge_fdb_entry, rcu);
	kmem_cache_free(br_fdb_cache, ent);
}

89 90 91 92 93
/* When a static FDB entry is added, the mac address from the entry is
 * added to the bridge private HW address list and all required ports
 * are then updated with the new information.
 * Called under RTNL.
 */
94
static void fdb_add_hw_addr(struct net_bridge *br, const unsigned char *addr)
95 96
{
	int err;
97
	struct net_bridge_port *p;
98 99 100 101 102 103 104 105 106 107 108 109 110

	ASSERT_RTNL();

	list_for_each_entry(p, &br->port_list, list) {
		if (!br_promisc_port(p)) {
			err = dev_uc_add(p->dev, addr);
			if (err)
				goto undo;
		}
	}

	return;
undo:
111 112 113
	list_for_each_entry_continue_reverse(p, &br->port_list, list) {
		if (!br_promisc_port(p))
			dev_uc_del(p->dev, addr);
114 115 116 117 118 119 120 121
	}
}

/* When a static FDB entry is deleted, the HW address from that entry is
 * also removed from the bridge private HW address list and updates all
 * the ports with needed information.
 * Called under RTNL.
 */
122
static void fdb_del_hw_addr(struct net_bridge *br, const unsigned char *addr)
123 124 125 126 127 128 129 130 131 132 133
{
	struct net_bridge_port *p;

	ASSERT_RTNL();

	list_for_each_entry(p, &br->port_list, list) {
		if (!br_promisc_port(p))
			dev_uc_del(p->dev, addr);
	}
}

134 135
static void fdb_del_external_learn(struct net_bridge_fdb_entry *f)
{
136
	struct switchdev_obj_port_fdb fdb = {
137
		.obj.id = SWITCHDEV_OBJ_ID_PORT_FDB,
138 139
		.addr = f->addr.addr,
		.vid = f->vlan_id,
140 141
	};

142
	switchdev_port_obj_del(f->dst->dev, &fdb.obj);
143 144
}

145
static void fdb_delete(struct net_bridge *br, struct net_bridge_fdb_entry *f)
L
Linus Torvalds 已提交
146
{
147
	if (f->is_static)
148
		fdb_del_hw_addr(br, f->addr.addr);
149

150 151 152
	if (f->added_by_external_learn)
		fdb_del_external_learn(f);

L
Linus Torvalds 已提交
153
	hlist_del_rcu(&f->hlist);
154
	fdb_notify(br, f, RTM_DELNEIGH);
155
	call_rcu(&f->rcu, fdb_rcu_free);
L
Linus Torvalds 已提交
156 157
}

158 159 160 161 162 163
/* Delete a local entry if no other port had the same address. */
static void fdb_delete_local(struct net_bridge *br,
			     const struct net_bridge_port *p,
			     struct net_bridge_fdb_entry *f)
{
	const unsigned char *addr = f->addr.addr;
164 165
	struct net_bridge_vlan_group *vg;
	const struct net_bridge_vlan *v;
166
	struct net_bridge_port *op;
167
	u16 vid = f->vlan_id;
168 169 170

	/* Maybe another port has same hw addr? */
	list_for_each_entry(op, &br->port_list, list) {
171
		vg = nbp_vlan_group(op);
172
		if (op != p && ether_addr_equal(op->dev->dev_addr, addr) &&
173
		    (!vid || br_vlan_find(vg, vid))) {
174
			f->dst = op;
175
			f->added_by_user = 0;
176 177 178 179
			return;
		}
	}

180 181
	vg = br_vlan_group(br);
	v = br_vlan_find(vg, vid);
182 183
	/* Maybe bridge device has same hw addr? */
	if (p && ether_addr_equal(br->dev->dev_addr, addr) &&
184
	    (!vid || (v && br_vlan_should_use(v)))) {
185
		f->dst = NULL;
186
		f->added_by_user = 0;
187 188 189 190 191 192
		return;
	}

	fdb_delete(br, f);
}

193 194 195 196 197 198 199 200 201 202 203 204 205 206
void br_fdb_find_delete_local(struct net_bridge *br,
			      const struct net_bridge_port *p,
			      const unsigned char *addr, u16 vid)
{
	struct hlist_head *head = &br->hash[br_mac_hash(addr, vid)];
	struct net_bridge_fdb_entry *f;

	spin_lock_bh(&br->hash_lock);
	f = fdb_find(head, addr, vid);
	if (f && f->is_local && !f->added_by_user && f->dst == p)
		fdb_delete_local(br, p, f);
	spin_unlock_bh(&br->hash_lock);
}

L
Linus Torvalds 已提交
207 208
void br_fdb_changeaddr(struct net_bridge_port *p, const unsigned char *newaddr)
{
209
	struct net_bridge_vlan_group *vg;
L
Linus Torvalds 已提交
210
	struct net_bridge *br = p->br;
211
	struct net_bridge_vlan *v;
L
Linus Torvalds 已提交
212
	int i;
213

L
Linus Torvalds 已提交
214 215
	spin_lock_bh(&br->hash_lock);

216
	vg = nbp_vlan_group(p);
L
Linus Torvalds 已提交
217 218 219 220 221 222 223
	/* Search all chains since old address/hash is unknown */
	for (i = 0; i < BR_HASH_SIZE; i++) {
		struct hlist_node *h;
		hlist_for_each(h, &br->hash[i]) {
			struct net_bridge_fdb_entry *f;

			f = hlist_entry(h, struct net_bridge_fdb_entry, hlist);
224
			if (f->dst == p && f->is_local && !f->added_by_user) {
L
Linus Torvalds 已提交
225
				/* delete old one */
226 227
				fdb_delete_local(br, p, f);

228 229 230 231
				/* if this port has no vlan information
				 * configured, we can safely be done at
				 * this point.
				 */
232
				if (!vg || !vg->num_vlans)
233
					goto insert;
L
Linus Torvalds 已提交
234 235 236 237
			}
		}
	}

238 239 240 241
insert:
	/* insert new address,  may fail if invalid address or dup. */
	fdb_insert(br, p, newaddr, 0);

242
	if (!vg || !vg->num_vlans)
243 244 245 246 247 248
		goto done;

	/* Now add entries for every VLAN configured on the port.
	 * This function runs under RTNL so the bitmap will not change
	 * from under us.
	 */
249 250
	list_for_each_entry(v, &vg->vlan_list, vlist)
		fdb_insert(br, p, newaddr, v->vid);
251

252
done:
L
Linus Torvalds 已提交
253 254 255
	spin_unlock_bh(&br->hash_lock);
}

256 257
void br_fdb_change_mac_address(struct net_bridge *br, const u8 *newaddr)
{
258
	struct net_bridge_vlan_group *vg;
259
	struct net_bridge_fdb_entry *f;
260
	struct net_bridge_vlan *v;
261

262 263
	spin_lock_bh(&br->hash_lock);

264
	/* If old entry was unassociated with any port, then delete it. */
265
	f = __br_fdb_get(br, br->dev->dev_addr, 0);
266
	if (f && f->is_local && !f->dst)
267
		fdb_delete_local(br, NULL, f);
268

269
	fdb_insert(br, NULL, newaddr, 0);
270 271 272
	vg = br_vlan_group(br);
	if (!vg || !vg->num_vlans)
		goto out;
273 274 275 276
	/* Now remove and add entries for every VLAN configured on the
	 * bridge.  This function runs under RTNL so the bitmap will not
	 * change from under us.
	 */
277 278
	list_for_each_entry(v, &vg->vlan_list, vlist) {
		f = __br_fdb_get(br, br->dev->dev_addr, v->vid);
279
		if (f && f->is_local && !f->dst)
280
			fdb_delete_local(br, NULL, f);
281
		fdb_insert(br, NULL, newaddr, v->vid);
282
	}
283 284
out:
	spin_unlock_bh(&br->hash_lock);
285 286
}

L
Linus Torvalds 已提交
287 288 289 290
void br_fdb_cleanup(unsigned long _data)
{
	struct net_bridge *br = (struct net_bridge *)_data;
	unsigned long delay = hold_time(br);
291
	unsigned long next_timer = jiffies + br->ageing_time;
L
Linus Torvalds 已提交
292 293
	int i;

294
	spin_lock(&br->hash_lock);
L
Linus Torvalds 已提交
295 296
	for (i = 0; i < BR_HASH_SIZE; i++) {
		struct net_bridge_fdb_entry *f;
297
		struct hlist_node *n;
L
Linus Torvalds 已提交
298

299
		hlist_for_each_entry_safe(f, n, &br->hash[i], hlist) {
300
			unsigned long this_timer;
301
			if (f->is_static)
302
				continue;
303 304
			if (f->added_by_external_learn)
				continue;
305
			this_timer = f->updated + delay;
306
			if (time_before_eq(this_timer, jiffies))
307
				fdb_delete(br, f);
308
			else if (time_before(this_timer, next_timer))
309
				next_timer = this_timer;
L
Linus Torvalds 已提交
310 311
		}
	}
312
	spin_unlock(&br->hash_lock);
L
Linus Torvalds 已提交
313

314
	mod_timer(&br->gc_timer, round_jiffies_up(next_timer));
L
Linus Torvalds 已提交
315 316
}

317 318 319 320 321 322 323 324
/* Completely flush all dynamic entries in forwarding database.*/
void br_fdb_flush(struct net_bridge *br)
{
	int i;

	spin_lock_bh(&br->hash_lock);
	for (i = 0; i < BR_HASH_SIZE; i++) {
		struct net_bridge_fdb_entry *f;
325 326
		struct hlist_node *n;
		hlist_for_each_entry_safe(f, n, &br->hash[i], hlist) {
327
			if (!f->is_static)
328
				fdb_delete(br, f);
329 330 331 332
		}
	}
	spin_unlock_bh(&br->hash_lock);
}
333

L
Lucas De Marchi 已提交
334
/* Flush all entries referring to a specific port.
335
 * if do_all is set also flush static entries
336
 * if vid is set delete all entries that match the vlan_id
337
 */
338 339
void br_fdb_delete_by_port(struct net_bridge *br,
			   const struct net_bridge_port *p,
340
			   u16 vid,
341
			   int do_all)
L
Linus Torvalds 已提交
342 343 344 345 346 347
{
	int i;

	spin_lock_bh(&br->hash_lock);
	for (i = 0; i < BR_HASH_SIZE; i++) {
		struct hlist_node *h, *g;
348

L
Linus Torvalds 已提交
349 350 351
		hlist_for_each_safe(h, g, &br->hash[i]) {
			struct net_bridge_fdb_entry *f
				= hlist_entry(h, struct net_bridge_fdb_entry, hlist);
352
			if (f->dst != p)
L
Linus Torvalds 已提交
353 354
				continue;

355 356 357
			if (!do_all)
				if (f->is_static || (vid && f->vlan_id != vid))
					continue;
L
Linus Torvalds 已提交
358

359 360 361 362
			if (f->is_local)
				fdb_delete_local(br, p, f);
			else
				fdb_delete(br, f);
L
Linus Torvalds 已提交
363 364 365 366 367
		}
	}
	spin_unlock_bh(&br->hash_lock);
}

368
/* No locking or refcounting, assumes caller has rcu_read_lock */
L
Linus Torvalds 已提交
369
struct net_bridge_fdb_entry *__br_fdb_get(struct net_bridge *br,
370 371
					  const unsigned char *addr,
					  __u16 vid)
L
Linus Torvalds 已提交
372 373 374
{
	struct net_bridge_fdb_entry *fdb;

375
	hlist_for_each_entry_rcu(fdb,
376 377 378
				&br->hash[br_mac_hash(addr, vid)], hlist) {
		if (ether_addr_equal(fdb->addr.addr, addr) &&
		    fdb->vlan_id == vid) {
L
Linus Torvalds 已提交
379 380 381 382 383 384 385 386 387
			if (unlikely(has_expired(br, fdb)))
				break;
			return fdb;
		}
	}

	return NULL;
}

I
Igor Maravić 已提交
388
#if IS_ENABLED(CONFIG_ATM_LANE)
389 390 391
/* Interface used by ATM LANE hook to test
 * if an addr is on some other bridge port */
int br_fdb_test_addr(struct net_device *dev, unsigned char *addr)
L
Linus Torvalds 已提交
392 393
{
	struct net_bridge_fdb_entry *fdb;
394
	struct net_bridge_port *port;
395 396
	int ret;

L
Linus Torvalds 已提交
397
	rcu_read_lock();
398 399 400 401
	port = br_port_get_rcu(dev);
	if (!port)
		ret = 0;
	else {
402
		fdb = __br_fdb_get(port->br, addr, 0);
403
		ret = fdb && fdb->dst && fdb->dst->dev != dev &&
404 405
			fdb->dst->state == BR_STATE_FORWARDING;
	}
L
Linus Torvalds 已提交
406 407
	rcu_read_unlock();

408
	return ret;
L
Linus Torvalds 已提交
409
}
410
#endif /* CONFIG_ATM_LANE */
L
Linus Torvalds 已提交
411 412

/*
413
 * Fill buffer with forwarding table records in
L
Linus Torvalds 已提交
414 415 416 417 418 419 420 421 422 423 424 425 426
 * the API format.
 */
int br_fdb_fillbuf(struct net_bridge *br, void *buf,
		   unsigned long maxnum, unsigned long skip)
{
	struct __fdb_entry *fe = buf;
	int i, num = 0;
	struct net_bridge_fdb_entry *f;

	memset(buf, 0, maxnum*sizeof(struct __fdb_entry));

	rcu_read_lock();
	for (i = 0; i < BR_HASH_SIZE; i++) {
427
		hlist_for_each_entry_rcu(f, &br->hash[i], hlist) {
L
Linus Torvalds 已提交
428 429 430
			if (num >= maxnum)
				goto out;

431
			if (has_expired(br, f))
L
Linus Torvalds 已提交
432 433
				continue;

434 435 436 437
			/* ignore pseudo entry for local MAC address */
			if (!f->dst)
				continue;

L
Linus Torvalds 已提交
438 439 440 441 442 443 444
			if (skip) {
				--skip;
				continue;
			}

			/* convert from internal format to API */
			memcpy(fe->mac_addr, f->addr.addr, ETH_ALEN);
445 446

			/* due to ABI compat need to split into hi/lo */
L
Linus Torvalds 已提交
447
			fe->port_no = f->dst->port_no;
448 449
			fe->port_hi = f->dst->port_no >> 8;

L
Linus Torvalds 已提交
450 451
			fe->is_local = f->is_local;
			if (!f->is_static)
452
				fe->ageing_timer_value = jiffies_delta_to_clock_t(jiffies - f->updated);
L
Linus Torvalds 已提交
453 454 455 456 457 458 459 460 461 462 463
			++fe;
			++num;
		}
	}

 out:
	rcu_read_unlock();

	return num;
}

464
static struct net_bridge_fdb_entry *fdb_find(struct hlist_head *head,
465 466
					     const unsigned char *addr,
					     __u16 vid)
467 468 469
{
	struct net_bridge_fdb_entry *fdb;

470
	hlist_for_each_entry(fdb, head, hlist) {
471 472
		if (ether_addr_equal(fdb->addr.addr, addr) &&
		    fdb->vlan_id == vid)
473 474 475 476 477 478
			return fdb;
	}
	return NULL;
}

static struct net_bridge_fdb_entry *fdb_find_rcu(struct hlist_head *head,
479 480
						 const unsigned char *addr,
						 __u16 vid)
L
Linus Torvalds 已提交
481 482 483
{
	struct net_bridge_fdb_entry *fdb;

484
	hlist_for_each_entry_rcu(fdb, head, hlist) {
485 486
		if (ether_addr_equal(fdb->addr.addr, addr) &&
		    fdb->vlan_id == vid)
L
Linus Torvalds 已提交
487 488 489 490 491 492 493
			return fdb;
	}
	return NULL;
}

static struct net_bridge_fdb_entry *fdb_create(struct hlist_head *head,
					       struct net_bridge_port *source,
494 495
					       const unsigned char *addr,
					       __u16 vid)
L
Linus Torvalds 已提交
496 497 498 499 500 501 502
{
	struct net_bridge_fdb_entry *fdb;

	fdb = kmem_cache_alloc(br_fdb_cache, GFP_ATOMIC);
	if (fdb) {
		memcpy(fdb->addr.addr, addr, ETH_ALEN);
		fdb->dst = source;
503
		fdb->vlan_id = vid;
504 505
		fdb->is_local = 0;
		fdb->is_static = 0;
506
		fdb->added_by_user = 0;
507
		fdb->added_by_external_learn = 0;
508
		fdb->updated = fdb->used = jiffies;
509
		hlist_add_head_rcu(&fdb->hlist, head);
L
Linus Torvalds 已提交
510 511 512 513 514
	}
	return fdb;
}

static int fdb_insert(struct net_bridge *br, struct net_bridge_port *source,
515
		  const unsigned char *addr, u16 vid)
L
Linus Torvalds 已提交
516
{
517
	struct hlist_head *head = &br->hash[br_mac_hash(addr, vid)];
L
Linus Torvalds 已提交
518 519 520 521 522
	struct net_bridge_fdb_entry *fdb;

	if (!is_valid_ether_addr(addr))
		return -EINVAL;

523
	fdb = fdb_find(head, addr, vid);
L
Linus Torvalds 已提交
524
	if (fdb) {
525
		/* it is okay to have multiple ports with same
L
Linus Torvalds 已提交
526 527
		 * address, just use the first one.
		 */
528
		if (fdb->is_local)
L
Linus Torvalds 已提交
529
			return 0;
530
		br_warn(br, "adding interface %s with same address "
L
Linus Torvalds 已提交
531
		       "as a received packet\n",
532
		       source ? source->dev->name : br->dev->name);
533
		fdb_delete(br, fdb);
534
	}
L
Linus Torvalds 已提交
535

536
	fdb = fdb_create(head, source, addr, vid);
537
	if (!fdb)
L
Linus Torvalds 已提交
538 539
		return -ENOMEM;

540
	fdb->is_local = fdb->is_static = 1;
541
	fdb_add_hw_addr(br, addr);
542
	fdb_notify(br, fdb, RTM_NEWNEIGH);
L
Linus Torvalds 已提交
543 544 545
	return 0;
}

546
/* Add entry for local address of interface */
L
Linus Torvalds 已提交
547
int br_fdb_insert(struct net_bridge *br, struct net_bridge_port *source,
548
		  const unsigned char *addr, u16 vid)
L
Linus Torvalds 已提交
549 550 551 552
{
	int ret;

	spin_lock_bh(&br->hash_lock);
553
	ret = fdb_insert(br, source, addr, vid);
L
Linus Torvalds 已提交
554 555 556 557 558
	spin_unlock_bh(&br->hash_lock);
	return ret;
}

void br_fdb_update(struct net_bridge *br, struct net_bridge_port *source,
559
		   const unsigned char *addr, u16 vid, bool added_by_user)
L
Linus Torvalds 已提交
560
{
561
	struct hlist_head *head = &br->hash[br_mac_hash(addr, vid)];
L
Linus Torvalds 已提交
562
	struct net_bridge_fdb_entry *fdb;
563
	bool fdb_modified = false;
L
Linus Torvalds 已提交
564 565 566 567 568

	/* some users want to always flood. */
	if (hold_time(br) == 0)
		return;

569 570 571 572 573
	/* ignore packets unless we are using this port */
	if (!(source->state == BR_STATE_LEARNING ||
	      source->state == BR_STATE_FORWARDING))
		return;

574
	fdb = fdb_find_rcu(head, addr, vid);
L
Linus Torvalds 已提交
575 576 577
	if (likely(fdb)) {
		/* attempt to update an entry for a local interface */
		if (unlikely(fdb->is_local)) {
578
			if (net_ratelimit())
579 580 581
				br_warn(br, "received packet on %s with "
					"own address as source address\n",
					source->dev->name);
L
Linus Torvalds 已提交
582 583
		} else {
			/* fastpath: update of existing entry */
584 585 586 587
			if (unlikely(source != fdb->dst)) {
				fdb->dst = source;
				fdb_modified = true;
			}
588
			fdb->updated = jiffies;
589 590
			if (unlikely(added_by_user))
				fdb->added_by_user = 1;
591 592
			if (unlikely(fdb_modified))
				fdb_notify(br, fdb, RTM_NEWNEIGH);
L
Linus Torvalds 已提交
593 594
		}
	} else {
595
		spin_lock(&br->hash_lock);
596 597
		if (likely(!fdb_find(head, addr, vid))) {
			fdb = fdb_create(head, source, addr, vid);
598 599 600
			if (fdb) {
				if (unlikely(added_by_user))
					fdb->added_by_user = 1;
601
				fdb_notify(br, fdb, RTM_NEWNEIGH);
602
			}
S
stephen hemminger 已提交
603
		}
L
Linus Torvalds 已提交
604 605 606
		/* else  we lose race and someone else inserts
		 * it first, don't bother updating
		 */
607
		spin_unlock(&br->hash_lock);
L
Linus Torvalds 已提交
608 609
	}
}
610 611 612 613 614 615 616 617 618 619 620 621 622

static int fdb_to_nud(const struct net_bridge_fdb_entry *fdb)
{
	if (fdb->is_local)
		return NUD_PERMANENT;
	else if (fdb->is_static)
		return NUD_NOARP;
	else if (has_expired(fdb->dst->br, fdb))
		return NUD_STALE;
	else
		return NUD_REACHABLE;
}

623
static int fdb_fill_info(struct sk_buff *skb, const struct net_bridge *br,
624
			 const struct net_bridge_fdb_entry *fdb,
625
			 u32 portid, u32 seq, int type, unsigned int flags)
626 627 628 629 630 631
{
	unsigned long now = jiffies;
	struct nda_cacheinfo ci;
	struct nlmsghdr *nlh;
	struct ndmsg *ndm;

632
	nlh = nlmsg_put(skb, portid, seq, type, sizeof(*ndm), flags);
633 634 635 636 637 638 639
	if (nlh == NULL)
		return -EMSGSIZE;

	ndm = nlmsg_data(nlh);
	ndm->ndm_family	 = AF_BRIDGE;
	ndm->ndm_pad1    = 0;
	ndm->ndm_pad2    = 0;
640
	ndm->ndm_flags	 = fdb->added_by_external_learn ? NTF_EXT_LEARNED : 0;
641
	ndm->ndm_type	 = 0;
642
	ndm->ndm_ifindex = fdb->dst ? fdb->dst->dev->ifindex : br->dev->ifindex;
643 644
	ndm->ndm_state   = fdb_to_nud(fdb);

D
David S. Miller 已提交
645 646
	if (nla_put(skb, NDA_LLADDR, ETH_ALEN, &fdb->addr))
		goto nla_put_failure;
647 648
	if (nla_put_u32(skb, NDA_MASTER, br->dev->ifindex))
		goto nla_put_failure;
649 650 651 652
	ci.ndm_used	 = jiffies_to_clock_t(now - fdb->used);
	ci.ndm_confirmed = 0;
	ci.ndm_updated	 = jiffies_to_clock_t(now - fdb->updated);
	ci.ndm_refcnt	 = 0;
D
David S. Miller 已提交
653 654
	if (nla_put(skb, NDA_CACHEINFO, sizeof(ci), &ci))
		goto nla_put_failure;
655

656
	if (fdb->vlan_id && nla_put(skb, NDA_VLAN, sizeof(u16), &fdb->vlan_id))
657 658
		goto nla_put_failure;

659 660
	nlmsg_end(skb, nlh);
	return 0;
661 662 663 664 665 666 667 668 669 670

nla_put_failure:
	nlmsg_cancel(skb, nlh);
	return -EMSGSIZE;
}

static inline size_t fdb_nlmsg_size(void)
{
	return NLMSG_ALIGN(sizeof(struct ndmsg))
		+ nla_total_size(ETH_ALEN) /* NDA_LLADDR */
671
		+ nla_total_size(sizeof(u32)) /* NDA_MASTER */
672
		+ nla_total_size(sizeof(u16)) /* NDA_VLAN */
673 674 675
		+ nla_total_size(sizeof(struct nda_cacheinfo));
}

676 677
static void fdb_notify(struct net_bridge *br,
		       const struct net_bridge_fdb_entry *fdb, int type)
678
{
679
	struct net *net = dev_net(br->dev);
680 681 682 683 684 685 686
	struct sk_buff *skb;
	int err = -ENOBUFS;

	skb = nlmsg_new(fdb_nlmsg_size(), GFP_ATOMIC);
	if (skb == NULL)
		goto errout;

687
	err = fdb_fill_info(skb, br, fdb, 0, 0, type, 0);
688 689 690 691 692 693 694 695 696
	if (err < 0) {
		/* -EMSGSIZE implies BUG in fdb_nlmsg_size() */
		WARN_ON(err == -EMSGSIZE);
		kfree_skb(skb);
		goto errout;
	}
	rtnl_notify(skb, net, 0, RTNLGRP_NEIGH, NULL, GFP_ATOMIC);
	return;
errout:
697
	rtnl_set_sk_err(net, RTNLGRP_NEIGH, err);
698 699 700
}

/* Dump information about entries, in response to GETNEIGH */
701 702 703
int br_fdb_dump(struct sk_buff *skb,
		struct netlink_callback *cb,
		struct net_device *dev,
704
		struct net_device *filter_dev,
705
		int idx)
706
{
707 708
	struct net_bridge *br = netdev_priv(dev);
	int i;
709

710 711
	if (!(dev->priv_flags & IFF_EBRIDGE))
		goto out;
712

713 714 715
	if (!filter_dev)
		idx = ndo_dflt_fdb_dump(skb, cb, dev, NULL, idx);

716 717
	for (i = 0; i < BR_HASH_SIZE; i++) {
		struct net_bridge_fdb_entry *f;
718

719
		hlist_for_each_entry_rcu(f, &br->hash[i], hlist) {
720 721 722
			if (idx < cb->args[0])
				goto skip;

723 724 725 726
			if (filter_dev &&
			    (!f->dst || f->dst->dev != filter_dev)) {
				if (filter_dev != dev)
					goto skip;
727
				/* !f->dst is a special case for bridge
728 729 730 731 732 733 734
				 * It means the MAC belongs to the bridge
				 * Therefore need a little more filtering
				 * we only want to dump the !f->dst case
				 */
				if (f->dst)
					goto skip;
			}
735 736
			if (!filter_dev && f->dst)
				goto skip;
737

738
			if (fdb_fill_info(skb, br, f,
739
					  NETLINK_CB(cb->skb).portid,
740 741 742 743
					  cb->nlh->nlmsg_seq,
					  RTM_NEWNEIGH,
					  NLM_F_MULTI) < 0)
				break;
744
skip:
745
			++idx;
746 747 748
		}
	}

749 750
out:
	return idx;
751
}
752

S
stephen hemminger 已提交
753
/* Update (create or replace) forwarding database entry */
754
static int fdb_add_entry(struct net_bridge_port *source, const __u8 *addr,
755
			 __u16 state, __u16 flags, __u16 vid)
756 757
{
	struct net_bridge *br = source->br;
758
	struct hlist_head *head = &br->hash[br_mac_hash(addr, vid)];
759
	struct net_bridge_fdb_entry *fdb;
760
	bool modified = false;
761

762 763 764 765 766 767
	/* If the port cannot learn allow only local and static entries */
	if (!(state & NUD_PERMANENT) && !(state & NUD_NOARP) &&
	    !(source->state == BR_STATE_LEARNING ||
	      source->state == BR_STATE_FORWARDING))
		return -EPERM;

768
	fdb = fdb_find(head, addr, vid);
769 770 771
	if (fdb == NULL) {
		if (!(flags & NLM_F_CREATE))
			return -ENOENT;
772

773
		fdb = fdb_create(head, source, addr, vid);
774 775
		if (!fdb)
			return -ENOMEM;
776 777

		modified = true;
778 779 780
	} else {
		if (flags & NLM_F_EXCL)
			return -EEXIST;
781 782 783 784 785

		if (fdb->dst != source) {
			fdb->dst = source;
			modified = true;
		}
S
stephen hemminger 已提交
786 787 788
	}

	if (fdb_to_nud(fdb) != state) {
789 790 791 792
		if (state & NUD_PERMANENT) {
			fdb->is_local = 1;
			if (!fdb->is_static) {
				fdb->is_static = 1;
793
				fdb_add_hw_addr(br, addr);
794 795 796 797 798
			}
		} else if (state & NUD_NOARP) {
			fdb->is_local = 0;
			if (!fdb->is_static) {
				fdb->is_static = 1;
799
				fdb_add_hw_addr(br, addr);
800 801
			}
		} else {
S
stephen hemminger 已提交
802
			fdb->is_local = 0;
803 804
			if (fdb->is_static) {
				fdb->is_static = 0;
805
				fdb_del_hw_addr(br, addr);
806 807
			}
		}
808

809 810
		modified = true;
	}
811
	fdb->added_by_user = 1;
812 813 814 815

	fdb->used = jiffies;
	if (modified) {
		fdb->updated = jiffies;
816
		fdb_notify(br, fdb, RTM_NEWNEIGH);
817
	}
818 819 820 821

	return 0;
}

822 823 824 825 826 827
static int __br_fdb_add(struct ndmsg *ndm, struct net_bridge_port *p,
	       const unsigned char *addr, u16 nlh_flags, u16 vid)
{
	int err = 0;

	if (ndm->ndm_flags & NTF_USE) {
828
		local_bh_disable();
829
		rcu_read_lock();
830
		br_fdb_update(p->br, p, addr, vid, true);
831
		rcu_read_unlock();
832
		local_bh_enable();
833 834 835 836 837 838 839 840 841 842
	} else {
		spin_lock_bh(&p->br->hash_lock);
		err = fdb_add_entry(p, addr, ndm->ndm_state,
				    nlh_flags, vid);
		spin_unlock_bh(&p->br->hash_lock);
	}

	return err;
}

843
/* Add new permanent fdb entry with RTM_NEWNEIGH */
844 845
int br_fdb_add(struct ndmsg *ndm, struct nlattr *tb[],
	       struct net_device *dev,
846
	       const unsigned char *addr, u16 vid, u16 nlh_flags)
847
{
848
	struct net_bridge_vlan_group *vg;
849
	struct net_bridge_port *p;
850
	struct net_bridge_vlan *v;
851
	int err = 0;
852

S
stephen hemminger 已提交
853 854 855 856 857
	if (!(ndm->ndm_state & (NUD_PERMANENT|NUD_NOARP|NUD_REACHABLE))) {
		pr_info("bridge: RTM_NEWNEIGH with invalid state %#x\n", ndm->ndm_state);
		return -EINVAL;
	}

858 859 860 861 862
	if (is_zero_ether_addr(addr)) {
		pr_info("bridge: RTM_NEWNEIGH with invalid ether address\n");
		return -EINVAL;
	}

863 864 865 866 867 868 869
	p = br_port_get_rtnl(dev);
	if (p == NULL) {
		pr_info("bridge: RTM_NEWNEIGH %s not a bridge port\n",
			dev->name);
		return -EINVAL;
	}

870
	vg = nbp_vlan_group(p);
871
	if (vid) {
872 873
		v = br_vlan_find(vg, vid);
		if (!v) {
874 875 876 877 878 879 880
			pr_info("bridge: RTM_NEWNEIGH with unconfigured "
				"vlan %d on port %s\n", vid, dev->name);
			return -EINVAL;
		}

		/* VID was specified, so use it. */
		err = __br_fdb_add(ndm, p, addr, nlh_flags, vid);
S
stephen hemminger 已提交
881
	} else {
882
		err = __br_fdb_add(ndm, p, addr, nlh_flags, 0);
883
		if (err || !vg || !vg->num_vlans)
884 885 886 887 888 889
			goto out;

		/* We have vlans configured on this port and user didn't
		 * specify a VLAN.  To be nice, add/update entry for every
		 * vlan on this port.
		 */
890 891
		list_for_each_entry(v, &vg->vlan_list, vlist) {
			err = __br_fdb_add(ndm, p, addr, nlh_flags, v->vid);
892 893 894
			if (err)
				goto out;
		}
S
stephen hemminger 已提交
895
	}
896

897
out:
898 899 900
	return err;
}

901 902
static int fdb_delete_by_addr_and_port(struct net_bridge_port *p,
				       const u8 *addr, u16 vlan)
903
{
904
	struct net_bridge *br = p->br;
905
	struct hlist_head *head = &br->hash[br_mac_hash(addr, vlan)];
906 907
	struct net_bridge_fdb_entry *fdb;

908
	fdb = fdb_find(head, addr, vlan);
909
	if (!fdb || fdb->dst != p)
910 911
		return -ENOENT;

912
	fdb_delete(br, fdb);
913 914 915
	return 0;
}

916 917 918 919 920 921
static int __br_fdb_delete(struct net_bridge_port *p,
			   const unsigned char *addr, u16 vid)
{
	int err;

	spin_lock_bh(&p->br->hash_lock);
922
	err = fdb_delete_by_addr_and_port(p, addr, vid);
923 924 925 926 927
	spin_unlock_bh(&p->br->hash_lock);

	return err;
}

928
/* Remove neighbor entry with RTM_DELNEIGH */
929 930
int br_fdb_delete(struct ndmsg *ndm, struct nlattr *tb[],
		  struct net_device *dev,
931
		  const unsigned char *addr, u16 vid)
932
{
933
	struct net_bridge_vlan_group *vg;
934
	struct net_bridge_port *p;
935
	struct net_bridge_vlan *v;
936
	int err;
937

938 939 940 941 942 943 944
	p = br_port_get_rtnl(dev);
	if (p == NULL) {
		pr_info("bridge: RTM_DELNEIGH %s not a bridge port\n",
			dev->name);
		return -EINVAL;
	}

945
	vg = nbp_vlan_group(p);
946
	if (vid) {
947 948
		v = br_vlan_find(vg, vid);
		if (!v) {
949 950 951 952
			pr_info("bridge: RTM_DELNEIGH with unconfigured "
				"vlan %d on port %s\n", vid, dev->name);
			return -EINVAL;
		}
953

954 955
		err = __br_fdb_delete(p, addr, vid);
	} else {
956 957
		err = -ENOENT;
		err &= __br_fdb_delete(p, addr, 0);
958
		if (!vg || !vg->num_vlans)
959 960
			goto out;

961 962
		list_for_each_entry(v, &vg->vlan_list, vlist)
			err &= __br_fdb_delete(p, addr, v->vid);
963 964
	}
out:
965 966
	return err;
}
967 968 969 970 971 972 973 974 975 976 977 978 979 980 981 982 983 984 985 986 987 988 989 990 991 992 993 994 995 996 997 998 999 1000 1001 1002 1003 1004 1005 1006 1007 1008 1009 1010 1011 1012 1013 1014 1015 1016 1017 1018 1019 1020 1021 1022

int br_fdb_sync_static(struct net_bridge *br, struct net_bridge_port *p)
{
	struct net_bridge_fdb_entry *fdb, *tmp;
	int i;
	int err;

	ASSERT_RTNL();

	for (i = 0; i < BR_HASH_SIZE; i++) {
		hlist_for_each_entry(fdb, &br->hash[i], hlist) {
			/* We only care for static entries */
			if (!fdb->is_static)
				continue;

			err = dev_uc_add(p->dev, fdb->addr.addr);
			if (err)
				goto rollback;
		}
	}
	return 0;

rollback:
	for (i = 0; i < BR_HASH_SIZE; i++) {
		hlist_for_each_entry(tmp, &br->hash[i], hlist) {
			/* If we reached the fdb that failed, we can stop */
			if (tmp == fdb)
				break;

			/* We only care for static entries */
			if (!tmp->is_static)
				continue;

			dev_uc_del(p->dev, tmp->addr.addr);
		}
	}
	return err;
}

void br_fdb_unsync_static(struct net_bridge *br, struct net_bridge_port *p)
{
	struct net_bridge_fdb_entry *fdb;
	int i;

	ASSERT_RTNL();

	for (i = 0; i < BR_HASH_SIZE; i++) {
		hlist_for_each_entry_rcu(fdb, &br->hash[i], hlist) {
			/* We only care for static entries */
			if (!fdb->is_static)
				continue;

			dev_uc_del(p->dev, fdb->addr.addr);
		}
	}
}
1023

1024
int br_fdb_external_learn_add(struct net_bridge *br, struct net_bridge_port *p,
1025 1026 1027 1028 1029 1030
			      const unsigned char *addr, u16 vid)
{
	struct hlist_head *head;
	struct net_bridge_fdb_entry *fdb;
	int err = 0;

1031
	ASSERT_RTNL();
1032 1033 1034 1035 1036 1037 1038 1039 1040 1041 1042 1043 1044 1045 1046 1047 1048 1049 1050 1051 1052 1053 1054 1055 1056 1057 1058 1059
	spin_lock_bh(&br->hash_lock);

	head = &br->hash[br_mac_hash(addr, vid)];
	fdb = fdb_find(head, addr, vid);
	if (!fdb) {
		fdb = fdb_create(head, p, addr, vid);
		if (!fdb) {
			err = -ENOMEM;
			goto err_unlock;
		}
		fdb->added_by_external_learn = 1;
		fdb_notify(br, fdb, RTM_NEWNEIGH);
	} else if (fdb->added_by_external_learn) {
		/* Refresh entry */
		fdb->updated = fdb->used = jiffies;
	} else if (!fdb->added_by_user) {
		/* Take over SW learned entry */
		fdb->added_by_external_learn = 1;
		fdb->updated = jiffies;
		fdb_notify(br, fdb, RTM_NEWNEIGH);
	}

err_unlock:
	spin_unlock_bh(&br->hash_lock);

	return err;
}

1060
int br_fdb_external_learn_del(struct net_bridge *br, struct net_bridge_port *p,
1061 1062 1063 1064 1065 1066
			      const unsigned char *addr, u16 vid)
{
	struct hlist_head *head;
	struct net_bridge_fdb_entry *fdb;
	int err = 0;

1067
	ASSERT_RTNL();
1068 1069 1070 1071 1072 1073 1074 1075 1076 1077 1078 1079 1080
	spin_lock_bh(&br->hash_lock);

	head = &br->hash[br_mac_hash(addr, vid)];
	fdb = fdb_find(head, addr, vid);
	if (fdb && fdb->added_by_external_learn)
		fdb_delete(br, fdb);
	else
		err = -ENOENT;

	spin_unlock_bh(&br->hash_lock);

	return err;
}