br_fdb.c 29.8 KB
Newer Older
1
// SPDX-License-Identifier: GPL-2.0-or-later
L
Linus Torvalds 已提交
2 3 4 5 6 7 8 9 10 11
/*
 *	Forwarding database
 *	Linux ethernet bridge
 *
 *	Authors:
 *	Lennert Buytenhek		<buytenh@gnu.org>
 */

#include <linux/kernel.h>
#include <linux/init.h>
12
#include <linux/rculist.h>
L
Linus Torvalds 已提交
13 14 15 16 17
#include <linux/spinlock.h>
#include <linux/times.h>
#include <linux/netdevice.h>
#include <linux/etherdevice.h>
#include <linux/jhash.h>
18
#include <linux/random.h>
19
#include <linux/slab.h>
A
Arun Sharma 已提交
20
#include <linux/atomic.h>
21
#include <asm/unaligned.h>
22
#include <linux/if_vlan.h>
23
#include <net/switchdev.h>
24
#include <trace/events/bridge.h>
L
Linus Torvalds 已提交
25 26
#include "br_private.h"

27 28 29 30 31 32 33
static const struct rhashtable_params br_fdb_rht_params = {
	.head_offset = offsetof(struct net_bridge_fdb_entry, rhnode),
	.key_offset = offsetof(struct net_bridge_fdb_entry, key),
	.key_len = sizeof(struct net_bridge_fdb_key),
	.automatic_shrinking = true,
};

34
static struct kmem_cache *br_fdb_cache __read_mostly;
L
Linus Torvalds 已提交
35
static int fdb_insert(struct net_bridge *br, struct net_bridge_port *source,
36
		      const unsigned char *addr, u16 vid);
37
static void fdb_notify(struct net_bridge *br,
38
		       const struct net_bridge_fdb_entry *, int, bool);
L
Linus Torvalds 已提交
39

40
int __init br_fdb_init(void)
L
Linus Torvalds 已提交
41 42 43 44
{
	br_fdb_cache = kmem_cache_create("bridge_fdb_cache",
					 sizeof(struct net_bridge_fdb_entry),
					 0,
45
					 SLAB_HWCACHE_ALIGN, NULL);
46 47 48 49
	if (!br_fdb_cache)
		return -ENOMEM;

	return 0;
L
Linus Torvalds 已提交
50 51
}

A
Andrew Morton 已提交
52
void br_fdb_fini(void)
L
Linus Torvalds 已提交
53 54 55 56
{
	kmem_cache_destroy(br_fdb_cache);
}

57 58 59 60 61 62 63 64 65
int br_fdb_hash_init(struct net_bridge *br)
{
	return rhashtable_init(&br->fdb_hash_tbl, &br_fdb_rht_params);
}

void br_fdb_hash_fini(struct net_bridge *br)
{
	rhashtable_destroy(&br->fdb_hash_tbl);
}
L
Linus Torvalds 已提交
66 67 68 69

/* if topology_changing then use forward_delay (default 15 sec)
 * otherwise keep longer (default 5 minutes)
 */
70
static inline unsigned long hold_time(const struct net_bridge *br)
L
Linus Torvalds 已提交
71 72 73 74
{
	return br->topology_change ? br->forward_delay : br->ageing_time;
}

75
static inline int has_expired(const struct net_bridge *br,
L
Linus Torvalds 已提交
76 77
				  const struct net_bridge_fdb_entry *fdb)
{
78
	return !test_bit(BR_FDB_STATIC, &fdb->flags) &&
79
	       !test_bit(BR_FDB_ADDED_BY_EXT_LEARN, &fdb->flags) &&
80
	       time_before_eq(fdb->updated + hold_time(br), jiffies);
L
Linus Torvalds 已提交
81 82
}

83 84 85 86 87 88 89
static void fdb_rcu_free(struct rcu_head *head)
{
	struct net_bridge_fdb_entry *ent
		= container_of(head, struct net_bridge_fdb_entry, rcu);
	kmem_cache_free(br_fdb_cache, ent);
}

90
static struct net_bridge_fdb_entry *fdb_find_rcu(struct rhashtable *tbl,
91 92 93
						 const unsigned char *addr,
						 __u16 vid)
{
94
	struct net_bridge_fdb_key key;
95

96 97
	WARN_ON_ONCE(!rcu_read_lock_held());

98 99
	key.vlan_id = vid;
	memcpy(key.addr.addr, addr, sizeof(key.addr.addr));
100

101
	return rhashtable_lookup(tbl, &key, br_fdb_rht_params);
102 103 104 105 106 107 108 109 110
}

/* requires bridge hash_lock */
static struct net_bridge_fdb_entry *br_fdb_find(struct net_bridge *br,
						const unsigned char *addr,
						__u16 vid)
{
	struct net_bridge_fdb_entry *fdb;

111
	lockdep_assert_held_once(&br->hash_lock);
112

113
	rcu_read_lock();
114
	fdb = fdb_find_rcu(&br->fdb_hash_tbl, addr, vid);
115 116 117 118 119
	rcu_read_unlock();

	return fdb;
}

120 121 122 123 124 125 126 127 128 129 130 131 132 133
struct net_device *br_fdb_find_port(const struct net_device *br_dev,
				    const unsigned char *addr,
				    __u16 vid)
{
	struct net_bridge_fdb_entry *f;
	struct net_device *dev = NULL;
	struct net_bridge *br;

	ASSERT_RTNL();

	if (!netif_is_bridge_master(br_dev))
		return NULL;

	br = netdev_priv(br_dev);
134 135
	rcu_read_lock();
	f = br_fdb_find_rcu(br, addr, vid);
136 137
	if (f && f->dst)
		dev = f->dst->dev;
138
	rcu_read_unlock();
139 140 141 142 143

	return dev;
}
EXPORT_SYMBOL_GPL(br_fdb_find_port);

144 145 146 147
struct net_bridge_fdb_entry *br_fdb_find_rcu(struct net_bridge *br,
					     const unsigned char *addr,
					     __u16 vid)
{
148
	return fdb_find_rcu(&br->fdb_hash_tbl, addr, vid);
149 150
}

151 152 153 154 155
/* When a static FDB entry is added, the mac address from the entry is
 * added to the bridge private HW address list and all required ports
 * are then updated with the new information.
 * Called under RTNL.
 */
156
static void fdb_add_hw_addr(struct net_bridge *br, const unsigned char *addr)
157 158
{
	int err;
159
	struct net_bridge_port *p;
160 161 162 163 164 165 166 167 168 169 170 171 172

	ASSERT_RTNL();

	list_for_each_entry(p, &br->port_list, list) {
		if (!br_promisc_port(p)) {
			err = dev_uc_add(p->dev, addr);
			if (err)
				goto undo;
		}
	}

	return;
undo:
173 174 175
	list_for_each_entry_continue_reverse(p, &br->port_list, list) {
		if (!br_promisc_port(p))
			dev_uc_del(p->dev, addr);
176 177 178 179 180 181 182 183
	}
}

/* When a static FDB entry is deleted, the HW address from that entry is
 * also removed from the bridge private HW address list and updates all
 * the ports with needed information.
 * Called under RTNL.
 */
184
static void fdb_del_hw_addr(struct net_bridge *br, const unsigned char *addr)
185 186 187 188 189 190 191 192 193 194 195
{
	struct net_bridge_port *p;

	ASSERT_RTNL();

	list_for_each_entry(p, &br->port_list, list) {
		if (!br_promisc_port(p))
			dev_uc_del(p->dev, addr);
	}
}

196 197
static void fdb_delete(struct net_bridge *br, struct net_bridge_fdb_entry *f,
		       bool swdev_notify)
L
Linus Torvalds 已提交
198
{
199 200
	trace_fdb_delete(br, f);

201
	if (test_bit(BR_FDB_STATIC, &f->flags))
202
		fdb_del_hw_addr(br, f->key.addr.addr);
203

204 205 206
	hlist_del_init_rcu(&f->fdb_node);
	rhashtable_remove_fast(&br->fdb_hash_tbl, &f->rhnode,
			       br_fdb_rht_params);
207
	fdb_notify(br, f, RTM_DELNEIGH, swdev_notify);
208
	call_rcu(&f->rcu, fdb_rcu_free);
L
Linus Torvalds 已提交
209 210
}

211 212 213 214 215
/* Delete a local entry if no other port had the same address. */
static void fdb_delete_local(struct net_bridge *br,
			     const struct net_bridge_port *p,
			     struct net_bridge_fdb_entry *f)
{
216
	const unsigned char *addr = f->key.addr.addr;
217 218
	struct net_bridge_vlan_group *vg;
	const struct net_bridge_vlan *v;
219
	struct net_bridge_port *op;
220
	u16 vid = f->key.vlan_id;
221 222 223

	/* Maybe another port has same hw addr? */
	list_for_each_entry(op, &br->port_list, list) {
224
		vg = nbp_vlan_group(op);
225
		if (op != p && ether_addr_equal(op->dev->dev_addr, addr) &&
226
		    (!vid || br_vlan_find(vg, vid))) {
227
			f->dst = op;
228
			clear_bit(BR_FDB_ADDED_BY_USER, &f->flags);
229 230 231 232
			return;
		}
	}

233 234
	vg = br_vlan_group(br);
	v = br_vlan_find(vg, vid);
235 236
	/* Maybe bridge device has same hw addr? */
	if (p && ether_addr_equal(br->dev->dev_addr, addr) &&
237
	    (!vid || (v && br_vlan_should_use(v)))) {
238
		f->dst = NULL;
239
		clear_bit(BR_FDB_ADDED_BY_USER, &f->flags);
240 241 242
		return;
	}

243
	fdb_delete(br, f, true);
244 245
}

246 247 248 249 250 251 252
void br_fdb_find_delete_local(struct net_bridge *br,
			      const struct net_bridge_port *p,
			      const unsigned char *addr, u16 vid)
{
	struct net_bridge_fdb_entry *f;

	spin_lock_bh(&br->hash_lock);
253
	f = br_fdb_find(br, addr, vid);
254
	if (f && test_bit(BR_FDB_LOCAL, &f->flags) &&
255
	    !test_bit(BR_FDB_ADDED_BY_USER, &f->flags) && f->dst == p)
256 257 258 259
		fdb_delete_local(br, p, f);
	spin_unlock_bh(&br->hash_lock);
}

L
Linus Torvalds 已提交
260 261
void br_fdb_changeaddr(struct net_bridge_port *p, const unsigned char *newaddr)
{
262
	struct net_bridge_vlan_group *vg;
263
	struct net_bridge_fdb_entry *f;
L
Linus Torvalds 已提交
264
	struct net_bridge *br = p->br;
265
	struct net_bridge_vlan *v;
266

L
Linus Torvalds 已提交
267
	spin_lock_bh(&br->hash_lock);
268
	vg = nbp_vlan_group(p);
269
	hlist_for_each_entry(f, &br->fdb_list, fdb_node) {
270
		if (f->dst == p && test_bit(BR_FDB_LOCAL, &f->flags) &&
271
		    !test_bit(BR_FDB_ADDED_BY_USER, &f->flags)) {
272 273 274 275 276 277 278 279 280
			/* delete old one */
			fdb_delete_local(br, p, f);

			/* if this port has no vlan information
			 * configured, we can safely be done at
			 * this point.
			 */
			if (!vg || !vg->num_vlans)
				goto insert;
L
Linus Torvalds 已提交
281 282 283
		}
	}

284 285 286 287
insert:
	/* insert new address,  may fail if invalid address or dup. */
	fdb_insert(br, p, newaddr, 0);

288
	if (!vg || !vg->num_vlans)
289 290 291 292 293 294
		goto done;

	/* Now add entries for every VLAN configured on the port.
	 * This function runs under RTNL so the bitmap will not change
	 * from under us.
	 */
295 296
	list_for_each_entry(v, &vg->vlan_list, vlist)
		fdb_insert(br, p, newaddr, v->vid);
297

298
done:
L
Linus Torvalds 已提交
299 300 301
	spin_unlock_bh(&br->hash_lock);
}

302 303
void br_fdb_change_mac_address(struct net_bridge *br, const u8 *newaddr)
{
304
	struct net_bridge_vlan_group *vg;
305
	struct net_bridge_fdb_entry *f;
306
	struct net_bridge_vlan *v;
307

308 309
	spin_lock_bh(&br->hash_lock);

310
	/* If old entry was unassociated with any port, then delete it. */
311
	f = br_fdb_find(br, br->dev->dev_addr, 0);
312
	if (f && test_bit(BR_FDB_LOCAL, &f->flags) &&
313
	    !f->dst && !test_bit(BR_FDB_ADDED_BY_USER, &f->flags))
314
		fdb_delete_local(br, NULL, f);
315

316
	fdb_insert(br, NULL, newaddr, 0);
317 318 319
	vg = br_vlan_group(br);
	if (!vg || !vg->num_vlans)
		goto out;
320 321 322 323
	/* Now remove and add entries for every VLAN configured on the
	 * bridge.  This function runs under RTNL so the bitmap will not
	 * change from under us.
	 */
324
	list_for_each_entry(v, &vg->vlan_list, vlist) {
325 326
		if (!br_vlan_should_use(v))
			continue;
327
		f = br_fdb_find(br, br->dev->dev_addr, v->vid);
328
		if (f && test_bit(BR_FDB_LOCAL, &f->flags) &&
329
		    !f->dst && !test_bit(BR_FDB_ADDED_BY_USER, &f->flags))
330
			fdb_delete_local(br, NULL, f);
331
		fdb_insert(br, NULL, newaddr, v->vid);
332
	}
333 334
out:
	spin_unlock_bh(&br->hash_lock);
335 336
}

337
void br_fdb_cleanup(struct work_struct *work)
L
Linus Torvalds 已提交
338
{
339 340
	struct net_bridge *br = container_of(work, struct net_bridge,
					     gc_work.work);
341
	struct net_bridge_fdb_entry *f = NULL;
L
Linus Torvalds 已提交
342
	unsigned long delay = hold_time(br);
343 344
	unsigned long work_delay = delay;
	unsigned long now = jiffies;
L
Linus Torvalds 已提交
345

346 347 348 349 350 351 352
	/* this part is tricky, in order to avoid blocking learning and
	 * consequently forwarding, we rely on rcu to delete objects with
	 * delayed freeing allowing us to continue traversing
	 */
	rcu_read_lock();
	hlist_for_each_entry_rcu(f, &br->fdb_list, fdb_node) {
		unsigned long this_timer;
L
Linus Torvalds 已提交
353

354
		if (test_bit(BR_FDB_STATIC, &f->flags) ||
355
		    test_bit(BR_FDB_ADDED_BY_EXT_LEARN, &f->flags))
356
			continue;
357 358 359 360 361 362
		this_timer = f->updated + delay;
		if (time_after(this_timer, now)) {
			work_delay = min(work_delay, this_timer - now);
		} else {
			spin_lock_bh(&br->hash_lock);
			if (!hlist_unhashed(&f->fdb_node))
363
				fdb_delete(br, f, true);
364
			spin_unlock_bh(&br->hash_lock);
L
Linus Torvalds 已提交
365 366
		}
	}
367
	rcu_read_unlock();
L
Linus Torvalds 已提交
368

369 370 371
	/* Cleanup minimum 10 milliseconds apart */
	work_delay = max_t(unsigned long, work_delay, msecs_to_jiffies(10));
	mod_delayed_work(system_long_wq, &br->gc_work, work_delay);
L
Linus Torvalds 已提交
372 373
}

374 375 376
/* Completely flush all dynamic entries in forwarding database.*/
void br_fdb_flush(struct net_bridge *br)
{
377 378
	struct net_bridge_fdb_entry *f;
	struct hlist_node *tmp;
379 380

	spin_lock_bh(&br->hash_lock);
381
	hlist_for_each_entry_safe(f, tmp, &br->fdb_list, fdb_node) {
382
		if (!test_bit(BR_FDB_STATIC, &f->flags))
383
			fdb_delete(br, f, true);
384 385 386
	}
	spin_unlock_bh(&br->hash_lock);
}
387

L
Lucas De Marchi 已提交
388
/* Flush all entries referring to a specific port.
389
 * if do_all is set also flush static entries
390
 * if vid is set delete all entries that match the vlan_id
391
 */
392 393
void br_fdb_delete_by_port(struct net_bridge *br,
			   const struct net_bridge_port *p,
394
			   u16 vid,
395
			   int do_all)
L
Linus Torvalds 已提交
396
{
397 398
	struct net_bridge_fdb_entry *f;
	struct hlist_node *tmp;
L
Linus Torvalds 已提交
399 400

	spin_lock_bh(&br->hash_lock);
401 402 403
	hlist_for_each_entry_safe(f, tmp, &br->fdb_list, fdb_node) {
		if (f->dst != p)
			continue;
404

405
		if (!do_all)
406 407
			if (test_bit(BR_FDB_STATIC, &f->flags) ||
			    (vid && f->key.vlan_id != vid))
L
Linus Torvalds 已提交
408 409
				continue;

410
		if (test_bit(BR_FDB_LOCAL, &f->flags))
411 412
			fdb_delete_local(br, p, f);
		else
413
			fdb_delete(br, f, true);
L
Linus Torvalds 已提交
414 415 416 417
	}
	spin_unlock_bh(&br->hash_lock);
}

I
Igor Maravić 已提交
418
#if IS_ENABLED(CONFIG_ATM_LANE)
419 420 421
/* Interface used by ATM LANE hook to test
 * if an addr is on some other bridge port */
int br_fdb_test_addr(struct net_device *dev, unsigned char *addr)
L
Linus Torvalds 已提交
422 423
{
	struct net_bridge_fdb_entry *fdb;
424
	struct net_bridge_port *port;
425 426
	int ret;

L
Linus Torvalds 已提交
427
	rcu_read_lock();
428 429 430 431
	port = br_port_get_rcu(dev);
	if (!port)
		ret = 0;
	else {
432
		fdb = br_fdb_find_rcu(port->br, addr, 0);
433
		ret = fdb && fdb->dst && fdb->dst->dev != dev &&
434 435
			fdb->dst->state == BR_STATE_FORWARDING;
	}
L
Linus Torvalds 已提交
436 437
	rcu_read_unlock();

438
	return ret;
L
Linus Torvalds 已提交
439
}
440
#endif /* CONFIG_ATM_LANE */
L
Linus Torvalds 已提交
441 442

/*
443
 * Fill buffer with forwarding table records in
L
Linus Torvalds 已提交
444 445 446 447 448 449
 * the API format.
 */
int br_fdb_fillbuf(struct net_bridge *br, void *buf,
		   unsigned long maxnum, unsigned long skip)
{
	struct net_bridge_fdb_entry *f;
450 451
	struct __fdb_entry *fe = buf;
	int num = 0;
L
Linus Torvalds 已提交
452 453 454 455

	memset(buf, 0, maxnum*sizeof(struct __fdb_entry));

	rcu_read_lock();
456 457 458
	hlist_for_each_entry_rcu(f, &br->fdb_list, fdb_node) {
		if (num >= maxnum)
			break;
L
Linus Torvalds 已提交
459

460 461
		if (has_expired(br, f))
			continue;
L
Linus Torvalds 已提交
462

463 464 465
		/* ignore pseudo entry for local MAC address */
		if (!f->dst)
			continue;
466

467 468 469 470
		if (skip) {
			--skip;
			continue;
		}
L
Linus Torvalds 已提交
471

472 473
		/* convert from internal format to API */
		memcpy(fe->mac_addr, f->key.addr.addr, ETH_ALEN);
474

475 476 477
		/* due to ABI compat need to split into hi/lo */
		fe->port_no = f->dst->port_no;
		fe->port_hi = f->dst->port_no >> 8;
478

479
		fe->is_local = test_bit(BR_FDB_LOCAL, &f->flags);
480
		if (!test_bit(BR_FDB_STATIC, &f->flags))
481 482 483
			fe->ageing_timer_value = jiffies_delta_to_clock_t(jiffies - f->updated);
		++fe;
		++num;
L
Linus Torvalds 已提交
484 485 486 487 488 489
	}
	rcu_read_unlock();

	return num;
}

490
static struct net_bridge_fdb_entry *fdb_create(struct net_bridge *br,
L
Linus Torvalds 已提交
491
					       struct net_bridge_port *source,
492
					       const unsigned char *addr,
493 494 495
					       __u16 vid,
					       unsigned char is_local,
					       unsigned char is_static)
L
Linus Torvalds 已提交
496 497 498 499 500
{
	struct net_bridge_fdb_entry *fdb;

	fdb = kmem_cache_alloc(br_fdb_cache, GFP_ATOMIC);
	if (fdb) {
501
		memcpy(fdb->key.addr.addr, addr, ETH_ALEN);
L
Linus Torvalds 已提交
502
		fdb->dst = source;
503
		fdb->key.vlan_id = vid;
504 505 506
		fdb->flags = 0;
		if (is_local)
			set_bit(BR_FDB_LOCAL, &fdb->flags);
507 508
		if (is_static)
			set_bit(BR_FDB_STATIC, &fdb->flags);
509
		fdb->updated = fdb->used = jiffies;
510 511 512 513 514 515 516 517
		if (rhashtable_lookup_insert_fast(&br->fdb_hash_tbl,
						  &fdb->rhnode,
						  br_fdb_rht_params)) {
			kmem_cache_free(br_fdb_cache, fdb);
			fdb = NULL;
		} else {
			hlist_add_head_rcu(&fdb->fdb_node, &br->fdb_list);
		}
L
Linus Torvalds 已提交
518 519 520 521 522
	}
	return fdb;
}

static int fdb_insert(struct net_bridge *br, struct net_bridge_port *source,
523
		  const unsigned char *addr, u16 vid)
L
Linus Torvalds 已提交
524 525 526 527 528 529
{
	struct net_bridge_fdb_entry *fdb;

	if (!is_valid_ether_addr(addr))
		return -EINVAL;

530
	fdb = br_fdb_find(br, addr, vid);
L
Linus Torvalds 已提交
531
	if (fdb) {
532
		/* it is okay to have multiple ports with same
L
Linus Torvalds 已提交
533 534
		 * address, just use the first one.
		 */
535
		if (test_bit(BR_FDB_LOCAL, &fdb->flags))
L
Linus Torvalds 已提交
536
			return 0;
537 538
		br_warn(br, "adding interface %s with same address as a received packet (addr:%pM, vlan:%u)\n",
		       source ? source->dev->name : br->dev->name, addr, vid);
539
		fdb_delete(br, fdb, true);
540
	}
L
Linus Torvalds 已提交
541

542
	fdb = fdb_create(br, source, addr, vid, 1, 1);
543
	if (!fdb)
L
Linus Torvalds 已提交
544 545
		return -ENOMEM;

546
	fdb_add_hw_addr(br, addr);
547
	fdb_notify(br, fdb, RTM_NEWNEIGH, true);
L
Linus Torvalds 已提交
548 549 550
	return 0;
}

551
/* Add entry for local address of interface */
L
Linus Torvalds 已提交
552
int br_fdb_insert(struct net_bridge *br, struct net_bridge_port *source,
553
		  const unsigned char *addr, u16 vid)
L
Linus Torvalds 已提交
554 555 556 557
{
	int ret;

	spin_lock_bh(&br->hash_lock);
558
	ret = fdb_insert(br, source, addr, vid);
L
Linus Torvalds 已提交
559 560 561 562 563
	spin_unlock_bh(&br->hash_lock);
	return ret;
}

void br_fdb_update(struct net_bridge *br, struct net_bridge_port *source,
564
		   const unsigned char *addr, u16 vid, bool added_by_user)
L
Linus Torvalds 已提交
565 566
{
	struct net_bridge_fdb_entry *fdb;
567
	bool fdb_modified = false;
L
Linus Torvalds 已提交
568 569 570 571 572

	/* some users want to always flood. */
	if (hold_time(br) == 0)
		return;

573 574 575 576 577
	/* ignore packets unless we are using this port */
	if (!(source->state == BR_STATE_LEARNING ||
	      source->state == BR_STATE_FORWARDING))
		return;

578
	fdb = fdb_find_rcu(&br->fdb_hash_tbl, addr, vid);
L
Linus Torvalds 已提交
579 580
	if (likely(fdb)) {
		/* attempt to update an entry for a local interface */
581
		if (unlikely(test_bit(BR_FDB_LOCAL, &fdb->flags))) {
582
			if (net_ratelimit())
583 584
				br_warn(br, "received packet on %s with own address as source address (addr:%pM, vlan:%u)\n",
					source->dev->name, addr, vid);
L
Linus Torvalds 已提交
585
		} else {
586 587
			unsigned long now = jiffies;

L
Linus Torvalds 已提交
588
			/* fastpath: update of existing entry */
589 590
			if (unlikely(source != fdb->dst &&
				     !test_bit(BR_FDB_STICKY, &fdb->flags))) {
591 592
				fdb->dst = source;
				fdb_modified = true;
593
				/* Take over HW learned entry */
594 595
				test_and_clear_bit(BR_FDB_ADDED_BY_EXT_LEARN,
						   &fdb->flags);
596
			}
597 598
			if (now != fdb->updated)
				fdb->updated = now;
599
			if (unlikely(added_by_user))
600
				set_bit(BR_FDB_ADDED_BY_USER, &fdb->flags);
601 602
			if (unlikely(fdb_modified)) {
				trace_br_fdb_update(br, source, addr, vid, added_by_user);
603
				fdb_notify(br, fdb, RTM_NEWNEIGH, true);
604
			}
L
Linus Torvalds 已提交
605 606
		}
	} else {
607
		spin_lock(&br->hash_lock);
608 609 610
		fdb = fdb_create(br, source, addr, vid, 0, 0);
		if (fdb) {
			if (unlikely(added_by_user))
611
				set_bit(BR_FDB_ADDED_BY_USER, &fdb->flags);
612 613
			trace_br_fdb_update(br, source, addr, vid,
					    added_by_user);
614
			fdb_notify(br, fdb, RTM_NEWNEIGH, true);
S
stephen hemminger 已提交
615
		}
L
Linus Torvalds 已提交
616 617 618
		/* else  we lose race and someone else inserts
		 * it first, don't bother updating
		 */
619
		spin_unlock(&br->hash_lock);
L
Linus Torvalds 已提交
620 621
	}
}
622

623 624
static int fdb_to_nud(const struct net_bridge *br,
		      const struct net_bridge_fdb_entry *fdb)
625
{
626
	if (test_bit(BR_FDB_LOCAL, &fdb->flags))
627
		return NUD_PERMANENT;
628
	else if (test_bit(BR_FDB_STATIC, &fdb->flags))
629
		return NUD_NOARP;
630
	else if (has_expired(br, fdb))
631 632 633 634 635
		return NUD_STALE;
	else
		return NUD_REACHABLE;
}

636
static int fdb_fill_info(struct sk_buff *skb, const struct net_bridge *br,
637
			 const struct net_bridge_fdb_entry *fdb,
638
			 u32 portid, u32 seq, int type, unsigned int flags)
639 640 641 642 643 644
{
	unsigned long now = jiffies;
	struct nda_cacheinfo ci;
	struct nlmsghdr *nlh;
	struct ndmsg *ndm;

645
	nlh = nlmsg_put(skb, portid, seq, type, sizeof(*ndm), flags);
646 647 648 649 650 651 652
	if (nlh == NULL)
		return -EMSGSIZE;

	ndm = nlmsg_data(nlh);
	ndm->ndm_family	 = AF_BRIDGE;
	ndm->ndm_pad1    = 0;
	ndm->ndm_pad2    = 0;
653
	ndm->ndm_flags	 = 0;
654
	ndm->ndm_type	 = 0;
655
	ndm->ndm_ifindex = fdb->dst ? fdb->dst->dev->ifindex : br->dev->ifindex;
656
	ndm->ndm_state   = fdb_to_nud(br, fdb);
657

658
	if (test_bit(BR_FDB_OFFLOADED, &fdb->flags))
659
		ndm->ndm_flags |= NTF_OFFLOADED;
660
	if (test_bit(BR_FDB_ADDED_BY_EXT_LEARN, &fdb->flags))
661
		ndm->ndm_flags |= NTF_EXT_LEARNED;
662
	if (test_bit(BR_FDB_STICKY, &fdb->flags))
663
		ndm->ndm_flags |= NTF_STICKY;
664

665
	if (nla_put(skb, NDA_LLADDR, ETH_ALEN, &fdb->key.addr))
D
David S. Miller 已提交
666
		goto nla_put_failure;
667 668
	if (nla_put_u32(skb, NDA_MASTER, br->dev->ifindex))
		goto nla_put_failure;
669 670 671 672
	ci.ndm_used	 = jiffies_to_clock_t(now - fdb->used);
	ci.ndm_confirmed = 0;
	ci.ndm_updated	 = jiffies_to_clock_t(now - fdb->updated);
	ci.ndm_refcnt	 = 0;
D
David S. Miller 已提交
673 674
	if (nla_put(skb, NDA_CACHEINFO, sizeof(ci), &ci))
		goto nla_put_failure;
675

676 677
	if (fdb->key.vlan_id && nla_put(skb, NDA_VLAN, sizeof(u16),
					&fdb->key.vlan_id))
678 679
		goto nla_put_failure;

680 681
	nlmsg_end(skb, nlh);
	return 0;
682 683 684 685 686 687 688 689 690 691

nla_put_failure:
	nlmsg_cancel(skb, nlh);
	return -EMSGSIZE;
}

static inline size_t fdb_nlmsg_size(void)
{
	return NLMSG_ALIGN(sizeof(struct ndmsg))
		+ nla_total_size(ETH_ALEN) /* NDA_LLADDR */
692
		+ nla_total_size(sizeof(u32)) /* NDA_MASTER */
693
		+ nla_total_size(sizeof(u16)) /* NDA_VLAN */
694 695 696
		+ nla_total_size(sizeof(struct nda_cacheinfo));
}

697
static void fdb_notify(struct net_bridge *br,
698 699
		       const struct net_bridge_fdb_entry *fdb, int type,
		       bool swdev_notify)
700
{
701
	struct net *net = dev_net(br->dev);
702 703 704
	struct sk_buff *skb;
	int err = -ENOBUFS;

705 706
	if (swdev_notify)
		br_switchdev_fdb_notify(fdb, type);
707

708 709 710 711
	skb = nlmsg_new(fdb_nlmsg_size(), GFP_ATOMIC);
	if (skb == NULL)
		goto errout;

712
	err = fdb_fill_info(skb, br, fdb, 0, 0, type, 0);
713 714 715 716 717 718 719 720 721
	if (err < 0) {
		/* -EMSGSIZE implies BUG in fdb_nlmsg_size() */
		WARN_ON(err == -EMSGSIZE);
		kfree_skb(skb);
		goto errout;
	}
	rtnl_notify(skb, net, 0, RTNLGRP_NEIGH, NULL, GFP_ATOMIC);
	return;
errout:
722
	rtnl_set_sk_err(net, RTNLGRP_NEIGH, err);
723 724 725
}

/* Dump information about entries, in response to GETNEIGH */
726 727 728
int br_fdb_dump(struct sk_buff *skb,
		struct netlink_callback *cb,
		struct net_device *dev,
729
		struct net_device *filter_dev,
730
		int *idx)
731
{
732
	struct net_bridge *br = netdev_priv(dev);
733
	struct net_bridge_fdb_entry *f;
734
	int err = 0;
735

736
	if (!(dev->priv_flags & IFF_EBRIDGE))
737
		return err;
738

739 740 741
	if (!filter_dev) {
		err = ndo_dflt_fdb_dump(skb, cb, dev, NULL, idx);
		if (err < 0)
742
			return err;
743
	}
744

745 746 747 748 749 750
	rcu_read_lock();
	hlist_for_each_entry_rcu(f, &br->fdb_list, fdb_node) {
		if (*idx < cb->args[2])
			goto skip;
		if (filter_dev && (!f->dst || f->dst->dev != filter_dev)) {
			if (filter_dev != dev)
751
				goto skip;
752 753 754 755 756 757
			/* !f->dst is a special case for bridge
			 * It means the MAC belongs to the bridge
			 * Therefore need a little more filtering
			 * we only want to dump the !f->dst case
			 */
			if (f->dst)
758
				goto skip;
759
		}
760 761 762 763 764 765 766 767 768 769 770 771
		if (!filter_dev && f->dst)
			goto skip;

		err = fdb_fill_info(skb, br, f,
				    NETLINK_CB(cb->skb).portid,
				    cb->nlh->nlmsg_seq,
				    RTM_NEWNEIGH,
				    NLM_F_MULTI);
		if (err < 0)
			break;
skip:
		*idx += 1;
772
	}
773
	rcu_read_unlock();
774

775
	return err;
776
}
777

R
Roopa Prabhu 已提交
778 779 780 781 782 783 784 785 786 787 788 789 790 791 792 793 794 795 796 797 798 799 800 801 802 803
int br_fdb_get(struct sk_buff *skb,
	       struct nlattr *tb[],
	       struct net_device *dev,
	       const unsigned char *addr,
	       u16 vid, u32 portid, u32 seq,
	       struct netlink_ext_ack *extack)
{
	struct net_bridge *br = netdev_priv(dev);
	struct net_bridge_fdb_entry *f;
	int err = 0;

	rcu_read_lock();
	f = br_fdb_find_rcu(br, addr, vid);
	if (!f) {
		NL_SET_ERR_MSG(extack, "Fdb entry not found");
		err = -ENOENT;
		goto errout;
	}

	err = fdb_fill_info(skb, br, f, portid, seq,
			    RTM_NEWNEIGH, 0);
errout:
	rcu_read_unlock();
	return err;
}

S
stephen hemminger 已提交
804
/* Update (create or replace) forwarding database entry */
805
static int fdb_add_entry(struct net_bridge *br, struct net_bridge_port *source,
806 807
			 const u8 *addr, u16 state, u16 flags, u16 vid,
			 u8 ndm_flags)
808
{
809
	bool is_sticky = !!(ndm_flags & NTF_STICKY);
810
	struct net_bridge_fdb_entry *fdb;
811
	bool modified = false;
812

813
	/* If the port cannot learn allow only local and static entries */
814
	if (source && !(state & NUD_PERMANENT) && !(state & NUD_NOARP) &&
815 816 817 818
	    !(source->state == BR_STATE_LEARNING ||
	      source->state == BR_STATE_FORWARDING))
		return -EPERM;

819 820 821 822 823 824
	if (!source && !(state & NUD_PERMANENT)) {
		pr_info("bridge: RTM_NEWNEIGH %s without NUD_PERMANENT\n",
			br->dev->name);
		return -EINVAL;
	}

825 826 827
	if (is_sticky && (state & NUD_PERMANENT))
		return -EINVAL;

828
	fdb = br_fdb_find(br, addr, vid);
829 830 831
	if (fdb == NULL) {
		if (!(flags & NLM_F_CREATE))
			return -ENOENT;
832

833
		fdb = fdb_create(br, source, addr, vid, 0, 0);
834 835
		if (!fdb)
			return -ENOMEM;
836 837

		modified = true;
838 839 840
	} else {
		if (flags & NLM_F_EXCL)
			return -EEXIST;
841 842 843 844 845

		if (fdb->dst != source) {
			fdb->dst = source;
			modified = true;
		}
S
stephen hemminger 已提交
846 847
	}

848
	if (fdb_to_nud(br, fdb) != state) {
849
		if (state & NUD_PERMANENT) {
850
			set_bit(BR_FDB_LOCAL, &fdb->flags);
851
			if (!test_and_set_bit(BR_FDB_STATIC, &fdb->flags))
852
				fdb_add_hw_addr(br, addr);
853
		} else if (state & NUD_NOARP) {
854
			clear_bit(BR_FDB_LOCAL, &fdb->flags);
855
			if (!test_and_set_bit(BR_FDB_STATIC, &fdb->flags))
856
				fdb_add_hw_addr(br, addr);
857
		} else {
858
			clear_bit(BR_FDB_LOCAL, &fdb->flags);
859
			if (test_and_clear_bit(BR_FDB_STATIC, &fdb->flags))
860
				fdb_del_hw_addr(br, addr);
861
		}
862

863 864
		modified = true;
	}
865

866 867
	if (is_sticky != test_bit(BR_FDB_STICKY, &fdb->flags)) {
		change_bit(BR_FDB_STICKY, &fdb->flags);
868 869 870
		modified = true;
	}

871
	set_bit(BR_FDB_ADDED_BY_USER, &fdb->flags);
872 873 874 875

	fdb->used = jiffies;
	if (modified) {
		fdb->updated = jiffies;
876
		fdb_notify(br, fdb, RTM_NEWNEIGH, true);
877
	}
878 879 880 881

	return 0;
}

882 883 884
static int __br_fdb_add(struct ndmsg *ndm, struct net_bridge *br,
			struct net_bridge_port *p, const unsigned char *addr,
			u16 nlh_flags, u16 vid)
885 886 887 888
{
	int err = 0;

	if (ndm->ndm_flags & NTF_USE) {
889 890 891 892 893
		if (!p) {
			pr_info("bridge: RTM_NEWNEIGH %s with NTF_USE is not supported\n",
				br->dev->name);
			return -EINVAL;
		}
894
		local_bh_disable();
895
		rcu_read_lock();
896
		br_fdb_update(br, p, addr, vid, true);
897
		rcu_read_unlock();
898
		local_bh_enable();
899
	} else if (ndm->ndm_flags & NTF_EXT_LEARNED) {
900
		err = br_fdb_external_learn_add(br, p, addr, vid, true);
901
	} else {
902 903
		spin_lock_bh(&br->hash_lock);
		err = fdb_add_entry(br, p, addr, ndm->ndm_state,
904
				    nlh_flags, vid, ndm->ndm_flags);
905
		spin_unlock_bh(&br->hash_lock);
906 907 908 909 910
	}

	return err;
}

911
/* Add new permanent fdb entry with RTM_NEWNEIGH */
912 913
int br_fdb_add(struct ndmsg *ndm, struct nlattr *tb[],
	       struct net_device *dev,
914 915
	       const unsigned char *addr, u16 vid, u16 nlh_flags,
	       struct netlink_ext_ack *extack)
916
{
917
	struct net_bridge_vlan_group *vg;
918
	struct net_bridge_port *p = NULL;
919
	struct net_bridge_vlan *v;
920
	struct net_bridge *br = NULL;
921
	int err = 0;
922

923 924
	trace_br_fdb_add(ndm, dev, addr, vid, nlh_flags);

S
stephen hemminger 已提交
925 926 927 928 929
	if (!(ndm->ndm_state & (NUD_PERMANENT|NUD_NOARP|NUD_REACHABLE))) {
		pr_info("bridge: RTM_NEWNEIGH with invalid state %#x\n", ndm->ndm_state);
		return -EINVAL;
	}

930 931 932 933 934
	if (is_zero_ether_addr(addr)) {
		pr_info("bridge: RTM_NEWNEIGH with invalid ether address\n");
		return -EINVAL;
	}

935 936 937 938 939 940 941 942 943 944
	if (dev->priv_flags & IFF_EBRIDGE) {
		br = netdev_priv(dev);
		vg = br_vlan_group(br);
	} else {
		p = br_port_get_rtnl(dev);
		if (!p) {
			pr_info("bridge: RTM_NEWNEIGH %s not a bridge port\n",
				dev->name);
			return -EINVAL;
		}
945
		br = p->br;
946
		vg = nbp_vlan_group(p);
947 948
	}

949
	if (vid) {
950
		v = br_vlan_find(vg, vid);
951 952
		if (!v || !br_vlan_should_use(v)) {
			pr_info("bridge: RTM_NEWNEIGH with unconfigured vlan %d on %s\n", vid, dev->name);
953 954 955 956
			return -EINVAL;
		}

		/* VID was specified, so use it. */
957
		err = __br_fdb_add(ndm, br, p, addr, nlh_flags, vid);
S
stephen hemminger 已提交
958
	} else {
959
		err = __br_fdb_add(ndm, br, p, addr, nlh_flags, 0);
960
		if (err || !vg || !vg->num_vlans)
961 962 963 964 965 966
			goto out;

		/* We have vlans configured on this port and user didn't
		 * specify a VLAN.  To be nice, add/update entry for every
		 * vlan on this port.
		 */
967
		list_for_each_entry(v, &vg->vlan_list, vlist) {
968 969
			if (!br_vlan_should_use(v))
				continue;
970
			err = __br_fdb_add(ndm, br, p, addr, nlh_flags, v->vid);
971 972 973
			if (err)
				goto out;
		}
S
stephen hemminger 已提交
974
	}
975

976
out:
977 978 979
	return err;
}

980 981
static int fdb_delete_by_addr_and_port(struct net_bridge *br,
				       const struct net_bridge_port *p,
982
				       const u8 *addr, u16 vlan)
983 984 985
{
	struct net_bridge_fdb_entry *fdb;

986
	fdb = br_fdb_find(br, addr, vlan);
987
	if (!fdb || fdb->dst != p)
988 989
		return -ENOENT;

990
	fdb_delete(br, fdb, true);
991

992 993 994
	return 0;
}

995 996
static int __br_fdb_delete(struct net_bridge *br,
			   const struct net_bridge_port *p,
997 998 999 1000
			   const unsigned char *addr, u16 vid)
{
	int err;

1001 1002 1003
	spin_lock_bh(&br->hash_lock);
	err = fdb_delete_by_addr_and_port(br, p, addr, vid);
	spin_unlock_bh(&br->hash_lock);
1004 1005 1006 1007

	return err;
}

1008
/* Remove neighbor entry with RTM_DELNEIGH */
1009 1010
int br_fdb_delete(struct ndmsg *ndm, struct nlattr *tb[],
		  struct net_device *dev,
1011
		  const unsigned char *addr, u16 vid)
1012
{
1013
	struct net_bridge_vlan_group *vg;
1014
	struct net_bridge_port *p = NULL;
1015
	struct net_bridge_vlan *v;
1016
	struct net_bridge *br;
1017
	int err;
1018

1019 1020 1021 1022 1023 1024 1025 1026 1027 1028 1029
	if (dev->priv_flags & IFF_EBRIDGE) {
		br = netdev_priv(dev);
		vg = br_vlan_group(br);
	} else {
		p = br_port_get_rtnl(dev);
		if (!p) {
			pr_info("bridge: RTM_DELNEIGH %s not a bridge port\n",
				dev->name);
			return -EINVAL;
		}
		vg = nbp_vlan_group(p);
1030
		br = p->br;
1031 1032
	}

1033
	if (vid) {
1034 1035
		v = br_vlan_find(vg, vid);
		if (!v) {
1036
			pr_info("bridge: RTM_DELNEIGH with unconfigured vlan %d on %s\n", vid, dev->name);
1037 1038
			return -EINVAL;
		}
1039

1040
		err = __br_fdb_delete(br, p, addr, vid);
1041
	} else {
1042
		err = -ENOENT;
1043
		err &= __br_fdb_delete(br, p, addr, 0);
1044
		if (!vg || !vg->num_vlans)
1045
			return err;
1046

1047 1048 1049
		list_for_each_entry(v, &vg->vlan_list, vlist) {
			if (!br_vlan_should_use(v))
				continue;
1050
			err &= __br_fdb_delete(br, p, addr, v->vid);
1051
		}
1052
	}
1053

1054 1055
	return err;
}
1056 1057 1058

int br_fdb_sync_static(struct net_bridge *br, struct net_bridge_port *p)
{
1059
	struct net_bridge_fdb_entry *f, *tmp;
1060
	int err = 0;
1061 1062 1063

	ASSERT_RTNL();

1064 1065 1066 1067
	/* the key here is that static entries change only under rtnl */
	rcu_read_lock();
	hlist_for_each_entry_rcu(f, &br->fdb_list, fdb_node) {
		/* We only care for static entries */
1068
		if (!test_bit(BR_FDB_STATIC, &f->flags))
1069 1070 1071 1072
			continue;
		err = dev_uc_add(p->dev, f->key.addr.addr);
		if (err)
			goto rollback;
1073
	}
1074 1075
done:
	rcu_read_unlock();
1076

1077
	return err;
1078

1079 1080 1081
rollback:
	hlist_for_each_entry_rcu(tmp, &br->fdb_list, fdb_node) {
		/* We only care for static entries */
1082
		if (!test_bit(BR_FDB_STATIC, &tmp->flags))
1083 1084 1085 1086
			continue;
		if (tmp == f)
			break;
		dev_uc_del(p->dev, tmp->key.addr.addr);
1087
	}
1088 1089

	goto done;
1090 1091 1092 1093
}

void br_fdb_unsync_static(struct net_bridge *br, struct net_bridge_port *p)
{
1094
	struct net_bridge_fdb_entry *f;
1095 1096 1097

	ASSERT_RTNL();

1098 1099 1100
	rcu_read_lock();
	hlist_for_each_entry_rcu(f, &br->fdb_list, fdb_node) {
		/* We only care for static entries */
1101
		if (!test_bit(BR_FDB_STATIC, &f->flags))
1102
			continue;
1103

1104
		dev_uc_del(p->dev, f->key.addr.addr);
1105
	}
1106
	rcu_read_unlock();
1107
}
1108

1109
int br_fdb_external_learn_add(struct net_bridge *br, struct net_bridge_port *p,
1110 1111
			      const unsigned char *addr, u16 vid,
			      bool swdev_notify)
1112 1113
{
	struct net_bridge_fdb_entry *fdb;
1114
	bool modified = false;
1115 1116
	int err = 0;

1117 1118
	trace_br_fdb_external_learn_add(br, p, addr, vid);

1119 1120
	spin_lock_bh(&br->hash_lock);

1121
	fdb = br_fdb_find(br, addr, vid);
1122
	if (!fdb) {
1123
		fdb = fdb_create(br, p, addr, vid, 0, 0);
1124 1125 1126 1127
		if (!fdb) {
			err = -ENOMEM;
			goto err_unlock;
		}
1128
		if (swdev_notify)
1129
			set_bit(BR_FDB_ADDED_BY_USER, &fdb->flags);
1130
		set_bit(BR_FDB_ADDED_BY_EXT_LEARN, &fdb->flags);
1131
		fdb_notify(br, fdb, RTM_NEWNEIGH, swdev_notify);
1132
	} else {
1133
		fdb->updated = jiffies;
1134 1135 1136 1137 1138 1139

		if (fdb->dst != p) {
			fdb->dst = p;
			modified = true;
		}

1140
		if (test_bit(BR_FDB_ADDED_BY_EXT_LEARN, &fdb->flags)) {
1141 1142
			/* Refresh entry */
			fdb->used = jiffies;
1143
		} else if (!test_bit(BR_FDB_ADDED_BY_USER, &fdb->flags)) {
1144
			/* Take over SW learned entry */
1145
			set_bit(BR_FDB_ADDED_BY_EXT_LEARN, &fdb->flags);
1146 1147 1148
			modified = true;
		}

1149
		if (swdev_notify)
1150
			set_bit(BR_FDB_ADDED_BY_USER, &fdb->flags);
1151

1152
		if (modified)
1153
			fdb_notify(br, fdb, RTM_NEWNEIGH, swdev_notify);
1154 1155 1156 1157 1158 1159 1160 1161
	}

err_unlock:
	spin_unlock_bh(&br->hash_lock);

	return err;
}

1162
int br_fdb_external_learn_del(struct net_bridge *br, struct net_bridge_port *p,
1163 1164
			      const unsigned char *addr, u16 vid,
			      bool swdev_notify)
1165 1166 1167 1168 1169 1170
{
	struct net_bridge_fdb_entry *fdb;
	int err = 0;

	spin_lock_bh(&br->hash_lock);

1171
	fdb = br_fdb_find(br, addr, vid);
1172
	if (fdb && test_bit(BR_FDB_ADDED_BY_EXT_LEARN, &fdb->flags))
1173
		fdb_delete(br, fdb, swdev_notify);
1174 1175 1176 1177 1178 1179 1180
	else
		err = -ENOENT;

	spin_unlock_bh(&br->hash_lock);

	return err;
}
1181 1182

void br_fdb_offloaded_set(struct net_bridge *br, struct net_bridge_port *p,
1183
			  const unsigned char *addr, u16 vid, bool offloaded)
1184 1185 1186 1187 1188 1189
{
	struct net_bridge_fdb_entry *fdb;

	spin_lock_bh(&br->hash_lock);

	fdb = br_fdb_find(br, addr, vid);
1190 1191
	if (fdb && offloaded != test_bit(BR_FDB_OFFLOADED, &fdb->flags))
		change_bit(BR_FDB_OFFLOADED, &fdb->flags);
1192 1193 1194

	spin_unlock_bh(&br->hash_lock);
}
P
Petr Machata 已提交
1195 1196 1197 1198 1199 1200 1201 1202 1203 1204 1205 1206 1207 1208 1209

void br_fdb_clear_offload(const struct net_device *dev, u16 vid)
{
	struct net_bridge_fdb_entry *f;
	struct net_bridge_port *p;

	ASSERT_RTNL();

	p = br_port_get_rtnl(dev);
	if (!p)
		return;

	spin_lock_bh(&p->br->hash_lock);
	hlist_for_each_entry(f, &p->br->fdb_list, fdb_node) {
		if (f->dst == p && f->key.vlan_id == vid)
1210
			clear_bit(BR_FDB_OFFLOADED, &f->flags);
P
Petr Machata 已提交
1211 1212 1213 1214
	}
	spin_unlock_bh(&p->br->hash_lock);
}
EXPORT_SYMBOL_GPL(br_fdb_clear_offload);