br_fdb.c 9.8 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
/*
 *	Forwarding database
 *	Linux ethernet bridge
 *
 *	Authors:
 *	Lennert Buytenhek		<buytenh@gnu.org>
 *
 *	This program is free software; you can redistribute it and/or
 *	modify it under the terms of the GNU General Public License
 *	as published by the Free Software Foundation; either version
 *	2 of the License, or (at your option) any later version.
 */

#include <linux/kernel.h>
#include <linux/init.h>
16
#include <linux/rculist.h>
L
Linus Torvalds 已提交
17 18 19 20 21
#include <linux/spinlock.h>
#include <linux/times.h>
#include <linux/netdevice.h>
#include <linux/etherdevice.h>
#include <linux/jhash.h>
22
#include <linux/random.h>
23
#include <linux/slab.h>
L
Linus Torvalds 已提交
24
#include <asm/atomic.h>
25
#include <asm/unaligned.h>
L
Linus Torvalds 已提交
26 27
#include "br_private.h"

28
static struct kmem_cache *br_fdb_cache __read_mostly;
L
Linus Torvalds 已提交
29 30 31
static int fdb_insert(struct net_bridge *br, struct net_bridge_port *source,
		      const unsigned char *addr);

32 33
static u32 fdb_salt __read_mostly;

34
/*
 * One-time initialisation of the forwarding database code: create the
 * slab cache for forwarding entries and pick a random hash salt.
 *
 * Returns 0 on success, or -ENOMEM if the cache cannot be created.
 */
int __init br_fdb_init(void)
{
	br_fdb_cache = kmem_cache_create("bridge_fdb_cache",
					 sizeof(struct net_bridge_fdb_entry),
					 0,
					 SLAB_HWCACHE_ALIGN, NULL);
	if (!br_fdb_cache)
		return -ENOMEM;

	/* The salt is mixed into every bucket computation in br_mac_hash(). */
	get_random_bytes(&fdb_salt, sizeof(fdb_salt));
	return 0;
}

A
Andrew Morton 已提交
47
void br_fdb_fini(void)
L
Linus Torvalds 已提交
48 49 50 51 52 53 54 55
{
	kmem_cache_destroy(br_fdb_cache);
}


/* if topology_changing then use forward_delay (default 15 sec)
 * otherwise keep longer (default 5 minutes)
 */
56
static inline unsigned long hold_time(const struct net_bridge *br)
L
Linus Torvalds 已提交
57 58 59 60
{
	return br->topology_change ? br->forward_delay : br->ageing_time;
}

61
static inline int has_expired(const struct net_bridge *br,
L
Linus Torvalds 已提交
62 63
				  const struct net_bridge_fdb_entry *fdb)
{
64 65
	return !fdb->is_static &&
		time_before_eq(fdb->ageing_timer + hold_time(br), jiffies);
L
Linus Torvalds 已提交
66 67
}

68
static inline int br_mac_hash(const unsigned char *mac)
L
Linus Torvalds 已提交
69
{
70 71 72
	/* use 1 byte of OUI cnd 3 bytes of NIC */
	u32 key = get_unaligned((u32 *)(mac + 2));
	return jhash_1word(key, fdb_salt) & (BR_HASH_SIZE - 1);
L
Linus Torvalds 已提交
73 74
}

75 76 77 78 79 80 81
/*
 * RCU callback queued by fdb_delete(): hand the entry that embeds
 * @head back to the slab cache.
 */
static void fdb_rcu_free(struct rcu_head *head)
{
	kmem_cache_free(br_fdb_cache,
			container_of(head, struct net_bridge_fdb_entry, rcu));
}

82
static inline void fdb_delete(struct net_bridge_fdb_entry *f)
L
Linus Torvalds 已提交
83 84
{
	hlist_del_rcu(&f->hlist);
85
	call_rcu(&f->rcu, fdb_rcu_free);
L
Linus Torvalds 已提交
86 87 88 89 90 91
}

/*
 * Port @p now uses hardware address @newaddr: retire the local entry
 * that pointed at @p and insert a local entry for the new address.
 *
 * If another port still carries the old address, the old entry is
 * handed over to that port instead of being deleted.
 */
void br_fdb_changeaddr(struct net_bridge_port *p, const unsigned char *newaddr)
{
	struct net_bridge *br = p->br;
	int i;

	spin_lock_bh(&br->hash_lock);

	/* Search all chains since old address/hash is unknown */
	for (i = 0; i < BR_HASH_SIZE; i++) {
		struct hlist_node *h;
		hlist_for_each(h, &br->hash[i]) {
			struct net_bridge_fdb_entry *f;

			f = hlist_entry(h, struct net_bridge_fdb_entry, hlist);
			if (f->dst == p && f->is_local) {
				/* maybe another port has same hw addr? */
				struct net_bridge_port *op;
				list_for_each_entry(op, &br->port_list, list) {
					if (op != p &&
					    !compare_ether_addr(op->dev->dev_addr,
								f->addr.addr)) {
						f->dst = op;
						goto insert;
					}
				}

				/*
				 * delete old one; the non-safe iterator is
				 * fine because we leave the loop right away
				 */
				fdb_delete(f);
				goto insert;
			}
		}
	}
 insert:
	/* insert new address,  may fail if invalid address or dup. */
	fdb_insert(br, p, newaddr);

	spin_unlock_bh(&br->hash_lock);
}

void br_fdb_cleanup(unsigned long _data)
{
	struct net_bridge *br = (struct net_bridge *)_data;
	unsigned long delay = hold_time(br);
131
	unsigned long next_timer = jiffies + br->ageing_time;
L
Linus Torvalds 已提交
132 133 134 135 136 137 138 139
	int i;

	spin_lock_bh(&br->hash_lock);
	for (i = 0; i < BR_HASH_SIZE; i++) {
		struct net_bridge_fdb_entry *f;
		struct hlist_node *h, *n;

		hlist_for_each_entry_safe(f, h, n, &br->hash[i], hlist) {
140 141 142 143 144
			unsigned long this_timer;
			if (f->is_static)
				continue;
			this_timer = f->ageing_timer + delay;
			if (time_before_eq(this_timer, jiffies))
L
Linus Torvalds 已提交
145
				fdb_delete(f);
146
			else if (time_before(this_timer, next_timer))
147
				next_timer = this_timer;
L
Linus Torvalds 已提交
148 149 150 151
		}
	}
	spin_unlock_bh(&br->hash_lock);

152
	mod_timer(&br->gc_timer, round_jiffies_up(next_timer));
L
Linus Torvalds 已提交
153 154
}

155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170
/*
 * Remove every dynamic (non-static) entry from the forwarding
 * database of @br.  Static entries are left in place.
 */
void br_fdb_flush(struct net_bridge *br)
{
	int bucket;

	spin_lock_bh(&br->hash_lock);
	for (bucket = 0; bucket < BR_HASH_SIZE; bucket++) {
		struct net_bridge_fdb_entry *ent;
		struct hlist_node *pos, *next;

		hlist_for_each_entry_safe(ent, pos, next,
					  &br->hash[bucket], hlist) {
			if (ent->is_static)
				continue;
			fdb_delete(ent);
		}
	}
	spin_unlock_bh(&br->hash_lock);
}
171

172 173 174
/* Flush all entries refering to a specific port.
 * if do_all is set also flush static entries
 */
175 176 177
void br_fdb_delete_by_port(struct net_bridge *br,
			   const struct net_bridge_port *p,
			   int do_all)
L
Linus Torvalds 已提交
178 179 180 181 182 183
{
	int i;

	spin_lock_bh(&br->hash_lock);
	for (i = 0; i < BR_HASH_SIZE; i++) {
		struct hlist_node *h, *g;
184

L
Linus Torvalds 已提交
185 186 187
		hlist_for_each_safe(h, g, &br->hash[i]) {
			struct net_bridge_fdb_entry *f
				= hlist_entry(h, struct net_bridge_fdb_entry, hlist);
188
			if (f->dst != p)
L
Linus Torvalds 已提交
189 190
				continue;

191 192
			if (f->is_static && !do_all)
				continue;
L
Linus Torvalds 已提交
193 194 195 196 197 198 199 200
			/*
			 * if multiple ports all have the same device address
			 * then when one port is deleted, assign
			 * the local entry to other port
			 */
			if (f->is_local) {
				struct net_bridge_port *op;
				list_for_each_entry(op, &br->port_list, list) {
201
					if (op != p &&
S
Stephen Hemminger 已提交
202 203
					    !compare_ether_addr(op->dev->dev_addr,
								f->addr.addr)) {
L
Linus Torvalds 已提交
204 205 206 207 208 209 210 211 212 213 214 215 216
						f->dst = op;
						goto skip_delete;
					}
				}
			}

			fdb_delete(f);
		skip_delete: ;
		}
	}
	spin_unlock_bh(&br->hash_lock);
}

217
/* No locking or refcounting, assumes caller has rcu_read_lock */
L
Linus Torvalds 已提交
218 219 220 221 222 223 224
struct net_bridge_fdb_entry *__br_fdb_get(struct net_bridge *br,
					  const unsigned char *addr)
{
	struct hlist_node *h;
	struct net_bridge_fdb_entry *fdb;

	hlist_for_each_entry_rcu(fdb, h, &br->hash[br_mac_hash(addr)], hlist) {
S
Stephen Hemminger 已提交
225
		if (!compare_ether_addr(fdb->addr.addr, addr)) {
L
Linus Torvalds 已提交
226 227 228 229 230 231 232 233 234
			if (unlikely(has_expired(br, fdb)))
				break;
			return fdb;
		}
	}

	return NULL;
}

235 236 237 238
#if defined(CONFIG_ATM_LANE) || defined(CONFIG_ATM_LANE_MODULE)
/* Interface used by ATM LANE hook to test
 * if an addr is on some other bridge port
 *
 * Returns non-zero when @addr has a live forwarding entry whose port
 * is in BR_STATE_FORWARDING and belongs to a device other than @dev.
 * Returns 0 otherwise, including when @dev is not a bridge port.
 */
int br_fdb_test_addr(struct net_device *dev, unsigned char *addr)
{
	struct net_bridge_fdb_entry *fdb;
	struct net_bridge_port *port;
	int ret;

	rcu_read_lock();
	port = br_port_get_rcu(dev);
	if (!port)
		ret = 0;
	else {
		fdb = __br_fdb_get(port->br, addr);
		ret = fdb && fdb->dst->dev != dev &&
			fdb->dst->state == BR_STATE_FORWARDING;
	}
	rcu_read_unlock();

	return ret;
}
#endif /* CONFIG_ATM_LANE */
L
Linus Torvalds 已提交
258 259

/*
 * Fill buffer with forwarding table records in
 * the API format.
 *
 * @buf:    room for at least @maxnum struct __fdb_entry; zeroed first
 * @maxnum: maximum number of records to write
 * @skip:   number of unexpired entries to pass over before writing
 *
 * Expired entries are neither written nor counted against @skip.
 * Returns the number of records written.
 */
int br_fdb_fillbuf(struct net_bridge *br, void *buf,
		   unsigned long maxnum, unsigned long skip)
{
	struct __fdb_entry *fe = buf;
	int i, num = 0;
	struct hlist_node *h;
	struct net_bridge_fdb_entry *f;

	memset(buf, 0, maxnum*sizeof(struct __fdb_entry));

	rcu_read_lock();
	for (i = 0; i < BR_HASH_SIZE; i++) {
		hlist_for_each_entry_rcu(f, h, &br->hash[i], hlist) {
			if (num >= maxnum)
				goto out;

			if (has_expired(br, f))
				continue;

			if (skip) {
				--skip;
				continue;
			}

			/* convert from internal format to API */
			memcpy(fe->mac_addr, f->addr.addr, ETH_ALEN);

			/* due to ABI compat need to split into hi/lo */
			fe->port_no = f->dst->port_no;
			fe->port_hi = f->dst->port_no >> 8;

			fe->is_local = f->is_local;
			/* static entries keep the zero left by memset() */
			if (!f->is_static)
				fe->ageing_timer_value = jiffies_to_clock_t(jiffies - f->ageing_timer);
			++fe;
			++num;
		}
	}

 out:
	rcu_read_unlock();

	return num;
}

/*
 * Walk one hash chain and return the entry whose address equals
 * @addr, or NULL if the chain has none.  Unlike __br_fdb_get() this
 * does not check whether the entry has expired.
 */
static inline struct net_bridge_fdb_entry *fdb_find(struct hlist_head *head,
						    const unsigned char *addr)
{
	struct hlist_node *h;
	struct net_bridge_fdb_entry *fdb;

	hlist_for_each_entry_rcu(fdb, h, head, hlist) {
		if (!compare_ether_addr(fdb->addr.addr, addr))
			return fdb;
	}
	return NULL;
}

static struct net_bridge_fdb_entry *fdb_create(struct hlist_head *head,
					       struct net_bridge_port *source,
323
					       const unsigned char *addr)
L
Linus Torvalds 已提交
324 325 326 327 328 329 330
{
	struct net_bridge_fdb_entry *fdb;

	fdb = kmem_cache_alloc(br_fdb_cache, GFP_ATOMIC);
	if (fdb) {
		memcpy(fdb->addr.addr, addr, ETH_ALEN);
		fdb->dst = source;
331 332
		fdb->is_local = 0;
		fdb->is_static = 0;
L
Linus Torvalds 已提交
333
		fdb->ageing_timer = jiffies;
334
		hlist_add_head_rcu(&fdb->hlist, head);
L
Linus Torvalds 已提交
335 336 337 338 339 340 341 342 343 344 345 346 347 348 349
	}
	return fdb;
}

static int fdb_insert(struct net_bridge *br, struct net_bridge_port *source,
		  const unsigned char *addr)
{
	struct hlist_head *head = &br->hash[br_mac_hash(addr)];
	struct net_bridge_fdb_entry *fdb;

	if (!is_valid_ether_addr(addr))
		return -EINVAL;

	fdb = fdb_find(head, addr);
	if (fdb) {
350
		/* it is okay to have multiple ports with same
L
Linus Torvalds 已提交
351 352
		 * address, just use the first one.
		 */
353
		if (fdb->is_local)
L
Linus Torvalds 已提交
354
			return 0;
355
		br_warn(br, "adding interface %s with same address "
L
Linus Torvalds 已提交
356 357 358
		       "as a received packet\n",
		       source->dev->name);
		fdb_delete(fdb);
359
	}
L
Linus Torvalds 已提交
360

361 362
	fdb = fdb_create(head, source, addr);
	if (!fdb)
L
Linus Torvalds 已提交
363 364
		return -ENOMEM;

365
	fdb->is_local = fdb->is_static = 1;
L
Linus Torvalds 已提交
366 367 368
	return 0;
}

369
/* Add entry for local address of interface */
L
Linus Torvalds 已提交
370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390
int br_fdb_insert(struct net_bridge *br, struct net_bridge_port *source,
		  const unsigned char *addr)
{
	int ret;

	spin_lock_bh(&br->hash_lock);
	ret = fdb_insert(br, source, addr);
	spin_unlock_bh(&br->hash_lock);
	return ret;
}

void br_fdb_update(struct net_bridge *br, struct net_bridge_port *source,
		   const unsigned char *addr)
{
	struct hlist_head *head = &br->hash[br_mac_hash(addr)];
	struct net_bridge_fdb_entry *fdb;

	/* some users want to always flood. */
	if (hold_time(br) == 0)
		return;

391 392 393 394 395
	/* ignore packets unless we are using this port */
	if (!(source->state == BR_STATE_LEARNING ||
	      source->state == BR_STATE_FORWARDING))
		return;

L
Linus Torvalds 已提交
396 397 398 399
	fdb = fdb_find(head, addr);
	if (likely(fdb)) {
		/* attempt to update an entry for a local interface */
		if (unlikely(fdb->is_local)) {
400
			if (net_ratelimit())
401 402 403
				br_warn(br, "received packet on %s with "
					"own address as source address\n",
					source->dev->name);
L
Linus Torvalds 已提交
404 405 406 407 408 409
		} else {
			/* fastpath: update of existing entry */
			fdb->dst = source;
			fdb->ageing_timer = jiffies;
		}
	} else {
410
		spin_lock(&br->hash_lock);
411 412 413
		if (likely(!fdb_find(head, addr)))
			fdb_create(head, source, addr);

L
Linus Torvalds 已提交
414 415 416
		/* else  we lose race and someone else inserts
		 * it first, don't bother updating
		 */
417
		spin_unlock(&br->hash_lock);
L
Linus Torvalds 已提交
418 419
	}
}