/*
 * net/tipc/node.c: TIPC node management routines
 *
 * Copyright (c) 2000-2006, 2012-2016, Ericsson AB
 * Copyright (c) 2005-2006, 2010-2014, Wind River Systems
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. Neither the names of the copyright holders nor the names of its
 *    contributors may be used to endorse or promote products derived from
 *    this software without specific prior written permission.
 *
 * Alternatively, this software may be distributed under the terms of the
 * GNU General Public License ("GPL") version 2 as published by the Free
 * Software Foundation.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 */

#include "core.h"
38
#include "link.h"
P
Per Liden 已提交
39 40
#include "node.h"
#include "name_distr.h"
41
#include "socket.h"
42
#include "bcast.h"
43
#include "monitor.h"
44
#include "discover.h"
45
#include "netlink.h"
T
Tuong Lien 已提交
46
#include "trace.h"
47

48
/* Initial value of tipc_node::signature, assigned in tipc_node_create().
 * NOTE(review): presumably chosen to lie outside the range of signatures a
 * peer can advertise - confirm against the discovery code.
 */
#define INVALID_NODE_SIG	0x10000
49
/* Delay, in milliseconds (converted with msecs_to_jiffies()), used to compute
 * tipc_node::delete_at when a node is created.
 */
#define NODE_CLEANUP_AFTER	300000
50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91

/* Flags used to take different actions according to flag type
 * TIPC_NOTIFY_NODE_DOWN: notify node is down
 * TIPC_NOTIFY_NODE_UP: notify node is up
 * TIPC_NOTIFY_LINK_UP: notify monitor and publish link state name
 * TIPC_NOTIFY_LINK_DOWN: notify monitor and withdraw link state name
 *
 * The flags are OR-ed into tipc_node::action_flags and are acted upon, then
 * cleared, in tipc_node_write_unlock().
 */
enum {
	TIPC_NOTIFY_NODE_DOWN		= (1 << 3),
	TIPC_NOTIFY_NODE_UP		= (1 << 4),
	TIPC_NOTIFY_LINK_UP		= (1 << 6),
	TIPC_NOTIFY_LINK_DOWN		= (1 << 7)
};

/**
 * struct tipc_link_entry - per-bearer link slot of a node
 * @link: the link on this bearer, or NULL if there is none
 * @lock: spinlock protecting the link (taken around link timeout handling)
 * @mtu: MTU reported to users; set when the link comes up to the link MTU
 *       minus INT_H_SIZE
 * @inputq: input queue handed to tipc_sk_rcv() and node_lost_contact()
 * @maddr: media address passed to tipc_bearer_xmit() for this bearer
 */
struct tipc_link_entry {
	struct tipc_link *link;
	spinlock_t lock; /* per link */
	u32 mtu;
	struct sk_buff_head inputq;
	struct tipc_media_addr maddr;
};

/**
 * struct tipc_bclink_entry - broadcast link state kept per node
 * @link: broadcast link towards the node; freed in tipc_node_kref_release()
 * @inputq1: socket buffer queue, initialised in tipc_node_create()
 * @arrvq: socket buffer queue, initialised with the non-locking
 *         __skb_queue_head_init() in tipc_node_create()
 * @inputq2: socket buffer queue, initialised in tipc_node_create()
 * @namedq: socket buffer queue, initialised in tipc_node_create()
 *          NOTE(review): presumably carries name table messages - confirm
 */
struct tipc_bclink_entry {
	struct tipc_link *link;
	struct sk_buff_head inputq1;
	struct sk_buff_head arrvq;
	struct sk_buff_head inputq2;
	struct sk_buff_head namedq;
};

/**
 * struct tipc_node - TIPC node structure
 * @addr: network address of node
 * @ref: reference counter to node object
 * @lock: rwlock governing access to structure
 * @net: the applicable net namespace
 * @hash: links to adjacent nodes in unsorted hash chain
 * @inputq: pointer to input queue containing messages for msg event
 * @namedq: pointer to name table input queue with name table messages
 * @active_links: bearer ids of active links, used as index into links[] array
 * @links: array containing references to all links to node
 * @action_flags: bit mask of different types of node actions
 * @state: connectivity state vs peer node
92
 * @preliminary: a preliminary node or not
93 94 95 96 97 98 99 100 101
 * @sync_point: sequence number where synch/failover is finished
 * @list: links to adjacent nodes in sorted list of cluster's nodes
 * @working_links: number of working links to node (both active and standby)
 * @link_cnt: number of links to node
 * @capabilities: bitmap, indicating peer node's functional capabilities
 * @signature: node instance identifier
 * @link_id: local and remote bearer ids of changing link, if any
 * @publ_list: list of publications
 * @rcu: rcu struct for tipc_node
102
 * @delete_at: indicates the time for deleting a down node
103 104 105 106 107 108 109 110 111 112 113 114 115
 */
struct tipc_node {
	u32 addr;
	struct kref kref;
	rwlock_t lock;
	struct net *net;
	struct hlist_node hash;
	int active_links[2];
	struct tipc_link_entry links[MAX_BEARERS];
	struct tipc_bclink_entry bc_entry;
	int action_flags;
	struct list_head list;
	int state;
116
	bool preliminary;
L
LUU Duc Canh 已提交
117
	bool failover_sent;
118 119 120 121 122 123
	u16 sync_point;
	int link_cnt;
	u16 working_links;
	u16 capabilities;
	u32 signature;
	u32 link_id;
124
	u8 peer_id[16];
125
	char peer_id_string[NODE_ID_STR_LEN];
126 127 128 129 130
	struct list_head publ_list;
	struct list_head conn_sks;
	unsigned long keepalive_intv;
	struct timer_list timer;
	struct rcu_head rcu;
131
	unsigned long delete_at;
132 133
	struct net *peer_net;
	u32 peer_hash_mix;
134 135
};

136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159
/* Node FSM states and events:
 */

/* States, stored in tipc_node::state. A new node starts out in
 * SELF_DOWN_PEER_LEAVING (see tipc_node_create()).
 */
enum {
	SELF_DOWN_PEER_DOWN    = 0xdd,
	SELF_UP_PEER_UP        = 0xaa,
	SELF_DOWN_PEER_LEAVING = 0xd1,
	SELF_UP_PEER_COMING    = 0xac,
	SELF_COMING_PEER_UP    = 0xca,
	SELF_LEAVING_PEER_DOWN = 0x1d,
	NODE_FAILINGOVER       = 0xf0,
	NODE_SYNCHING          = 0xcc
};

/* Events, fed to the state machine through tipc_node_fsm_evt() */
enum {
	SELF_ESTABL_CONTACT_EVT = 0xece,
	SELF_LOST_CONTACT_EVT   = 0x1ce,
	PEER_ESTABL_CONTACT_EVT = 0x9ece,
	PEER_LOST_CONTACT_EVT   = 0x91ce,
	NODE_FAILOVER_BEGIN_EVT = 0xfbe,
	NODE_FAILOVER_END_EVT   = 0xfee,
	NODE_SYNCH_BEGIN_EVT    = 0xcbe,
	NODE_SYNCH_END_EVT      = 0xcee
};

160 161 162 163 164 165
static void __tipc_node_link_down(struct tipc_node *n, int *bearer_id,
				  struct sk_buff_head *xmitq,
				  struct tipc_media_addr **maddr);
static void tipc_node_link_down(struct tipc_node *n, int bearer_id,
				bool delete);
static void node_lost_contact(struct tipc_node *n, struct sk_buff_head *inputq);
166
static void tipc_node_delete(struct tipc_node *node);
167
static void tipc_node_timeout(struct timer_list *t);
168
static void tipc_node_fsm_evt(struct tipc_node *n, int evt);
169
static struct tipc_node *tipc_node_find(struct net *net, u32 addr);
170
static struct tipc_node *tipc_node_find_by_id(struct net *net, u8 *id);
171
static void tipc_node_put(struct tipc_node *node);
172
static bool node_is_up(struct tipc_node *n);
173
static void tipc_node_delete_from_list(struct tipc_node *node);
P
Per Liden 已提交
174

175 176 177 178 179 180 181
/**
 * struct tipc_sock_conn - record of a socket connection towards a peer node
 * @port: port given to tipc_node_add_conn(); also the key used by
 *        tipc_node_remove_conn()
 * @peer_port: port of the peer endpoint
 * @peer_node: address of the peer node
 * @list: entry in the owning node's conn_sks list
 */
struct tipc_sock_conn {
	u32 port;
	u32 peer_port;
	u32 peer_node;
	struct list_head list;
};

182 183 184 185 186 187 188 189 190 191
/* node_active_link - return the active link picked by selector @sel
 * Only the lowest bit of @sel is used; it chooses one of the two active
 * link slots. Returns NULL if that slot holds no valid bearer id.
 */
static struct tipc_link *node_active_link(struct tipc_node *n, int sel)
{
	int slot = sel & 1;
	int bid = n->active_links[slot];

	return unlikely(bid == INVALID_BEARER_ID) ? NULL : n->links[bid].link;
}

192
/* tipc_node_get_mtu - find the MTU to use towards node @addr
 * @sel: selector; its lowest bit picks one of the two active link slots
 * @connected: true when building a connection oriented message
 *
 * Returns MAX_MSG_SIZE if the node is unknown, if it has no active link in
 * the selected slot, or if the message is connection oriented and the peer
 * lives in a net namespace of this same kernel. Otherwise returns the MTU
 * stored for the selected active link.
 */
int tipc_node_get_mtu(struct net *net, u32 addr, u32 sel, bool connected)
{
	unsigned int mtu = MAX_MSG_SIZE;
	struct tipc_node *node;
	int bid;

	node = tipc_node_find(net, addr);
	if (unlikely(!node))
		return mtu;

	/* Connection oriented traffic inside the same kernel keeps
	 * MAX_MSG_SIZE; everything else is bound by the active link's MTU
	 */
	if (!node->peer_net || !connected) {
		bid = node->active_links[sel & 1];
		if (likely(bid != INVALID_BEARER_ID))
			mtu = node->links[bid].mtu;
	}

	tipc_node_put(node);
	return mtu;
}
216

217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237
/* tipc_node_get_id - copy the node identity belonging to @addr into @id
 * Returns false only when @addr is neither the own address nor that of a
 * known node. When no own identity is available, true is returned and @id
 * is left untouched.
 */
bool tipc_node_get_id(struct net *net, u32 addr, u8 *id)
{
	u8 *self_id = tipc_own_id(net);
	struct tipc_node *peer;

	if (!self_id)
		return true;

	if (addr == tipc_own_addr(net)) {
		memcpy(id, self_id, TIPC_NODEID_LEN);
		return true;
	}

	peer = tipc_node_find(net, addr);
	if (peer) {
		memcpy(id, peer->peer_id, TIPC_NODEID_LEN);
		tipc_node_put(peer);
		return true;
	}
	return false;
}

238 239 240 241 242 243 244 245 246 247 248 249 250
/* tipc_node_get_capabilities - return capability bitmap of node @addr
 * Falls back to TIPC_NODE_CAPABILITIES when the node is not known.
 */
u16 tipc_node_get_capabilities(struct net *net, u32 addr)
{
	struct tipc_node *peer = tipc_node_find(net, addr);
	u16 result = TIPC_NODE_CAPABILITIES;

	if (likely(peer)) {
		result = peer->capabilities;
		tipc_node_put(peer);
	}
	return result;
}

251 252 253 254 255 256 257 258 259 260
/* tipc_node_get_addr - return the address of @node, or 0 if @node is NULL */
u32 tipc_node_get_addr(struct tipc_node *node)
{
	if (!node)
		return 0;

	return node->addr;
}

/* tipc_node_get_id_str - return the peer identity string stored in @node
 * @node must not be NULL. The returned pointer refers to storage inside
 * @node itself.
 */
char *tipc_node_get_id_str(struct tipc_node *node)
{
	return &node->peer_id_string[0];
}

261 262
static void tipc_node_kref_release(struct kref *kref)
{
263
	struct tipc_node *n = container_of(kref, struct tipc_node, kref);
264

265 266
	kfree(n->bc_entry.link);
	kfree_rcu(n, rcu);
267 268
}

269
static void tipc_node_put(struct tipc_node *node)
270 271 272 273 274 275 276 277 278
{
	kref_put(&node->kref, tipc_node_kref_release);
}

/* tipc_node_get - take one additional reference to @node */
static void tipc_node_get(struct tipc_node *node)
{
	kref_get(&node->kref);
}

279
/*
280 281
 * tipc_node_find - locate specified node object, if it exists
 */
282
static struct tipc_node *tipc_node_find(struct net *net, u32 addr)
283
{
284
	struct tipc_net *tn = tipc_net(net);
285
	struct tipc_node *node;
286
	unsigned int thash = tipc_hashfn(addr);
287

288
	rcu_read_lock();
289
	hlist_for_each_entry_rcu(node, &tn->node_htable[thash], hash) {
290
		if (node->addr != addr || node->preliminary)
291 292 293 294
			continue;
		if (!kref_get_unless_zero(&node->kref))
			node = NULL;
		break;
295
	}
296
	rcu_read_unlock();
297
	return node;
298 299
}

300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323
/* tipc_node_find_by_id - locate specified node object by its 128-bit id
 * Note: this function is called only when a discovery request failed
 * to find the node by its 32-bit id, and is not time critical
 *
 * Walks the node list and compares identities under each node's read lock.
 * A returned node carries a reference that the caller must drop.
 */
static struct tipc_node *tipc_node_find_by_id(struct net *net, u8 *id)
{
	struct tipc_net *tn = tipc_net(net);
	struct tipc_node *match = NULL;
	struct tipc_node *cur;

	rcu_read_lock();
	list_for_each_entry_rcu(cur, &tn->node_list, list) {
		read_lock_bh(&cur->lock);
		if (memcmp(id, cur->peer_id, sizeof(cur->peer_id)) == 0 &&
		    kref_get_unless_zero(&cur->kref))
			match = cur;
		read_unlock_bh(&cur->lock);
		if (match)
			break;
	}
	rcu_read_unlock();
	return match;
}

324
static void tipc_node_read_lock(struct tipc_node *n)
J
Jon Paul Maloy 已提交
325 326 327 328
{
	read_lock_bh(&n->lock);
}

329
static void tipc_node_read_unlock(struct tipc_node *n)
J
Jon Paul Maloy 已提交
330 331 332 333 334 335 336 337 338
{
	read_unlock_bh(&n->lock);
}

/* tipc_node_write_lock - take the node lock for writing, bottom halves off */
static void tipc_node_write_lock(struct tipc_node *n)
{
	write_lock_bh(&n->lock);
}

339 340 341 342 343
/* tipc_node_write_unlock_fast - release the node write lock
 * Unlike tipc_node_write_unlock(), this variant does not look at
 * n->action_flags, so no notifications are issued.
 */
static void tipc_node_write_unlock_fast(struct tipc_node *n)
{
	write_unlock_bh(&n->lock);
}

J
Jon Paul Maloy 已提交
344 345 346 347 348 349
static void tipc_node_write_unlock(struct tipc_node *n)
{
	struct net *net = n->net;
	u32 addr = 0;
	u32 flags = n->action_flags;
	u32 link_id = 0;
350
	u32 bearer_id;
J
Jon Paul Maloy 已提交
351 352 353 354 355 356 357 358 359
	struct list_head *publ_list;

	if (likely(!flags)) {
		write_unlock_bh(&n->lock);
		return;
	}

	addr = n->addr;
	link_id = n->link_id;
360
	bearer_id = link_id & 0xffff;
J
Jon Paul Maloy 已提交
361 362 363 364 365 366 367 368 369 370 371 372 373
	publ_list = &n->publ_list;

	n->action_flags &= ~(TIPC_NOTIFY_NODE_DOWN | TIPC_NOTIFY_NODE_UP |
			     TIPC_NOTIFY_LINK_DOWN | TIPC_NOTIFY_LINK_UP);

	write_unlock_bh(&n->lock);

	if (flags & TIPC_NOTIFY_NODE_DOWN)
		tipc_publ_notify(net, publ_list, addr);

	if (flags & TIPC_NOTIFY_NODE_UP)
		tipc_named_node_up(net, addr);

374 375
	if (flags & TIPC_NOTIFY_LINK_UP) {
		tipc_mon_peer_up(net, addr, bearer_id);
J
Jon Paul Maloy 已提交
376
		tipc_nametbl_publish(net, TIPC_LINK_STATE, addr, addr,
377
				     TIPC_NODE_SCOPE, link_id, link_id);
378 379 380
	}
	if (flags & TIPC_NOTIFY_LINK_DOWN) {
		tipc_mon_peer_down(net, addr, bearer_id);
J
Jon Paul Maloy 已提交
381
		tipc_nametbl_withdraw(net, TIPC_LINK_STATE, addr,
382
				      addr, link_id);
383
	}
J
Jon Paul Maloy 已提交
384 385
}

386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413
/* tipc_node_assign_peer_net - find the peer's net namespace in this kernel
 * @n: node whose peer_net should be resolved
 * @hash_mixes: hash mix value announced for the peer
 *
 * Does nothing if a peer namespace is already assigned. Otherwise scans all
 * net namespaces for one whose TIPC net id, node identity and hash mix all
 * match, and records the first hit in @n.
 */
static void tipc_node_assign_peer_net(struct tipc_node *n, u32 hash_mixes)
{
	int own_net_id = tipc_netid(n->net);
	struct tipc_net *cand_tn;
	struct net *cand;

	if (n->peer_net)
		return;

	for_each_net_rcu(cand) {
		cand_tn = tipc_net(cand);
		/* Integrity checking whether node exists in namespace or not */
		if (!cand_tn || cand_tn->net_id != own_net_id)
			continue;
		if (memcmp(n->peer_id, cand_tn->node_id, NODE_ID_LEN) != 0)
			continue;
		if (tipc_net_hash_mixes(cand, cand_tn->random) != hash_mixes)
			continue;

		n->peer_net = cand;
		n->peer_hash_mix = hash_mixes;
		break;
	}
}

414
static struct tipc_node *tipc_node_create(struct net *net, u32 addr,
415
					  u8 *peer_id, u16 capabilities,
416
					  u32 hash_mixes, bool preliminary)
P
Per Liden 已提交
417
{
418
	struct tipc_net *tn = net_generic(net, tipc_net_id);
419
	struct tipc_node *n, *temp_node;
420
	struct tipc_link *l;
421
	unsigned long intv;
422
	int bearer_id;
J
Jon Paul Maloy 已提交
423
	int i;
P
Per Liden 已提交
424

425
	spin_lock_bh(&tn->node_list_lock);
426 427
	n = tipc_node_find(net, addr) ?:
		tipc_node_find_by_id(net, peer_id);
428
	if (n) {
429 430 431 432 433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448
		if (!n->preliminary)
			goto update;
		if (preliminary)
			goto exit;
		/* A preliminary node becomes "real" now, refresh its data */
		tipc_node_write_lock(n);
		n->preliminary = false;
		n->addr = addr;
		hlist_del_rcu(&n->hash);
		hlist_add_head_rcu(&n->hash,
				   &tn->node_htable[tipc_hashfn(addr)]);
		list_del_rcu(&n->list);
		list_for_each_entry_rcu(temp_node, &tn->node_list, list) {
			if (n->addr < temp_node->addr)
				break;
		}
		list_add_tail_rcu(&n->list, &temp_node->list);
		tipc_node_write_unlock_fast(n);

update:
449 450
		if (n->peer_hash_mix ^ hash_mixes)
			tipc_node_assign_peer_net(n, hash_mixes);
451 452
		if (n->capabilities == capabilities)
			goto exit;
453
		/* Same node may come back with new capabilities */
454
		tipc_node_write_lock(n);
455
		n->capabilities = capabilities;
456 457 458 459 460
		for (bearer_id = 0; bearer_id < MAX_BEARERS; bearer_id++) {
			l = n->links[bearer_id].link;
			if (l)
				tipc_link_update_caps(l, capabilities);
		}
461 462
		tipc_node_write_unlock_fast(n);

463 464 465 466 467
		/* Calculate cluster capabilities */
		tn->capabilities = TIPC_NODE_CAPABILITIES;
		list_for_each_entry_rcu(temp_node, &tn->node_list, list) {
			tn->capabilities &= temp_node->capabilities;
		}
468

469
		goto exit;
470
	}
471 472
	n = kzalloc(sizeof(*n), GFP_ATOMIC);
	if (!n) {
473
		pr_warn("Node creation failed, no memory\n");
474
		goto exit;
475
	}
476
	tipc_nodeid2string(n->peer_id_string, peer_id);
477
	n->addr = addr;
478
	n->preliminary = preliminary;
479
	memcpy(&n->peer_id, peer_id, 16);
480
	n->net = net;
481 482 483 484
	n->peer_net = NULL;
	n->peer_hash_mix = 0;
	/* Assign kernel local namespace if exists */
	tipc_node_assign_peer_net(n, hash_mixes);
485 486 487 488 489 490 491 492 493 494 495
	n->capabilities = capabilities;
	kref_init(&n->kref);
	rwlock_init(&n->lock);
	INIT_HLIST_NODE(&n->hash);
	INIT_LIST_HEAD(&n->list);
	INIT_LIST_HEAD(&n->publ_list);
	INIT_LIST_HEAD(&n->conn_sks);
	skb_queue_head_init(&n->bc_entry.namedq);
	skb_queue_head_init(&n->bc_entry.inputq1);
	__skb_queue_head_init(&n->bc_entry.arrvq);
	skb_queue_head_init(&n->bc_entry.inputq2);
J
Jon Paul Maloy 已提交
496
	for (i = 0; i < MAX_BEARERS; i++)
497 498
		spin_lock_init(&n->links[i].lock);
	n->state = SELF_DOWN_PEER_LEAVING;
499
	n->delete_at = jiffies + msecs_to_jiffies(NODE_CLEANUP_AFTER);
500 501 502
	n->signature = INVALID_NODE_SIG;
	n->active_links[0] = INVALID_BEARER_ID;
	n->active_links[1] = INVALID_BEARER_ID;
503
	n->bc_entry.link = NULL;
504
	tipc_node_get(n);
505
	timer_setup(&n->timer, tipc_node_timeout, 0);
506 507 508 509 510
	/* Start a slow timer anyway, crypto needs it */
	n->keepalive_intv = 10000;
	intv = jiffies + msecs_to_jiffies(n->keepalive_intv);
	if (!mod_timer(&n->timer, intv))
		tipc_node_get(n);
511 512 513 514 515 516
	hlist_add_head_rcu(&n->hash, &tn->node_htable[tipc_hashfn(addr)]);
	list_for_each_entry_rcu(temp_node, &tn->node_list, list) {
		if (n->addr < temp_node->addr)
			break;
	}
	list_add_tail_rcu(&n->list, &temp_node->list);
517 518 519 520 521
	/* Calculate cluster capabilities */
	tn->capabilities = TIPC_NODE_CAPABILITIES;
	list_for_each_entry_rcu(temp_node, &tn->node_list, list) {
		tn->capabilities &= temp_node->capabilities;
	}
T
Tuong Lien 已提交
522
	trace_tipc_node_create(n, true, " ");
523
exit:
524
	spin_unlock_bh(&tn->node_list_lock);
525
	return n;
P
Per Liden 已提交
526 527
}

528 529
static void tipc_node_calculate_timer(struct tipc_node *n, struct tipc_link *l)
{
530
	unsigned long tol = tipc_link_tolerance(l);
531 532 533
	unsigned long intv = ((tol / 4) > 500) ? 500 : tol / 4;

	/* Link with lowest tolerance determines timer interval */
534 535
	if (intv < n->keepalive_intv)
		n->keepalive_intv = intv;
536

537 538
	/* Ensure link's abort limit corresponds to current tolerance */
	tipc_link_set_abort_limit(l, tol / n->keepalive_intv);
539 540
}

541
static void tipc_node_delete_from_list(struct tipc_node *node)
P
Per Liden 已提交
542
{
543 544
	list_del_rcu(&node->list);
	hlist_del_rcu(&node->hash);
545
	tipc_node_put(node);
546 547 548 549
}

static void tipc_node_delete(struct tipc_node *node)
{
T
Tuong Lien 已提交
550
	trace_tipc_node_delete(node, true, " ");
551
	tipc_node_delete_from_list(node);
552 553 554

	del_timer_sync(&node->timer);
	tipc_node_put(node);
P
Per Liden 已提交
555 556
}

557
void tipc_node_stop(struct net *net)
558
{
559
	struct tipc_net *tn = tipc_net(net);
560 561
	struct tipc_node *node, *t_node;

562
	spin_lock_bh(&tn->node_list_lock);
563 564
	list_for_each_entry_safe(node, t_node, &tn->node_list, list)
		tipc_node_delete(node);
565
	spin_unlock_bh(&tn->node_list_lock);
566 567
}

568 569 570 571 572 573 574 575 576 577 578 579
/* tipc_node_subscribe - add @subscr to the publication list of node @addr
 * Nothing is done for the own node. An unknown node is reported with a
 * warning and otherwise ignored.
 */
void tipc_node_subscribe(struct net *net, struct list_head *subscr, u32 addr)
{
	struct tipc_node *peer;

	if (in_own_node(net, addr))
		return;

	peer = tipc_node_find(net, addr);
	if (peer) {
		tipc_node_write_lock(peer);
		list_add_tail(subscr, &peer->publ_list);
		tipc_node_write_unlock_fast(peer);
		tipc_node_put(peer);
		return;
	}

	pr_warn("Node subscribe rejected, unknown node 0x%x\n", addr);
}

/* tipc_node_unsubscribe - remove @subscr from the list it is linked into,
 * under the write lock of node @addr
 * Nothing is done for the own node. An unknown node is reported with a
 * warning and otherwise ignored.
 */
void tipc_node_unsubscribe(struct net *net, struct list_head *subscr, u32 addr)
{
	struct tipc_node *peer;

	if (in_own_node(net, addr))
		return;

	peer = tipc_node_find(net, addr);
	if (peer) {
		tipc_node_write_lock(peer);
		list_del_init(subscr);
		tipc_node_write_unlock_fast(peer);
		tipc_node_put(peer);
		return;
	}

	pr_warn("Node unsubscribe rejected, unknown node 0x%x\n", addr);
}

604
/* tipc_node_add_conn - record a socket connection towards node @dnode
 * @port: own port of the connection
 * @peer_port: port of the peer endpoint
 *
 * Returns 0 on success or when @dnode is the own node, and -EHOSTUNREACH
 * if the node is unknown or the connection record cannot be allocated.
 */
int tipc_node_add_conn(struct net *net, u32 dnode, u32 port, u32 peer_port)
{
	struct tipc_sock_conn *conn;
	struct tipc_node *node;
	int err = -EHOSTUNREACH;

	if (in_own_node(net, dnode))
		return 0;

	node = tipc_node_find(net, dnode);
	if (!node) {
		pr_warn("Connecting sock to node 0x%x failed\n", dnode);
		return err;
	}

	conn = kmalloc(sizeof(*conn), GFP_ATOMIC);
	if (conn) {
		conn->peer_node = dnode;
		conn->port = port;
		conn->peer_port = peer_port;

		tipc_node_write_lock(node);
		list_add_tail(&conn->list, &node->conn_sks);
		tipc_node_write_unlock(node);
		err = 0;
	}

	tipc_node_put(node);
	return err;
}

635
/* tipc_node_remove_conn - drop all connection records of node @dnode whose
 * own port equals @port
 * Nothing is done for the own node or for an unknown node.
 */
void tipc_node_remove_conn(struct net *net, u32 dnode, u32 port)
{
	struct tipc_sock_conn *cur, *next;
	struct tipc_node *node;

	if (in_own_node(net, dnode))
		return;

	node = tipc_node_find(net, dnode);
	if (!node)
		return;

	tipc_node_write_lock(node);
	list_for_each_entry_safe(cur, next, &node->conn_sks, list) {
		if (cur->port == port) {
			list_del(&cur->list);
			kfree(cur);
		}
	}
	tipc_node_write_unlock(node);
	tipc_node_put(node);
}

658 659 660 661 662 663 664 665 666 667 668 669 670 671 672 673 674 675
/* tipc_node_clear_links - free every link still attached to @node
 * Each freed slot is reset to NULL and node->link_cnt is decremented.
 */
static void tipc_node_clear_links(struct tipc_node *node)
{
	struct tipc_link_entry *slot;
	int bid;

	for (bid = 0; bid < MAX_BEARERS; bid++) {
		slot = &node->links[bid];
		if (!slot->link)
			continue;

		kfree(slot->link);
		slot->link = NULL;
		node->link_cnt--;
	}
}

/* tipc_node_cleanup - delete nodes that does not
 * have active links for NODE_CLEANUP_AFTER time
 */
676
static bool tipc_node_cleanup(struct tipc_node *peer)
677
{
678
	struct tipc_node *temp_node;
679 680 681
	struct tipc_net *tn = tipc_net(peer->net);
	bool deleted = false;

682 683 684 685
	/* If lock held by tipc_node_stop() the node will be deleted anyway */
	if (!spin_trylock_bh(&tn->node_list_lock))
		return false;

686 687 688 689 690 691 692 693
	tipc_node_write_lock(peer);

	if (!node_is_up(peer) && time_after(jiffies, peer->delete_at)) {
		tipc_node_clear_links(peer);
		tipc_node_delete_from_list(peer);
		deleted = true;
	}
	tipc_node_write_unlock(peer);
694

695 696 697 698 699
	if (!deleted) {
		spin_unlock_bh(&tn->node_list_lock);
		return deleted;
	}

700 701 702 703 704 705
	/* Calculate cluster capabilities */
	tn->capabilities = TIPC_NODE_CAPABILITIES;
	list_for_each_entry_rcu(temp_node, &tn->node_list, list) {
		tn->capabilities &= temp_node->capabilities;
	}

706 707 708 709
	spin_unlock_bh(&tn->node_list_lock);
	return deleted;
}

710 711
/* tipc_node_timeout - handle expiration of node timer
 */
712
static void tipc_node_timeout(struct timer_list *t)
713
{
714
	struct tipc_node *n = from_timer(n, t, timer);
715
	struct tipc_link_entry *le;
716
	struct sk_buff_head xmitq;
717
	int remains = n->link_cnt;
718 719 720
	int bearer_id;
	int rc = 0;

T
Tuong Lien 已提交
721
	trace_tipc_node_timeout(n, false, " ");
722 723 724 725 726 727
	if (!node_is_up(n) && tipc_node_cleanup(n)) {
		/*Removing the reference of Timer*/
		tipc_node_put(n);
		return;
	}

728 729
	__skb_queue_head_init(&xmitq);

730 731 732 733 734 735
	/* Initial node interval to value larger (10 seconds), then it will be
	 * recalculated with link lowest tolerance
	 */
	tipc_node_read_lock(n);
	n->keepalive_intv = 10000;
	tipc_node_read_unlock(n);
736
	for (bearer_id = 0; remains && (bearer_id < MAX_BEARERS); bearer_id++) {
J
Jon Paul Maloy 已提交
737
		tipc_node_read_lock(n);
738 739
		le = &n->links[bearer_id];
		if (le->link) {
740
			spin_lock_bh(&le->lock);
741
			/* Link tolerance may change asynchronously: */
742 743
			tipc_node_calculate_timer(n, le->link);
			rc = tipc_link_timeout(le->link, &xmitq);
744 745
			spin_unlock_bh(&le->lock);
			remains--;
746
		}
J
Jon Paul Maloy 已提交
747
		tipc_node_read_unlock(n);
748 749 750
		tipc_bearer_xmit(n->net, bearer_id, &xmitq, &le->maddr);
		if (rc & TIPC_LINK_DOWN_EVT)
			tipc_node_link_down(n, bearer_id, false);
751
	}
752
	mod_timer(&n->timer, jiffies + msecs_to_jiffies(n->keepalive_intv));
753 754
}

P
Per Liden 已提交
755
/**
756 757
 * __tipc_node_link_up - handle addition of link
 * Node lock must be held by caller
P
Per Liden 已提交
758 759
 * Link becomes active (alone or shared) or standby, depending on its priority.
 */
760 761
static void __tipc_node_link_up(struct tipc_node *n, int bearer_id,
				struct sk_buff_head *xmitq)
P
Per Liden 已提交
762
{
763 764
	int *slot0 = &n->active_links[0];
	int *slot1 = &n->active_links[1];
765 766
	struct tipc_link *ol = node_active_link(n, 0);
	struct tipc_link *nl = n->links[bearer_id].link;
767

768
	if (!nl || tipc_link_is_up(nl))
769 770 771 772
		return;

	tipc_link_fsm_evt(nl, LINK_ESTABLISH_EVT);
	if (!tipc_link_is_up(nl))
773 774
		return;

775 776
	n->working_links++;
	n->action_flags |= TIPC_NOTIFY_LINK_UP;
777
	n->link_id = tipc_link_id(nl);
778 779

	/* Leave room for tunnel header when returning 'mtu' to users: */
780
	n->links[bearer_id].mtu = tipc_link_mtu(nl) - INT_H_SIZE;
Y
Ying Xue 已提交
781

782
	tipc_bearer_add_dest(n->net, bearer_id, n->addr);
783
	tipc_bcast_inc_bearer_dst_cnt(n->net, bearer_id);
784

785
	pr_debug("Established link <%s> on network plane %c\n",
786
		 tipc_link_name(nl), tipc_link_plane(nl));
T
Tuong Lien 已提交
787
	trace_tipc_node_link_up(n, true, " ");
788

789 790 791
	/* Ensure that a STATE message goes first */
	tipc_link_build_state_msg(nl, xmitq);

792 793
	/* First link? => give it both slots */
	if (!ol) {
794 795
		*slot0 = bearer_id;
		*slot1 = bearer_id;
796 797
		tipc_node_fsm_evt(n, SELF_ESTABL_CONTACT_EVT);
		n->action_flags |= TIPC_NOTIFY_NODE_UP;
798
		tipc_link_set_active(nl, true);
799
		tipc_bcast_add_peer(n->net, nl, xmitq);
800
		return;
P
Per Liden 已提交
801
	}
802

803
	/* Second link => redistribute slots */
804 805
	if (tipc_link_prio(nl) > tipc_link_prio(ol)) {
		pr_debug("Old link <%s> becomes standby\n", tipc_link_name(ol));
806
		*slot0 = bearer_id;
807
		*slot1 = bearer_id;
808 809
		tipc_link_set_active(nl, true);
		tipc_link_set_active(ol, false);
810
	} else if (tipc_link_prio(nl) == tipc_link_prio(ol)) {
811
		tipc_link_set_active(nl, true);
812
		*slot1 = bearer_id;
813
	} else {
814
		pr_debug("New link <%s> is standby\n", tipc_link_name(nl));
P
Per Liden 已提交
815 816
	}

817 818
	/* Prepare synchronization with first link */
	tipc_link_tnl_prepare(ol, nl, SYNCH_MSG, xmitq);
P
Per Liden 已提交
819 820 821
}

/**
822 823 824
 * tipc_node_link_up - handle addition of link
 *
 * Link becomes active (alone or shared) or standby, depending on its priority.
P
Per Liden 已提交
825
 */
826 827
static void tipc_node_link_up(struct tipc_node *n, int bearer_id,
			      struct sk_buff_head *xmitq)
P
Per Liden 已提交
828
{
829 830
	struct tipc_media_addr *maddr;

J
Jon Paul Maloy 已提交
831
	tipc_node_write_lock(n);
832
	__tipc_node_link_up(n, bearer_id, xmitq);
833 834
	maddr = &n->links[bearer_id].maddr;
	tipc_bearer_xmit(n->net, bearer_id, xmitq, maddr);
J
Jon Paul Maloy 已提交
835
	tipc_node_write_unlock(n);
836 837
}

838 839 840 841 842 843 844 845 846 847 848
/**
 * tipc_node_link_failover() - start failover in case "half-failover"
 *
 * This function is only called in a very special situation where link
 * failover can be already started on peer node but not on this node.
 * This can happen when e.g.
 *	1. Both links <1A-2A>, <1B-2B> down
 *	2. Link endpoint 2A up, but 1A still down (e.g. due to network
 *	   disturbance, wrong session, etc.)
 *	3. Link <1B-2B> up
 *	4. Link endpoint 2A down (e.g. due to link tolerance timeout)
849
 *	5. Node 2 starts failover onto link <1B-2B>
850
 *
851
 *	==> Node 1 does never start link/node failover!
852 853 854 855 856 857 858 859 860 861 862 863 864 865
 *
 * @n: tipc node structure
 * @l: link peer endpoint failingover (- can be NULL)
 * @tnl: tunnel link
 * @xmitq: queue for messages to be xmited on tnl link later
 */
static void tipc_node_link_failover(struct tipc_node *n, struct tipc_link *l,
				    struct tipc_link *tnl,
				    struct sk_buff_head *xmitq)
{
	/* Avoid to be "self-failover" that can never end */
	if (!tipc_link_is_up(tnl))
		return;

866 867 868 869
	/* Don't rush, failure link may be in the process of resetting */
	if (l && !tipc_link_is_reset(l))
		return;

870 871 872 873 874 875 876 877 878 879 880
	tipc_link_fsm_evt(tnl, LINK_SYNCH_END_EVT);
	tipc_node_fsm_evt(n, NODE_SYNCH_END_EVT);

	n->sync_point = tipc_link_rcv_nxt(tnl) + (U16_MAX / 2 - 1);
	tipc_link_failover_prepare(l, tnl, xmitq);

	if (l)
		tipc_link_fsm_evt(l, LINK_FAILOVER_BEGIN_EVT);
	tipc_node_fsm_evt(n, NODE_FAILOVER_BEGIN_EVT);
}

881 882 883 884 885 886 887 888
/**
 * __tipc_node_link_down - handle loss of link
 */
static void __tipc_node_link_down(struct tipc_node *n, int *bearer_id,
				  struct sk_buff_head *xmitq,
				  struct tipc_media_addr **maddr)
{
	struct tipc_link_entry *le = &n->links[*bearer_id];
889 890
	int *slot0 = &n->active_links[0];
	int *slot1 = &n->active_links[1];
891
	int i, highest = 0, prio;
892
	struct tipc_link *l, *_l, *tnl;
P
Per Liden 已提交
893

894
	l = n->links[*bearer_id].link;
895
	if (!l || tipc_link_is_reset(l))
896 897
		return;

898 899
	n->working_links--;
	n->action_flags |= TIPC_NOTIFY_LINK_DOWN;
900
	n->link_id = tipc_link_id(l);
901

902
	tipc_bearer_remove_dest(n->net, *bearer_id, n->addr);
903

904
	pr_debug("Lost link <%s> on network plane %c\n",
905
		 tipc_link_name(l), tipc_link_plane(l));
906

907 908 909 910 911 912 913
	/* Select new active link if any available */
	*slot0 = INVALID_BEARER_ID;
	*slot1 = INVALID_BEARER_ID;
	for (i = 0; i < MAX_BEARERS; i++) {
		_l = n->links[i].link;
		if (!_l || !tipc_link_is_up(_l))
			continue;
914 915
		if (_l == l)
			continue;
916 917
		prio = tipc_link_prio(_l);
		if (prio < highest)
918
			continue;
919 920
		if (prio > highest) {
			highest = prio;
921 922 923 924 925 926
			*slot0 = i;
			*slot1 = i;
			continue;
		}
		*slot1 = i;
	}
927

928
	if (!node_is_up(n)) {
929 930 931
		if (tipc_link_peer_is_down(l))
			tipc_node_fsm_evt(n, PEER_LOST_CONTACT_EVT);
		tipc_node_fsm_evt(n, SELF_LOST_CONTACT_EVT);
T
Tuong Lien 已提交
932
		trace_tipc_link_reset(l, TIPC_DUMP_ALL, "link down!");
933
		tipc_link_fsm_evt(l, LINK_RESET_EVT);
934
		tipc_link_reset(l);
935 936
		tipc_link_build_reset_msg(l, xmitq);
		*maddr = &n->links[*bearer_id].maddr;
937
		node_lost_contact(n, &le->inputq);
938
		tipc_bcast_dec_bearer_dst_cnt(n->net, *bearer_id);
939 940
		return;
	}
941
	tipc_bcast_dec_bearer_dst_cnt(n->net, *bearer_id);
942

943
	/* There is still a working link => initiate failover */
944 945
	*bearer_id = n->active_links[0];
	tnl = n->links[*bearer_id].link;
946 947
	tipc_link_fsm_evt(tnl, LINK_SYNCH_END_EVT);
	tipc_node_fsm_evt(n, NODE_SYNCH_END_EVT);
948
	n->sync_point = tipc_link_rcv_nxt(tnl) + (U16_MAX / 2 - 1);
949
	tipc_link_tnl_prepare(l, tnl, FAILOVER_MSG, xmitq);
T
Tuong Lien 已提交
950
	trace_tipc_link_reset(l, TIPC_DUMP_ALL, "link down -> failover!");
951
	tipc_link_reset(l);
952
	tipc_link_fsm_evt(l, LINK_RESET_EVT);
953
	tipc_link_fsm_evt(l, LINK_FAILOVER_BEGIN_EVT);
954
	tipc_node_fsm_evt(n, NODE_FAILOVER_BEGIN_EVT);
955
	*maddr = &n->links[*bearer_id].maddr;
956 957 958 959 960
}

/* tipc_node_link_down - take down, and optionally delete, a link of node @n
 * @bearer_id: bearer of the link
 * @delete: true if the link is to be freed as well
 *
 * Does nothing if there is no link on @bearer_id. Messages produced while
 * taking the link down are sent after the node lock has been released, and
 * the bearer's input queue is finally delivered to the sockets.
 */
static void tipc_node_link_down(struct tipc_node *n, int bearer_id, bool delete)
{
	struct tipc_link_entry *entry = &n->links[bearer_id];
	struct tipc_link *link = entry->link;
	struct tipc_media_addr *maddr = NULL;
	int orig_bearer_id = bearer_id;
	struct sk_buff_head xmitq;

	if (!link)
		return;

	__skb_queue_head_init(&xmitq);

	tipc_node_write_lock(n);
	if (tipc_link_is_establishing(link)) {
		/* Defuse pending tipc_node_link_up() */
		tipc_link_reset(link);
		tipc_link_fsm_evt(link, LINK_RESET_EVT);
	} else {
		/* May redirect bearer_id to the tunnel link's bearer */
		__tipc_node_link_down(n, &bearer_id, &xmitq, &maddr);
	}
	if (delete) {
		kfree(link);
		entry->link = NULL;
		n->link_cnt--;
	}
	trace_tipc_node_link_down(n, true, "node link down or deleted!");
	tipc_node_write_unlock(n);

	if (delete)
		tipc_mon_remove_peer(n->net, n->addr, orig_bearer_id);
	if (!skb_queue_empty(&xmitq))
		tipc_bearer_xmit(n->net, bearer_id, &xmitq, maddr);
	tipc_sk_rcv(n->net, &entry->inputq);
}

993
static bool node_is_up(struct tipc_node *n)
P
Per Liden 已提交
994
{
995
	return n->active_links[0] != INVALID_BEARER_ID;
P
Per Liden 已提交
996 997
}

998 999 1000 1001 1002 1003 1004 1005 1006 1007 1008 1009 1010 1011 1012 1013
/* tipc_node_is_up - report whether the node with address @addr is up
 *
 * The own node always counts as up. For any other address the node is
 * looked up; an unknown node is reported as down. The reference taken by
 * the lookup is dropped before returning.
 */
bool tipc_node_is_up(struct net *net, u32 addr)
{
	struct tipc_node *peer;
	bool up = false;

	if (in_own_node(net, addr))
		return true;

	peer = tipc_node_find(net, addr);
	if (peer) {
		up = node_is_up(peer);
		tipc_node_put(peer);
	}
	return up;
}

1014 1015 1016 1017 1018 1019 1020 1021 1022 1023 1024 1025 1026
/* tipc_node_suggest_addr - propose an address not used by any known node
 *
 * Starts from @addr XOR-ed with the namespace's random value and steps
 * upwards until tipc_node_find() no longer returns a node for the
 * candidate. Each lookup reference is released immediately.
 */
static u32 tipc_node_suggest_addr(struct net *net, u32 addr)
{
	struct tipc_node *taken;

	addr ^= tipc_net(net)->random;
	for (;;) {
		taken = tipc_node_find(net, addr);
		if (!taken)
			break;
		tipc_node_put(taken);
		addr++;
	}
	return addr;
}

/* tipc_node_try_addr(): Check if addr can be used by peer, suggest other if not
 * @net: the applicable net namespace
 * @id: node identity of the peer asking for the address (NODE_ID_LEN bytes)
 * @addr: address the peer wants to use
 *
 * Returns suggested address if any, otherwise 0
 */
u32 tipc_node_try_addr(struct net *net, u8 *id, u32 addr)
{
	struct tipc_net *tn = tipc_net(net);
	struct tipc_node *n;
	bool preliminary;
	u32 sugg_addr;

	/* Suggest new address if some other peer is using this one */
	n = tipc_node_find(net, addr);
	if (n) {
		/* Same identity => the address already belongs to this peer */
		if (!memcmp(n->peer_id, id, NODE_ID_LEN))
			addr = 0;
		tipc_node_put(n);
		if (!addr)
			return 0;
		return tipc_node_suggest_addr(net, addr);
	}

	/* Suggest previously used address if peer is known */
	n = tipc_node_find_by_id(net, id);
	if (n) {
		/* Copy what we need before dropping the reference */
		sugg_addr = n->addr;
		preliminary = n->preliminary;
		tipc_node_put(n);
		if (!preliminary)
			return sugg_addr;
	}

	/* Even this node may be in conflict */
	if (tn->trial_addr == addr)
		return tipc_node_suggest_addr(net, addr);

	return 0;
}

void tipc_node_check_dest(struct net *net, u32 addr,
			  u8 *peer_id, struct tipc_bearer *b,
1066
			  u16 capabilities, u32 signature, u32 hash_mixes,
1067 1068
			  struct tipc_media_addr *maddr,
			  bool *respond, bool *dupl_addr)
1069
{
1070
	struct tipc_node *n;
1071
	struct tipc_link *l, *snd_l;
J
Jon Paul Maloy 已提交
1072
	struct tipc_link_entry *le;
1073 1074 1075 1076
	bool addr_match = false;
	bool sign_match = false;
	bool link_up = false;
	bool accept_addr = false;
1077
	bool reset = true;
1078
	char *if_name;
1079
	unsigned long intv;
1080
	u16 session;
J
Jon Paul Maloy 已提交
1081

1082 1083 1084
	*dupl_addr = false;
	*respond = false;

1085 1086
	n = tipc_node_create(net, addr, peer_id, capabilities, hash_mixes,
			     false);
1087 1088
	if (!n)
		return;
1089

J
Jon Paul Maloy 已提交
1090
	tipc_node_write_lock(n);
1091 1092 1093 1094 1095 1096 1097 1098 1099 1100 1101 1102 1103 1104 1105
	if (unlikely(!n->bc_entry.link)) {
		snd_l = tipc_bc_sndlink(net);
		if (!tipc_link_bc_create(net, tipc_own_addr(net),
					 addr, U16_MAX,
					 tipc_link_window(snd_l),
					 n->capabilities,
					 &n->bc_entry.inputq1,
					 &n->bc_entry.namedq, snd_l,
					 &n->bc_entry.link)) {
			pr_warn("Broadcast rcv link creation failed, no mem\n");
			tipc_node_write_unlock_fast(n);
			tipc_node_put(n);
			return;
		}
	}
1106

J
Jon Paul Maloy 已提交
1107
	le = &n->links[b->identity];
1108 1109

	/* Prepare to validate requesting node's signature and media address */
J
Jon Paul Maloy 已提交
1110
	l = le->link;
1111
	link_up = l && tipc_link_is_up(l);
J
Jon Paul Maloy 已提交
1112
	addr_match = l && !memcmp(&le->maddr, maddr, sizeof(*maddr));
1113 1114 1115 1116 1117 1118
	sign_match = (signature == n->signature);

	/* These three flags give us eight permutations: */

	if (sign_match && addr_match && link_up) {
		/* All is fine. Do nothing. */
1119
		reset = false;
1120 1121 1122
		/* Peer node is not a container/local namespace */
		if (!n->peer_hash_mix)
			n->peer_hash_mix = hash_mixes;
1123 1124 1125 1126 1127 1128 1129 1130 1131 1132 1133 1134 1135 1136 1137 1138 1139 1140 1141 1142 1143 1144 1145 1146 1147 1148 1149 1150 1151 1152 1153 1154 1155 1156 1157 1158 1159 1160 1161 1162 1163 1164 1165 1166 1167 1168 1169 1170 1171 1172 1173 1174 1175
	} else if (sign_match && addr_match && !link_up) {
		/* Respond. The link will come up in due time */
		*respond = true;
	} else if (sign_match && !addr_match && link_up) {
		/* Peer has changed i/f address without rebooting.
		 * If so, the link will reset soon, and the next
		 * discovery will be accepted. So we can ignore it.
		 * It may also be an cloned or malicious peer having
		 * chosen the same node address and signature as an
		 * existing one.
		 * Ignore requests until the link goes down, if ever.
		 */
		*dupl_addr = true;
	} else if (sign_match && !addr_match && !link_up) {
		/* Peer link has changed i/f address without rebooting.
		 * It may also be a cloned or malicious peer; we can't
		 * distinguish between the two.
		 * The signature is correct, so we must accept.
		 */
		accept_addr = true;
		*respond = true;
	} else if (!sign_match && addr_match && link_up) {
		/* Peer node rebooted. Two possibilities:
		 *  - Delayed re-discovery; this link endpoint has already
		 *    reset and re-established contact with the peer, before
		 *    receiving a discovery message from that node.
		 *    (The peer happened to receive one from this node first).
		 *  - The peer came back so fast that our side has not
		 *    discovered it yet. Probing from this side will soon
		 *    reset the link, since there can be no working link
		 *    endpoint at the peer end, and the link will re-establish.
		 *  Accept the signature, since it comes from a known peer.
		 */
		n->signature = signature;
	} else if (!sign_match && addr_match && !link_up) {
		/*  The peer node has rebooted.
		 *  Accept signature, since it is a known peer.
		 */
		n->signature = signature;
		*respond = true;
	} else if (!sign_match && !addr_match && link_up) {
		/* Peer rebooted with new address, or a new/duplicate peer.
		 * Ignore until the link goes down, if ever.
		 */
		*dupl_addr = true;
	} else if (!sign_match && !addr_match && !link_up) {
		/* Peer rebooted with new address, or it is a new peer.
		 * Accept signature and address.
		 */
		n->signature = signature;
		accept_addr = true;
		*respond = true;
	}
1176

1177 1178
	if (!accept_addr)
		goto exit;
1179

1180
	/* Now create new link if not already existing */
1181
	if (!l) {
1182
		if (n->link_cnt == 2)
J
Jon Paul Maloy 已提交
1183
			goto exit;
1184

1185
		if_name = strchr(b->name, ':') + 1;
1186
		get_random_bytes(&session, sizeof(u16));
1187
		if (!tipc_link_create(net, if_name, b->identity, b->tolerance,
1188
				      b->net_plane, b->mtu, b->priority,
1189
				      b->window, session,
1190
				      tipc_own_addr(net), addr, peer_id,
1191
				      n->capabilities,
1192 1193 1194
				      tipc_bc_sndlink(n->net), n->bc_entry.link,
				      &le->inputq,
				      &n->bc_entry.namedq, &l)) {
1195 1196 1197
			*respond = false;
			goto exit;
		}
T
Tuong Lien 已提交
1198
		trace_tipc_link_reset(l, TIPC_DUMP_ALL, "link created!");
J
Jon Paul Maloy 已提交
1199
		tipc_link_reset(l);
1200
		tipc_link_fsm_evt(l, LINK_RESET_EVT);
1201 1202
		if (n->state == NODE_FAILINGOVER)
			tipc_link_fsm_evt(l, LINK_FAILOVER_BEGIN_EVT);
J
Jon Paul Maloy 已提交
1203 1204
		le->link = l;
		n->link_cnt++;
1205
		tipc_node_calculate_timer(n, l);
1206 1207 1208
		if (n->link_cnt == 1) {
			intv = jiffies + msecs_to_jiffies(n->keepalive_intv);
			if (!mod_timer(&n->timer, intv))
1209
				tipc_node_get(n);
1210
		}
1211
	}
J
Jon Paul Maloy 已提交
1212
	memcpy(&le->maddr, maddr, sizeof(*maddr));
1213
exit:
J
Jon Paul Maloy 已提交
1214
	tipc_node_write_unlock(n);
1215
	if (reset && l && !tipc_link_is_reset(l))
1216
		tipc_node_link_down(n, b->identity, false);
1217
	tipc_node_put(n);
1218 1219
}

1220 1221 1222 1223 1224 1225 1226
/* tipc_node_delete_links - take down and delete the link on @bearer_id
 * for every node in the namespace's node list.
 *
 * The list is walked under rcu_read_lock().
 */
void tipc_node_delete_links(struct net *net, int bearer_id)
{
	struct tipc_net *tn = net_generic(net, tipc_net_id);
	struct tipc_node *n;

	rcu_read_lock();
	list_for_each_entry_rcu(n, &tn->node_list, list) {
		tipc_node_link_down(n, bearer_id, true);
	}
	rcu_read_unlock();
}

static void tipc_node_reset_links(struct tipc_node *n)
{
1234
	int i;
1235

J
Jon Maloy 已提交
1236
	pr_warn("Resetting all links to %x\n", n->addr);
1237

T
Tuong Lien 已提交
1238
	trace_tipc_node_reset_links(n, true, " ");
1239
	for (i = 0; i < MAX_BEARERS; i++) {
1240
		tipc_node_link_down(n, i, false);
1241 1242 1243
	}
}

1244 1245 1246
/* tipc_node_fsm_evt - node finite state machine
 * Determines when contact is allowed with peer node
 */
1247
static void tipc_node_fsm_evt(struct tipc_node *n, int evt)
1248 1249 1250 1251 1252 1253 1254 1255 1256 1257 1258 1259 1260 1261 1262
{
	int state = n->state;

	switch (state) {
	case SELF_DOWN_PEER_DOWN:
		switch (evt) {
		case SELF_ESTABL_CONTACT_EVT:
			state = SELF_UP_PEER_COMING;
			break;
		case PEER_ESTABL_CONTACT_EVT:
			state = SELF_COMING_PEER_UP;
			break;
		case SELF_LOST_CONTACT_EVT:
		case PEER_LOST_CONTACT_EVT:
			break;
J
Jon Paul Maloy 已提交
1263 1264 1265 1266
		case NODE_SYNCH_END_EVT:
		case NODE_SYNCH_BEGIN_EVT:
		case NODE_FAILOVER_BEGIN_EVT:
		case NODE_FAILOVER_END_EVT:
1267
		default:
J
Jon Paul Maloy 已提交
1268
			goto illegal_evt;
1269 1270 1271 1272 1273 1274 1275 1276 1277 1278
		}
		break;
	case SELF_UP_PEER_UP:
		switch (evt) {
		case SELF_LOST_CONTACT_EVT:
			state = SELF_DOWN_PEER_LEAVING;
			break;
		case PEER_LOST_CONTACT_EVT:
			state = SELF_LEAVING_PEER_DOWN;
			break;
J
Jon Paul Maloy 已提交
1279 1280 1281 1282 1283 1284
		case NODE_SYNCH_BEGIN_EVT:
			state = NODE_SYNCHING;
			break;
		case NODE_FAILOVER_BEGIN_EVT:
			state = NODE_FAILINGOVER;
			break;
1285 1286
		case SELF_ESTABL_CONTACT_EVT:
		case PEER_ESTABL_CONTACT_EVT:
J
Jon Paul Maloy 已提交
1287 1288
		case NODE_SYNCH_END_EVT:
		case NODE_FAILOVER_END_EVT:
1289 1290
			break;
		default:
J
Jon Paul Maloy 已提交
1291
			goto illegal_evt;
1292 1293 1294 1295 1296 1297 1298 1299 1300 1301 1302
		}
		break;
	case SELF_DOWN_PEER_LEAVING:
		switch (evt) {
		case PEER_LOST_CONTACT_EVT:
			state = SELF_DOWN_PEER_DOWN;
			break;
		case SELF_ESTABL_CONTACT_EVT:
		case PEER_ESTABL_CONTACT_EVT:
		case SELF_LOST_CONTACT_EVT:
			break;
J
Jon Paul Maloy 已提交
1303 1304 1305 1306
		case NODE_SYNCH_END_EVT:
		case NODE_SYNCH_BEGIN_EVT:
		case NODE_FAILOVER_BEGIN_EVT:
		case NODE_FAILOVER_END_EVT:
1307
		default:
J
Jon Paul Maloy 已提交
1308
			goto illegal_evt;
1309 1310 1311 1312 1313 1314 1315 1316
		}
		break;
	case SELF_UP_PEER_COMING:
		switch (evt) {
		case PEER_ESTABL_CONTACT_EVT:
			state = SELF_UP_PEER_UP;
			break;
		case SELF_LOST_CONTACT_EVT:
J
Jon Paul Maloy 已提交
1317
			state = SELF_DOWN_PEER_DOWN;
1318 1319 1320
			break;
		case SELF_ESTABL_CONTACT_EVT:
		case PEER_LOST_CONTACT_EVT:
J
Jon Paul Maloy 已提交
1321 1322
		case NODE_SYNCH_END_EVT:
		case NODE_FAILOVER_BEGIN_EVT:
1323 1324
			break;
		case NODE_SYNCH_BEGIN_EVT:
J
Jon Paul Maloy 已提交
1325
		case NODE_FAILOVER_END_EVT:
1326
		default:
J
Jon Paul Maloy 已提交
1327
			goto illegal_evt;
1328 1329 1330 1331 1332 1333 1334 1335
		}
		break;
	case SELF_COMING_PEER_UP:
		switch (evt) {
		case SELF_ESTABL_CONTACT_EVT:
			state = SELF_UP_PEER_UP;
			break;
		case PEER_LOST_CONTACT_EVT:
J
Jon Paul Maloy 已提交
1336
			state = SELF_DOWN_PEER_DOWN;
1337 1338 1339 1340
			break;
		case SELF_LOST_CONTACT_EVT:
		case PEER_ESTABL_CONTACT_EVT:
			break;
J
Jon Paul Maloy 已提交
1341 1342 1343 1344
		case NODE_SYNCH_END_EVT:
		case NODE_SYNCH_BEGIN_EVT:
		case NODE_FAILOVER_BEGIN_EVT:
		case NODE_FAILOVER_END_EVT:
1345
		default:
J
Jon Paul Maloy 已提交
1346
			goto illegal_evt;
1347 1348 1349 1350 1351 1352 1353 1354 1355 1356 1357
		}
		break;
	case SELF_LEAVING_PEER_DOWN:
		switch (evt) {
		case SELF_LOST_CONTACT_EVT:
			state = SELF_DOWN_PEER_DOWN;
			break;
		case SELF_ESTABL_CONTACT_EVT:
		case PEER_ESTABL_CONTACT_EVT:
		case PEER_LOST_CONTACT_EVT:
			break;
J
Jon Paul Maloy 已提交
1358 1359 1360 1361 1362 1363 1364 1365 1366 1367 1368 1369 1370 1371 1372 1373 1374 1375 1376 1377 1378 1379 1380 1381 1382
		case NODE_SYNCH_END_EVT:
		case NODE_SYNCH_BEGIN_EVT:
		case NODE_FAILOVER_BEGIN_EVT:
		case NODE_FAILOVER_END_EVT:
		default:
			goto illegal_evt;
		}
		break;
	case NODE_FAILINGOVER:
		switch (evt) {
		case SELF_LOST_CONTACT_EVT:
			state = SELF_DOWN_PEER_LEAVING;
			break;
		case PEER_LOST_CONTACT_EVT:
			state = SELF_LEAVING_PEER_DOWN;
			break;
		case NODE_FAILOVER_END_EVT:
			state = SELF_UP_PEER_UP;
			break;
		case NODE_FAILOVER_BEGIN_EVT:
		case SELF_ESTABL_CONTACT_EVT:
		case PEER_ESTABL_CONTACT_EVT:
			break;
		case NODE_SYNCH_BEGIN_EVT:
		case NODE_SYNCH_END_EVT:
1383
		default:
J
Jon Paul Maloy 已提交
1384 1385 1386 1387 1388 1389 1390 1391 1392 1393 1394 1395 1396 1397 1398 1399 1400 1401 1402 1403 1404 1405 1406 1407
			goto illegal_evt;
		}
		break;
	case NODE_SYNCHING:
		switch (evt) {
		case SELF_LOST_CONTACT_EVT:
			state = SELF_DOWN_PEER_LEAVING;
			break;
		case PEER_LOST_CONTACT_EVT:
			state = SELF_LEAVING_PEER_DOWN;
			break;
		case NODE_SYNCH_END_EVT:
			state = SELF_UP_PEER_UP;
			break;
		case NODE_FAILOVER_BEGIN_EVT:
			state = NODE_FAILINGOVER;
			break;
		case NODE_SYNCH_BEGIN_EVT:
		case SELF_ESTABL_CONTACT_EVT:
		case PEER_ESTABL_CONTACT_EVT:
			break;
		case NODE_FAILOVER_END_EVT:
		default:
			goto illegal_evt;
1408 1409 1410 1411 1412 1413
		}
		break;
	default:
		pr_err("Unknown node fsm state %x\n", state);
		break;
	}
T
Tuong Lien 已提交
1414
	trace_tipc_node_fsm(n->peer_id, n->state, state, evt);
1415
	n->state = state;
J
Jon Paul Maloy 已提交
1416 1417 1418 1419
	return;

illegal_evt:
	pr_err("Illegal node fsm evt %x in state %x\n", evt, state);
T
Tuong Lien 已提交
1420
	trace_tipc_node_fsm(n->peer_id, n->state, state, evt);
1421 1422
}

1423
static void node_lost_contact(struct tipc_node *n,
1424
			      struct sk_buff_head *inputq)
P
Per Liden 已提交
1425
{
1426
	struct tipc_sock_conn *conn, *safe;
1427
	struct tipc_link *l;
1428
	struct list_head *conns = &n->conn_sks;
1429 1430
	struct sk_buff *skb;
	uint i;
P
Per Liden 已提交
1431

J
Jon Maloy 已提交
1432
	pr_debug("Lost contact with %x\n", n->addr);
1433
	n->delete_at = jiffies + msecs_to_jiffies(NODE_CLEANUP_AFTER);
T
Tuong Lien 已提交
1434
	trace_tipc_node_lost_contact(n, true, " ");
1435

1436
	/* Clean up broadcast state */
1437
	tipc_bcast_remove_peer(n->net, n->bc_entry.link);
P
Per Liden 已提交
1438

1439
	/* Abort any ongoing link failover */
P
Per Liden 已提交
1440
	for (i = 0; i < MAX_BEARERS; i++) {
1441
		l = n->links[i].link;
1442 1443
		if (l)
			tipc_link_fsm_evt(l, LINK_FAILOVER_END_EVT);
P
Per Liden 已提交
1444
	}
1445

1446
	/* Notify publications from this node */
1447
	n->action_flags |= TIPC_NOTIFY_NODE_DOWN;
1448 1449
	n->peer_net = NULL;
	n->peer_hash_mix = 0;
1450 1451 1452
	/* Notify sockets connected to node */
	list_for_each_entry_safe(conn, safe, conns, list) {
		skb = tipc_msg_create(TIPC_CRITICAL_IMPORTANCE, TIPC_CONN_MSG,
1453
				      SHORT_H_SIZE, 0, tipc_own_addr(n->net),
1454 1455
				      conn->peer_node, conn->port,
				      conn->peer_port, TIPC_ERR_NO_NODE);
1456
		if (likely(skb))
1457
			skb_queue_tail(inputq, skb);
1458 1459 1460
		list_del(&conn->list);
		kfree(conn);
	}
P
Per Liden 已提交
1461 1462
}

E
Erik Hugne 已提交
1463 1464 1465 1466 1467 1468 1469 1470 1471
/**
 * tipc_node_get_linkname - get the name of a link
 *
 * @bearer_id: id of the bearer
 * @node: peer node address
 * @linkname: link name output buffer
 *
 * Returns 0 on success
 */
1472 1473
int tipc_node_get_linkname(struct net *net, u32 bearer_id, u32 addr,
			   char *linkname, size_t len)
E
Erik Hugne 已提交
1474 1475
{
	struct tipc_link *link;
1476
	int err = -EINVAL;
1477
	struct tipc_node *node = tipc_node_find(net, addr);
E
Erik Hugne 已提交
1478

1479 1480 1481 1482 1483 1484
	if (!node)
		return err;

	if (bearer_id >= MAX_BEARERS)
		goto exit;

J
Jon Paul Maloy 已提交
1485
	tipc_node_read_lock(node);
1486
	link = node->links[bearer_id].link;
E
Erik Hugne 已提交
1487
	if (link) {
1488
		strncpy(linkname, tipc_link_name(link), len);
1489
		err = 0;
E
Erik Hugne 已提交
1490
	}
J
Jon Paul Maloy 已提交
1491
	tipc_node_read_unlock(node);
1492
exit:
1493 1494
	tipc_node_put(node);
	return err;
E
Erik Hugne 已提交
1495
}
1496

1497
/* Caller should hold node lock for the passed node */
1498
static int __tipc_nl_add_node(struct tipc_nl_msg *msg, struct tipc_node *node)
1499 1500 1501 1502
{
	void *hdr;
	struct nlattr *attrs;

1503
	hdr = genlmsg_put(msg->skb, msg->portid, msg->seq, &tipc_genl_family,
1504 1505 1506 1507
			  NLM_F_MULTI, TIPC_NL_NODE_GET);
	if (!hdr)
		return -EMSGSIZE;

1508
	attrs = nla_nest_start_noflag(msg->skb, TIPC_NLA_NODE);
1509 1510 1511 1512 1513
	if (!attrs)
		goto msg_full;

	if (nla_put_u32(msg->skb, TIPC_NLA_NODE_ADDR, node->addr))
		goto attr_msg_full;
1514
	if (node_is_up(node))
1515 1516 1517 1518 1519 1520 1521 1522 1523 1524 1525 1526 1527 1528 1529 1530
		if (nla_put_flag(msg->skb, TIPC_NLA_NODE_UP))
			goto attr_msg_full;

	nla_nest_end(msg->skb, attrs);
	genlmsg_end(msg->skb, hdr);

	return 0;

attr_msg_full:
	nla_nest_cancel(msg->skb, attrs);
msg_full:
	genlmsg_cancel(msg->skb, hdr);

	return -EMSGSIZE;
}

1531 1532 1533 1534 1535 1536 1537 1538 1539 1540 1541 1542 1543 1544 1545 1546 1547 1548 1549 1550 1551 1552 1553 1554 1555 1556 1557 1558 1559 1560 1561 1562 1563 1564 1565 1566 1567 1568 1569 1570 1571 1572 1573 1574 1575 1576 1577 1578 1579 1580
static void tipc_lxc_xmit(struct net *peer_net, struct sk_buff_head *list)
{
	struct tipc_msg *hdr = buf_msg(skb_peek(list));
	struct sk_buff_head inputq;

	switch (msg_user(hdr)) {
	case TIPC_LOW_IMPORTANCE:
	case TIPC_MEDIUM_IMPORTANCE:
	case TIPC_HIGH_IMPORTANCE:
	case TIPC_CRITICAL_IMPORTANCE:
		if (msg_connected(hdr) || msg_named(hdr)) {
			tipc_loopback_trace(peer_net, list);
			spin_lock_init(&list->lock);
			tipc_sk_rcv(peer_net, list);
			return;
		}
		if (msg_mcast(hdr)) {
			tipc_loopback_trace(peer_net, list);
			skb_queue_head_init(&inputq);
			tipc_sk_mcast_rcv(peer_net, list, &inputq);
			__skb_queue_purge(list);
			skb_queue_purge(&inputq);
			return;
		}
		return;
	case MSG_FRAGMENTER:
		if (tipc_msg_assemble(list)) {
			tipc_loopback_trace(peer_net, list);
			skb_queue_head_init(&inputq);
			tipc_sk_mcast_rcv(peer_net, list, &inputq);
			__skb_queue_purge(list);
			skb_queue_purge(&inputq);
		}
		return;
	case GROUP_PROTOCOL:
	case CONN_MANAGER:
		tipc_loopback_trace(peer_net, list);
		spin_lock_init(&list->lock);
		tipc_sk_rcv(peer_net, list);
		return;
	case LINK_PROTOCOL:
	case NAME_DISTRIBUTOR:
	case TUNNEL_PROTOCOL:
	case BCAST_PROTOCOL:
		return;
	default:
		return;
	};
}

1581 1582 1583 1584 1585 1586
/**
 * tipc_node_xmit() is the general link level function for message sending
 * @net: the applicable net namespace
 * @list: chain of buffers containing message
 * @dnode: address of destination node
 * @selector: a number used for deterministic link selection
 * Consumes the buffer chain.
 * Returns 0 if success, otherwise: -ELINKCONG,-EHOSTUNREACH,-EMSGSIZE,-ENOBUFS
 */
int tipc_node_xmit(struct net *net, struct sk_buff_head *list,
		   u32 dnode, int selector)
{
	struct tipc_link_entry *le = NULL;
	struct tipc_node *n;
	struct sk_buff_head xmitq;
	bool node_up = false;
	int bearer_id;
	int rc;

	/* Destination is this node: deliver straight to the socket layer */
	if (in_own_node(net, dnode)) {
		tipc_loopback_trace(net, list);
		spin_lock_init(&list->lock);
		tipc_sk_rcv(net, list);
		return 0;
	}

	n = tipc_node_find(net, dnode);
	if (unlikely(!n)) {
		__skb_queue_purge(list);
		return -EHOSTUNREACH;
	}

	tipc_node_read_lock(n);
	node_up = node_is_up(n);
	if (node_up && n->peer_net && check_net(n->peer_net)) {
		/* xmit inner linux container */
		tipc_lxc_xmit(n->peer_net, list);
		/* Anything still on the list goes out over a link below */
		if (likely(skb_queue_empty(list))) {
			tipc_node_read_unlock(n);
			tipc_node_put(n);
			return 0;
		}
	}

	/* Lowest selector bit picks one of the two active link slots */
	bearer_id = n->active_links[selector & 1];
	if (unlikely(bearer_id == INVALID_BEARER_ID)) {
		tipc_node_read_unlock(n);
		tipc_node_put(n);
		__skb_queue_purge(list);
		return -EHOSTUNREACH;
	}

	__skb_queue_head_init(&xmitq);
	le = &n->links[bearer_id];
	spin_lock_bh(&le->lock);
	rc = tipc_link_xmit(le->link, list, &xmitq);
	spin_unlock_bh(&le->lock);
	tipc_node_read_unlock(n);

	/* -ENOBUFS takes the link down instead of transmitting */
	if (unlikely(rc == -ENOBUFS))
		tipc_node_link_down(n, bearer_id, false);
	else
		tipc_bearer_xmit(net, bearer_id, &xmitq, &le->maddr);

	tipc_node_put(n);

	return rc;
}

/* tipc_node_xmit_skb(): send single buffer to destination
 * Buffers sent via this function are generally TIPC_SYSTEM_IMPORTANCE
 * messages, which will not be rejected
 * The only exception is datagram messages rerouted after secondary
 * lookup, which are rare and safe to dispose of anyway.
 *
 * The result of tipc_node_xmit() is therefore deliberately ignored;
 * this function always returns 0.
 */
int tipc_node_xmit_skb(struct net *net, struct sk_buff *skb, u32 dnode,
		       u32 selector)
{
	struct sk_buff_head head;

	/* Wrap the single buffer in a one-element chain */
	__skb_queue_head_init(&head);
	__skb_queue_tail(&head, skb);
	tipc_node_xmit(net, &head, dnode, selector);
	return 0;
}

1667 1668 1669 1670 1671 1672 1673 1674 1675 1676 1677 1678 1679 1680 1681 1682
/* tipc_node_distr_xmit(): drain @xmitq, sending each buffer on its own
 * Every buffer is routed to the destination node found in its header, with
 * the header's origin port used as link selector.
 * Note: this is only for SYSTEM_IMPORTANCE messages, which cannot be rejected
 * Always returns 0.
 */
int tipc_node_distr_xmit(struct net *net, struct sk_buff_head *xmitq)
{
	struct sk_buff *buf;
	u32 sel, dest;

	for (buf = __skb_dequeue(xmitq); buf; buf = __skb_dequeue(xmitq)) {
		sel = msg_origport(buf_msg(buf));
		dest = msg_destnode(buf_msg(buf));
		tipc_node_xmit_skb(net, buf, dest, sel);
	}
	return 0;
}

1683 1684 1685 1686 1687 1688 1689 1690 1691 1692 1693
/* tipc_node_broadcast - send a copy of @skb to every peer node that is up
 * @net: the applicable net namespace
 * @skb: message to replicate; always freed before returning
 *
 * Walks the node list under rcu_read_lock(), skipping the own node and
 * nodes that are down. Each copy gets its destination node set before it
 * is sent. Replication stops at the first failed copy.
 */
void tipc_node_broadcast(struct net *net, struct sk_buff *skb)
{
	struct sk_buff *txskb;
	struct tipc_node *n;
	u32 dst;

	rcu_read_lock();
	list_for_each_entry_rcu(n, tipc_nodes(net), list) {
		dst = n->addr;
		if (in_own_node(net, dst))
			continue;
		if (!node_is_up(n))
			continue;
		txskb = pskb_copy(skb, GFP_ATOMIC);
		if (!txskb)
			break;
		msg_set_destnode(buf_msg(txskb), dst);
		tipc_node_xmit_skb(net, txskb, dst, 0);
	}
	rcu_read_unlock();

	kfree_skb(skb);
}

1707 1708 1709 1710 1711 1712 1713 1714 1715 1716 1717 1718 1719
static void tipc_node_mcast_rcv(struct tipc_node *n)
{
	struct tipc_bclink_entry *be = &n->bc_entry;

	/* 'arrvq' is under inputq2's lock protection */
	spin_lock_bh(&be->inputq2.lock);
	spin_lock_bh(&be->inputq1.lock);
	skb_queue_splice_tail_init(&be->inputq1, &be->arrvq);
	spin_unlock_bh(&be->inputq1.lock);
	spin_unlock_bh(&be->inputq2.lock);
	tipc_sk_mcast_rcv(n->net, &be->arrvq, &be->inputq2);
}

1720 1721 1722 1723 1724 1725 1726 1727 1728
/* tipc_node_bc_sync_rcv - feed a message header to the broadcast receive
 * link's sync handling and act on the result
 * @n: peer node
 * @hdr: header of the received message
 * @bearer_id: bearer whose unicast link carries any STATE reply
 * @xmitq: queue that receives the STATE message, if one is built
 *
 * A link-down result resets all links to the peer. A send-state result
 * builds a STATE message on the unicast link, unless the message is a
 * probe or no link exists on that bearer.
 */
static void tipc_node_bc_sync_rcv(struct tipc_node *n, struct tipc_msg *hdr,
				  int bearer_id, struct sk_buff_head *xmitq)
{
	struct tipc_link *ucl;
	int rc;

	rc = tipc_bcast_sync_rcv(n->net, n->bc_entry.link, hdr);

	if (rc & TIPC_LINK_DOWN_EVT) {
		tipc_node_reset_links(n);
		return;
	}

	if (!(rc & TIPC_LINK_SND_STATE))
		return;

	/* If probe message, a STATE response will be sent anyway */
	if (msg_probe(hdr))
		return;

	/* Produce a STATE message carrying broadcast NACK */
	tipc_node_read_lock(n);
	ucl = n->links[bearer_id].link;
	if (ucl)
		tipc_link_build_state_msg(ucl, xmitq);
	tipc_node_read_unlock(n);
}

1748 1749 1750 1751 1752 1753 1754 1755
/**
 * tipc_node_bc_rcv - process TIPC broadcast packet arriving from off-node
 * @net: the applicable net namespace
 * @skb: TIPC packet
 * @bearer_id: id of bearer message arrived on
 *
 * Invoked with no locks held.
 */
1756
static void tipc_node_bc_rcv(struct net *net, struct sk_buff *skb, int bearer_id)
1757 1758 1759 1760 1761 1762 1763 1764 1765 1766 1767 1768 1769 1770 1771 1772 1773 1774 1775 1776 1777 1778 1779 1780 1781 1782 1783
{
	int rc;
	struct sk_buff_head xmitq;
	struct tipc_bclink_entry *be;
	struct tipc_link_entry *le;
	struct tipc_msg *hdr = buf_msg(skb);
	int usr = msg_user(hdr);
	u32 dnode = msg_destnode(hdr);
	struct tipc_node *n;

	__skb_queue_head_init(&xmitq);

	/* If NACK for other node, let rcv link for that node peek into it */
	if ((usr == BCAST_PROTOCOL) && (dnode != tipc_own_addr(net)))
		n = tipc_node_find(net, dnode);
	else
		n = tipc_node_find(net, msg_prevnode(hdr));
	if (!n) {
		kfree_skb(skb);
		return;
	}
	be = &n->bc_entry;
	le = &n->links[bearer_id];

	rc = tipc_bcast_rcv(net, be->link, skb);

	/* Broadcast ACKs are sent on a unicast link */
1784
	if (rc & TIPC_LINK_SND_STATE) {
J
Jon Paul Maloy 已提交
1785
		tipc_node_read_lock(n);
1786
		tipc_link_build_state_msg(le->link, &xmitq);
J
Jon Paul Maloy 已提交
1787
		tipc_node_read_unlock(n);
1788 1789 1790 1791 1792
	}

	if (!skb_queue_empty(&xmitq))
		tipc_bearer_xmit(net, bearer_id, &xmitq, &le->maddr);

1793 1794
	if (!skb_queue_empty(&be->inputq1))
		tipc_node_mcast_rcv(n);
1795

1796 1797 1798 1799
	/* Handle NAME_DISTRIBUTOR messages sent from 1.7 nodes */
	if (!skb_queue_empty(&n->bc_entry.namedq))
		tipc_named_rcv(net, &n->bc_entry.namedq);

1800 1801 1802
	/* If reassembly or retransmission failure => reset all links to peer */
	if (rc & TIPC_LINK_DOWN_EVT)
		tipc_node_reset_links(n);
1803

1804 1805 1806
	tipc_node_put(n);
}

1807 1808 1809 1810
/**
 * tipc_node_check_state - check and if necessary update node state
 * @skb: TIPC packet
 * @bearer_id: identity of bearer delivering the packet
1811
 * Returns true if state and msg are ok, otherwise false
1812
 */
1813
static bool tipc_node_check_state(struct tipc_node *n, struct sk_buff *skb,
1814
				  int bearer_id, struct sk_buff_head *xmitq)
1815 1816
{
	struct tipc_msg *hdr = buf_msg(skb);
1817 1818
	int usr = msg_user(hdr);
	int mtyp = msg_type(hdr);
1819
	u16 oseqno = msg_seqno(hdr);
1820
	u16 exp_pkts = msg_msgcnt(hdr);
1821
	u16 rcv_nxt, syncpt, dlv_nxt, inputq_len;
1822
	int state = n->state;
1823
	struct tipc_link *l, *tnl, *pl = NULL;
1824
	struct tipc_media_addr *maddr;
1825
	int pb_id;
1826

T
Tuong Lien 已提交
1827 1828 1829 1830
	if (trace_tipc_node_check_state_enabled()) {
		trace_tipc_skb_dump(skb, false, "skb for node state check");
		trace_tipc_node_check_state(n, true, " ");
	}
1831 1832 1833
	l = n->links[bearer_id].link;
	if (!l)
		return false;
1834
	rcv_nxt = tipc_link_rcv_nxt(l);
1835 1836


1837 1838
	if (likely((state == SELF_UP_PEER_UP) && (usr != TUNNEL_PROTOCOL)))
		return true;
1839

1840
	/* Find parallel link, if any */
1841 1842 1843
	for (pb_id = 0; pb_id < MAX_BEARERS; pb_id++) {
		if ((pb_id != bearer_id) && n->links[pb_id].link) {
			pl = n->links[pb_id].link;
1844 1845 1846
			break;
		}
	}
1847

T
Tuong Lien 已提交
1848 1849 1850
	if (!tipc_link_validate_msg(l, hdr)) {
		trace_tipc_skb_dump(skb, false, "PROTO invalid (2)!");
		trace_tipc_link_dump(l, TIPC_DUMP_NONE, "PROTO invalid (2)!");
1851
		return false;
T
Tuong Lien 已提交
1852
	}
1853

J
Jon Paul Maloy 已提交
1854
	/* Check and update node accesibility if applicable */
1855 1856 1857 1858 1859 1860 1861 1862 1863 1864 1865 1866
	if (state == SELF_UP_PEER_COMING) {
		if (!tipc_link_is_up(l))
			return true;
		if (!msg_peer_link_is_up(hdr))
			return true;
		tipc_node_fsm_evt(n, PEER_ESTABL_CONTACT_EVT);
	}

	if (state == SELF_DOWN_PEER_LEAVING) {
		if (msg_peer_node_is_up(hdr))
			return false;
		tipc_node_fsm_evt(n, PEER_LOST_CONTACT_EVT);
1867
		return true;
1868 1869
	}

J
Jon Paul Maloy 已提交
1870 1871 1872
	if (state == SELF_LEAVING_PEER_DOWN)
		return false;

1873
	/* Ignore duplicate packets */
1874
	if ((usr != LINK_PROTOCOL) && less(oseqno, rcv_nxt))
1875 1876 1877 1878 1879
		return true;

	/* Initiate or update failover mode if applicable */
	if ((usr == TUNNEL_PROTOCOL) && (mtyp == FAILOVER_MSG)) {
		syncpt = oseqno + exp_pkts - 1;
1880
		if (pl && !tipc_link_is_reset(pl)) {
1881
			__tipc_node_link_down(n, &pb_id, xmitq, &maddr);
T
Tuong Lien 已提交
1882 1883
			trace_tipc_node_link_down(n, true,
						  "node link down <- failover!");
1884 1885
			tipc_skb_queue_splice_tail_init(tipc_link_inputq(pl),
							tipc_link_inputq(l));
1886
		}
1887

L
LUU Duc Canh 已提交
1888
		/* If parallel link was already down, and this happened before
1889 1890 1891 1892
		 * the tunnel link came up, node failover was never started.
		 * Ensure that a FAILOVER_MSG is sent to get peer out of
		 * NODE_FAILINGOVER state, also this node must accept
		 * TUNNEL_MSGs from peer.
L
LUU Duc Canh 已提交
1893
		 */
1894 1895 1896
		if (n->state != NODE_FAILINGOVER)
			tipc_node_link_failover(n, pl, l, xmitq);

1897 1898 1899 1900 1901 1902
		/* If pkts arrive out of order, use lowest calculated syncpt */
		if (less(syncpt, n->sync_point))
			n->sync_point = syncpt;
	}

	/* Open parallel link when tunnel link reaches synch point */
1903
	if ((n->state == NODE_FAILINGOVER) && tipc_link_is_up(l)) {
1904 1905
		if (!more(rcv_nxt, n->sync_point))
			return true;
1906 1907
		tipc_node_fsm_evt(n, NODE_FAILOVER_END_EVT);
		if (pl)
1908
			tipc_link_fsm_evt(pl, LINK_FAILOVER_END_EVT);
1909 1910 1911
		return true;
	}

1912 1913 1914 1915
	/* No synching needed if only one link */
	if (!pl || !tipc_link_is_up(pl))
		return true;

1916 1917
	/* Initiate synch mode if applicable */
	if ((usr == TUNNEL_PROTOCOL) && (mtyp == SYNCH_MSG) && (oseqno == 1)) {
1918 1919 1920 1921
		if (n->capabilities & TIPC_TUNNEL_ENHANCED)
			syncpt = msg_syncpt(hdr);
		else
			syncpt = msg_seqno(msg_inner_hdr(hdr)) + exp_pkts - 1;
1922
		if (!tipc_link_is_up(l))
1923
			__tipc_node_link_up(n, bearer_id, xmitq);
1924 1925
		if (n->state == SELF_UP_PEER_UP) {
			n->sync_point = syncpt;
1926
			tipc_link_fsm_evt(l, LINK_SYNCH_BEGIN_EVT);
1927 1928
			tipc_node_fsm_evt(n, NODE_SYNCH_BEGIN_EVT);
		}
1929
	}
1930 1931

	/* Open tunnel link when parallel link reaches synch point */
1932
	if (n->state == NODE_SYNCHING) {
1933 1934 1935 1936 1937 1938
		if (tipc_link_is_synching(l)) {
			tnl = l;
		} else {
			tnl = pl;
			pl = l;
		}
1939 1940
		inputq_len = skb_queue_len(tipc_link_inputq(pl));
		dlv_nxt = tipc_link_rcv_nxt(pl) - inputq_len;
1941
		if (more(dlv_nxt, n->sync_point)) {
1942
			tipc_link_fsm_evt(tnl, LINK_SYNCH_END_EVT);
1943 1944 1945
			tipc_node_fsm_evt(n, NODE_SYNCH_END_EVT);
			return true;
		}
1946 1947
		if (l == pl)
			return true;
1948 1949 1950 1951 1952 1953 1954
		if ((usr == TUNNEL_PROTOCOL) && (mtyp == SYNCH_MSG))
			return true;
		if (usr == LINK_PROTOCOL)
			return true;
		return false;
	}
	return true;
1955 1956
}

1957 1958 1959 1960 1961 1962 1963 1964 1965 1966 1967 1968 1969
/**
 * tipc_rcv - process TIPC packets/messages arriving from off-node
 * @net: the applicable net namespace
 * @skb: TIPC packet
 * @bearer: pointer to bearer message arrived on
 *
 * Invoked with no locks held. Bearer pointer must point to a valid bearer
 * structure (i.e. cannot be NULL), but bearer can be inactive.
 */
void tipc_rcv(struct net *net, struct sk_buff *skb, struct tipc_bearer *b)
{
	struct sk_buff_head xmitq;
	struct tipc_node *n;
1970
	struct tipc_msg *hdr;
1971
	int bearer_id = b->identity;
1972
	struct tipc_link_entry *le;
1973
	u32 self = tipc_own_addr(net);
1974 1975
	int usr, rc = 0;
	u16 bc_ack;
1976 1977 1978

	__skb_queue_head_init(&xmitq);

1979
	/* Ensure message is well-formed before touching the header */
1980
	TIPC_SKB_CB(skb)->validated = false;
1981
	if (unlikely(!tipc_msg_validate(&skb)))
1982
		goto discard;
1983 1984 1985
	hdr = buf_msg(skb);
	usr = msg_user(hdr);
	bc_ack = msg_bcast_ack(hdr);
1986

1987
	/* Handle arrival of discovery or broadcast packet */
1988
	if (unlikely(msg_non_seq(hdr))) {
1989 1990
		if (unlikely(usr == LINK_CONFIG))
			return tipc_disc_rcv(net, skb, b);
1991
		else
1992
			return tipc_node_bc_rcv(net, skb, bearer_id);
1993 1994
	}

1995 1996 1997 1998
	/* Discard unicast link messages destined for another node */
	if (unlikely(!msg_short(hdr) && (msg_destnode(hdr) != self)))
		goto discard;

1999 2000 2001 2002
	/* Locate neighboring node that sent packet */
	n = tipc_node_find(net, msg_prevnode(hdr));
	if (unlikely(!n))
		goto discard;
2003
	le = &n->links[bearer_id];
2004

2005 2006
	/* Ensure broadcast reception is in synch with peer's send state */
	if (unlikely(usr == LINK_PROTOCOL))
2007
		tipc_node_bc_sync_rcv(n, hdr, bearer_id, &xmitq);
2008
	else if (unlikely(tipc_link_acked(n->bc_entry.link) != bc_ack))
2009
		tipc_bcast_ack_rcv(net, n->bc_entry.link, hdr);
2010

J
Jon Paul Maloy 已提交
2011 2012 2013
	/* Receive packet directly if conditions permit */
	tipc_node_read_lock(n);
	if (likely((n->state == SELF_UP_PEER_UP) && (usr != TUNNEL_PROTOCOL))) {
J
Jon Paul Maloy 已提交
2014
		spin_lock_bh(&le->lock);
J
Jon Paul Maloy 已提交
2015 2016 2017 2018
		if (le->link) {
			rc = tipc_link_rcv(le->link, skb, &xmitq);
			skb = NULL;
		}
J
Jon Paul Maloy 已提交
2019
		spin_unlock_bh(&le->lock);
2020
	}
J
Jon Paul Maloy 已提交
2021 2022 2023 2024
	tipc_node_read_unlock(n);

	/* Check/update node state before receiving */
	if (unlikely(skb)) {
2025 2026
		if (unlikely(skb_linearize(skb)))
			goto discard;
J
Jon Paul Maloy 已提交
2027 2028 2029 2030 2031 2032 2033 2034 2035
		tipc_node_write_lock(n);
		if (tipc_node_check_state(n, skb, bearer_id, &xmitq)) {
			if (le->link) {
				rc = tipc_link_rcv(le->link, skb, &xmitq);
				skb = NULL;
			}
		}
		tipc_node_write_unlock(n);
	}
2036 2037

	if (unlikely(rc & TIPC_LINK_UP_EVT))
2038 2039
		tipc_node_link_up(n, bearer_id, &xmitq);

2040
	if (unlikely(rc & TIPC_LINK_DOWN_EVT))
2041
		tipc_node_link_down(n, bearer_id, false);
2042

2043 2044
	if (unlikely(!skb_queue_empty(&n->bc_entry.namedq)))
		tipc_named_rcv(net, &n->bc_entry.namedq);
2045

2046 2047 2048
	if (unlikely(!skb_queue_empty(&n->bc_entry.inputq1)))
		tipc_node_mcast_rcv(n);

2049 2050 2051 2052 2053 2054
	if (!skb_queue_empty(&le->inputq))
		tipc_sk_rcv(net, &le->inputq);

	if (!skb_queue_empty(&xmitq))
		tipc_bearer_xmit(net, bearer_id, &xmitq, &le->maddr);

2055 2056 2057 2058 2059
	tipc_node_put(n);
discard:
	kfree_skb(skb);
}

2060 2061
void tipc_node_apply_property(struct net *net, struct tipc_bearer *b,
			      int prop)
2062 2063 2064 2065 2066 2067 2068 2069 2070 2071 2072 2073 2074 2075
{
	struct tipc_net *tn = tipc_net(net);
	int bearer_id = b->identity;
	struct sk_buff_head xmitq;
	struct tipc_link_entry *e;
	struct tipc_node *n;

	__skb_queue_head_init(&xmitq);

	rcu_read_lock();

	list_for_each_entry_rcu(n, &tn->node_list, list) {
		tipc_node_write_lock(n);
		e = &n->links[bearer_id];
2076 2077 2078 2079 2080 2081 2082
		if (e->link) {
			if (prop == TIPC_NLA_PROP_TOL)
				tipc_link_set_tolerance(e->link, b->tolerance,
							&xmitq);
			else if (prop == TIPC_NLA_PROP_MTU)
				tipc_link_set_mtu(e->link, b->mtu);
		}
2083 2084 2085 2086 2087 2088 2089
		tipc_node_write_unlock(n);
		tipc_bearer_xmit(net, bearer_id, &xmitq, &e->maddr);
	}

	rcu_read_unlock();
}

2090 2091 2092 2093 2094
int tipc_nl_peer_rm(struct sk_buff *skb, struct genl_info *info)
{
	struct net *net = sock_net(skb->sk);
	struct tipc_net *tn = net_generic(net, tipc_net_id);
	struct nlattr *attrs[TIPC_NLA_NET_MAX + 1];
2095
	struct tipc_node *peer, *temp_node;
2096 2097 2098 2099 2100 2101 2102
	u32 addr;
	int err;

	/* We identify the peer by its net */
	if (!info->attrs[TIPC_NLA_NET])
		return -EINVAL;

2103 2104 2105
	err = nla_parse_nested_deprecated(attrs, TIPC_NLA_NET_MAX,
					  info->attrs[TIPC_NLA_NET],
					  tipc_nl_net_policy, info->extack);
2106 2107 2108 2109 2110 2111 2112 2113 2114 2115 2116 2117 2118 2119 2120 2121 2122 2123 2124 2125 2126 2127 2128 2129 2130 2131
	if (err)
		return err;

	if (!attrs[TIPC_NLA_NET_ADDR])
		return -EINVAL;

	addr = nla_get_u32(attrs[TIPC_NLA_NET_ADDR]);

	if (in_own_node(net, addr))
		return -ENOTSUPP;

	spin_lock_bh(&tn->node_list_lock);
	peer = tipc_node_find(net, addr);
	if (!peer) {
		spin_unlock_bh(&tn->node_list_lock);
		return -ENXIO;
	}

	tipc_node_write_lock(peer);
	if (peer->state != SELF_DOWN_PEER_DOWN &&
	    peer->state != SELF_DOWN_PEER_LEAVING) {
		tipc_node_write_unlock(peer);
		err = -EBUSY;
		goto err_out;
	}

2132
	tipc_node_clear_links(peer);
2133 2134 2135
	tipc_node_write_unlock(peer);
	tipc_node_delete(peer);

2136 2137 2138 2139 2140
	/* Calculate cluster capabilities */
	tn->capabilities = TIPC_NODE_CAPABILITIES;
	list_for_each_entry_rcu(temp_node, &tn->node_list, list) {
		tn->capabilities &= temp_node->capabilities;
	}
2141 2142 2143 2144 2145 2146 2147 2148
	err = 0;
err_out:
	tipc_node_put(peer);
	spin_unlock_bh(&tn->node_list_lock);

	return err;
}

2149 2150 2151
int tipc_nl_node_dump(struct sk_buff *skb, struct netlink_callback *cb)
{
	int err;
2152 2153
	struct net *net = sock_net(skb->sk);
	struct tipc_net *tn = net_generic(net, tipc_net_id);
2154 2155 2156 2157 2158 2159 2160 2161 2162 2163 2164 2165 2166
	int done = cb->args[0];
	int last_addr = cb->args[1];
	struct tipc_node *node;
	struct tipc_nl_msg msg;

	if (done)
		return 0;

	msg.skb = skb;
	msg.portid = NETLINK_CB(cb->skb).portid;
	msg.seq = cb->nlh->nlmsg_seq;

	rcu_read_lock();
2167 2168 2169 2170 2171 2172 2173 2174 2175 2176 2177 2178 2179 2180 2181
	if (last_addr) {
		node = tipc_node_find(net, last_addr);
		if (!node) {
			rcu_read_unlock();
			/* We never set seq or call nl_dump_check_consistent()
			 * this means that setting prev_seq here will cause the
			 * consistence check to fail in the netlink callback
			 * handler. Resulting in the NLMSG_DONE message having
			 * the NLM_F_DUMP_INTR flag set if the node state
			 * changed while we released the lock.
			 */
			cb->prev_seq = 1;
			return -EPIPE;
		}
		tipc_node_put(node);
2182 2183
	}

2184
	list_for_each_entry_rcu(node, &tn->node_list, list) {
2185 2186
		if (node->preliminary)
			continue;
2187 2188 2189 2190 2191 2192 2193
		if (last_addr) {
			if (node->addr == last_addr)
				last_addr = 0;
			else
				continue;
		}

J
Jon Paul Maloy 已提交
2194
		tipc_node_read_lock(node);
2195 2196 2197
		err = __tipc_nl_add_node(&msg, node);
		if (err) {
			last_addr = node->addr;
J
Jon Paul Maloy 已提交
2198
			tipc_node_read_unlock(node);
2199 2200 2201
			goto out;
		}

J
Jon Paul Maloy 已提交
2202
		tipc_node_read_unlock(node);
2203 2204 2205 2206 2207 2208 2209 2210 2211
	}
	done = 1;
out:
	cb->args[0] = done;
	cb->args[1] = last_addr;
	rcu_read_unlock();

	return skb->len;
}
2212

2213
/* tipc_node_find_by_name - locate owner node of link by link's name
2214 2215 2216 2217 2218 2219
 * @net: the applicable net namespace
 * @name: pointer to link name string
 * @bearer_id: pointer to index in 'node->links' array where the link was found.
 *
 * Returns pointer to node owning the link, or 0 if no matching link is found.
 */
2220 2221 2222
static struct tipc_node *tipc_node_find_by_name(struct net *net,
						const char *link_name,
						unsigned int *bearer_id)
2223 2224
{
	struct tipc_net *tn = net_generic(net, tipc_net_id);
2225 2226
	struct tipc_link *l;
	struct tipc_node *n;
2227 2228 2229 2230 2231
	struct tipc_node *found_node = NULL;
	int i;

	*bearer_id = 0;
	rcu_read_lock();
2232 2233
	list_for_each_entry_rcu(n, &tn->node_list, list) {
		tipc_node_read_lock(n);
2234
		for (i = 0; i < MAX_BEARERS; i++) {
2235 2236
			l = n->links[i].link;
			if (l && !strcmp(tipc_link_name(l), link_name)) {
2237
				*bearer_id = i;
2238
				found_node = n;
2239 2240 2241
				break;
			}
		}
2242
		tipc_node_read_unlock(n);
2243 2244 2245 2246 2247 2248 2249 2250 2251 2252 2253 2254 2255 2256 2257 2258
		if (found_node)
			break;
	}
	rcu_read_unlock();

	return found_node;
}

int tipc_nl_node_set_link(struct sk_buff *skb, struct genl_info *info)
{
	int err;
	int res = 0;
	int bearer_id;
	char *name;
	struct tipc_link *link;
	struct tipc_node *node;
2259
	struct sk_buff_head xmitq;
2260 2261 2262
	struct nlattr *attrs[TIPC_NLA_LINK_MAX + 1];
	struct net *net = sock_net(skb->sk);

2263 2264
	__skb_queue_head_init(&xmitq);

2265 2266 2267
	if (!info->attrs[TIPC_NLA_LINK])
		return -EINVAL;

2268 2269 2270
	err = nla_parse_nested_deprecated(attrs, TIPC_NLA_LINK_MAX,
					  info->attrs[TIPC_NLA_LINK],
					  tipc_nl_link_policy, info->extack);
2271 2272 2273 2274 2275 2276 2277 2278 2279 2280 2281
	if (err)
		return err;

	if (!attrs[TIPC_NLA_LINK_NAME])
		return -EINVAL;

	name = nla_data(attrs[TIPC_NLA_LINK_NAME]);

	if (strcmp(name, tipc_bclink_name) == 0)
		return tipc_nl_bc_link_set(net, attrs);

2282
	node = tipc_node_find_by_name(net, name, &bearer_id);
2283 2284 2285 2286 2287 2288 2289 2290 2291 2292 2293 2294 2295 2296 2297 2298 2299 2300 2301 2302 2303 2304 2305 2306 2307
	if (!node)
		return -EINVAL;

	tipc_node_read_lock(node);

	link = node->links[bearer_id].link;
	if (!link) {
		res = -EINVAL;
		goto out;
	}

	if (attrs[TIPC_NLA_LINK_PROP]) {
		struct nlattr *props[TIPC_NLA_PROP_MAX + 1];

		err = tipc_nl_parse_link_prop(attrs[TIPC_NLA_LINK_PROP],
					      props);
		if (err) {
			res = err;
			goto out;
		}

		if (props[TIPC_NLA_PROP_TOL]) {
			u32 tol;

			tol = nla_get_u32(props[TIPC_NLA_PROP_TOL]);
2308
			tipc_link_set_tolerance(link, tol, &xmitq);
2309 2310 2311 2312 2313
		}
		if (props[TIPC_NLA_PROP_PRIO]) {
			u32 prio;

			prio = nla_get_u32(props[TIPC_NLA_PROP_PRIO]);
2314
			tipc_link_set_prio(link, prio, &xmitq);
2315 2316 2317 2318 2319 2320 2321 2322 2323 2324 2325
		}
		if (props[TIPC_NLA_PROP_WIN]) {
			u32 win;

			win = nla_get_u32(props[TIPC_NLA_PROP_WIN]);
			tipc_link_set_queue_limits(link, win);
		}
	}

out:
	tipc_node_read_unlock(node);
2326
	tipc_bearer_xmit(net, bearer_id, &xmitq, &node->links[bearer_id].maddr);
2327 2328 2329 2330 2331 2332
	return res;
}

int tipc_nl_node_get_link(struct sk_buff *skb, struct genl_info *info)
{
	struct net *net = genl_info_net(info);
2333
	struct nlattr *attrs[TIPC_NLA_LINK_MAX + 1];
2334 2335 2336 2337 2338 2339 2340
	struct tipc_nl_msg msg;
	char *name;
	int err;

	msg.portid = info->snd_portid;
	msg.seq = info->snd_seq;

2341
	if (!info->attrs[TIPC_NLA_LINK])
2342
		return -EINVAL;
2343

2344 2345 2346
	err = nla_parse_nested_deprecated(attrs, TIPC_NLA_LINK_MAX,
					  info->attrs[TIPC_NLA_LINK],
					  tipc_nl_link_policy, info->extack);
2347 2348 2349 2350 2351 2352 2353
	if (err)
		return err;

	if (!attrs[TIPC_NLA_LINK_NAME])
		return -EINVAL;

	name = nla_data(attrs[TIPC_NLA_LINK_NAME]);
2354 2355 2356 2357 2358 2359 2360

	msg.skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
	if (!msg.skb)
		return -ENOMEM;

	if (strcmp(name, tipc_bclink_name) == 0) {
		err = tipc_nl_add_bc_link(net, &msg);
2361 2362
		if (err)
			goto err_free;
2363 2364 2365 2366 2367
	} else {
		int bearer_id;
		struct tipc_node *node;
		struct tipc_link *link;

2368
		node = tipc_node_find_by_name(net, name, &bearer_id);
2369 2370 2371 2372
		if (!node) {
			err = -EINVAL;
			goto err_free;
		}
2373 2374 2375 2376 2377

		tipc_node_read_lock(node);
		link = node->links[bearer_id].link;
		if (!link) {
			tipc_node_read_unlock(node);
2378 2379
			err = -EINVAL;
			goto err_free;
2380 2381 2382 2383
		}

		err = __tipc_nl_add_link(net, &msg, link, 0);
		tipc_node_read_unlock(node);
2384 2385
		if (err)
			goto err_free;
2386 2387 2388
	}

	return genlmsg_reply(msg.skb, info);
2389 2390 2391 2392

err_free:
	nlmsg_free(msg.skb);
	return err;
2393 2394 2395 2396 2397 2398 2399 2400 2401 2402 2403 2404 2405 2406 2407 2408
}

int tipc_nl_node_reset_link_stats(struct sk_buff *skb, struct genl_info *info)
{
	int err;
	char *link_name;
	unsigned int bearer_id;
	struct tipc_link *link;
	struct tipc_node *node;
	struct nlattr *attrs[TIPC_NLA_LINK_MAX + 1];
	struct net *net = sock_net(skb->sk);
	struct tipc_link_entry *le;

	if (!info->attrs[TIPC_NLA_LINK])
		return -EINVAL;

2409 2410 2411
	err = nla_parse_nested_deprecated(attrs, TIPC_NLA_LINK_MAX,
					  info->attrs[TIPC_NLA_LINK],
					  tipc_nl_link_policy, info->extack);
2412 2413 2414 2415 2416 2417 2418 2419 2420 2421 2422 2423 2424 2425 2426
	if (err)
		return err;

	if (!attrs[TIPC_NLA_LINK_NAME])
		return -EINVAL;

	link_name = nla_data(attrs[TIPC_NLA_LINK_NAME]);

	if (strcmp(link_name, tipc_bclink_name) == 0) {
		err = tipc_bclink_reset_stats(net);
		if (err)
			return err;
		return 0;
	}

2427
	node = tipc_node_find_by_name(net, link_name, &bearer_id);
2428 2429 2430 2431 2432 2433 2434 2435 2436 2437 2438 2439
	if (!node)
		return -EINVAL;

	le = &node->links[bearer_id];
	tipc_node_read_lock(node);
	spin_lock_bh(&le->lock);
	link = node->links[bearer_id].link;
	if (!link) {
		spin_unlock_bh(&le->lock);
		tipc_node_read_unlock(node);
		return -EINVAL;
	}
2440
	tipc_link_reset_stats(link);
2441 2442 2443 2444 2445 2446 2447 2448 2449 2450 2451 2452 2453 2454 2455 2456 2457 2458 2459 2460 2461 2462 2463 2464 2465 2466 2467 2468
	spin_unlock_bh(&le->lock);
	tipc_node_read_unlock(node);
	return 0;
}

/* __tipc_nl_add_node_links - add all links of one node to a netlink message
 * @net: the applicable net namespace
 * @msg: netlink message being filled
 * @node: node whose 'links' array is walked
 * @prev_link: in: index to start from; out: index of the entry that failed,
 *             or 0 once every entry has been processed
 *
 * Caller should hold node lock.
 *
 * Returns 0 on success, otherwise the error from __tipc_nl_add_link().
 */
static int __tipc_nl_add_node_links(struct net *net, struct tipc_nl_msg *msg,
				    struct tipc_node *node, u32 *prev_link)
{
	u32 idx = *prev_link;
	int err;

	while (idx < MAX_BEARERS) {
		/* Remember where to resume if this entry does not fit */
		*prev_link = idx;

		if (node->links[idx].link) {
			err = __tipc_nl_add_link(net, msg,
						 node->links[idx].link,
						 NLM_F_MULTI);
			if (err)
				return err;
		}
		idx++;
	}
	*prev_link = 0;

	return 0;
}

2469
int tipc_nl_node_dump_link(struct sk_buff *skb, struct netlink_callback *cb)
2470 2471 2472 2473 2474 2475 2476 2477 2478 2479 2480 2481 2482 2483 2484 2485 2486 2487 2488 2489 2490 2491 2492 2493 2494 2495 2496 2497 2498 2499 2500 2501 2502 2503 2504 2505 2506 2507 2508 2509 2510 2511 2512 2513 2514 2515 2516 2517 2518 2519 2520 2521 2522 2523 2524 2525 2526 2527 2528 2529 2530 2531 2532 2533 2534 2535 2536 2537 2538
{
	struct net *net = sock_net(skb->sk);
	struct tipc_net *tn = net_generic(net, tipc_net_id);
	struct tipc_node *node;
	struct tipc_nl_msg msg;
	u32 prev_node = cb->args[0];
	u32 prev_link = cb->args[1];
	int done = cb->args[2];
	int err;

	if (done)
		return 0;

	msg.skb = skb;
	msg.portid = NETLINK_CB(cb->skb).portid;
	msg.seq = cb->nlh->nlmsg_seq;

	rcu_read_lock();
	if (prev_node) {
		node = tipc_node_find(net, prev_node);
		if (!node) {
			/* We never set seq or call nl_dump_check_consistent()
			 * this means that setting prev_seq here will cause the
			 * consistence check to fail in the netlink callback
			 * handler. Resulting in the last NLMSG_DONE message
			 * having the NLM_F_DUMP_INTR flag set.
			 */
			cb->prev_seq = 1;
			goto out;
		}
		tipc_node_put(node);

		list_for_each_entry_continue_rcu(node, &tn->node_list,
						 list) {
			tipc_node_read_lock(node);
			err = __tipc_nl_add_node_links(net, &msg, node,
						       &prev_link);
			tipc_node_read_unlock(node);
			if (err)
				goto out;

			prev_node = node->addr;
		}
	} else {
		err = tipc_nl_add_bc_link(net, &msg);
		if (err)
			goto out;

		list_for_each_entry_rcu(node, &tn->node_list, list) {
			tipc_node_read_lock(node);
			err = __tipc_nl_add_node_links(net, &msg, node,
						       &prev_link);
			tipc_node_read_unlock(node);
			if (err)
				goto out;

			prev_node = node->addr;
		}
	}
	done = 1;
out:
	rcu_read_unlock();

	cb->args[0] = prev_node;
	cb->args[1] = prev_link;
	cb->args[2] = done;

	return skb->len;
}
2539 2540 2541 2542 2543 2544 2545 2546 2547 2548

int tipc_nl_node_set_monitor(struct sk_buff *skb, struct genl_info *info)
{
	struct nlattr *attrs[TIPC_NLA_MON_MAX + 1];
	struct net *net = sock_net(skb->sk);
	int err;

	if (!info->attrs[TIPC_NLA_MON])
		return -EINVAL;

2549 2550 2551 2552
	err = nla_parse_nested_deprecated(attrs, TIPC_NLA_MON_MAX,
					  info->attrs[TIPC_NLA_MON],
					  tipc_nl_monitor_policy,
					  info->extack);
2553 2554 2555 2556 2557 2558 2559 2560 2561 2562 2563 2564 2565 2566
	if (err)
		return err;

	if (attrs[TIPC_NLA_MON_ACTIVATION_THRESHOLD]) {
		u32 val;

		val = nla_get_u32(attrs[TIPC_NLA_MON_ACTIVATION_THRESHOLD]);
		err = tipc_nl_monitor_set_threshold(net, val);
		if (err)
			return err;
	}

	return 0;
}
2567 2568 2569 2570 2571 2572 2573 2574 2575 2576 2577 2578

static int __tipc_nl_add_monitor_prop(struct net *net, struct tipc_nl_msg *msg)
{
	struct nlattr *attrs;
	void *hdr;
	u32 val;

	hdr = genlmsg_put(msg->skb, msg->portid, msg->seq, &tipc_genl_family,
			  0, TIPC_NL_MON_GET);
	if (!hdr)
		return -EMSGSIZE;

2579
	attrs = nla_nest_start_noflag(msg->skb, TIPC_NLA_MON);
2580 2581 2582 2583 2584 2585 2586 2587 2588 2589 2590 2591 2592 2593 2594 2595 2596 2597 2598 2599 2600 2601 2602 2603 2604 2605 2606 2607
	if (!attrs)
		goto msg_full;

	val = tipc_nl_monitor_get_threshold(net);

	if (nla_put_u32(msg->skb, TIPC_NLA_MON_ACTIVATION_THRESHOLD, val))
		goto attr_msg_full;

	nla_nest_end(msg->skb, attrs);
	genlmsg_end(msg->skb, hdr);

	return 0;

attr_msg_full:
	nla_nest_cancel(msg->skb, attrs);
msg_full:
	genlmsg_cancel(msg->skb, hdr);

	return -EMSGSIZE;
}

int tipc_nl_node_get_monitor(struct sk_buff *skb, struct genl_info *info)
{
	struct net *net = sock_net(skb->sk);
	struct tipc_nl_msg msg;
	int err;

	msg.skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
P
Pan Bian 已提交
2608 2609
	if (!msg.skb)
		return -ENOMEM;
2610 2611 2612 2613 2614 2615 2616 2617 2618 2619 2620
	msg.portid = info->snd_portid;
	msg.seq = info->snd_seq;

	err = __tipc_nl_add_monitor_prop(net, &msg);
	if (err) {
		nlmsg_free(msg.skb);
		return err;
	}

	return genlmsg_reply(msg.skb, info);
}
2621 2622 2623 2624 2625 2626

/**
 * tipc_nl_node_dump_monitor - netlink dump callback listing bearer monitors
 * @skb: message buffer the monitor entries are added to
 * @cb: dump state; args[0] is the bearer id to resume at, and equals
 *      MAX_BEARERS once every bearer has been handled
 *
 * Return: skb->len, or 0 once the dump has completed.
 */
int tipc_nl_node_dump_monitor(struct sk_buff *skb, struct netlink_callback *cb)
{
	struct net *net = sock_net(skb->sk);
	u32 prev_bearer = cb->args[0];
	struct tipc_nl_msg msg;
	int bearer_id;

	if (prev_bearer == MAX_BEARERS)
		return 0;

	msg.skb = skb;
	msg.portid = NETLINK_CB(cb->skb).portid;
	msg.seq = cb->nlh->nlmsg_seq;

	rtnl_lock();
	/* Stop at the first bearer that cannot be added; resume there later */
	bearer_id = prev_bearer;
	while (bearer_id < MAX_BEARERS &&
	       !__tipc_nl_add_monitor(net, &msg, bearer_id))
		bearer_id++;
	rtnl_unlock();
	cb->args[0] = bearer_id;

	return skb->len;
}

int tipc_nl_node_dump_monitor_peer(struct sk_buff *skb,
				   struct netlink_callback *cb)
{
	struct net *net = sock_net(skb->sk);
	u32 prev_node = cb->args[1];
	u32 bearer_id = cb->args[2];
	int done = cb->args[0];
	struct tipc_nl_msg msg;
	int err;

	if (!prev_node) {
2660
		struct nlattr **attrs = genl_dumpit_info(cb)->attrs;
2661 2662 2663 2664 2665
		struct nlattr *mon[TIPC_NLA_MON_MAX + 1];

		if (!attrs[TIPC_NLA_MON])
			return -EINVAL;

2666 2667 2668 2669
		err = nla_parse_nested_deprecated(mon, TIPC_NLA_MON_MAX,
						  attrs[TIPC_NLA_MON],
						  tipc_nl_monitor_policy,
						  NULL);
2670 2671 2672 2673 2674 2675 2676 2677 2678 2679 2680 2681 2682 2683 2684 2685 2686 2687 2688 2689 2690 2691 2692 2693 2694 2695 2696 2697 2698 2699 2700
		if (err)
			return err;

		if (!mon[TIPC_NLA_MON_REF])
			return -EINVAL;

		bearer_id = nla_get_u32(mon[TIPC_NLA_MON_REF]);

		if (bearer_id >= MAX_BEARERS)
			return -EINVAL;
	}

	if (done)
		return 0;

	msg.skb = skb;
	msg.portid = NETLINK_CB(cb->skb).portid;
	msg.seq = cb->nlh->nlmsg_seq;

	rtnl_lock();
	err = tipc_nl_add_monitor_peer(net, &msg, bearer_id, &prev_node);
	if (!err)
		done = 1;

	rtnl_unlock();
	cb->args[0] = done;
	cb->args[1] = prev_node;
	cb->args[2] = bearer_id;

	return skb->len;
}
T
Tuong Lien 已提交
2701 2702 2703 2704 2705 2706 2707 2708 2709 2710 2711 2712 2713 2714 2715 2716 2717 2718 2719 2720 2721 2722 2723 2724 2725 2726 2727 2728 2729 2730 2731 2732 2733 2734 2735 2736 2737 2738 2739 2740 2741 2742 2743 2744 2745 2746 2747 2748 2749 2750 2751 2752 2753 2754 2755 2756 2757

/**
 * tipc_node_dump - dump TIPC node data
 * @n: tipc node to be dumped
 * @more: dump more?
 *        - false: dump only tipc node data
 *        - true: dump node link data as well
 * @buf: returned buffer of dump data in format
 *
 * The size limit passed to the bounded print helpers is NODE_LMAX when
 * @more is set and NODE_LMIN otherwise.
 *
 * Return: the sum of the lengths reported by the individual print helpers.
 */
int tipc_node_dump(struct tipc_node *n, bool more, char *buf)
{
	size_t sz = more ? NODE_LMAX : NODE_LMIN;
	int len = 0;

	if (!n)
		return scnprintf(buf, sz, "node data: (null)\n");

	/* One-line summary of the node's own state */
	len += scnprintf(buf, sz, "node data: %x", n->addr);
	len += scnprintf(buf + len, sz - len, " %x", n->state);
	len += scnprintf(buf + len, sz - len, " %d", n->active_links[0]);
	len += scnprintf(buf + len, sz - len, " %d", n->active_links[1]);
	len += scnprintf(buf + len, sz - len, " %x", n->action_flags);
	len += scnprintf(buf + len, sz - len, " %u", n->failover_sent);
	len += scnprintf(buf + len, sz - len, " %u", n->sync_point);
	len += scnprintf(buf + len, sz - len, " %d", n->link_cnt);
	len += scnprintf(buf + len, sz - len, " %u", n->working_links);
	len += scnprintf(buf + len, sz - len, " %x", n->capabilities);
	len += scnprintf(buf + len, sz - len, " %lu\n", n->keepalive_intv);

	if (!more)
		return len;

	/* First link entry */
	len += scnprintf(buf + len, sz - len, "link_entry[0]:\n");
	len += scnprintf(buf + len, sz - len, " mtu: %u\n", n->links[0].mtu);
	len += scnprintf(buf + len, sz - len, " media: ");
	len += tipc_media_addr_printf(buf + len, sz - len,
				      &n->links[0].maddr);
	len += scnprintf(buf + len, sz - len, "\n");
	len += tipc_link_dump(n->links[0].link, TIPC_DUMP_NONE, buf + len);
	len += scnprintf(buf + len, sz - len, " inputq: ");
	len += tipc_list_dump(&n->links[0].inputq, false, buf + len);

	/* Second link entry */
	len += scnprintf(buf + len, sz - len, "link_entry[1]:\n");
	len += scnprintf(buf + len, sz - len, " mtu: %u\n", n->links[1].mtu);
	len += scnprintf(buf + len, sz - len, " media: ");
	len += tipc_media_addr_printf(buf + len, sz - len,
				      &n->links[1].maddr);
	len += scnprintf(buf + len, sz - len, "\n");
	len += tipc_link_dump(n->links[1].link, TIPC_DUMP_NONE, buf + len);
	len += scnprintf(buf + len, sz - len, " inputq: ");
	len += tipc_list_dump(&n->links[1].inputq, false, buf + len);

	/* Broadcast link */
	len += scnprintf(buf + len, sz - len, "bclink:\n ");
	len += tipc_link_dump(n->bc_entry.link, TIPC_DUMP_NONE, buf + len);

	return len;
}
2758 2759 2760 2761 2762 2763 2764 2765 2766 2767 2768 2769 2770 2771 2772 2773 2774 2775 2776 2777 2778 2779 2780 2781 2782 2783 2784 2785 2786 2787

/**
 * tipc_node_pre_cleanup_net - drop references to a namespace that is exiting
 * @exit_net: the net namespace being torn down
 *
 * For every other namespace that has TIPC state, the first node whose
 * peer_net points at @exit_net gets peer_net and peer_hash_mix cleared.
 */
void tipc_node_pre_cleanup_net(struct net *exit_net)
{
	struct tipc_net *tn;
	struct tipc_node *n;
	struct net *other;

	rcu_read_lock();
	for_each_net_rcu(other) {
		if (other == exit_net)
			continue;

		tn = tipc_net(other);
		if (!tn)
			continue;

		spin_lock_bh(&tn->node_list_lock);
		list_for_each_entry_rcu(n, &tn->node_list, list) {
			if (!n->peer_net || n->peer_net != exit_net)
				continue;

			tipc_node_write_lock(n);
			n->peer_net = NULL;
			n->peer_hash_mix = 0;
			tipc_node_write_unlock_fast(n);
			/* Only the first matching node per namespace */
			break;
		}
		spin_unlock_bh(&tn->node_list_lock);
	}
	rcu_read_unlock();
}