host.c 14.6 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13
/*
 * linux/fs/lockd/host.c
 *
 * Management for NLM peer hosts. The nlm_host struct is shared
 * between client and server implementation. The only reason to
 * do so is to reduce code bloat.
 *
 * Copyright (C) 1996, Olaf Kirch <okir@monad.swb.de>
 */

#include <linux/types.h>
#include <linux/slab.h>
#include <linux/in.h>
14
#include <linux/in6.h>
L
Linus Torvalds 已提交
15 16 17 18
#include <linux/sunrpc/clnt.h>
#include <linux/sunrpc/svc.h>
#include <linux/lockd/lockd.h>
#include <linux/lockd/sm_inter.h>
I
Ingo Molnar 已提交
19
#include <linux/mutex.h>
L
Linus Torvalds 已提交
20

21
#include <net/ipv6.h>
L
Linus Torvalds 已提交
22 23 24 25 26

#define NLMDBG_FACILITY		NLMDBG_HOSTCACHE
#define NLM_HOST_NRHASH		32
#define NLM_ADDRHASH(addr)	(ntohl(addr) & (NLM_HOST_NRHASH-1))
#define NLM_HOST_REBIND		(60 * HZ)
27 28
#define NLM_HOST_EXPIRE		(300 * HZ)
#define NLM_HOST_COLLECT	(120 * HZ)
L
Linus Torvalds 已提交
29

30
static struct hlist_head	nlm_hosts[NLM_HOST_NRHASH];
L
Linus Torvalds 已提交
31 32
static unsigned long		next_gc;
static int			nrhosts;
I
Ingo Molnar 已提交
33
static DEFINE_MUTEX(nlm_host_mutex);
L
Linus Torvalds 已提交
34 35 36


static void			nlm_gc_hosts(void);
37
static struct nsm_handle *	__nsm_find(const struct sockaddr_in *,
38
					const char *, unsigned int, int);
39 40
static struct nsm_handle *	nsm_find(const struct sockaddr_in *sin,
					 const char *hostname,
41
					 unsigned int hostname_len);
L
Linus Torvalds 已提交
42

43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68
/*
 * Write a printable form of the address in @sap into @buf, which holds
 * @len bytes.  IPv4 and v4-mapped IPv6 addresses are shown as dotted
 * quads, other IPv6 addresses in NIP6_FMT form; AF_UNSPEC and unknown
 * families produce a fixed descriptive string instead.
 */
static void nlm_display_address(const struct sockaddr *sap,
				char *buf, const size_t len)
{
	const struct sockaddr_in *in4 = (const struct sockaddr_in *)sap;
	const struct sockaddr_in6 *in6 = (const struct sockaddr_in6 *)sap;

	switch (sap->sa_family) {
	case AF_INET:
		snprintf(buf, len, NIPQUAD_FMT, NIPQUAD(in4->sin_addr.s_addr));
		return;
	case AF_INET6:
		if (!ipv6_addr_v4mapped(&in6->sin6_addr)) {
			snprintf(buf, len, NIP6_FMT, NIP6(in6->sin6_addr));
			return;
		}
		/* v4-mapped: the IPv4 address lives in the last 32-bit word */
		snprintf(buf, len, NIPQUAD_FMT,
			 NIPQUAD(in6->sin6_addr.s6_addr32[3]));
		return;
	case AF_UNSPEC:
		snprintf(buf, len, "unspecified");
		return;
	default:
		snprintf(buf, len, "unsupported address family");
		return;
	}
}

L
Linus Torvalds 已提交
69 70 71
/*
 * Common host lookup routine for server & client
 */
72 73 74 75 76 77
static struct nlm_host *nlm_lookup_host(int server,
					const struct sockaddr_in *sin,
					int proto, u32 version,
					const char *hostname,
					unsigned int hostname_len,
					const struct sockaddr_in *ssin)
L
Linus Torvalds 已提交
78
{
79 80 81
	struct hlist_head *chain;
	struct hlist_node *pos;
	struct nlm_host	*host;
82
	struct nsm_handle *nsm = NULL;
L
Linus Torvalds 已提交
83 84
	int		hash;

85 86 87 88
	dprintk("lockd: nlm_lookup_host(proto=%d, vers=%u,"
			" my role is %s, hostname=%.*s)\n",
			proto, version, server ? "server" : "client",
			hostname_len, hostname ? hostname : "<none>");
L
Linus Torvalds 已提交
89 90 91 92

	hash = NLM_ADDRHASH(sin->sin_addr.s_addr);

	/* Lock hash table */
I
Ingo Molnar 已提交
93
	mutex_lock(&nlm_host_mutex);
L
Linus Torvalds 已提交
94 95 96 97

	if (time_after_eq(jiffies, next_gc))
		nlm_gc_hosts();

98 99 100 101 102 103 104
	/* We may keep several nlm_host objects for a peer, because each
	 * nlm_host is identified by
	 * (address, protocol, version, server/client)
	 * We could probably simplify this a little by putting all those
	 * different NLM rpc_clients into one single nlm_host object.
	 * This would allow us to have one nlm_host per address.
	 */
105 106
	chain = &nlm_hosts[hash];
	hlist_for_each_entry(host, pos, chain, h_hash) {
107 108 109 110
		if (!nlm_cmp_addr(&host->h_addr, sin))
			continue;

		/* See if we have an NSM handle for this client */
111 112
		if (!nsm)
			nsm = host->h_nsmhandle;
113

L
Linus Torvalds 已提交
114 115 116 117 118 119
		if (host->h_proto != proto)
			continue;
		if (host->h_version != version)
			continue;
		if (host->h_server != server)
			continue;
120 121
		if (!nlm_cmp_addr(&host->h_saddr, ssin))
			continue;
L
Linus Torvalds 已提交
122

123 124 125 126
		/* Move to head of hash chain. */
		hlist_del(&host->h_hash);
		hlist_add_head(&host->h_hash, chain);

127
		nlm_get_host(host);
128 129
		dprintk("lockd: nlm_lookup_host found host %s (%s)\n",
				host->h_name, host->h_addrbuf);
130
		goto out;
L
Linus Torvalds 已提交
131 132
	}

133 134 135
	/*
	 * The host wasn't in our hash table.  If we don't
	 * have an NSM handle for it yet, create one.
136
	 */
137 138 139 140 141
	if (nsm)
		atomic_inc(&nsm->sm_count);
	else {
		host = NULL;
		nsm = nsm_find(sin, hostname, hostname_len);
142 143 144
		if (!nsm) {
			dprintk("lockd: nlm_lookup_host failed; "
				"no nsm handle\n");
145
			goto out;
146
		}
147
	}
L
Linus Torvalds 已提交
148

149
	host = kzalloc(sizeof(*host), GFP_KERNEL);
150 151
	if (!host) {
		nsm_release(nsm);
152
		dprintk("lockd: nlm_lookup_host failed; no memory\n");
153 154 155
		goto out;
	}
	host->h_name	   = nsm->sm_name;
L
Linus Torvalds 已提交
156 157
	host->h_addr       = *sin;
	host->h_addr.sin_port = 0;	/* ouch! */
158
	host->h_saddr	   = *ssin;
L
Linus Torvalds 已提交
159 160 161
	host->h_version    = version;
	host->h_proto      = proto;
	host->h_rpcclnt    = NULL;
T
Trond Myklebust 已提交
162
	mutex_init(&host->h_mutex);
L
Linus Torvalds 已提交
163 164 165 166
	host->h_nextrebind = jiffies + NLM_HOST_REBIND;
	host->h_expires    = jiffies + NLM_HOST_EXPIRE;
	atomic_set(&host->h_count, 1);
	init_waitqueue_head(&host->h_gracewait);
T
Trond Myklebust 已提交
167
	init_rwsem(&host->h_rwsem);
L
Linus Torvalds 已提交
168 169
	host->h_state      = 0;			/* pseudo NSM state */
	host->h_nsmstate   = 0;			/* real NSM state */
170
	host->h_nsmhandle  = nsm;
L
Linus Torvalds 已提交
171
	host->h_server	   = server;
172
	hlist_add_head(&host->h_hash, chain);
L
Linus Torvalds 已提交
173 174
	INIT_LIST_HEAD(&host->h_lockowners);
	spin_lock_init(&host->h_lock);
175 176
	INIT_LIST_HEAD(&host->h_granted);
	INIT_LIST_HEAD(&host->h_reclaim);
L
Linus Torvalds 已提交
177

178
	nrhosts++;
179 180 181 182 183 184 185 186 187

	nlm_display_address((struct sockaddr *)&host->h_addr,
				host->h_addrbuf, sizeof(host->h_addrbuf));
	nlm_display_address((struct sockaddr *)&host->h_saddr,
				host->h_saddrbuf, sizeof(host->h_saddrbuf));

	dprintk("lockd: nlm_lookup_host created host %s\n",
			host->h_name);

188
out:
I
Ingo Molnar 已提交
189
	mutex_unlock(&nlm_host_mutex);
L
Linus Torvalds 已提交
190 191 192
	return host;
}

193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208
/*
 * Destroy a host
 *
 * The host must have no lock owners and a zero reference count; both
 * conditions are enforced with BUG_ON.  Shuts down the host's RPC
 * client, if one was created, and frees the host.
 */
static void
nlm_destroy_host(struct nlm_host *host)
{
	BUG_ON(!list_empty(&host->h_lockowners));
	BUG_ON(atomic_read(&host->h_count));

	/*
	 * Release NSM handle and unmonitor host.
	 */
	nsm_unmonitor(host);

	if (host->h_rpcclnt != NULL)
		rpc_shutdown_client(host->h_rpcclnt);

	kfree(host);
}

215 216 217
/*
 * Find an NLM server handle in the cache. If there is none, create it.
 */
218 219 220 221
struct nlm_host *nlmclnt_lookup_host(const struct sockaddr_in *sin,
				     int proto, u32 version,
				     const char *hostname,
				     unsigned int hostname_len)
222
{
223 224
	struct sockaddr_in ssin = {0};

225
	return nlm_lookup_host(0, sin, proto, version,
226
			       hostname, hostname_len, &ssin);
227 228 229 230 231 232 233
}

/*
 * Find an NLM client handle in the cache. If there is none, create it.
 */
struct nlm_host *
nlmsvc_lookup_host(struct svc_rqst *rqstp,
234
			const char *hostname, unsigned int hostname_len)
235
{
236 237 238
	struct sockaddr_in ssin = {0};

	ssin.sin_addr = rqstp->rq_daddr.addr;
239
	return nlm_lookup_host(1, svc_addr_in(rqstp),
240
			       rqstp->rq_prot, rqstp->rq_vers,
241
			       hostname, hostname_len, &ssin);
242 243
}

L
Linus Torvalds 已提交
244 245 246 247 248 249 250 251
/*
 * Create the NLM RPC client for an NLM peer
 */
struct rpc_clnt *
nlm_bind_host(struct nlm_host *host)
{
	struct rpc_clnt	*clnt;

252 253
	dprintk("lockd: nlm_bind_host %s (%s), my addr=%s\n",
			host->h_name, host->h_addrbuf, host->h_saddrbuf);
L
Linus Torvalds 已提交
254 255

	/* Lock host handle */
T
Trond Myklebust 已提交
256
	mutex_lock(&host->h_mutex);
L
Linus Torvalds 已提交
257 258 259 260 261

	/* If we've already created an RPC client, check whether
	 * RPC rebind is required
	 */
	if ((clnt = host->h_rpcclnt) != NULL) {
262
		if (time_after_eq(jiffies, host->h_nextrebind)) {
263
			rpc_force_rebind(clnt);
L
Linus Torvalds 已提交
264
			host->h_nextrebind = jiffies + NLM_HOST_REBIND;
265
			dprintk("lockd: next rebind in %lu jiffies\n",
L
Linus Torvalds 已提交
266 267 268
					host->h_nextrebind - jiffies);
		}
	} else {
269
		unsigned long increment = nlmsvc_timeout;
270 271 272 273 274 275 276 277 278 279
		struct rpc_timeout timeparms = {
			.to_initval	= increment,
			.to_increment	= increment,
			.to_maxval	= increment * 6UL,
			.to_retries	= 5U,
		};
		struct rpc_create_args args = {
			.protocol	= host->h_proto,
			.address	= (struct sockaddr *)&host->h_addr,
			.addrsize	= sizeof(host->h_addr),
280
			.saddress	= (struct sockaddr *)&host->h_saddr,
281 282 283 284 285
			.timeout	= &timeparms,
			.servername	= host->h_name,
			.program	= &nlm_program,
			.version	= host->h_version,
			.authflavor	= RPC_AUTH_UNIX,
286
			.flags		= (RPC_CLNT_CREATE_NOPING |
287 288 289
					   RPC_CLNT_CREATE_AUTOBIND),
		};

290 291 292 293 294 295 296 297
		/*
		 * lockd retries server side blocks automatically so we want
		 * those to be soft RPC calls. Client side calls need to be
		 * hard RPC tasks.
		 */
		if (!host->h_server)
			args.flags |= RPC_CLNT_CREATE_HARDRTRY;

298 299 300 301 302 303 304
		clnt = rpc_create(&args);
		if (!IS_ERR(clnt))
			host->h_rpcclnt = clnt;
		else {
			printk("lockd: couldn't create RPC handle for %s\n", host->h_name);
			clnt = NULL;
		}
L
Linus Torvalds 已提交
305 306
	}

T
Trond Myklebust 已提交
307
	mutex_unlock(&host->h_mutex);
L
Linus Torvalds 已提交
308 309 310 311 312 313 314 315 316 317 318
	return clnt;
}

/*
 * Force a portmap lookup of the remote lockd port
 */
void
nlm_rebind_host(struct nlm_host *host)
{
	dprintk("lockd: rebind host %s\n", host->h_name);
	if (host->h_rpcclnt && time_after_eq(jiffies, host->h_nextrebind)) {
319
		rpc_force_rebind(host->h_rpcclnt);
L
Linus Torvalds 已提交
320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344
		host->h_nextrebind = jiffies + NLM_HOST_REBIND;
	}
}

/*
 * Increment NLM host count
 */
struct nlm_host * nlm_get_host(struct nlm_host *host)
{
	if (host) {
		dprintk("lockd: get host %s\n", host->h_name);
		atomic_inc(&host->h_count);
		host->h_expires = jiffies + NLM_HOST_EXPIRE;
	}
	return host;
}

/*
 * Release NLM host after use
 *
 * Drops one reference on @host (NULL is ignored).  The host is not
 * freed here; when the count reaches zero this only asserts that the
 * host's lock owner, granted and reclaim lists are all empty.
 */
void nlm_release_host(struct nlm_host *host)
{
	if (host == NULL)
		return;

	dprintk("lockd: release host %s\n", host->h_name);
	BUG_ON(atomic_read(&host->h_count) < 0);

	if (!atomic_dec_and_test(&host->h_count))
		return;

	/* That was the last reference: nothing may still hang off it */
	BUG_ON(!list_empty(&host->h_lockowners));
	BUG_ON(!list_empty(&host->h_granted));
	BUG_ON(!list_empty(&host->h_reclaim));
}

353 354 355 356 357
/*
 * We were notified that the host indicated by address &sin
 * has rebooted.
 * Release all resources held by that peer.
 */
358
void nlm_host_rebooted(const struct sockaddr_in *sin,
359 360
				const char *hostname,
				unsigned int hostname_len,
361
				u32 new_state)
362
{
363 364
	struct hlist_head *chain;
	struct hlist_node *pos;
365
	struct nsm_handle *nsm;
366
	struct nlm_host	*host;
367

368
	/* Find the NSM handle for this peer */
369 370 371 372
	nsm = __nsm_find(sin, hostname, hostname_len, 0);
	if (nsm == NULL) {
		dprintk("lockd: never saw rebooted peer '%.*s' before\n",
				hostname_len, hostname);
373
		return;
374 375 376 377
	}

	dprintk("lockd: nlm_host_rebooted(%.*s, %s)\n",
			hostname_len, hostname, nsm->sm_addrbuf);
378

379 380 381 382 383 384 385 386 387 388
	/* When reclaiming locks on this peer, make sure that
	 * we set up a new notification */
	nsm->sm_monitored = 0;

	/* Mark all hosts tied to this NSM state as having rebooted.
	 * We run the loop repeatedly, because we drop the host table
	 * lock for this.
	 * To avoid processing a host several times, we match the nsmstate.
	 */
again:	mutex_lock(&nlm_host_mutex);
389 390
	for (chain = nlm_hosts; chain < nlm_hosts + NLM_HOST_NRHASH; ++chain) {
		hlist_for_each_entry(host, pos, chain, h_hash) {
391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411
			if (host->h_nsmhandle == nsm
			 && host->h_nsmstate != new_state) {
				host->h_nsmstate = new_state;
				host->h_state++;

				nlm_get_host(host);
				mutex_unlock(&nlm_host_mutex);

				if (host->h_server) {
					/* We're server for this guy, just ditch
					 * all the locks he held. */
					nlmsvc_free_host_resources(host);
				} else {
					/* He's the server, initiate lock recovery. */
					nlmclnt_recovery(host);
				}

				nlm_release_host(host);
				goto again;
			}
		}
412
	}
413 414

	mutex_unlock(&nlm_host_mutex);
415 416
}

L
Linus Torvalds 已提交
417 418 419 420 421 422 423
/*
 * Shut down the hosts module.
 * Note that this routine is called only at server shutdown time.
 */
void
nlm_shutdown_hosts(void)
{
424 425
	struct hlist_head *chain;
	struct hlist_node *pos;
L
Linus Torvalds 已提交
426 427 428
	struct nlm_host	*host;

	dprintk("lockd: shutting down host module\n");
I
Ingo Molnar 已提交
429
	mutex_lock(&nlm_host_mutex);
L
Linus Torvalds 已提交
430 431 432

	/* First, make all hosts eligible for gc */
	dprintk("lockd: nuking all hosts...\n");
433
	for (chain = nlm_hosts; chain < nlm_hosts + NLM_HOST_NRHASH; ++chain) {
434
		hlist_for_each_entry(host, pos, chain, h_hash) {
L
Linus Torvalds 已提交
435
			host->h_expires = jiffies - 1;
436 437 438 439 440
			if (host->h_rpcclnt) {
				rpc_shutdown_client(host->h_rpcclnt);
				host->h_rpcclnt = NULL;
			}
		}
L
Linus Torvalds 已提交
441 442 443 444
	}

	/* Then, perform a garbage collection pass */
	nlm_gc_hosts();
I
Ingo Molnar 已提交
445
	mutex_unlock(&nlm_host_mutex);
L
Linus Torvalds 已提交
446 447 448 449 450

	/* complain if any hosts are left */
	if (nrhosts) {
		printk(KERN_WARNING "lockd: couldn't shutdown host module!\n");
		dprintk("lockd: %d hosts left:\n", nrhosts);
451 452
		for (chain = nlm_hosts; chain < nlm_hosts + NLM_HOST_NRHASH; ++chain) {
			hlist_for_each_entry(host, pos, chain, h_hash) {
L
Linus Torvalds 已提交
453 454 455 456 457 458 459 460 461 462 463 464 465 466 467 468
				dprintk("       %s (cnt %d use %d exp %ld)\n",
					host->h_name, atomic_read(&host->h_count),
					host->h_inuse, host->h_expires);
			}
		}
	}
}

/*
 * Garbage collect any unused NLM hosts.
 * This GC combines reference counting for async operations with
 * mark & sweep for resources held by remote clients.
 */
static void
nlm_gc_hosts(void)
{
469 470 471
	struct hlist_head *chain;
	struct hlist_node *pos, *next;
	struct nlm_host	*host;
L
Linus Torvalds 已提交
472 473

	dprintk("lockd: host garbage collection\n");
474 475
	for (chain = nlm_hosts; chain < nlm_hosts + NLM_HOST_NRHASH; ++chain) {
		hlist_for_each_entry(host, pos, chain, h_hash)
L
Linus Torvalds 已提交
476 477 478 479 480 481
			host->h_inuse = 0;
	}

	/* Mark all hosts that hold locks, blocks or shares */
	nlmsvc_mark_resources();

482 483
	for (chain = nlm_hosts; chain < nlm_hosts + NLM_HOST_NRHASH; ++chain) {
		hlist_for_each_entry_safe(host, pos, next, chain, h_hash) {
L
Linus Torvalds 已提交
484 485 486 487 488 489 490 491
			if (atomic_read(&host->h_count) || host->h_inuse
			 || time_before(jiffies, host->h_expires)) {
				dprintk("nlm_gc_hosts skipping %s (cnt %d use %d exp %ld)\n",
					host->h_name, atomic_read(&host->h_count),
					host->h_inuse, host->h_expires);
				continue;
			}
			dprintk("lockd: delete host %s\n", host->h_name);
492
			hlist_del_init(&host->h_hash);
493

494
			nlm_destroy_host(host);
L
Linus Torvalds 已提交
495 496 497 498 499 500 501
			nrhosts--;
		}
	}

	next_gc = jiffies + NLM_HOST_COLLECT;
}

502 503 504 505 506

/*
 * Manage NSM handles
 *
 * Handles created by __nsm_find() are linked on nsm_handles.  nsm_lock
 * is held while that list is searched, added to, or removed from.
 */
static LIST_HEAD(nsm_handles);
static DEFINE_SPINLOCK(nsm_lock);
508 509 510

static struct nsm_handle *
__nsm_find(const struct sockaddr_in *sin,
511
		const char *hostname, unsigned int hostname_len,
512 513 514
		int create)
{
	struct nsm_handle *nsm = NULL;
J
J. Bruce Fields 已提交
515
	struct nsm_handle *pos;
516 517 518 519 520 521 522 523 524 525 526 527 528

	if (!sin)
		return NULL;

	if (hostname && memchr(hostname, '/', hostname_len) != NULL) {
		if (printk_ratelimit()) {
			printk(KERN_WARNING "Invalid hostname \"%.*s\" "
					    "in NFS lock request\n",
				hostname_len, hostname);
		}
		return NULL;
	}

529 530
retry:
	spin_lock(&nsm_lock);
J
J. Bruce Fields 已提交
531
	list_for_each_entry(pos, &nsm_handles, sm_link) {
532

533
		if (hostname && nsm_use_hostnames) {
J
J. Bruce Fields 已提交
534 535
			if (strlen(pos->sm_name) != hostname_len
			 || memcmp(pos->sm_name, hostname, hostname_len))
536
				continue;
J
J. Bruce Fields 已提交
537
		} else if (!nlm_cmp_addr(&pos->sm_addr, sin))
538
			continue;
J
J. Bruce Fields 已提交
539
		atomic_inc(&pos->sm_count);
540
		kfree(nsm);
J
J. Bruce Fields 已提交
541
		nsm = pos;
542
		goto found;
543
	}
544 545 546
	if (nsm) {
		list_add(&nsm->sm_link, &nsm_handles);
		goto found;
547
	}
548 549 550 551
	spin_unlock(&nsm_lock);

	if (!create)
		return NULL;
552 553

	nsm = kzalloc(sizeof(*nsm) + hostname_len + 1, GFP_KERNEL);
J
J. Bruce Fields 已提交
554
	if (nsm == NULL)
555 556
		return NULL;

J
J. Bruce Fields 已提交
557 558 559 560
	nsm->sm_addr = *sin;
	nsm->sm_name = (char *) (nsm + 1);
	memcpy(nsm->sm_name, hostname, hostname_len);
	nsm->sm_name[hostname_len] = '\0';
561 562
	nlm_display_address((struct sockaddr *)&nsm->sm_addr,
				nsm->sm_addrbuf, sizeof(nsm->sm_addrbuf));
J
J. Bruce Fields 已提交
563
	atomic_set(&nsm->sm_count, 1);
564
	goto retry;
J
J. Bruce Fields 已提交
565

566 567
found:
	spin_unlock(&nsm_lock);
568 569 570
	return nsm;
}

571
/*
 * Find the NSM handle for a peer, creating it when none exists yet.
 * Thin wrapper around __nsm_find() with creation enabled.
 */
static struct nsm_handle *
nsm_find(const struct sockaddr_in *sin, const char *hostname,
	 unsigned int hostname_len)
{
	return __nsm_find(sin, hostname, hostname_len, /* create */ 1);
}

/*
 * Release an NSM handle
 */
void
nsm_release(struct nsm_handle *nsm)
{
	if (!nsm)
		return;
586
	if (atomic_dec_and_lock(&nsm->sm_count, &nsm_lock)) {
587
		list_del(&nsm->sm_link);
588
		spin_unlock(&nsm_lock);
589
		kfree(nsm);
590 591
	}
}