host.c 15.4 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13
/*
 * linux/fs/lockd/host.c
 *
 * Management for NLM peer hosts. The nlm_host struct is shared
 * between client and server implementation. The only reason to
 * do so is to reduce code bloat.
 *
 * Copyright (C) 1996, Olaf Kirch <okir@monad.swb.de>
 */

#include <linux/types.h>
#include <linux/slab.h>
#include <linux/in.h>
14
#include <linux/in6.h>
L
Linus Torvalds 已提交
15 16 17 18
#include <linux/sunrpc/clnt.h>
#include <linux/sunrpc/svc.h>
#include <linux/lockd/lockd.h>
#include <linux/lockd/sm_inter.h>
I
Ingo Molnar 已提交
19
#include <linux/mutex.h>
L
Linus Torvalds 已提交
20

21
#include <net/ipv6.h>
L
Linus Torvalds 已提交
22 23 24 25

#define NLMDBG_FACILITY		NLMDBG_HOSTCACHE
#define NLM_HOST_NRHASH		32
#define NLM_HOST_REBIND		(60 * HZ)
26 27
#define NLM_HOST_EXPIRE		(300 * HZ)
#define NLM_HOST_COLLECT	(120 * HZ)
L
Linus Torvalds 已提交
28

29
static struct hlist_head	nlm_hosts[NLM_HOST_NRHASH];
L
Linus Torvalds 已提交
30 31
static unsigned long		next_gc;
static int			nrhosts;
I
Ingo Molnar 已提交
32
static DEFINE_MUTEX(nlm_host_mutex);
L
Linus Torvalds 已提交
33 34 35

static void			nlm_gc_hosts(void);

36 37
struct nlm_lookup_host_info {
	const int		server;		/* search for server|client */
38 39
	const struct sockaddr	*sap;		/* address to search for */
	const size_t		salen;		/* it's length */
40 41 42 43
	const unsigned short	protocol;	/* transport to search for*/
	const u32		version;	/* NLM version to search for */
	const char		*hostname;	/* remote's hostname */
	const size_t		hostname_len;	/* it's length */
44
	const struct sockaddr	*src_sap;	/* our address (optional) */
45
	const size_t		src_len;	/* it's length */
46
	const int		noresvport;	/* use non-priv port */
47 48
};

49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90
/*
 * Hash function must work well on big- and little-endian platforms
 */
static unsigned int __nlm_hash32(const __be32 n)
{
	unsigned int hash = (__force u32)n ^ ((__force u32)n >> 16);
	return hash ^ (hash >> 8);
}

static unsigned int __nlm_hash_addr4(const struct sockaddr *sap)
{
	const struct sockaddr_in *sin = (struct sockaddr_in *)sap;
	return __nlm_hash32(sin->sin_addr.s_addr);
}

static unsigned int __nlm_hash_addr6(const struct sockaddr *sap)
{
	const struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)sap;
	const struct in6_addr addr = sin6->sin6_addr;
	return __nlm_hash32(addr.s6_addr32[0]) ^
	       __nlm_hash32(addr.s6_addr32[1]) ^
	       __nlm_hash32(addr.s6_addr32[2]) ^
	       __nlm_hash32(addr.s6_addr32[3]);
}

/*
 * Map a peer address to an index into nlm_hosts[].  Addresses of a
 * family other than AF_INET / AF_INET6 all land in bucket 0.
 */
static unsigned int nlm_hash_address(const struct sockaddr *sap)
{
	unsigned int bucket = 0;

	if (sap->sa_family == AF_INET)
		bucket = __nlm_hash_addr4(sap);
	else if (sap->sa_family == AF_INET6)
		bucket = __nlm_hash_addr6(sap);

	return bucket & (NLM_HOST_NRHASH - 1);
}

91 92 93 94 95 96 97 98 99 100 101 102
/*
 * Zero the port number stored in an AF_INET or AF_INET6 socket address.
 * Addresses of any other family are left untouched.
 */
static void nlm_clear_port(struct sockaddr *sap)
{
	if (sap->sa_family == AF_INET) {
		struct sockaddr_in *in4 = (struct sockaddr_in *)sap;

		in4->sin_port = 0;
	} else if (sap->sa_family == AF_INET6) {
		struct sockaddr_in6 *in6 = (struct sockaddr_in6 *)sap;

		in6->sin6_port = 0;
	}
}

L
Linus Torvalds 已提交
103 104 105
/*
 * Common host lookup routine for server & client
 */
106
static struct nlm_host *nlm_lookup_host(struct nlm_lookup_host_info *ni)
L
Linus Torvalds 已提交
107
{
108 109 110
	struct hlist_head *chain;
	struct hlist_node *pos;
	struct nlm_host	*host;
111
	struct nsm_handle *nsm = NULL;
L
Linus Torvalds 已提交
112

I
Ingo Molnar 已提交
113
	mutex_lock(&nlm_host_mutex);
L
Linus Torvalds 已提交
114 115 116 117

	if (time_after_eq(jiffies, next_gc))
		nlm_gc_hosts();

118 119 120 121 122 123 124
	/* We may keep several nlm_host objects for a peer, because each
	 * nlm_host is identified by
	 * (address, protocol, version, server/client)
	 * We could probably simplify this a little by putting all those
	 * different NLM rpc_clients into one single nlm_host object.
	 * This would allow us to have one nlm_host per address.
	 */
125
	chain = &nlm_hosts[nlm_hash_address(ni->sap)];
126
	hlist_for_each_entry(host, pos, chain, h_hash) {
127
		if (!nlm_cmp_addr(nlm_addr(host), ni->sap))
128 129 130
			continue;

		/* See if we have an NSM handle for this client */
131 132
		if (!nsm)
			nsm = host->h_nsmhandle;
133

134
		if (host->h_proto != ni->protocol)
L
Linus Torvalds 已提交
135
			continue;
136
		if (host->h_version != ni->version)
L
Linus Torvalds 已提交
137
			continue;
138
		if (host->h_server != ni->server)
L
Linus Torvalds 已提交
139
			continue;
140 141
		if (ni->server &&
		    !nlm_cmp_addr(nlm_srcaddr(host), ni->src_sap))
142
			continue;
L
Linus Torvalds 已提交
143

144 145 146 147
		/* Move to head of hash chain. */
		hlist_del(&host->h_hash);
		hlist_add_head(&host->h_hash, chain);

148
		nlm_get_host(host);
149 150
		dprintk("lockd: nlm_lookup_host found host %s (%s)\n",
				host->h_name, host->h_addrbuf);
151
		goto out;
L
Linus Torvalds 已提交
152 153
	}

154 155 156
	/*
	 * The host wasn't in our hash table.  If we don't
	 * have an NSM handle for it yet, create one.
157
	 */
158 159 160 161
	if (nsm)
		atomic_inc(&nsm->sm_count);
	else {
		host = NULL;
162
		nsm = nsm_find(ni->sap, ni->salen,
163
				ni->hostname, ni->hostname_len, 1);
164 165 166
		if (!nsm) {
			dprintk("lockd: nlm_lookup_host failed; "
				"no nsm handle\n");
167
			goto out;
168
		}
169
	}
L
Linus Torvalds 已提交
170

171
	host = kzalloc(sizeof(*host), GFP_KERNEL);
172 173
	if (!host) {
		nsm_release(nsm);
174
		dprintk("lockd: nlm_lookup_host failed; no memory\n");
175 176 177
		goto out;
	}
	host->h_name	   = nsm->sm_name;
178
	host->h_addrbuf    = nsm->sm_addrbuf;
179 180
	memcpy(nlm_addr(host), ni->sap, ni->salen);
	host->h_addrlen = ni->salen;
181
	nlm_clear_port(nlm_addr(host));
182
	memcpy(nlm_srcaddr(host), ni->src_sap, ni->src_len);
183 184
	host->h_version    = ni->version;
	host->h_proto      = ni->protocol;
L
Linus Torvalds 已提交
185
	host->h_rpcclnt    = NULL;
T
Trond Myklebust 已提交
186
	mutex_init(&host->h_mutex);
L
Linus Torvalds 已提交
187 188 189 190
	host->h_nextrebind = jiffies + NLM_HOST_REBIND;
	host->h_expires    = jiffies + NLM_HOST_EXPIRE;
	atomic_set(&host->h_count, 1);
	init_waitqueue_head(&host->h_gracewait);
T
Trond Myklebust 已提交
191
	init_rwsem(&host->h_rwsem);
L
Linus Torvalds 已提交
192 193
	host->h_state      = 0;			/* pseudo NSM state */
	host->h_nsmstate   = 0;			/* real NSM state */
194
	host->h_nsmhandle  = nsm;
195
	host->h_server	   = ni->server;
196
	host->h_noresvport = ni->noresvport;
197
	hlist_add_head(&host->h_hash, chain);
L
Linus Torvalds 已提交
198 199
	INIT_LIST_HEAD(&host->h_lockowners);
	spin_lock_init(&host->h_lock);
200 201
	INIT_LIST_HEAD(&host->h_granted);
	INIT_LIST_HEAD(&host->h_reclaim);
L
Linus Torvalds 已提交
202

203
	nrhosts++;
204 205 206 207

	dprintk("lockd: nlm_lookup_host created host %s\n",
			host->h_name);

208
out:
I
Ingo Molnar 已提交
209
	mutex_unlock(&nlm_host_mutex);
L
Linus Torvalds 已提交
210 211 212
	return host;
}

213 214 215 216 217 218 219 220 221 222 223 224
/*
 * Destroy a host
 *
 * The host must have no lock owners and a zero reference count.  Stops
 * NSM monitoring, drops the host's NSM handle, shuts down its RPC
 * client if one was created, and frees the structure.  The caller
 * (nlm_gc_hosts) unhashes the host and adjusts nrhosts.
 */
static void
nlm_destroy_host(struct nlm_host *host)
{
	struct rpc_clnt	*clnt;

	BUG_ON(!list_empty(&host->h_lockowners));
	BUG_ON(atomic_read(&host->h_count));

	nsm_unmonitor(host);
	nsm_release(host->h_nsmhandle);

	clnt = host->h_rpcclnt;
	if (clnt != NULL)
		rpc_shutdown_client(clnt);
	kfree(host);
}

233 234 235 236 237 238 239
/**
 * nlmclnt_lookup_host - Find an NLM host handle matching a remote server
 * @sap: network address of server
 * @salen: length of server address
 * @protocol: transport protocol to use
 * @version: NLM protocol version
 * @hostname: '\0'-terminated hostname of server
240
 * @noresvport: 1 if non-privileged port should be used
241 242 243 244 245
 *
 * Returns an nlm_host structure that matches the passed-in
 * [server address, transport protocol, NLM version, server hostname].
 * If one doesn't already exist in the host cache, a new handle is
 * created and returned.
246
 */
247 248 249
struct nlm_host *nlmclnt_lookup_host(const struct sockaddr *sap,
				     const size_t salen,
				     const unsigned short protocol,
250 251 252
				     const u32 version,
				     const char *hostname,
				     int noresvport)
253
{
254 255
	const struct sockaddr source = {
		.sa_family	= AF_UNSPEC,
256
	};
257 258
	struct nlm_lookup_host_info ni = {
		.server		= 0,
259 260 261
		.sap		= sap,
		.salen		= salen,
		.protocol	= protocol,
262 263
		.version	= version,
		.hostname	= hostname,
264
		.hostname_len	= strlen(hostname),
265 266
		.src_sap	= &source,
		.src_len	= sizeof(source),
267
		.noresvport	= noresvport,
268
	};
269

270 271
	dprintk("lockd: %s(host='%s', vers=%u, proto=%s)\n", __func__,
			(hostname ? hostname : "<none>"), version,
272
			(protocol == IPPROTO_UDP ? "udp" : "tcp"));
273 274

	return nlm_lookup_host(&ni);
275 276
}

277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293
/**
 * nlmsvc_lookup_host - Find an NLM host handle matching a remote client
 * @rqstp: incoming NLM request
 * @hostname: name of client host
 * @hostname_len: length of client hostname
 *
 * Returns an nlm_host structure that matches the [client address,
 * transport protocol, NLM version, client hostname] of the passed-in
 * NLM request.  If one doesn't already exist in the host cache, a
 * new handle is created and returned.
 *
 * Before possibly creating a new nlm_host, construct a sockaddr
 * for a specific source address in case the local system has
 * multiple network addresses.  The family of the address in
 * rq_daddr is guaranteed to be the same as the family of the
 * address in rq_addr, so it's safe to use the same family for
 * the source address.
294
 */
295 296 297
struct nlm_host *nlmsvc_lookup_host(const struct svc_rqst *rqstp,
				    const char *hostname,
				    const size_t hostname_len)
298
{
299
	struct sockaddr_in sin = {
300
		.sin_family	= AF_INET,
301 302 303
	};
	struct sockaddr_in6 sin6 = {
		.sin6_family	= AF_INET6,
304
	};
305 306
	struct nlm_lookup_host_info ni = {
		.server		= 1,
307 308
		.sap		= svc_addr(rqstp),
		.salen		= rqstp->rq_addrlen,
309 310 311 312
		.protocol	= rqstp->rq_prot,
		.version	= rqstp->rq_vers,
		.hostname	= hostname,
		.hostname_len	= hostname_len,
313
		.src_len	= rqstp->rq_addrlen,
314 315 316 317 318
	};

	dprintk("lockd: %s(host='%*s', vers=%u, proto=%s)\n", __func__,
			(int)hostname_len, hostname, rqstp->rq_vers,
			(rqstp->rq_prot == IPPROTO_UDP ? "udp" : "tcp"));
319

320 321 322 323 324 325 326 327 328 329 330 331 332
	switch (ni.sap->sa_family) {
	case AF_INET:
		sin.sin_addr.s_addr = rqstp->rq_daddr.addr.s_addr;
		ni.src_sap = (struct sockaddr *)&sin;
		break;
	case AF_INET6:
		ipv6_addr_copy(&sin6.sin6_addr, &rqstp->rq_daddr.addr6);
		ni.src_sap = (struct sockaddr *)&sin6;
		break;
	default:
		return NULL;
	}

333
	return nlm_lookup_host(&ni);
334 335
}

L
Linus Torvalds 已提交
336 337 338 339 340 341 342 343
/*
 * Create the NLM RPC client for an NLM peer
 */
struct rpc_clnt *
nlm_bind_host(struct nlm_host *host)
{
	struct rpc_clnt	*clnt;

344 345
	dprintk("lockd: nlm_bind_host %s (%s)\n",
			host->h_name, host->h_addrbuf);
L
Linus Torvalds 已提交
346 347

	/* Lock host handle */
T
Trond Myklebust 已提交
348
	mutex_lock(&host->h_mutex);
L
Linus Torvalds 已提交
349 350 351 352 353

	/* If we've already created an RPC client, check whether
	 * RPC rebind is required
	 */
	if ((clnt = host->h_rpcclnt) != NULL) {
354
		if (time_after_eq(jiffies, host->h_nextrebind)) {
355
			rpc_force_rebind(clnt);
L
Linus Torvalds 已提交
356
			host->h_nextrebind = jiffies + NLM_HOST_REBIND;
357
			dprintk("lockd: next rebind in %lu jiffies\n",
L
Linus Torvalds 已提交
358 359 360
					host->h_nextrebind - jiffies);
		}
	} else {
361
		unsigned long increment = nlmsvc_timeout;
362 363 364 365 366 367 368 369
		struct rpc_timeout timeparms = {
			.to_initval	= increment,
			.to_increment	= increment,
			.to_maxval	= increment * 6UL,
			.to_retries	= 5U,
		};
		struct rpc_create_args args = {
			.protocol	= host->h_proto,
370 371
			.address	= nlm_addr(host),
			.addrsize	= host->h_addrlen,
372
			.saddress	= nlm_srcaddr(host),
373 374 375 376 377
			.timeout	= &timeparms,
			.servername	= host->h_name,
			.program	= &nlm_program,
			.version	= host->h_version,
			.authflavor	= RPC_AUTH_UNIX,
378
			.flags		= (RPC_CLNT_CREATE_NOPING |
379 380 381
					   RPC_CLNT_CREATE_AUTOBIND),
		};

382 383 384 385 386 387 388
		/*
		 * lockd retries server side blocks automatically so we want
		 * those to be soft RPC calls. Client side calls need to be
		 * hard RPC tasks.
		 */
		if (!host->h_server)
			args.flags |= RPC_CLNT_CREATE_HARDRTRY;
389 390
		if (host->h_noresvport)
			args.flags |= RPC_CLNT_CREATE_NONPRIVPORT;
391

392 393 394 395 396 397 398
		clnt = rpc_create(&args);
		if (!IS_ERR(clnt))
			host->h_rpcclnt = clnt;
		else {
			printk("lockd: couldn't create RPC handle for %s\n", host->h_name);
			clnt = NULL;
		}
L
Linus Torvalds 已提交
399 400
	}

T
Trond Myklebust 已提交
401
	mutex_unlock(&host->h_mutex);
L
Linus Torvalds 已提交
402 403 404 405 406 407 408 409 410 411 412
	return clnt;
}

/*
 * Force a portmap lookup of the remote lockd port
 */
void
nlm_rebind_host(struct nlm_host *host)
{
	dprintk("lockd: rebind host %s\n", host->h_name);
	if (host->h_rpcclnt && time_after_eq(jiffies, host->h_nextrebind)) {
413
		rpc_force_rebind(host->h_rpcclnt);
L
Linus Torvalds 已提交
414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437 438
		host->h_nextrebind = jiffies + NLM_HOST_REBIND;
	}
}

/*
 * Take a reference on an NLM host
 *
 * Bumps h_count and refreshes the expiry time to NLM_HOST_EXPIRE
 * jiffies from now.  A NULL @host is accepted and simply returned.
 */
struct nlm_host * nlm_get_host(struct nlm_host *host)
{
	if (!host)
		return host;

	dprintk("lockd: get host %s\n", host->h_name);
	atomic_inc(&host->h_count);
	host->h_expires = jiffies + NLM_HOST_EXPIRE;

	return host;
}

/*
 * Release NLM host after use
 *
 * Drops one reference.  The host is not freed here even when the count
 * reaches zero; it stays in the cache until nlm_gc_hosts() reaps it.
 * When the last reference goes away the lock-owner, granted and
 * reclaim lists must already be empty.  A NULL @host is ignored.
 */
void nlm_release_host(struct nlm_host *host)
{
	if (host != NULL) {
		dprintk("lockd: release host %s\n", host->h_name);
		BUG_ON(atomic_read(&host->h_count) < 0);
		if (atomic_dec_and_test(&host->h_count)) {
			BUG_ON(!list_empty(&host->h_lockowners));
			BUG_ON(!list_empty(&host->h_granted));
			BUG_ON(!list_empty(&host->h_reclaim));
		}
	}
}

447 448 449 450 451
/*
 * We were notified that the host indicated by address &sin
 * has rebooted.
 * Release all resources held by that peer.
 */
452
void nlm_host_rebooted(const struct sockaddr_in *sin,
453 454
				const char *hostname,
				unsigned int hostname_len,
455
				u32 new_state)
456
{
457 458
	struct hlist_head *chain;
	struct hlist_node *pos;
459
	struct nsm_handle *nsm;
460
	struct nlm_host	*host;
461

462 463
	nsm = nsm_find((struct sockaddr *)sin, sizeof(*sin),
			hostname, hostname_len, 0);
464 465 466
	if (nsm == NULL) {
		dprintk("lockd: never saw rebooted peer '%.*s' before\n",
				hostname_len, hostname);
467
		return;
468 469 470 471
	}

	dprintk("lockd: nlm_host_rebooted(%.*s, %s)\n",
			hostname_len, hostname, nsm->sm_addrbuf);
472

473 474 475 476 477 478 479 480 481 482
	/* When reclaiming locks on this peer, make sure that
	 * we set up a new notification */
	nsm->sm_monitored = 0;

	/* Mark all hosts tied to this NSM state as having rebooted.
	 * We run the loop repeatedly, because we drop the host table
	 * lock for this.
	 * To avoid processing a host several times, we match the nsmstate.
	 */
again:	mutex_lock(&nlm_host_mutex);
483 484
	for (chain = nlm_hosts; chain < nlm_hosts + NLM_HOST_NRHASH; ++chain) {
		hlist_for_each_entry(host, pos, chain, h_hash) {
485 486 487 488 489 490 491 492 493 494 495 496 497 498 499 500 501 502 503 504 505
			if (host->h_nsmhandle == nsm
			 && host->h_nsmstate != new_state) {
				host->h_nsmstate = new_state;
				host->h_state++;

				nlm_get_host(host);
				mutex_unlock(&nlm_host_mutex);

				if (host->h_server) {
					/* We're server for this guy, just ditch
					 * all the locks he held. */
					nlmsvc_free_host_resources(host);
				} else {
					/* He's the server, initiate lock recovery. */
					nlmclnt_recovery(host);
				}

				nlm_release_host(host);
				goto again;
			}
		}
506
	}
507 508

	mutex_unlock(&nlm_host_mutex);
509 510
}

L
Linus Torvalds 已提交
511 512 513 514 515 516 517
/*
 * Shut down the hosts module.
 * Note that this routine is called only at server shutdown time.
 */
void
nlm_shutdown_hosts(void)
{
518 519
	struct hlist_head *chain;
	struct hlist_node *pos;
L
Linus Torvalds 已提交
520 521 522
	struct nlm_host	*host;

	dprintk("lockd: shutting down host module\n");
I
Ingo Molnar 已提交
523
	mutex_lock(&nlm_host_mutex);
L
Linus Torvalds 已提交
524 525 526

	/* First, make all hosts eligible for gc */
	dprintk("lockd: nuking all hosts...\n");
527
	for (chain = nlm_hosts; chain < nlm_hosts + NLM_HOST_NRHASH; ++chain) {
528
		hlist_for_each_entry(host, pos, chain, h_hash) {
L
Linus Torvalds 已提交
529
			host->h_expires = jiffies - 1;
530 531 532 533 534
			if (host->h_rpcclnt) {
				rpc_shutdown_client(host->h_rpcclnt);
				host->h_rpcclnt = NULL;
			}
		}
L
Linus Torvalds 已提交
535 536 537 538
	}

	/* Then, perform a garbage collection pass */
	nlm_gc_hosts();
I
Ingo Molnar 已提交
539
	mutex_unlock(&nlm_host_mutex);
L
Linus Torvalds 已提交
540 541 542 543 544

	/* complain if any hosts are left */
	if (nrhosts) {
		printk(KERN_WARNING "lockd: couldn't shutdown host module!\n");
		dprintk("lockd: %d hosts left:\n", nrhosts);
545 546
		for (chain = nlm_hosts; chain < nlm_hosts + NLM_HOST_NRHASH; ++chain) {
			hlist_for_each_entry(host, pos, chain, h_hash) {
L
Linus Torvalds 已提交
547 548 549 550 551 552 553 554 555 556 557 558 559 560 561 562
				dprintk("       %s (cnt %d use %d exp %ld)\n",
					host->h_name, atomic_read(&host->h_count),
					host->h_inuse, host->h_expires);
			}
		}
	}
}

/*
 * Garbage collect any unused NLM hosts.
 * This GC combines reference counting for async operations with
 * mark & sweep for resources held by remote clients.
 */
static void
nlm_gc_hosts(void)
{
563 564 565
	struct hlist_head *chain;
	struct hlist_node *pos, *next;
	struct nlm_host	*host;
L
Linus Torvalds 已提交
566 567

	dprintk("lockd: host garbage collection\n");
568 569
	for (chain = nlm_hosts; chain < nlm_hosts + NLM_HOST_NRHASH; ++chain) {
		hlist_for_each_entry(host, pos, chain, h_hash)
L
Linus Torvalds 已提交
570 571 572 573 574 575
			host->h_inuse = 0;
	}

	/* Mark all hosts that hold locks, blocks or shares */
	nlmsvc_mark_resources();

576 577
	for (chain = nlm_hosts; chain < nlm_hosts + NLM_HOST_NRHASH; ++chain) {
		hlist_for_each_entry_safe(host, pos, next, chain, h_hash) {
L
Linus Torvalds 已提交
578 579 580 581 582 583 584 585
			if (atomic_read(&host->h_count) || host->h_inuse
			 || time_before(jiffies, host->h_expires)) {
				dprintk("nlm_gc_hosts skipping %s (cnt %d use %d exp %ld)\n",
					host->h_name, atomic_read(&host->h_count),
					host->h_inuse, host->h_expires);
				continue;
			}
			dprintk("lockd: delete host %s\n", host->h_name);
586
			hlist_del_init(&host->h_hash);
587

588
			nlm_destroy_host(host);
L
Linus Torvalds 已提交
589 590 591 592 593 594
			nrhosts--;
		}
	}

	next_gc = jiffies + NLM_HOST_COLLECT;
}