host.c 14.6 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13
/*
 * linux/fs/lockd/host.c
 *
 * Management for NLM peer hosts. The nlm_host struct is shared
 * between client and server implementation. The only reason to
 * do so is to reduce code bloat.
 *
 * Copyright (C) 1996, Olaf Kirch <okir@monad.swb.de>
 */

#include <linux/types.h>
#include <linux/slab.h>
#include <linux/in.h>
14
#include <linux/in6.h>
L
Linus Torvalds 已提交
15 16 17 18
#include <linux/sunrpc/clnt.h>
#include <linux/sunrpc/svc.h>
#include <linux/lockd/lockd.h>
#include <linux/lockd/sm_inter.h>
I
Ingo Molnar 已提交
19
#include <linux/mutex.h>
L
Linus Torvalds 已提交
20

21
#include <net/ipv6.h>
L
Linus Torvalds 已提交
22 23 24 25 26

#define NLMDBG_FACILITY		NLMDBG_HOSTCACHE
#define NLM_HOST_NRHASH		32
#define NLM_ADDRHASH(addr)	(ntohl(addr) & (NLM_HOST_NRHASH-1))
#define NLM_HOST_REBIND		(60 * HZ)
27 28
#define NLM_HOST_EXPIRE		(300 * HZ)
#define NLM_HOST_COLLECT	(120 * HZ)
L
Linus Torvalds 已提交
29

30
static struct hlist_head	nlm_hosts[NLM_HOST_NRHASH];
L
Linus Torvalds 已提交
31 32
static unsigned long		next_gc;
static int			nrhosts;
I
Ingo Molnar 已提交
33
static DEFINE_MUTEX(nlm_host_mutex);
L
Linus Torvalds 已提交
34 35 36


static void			nlm_gc_hosts(void);
37
static struct nsm_handle *	__nsm_find(const struct sockaddr_in *,
38
					const char *, unsigned int, int);
39 40
static struct nsm_handle *	nsm_find(const struct sockaddr_in *sin,
					 const char *hostname,
41
					 unsigned int hostname_len);
L
Linus Torvalds 已提交
42

43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68
/*
 * Format the address held in @sap as text into @buf.
 *
 * @sap: socket address to render; only sa_family and the address
 *       bytes are examined
 * @buf: destination buffer
 * @len: size of @buf in bytes, passed straight to snprintf()
 *
 * IPv4 addresses and v4-mapped IPv6 addresses are printed as dotted
 * quads, other IPv6 addresses with NIP6_FMT.  AF_UNSPEC and unknown
 * families produce a fixed placeholder string.
 */
static void nlm_display_address(const struct sockaddr *sap,
				char *buf, const size_t len)
{
	if (sap->sa_family == AF_UNSPEC) {
		snprintf(buf, len, "unspecified");
	} else if (sap->sa_family == AF_INET) {
		const struct sockaddr_in *in4 = (const struct sockaddr_in *)sap;

		snprintf(buf, len, NIPQUAD_FMT, NIPQUAD(in4->sin_addr.s_addr));
	} else if (sap->sa_family == AF_INET6) {
		const struct sockaddr_in6 *in6 = (const struct sockaddr_in6 *)sap;

		/* A v4-mapped address carries the IPv4 address in its last word */
		if (ipv6_addr_v4mapped(&in6->sin6_addr))
			snprintf(buf, len, NIPQUAD_FMT,
				 NIPQUAD(in6->sin6_addr.s6_addr32[3]));
		else
			snprintf(buf, len, NIP6_FMT, NIP6(in6->sin6_addr));
	} else {
		snprintf(buf, len, "unsupported address family");
	}
}

L
Linus Torvalds 已提交
69 70 71
/*
 * Common host lookup routine for server & client
 */
72 73 74 75 76 77
static struct nlm_host *nlm_lookup_host(int server,
					const struct sockaddr_in *sin,
					int proto, u32 version,
					const char *hostname,
					unsigned int hostname_len,
					const struct sockaddr_in *ssin)
L
Linus Torvalds 已提交
78
{
79 80 81
	struct hlist_head *chain;
	struct hlist_node *pos;
	struct nlm_host	*host;
82
	struct nsm_handle *nsm = NULL;
L
Linus Torvalds 已提交
83 84
	int		hash;

85 86 87 88
	dprintk("lockd: nlm_lookup_host(proto=%d, vers=%u,"
			" my role is %s, hostname=%.*s)\n",
			proto, version, server ? "server" : "client",
			hostname_len, hostname ? hostname : "<none>");
L
Linus Torvalds 已提交
89 90 91 92

	hash = NLM_ADDRHASH(sin->sin_addr.s_addr);

	/* Lock hash table */
I
Ingo Molnar 已提交
93
	mutex_lock(&nlm_host_mutex);
L
Linus Torvalds 已提交
94 95 96 97

	if (time_after_eq(jiffies, next_gc))
		nlm_gc_hosts();

98 99 100 101 102 103 104
	/* We may keep several nlm_host objects for a peer, because each
	 * nlm_host is identified by
	 * (address, protocol, version, server/client)
	 * We could probably simplify this a little by putting all those
	 * different NLM rpc_clients into one single nlm_host object.
	 * This would allow us to have one nlm_host per address.
	 */
105 106
	chain = &nlm_hosts[hash];
	hlist_for_each_entry(host, pos, chain, h_hash) {
107 108 109 110
		if (!nlm_cmp_addr(&host->h_addr, sin))
			continue;

		/* See if we have an NSM handle for this client */
111 112
		if (!nsm)
			nsm = host->h_nsmhandle;
113

L
Linus Torvalds 已提交
114 115 116 117 118 119
		if (host->h_proto != proto)
			continue;
		if (host->h_version != version)
			continue;
		if (host->h_server != server)
			continue;
120 121
		if (!nlm_cmp_addr(&host->h_saddr, ssin))
			continue;
L
Linus Torvalds 已提交
122

123 124 125 126
		/* Move to head of hash chain. */
		hlist_del(&host->h_hash);
		hlist_add_head(&host->h_hash, chain);

127
		nlm_get_host(host);
128 129
		dprintk("lockd: nlm_lookup_host found host %s (%s)\n",
				host->h_name, host->h_addrbuf);
130
		goto out;
L
Linus Torvalds 已提交
131 132
	}

133 134 135
	/*
	 * The host wasn't in our hash table.  If we don't
	 * have an NSM handle for it yet, create one.
136
	 */
137 138 139 140 141
	if (nsm)
		atomic_inc(&nsm->sm_count);
	else {
		host = NULL;
		nsm = nsm_find(sin, hostname, hostname_len);
142 143 144
		if (!nsm) {
			dprintk("lockd: nlm_lookup_host failed; "
				"no nsm handle\n");
145
			goto out;
146
		}
147
	}
L
Linus Torvalds 已提交
148

149
	host = kzalloc(sizeof(*host), GFP_KERNEL);
150 151
	if (!host) {
		nsm_release(nsm);
152
		dprintk("lockd: nlm_lookup_host failed; no memory\n");
153 154 155
		goto out;
	}
	host->h_name	   = nsm->sm_name;
L
Linus Torvalds 已提交
156 157
	host->h_addr       = *sin;
	host->h_addr.sin_port = 0;	/* ouch! */
158
	host->h_saddr	   = *ssin;
L
Linus Torvalds 已提交
159 160 161
	host->h_version    = version;
	host->h_proto      = proto;
	host->h_rpcclnt    = NULL;
T
Trond Myklebust 已提交
162
	mutex_init(&host->h_mutex);
L
Linus Torvalds 已提交
163 164 165 166
	host->h_nextrebind = jiffies + NLM_HOST_REBIND;
	host->h_expires    = jiffies + NLM_HOST_EXPIRE;
	atomic_set(&host->h_count, 1);
	init_waitqueue_head(&host->h_gracewait);
T
Trond Myklebust 已提交
167
	init_rwsem(&host->h_rwsem);
L
Linus Torvalds 已提交
168 169
	host->h_state      = 0;			/* pseudo NSM state */
	host->h_nsmstate   = 0;			/* real NSM state */
170
	host->h_nsmhandle  = nsm;
L
Linus Torvalds 已提交
171
	host->h_server	   = server;
172
	hlist_add_head(&host->h_hash, chain);
L
Linus Torvalds 已提交
173 174
	INIT_LIST_HEAD(&host->h_lockowners);
	spin_lock_init(&host->h_lock);
175 176
	INIT_LIST_HEAD(&host->h_granted);
	INIT_LIST_HEAD(&host->h_reclaim);
L
Linus Torvalds 已提交
177

178
	nrhosts++;
179 180 181 182 183 184 185 186 187

	nlm_display_address((struct sockaddr *)&host->h_addr,
				host->h_addrbuf, sizeof(host->h_addrbuf));
	nlm_display_address((struct sockaddr *)&host->h_saddr,
				host->h_saddrbuf, sizeof(host->h_saddrbuf));

	dprintk("lockd: nlm_lookup_host created host %s\n",
			host->h_name);

188
out:
I
Ingo Molnar 已提交
189
	mutex_unlock(&nlm_host_mutex);
L
Linus Torvalds 已提交
190 191 192
	return host;
}

193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208
/*
 * Destroy a host
 *
 * The host must no longer be referenced (h_count == 0) and must not
 * own any lock owners; both conditions are enforced with BUG_ON().
 * Shuts down the host's RPC client, if one exists, and frees @host.
 */
static void
nlm_destroy_host(struct nlm_host *host)
{
	struct rpc_clnt	*rpc;

	BUG_ON(!list_empty(&host->h_lockowners));
	BUG_ON(atomic_read(&host->h_count));

	/*
	 * Unmonitor the host.
	 * NOTE(review): nsm_unmonitor() is defined elsewhere and is
	 * presumably also responsible for dropping the host's NSM
	 * handle reference - confirm.
	 */
	nsm_unmonitor(host);

	rpc = host->h_rpcclnt;
	if (rpc != NULL)
		rpc_shutdown_client(rpc);

	kfree(host);
}

215 216 217
/*
 * Find an NLM server handle in the cache. If there is none, create it.
 */
218 219 220 221
struct nlm_host *nlmclnt_lookup_host(const struct sockaddr_in *sin,
				     int proto, u32 version,
				     const char *hostname,
				     unsigned int hostname_len)
222
{
223 224 225
	const struct sockaddr_in source = {
		.sin_family	= AF_UNSPEC,
	};
226

227
	return nlm_lookup_host(0, sin, proto, version,
228
			       hostname, hostname_len, &source);
229 230 231 232 233 234 235
}

/*
 * Find an NLM client handle in the cache. If there is none, create it.
 */
struct nlm_host *
nlmsvc_lookup_host(struct svc_rqst *rqstp,
236
			const char *hostname, unsigned int hostname_len)
237
{
238 239 240 241
	const struct sockaddr_in source = {
		.sin_family	= AF_INET,
		.sin_addr	= rqstp->rq_daddr.addr,
	};
242

243
	return nlm_lookup_host(1, svc_addr_in(rqstp),
244
			       rqstp->rq_prot, rqstp->rq_vers,
245
			       hostname, hostname_len, &source);
246 247
}

L
Linus Torvalds 已提交
248 249 250 251 252 253 254 255
/*
 * Create the NLM RPC client for an NLM peer
 */
struct rpc_clnt *
nlm_bind_host(struct nlm_host *host)
{
	struct rpc_clnt	*clnt;

256 257
	dprintk("lockd: nlm_bind_host %s (%s), my addr=%s\n",
			host->h_name, host->h_addrbuf, host->h_saddrbuf);
L
Linus Torvalds 已提交
258 259

	/* Lock host handle */
T
Trond Myklebust 已提交
260
	mutex_lock(&host->h_mutex);
L
Linus Torvalds 已提交
261 262 263 264 265

	/* If we've already created an RPC client, check whether
	 * RPC rebind is required
	 */
	if ((clnt = host->h_rpcclnt) != NULL) {
266
		if (time_after_eq(jiffies, host->h_nextrebind)) {
267
			rpc_force_rebind(clnt);
L
Linus Torvalds 已提交
268
			host->h_nextrebind = jiffies + NLM_HOST_REBIND;
269
			dprintk("lockd: next rebind in %lu jiffies\n",
L
Linus Torvalds 已提交
270 271 272
					host->h_nextrebind - jiffies);
		}
	} else {
273
		unsigned long increment = nlmsvc_timeout;
274 275 276 277 278 279 280 281 282 283
		struct rpc_timeout timeparms = {
			.to_initval	= increment,
			.to_increment	= increment,
			.to_maxval	= increment * 6UL,
			.to_retries	= 5U,
		};
		struct rpc_create_args args = {
			.protocol	= host->h_proto,
			.address	= (struct sockaddr *)&host->h_addr,
			.addrsize	= sizeof(host->h_addr),
284
			.saddress	= (struct sockaddr *)&host->h_saddr,
285 286 287 288 289
			.timeout	= &timeparms,
			.servername	= host->h_name,
			.program	= &nlm_program,
			.version	= host->h_version,
			.authflavor	= RPC_AUTH_UNIX,
290
			.flags		= (RPC_CLNT_CREATE_NOPING |
291 292 293
					   RPC_CLNT_CREATE_AUTOBIND),
		};

294 295 296 297 298 299 300 301
		/*
		 * lockd retries server side blocks automatically so we want
		 * those to be soft RPC calls. Client side calls need to be
		 * hard RPC tasks.
		 */
		if (!host->h_server)
			args.flags |= RPC_CLNT_CREATE_HARDRTRY;

302 303 304 305 306 307 308
		clnt = rpc_create(&args);
		if (!IS_ERR(clnt))
			host->h_rpcclnt = clnt;
		else {
			printk("lockd: couldn't create RPC handle for %s\n", host->h_name);
			clnt = NULL;
		}
L
Linus Torvalds 已提交
309 310
	}

T
Trond Myklebust 已提交
311
	mutex_unlock(&host->h_mutex);
L
Linus Torvalds 已提交
312 313 314 315 316 317 318 319 320 321 322
	return clnt;
}

/*
 * Force a portmap lookup of the remote lockd port
 */
void
nlm_rebind_host(struct nlm_host *host)
{
	dprintk("lockd: rebind host %s\n", host->h_name);
	if (host->h_rpcclnt && time_after_eq(jiffies, host->h_nextrebind)) {
323
		rpc_force_rebind(host->h_rpcclnt);
L
Linus Torvalds 已提交
324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348
		host->h_nextrebind = jiffies + NLM_HOST_REBIND;
	}
}

/*
 * Increment NLM host count
 */
struct nlm_host * nlm_get_host(struct nlm_host *host)
{
	if (host) {
		dprintk("lockd: get host %s\n", host->h_name);
		atomic_inc(&host->h_count);
		host->h_expires = jiffies + NLM_HOST_EXPIRE;
	}
	return host;
}

/*
 * Release NLM host after use
 *
 * Drops one reference on @host; a NULL @host is ignored.  The host is
 * not freed here.  When the count reaches zero this function only
 * checks that the host no longer owns any lock owners, granted locks
 * or locks awaiting reclaim.
 */
void nlm_release_host(struct nlm_host *host)
{
	if (host == NULL)
		return;

	dprintk("lockd: release host %s\n", host->h_name);
	BUG_ON(atomic_read(&host->h_count) < 0);

	if (!atomic_dec_and_test(&host->h_count))
		return;

	/* That was the last reference: nothing may still hang off the host */
	BUG_ON(!list_empty(&host->h_lockowners));
	BUG_ON(!list_empty(&host->h_granted));
	BUG_ON(!list_empty(&host->h_reclaim));
}

357 358 359 360 361
/*
 * We were notified that the host indicated by address &sin
 * has rebooted.
 * Release all resources held by that peer.
 */
362
void nlm_host_rebooted(const struct sockaddr_in *sin,
363 364
				const char *hostname,
				unsigned int hostname_len,
365
				u32 new_state)
366
{
367 368
	struct hlist_head *chain;
	struct hlist_node *pos;
369
	struct nsm_handle *nsm;
370
	struct nlm_host	*host;
371

372
	/* Find the NSM handle for this peer */
373 374 375 376
	nsm = __nsm_find(sin, hostname, hostname_len, 0);
	if (nsm == NULL) {
		dprintk("lockd: never saw rebooted peer '%.*s' before\n",
				hostname_len, hostname);
377
		return;
378 379 380 381
	}

	dprintk("lockd: nlm_host_rebooted(%.*s, %s)\n",
			hostname_len, hostname, nsm->sm_addrbuf);
382

383 384 385 386 387 388 389 390 391 392
	/* When reclaiming locks on this peer, make sure that
	 * we set up a new notification */
	nsm->sm_monitored = 0;

	/* Mark all hosts tied to this NSM state as having rebooted.
	 * We run the loop repeatedly, because we drop the host table
	 * lock for this.
	 * To avoid processing a host several times, we match the nsmstate.
	 */
again:	mutex_lock(&nlm_host_mutex);
393 394
	for (chain = nlm_hosts; chain < nlm_hosts + NLM_HOST_NRHASH; ++chain) {
		hlist_for_each_entry(host, pos, chain, h_hash) {
395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415
			if (host->h_nsmhandle == nsm
			 && host->h_nsmstate != new_state) {
				host->h_nsmstate = new_state;
				host->h_state++;

				nlm_get_host(host);
				mutex_unlock(&nlm_host_mutex);

				if (host->h_server) {
					/* We're server for this guy, just ditch
					 * all the locks he held. */
					nlmsvc_free_host_resources(host);
				} else {
					/* He's the server, initiate lock recovery. */
					nlmclnt_recovery(host);
				}

				nlm_release_host(host);
				goto again;
			}
		}
416
	}
417 418

	mutex_unlock(&nlm_host_mutex);
419 420
}

L
Linus Torvalds 已提交
421 422 423 424 425 426 427
/*
 * Shut down the hosts module.
 * Note that this routine is called only at server shutdown time.
 */
void
nlm_shutdown_hosts(void)
{
428 429
	struct hlist_head *chain;
	struct hlist_node *pos;
L
Linus Torvalds 已提交
430 431 432
	struct nlm_host	*host;

	dprintk("lockd: shutting down host module\n");
I
Ingo Molnar 已提交
433
	mutex_lock(&nlm_host_mutex);
L
Linus Torvalds 已提交
434 435 436

	/* First, make all hosts eligible for gc */
	dprintk("lockd: nuking all hosts...\n");
437
	for (chain = nlm_hosts; chain < nlm_hosts + NLM_HOST_NRHASH; ++chain) {
438
		hlist_for_each_entry(host, pos, chain, h_hash) {
L
Linus Torvalds 已提交
439
			host->h_expires = jiffies - 1;
440 441 442 443 444
			if (host->h_rpcclnt) {
				rpc_shutdown_client(host->h_rpcclnt);
				host->h_rpcclnt = NULL;
			}
		}
L
Linus Torvalds 已提交
445 446 447 448
	}

	/* Then, perform a garbage collection pass */
	nlm_gc_hosts();
I
Ingo Molnar 已提交
449
	mutex_unlock(&nlm_host_mutex);
L
Linus Torvalds 已提交
450 451 452 453 454

	/* complain if any hosts are left */
	if (nrhosts) {
		printk(KERN_WARNING "lockd: couldn't shutdown host module!\n");
		dprintk("lockd: %d hosts left:\n", nrhosts);
455 456
		for (chain = nlm_hosts; chain < nlm_hosts + NLM_HOST_NRHASH; ++chain) {
			hlist_for_each_entry(host, pos, chain, h_hash) {
L
Linus Torvalds 已提交
457 458 459 460 461 462 463 464 465 466 467 468 469 470 471 472
				dprintk("       %s (cnt %d use %d exp %ld)\n",
					host->h_name, atomic_read(&host->h_count),
					host->h_inuse, host->h_expires);
			}
		}
	}
}

/*
 * Garbage collect any unused NLM hosts.
 * This GC combines reference counting for async operations with
 * mark & sweep for resources held by remote clients.
 */
static void
nlm_gc_hosts(void)
{
473 474 475
	struct hlist_head *chain;
	struct hlist_node *pos, *next;
	struct nlm_host	*host;
L
Linus Torvalds 已提交
476 477

	dprintk("lockd: host garbage collection\n");
478 479
	for (chain = nlm_hosts; chain < nlm_hosts + NLM_HOST_NRHASH; ++chain) {
		hlist_for_each_entry(host, pos, chain, h_hash)
L
Linus Torvalds 已提交
480 481 482 483 484 485
			host->h_inuse = 0;
	}

	/* Mark all hosts that hold locks, blocks or shares */
	nlmsvc_mark_resources();

486 487
	for (chain = nlm_hosts; chain < nlm_hosts + NLM_HOST_NRHASH; ++chain) {
		hlist_for_each_entry_safe(host, pos, next, chain, h_hash) {
L
Linus Torvalds 已提交
488 489 490 491 492 493 494 495
			if (atomic_read(&host->h_count) || host->h_inuse
			 || time_before(jiffies, host->h_expires)) {
				dprintk("nlm_gc_hosts skipping %s (cnt %d use %d exp %ld)\n",
					host->h_name, atomic_read(&host->h_count),
					host->h_inuse, host->h_expires);
				continue;
			}
			dprintk("lockd: delete host %s\n", host->h_name);
496
			hlist_del_init(&host->h_hash);
497

498
			nlm_destroy_host(host);
L
Linus Torvalds 已提交
499 500 501 502 503 504 505
			nrhosts--;
		}
	}

	next_gc = jiffies + NLM_HOST_COLLECT;
}

506 507 508 509 510

/*
 * Manage NSM handles
 *
 * All known handles are linked on nsm_handles through sm_link.
 * nsm_lock is held while the list is searched or modified.
 */
static LIST_HEAD(nsm_handles);
static DEFINE_SPINLOCK(nsm_lock);
512 513 514

static struct nsm_handle *
__nsm_find(const struct sockaddr_in *sin,
515
		const char *hostname, unsigned int hostname_len,
516 517 518
		int create)
{
	struct nsm_handle *nsm = NULL;
J
J. Bruce Fields 已提交
519
	struct nsm_handle *pos;
520 521 522 523 524 525 526 527 528 529 530 531 532

	if (!sin)
		return NULL;

	if (hostname && memchr(hostname, '/', hostname_len) != NULL) {
		if (printk_ratelimit()) {
			printk(KERN_WARNING "Invalid hostname \"%.*s\" "
					    "in NFS lock request\n",
				hostname_len, hostname);
		}
		return NULL;
	}

533 534
retry:
	spin_lock(&nsm_lock);
J
J. Bruce Fields 已提交
535
	list_for_each_entry(pos, &nsm_handles, sm_link) {
536

537
		if (hostname && nsm_use_hostnames) {
J
J. Bruce Fields 已提交
538 539
			if (strlen(pos->sm_name) != hostname_len
			 || memcmp(pos->sm_name, hostname, hostname_len))
540
				continue;
J
J. Bruce Fields 已提交
541
		} else if (!nlm_cmp_addr(&pos->sm_addr, sin))
542
			continue;
J
J. Bruce Fields 已提交
543
		atomic_inc(&pos->sm_count);
544
		kfree(nsm);
J
J. Bruce Fields 已提交
545
		nsm = pos;
546
		goto found;
547
	}
548 549 550
	if (nsm) {
		list_add(&nsm->sm_link, &nsm_handles);
		goto found;
551
	}
552 553 554 555
	spin_unlock(&nsm_lock);

	if (!create)
		return NULL;
556 557

	nsm = kzalloc(sizeof(*nsm) + hostname_len + 1, GFP_KERNEL);
J
J. Bruce Fields 已提交
558
	if (nsm == NULL)
559 560
		return NULL;

J
J. Bruce Fields 已提交
561 562 563 564
	nsm->sm_addr = *sin;
	nsm->sm_name = (char *) (nsm + 1);
	memcpy(nsm->sm_name, hostname, hostname_len);
	nsm->sm_name[hostname_len] = '\0';
565 566
	nlm_display_address((struct sockaddr *)&nsm->sm_addr,
				nsm->sm_addrbuf, sizeof(nsm->sm_addrbuf));
J
J. Bruce Fields 已提交
567
	atomic_set(&nsm->sm_count, 1);
568
	goto retry;
J
J. Bruce Fields 已提交
569

570 571
found:
	spin_unlock(&nsm_lock);
572 573 574
	return nsm;
}

575
/*
 * Find the NSM handle for a peer, creating it if it does not exist yet.
 * Shorthand for __nsm_find() with @create set to 1.
 */
static struct nsm_handle *
nsm_find(const struct sockaddr_in *sin, const char *hostname,
	 unsigned int hostname_len)
{
	struct nsm_handle *handle;

	handle = __nsm_find(sin, hostname, hostname_len, 1);
	return handle;
}

/*
 * Release an NSM handle
 */
void
nsm_release(struct nsm_handle *nsm)
{
	if (!nsm)
		return;
590
	if (atomic_dec_and_lock(&nsm->sm_count, &nsm_lock)) {
591
		list_del(&nsm->sm_link);
592
		spin_unlock(&nsm_lock);
593
		kfree(nsm);
594 595
	}
}