host.c 13.2 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17
/*
 * linux/fs/lockd/host.c
 *
 * Management for NLM peer hosts. The nlm_host struct is shared
 * between client and server implementation. The only reason to
 * do so is to reduce code bloat.
 *
 * Copyright (C) 1996, Olaf Kirch <okir@monad.swb.de>
 */

#include <linux/types.h>
#include <linux/slab.h>
#include <linux/in.h>
#include <linux/sunrpc/clnt.h>
#include <linux/sunrpc/svc.h>
#include <linux/lockd/lockd.h>
#include <linux/lockd/sm_inter.h>
I
Ingo Molnar 已提交
18
#include <linux/mutex.h>
L
Linus Torvalds 已提交
19 20 21 22 23 24


#define NLMDBG_FACILITY		NLMDBG_HOSTCACHE
#define NLM_HOST_NRHASH		32
#define NLM_ADDRHASH(addr)	(ntohl(addr) & (NLM_HOST_NRHASH-1))
#define NLM_HOST_REBIND		(60 * HZ)
25 26
#define NLM_HOST_EXPIRE		(300 * HZ)
#define NLM_HOST_COLLECT	(120 * HZ)
L
Linus Torvalds 已提交
27

28
static struct hlist_head	nlm_hosts[NLM_HOST_NRHASH];
L
Linus Torvalds 已提交
29 30
static unsigned long		next_gc;
static int			nrhosts;
I
Ingo Molnar 已提交
31
static DEFINE_MUTEX(nlm_host_mutex);
L
Linus Torvalds 已提交
32 33 34


static void			nlm_gc_hosts(void);
35
static struct nsm_handle *	__nsm_find(const struct sockaddr_in *,
36
					const char *, unsigned int, int);
37 38
static struct nsm_handle *	nsm_find(const struct sockaddr_in *sin,
					 const char *hostname,
39
					 unsigned int hostname_len);
L
Linus Torvalds 已提交
40 41 42 43

/*
 * Common host lookup routine for server & client
 */
44
static struct nlm_host *
45
nlm_lookup_host(int server, const struct sockaddr_in *sin,
46
		int proto, int version, const char *hostname,
47 48
		unsigned int hostname_len,
		const struct sockaddr_in *ssin)
L
Linus Torvalds 已提交
49
{
50 51 52
	struct hlist_head *chain;
	struct hlist_node *pos;
	struct nlm_host	*host;
53
	struct nsm_handle *nsm = NULL;
L
Linus Torvalds 已提交
54 55
	int		hash;

56 57 58
	dprintk("lockd: nlm_lookup_host("NIPQUAD_FMT"->"NIPQUAD_FMT
			", p=%d, v=%d, my role=%s, name=%.*s)\n",
			NIPQUAD(ssin->sin_addr.s_addr),
59 60 61 62 63
			NIPQUAD(sin->sin_addr.s_addr), proto, version,
			server? "server" : "client",
			hostname_len,
			hostname? hostname : "<none>");

L
Linus Torvalds 已提交
64 65 66 67

	hash = NLM_ADDRHASH(sin->sin_addr.s_addr);

	/* Lock hash table */
I
Ingo Molnar 已提交
68
	mutex_lock(&nlm_host_mutex);
L
Linus Torvalds 已提交
69 70 71 72

	if (time_after_eq(jiffies, next_gc))
		nlm_gc_hosts();

73 74 75 76 77 78 79
	/* We may keep several nlm_host objects for a peer, because each
	 * nlm_host is identified by
	 * (address, protocol, version, server/client)
	 * We could probably simplify this a little by putting all those
	 * different NLM rpc_clients into one single nlm_host object.
	 * This would allow us to have one nlm_host per address.
	 */
80 81
	chain = &nlm_hosts[hash];
	hlist_for_each_entry(host, pos, chain, h_hash) {
82 83 84 85
		if (!nlm_cmp_addr(&host->h_addr, sin))
			continue;

		/* See if we have an NSM handle for this client */
86 87
		if (!nsm)
			nsm = host->h_nsmhandle;
88

L
Linus Torvalds 已提交
89 90 91 92 93 94
		if (host->h_proto != proto)
			continue;
		if (host->h_version != version)
			continue;
		if (host->h_server != server)
			continue;
95 96
		if (!nlm_cmp_addr(&host->h_saddr, ssin))
			continue;
L
Linus Torvalds 已提交
97

98 99 100 101
		/* Move to head of hash chain. */
		hlist_del(&host->h_hash);
		hlist_add_head(&host->h_hash, chain);

102 103
		nlm_get_host(host);
		goto out;
L
Linus Torvalds 已提交
104
	}
105 106
	if (nsm)
		atomic_inc(&nsm->sm_count);
L
Linus Torvalds 已提交
107

108 109
	host = NULL;

110 111 112 113 114
	/* Sadly, the host isn't in our hash table yet. See if
	 * we have an NSM handle for it. If not, create one.
	 */
	if (!nsm && !(nsm = nsm_find(sin, hostname, hostname_len)))
		goto out;
L
Linus Torvalds 已提交
115

116
	host = kzalloc(sizeof(*host), GFP_KERNEL);
117 118 119 120 121
	if (!host) {
		nsm_release(nsm);
		goto out;
	}
	host->h_name	   = nsm->sm_name;
L
Linus Torvalds 已提交
122 123
	host->h_addr       = *sin;
	host->h_addr.sin_port = 0;	/* ouch! */
124
	host->h_saddr	   = *ssin;
L
Linus Torvalds 已提交
125 126 127
	host->h_version    = version;
	host->h_proto      = proto;
	host->h_rpcclnt    = NULL;
T
Trond Myklebust 已提交
128
	mutex_init(&host->h_mutex);
L
Linus Torvalds 已提交
129 130 131 132
	host->h_nextrebind = jiffies + NLM_HOST_REBIND;
	host->h_expires    = jiffies + NLM_HOST_EXPIRE;
	atomic_set(&host->h_count, 1);
	init_waitqueue_head(&host->h_gracewait);
T
Trond Myklebust 已提交
133
	init_rwsem(&host->h_rwsem);
L
Linus Torvalds 已提交
134 135
	host->h_state      = 0;			/* pseudo NSM state */
	host->h_nsmstate   = 0;			/* real NSM state */
136
	host->h_nsmhandle  = nsm;
L
Linus Torvalds 已提交
137
	host->h_server	   = server;
138
	hlist_add_head(&host->h_hash, chain);
L
Linus Torvalds 已提交
139 140
	INIT_LIST_HEAD(&host->h_lockowners);
	spin_lock_init(&host->h_lock);
141 142
	INIT_LIST_HEAD(&host->h_granted);
	INIT_LIST_HEAD(&host->h_reclaim);
L
Linus Torvalds 已提交
143

144
	nrhosts++;
145
out:
I
Ingo Molnar 已提交
146
	mutex_unlock(&nlm_host_mutex);
L
Linus Torvalds 已提交
147 148 149
	return host;
}

150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165
/*
 * Destroy a host.
 *
 * The host must have no lock owners and a zero reference count;
 * either condition failing trips a BUG_ON().  The host is not
 * unlinked from the hash table here.
 */
static void
nlm_destroy_host(struct nlm_host *host)
{
	BUG_ON(!list_empty(&host->h_lockowners));
	BUG_ON(atomic_read(&host->h_count));

	/* Release NSM handle and unmonitor host. */
	nsm_unmonitor(host);

	/* Tear down the RPC client, if one was ever bound. */
	if (host->h_rpcclnt != NULL)
		rpc_shutdown_client(host->h_rpcclnt);

	kfree(host);
}

172 173 174 175 176
/*
 * Find an NLM server handle in the cache. If there is none, create it.
 */
struct nlm_host *
nlmclnt_lookup_host(const struct sockaddr_in *sin, int proto, int version,
177
			const char *hostname, unsigned int hostname_len)
178
{
179 180
	struct sockaddr_in ssin = {0};

181
	return nlm_lookup_host(0, sin, proto, version,
182
			       hostname, hostname_len, &ssin);
183 184 185 186 187 188 189
}

/*
 * Find an NLM client handle in the cache. If there is none, create it.
 */
struct nlm_host *
nlmsvc_lookup_host(struct svc_rqst *rqstp,
190
			const char *hostname, unsigned int hostname_len)
191
{
192 193 194
	struct sockaddr_in ssin = {0};

	ssin.sin_addr = rqstp->rq_daddr.addr;
195
	return nlm_lookup_host(1, svc_addr_in(rqstp),
196
			       rqstp->rq_prot, rqstp->rq_vers,
197
			       hostname, hostname_len, &ssin);
198 199
}

L
Linus Torvalds 已提交
200 201 202 203 204 205 206 207
/*
 * Create the NLM RPC client for an NLM peer
 */
struct rpc_clnt *
nlm_bind_host(struct nlm_host *host)
{
	struct rpc_clnt	*clnt;

208 209 210
	dprintk("lockd: nlm_bind_host("NIPQUAD_FMT"->"NIPQUAD_FMT")\n",
			NIPQUAD(host->h_saddr.sin_addr),
			NIPQUAD(host->h_addr.sin_addr));
L
Linus Torvalds 已提交
211 212

	/* Lock host handle */
T
Trond Myklebust 已提交
213
	mutex_lock(&host->h_mutex);
L
Linus Torvalds 已提交
214 215 216 217 218

	/* If we've already created an RPC client, check whether
	 * RPC rebind is required
	 */
	if ((clnt = host->h_rpcclnt) != NULL) {
219
		if (time_after_eq(jiffies, host->h_nextrebind)) {
220
			rpc_force_rebind(clnt);
L
Linus Torvalds 已提交
221 222 223 224 225
			host->h_nextrebind = jiffies + NLM_HOST_REBIND;
			dprintk("lockd: next rebind in %ld jiffies\n",
					host->h_nextrebind - jiffies);
		}
	} else {
226
		unsigned long increment = nlmsvc_timeout;
227 228 229 230 231 232 233 234 235 236
		struct rpc_timeout timeparms = {
			.to_initval	= increment,
			.to_increment	= increment,
			.to_maxval	= increment * 6UL,
			.to_retries	= 5U,
		};
		struct rpc_create_args args = {
			.protocol	= host->h_proto,
			.address	= (struct sockaddr *)&host->h_addr,
			.addrsize	= sizeof(host->h_addr),
237
			.saddress	= (struct sockaddr *)&host->h_saddr,
238 239 240 241 242
			.timeout	= &timeparms,
			.servername	= host->h_name,
			.program	= &nlm_program,
			.version	= host->h_version,
			.authflavor	= RPC_AUTH_UNIX,
243
			.flags		= (RPC_CLNT_CREATE_NOPING |
244 245 246
					   RPC_CLNT_CREATE_AUTOBIND),
		};

247 248 249 250 251 252 253 254
		/*
		 * lockd retries server side blocks automatically so we want
		 * those to be soft RPC calls. Client side calls need to be
		 * hard RPC tasks.
		 */
		if (!host->h_server)
			args.flags |= RPC_CLNT_CREATE_HARDRTRY;

255 256 257 258 259 260 261
		clnt = rpc_create(&args);
		if (!IS_ERR(clnt))
			host->h_rpcclnt = clnt;
		else {
			printk("lockd: couldn't create RPC handle for %s\n", host->h_name);
			clnt = NULL;
		}
L
Linus Torvalds 已提交
262 263
	}

T
Trond Myklebust 已提交
264
	mutex_unlock(&host->h_mutex);
L
Linus Torvalds 已提交
265 266 267 268 269 270 271 272 273 274 275
	return clnt;
}

/*
 * Force a portmap lookup of the remote lockd port
 */
void
nlm_rebind_host(struct nlm_host *host)
{
	dprintk("lockd: rebind host %s\n", host->h_name);
	if (host->h_rpcclnt && time_after_eq(jiffies, host->h_nextrebind)) {
276
		rpc_force_rebind(host->h_rpcclnt);
L
Linus Torvalds 已提交
277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301
		host->h_nextrebind = jiffies + NLM_HOST_REBIND;
	}
}

/*
 * Increment NLM host count
 */
struct nlm_host * nlm_get_host(struct nlm_host *host)
{
	if (host) {
		dprintk("lockd: get host %s\n", host->h_name);
		atomic_inc(&host->h_count);
		host->h_expires = jiffies + NLM_HOST_EXPIRE;
	}
	return host;
}

/*
 * Release NLM host after use.
 *
 * Drops one reference.  The host is not freed here even when the
 * count reaches zero; at that point the function only asserts that
 * the lock owner, granted and reclaim lists are empty.  A NULL host
 * is ignored.
 */
void nlm_release_host(struct nlm_host *host)
{
	if (host == NULL)
		return;

	dprintk("lockd: release host %s\n", host->h_name);
	BUG_ON(atomic_read(&host->h_count) < 0);

	if (!atomic_dec_and_test(&host->h_count))
		return;

	/* Last reference gone: nothing may still hang off this host. */
	BUG_ON(!list_empty(&host->h_lockowners));
	BUG_ON(!list_empty(&host->h_granted));
	BUG_ON(!list_empty(&host->h_reclaim));
}

310 311 312 313 314
/*
 * We were notified that the host indicated by address &sin
 * has rebooted.
 * Release all resources held by that peer.
 */
315
void nlm_host_rebooted(const struct sockaddr_in *sin,
316 317
				const char *hostname,
				unsigned int hostname_len,
318
				u32 new_state)
319
{
320 321
	struct hlist_head *chain;
	struct hlist_node *pos;
322
	struct nsm_handle *nsm;
323
	struct nlm_host	*host;
324

325 326 327 328 329
	dprintk("lockd: nlm_host_rebooted(%s, %u.%u.%u.%u)\n",
			hostname, NIPQUAD(sin->sin_addr));

	/* Find the NSM handle for this peer */
	if (!(nsm = __nsm_find(sin, hostname, hostname_len, 0)))
330 331
		return;

332 333 334 335 336 337 338 339 340 341
	/* When reclaiming locks on this peer, make sure that
	 * we set up a new notification */
	nsm->sm_monitored = 0;

	/* Mark all hosts tied to this NSM state as having rebooted.
	 * We run the loop repeatedly, because we drop the host table
	 * lock for this.
	 * To avoid processing a host several times, we match the nsmstate.
	 */
again:	mutex_lock(&nlm_host_mutex);
342 343
	for (chain = nlm_hosts; chain < nlm_hosts + NLM_HOST_NRHASH; ++chain) {
		hlist_for_each_entry(host, pos, chain, h_hash) {
344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364
			if (host->h_nsmhandle == nsm
			 && host->h_nsmstate != new_state) {
				host->h_nsmstate = new_state;
				host->h_state++;

				nlm_get_host(host);
				mutex_unlock(&nlm_host_mutex);

				if (host->h_server) {
					/* We're server for this guy, just ditch
					 * all the locks he held. */
					nlmsvc_free_host_resources(host);
				} else {
					/* He's the server, initiate lock recovery. */
					nlmclnt_recovery(host);
				}

				nlm_release_host(host);
				goto again;
			}
		}
365
	}
366 367

	mutex_unlock(&nlm_host_mutex);
368 369
}

L
Linus Torvalds 已提交
370 371 372 373 374 375 376
/*
 * Shut down the hosts module.
 * Note that this routine is called only at server shutdown time.
 */
void
nlm_shutdown_hosts(void)
{
377 378
	struct hlist_head *chain;
	struct hlist_node *pos;
L
Linus Torvalds 已提交
379 380 381
	struct nlm_host	*host;

	dprintk("lockd: shutting down host module\n");
I
Ingo Molnar 已提交
382
	mutex_lock(&nlm_host_mutex);
L
Linus Torvalds 已提交
383 384 385

	/* First, make all hosts eligible for gc */
	dprintk("lockd: nuking all hosts...\n");
386
	for (chain = nlm_hosts; chain < nlm_hosts + NLM_HOST_NRHASH; ++chain) {
387
		hlist_for_each_entry(host, pos, chain, h_hash) {
L
Linus Torvalds 已提交
388
			host->h_expires = jiffies - 1;
389 390 391 392 393
			if (host->h_rpcclnt) {
				rpc_shutdown_client(host->h_rpcclnt);
				host->h_rpcclnt = NULL;
			}
		}
L
Linus Torvalds 已提交
394 395 396 397
	}

	/* Then, perform a garbage collection pass */
	nlm_gc_hosts();
I
Ingo Molnar 已提交
398
	mutex_unlock(&nlm_host_mutex);
L
Linus Torvalds 已提交
399 400 401 402 403

	/* complain if any hosts are left */
	if (nrhosts) {
		printk(KERN_WARNING "lockd: couldn't shutdown host module!\n");
		dprintk("lockd: %d hosts left:\n", nrhosts);
404 405
		for (chain = nlm_hosts; chain < nlm_hosts + NLM_HOST_NRHASH; ++chain) {
			hlist_for_each_entry(host, pos, chain, h_hash) {
L
Linus Torvalds 已提交
406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421
				dprintk("       %s (cnt %d use %d exp %ld)\n",
					host->h_name, atomic_read(&host->h_count),
					host->h_inuse, host->h_expires);
			}
		}
	}
}

/*
 * Garbage collect any unused NLM hosts.
 * This GC combines reference counting for async operations with
 * mark & sweep for resources held by remote clients.
 */
static void
nlm_gc_hosts(void)
{
422 423 424
	struct hlist_head *chain;
	struct hlist_node *pos, *next;
	struct nlm_host	*host;
L
Linus Torvalds 已提交
425 426

	dprintk("lockd: host garbage collection\n");
427 428
	for (chain = nlm_hosts; chain < nlm_hosts + NLM_HOST_NRHASH; ++chain) {
		hlist_for_each_entry(host, pos, chain, h_hash)
L
Linus Torvalds 已提交
429 430 431 432 433 434
			host->h_inuse = 0;
	}

	/* Mark all hosts that hold locks, blocks or shares */
	nlmsvc_mark_resources();

435 436
	for (chain = nlm_hosts; chain < nlm_hosts + NLM_HOST_NRHASH; ++chain) {
		hlist_for_each_entry_safe(host, pos, next, chain, h_hash) {
L
Linus Torvalds 已提交
437 438 439 440 441 442 443 444
			if (atomic_read(&host->h_count) || host->h_inuse
			 || time_before(jiffies, host->h_expires)) {
				dprintk("nlm_gc_hosts skipping %s (cnt %d use %d exp %ld)\n",
					host->h_name, atomic_read(&host->h_count),
					host->h_inuse, host->h_expires);
				continue;
			}
			dprintk("lockd: delete host %s\n", host->h_name);
445
			hlist_del_init(&host->h_hash);
446

447
			nlm_destroy_host(host);
L
Linus Torvalds 已提交
448 449 450 451 452 453 454
			nrhosts--;
		}
	}

	next_gc = jiffies + NLM_HOST_COLLECT;
}

455 456 457 458 459

/*
 * Manage NSM handles
 *
 * nsm_mutex is held while nsm_handles is searched or modified.
 */
static DEFINE_MUTEX(nsm_mutex);
/* List of all NSM handles, linked through sm_link. */
static LIST_HEAD(nsm_handles);
461 462 463

static struct nsm_handle *
__nsm_find(const struct sockaddr_in *sin,
464
		const char *hostname, unsigned int hostname_len,
465 466 467
		int create)
{
	struct nsm_handle *nsm = NULL;
J
J. Bruce Fields 已提交
468
	struct nsm_handle *pos;
469 470 471 472 473 474 475 476 477 478 479 480 481

	if (!sin)
		return NULL;

	if (hostname && memchr(hostname, '/', hostname_len) != NULL) {
		if (printk_ratelimit()) {
			printk(KERN_WARNING "Invalid hostname \"%.*s\" "
					    "in NFS lock request\n",
				hostname_len, hostname);
		}
		return NULL;
	}

482
	mutex_lock(&nsm_mutex);
J
J. Bruce Fields 已提交
483
	list_for_each_entry(pos, &nsm_handles, sm_link) {
484

485
		if (hostname && nsm_use_hostnames) {
J
J. Bruce Fields 已提交
486 487
			if (strlen(pos->sm_name) != hostname_len
			 || memcmp(pos->sm_name, hostname, hostname_len))
488
				continue;
J
J. Bruce Fields 已提交
489
		} else if (!nlm_cmp_addr(&pos->sm_addr, sin))
490
			continue;
J
J. Bruce Fields 已提交
491 492
		atomic_inc(&pos->sm_count);
		nsm = pos;
493 494 495 496 497 498 499 500 501
		goto out;
	}

	if (!create) {
		nsm = NULL;
		goto out;
	}

	nsm = kzalloc(sizeof(*nsm) + hostname_len + 1, GFP_KERNEL);
J
J. Bruce Fields 已提交
502 503 504 505 506 507 508 509 510
	if (nsm == NULL)
		goto out;
	nsm->sm_addr = *sin;
	nsm->sm_name = (char *) (nsm + 1);
	memcpy(nsm->sm_name, hostname, hostname_len);
	nsm->sm_name[hostname_len] = '\0';
	atomic_set(&nsm->sm_count, 1);

	list_add(&nsm->sm_link, &nsm_handles);
511

512 513
out:
	mutex_unlock(&nsm_mutex);
514 515 516
	return nsm;
}

517
/*
 * Find the NSM handle for a peer, creating it if none exists yet.
 * Thin wrapper around __nsm_find() with creation enabled.
 */
static struct nsm_handle *
nsm_find(const struct sockaddr_in *sin, const char *hostname,
	 unsigned int hostname_len)
{
	const int create = 1;

	return __nsm_find(sin, hostname, hostname_len, create);
}

/*
 * Release an NSM handle
 */
void
nsm_release(struct nsm_handle *nsm)
{
	if (!nsm)
		return;
532
	mutex_lock(&nsm_mutex);
533
	if (atomic_dec_and_test(&nsm->sm_count)) {
534 535
		list_del(&nsm->sm_link);
		kfree(nsm);
536
	}
537
	mutex_unlock(&nsm_mutex);
538
}