state.h 16.3 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37
/*
 *  Copyright (c) 2001 The Regents of the University of Michigan.
 *  All rights reserved.
 *
 *  Kendrick Smith <kmsmith@umich.edu>
 *  Andy Adamson <andros@umich.edu>
 *  
 *  Redistribution and use in source and binary forms, with or without
 *  modification, are permitted provided that the following conditions
 *  are met:
 *  
 *  1. Redistributions of source code must retain the above copyright
 *     notice, this list of conditions and the following disclaimer.
 *  2. Redistributions in binary form must reproduce the above copyright
 *     notice, this list of conditions and the following disclaimer in the
 *     documentation and/or other materials provided with the distribution.
 *  3. Neither the name of the University nor the names of its
 *     contributors may be used to endorse or promote products derived
 *     from this software without specific prior written permission.
 *
 *  THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED
 *  WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
 *  MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
 *  DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
 *  FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 *  CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 *  SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
 *  BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
 *  LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
 *  NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
 *  SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 *
 */

#ifndef _NFSD4_STATE_H
#define _NFSD4_STATE_H

38
#include <linux/sunrpc/svc_xprt.h>
39
#include <linux/nfsd/nfsfh.h>
40
#include "nfsfh.h"
L
Linus Torvalds 已提交
41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60

/*
 * Client identifier: a pair of 32-bit values.
 * NOTE(review): cl_boot presumably identifies the server boot instance
 * that issued the id, and cl_id the client within it -- confirm.
 */
typedef struct {
	u32             cl_boot;
	u32             cl_id;
} clientid_t;

/*
 * Opaque part of a stateid: three 32-bit fields.  It is embedded in
 * stateid_t as si_opaque and normally reached through the si_boot,
 * si_stateownerid and si_fileid accessor macros.
 */
typedef struct {
	u32             so_boot;
	u32             so_stateownerid;
	u32             so_fileid;
} stateid_opaque_t;

/*
 * A stateid: a generation counter followed by the opaque
 * (boot, stateowner id, file id) triple.
 */
typedef struct {
	u32                     si_generation;
	stateid_opaque_t        si_opaque;
} stateid_t;
/* Shorthand so the opaque members can be named directly on a stateid_t. */
#define si_boot           si_opaque.so_boot
#define si_stateownerid   si_opaque.so_stateownerid
#define si_fileid         si_opaque.so_fileid

61 62 63 64 65 66 67
/*
 * Helpers for printing a stateid with a printf-style function:
 * STATEID_FMT is the format string and STATEID_VAL(s) supplies the four
 * matching arguments (boot, stateownerid, fileid, generation) for a
 * stateid_t pointer s.
 *
 * STATEID_VAL expands to a bare comma-separated list, so it is only
 * meaningful inside an argument list, and s is evaluated four times.
 */
#define STATEID_FMT	"(%08x/%08x/%08x/%08x)"
#define STATEID_VAL(s) \
	(s)->si_boot, \
	(s)->si_stateownerid, \
	(s)->si_fileid, \
	(s)->si_generation

68
struct nfsd4_callback {
69 70
	void *cb_op;
	struct nfs4_client *cb_clp;
71
	struct list_head cb_per_client;
72
	u32 cb_minorversion;
J
J. Bruce Fields 已提交
73 74
	struct rpc_message cb_msg;
	const struct rpc_call_ops *cb_ops;
75
	struct work_struct cb_work;
76
	bool cb_done;
77 78
};

79 80 81 82 83 84 85 86 87
/*
 * Common stateid header.  It is embedded in nfs4_delegation (dl_stid)
 * and nfs4_ol_stateid (st_stid); delegstateid() and openlockstateid()
 * use container_of() on it to recover the enclosing object.
 */
struct nfs4_stid {
/* NOTE(review): presumably the values stored in sc_type -- confirm */
#define NFS4_OPEN_STID 1
#define NFS4_LOCK_STID 2
#define NFS4_DELEG_STID 4
	char sc_type;
	struct list_head sc_hash;
	stateid_t sc_stateid;
};

L
Linus Torvalds 已提交
88
struct nfs4_delegation {
89 90
	struct list_head	dl_perfile;
	struct list_head	dl_perclnt;
L
Linus Torvalds 已提交
91 92 93 94 95 96
	struct list_head	dl_recall_lru;  /* delegation recalled */
	atomic_t		dl_count;       /* ref count */
	struct nfs4_client	*dl_client;
	struct nfs4_file	*dl_file;
	u32			dl_type;
	time_t			dl_time;
97
/* For recall: */
98
	struct nfs4_stid	dl_stid;
99
	struct knfsd_fh		dl_fh;
100
	int			dl_retries;
101
	struct nfsd4_callback	dl_recall;
L
Linus Torvalds 已提交
102 103 104
};

/* client delegation callback info */
105
struct nfs4_cb_conn {
L
Linus Torvalds 已提交
106
	/* SETCLIENTID info */
107
	struct sockaddr_storage	cb_addr;
108
	struct sockaddr_storage	cb_saddr;
109
	size_t			cb_addrlen;
110 111
	u32                     cb_prog; /* used only in 4.0 case;
					    per-session otherwise */
112
	u32                     cb_ident;	/* minorversion 0 only */
113
	struct svc_xprt		*cb_xprt;	/* minorversion 1 only */
L
Linus Torvalds 已提交
114 115
};

116 117 118 119 120
/*
 * Map an embedded nfs4_stid back to the nfs4_delegation containing it.
 * Nothing here checks the stid's type: the caller must pass a pointer
 * that really is the dl_stid member of a delegation.
 */
static inline struct nfs4_delegation *delegstateid(struct nfs4_stid *s)
{
	struct nfs4_delegation *dp;

	dp = container_of(s, struct nfs4_delegation, dl_stid);
	return dp;
}

121 122
/* Maximum number of slots per session. 160 is useful for long haul TCP */
#define NFSD_MAX_SLOTS_PER_SESSION     160
/* Maximum number of operations per session compound */
#define NFSD_MAX_OPS_PER_COMPOUND	16
/* Maximum per-slot cache size of a session */
#define NFSD_SLOT_CACHE_SIZE		1024
/* Maximum number of NFSD_SLOT_CACHE_SIZE slots per session */
#define NFSD_CACHE_SIZE_SLOTS_PER_SESSION	32
/* Upper bound on per-session cache memory: slot count times slot size */
#define NFSD_MAX_MEM_PER_SESSION  \
		(NFSD_CACHE_SIZE_SLOTS_PER_SESSION * NFSD_SLOT_CACHE_SIZE)
131

A
Andy Adamson 已提交
132
struct nfsd4_slot {
133 134 135 136 137 138 139
	bool	sl_inuse;
	bool	sl_cachethis;
	u16	sl_opcnt;
	u32	sl_seqid;
	__be32	sl_status;
	u32	sl_datalen;
	char	sl_data[];
A
Andy Adamson 已提交
140 141
};

142 143 144 145 146 147 148 149 150 151 152
/*
 * Attributes of one session channel.  Used for both the fore and the
 * back channel in nfsd4_create_session (fore_channel / back_channel)
 * and in nfsd4_session (se_fchannel / se_bchannel).
 */
struct nfsd4_channel_attrs {
	u32		headerpadsz;
	u32		maxreq_sz;
	u32		maxresp_sz;
	u32		maxresp_cached;
	u32		maxops;
	u32		maxreqs;
	u32		nr_rdma_attrs;
	u32		rdma_attrs;
};

153 154 155 156 157 158 159 160 161 162 163 164
/*
 * Session-creation parameters.  A copy is kept in nfsd4_clid_slot as
 * sl_cr_ses.
 * NOTE(review): presumably holds both the arguments and the results of
 * the CREATE_SESSION operation -- confirm.
 */
struct nfsd4_create_session {
	clientid_t			clientid;
	struct nfs4_sessionid		sessionid;
	u32				seqid;
	u32				flags;
	struct nfsd4_channel_attrs	fore_channel;
	struct nfsd4_channel_attrs	back_channel;
	u32				callback_prog;
	u32				uid;
	u32				gid;
};

165 166 167 168 169
/*
 * A session id together with a direction value.
 * NOTE(review): dir presumably selects fore and/or back channel for the
 * connection being bound -- confirm.
 */
struct nfsd4_bind_conn_to_session {
	struct nfs4_sessionid		sessionid;
	u32				dir;
};

170 171 172 173 174 175 176
/*
 * The single slot clientid cache structure.
 *
 * Embedded in nfs4_client as cl_cs_slot (the create_session slot); it
 * stores a sequence id, a status and a copy of the create-session data.
 */
struct nfsd4_clid_slot {
	u32				sl_seqid;
	__be32				sl_status;
	struct nfsd4_create_session	sl_cr_ses;
};

177 178 179
struct nfsd4_conn {
	struct list_head cn_persession;
	struct svc_xprt *cn_xprt;
180 181
	struct svc_xpt_user cn_xpt_user;
	struct nfsd4_session *cn_session;
182 183 184 185
/* CDFC4_FORE, CDFC4_BACK: */
	unsigned char cn_flags;
};

A
Andy Adamson 已提交
186 187 188 189 190
struct nfsd4_session {
	struct kref		se_ref;
	struct list_head	se_hash;	/* hash by sessionid */
	struct list_head	se_perclnt;
	u32			se_flags;
B
Benny Halevy 已提交
191
	struct nfs4_client	*se_client;
A
Andy Adamson 已提交
192
	struct nfs4_sessionid	se_sessionid;
193 194
	struct nfsd4_channel_attrs se_fchannel;
	struct nfsd4_channel_attrs se_bchannel;
195
	struct list_head	se_conns;
196
	u32			se_cb_prog;
197
	u32			se_cb_seq_nr;
198
	struct nfsd4_slot	*se_slots[];	/* forward channel slots */
A
Andy Adamson 已提交
199 200 201 202 203 204 205 206 207 208 209 210 211 212 213
};

/*
 * Drop one reference on @ses.  free_session() is handed to kref_put()
 * as the release function, so @ses must not be used afterwards unless
 * the caller still holds another reference.
 */
static inline void
nfsd4_put_session(struct nfsd4_session *ses)
{
	/* Declared locally; free_session() is defined outside this header. */
	extern void free_session(struct kref *kref);
	kref_put(&ses->se_ref, free_session);
}

/*
 * Take an additional reference on @ses; balance with
 * nfsd4_put_session().
 */
static inline void
nfsd4_get_session(struct nfsd4_session *ses)
{
	kref_get(&ses->se_ref);
}

M
Marc Eshel 已提交
214 215 216 217 218 219 220
/*
 * formatted contents of nfs4_sessionid
 *
 * NOTE(review): presumably overlaid on the opaque bytes of
 * struct nfs4_sessionid, in which case the two sizes must match --
 * confirm.
 */
struct nfsd4_sessionid {
	clientid_t	clientid;
	u32		sequence;
	u32		reserved;
};

N
NeilBrown 已提交
221 222
#define HEXDIR_LEN     33 /* hex version of 16 byte md5 of cl_name plus '\0' */

L
Linus Torvalds 已提交
223 224 225 226 227 228 229 230 231 232 233 234 235
/*
 * struct nfs4_client - one per client.  Clientids live here.
 * 	o Each nfs4_client is hashed by clientid.
 *
 * 	o Each nfs4_clients is also hashed by name 
 * 	  (the opaque quantity initially sent by the client to identify itself).
 * 	  
 *	o cl_perclient list is used to ensure no dangling stateowner references
 *	  when we expire the nfs4_client
 */
struct nfs4_client {
	struct list_head	cl_idhash; 	/* hash by cl_clientid.id */
	struct list_head	cl_strhash; 	/* hash by cl_name */
236 237
	struct list_head	cl_openowners;
	struct list_head	cl_delegations;
L
Linus Torvalds 已提交
238 239
	struct list_head        cl_lru;         /* tail queue */
	struct xdr_netobj	cl_name; 	/* id generated by client */
N
NeilBrown 已提交
240
	char                    cl_recdir[HEXDIR_LEN]; /* recovery dir */
L
Linus Torvalds 已提交
241 242
	nfs4_verifier		cl_verifier; 	/* generated by client */
	time_t                  cl_time;        /* time of last lease renewal */
243
	struct sockaddr_storage	cl_addr; 	/* client ipaddress */
244
	u32			cl_flavor;	/* setclientid pseudoflavor */
245
	char			*cl_principal;	/* setclientid principal name */
L
Linus Torvalds 已提交
246 247 248
	struct svc_cred		cl_cred; 	/* setclientid principal */
	clientid_t		cl_clientid;	/* generated by server */
	nfs4_verifier		cl_confirm;	/* generated by server */
249
	u32			cl_firststate;	/* recovery dir creation */
250
	u32			cl_minorversion;
251

252 253
	/* for v4.0 and v4.1 callbacks: */
	struct nfs4_cb_conn	cl_cb_conn;
254 255 256
#define NFSD4_CLIENT_CB_UPDATE	1
#define NFSD4_CLIENT_KILL	2
	unsigned long		cl_cb_flags;
257
	struct rpc_clnt		*cl_cb_client;
258
	u32			cl_cb_ident;
259 260 261 262
#define NFSD4_CB_UP		0
#define NFSD4_CB_UNKNOWN	1
#define NFSD4_CB_DOWN		2
	int			cl_cb_state;
263
	struct nfsd4_callback	cl_cb_null;
264
	struct nfsd4_session	*cl_cb_session;
265
	struct list_head	cl_callbacks; /* list of in-progress callbacks */
266

267 268 269
	/* for all client information that callback code might need: */
	spinlock_t		cl_lock;

270 271
	/* for nfs41 */
	struct list_head	cl_sessions;
272
	struct nfsd4_clid_slot	cl_cs_slot;	/* create_session slot */
A
Andy Adamson 已提交
273
	u32			cl_exchange_flags;
274 275
	/* number of rpc's in progress over an associated session: */
	atomic_t		cl_refcount;
276 277

	/* for nfs41 callbacks */
278 279 280 281
	/* We currently support a single back channel with a single slot */
	unsigned long		cl_cb_slot_busy;
	struct rpc_wait_queue	cl_cb_waitq;	/* backchannel callers may */
						/* wait here for slots */
L
Linus Torvalds 已提交
282 283
};

B
Benny Halevy 已提交
284 285 286 287 288 289 290 291 292 293 294 295
/*
 * Flag @clp as expired by zeroing cl_time (the time of last lease
 * renewal).  is_client_expired() tests for exactly this value.
 */
static inline void
mark_client_expired(struct nfs4_client *clp)
{
	clp->cl_time = 0;
}

/*
 * Report whether @clp has been flagged as expired, i.e. whether its
 * cl_time has been zeroed by mark_client_expired().
 */
static inline bool
is_client_expired(struct nfs4_client *clp)
{
	return !clp->cl_time;
}

L
Linus Torvalds 已提交
296 297 298 299 300 301 302
/* struct nfs4_client_reset
 * one per old client. Populates reset_str_hashtbl. Filled from conf_id_hashtbl
 * upon lease reset, or from upcall to state_daemon (to read in state
 * from non-volitile storage) upon reboot.
 */
struct nfs4_client_reclaim {
	struct list_head	cr_strhash;	/* hash by cr_name */
N
NeilBrown 已提交
303
	char			cr_recdir[HEXDIR_LEN]; /* recover dir */
L
Linus Torvalds 已提交
304 305 306 307 308 309
};

/*
 * Advance the generation counter of @stateid by one.  si_generation is
 * a u32 and therefore wraps; when the increment wraps to 0 the counter
 * is set to 1 instead, so an update never yields generation 0.
 */
static inline void
update_stateid(stateid_t *stateid)
{
	stateid->si_generation++;
	/* Wraparound recommendation from 3530bis-13 9.1.3.2: */
	if (stateid->si_generation == 0)
		stateid->si_generation = 1;
}

/* A reasonable value for REPLAY_ISIZE was estimated as follows:  
 * The OPEN response, typically the largest, requires 
 *   4(status) + 8(stateid) + 20(changeinfo) + 4(rflags) +  8(verifier) + 
 *   4(deleg. type) + 8(deleg. stateid) + 4(deleg. recall flag) + 
 *   20(deleg. space limit) + ~32(deleg. ace) = 112 bytes 
 */

#define NFSD4_REPLAY_ISIZE       112 

/*
 * Replay buffer, where the result of the last seqid-mutating operation 
 * is cached. 
 */
struct nfs4_replay {
329
	__be32			rp_status;
L
Linus Torvalds 已提交
330 331
	unsigned int		rp_buflen;
	char			*rp_buf;
332
	struct knfsd_fh		rp_openfh;
L
Linus Torvalds 已提交
333 334 335 336 337 338 339 340 341 342 343 344
	char			rp_ibuf[NFSD4_REPLAY_ISIZE];
};

/*
* nfs4_stateowner can either be an open_owner, or a lock_owner
*
*    so_idhash:  stateid_hashtbl[] for open owner, lockstateid_hashtbl[]
*         for lock_owner
*    so_strhash: ownerstr_hashtbl[] for open_owner, lock_ownerstr_hashtbl[]
*         for lock_owner
*    so_perclient: nfs4_client->cl_perclient entry - used when nfs4_client
*         struct is reaped.
345 346
*    so_perfilestate: heads the list of nfs4_ol_stateid (either open or lock) 
*         and is used to ensure no dangling nfs4_ol_stateid references when we 
L
Linus Torvalds 已提交
347
*         release a stateowner.
348
*    so_perlockowner: (open) nfs4_ol_stateid->st_perlockowner entry - used when
L
Linus Torvalds 已提交
349 350 351 352 353
*         close is called to reap associated byte-range locks
*    so_close_lru: (open) stateowner is placed on this list instead of being
*         reaped (when so_perfilestate is empty) to hold the last close replay.
*         reaped by laundramat thread after lease period.
*/
354

L
Linus Torvalds 已提交
355 356 357
struct nfs4_stateowner {
	struct list_head        so_idhash;   /* hash by so_id */
	struct list_head        so_strhash;   /* hash by op_name */
358
	struct list_head        so_stateids;
L
Linus Torvalds 已提交
359 360 361
	int			so_is_open_owner; /* 1=openowner,0=lockowner */
	u32                     so_id;
	struct nfs4_client *    so_client;
N
NeilBrown 已提交
362 363 364
	/* after increment in ENCODE_SEQID_OP_TAIL, represents the next
	 * sequence id expected from the client: */
	u32                     so_seqid;
L
Linus Torvalds 已提交
365 366 367 368
	struct xdr_netobj       so_owner;     /* open owner name */
	struct nfs4_replay	so_replay;
};

369 370 371 372
/*
 * Open-owner specialisation of nfs4_stateowner.  openowner() converts a
 * pointer to the embedded oo_owner back to the nfs4_openowner.
 */
struct nfs4_openowner {
	struct nfs4_stateowner	oo_owner; /* must be first field */
	struct list_head        oo_perclient;
	struct list_head	oo_close_lru; /* tail queue */
	struct nfs4_ol_stateid *oo_last_closed_stid;
	time_t			oo_time; /* time of placement on so_close_lru */
/* Bit values for oo_flags: */
#define NFS4_OO_CONFIRMED   1
#define NFS4_OO_PURGE_CLOSE 2
	unsigned char		oo_flags;
};

/*
 * Lock-owner specialisation of nfs4_stateowner.  lockowner() converts a
 * pointer to the embedded lo_owner back to the nfs4_lockowner.
 */
struct nfs4_lockowner {
	struct nfs4_stateowner	lo_owner; /* must be first element */
	struct list_head        lo_perstateid; /* for lockowners only */
	struct list_head	lo_list; /* for temporary uses */
};

/*
 * Convert a generic stateowner pointer into the nfs4_openowner that
 * embeds it.  Only valid when @so is the oo_owner member of an open
 * owner; no check is made here.
 */
static inline struct nfs4_openowner * openowner(struct nfs4_stateowner *so)
{
	struct nfs4_openowner *oo;

	oo = container_of(so, struct nfs4_openowner, oo_owner);
	return oo;
}

/*
 * Convert a generic stateowner pointer into the nfs4_lockowner that
 * embeds it.  Only valid when @so is the lo_owner member of a lock
 * owner; no check is made here.
 */
static inline struct nfs4_lockowner * lockowner(struct nfs4_stateowner *so)
{
	struct nfs4_lockowner *lo;

	lo = container_of(so, struct nfs4_lockowner, lo_owner);
	return lo;
}

L
Linus Torvalds 已提交
396 397 398 399 400 401
/*
*  nfs4_file: a file opened by some number of (open) nfs4_stateowners.
*    o fi_perfile list is used to search for conflicting 
*      share_acces, share_deny on the file.
*/
struct nfs4_file {
402
	atomic_t		fi_ref;
L
Linus Torvalds 已提交
403
	struct list_head        fi_hash;    /* hash by "struct inode *" */
404 405
	struct list_head        fi_stateids;
	struct list_head	fi_delegations;
406 407 408
	/* One each for O_RDONLY, O_WRONLY, O_RDWR: */
	struct file *		fi_fds[3];
	/*
409 410 411
	 * Each open or lock stateid contributes 1 to either
	 * fi_access[O_RDONLY], fi_access[O_WRONLY], or both, depending
	 * on open or lock mode:
412
	 */
413
	atomic_t		fi_access[2];
414 415 416
	struct file		*fi_deleg_file;
	struct file_lock	*fi_lease;
	atomic_t		fi_delegees;
L
Linus Torvalds 已提交
417 418 419
	struct inode		*fi_inode;
	u32                     fi_id;      /* used with stateowner->so_id 
					     * for stateid_hashtbl hash */
420
	bool			fi_had_conflict;
L
Linus Torvalds 已提交
421 422
};

423 424 425 426
/* XXX: for first cut may fall back on returning file that doesn't work
 * at all? */
/*
 * Return an open file of @f usable for writing: the O_WRONLY entry of
 * fi_fds if set, otherwise the O_RDWR entry (which may be NULL).
 */
static inline struct file *find_writeable_file(struct nfs4_file *f)
{
	if (f->fi_fds[O_WRONLY])
		return f->fi_fds[O_WRONLY];
	return f->fi_fds[O_RDWR];
}

/*
 * Return an open file of @f usable for reading: the O_RDONLY entry of
 * fi_fds if set, otherwise the O_RDWR entry (which may be NULL).
 */
static inline struct file *find_readable_file(struct nfs4_file *f)
{
	if (f->fi_fds[O_RDONLY])
		return f->fi_fds[O_RDONLY];
	return f->fi_fds[O_RDWR];
}

/*
 * Return any open file of @f, preferring O_RDWR, then O_WRONLY, then
 * O_RDONLY.  The result is NULL when none of the three entries is set.
 */
static inline struct file *find_any_file(struct nfs4_file *f)
{
	if (f->fi_fds[O_RDWR])
		return f->fi_fds[O_RDWR];
	if (f->fi_fds[O_WRONLY])
		return f->fi_fds[O_WRONLY];
	return f->fi_fds[O_RDONLY];
}

L
Linus Torvalds 已提交
449
/*
450
* nfs4_ol_stateid can either be an open stateid or (eventually) a lock stateid
L
Linus Torvalds 已提交
451
*
452
* (open)nfs4_ol_stateid: one per (open)nfs4_stateowner, nfs4_file
L
Linus Torvalds 已提交
453 454 455 456 457 458 459
*
* 	st_hash: stateid_hashtbl[] entry or lockstateid_hashtbl entry
* 	st_perfile: file_hashtbl[] entry.
* 	st_perfile_state: nfs4_stateowner->so_perfilestate
*       st_perlockowner: (open stateid) list of lock nfs4_stateowners
* 	st_access_bmap: used only for open stateid
* 	st_deny_bmap: used only for open stateid
460 461 462 463
*	st_openstp: open stateid lock stateid was derived from
*
* XXX: open stateids and lock stateids have diverged sufficiently that
* we should consider defining separate structs for the two cases.
L
Linus Torvalds 已提交
464 465
*/

466
/* "ol" stands for "Open or Lock".  Better suggestions welcome. */
467 468
struct nfs4_ol_stateid {
	struct nfs4_stid    st_stid;
L
Linus Torvalds 已提交
469
	struct list_head              st_perfile;
470 471
	struct list_head              st_perstateowner;
	struct list_head              st_lockowners;
L
Linus Torvalds 已提交
472 473 474 475
	struct nfs4_stateowner      * st_stateowner;
	struct nfs4_file            * st_file;
	unsigned long                 st_access_bmap;
	unsigned long                 st_deny_bmap;
476
	struct nfs4_ol_stateid         * st_openstp;
L
Linus Torvalds 已提交
477 478
};

479 480 481 482 483
/*
 * Map an embedded nfs4_stid back to the nfs4_ol_stateid containing it.
 * Only valid when @s is the st_stid member of an open or lock stateid;
 * no check is made here.
 */
static inline struct nfs4_ol_stateid *openlockstateid(struct nfs4_stid *s)
{
	struct nfs4_ol_stateid *stp;

	stp = container_of(s, struct nfs4_ol_stateid, st_stid);
	return stp;
}

L
Linus Torvalds 已提交
484 485 486 487
/* flags for preprocess_seqid_op() */
#define RD_STATE	        0x00000010
#define WR_STATE	        0x00000020

488 489 490
struct nfsd4_compound_state;

extern __be32 nfs4_preprocess_stateid_op(struct nfsd4_compound_state *cstate,
L
Linus Torvalds 已提交
491 492 493 494
		stateid_t *stateid, int flags, struct file **filp);
extern void nfs4_lock_state(void);
extern void nfs4_unlock_state(void);
extern int nfs4_in_grace(void);
495
extern __be32 nfs4_check_open_reclaim(clientid_t *clid);
496 497
extern void nfs4_free_openowner(struct nfs4_openowner *);
extern void nfs4_free_lockowner(struct nfs4_lockowner *);
498
extern int set_callback_cred(void);
499
extern void nfsd4_probe_callback(struct nfs4_client *clp);
500
extern void nfsd4_probe_callback_sync(struct nfs4_client *clp);
501
extern void nfsd4_change_callback(struct nfs4_client *clp, struct nfs4_cb_conn *);
502
extern void nfsd4_do_callback_rpc(struct work_struct *);
L
Linus Torvalds 已提交
503
extern void nfsd4_cb_recall(struct nfs4_delegation *dp);
504 505
extern int nfsd4_create_callback_queue(void);
extern void nfsd4_destroy_callback_queue(void);
506
extern void nfsd4_shutdown_callback(struct nfs4_client *);
L
Linus Torvalds 已提交
507
extern void nfs4_put_delegation(struct nfs4_delegation *dp);
508
extern __be32 nfs4_make_rec_clidname(char *clidname, struct xdr_netobj *clname);
509
extern void nfsd4_init_recdir(void);
510 511 512
extern int nfsd4_recdir_load(void);
extern void nfsd4_shutdown_recdir(void);
extern int nfs4_client_to_reclaim(const char *name);
513
extern int nfs4_has_reclaimed_state(const char *name, bool use_exchange_id);
514 515 516
extern void nfsd4_recdir_purge_old(void);
extern int nfsd4_create_clid_dir(struct nfs4_client *clp);
extern void nfsd4_remove_clid_dir(struct nfs4_client *clp);
517
extern void release_session_client(struct nfsd4_session *);
J
J. Bruce Fields 已提交
518
extern __be32 nfs4_validate_stateid(stateid_t *, bool);
519
extern void nfsd4_purge_closed_stateid(struct nfs4_stateowner *);
L
Linus Torvalds 已提交
520 521

#endif   /* _NFSD4_STATE_H */