Blame - ap/os/linux/linux-3.4.x/fs/nfsd/nfs4state.c - T106_DC

blob: 6143a1ea63b1139b2efb0deca3a6899f1d9e7bcb [file] [log] [blame]

lh	9ed821d	2023-04-07 01:36:19 -0700	[diff] [blame]	1	/*
				2	* Copyright (c) 2001 The Regents of the University of Michigan.
				3	* All rights reserved.
				4	*
				5	* Kendrick Smith <kmsmith@umich.edu>
				6	* Andy Adamson <kandros@umich.edu>
				7	*
				8	* Redistribution and use in source and binary forms, with or without
				9	* modification, are permitted provided that the following conditions
				10	* are met:
				11	*
				12	* 1. Redistributions of source code must retain the above copyright
				13	* notice, this list of conditions and the following disclaimer.
				14	* 2. Redistributions in binary form must reproduce the above copyright
				15	* notice, this list of conditions and the following disclaimer in the
				16	* documentation and/or other materials provided with the distribution.
				17	* 3. Neither the name of the University nor the names of its
				18	* contributors may be used to endorse or promote products derived
				19	* from this software without specific prior written permission.
				20	*
				21	* THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED
				22	* WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
				23	* MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
				24	* DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
				25	* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
				26	* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
				27	* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
				28	* BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
				29	* LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
				30	* NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
				31	* SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
				32	*
				33	*/
				34
				35	#include <linux/file.h>
				36	#include <linux/fs.h>
				37	#include <linux/slab.h>
				38	#include <linux/namei.h>
				39	#include <linux/swap.h>
				40	#include <linux/pagemap.h>
				41	#include <linux/sunrpc/svcauth_gss.h>
				42	#include <linux/sunrpc/clnt.h>
				43	#include "xdr4.h"
				44	#include "vfs.h"
				45
				46	#define NFSDDBG_FACILITY NFSDDBG_PROC
				47
				48	/* Globals */
				49	time_t nfsd4_lease = 90; /* default lease time */
				50	time_t nfsd4_grace = 90;
				51	static time_t boot_time;
				52
				53	#define all_ones {{~0,~0},~0}
				54	static const stateid_t one_stateid = {
				55	.si_generation = ~0,
				56	.si_opaque = all_ones,
				57	};
				58	static const stateid_t zero_stateid = {
				59	/* all fields zero */
				60	};
				61	static const stateid_t currentstateid = {
				62	.si_generation = 1,
				63	};
				64
				65	static u64 current_sessionid = 1;
				66
				67	#define ZERO_STATEID(stateid) (!memcmp((stateid), &zero_stateid, sizeof(stateid_t)))
				68	#define ONE_STATEID(stateid) (!memcmp((stateid), &one_stateid, sizeof(stateid_t)))
				69	#define CURRENT_STATEID(stateid) (!memcmp((stateid), &currentstateid, sizeof(stateid_t)))
				70
				71	/* forward declarations */
				72	static int check_for_locks(struct nfs4_file filp, struct nfs4_lockowner lowner);
				73
				74	/* Locking: */
				75
				76	/* Currently used for almost all code touching nfsv4 state: */
				77	static DEFINE_MUTEX(client_mutex);
				78
				79	/*
				80	* Currently used for the del_recall_lru and file hash table. In an
				81	* effort to decrease the scope of the client_mutex, this spinlock may
				82	* eventually cover more:
				83	*/
				84	static DEFINE_SPINLOCK(recall_lock);
				85
				86	static struct kmem_cache *openowner_slab = NULL;
				87	static struct kmem_cache *lockowner_slab = NULL;
				88	static struct kmem_cache *file_slab = NULL;
				89	static struct kmem_cache *stateid_slab = NULL;
				90	static struct kmem_cache *deleg_slab = NULL;
				91
				92	void
				93	nfs4_lock_state(void)
				94	{
				95	mutex_lock(&client_mutex);
				96	}
				97
				98	static void free_session(struct kref *);
				99
				100	/* Must be called under the client_lock */
				101	static void nfsd4_put_session_locked(struct nfsd4_session *ses)
				102	{
				103	kref_put(&ses->se_ref, free_session);
				104	}
				105
				106	static void nfsd4_get_session(struct nfsd4_session *ses)
				107	{
				108	kref_get(&ses->se_ref);
				109	}
				110
				111	void
				112	nfs4_unlock_state(void)
				113	{
				114	mutex_unlock(&client_mutex);
				115	}
				116
				117	static inline u32
				118	opaque_hashval(const void *ptr, int nbytes)
				119	{
				120	unsigned char cptr = (unsigned char ) ptr;
				121
				122	u32 x = 0;
				123	while (nbytes--) {
				124	x *= 37;
				125	x += *cptr++;
				126	}
				127	return x;
				128	}
				129
				130	static struct list_head del_recall_lru;
				131
				132	static void nfsd4_free_file(struct nfs4_file *f)
				133	{
				134	kmem_cache_free(file_slab, f);
				135	}
				136
				137	static inline void
				138	put_nfs4_file(struct nfs4_file *fi)
				139	{
				140	if (atomic_dec_and_lock(&fi->fi_ref, &recall_lock)) {
				141	list_del(&fi->fi_hash);
				142	spin_unlock(&recall_lock);
				143	iput(fi->fi_inode);
				144	nfsd4_free_file(fi);
				145	}
				146	}
				147
				148	static inline void
				149	get_nfs4_file(struct nfs4_file *fi)
				150	{
				151	atomic_inc(&fi->fi_ref);
				152	}
				153
				154	static int num_delegations;
				155	unsigned int max_delegations;
				156
				157	/*
				158	* Open owner state (share locks)
				159	*/
				160
				161	/* hash tables for lock and open owners */
				162	#define OWNER_HASH_BITS 8
				163	#define OWNER_HASH_SIZE (1 << OWNER_HASH_BITS)
				164	#define OWNER_HASH_MASK (OWNER_HASH_SIZE - 1)
				165
				166	static unsigned int ownerstr_hashval(u32 clientid, struct xdr_netobj *ownername)
				167	{
				168	unsigned int ret;
				169
				170	ret = opaque_hashval(ownername->data, ownername->len);
				171	ret += clientid;
				172	return ret & OWNER_HASH_MASK;
				173	}
				174
				175	static struct list_head ownerstr_hashtbl[OWNER_HASH_SIZE];
				176
				177	/* hash table for nfs4_file */
				178	#define FILE_HASH_BITS 8
				179	#define FILE_HASH_SIZE (1 << FILE_HASH_BITS)
				180
				181	static unsigned int file_hashval(struct inode *ino)
				182	{
				183	/* XXX: why are we hashing on inode pointer, anyway? */
				184	return hash_ptr(ino, FILE_HASH_BITS);
				185	}
				186
				187	static struct list_head file_hashtbl[FILE_HASH_SIZE];
				188
				189	static void __nfs4_file_get_access(struct nfs4_file *fp, int oflag)
				190	{
				191	BUG_ON(!(fp->fi_fds[oflag] \|\| fp->fi_fds[O_RDWR]));
				192	atomic_inc(&fp->fi_access[oflag]);
				193	}
				194
				195	static void nfs4_file_get_access(struct nfs4_file *fp, int oflag)
				196	{
				197	if (oflag == O_RDWR) {
				198	__nfs4_file_get_access(fp, O_RDONLY);
				199	__nfs4_file_get_access(fp, O_WRONLY);
				200	} else
				201	__nfs4_file_get_access(fp, oflag);
				202	}
				203
				204	static void nfs4_file_put_fd(struct nfs4_file *fp, int oflag)
				205	{
				206	if (fp->fi_fds[oflag]) {
				207	fput(fp->fi_fds[oflag]);
				208	fp->fi_fds[oflag] = NULL;
				209	}
				210	}
				211
				212	static void __nfs4_file_put_access(struct nfs4_file *fp, int oflag)
				213	{
				214	if (atomic_dec_and_test(&fp->fi_access[oflag])) {
				215	nfs4_file_put_fd(fp, oflag);
				216	if (atomic_read(&fp->fi_access[1 - oflag]) == 0)
				217	nfs4_file_put_fd(fp, O_RDWR);
				218	}
				219	}
				220
				221	static void nfs4_file_put_access(struct nfs4_file *fp, int oflag)
				222	{
				223	if (oflag == O_RDWR) {
				224	__nfs4_file_put_access(fp, O_RDONLY);
				225	__nfs4_file_put_access(fp, O_WRONLY);
				226	} else
				227	__nfs4_file_put_access(fp, oflag);
				228	}
				229
				230	static inline int get_new_stid(struct nfs4_stid *stid)
				231	{
				232	static int min_stateid = 0;
				233	struct idr *stateids = &stid->sc_client->cl_stateids;
				234	int new_stid;
				235	int error;
				236
				237	error = idr_get_new_above(stateids, stid, min_stateid, &new_stid);
				238	/*
				239	* Note: the necessary preallocation was done in
				240	* nfs4_alloc_stateid(). The idr code caps the number of
				241	* preallocations that can exist at a time, but the state lock
				242	* prevents anyone from using ours before we get here:
				243	*/
				244	BUG_ON(error);
				245	/*
				246	* It shouldn't be a problem to reuse an opaque stateid value.
				247	* I don't think it is for 4.1. But with 4.0 I worry that, for
				248	* example, a stray write retransmission could be accepted by
				249	* the server when it should have been rejected. Therefore,
				250	* adopt a trick from the sctp code to attempt to maximize the
				251	* amount of time until an id is reused, by ensuring they always
				252	* "increase" (mod INT_MAX):
				253	*/
				254
				255	min_stateid = new_stid+1;
				256	if (min_stateid == INT_MAX)
				257	min_stateid = 0;
				258	return new_stid;
				259	}
				260
				261	static void init_stid(struct nfs4_stid stid, struct nfs4_client cl, unsigned char type)
				262	{
				263	stateid_t *s = &stid->sc_stateid;
				264	int new_id;
				265
				266	stid->sc_type = type;
				267	stid->sc_client = cl;
				268	s->si_opaque.so_clid = cl->cl_clientid;
				269	new_id = get_new_stid(stid);
				270	s->si_opaque.so_id = (u32)new_id;
				271	/* Will be incremented before return to client: */
				272	s->si_generation = 0;
				273	}
				274
				275	static struct nfs4_stid nfs4_alloc_stid(struct nfs4_client cl, struct kmem_cache *slab)
				276	{
				277	struct idr *stateids = &cl->cl_stateids;
				278
				279	if (!idr_pre_get(stateids, GFP_KERNEL))
				280	return NULL;
				281	/*
				282	* Note: if we fail here (or any time between now and the time
				283	* we actually get the new idr), we won't need to undo the idr
				284	* preallocation, since the idr code caps the number of
				285	* preallocated entries.
				286	*/
				287	return kmem_cache_alloc(slab, GFP_KERNEL);
				288	}
				289
				290	static struct nfs4_ol_stateid * nfs4_alloc_stateid(struct nfs4_client *clp)
				291	{
				292	return openlockstateid(nfs4_alloc_stid(clp, stateid_slab));
				293	}
				294
				295	static struct nfs4_delegation *
				296	alloc_init_deleg(struct nfs4_client clp, struct nfs4_ol_stateid stp, struct svc_fh *current_fh, u32 type)
				297	{
				298	struct nfs4_delegation *dp;
				299	struct nfs4_file *fp = stp->st_file;
				300
				301	dprintk("NFSD alloc_init_deleg\n");
				302	/*
				303	* Major work on the lease subsystem (for example, to support
				304	* calbacks on stat) will be required before we can support
				305	* write delegations properly.
				306	*/
				307	if (type != NFS4_OPEN_DELEGATE_READ)
				308	return NULL;
				309	if (fp->fi_had_conflict)
				310	return NULL;
				311	if (num_delegations > max_delegations)
				312	return NULL;
				313	dp = delegstateid(nfs4_alloc_stid(clp, deleg_slab));
				314	if (dp == NULL)
				315	return dp;
				316	init_stid(&dp->dl_stid, clp, NFS4_DELEG_STID);
				317	/*
				318	* delegation seqid's are never incremented. The 4.1 special
				319	* meaning of seqid 0 isn't meaningful, really, but let's avoid
				320	* 0 anyway just for consistency and use 1:
				321	*/
				322	dp->dl_stid.sc_stateid.si_generation = 1;
				323	num_delegations++;
				324	INIT_LIST_HEAD(&dp->dl_perfile);
				325	INIT_LIST_HEAD(&dp->dl_perclnt);
				326	INIT_LIST_HEAD(&dp->dl_recall_lru);
				327	get_nfs4_file(fp);
				328	dp->dl_file = fp;
				329	dp->dl_type = type;
				330	fh_copy_shallow(&dp->dl_fh, &current_fh->fh_handle);
				331	dp->dl_time = 0;
				332	atomic_set(&dp->dl_count, 1);
				333	INIT_WORK(&dp->dl_recall.cb_work, nfsd4_do_callback_rpc);
				334	return dp;
				335	}
				336
				337	void
				338	nfs4_put_delegation(struct nfs4_delegation *dp)
				339	{
				340	if (atomic_dec_and_test(&dp->dl_count)) {
				341	dprintk("NFSD: freeing dp %p\n",dp);
				342	put_nfs4_file(dp->dl_file);
				343	kmem_cache_free(deleg_slab, dp);
				344	num_delegations--;
				345	}
				346	}
				347
				348	static void nfs4_put_deleg_lease(struct nfs4_file *fp)
				349	{
				350	if (atomic_dec_and_test(&fp->fi_delegees)) {
				351	vfs_setlease(fp->fi_deleg_file, F_UNLCK, &fp->fi_lease);
				352	fp->fi_lease = NULL;
				353	fput(fp->fi_deleg_file);
				354	fp->fi_deleg_file = NULL;
				355	}
				356	}
				357
				358	static void unhash_stid(struct nfs4_stid *s)
				359	{
				360	struct idr *stateids = &s->sc_client->cl_stateids;
				361
				362	idr_remove(stateids, s->sc_stateid.si_opaque.so_id);
				363	}
				364
				365	/* Called under the state lock. */
				366	static void
				367	unhash_delegation(struct nfs4_delegation *dp)
				368	{
				369	unhash_stid(&dp->dl_stid);
				370	list_del_init(&dp->dl_perclnt);
				371	spin_lock(&recall_lock);
				372	list_del_init(&dp->dl_perfile);
				373	list_del_init(&dp->dl_recall_lru);
				374	spin_unlock(&recall_lock);
				375	nfs4_put_deleg_lease(dp->dl_file);
				376	nfs4_put_delegation(dp);
				377	}
				378
				379	/*
				380	* SETCLIENTID state
				381	*/
				382
				383	/* client_lock protects the client lru list and session hash table */
				384	static DEFINE_SPINLOCK(client_lock);
				385
				386	/* Hash tables for nfs4_clientid state */
				387	#define CLIENT_HASH_BITS 4
				388	#define CLIENT_HASH_SIZE (1 << CLIENT_HASH_BITS)
				389	#define CLIENT_HASH_MASK (CLIENT_HASH_SIZE - 1)
				390
				391	static unsigned int clientid_hashval(u32 id)
				392	{
				393	return id & CLIENT_HASH_MASK;
				394	}
				395
				396	static unsigned int clientstr_hashval(const char *name)
				397	{
				398	return opaque_hashval(name, 8) & CLIENT_HASH_MASK;
				399	}
				400
				401	/*
				402	* reclaim_str_hashtbl[] holds known client info from previous reset/reboot
				403	* used in reboot/reset lease grace period processing
				404	*
				405	* conf_id_hashtbl[], and conf_str_hashtbl[] hold confirmed
				406	* setclientid_confirmed info.
				407	*
				408	* unconf_str_hastbl[] and unconf_id_hashtbl[] hold unconfirmed
				409	* setclientid info.
				410	*
				411	* client_lru holds client queue ordered by nfs4_client.cl_time
				412	* for lease renewal.
				413	*
				414	* close_lru holds (open) stateowner queue ordered by nfs4_stateowner.so_time
				415	* for last close replay.
				416	*/
				417	static struct list_head reclaim_str_hashtbl[CLIENT_HASH_SIZE];
				418	static int reclaim_str_hashtbl_size = 0;
				419	static struct list_head conf_id_hashtbl[CLIENT_HASH_SIZE];
				420	static struct list_head conf_str_hashtbl[CLIENT_HASH_SIZE];
				421	static struct list_head unconf_str_hashtbl[CLIENT_HASH_SIZE];
				422	static struct list_head unconf_id_hashtbl[CLIENT_HASH_SIZE];
				423	static struct list_head client_lru;
				424	static struct list_head close_lru;
				425
				426	/*
				427	* We store the NONE, READ, WRITE, and BOTH bits separately in the
				428	* st_{access,deny}_bmap field of the stateid, in order to track not
				429	* only what share bits are currently in force, but also what
				430	* combinations of share bits previous opens have used. This allows us
				431	* to enforce the recommendation of rfc 3530 14.2.19 that the server
				432	* return an error if the client attempt to downgrade to a combination
				433	* of share bits not explicable by closing some of its previous opens.
				434	*
				435	* XXX: This enforcement is actually incomplete, since we don't keep
				436	* track of access/deny bit combinations; so, e.g., we allow:
				437	*
				438	* OPEN allow read, deny write
				439	* OPEN allow both, deny none
				440	* DOWNGRADE allow read, deny none
				441	*
				442	* which we should reject.
				443	*/
				444	static void
				445	set_access(unsigned int *access, unsigned long bmap) {
				446	int i;
				447
				448	*access = 0;
				449	for (i = 1; i < 4; i++) {
				450	if (test_bit(i, &bmap))
				451	*access \|= i;
				452	}
				453	}
				454
				455	static void
				456	set_deny(unsigned int *deny, unsigned long bmap) {
				457	int i;
				458
				459	*deny = 0;
				460	for (i = 0; i < 4; i++) {
				461	if (test_bit(i, &bmap))
				462	*deny \|= i ;
				463	}
				464	}
				465
				466	static int
				467	test_share(struct nfs4_ol_stateid stp, struct nfsd4_open open) {
				468	unsigned int access, deny;
				469
				470	set_access(&access, stp->st_access_bmap);
				471	set_deny(&deny, stp->st_deny_bmap);
				472	if ((access & open->op_share_deny) \|\| (deny & open->op_share_access))
				473	return 0;
				474	return 1;
				475	}
				476
				477	static int nfs4_access_to_omode(u32 access)
				478	{
				479	switch (access & NFS4_SHARE_ACCESS_BOTH) {
				480	case NFS4_SHARE_ACCESS_READ:
				481	return O_RDONLY;
				482	case NFS4_SHARE_ACCESS_WRITE:
				483	return O_WRONLY;
				484	case NFS4_SHARE_ACCESS_BOTH:
				485	return O_RDWR;
				486	}
				487	BUG();
				488	}
				489
				490	static void unhash_generic_stateid(struct nfs4_ol_stateid *stp)
				491	{
				492	list_del(&stp->st_perfile);
				493	list_del(&stp->st_perstateowner);
				494	}
				495
				496	static void close_generic_stateid(struct nfs4_ol_stateid *stp)
				497	{
				498	int i;
				499
				500	if (stp->st_access_bmap) {
				501	for (i = 1; i < 4; i++) {
				502	if (test_bit(i, &stp->st_access_bmap))
				503	nfs4_file_put_access(stp->st_file,
				504	nfs4_access_to_omode(i));
				505	__clear_bit(i, &stp->st_access_bmap);
				506	}
				507	}
				508	put_nfs4_file(stp->st_file);
				509	stp->st_file = NULL;
				510	}
				511
				512	static void free_generic_stateid(struct nfs4_ol_stateid *stp)
				513	{
				514	kmem_cache_free(stateid_slab, stp);
				515	}
				516
				517	static void release_lock_stateid(struct nfs4_ol_stateid *stp)
				518	{
				519	struct file *file;
				520
				521	unhash_generic_stateid(stp);
				522	unhash_stid(&stp->st_stid);
				523	file = find_any_file(stp->st_file);
				524	if (file)
				525	locks_remove_posix(file, (fl_owner_t)lockowner(stp->st_stateowner));
				526	close_generic_stateid(stp);
				527	free_generic_stateid(stp);
				528	}
				529
				530	static void unhash_lockowner(struct nfs4_lockowner *lo)
				531	{
				532	struct nfs4_ol_stateid *stp;
				533
				534	list_del(&lo->lo_owner.so_strhash);
				535	list_del(&lo->lo_perstateid);
				536	list_del(&lo->lo_owner_ino_hash);
				537	while (!list_empty(&lo->lo_owner.so_stateids)) {
				538	stp = list_first_entry(&lo->lo_owner.so_stateids,
				539	struct nfs4_ol_stateid, st_perstateowner);
				540	release_lock_stateid(stp);
				541	}
				542	}
				543
				544	static void release_lockowner(struct nfs4_lockowner *lo)
				545	{
				546	unhash_lockowner(lo);
				547	nfs4_free_lockowner(lo);
				548	}
				549
				550	static void
				551	release_stateid_lockowners(struct nfs4_ol_stateid *open_stp)
				552	{
				553	struct nfs4_lockowner *lo;
				554
				555	while (!list_empty(&open_stp->st_lockowners)) {
				556	lo = list_entry(open_stp->st_lockowners.next,
				557	struct nfs4_lockowner, lo_perstateid);
				558	release_lockowner(lo);
				559	}
				560	}
				561
				562	static void unhash_open_stateid(struct nfs4_ol_stateid *stp)
				563	{
				564	unhash_generic_stateid(stp);
				565	release_stateid_lockowners(stp);
				566	close_generic_stateid(stp);
				567	}
				568
				569	static void release_open_stateid(struct nfs4_ol_stateid *stp)
				570	{
				571	unhash_open_stateid(stp);
				572	unhash_stid(&stp->st_stid);
				573	free_generic_stateid(stp);
				574	}
				575
				576	static void unhash_openowner(struct nfs4_openowner *oo)
				577	{
				578	struct nfs4_ol_stateid *stp;
				579
				580	list_del(&oo->oo_owner.so_strhash);
				581	list_del(&oo->oo_perclient);
				582	while (!list_empty(&oo->oo_owner.so_stateids)) {
				583	stp = list_first_entry(&oo->oo_owner.so_stateids,
				584	struct nfs4_ol_stateid, st_perstateowner);
				585	release_open_stateid(stp);
				586	}
				587	}
				588
				589	static void release_last_closed_stateid(struct nfs4_openowner *oo)
				590	{
				591	struct nfs4_ol_stateid *s = oo->oo_last_closed_stid;
				592
				593	if (s) {
				594	unhash_stid(&s->st_stid);
				595	free_generic_stateid(s);
				596	oo->oo_last_closed_stid = NULL;
				597	}
				598	}
				599
				600	static void release_openowner(struct nfs4_openowner *oo)
				601	{
				602	unhash_openowner(oo);
				603	list_del(&oo->oo_close_lru);
				604	release_last_closed_stateid(oo);
				605	nfs4_free_openowner(oo);
				606	}
				607
				608	#define SESSION_HASH_SIZE 512
				609	static struct list_head sessionid_hashtbl[SESSION_HASH_SIZE];
				610
				611	static inline int
				612	hash_sessionid(struct nfs4_sessionid *sessionid)
				613	{
				614	struct nfsd4_sessionid sid = (struct nfsd4_sessionid )sessionid;
				615
				616	return sid->sequence % SESSION_HASH_SIZE;
				617	}
				618
				619	#ifdef NFSD_DEBUG
				620	static inline void
				621	dump_sessionid(const char fn, struct nfs4_sessionid sessionid)
				622	{
				623	u32 ptr = (u32 )(&sessionid->data[0]);
				624	dprintk("%s: %u:%u:%u:%u\n", fn, ptr[0], ptr[1], ptr[2], ptr[3]);
				625	}
				626	#else
				627	static inline void
				628	dump_sessionid(const char fn, struct nfs4_sessionid sessionid)
				629	{
				630	}
				631	#endif
				632
				633
				634	static void
				635	gen_sessionid(struct nfsd4_session *ses)
				636	{
				637	struct nfs4_client *clp = ses->se_client;
				638	struct nfsd4_sessionid *sid;
				639
				640	sid = (struct nfsd4_sessionid *)ses->se_sessionid.data;
				641	sid->clientid = clp->cl_clientid;
				642	sid->sequence = current_sessionid++;
				643	sid->reserved = 0;
				644	}
				645
				646	/*
				647	* The protocol defines ca_maxresponssize_cached to include the size of
				648	* the rpc header, but all we need to cache is the data starting after
				649	* the end of the initial SEQUENCE operation--the rest we regenerate
				650	* each time. Therefore we can advertise a ca_maxresponssize_cached
				651	* value that is the number of bytes in our cache plus a few additional
				652	* bytes. In order to stay on the safe side, and not promise more than
				653	* we can cache, those additional bytes must be the minimum possible: 24
				654	* bytes of rpc header (xid through accept state, with AUTH_NULL
				655	* verifier), 12 for the compound header (with zero-length tag), and 44
				656	* for the SEQUENCE op response:
				657	*/
				658	#define NFSD_MIN_HDR_SEQ_SZ (24 + 12 + 44)
				659
				660	static void
				661	free_session_slots(struct nfsd4_session *ses)
				662	{
				663	int i;
				664
				665	for (i = 0; i < ses->se_fchannel.maxreqs; i++)
				666	kfree(ses->se_slots[i]);
				667	}
				668
				669	/*
				670	* We don't actually need to cache the rpc and session headers, so we
				671	* can allocate a little less for each slot:
				672	*/
				673	static inline int slot_bytes(struct nfsd4_channel_attrs *ca)
				674	{
				675	return ca->maxresp_cached - NFSD_MIN_HDR_SEQ_SZ;
				676	}
				677
				678	static int nfsd4_sanitize_slot_size(u32 size)
				679	{
				680	size -= NFSD_MIN_HDR_SEQ_SZ; /* We don't cache the rpc header */
				681	size = min_t(u32, size, NFSD_SLOT_CACHE_SIZE);
				682
				683	return size;
				684	}
				685
				686	/*
				687	* XXX: If we run out of reserved DRC memory we could (up to a point)
				688	* re-negotiate active sessions and reduce their slot usage to make
				689	* room for new connections. For now we just fail the create session.
				690	*/
				691	static int nfsd4_get_drc_mem(int slotsize, u32 num)
				692	{
				693	int avail;
				694
				695	num = min_t(u32, num, NFSD_MAX_SLOTS_PER_SESSION);
				696
				697	spin_lock(&nfsd_drc_lock);
				698	avail = min_t(int, NFSD_MAX_MEM_PER_SESSION,
				699	nfsd_drc_max_mem - nfsd_drc_mem_used);
				700	num = min_t(int, num, avail / slotsize);
				701	nfsd_drc_mem_used += num * slotsize;
				702	spin_unlock(&nfsd_drc_lock);
				703
				704	return num;
				705	}
				706
				707	static void nfsd4_put_drc_mem(int slotsize, int num)
				708	{
				709	spin_lock(&nfsd_drc_lock);
				710	nfsd_drc_mem_used -= slotsize * num;
				711	spin_unlock(&nfsd_drc_lock);
				712	}
				713
				714	static struct nfsd4_session *alloc_session(int slotsize, int numslots)
				715	{
				716	struct nfsd4_session *new;
				717	int mem, i;
				718
				719	BUILD_BUG_ON(NFSD_MAX_SLOTS_PER_SESSION * sizeof(struct nfsd4_slot *)
				720	+ sizeof(struct nfsd4_session) > PAGE_SIZE);
				721	mem = numslots * sizeof(struct nfsd4_slot *);
				722
				723	new = kzalloc(sizeof(*new) + mem, GFP_KERNEL);
				724	if (!new)
				725	return NULL;
				726	/* allocate each struct nfsd4_slot and data cache in one piece */
				727	for (i = 0; i < numslots; i++) {
				728	mem = sizeof(struct nfsd4_slot) + slotsize;
				729	new->se_slots[i] = kzalloc(mem, GFP_KERNEL);
				730	if (!new->se_slots[i])
				731	goto out_free;
				732	}
				733	return new;
				734	out_free:
				735	while (i--)
				736	kfree(new->se_slots[i]);
				737	kfree(new);
				738	return NULL;
				739	}
				740
				741	static void init_forechannel_attrs(struct nfsd4_channel_attrs new, struct nfsd4_channel_attrs req, int numslots, int slotsize)
				742	{
				743	u32 maxrpc = nfsd_serv->sv_max_mesg;
				744
				745	new->maxreqs = numslots;
				746	new->maxresp_cached = min_t(u32, req->maxresp_cached,
				747	slotsize + NFSD_MIN_HDR_SEQ_SZ);
				748	new->maxreq_sz = min_t(u32, req->maxreq_sz, maxrpc);
				749	new->maxresp_sz = min_t(u32, req->maxresp_sz, maxrpc);
				750	new->maxops = min_t(u32, req->maxops, NFSD_MAX_OPS_PER_COMPOUND);
				751	}
				752
				753	static void free_conn(struct nfsd4_conn *c)
				754	{
				755	svc_xprt_put(c->cn_xprt);
				756	kfree(c);
				757	}
				758
				759	static void nfsd4_conn_lost(struct svc_xpt_user *u)
				760	{
				761	struct nfsd4_conn *c = container_of(u, struct nfsd4_conn, cn_xpt_user);
				762	struct nfs4_client *clp = c->cn_session->se_client;
				763
				764	spin_lock(&clp->cl_lock);
				765	if (!list_empty(&c->cn_persession)) {
				766	list_del(&c->cn_persession);
				767	free_conn(c);
				768	}
				769	spin_unlock(&clp->cl_lock);
				770	nfsd4_probe_callback(clp);
				771	}
				772
				773	static struct nfsd4_conn alloc_conn(struct svc_rqst rqstp, u32 flags)
				774	{
				775	struct nfsd4_conn *conn;
				776
				777	conn = kmalloc(sizeof(struct nfsd4_conn), GFP_KERNEL);
				778	if (!conn)
				779	return NULL;
				780	svc_xprt_get(rqstp->rq_xprt);
				781	conn->cn_xprt = rqstp->rq_xprt;
				782	conn->cn_flags = flags;
				783	INIT_LIST_HEAD(&conn->cn_xpt_user.list);
				784	return conn;
				785	}
				786
				787	static void __nfsd4_hash_conn(struct nfsd4_conn conn, struct nfsd4_session ses)
				788	{
				789	conn->cn_session = ses;
				790	list_add(&conn->cn_persession, &ses->se_conns);
				791	}
				792
				793	static void nfsd4_hash_conn(struct nfsd4_conn conn, struct nfsd4_session ses)
				794	{
				795	struct nfs4_client *clp = ses->se_client;
				796
				797	spin_lock(&clp->cl_lock);
				798	__nfsd4_hash_conn(conn, ses);
				799	spin_unlock(&clp->cl_lock);
				800	}
				801
				802	static int nfsd4_register_conn(struct nfsd4_conn *conn)
				803	{
				804	conn->cn_xpt_user.callback = nfsd4_conn_lost;
				805	return register_xpt_user(conn->cn_xprt, &conn->cn_xpt_user);
				806	}
				807
				808	static __be32 nfsd4_new_conn(struct svc_rqst rqstp, struct nfsd4_session ses, u32 dir)
				809	{
				810	struct nfsd4_conn *conn;
				811	int ret;
				812
				813	conn = alloc_conn(rqstp, dir);
				814	if (!conn)
				815	return nfserr_jukebox;
				816	nfsd4_hash_conn(conn, ses);
				817	ret = nfsd4_register_conn(conn);
				818	if (ret)
				819	/* oops; xprt is already down: */
				820	nfsd4_conn_lost(&conn->cn_xpt_user);
				821	return nfs_ok;
				822	}
				823
				824	static __be32 nfsd4_new_conn_from_crses(struct svc_rqst rqstp, struct nfsd4_session ses)
				825	{
				826	u32 dir = NFS4_CDFC4_FORE;
				827
				828	if (ses->se_flags & SESSION4_BACK_CHAN)
				829	dir \|= NFS4_CDFC4_BACK;
				830
				831	return nfsd4_new_conn(rqstp, ses, dir);
				832	}
				833
				834	/* must be called under client_lock */
				835	static void nfsd4_del_conns(struct nfsd4_session *s)
				836	{
				837	struct nfs4_client *clp = s->se_client;
				838	struct nfsd4_conn *c;
				839
				840	spin_lock(&clp->cl_lock);
				841	while (!list_empty(&s->se_conns)) {
				842	c = list_first_entry(&s->se_conns, struct nfsd4_conn, cn_persession);
				843	list_del_init(&c->cn_persession);
				844	spin_unlock(&clp->cl_lock);
				845
				846	unregister_xpt_user(c->cn_xprt, &c->cn_xpt_user);
				847	free_conn(c);
				848
				849	spin_lock(&clp->cl_lock);
				850	}
				851	spin_unlock(&clp->cl_lock);
				852	}
				853
				854	static void free_session(struct kref *kref)
				855	{
				856	struct nfsd4_session *ses;
				857	int mem;
				858
				859	lockdep_assert_held(&client_lock);
				860	ses = container_of(kref, struct nfsd4_session, se_ref);
				861	nfsd4_del_conns(ses);
				862	spin_lock(&nfsd_drc_lock);
				863	mem = ses->se_fchannel.maxreqs * slot_bytes(&ses->se_fchannel);
				864	nfsd_drc_mem_used -= mem;
				865	spin_unlock(&nfsd_drc_lock);
				866	free_session_slots(ses);
				867	kfree(ses);
				868	}
				869
				870	void nfsd4_put_session(struct nfsd4_session *ses)
				871	{
				872	spin_lock(&client_lock);
				873	nfsd4_put_session_locked(ses);
				874	spin_unlock(&client_lock);
				875	}
				876
				877	static struct nfsd4_session alloc_init_session(struct svc_rqst rqstp, struct nfs4_client clp, struct nfsd4_create_session cses)
				878	{
				879	struct nfsd4_session *new;
				880	struct nfsd4_channel_attrs *fchan = &cses->fore_channel;
				881	int numslots, slotsize;
				882	int status;
				883	int idx;
				884
				885	/*
				886	* Note decreasing slot size below client's request may
				887	* make it difficult for client to function correctly, whereas
				888	* decreasing the number of slots will (just?) affect
				889	* performance. When short on memory we therefore prefer to
				890	* decrease number of slots instead of their size.
				891	*/
				892	slotsize = nfsd4_sanitize_slot_size(fchan->maxresp_cached);
				893	numslots = nfsd4_get_drc_mem(slotsize, fchan->maxreqs);
				894	if (numslots < 1)
				895	return NULL;
				896
				897	new = alloc_session(slotsize, numslots);
				898	if (!new) {
				899	nfsd4_put_drc_mem(slotsize, fchan->maxreqs);
				900	return NULL;
				901	}
				902	init_forechannel_attrs(&new->se_fchannel, fchan, numslots, slotsize);
				903
				904	new->se_client = clp;
				905	gen_sessionid(new);
				906
				907	INIT_LIST_HEAD(&new->se_conns);
				908
				909	new->se_cb_seq_nr = 1;
				910	new->se_flags = cses->flags;
				911	new->se_cb_prog = cses->callback_prog;
				912	kref_init(&new->se_ref);
				913	idx = hash_sessionid(&new->se_sessionid);
				914	spin_lock(&client_lock);
				915	list_add(&new->se_hash, &sessionid_hashtbl[idx]);
				916	spin_lock(&clp->cl_lock);
				917	list_add(&new->se_perclnt, &clp->cl_sessions);
				918	spin_unlock(&clp->cl_lock);
				919	spin_unlock(&client_lock);
				920
				921	status = nfsd4_new_conn_from_crses(rqstp, new);
				922	/* whoops: benny points out, status is ignored! (err, or bogus) */
				923	if (status) {
				924	spin_lock(&client_lock);
				925	free_session(&new->se_ref);
				926	spin_unlock(&client_lock);
				927	return NULL;
				928	}
				929	if (cses->flags & SESSION4_BACK_CHAN) {
				930	struct sockaddr *sa = svc_addr(rqstp);
				931	/*
				932	* This is a little silly; with sessions there's no real
				933	* use for the callback address. Use the peer address
				934	* as a reasonable default for now, but consider fixing
				935	* the rpc client not to require an address in the
				936	* future:
				937	*/
				938	rpc_copy_addr((struct sockaddr *)&clp->cl_cb_conn.cb_addr, sa);
				939	clp->cl_cb_conn.cb_addrlen = svc_addr_len(sa);
				940	}
				941	nfsd4_probe_callback(clp);
				942	return new;
				943	}
				944
				945	/* caller must hold client_lock */
				946	static struct nfsd4_session *
				947	find_in_sessionid_hashtbl(struct nfs4_sessionid *sessionid)
				948	{
				949	struct nfsd4_session *elem;
				950	int idx;
				951
				952	dump_sessionid(__func__, sessionid);
				953	idx = hash_sessionid(sessionid);
				954	/* Search in the appropriate list */
				955	list_for_each_entry(elem, &sessionid_hashtbl[idx], se_hash) {
				956	if (!memcmp(elem->se_sessionid.data, sessionid->data,
				957	NFS4_MAX_SESSIONID_LEN)) {
				958	return elem;
				959	}
				960	}
				961
				962	dprintk("%s: session not found\n", __func__);
				963	return NULL;
				964	}
				965
				966	/* caller must hold client_lock */
				967	static void
				968	unhash_session(struct nfsd4_session *ses)
				969	{
				970	list_del(&ses->se_hash);
				971	spin_lock(&ses->se_client->cl_lock);
				972	list_del(&ses->se_perclnt);
				973	spin_unlock(&ses->se_client->cl_lock);
				974	}
				975
				976	/* must be called under the client_lock */
				977	static inline void
				978	renew_client_locked(struct nfs4_client *clp)
				979	{
				980	if (is_client_expired(clp)) {
				981	dprintk("%s: client (clientid %08x/%08x) already expired\n",
				982	__func__,
				983	clp->cl_clientid.cl_boot,
				984	clp->cl_clientid.cl_id);
				985	return;
				986	}
				987
				988	dprintk("renewing client (clientid %08x/%08x)\n",
				989	clp->cl_clientid.cl_boot,
				990	clp->cl_clientid.cl_id);
				991	list_move_tail(&clp->cl_lru, &client_lru);
				992	clp->cl_time = get_seconds();
				993	}
				994
				995	static inline void
				996	renew_client(struct nfs4_client *clp)
				997	{
				998	spin_lock(&client_lock);
				999	renew_client_locked(clp);
				1000	spin_unlock(&client_lock);
				1001	}
				1002
				1003	/* SETCLIENTID and SETCLIENTID_CONFIRM Helper functions */
				1004	static int
				1005	STALE_CLIENTID(clientid_t *clid)
				1006	{
				1007	if (clid->cl_boot == boot_time)
				1008	return 0;
				1009	dprintk("NFSD stale clientid (%08x/%08x) boot_time %08lx\n",
				1010	clid->cl_boot, clid->cl_id, boot_time);
				1011	return 1;
				1012	}
				1013
				1014	/*
				1015	* XXX Should we use a slab cache ?
				1016	* This type of memory management is somewhat inefficient, but we use it
				1017	* anyway since SETCLIENTID is not a common operation.
				1018	*/
				1019	static struct nfs4_client *alloc_client(struct xdr_netobj name)
				1020	{
				1021	struct nfs4_client *clp;
				1022
				1023	clp = kzalloc(sizeof(struct nfs4_client), GFP_KERNEL);
				1024	if (clp == NULL)
				1025	return NULL;
				1026	clp->cl_name.data = kmemdup(name.data, name.len, GFP_KERNEL);
				1027	if (clp->cl_name.data == NULL) {
				1028	kfree(clp);
				1029	return NULL;
				1030	}
				1031	clp->cl_name.len = name.len;
				1032	return clp;
				1033	}
				1034
				1035	static inline void
				1036	free_client(struct nfs4_client *clp)
				1037	{
				1038	lockdep_assert_held(&client_lock);
				1039	while (!list_empty(&clp->cl_sessions)) {
				1040	struct nfsd4_session *ses;
				1041	ses = list_entry(clp->cl_sessions.next, struct nfsd4_session,
				1042	se_perclnt);
				1043	list_del(&ses->se_perclnt);
				1044	nfsd4_put_session_locked(ses);
				1045	}
				1046	if (clp->cl_cred.cr_group_info)
				1047	put_group_info(clp->cl_cred.cr_group_info);
				1048	kfree(clp->cl_principal);
				1049	kfree(clp->cl_name.data);
				1050	idr_remove_all(&clp->cl_stateids);
				1051	idr_destroy(&clp->cl_stateids);
				1052	kfree(clp);
				1053	}
				1054
				1055	void
				1056	release_session_client(struct nfsd4_session *session)
				1057	{
				1058	struct nfs4_client *clp = session->se_client;
				1059
				1060	if (!atomic_dec_and_lock(&clp->cl_refcount, &client_lock))
				1061	return;
				1062	if (is_client_expired(clp)) {
				1063	free_client(clp);
				1064	session->se_client = NULL;
				1065	} else
				1066	renew_client_locked(clp);
				1067	spin_unlock(&client_lock);
				1068	}
				1069
				1070	/* must be called under the client_lock */
				1071	static inline void
				1072	unhash_client_locked(struct nfs4_client *clp)
				1073	{
				1074	struct nfsd4_session *ses;
				1075
				1076	mark_client_expired(clp);
				1077	list_del(&clp->cl_lru);
				1078	spin_lock(&clp->cl_lock);
				1079	list_for_each_entry(ses, &clp->cl_sessions, se_perclnt)
				1080	list_del_init(&ses->se_hash);
				1081	spin_unlock(&clp->cl_lock);
				1082	}
				1083
				1084	static void
				1085	expire_client(struct nfs4_client *clp)
				1086	{
				1087	struct nfs4_openowner *oo;
				1088	struct nfs4_delegation *dp;
				1089	struct list_head reaplist;
				1090
				1091	INIT_LIST_HEAD(&reaplist);
				1092	spin_lock(&recall_lock);
				1093	while (!list_empty(&clp->cl_delegations)) {
				1094	dp = list_entry(clp->cl_delegations.next, struct nfs4_delegation, dl_perclnt);
				1095	list_del_init(&dp->dl_perclnt);
				1096	list_move(&dp->dl_recall_lru, &reaplist);
				1097	}
				1098	spin_unlock(&recall_lock);
				1099	while (!list_empty(&reaplist)) {
				1100	dp = list_entry(reaplist.next, struct nfs4_delegation, dl_recall_lru);
				1101	unhash_delegation(dp);
				1102	}
				1103	while (!list_empty(&clp->cl_openowners)) {
				1104	oo = list_entry(clp->cl_openowners.next, struct nfs4_openowner, oo_perclient);
				1105	release_openowner(oo);
				1106	}
				1107	nfsd4_shutdown_callback(clp);
				1108	if (clp->cl_cb_conn.cb_xprt)
				1109	svc_xprt_put(clp->cl_cb_conn.cb_xprt);
				1110	list_del(&clp->cl_idhash);
				1111	list_del(&clp->cl_strhash);
				1112	spin_lock(&client_lock);
				1113	unhash_client_locked(clp);
				1114	if (atomic_read(&clp->cl_refcount) == 0)
				1115	free_client(clp);
				1116	spin_unlock(&client_lock);
				1117	}
				1118
				1119	static void copy_verf(struct nfs4_client target, nfs4_verifier source)
				1120	{
				1121	memcpy(target->cl_verifier.data, source->data,
				1122	sizeof(target->cl_verifier.data));
				1123	}
				1124
				1125	static void copy_clid(struct nfs4_client target, struct nfs4_client source)
				1126	{
				1127	target->cl_clientid.cl_boot = source->cl_clientid.cl_boot;
				1128	target->cl_clientid.cl_id = source->cl_clientid.cl_id;
				1129	}
				1130
				1131	static void copy_cred(struct svc_cred target, struct svc_cred source)
				1132	{
				1133	target->cr_uid = source->cr_uid;
				1134	target->cr_gid = source->cr_gid;
				1135	target->cr_group_info = source->cr_group_info;
				1136	get_group_info(target->cr_group_info);
				1137	}
				1138
				1139	static int same_name(const char n1, const char n2)
				1140	{
				1141	return 0 == memcmp(n1, n2, HEXDIR_LEN);
				1142	}
				1143
				1144	static int
				1145	same_verf(nfs4_verifier v1, nfs4_verifier v2)
				1146	{
				1147	return 0 == memcmp(v1->data, v2->data, sizeof(v1->data));
				1148	}
				1149
				1150	static int
				1151	same_clid(clientid_t cl1, clientid_t cl2)
				1152	{
				1153	return (cl1->cl_boot == cl2->cl_boot) && (cl1->cl_id == cl2->cl_id);
				1154	}
				1155
				1156	/* XXX what about NGROUP */
				1157	static int
				1158	same_creds(struct svc_cred cr1, struct svc_cred cr2)
				1159	{
				1160	return cr1->cr_uid == cr2->cr_uid;
				1161	}
				1162
				1163	static void gen_clid(struct nfs4_client *clp)
				1164	{
				1165	static u32 current_clientid = 1;
				1166
				1167	clp->cl_clientid.cl_boot = boot_time;
				1168	clp->cl_clientid.cl_id = current_clientid++;
				1169	}
				1170
				1171	static void gen_confirm(struct nfs4_client *clp)
				1172	{
				1173	__be32 verf[2];
				1174	static u32 i;
				1175
				1176	verf[0] = (__be32)get_seconds();
				1177	verf[1] = (__be32)i++;
				1178	memcpy(clp->cl_confirm.data, verf, sizeof(clp->cl_confirm.data));
				1179	}
				1180
				1181	static struct nfs4_stid find_stateid(struct nfs4_client cl, stateid_t *t)
				1182	{
				1183	return idr_find(&cl->cl_stateids, t->si_opaque.so_id);
				1184	}
				1185
				1186	static struct nfs4_stid find_stateid_by_type(struct nfs4_client cl, stateid_t *t, char typemask)
				1187	{
				1188	struct nfs4_stid *s;
				1189
				1190	s = find_stateid(cl, t);
				1191	if (!s)
				1192	return NULL;
				1193	if (typemask & s->sc_type)
				1194	return s;
				1195	return NULL;
				1196	}
				1197
				1198	static struct nfs4_client create_client(struct xdr_netobj name, char recdir,
				1199	struct svc_rqst rqstp, nfs4_verifier verf)
				1200	{
				1201	struct nfs4_client *clp;
				1202	struct sockaddr *sa = svc_addr(rqstp);
				1203	char *princ;
				1204
				1205	clp = alloc_client(name);
				1206	if (clp == NULL)
				1207	return NULL;
				1208
				1209	INIT_LIST_HEAD(&clp->cl_sessions);
				1210
				1211	princ = svc_gss_principal(rqstp);
				1212	if (princ) {
				1213	clp->cl_principal = kstrdup(princ, GFP_KERNEL);
				1214	if (clp->cl_principal == NULL) {
				1215	spin_lock(&client_lock);
				1216	free_client(clp);
				1217	spin_unlock(&client_lock);
				1218	return NULL;
				1219	}
				1220	}
				1221
				1222	idr_init(&clp->cl_stateids);
				1223	memcpy(clp->cl_recdir, recdir, HEXDIR_LEN);
				1224	atomic_set(&clp->cl_refcount, 0);
				1225	clp->cl_cb_state = NFSD4_CB_UNKNOWN;
				1226	INIT_LIST_HEAD(&clp->cl_idhash);
				1227	INIT_LIST_HEAD(&clp->cl_strhash);
				1228	INIT_LIST_HEAD(&clp->cl_openowners);
				1229	INIT_LIST_HEAD(&clp->cl_delegations);
				1230	INIT_LIST_HEAD(&clp->cl_lru);
				1231	INIT_LIST_HEAD(&clp->cl_callbacks);
				1232	spin_lock_init(&clp->cl_lock);
				1233	INIT_WORK(&clp->cl_cb_null.cb_work, nfsd4_do_callback_rpc);
				1234	clp->cl_time = get_seconds();
				1235	clear_bit(0, &clp->cl_cb_slot_busy);
				1236	rpc_init_wait_queue(&clp->cl_cb_waitq, "Backchannel slot table");
				1237	copy_verf(clp, verf);
				1238	rpc_copy_addr((struct sockaddr *) &clp->cl_addr, sa);
				1239	clp->cl_flavor = rqstp->rq_flavor;
				1240	copy_cred(&clp->cl_cred, &rqstp->rq_cred);
				1241	gen_confirm(clp);
				1242	clp->cl_cb_session = NULL;
				1243	return clp;
				1244	}
				1245
				1246	static void
				1247	add_to_unconfirmed(struct nfs4_client *clp, unsigned int strhashval)
				1248	{
				1249	unsigned int idhashval;
				1250
				1251	list_add(&clp->cl_strhash, &unconf_str_hashtbl[strhashval]);
				1252	idhashval = clientid_hashval(clp->cl_clientid.cl_id);
				1253	list_add(&clp->cl_idhash, &unconf_id_hashtbl[idhashval]);
				1254	renew_client(clp);
				1255	}
				1256
				1257	static void
				1258	move_to_confirmed(struct nfs4_client *clp)
				1259	{
				1260	unsigned int idhashval = clientid_hashval(clp->cl_clientid.cl_id);
				1261	unsigned int strhashval;
				1262
				1263	dprintk("NFSD: move_to_confirm nfs4_client %p\n", clp);
				1264	list_move(&clp->cl_idhash, &conf_id_hashtbl[idhashval]);
				1265	strhashval = clientstr_hashval(clp->cl_recdir);
				1266	list_move(&clp->cl_strhash, &conf_str_hashtbl[strhashval]);
				1267	renew_client(clp);
				1268	}
				1269
				1270	static struct nfs4_client *
				1271	find_confirmed_client(clientid_t *clid)
				1272	{
				1273	struct nfs4_client *clp;
				1274	unsigned int idhashval = clientid_hashval(clid->cl_id);
				1275
				1276	list_for_each_entry(clp, &conf_id_hashtbl[idhashval], cl_idhash) {
				1277	if (same_clid(&clp->cl_clientid, clid)) {
				1278	renew_client(clp);
				1279	return clp;
				1280	}
				1281	}
				1282	return NULL;
				1283	}
				1284
				1285	static struct nfs4_client *
				1286	find_unconfirmed_client(clientid_t *clid)
				1287	{
				1288	struct nfs4_client *clp;
				1289	unsigned int idhashval = clientid_hashval(clid->cl_id);
				1290
				1291	list_for_each_entry(clp, &unconf_id_hashtbl[idhashval], cl_idhash) {
				1292	if (same_clid(&clp->cl_clientid, clid))
				1293	return clp;
				1294	}
				1295	return NULL;
				1296	}
				1297
				1298	static bool clp_used_exchangeid(struct nfs4_client *clp)
				1299	{
				1300	return clp->cl_exchange_flags != 0;
				1301	}
				1302
				1303	static struct nfs4_client *
				1304	find_confirmed_client_by_str(const char *dname, unsigned int hashval)
				1305	{
				1306	struct nfs4_client *clp;
				1307
				1308	list_for_each_entry(clp, &conf_str_hashtbl[hashval], cl_strhash) {
				1309	if (same_name(clp->cl_recdir, dname))
				1310	return clp;
				1311	}
				1312	return NULL;
				1313	}
				1314
				1315	static struct nfs4_client *
				1316	find_unconfirmed_client_by_str(const char *dname, unsigned int hashval)
				1317	{
				1318	struct nfs4_client *clp;
				1319
				1320	list_for_each_entry(clp, &unconf_str_hashtbl[hashval], cl_strhash) {
				1321	if (same_name(clp->cl_recdir, dname))
				1322	return clp;
				1323	}
				1324	return NULL;
				1325	}
				1326
				1327	static void
				1328	gen_callback(struct nfs4_client clp, struct nfsd4_setclientid se, struct svc_rqst *rqstp)
				1329	{
				1330	struct nfs4_cb_conn *conn = &clp->cl_cb_conn;
				1331	struct sockaddr *sa = svc_addr(rqstp);
				1332	u32 scopeid = rpc_get_scope_id(sa);
				1333	unsigned short expected_family;
				1334
				1335	/* Currently, we only support tcp and tcp6 for the callback channel */
				1336	if (se->se_callback_netid_len == 3 &&
				1337	!memcmp(se->se_callback_netid_val, "tcp", 3))
				1338	expected_family = AF_INET;
				1339	else if (se->se_callback_netid_len == 4 &&
				1340	!memcmp(se->se_callback_netid_val, "tcp6", 4))
				1341	expected_family = AF_INET6;
				1342	else
				1343	goto out_err;
				1344
				1345	conn->cb_addrlen = rpc_uaddr2sockaddr(&init_net, se->se_callback_addr_val,
				1346	se->se_callback_addr_len,
				1347	(struct sockaddr *)&conn->cb_addr,
				1348	sizeof(conn->cb_addr));
				1349
				1350	if (!conn->cb_addrlen \|\| conn->cb_addr.ss_family != expected_family)
				1351	goto out_err;
				1352
				1353	if (conn->cb_addr.ss_family == AF_INET6)
				1354	((struct sockaddr_in6 *)&conn->cb_addr)->sin6_scope_id = scopeid;
				1355
				1356	conn->cb_prog = se->se_callback_prog;
				1357	conn->cb_ident = se->se_callback_ident;
				1358	memcpy(&conn->cb_saddr, &rqstp->rq_daddr, rqstp->rq_daddrlen);
				1359	return;
				1360	out_err:
				1361	conn->cb_addr.ss_family = AF_UNSPEC;
				1362	conn->cb_addrlen = 0;
				1363	dprintk(KERN_INFO "NFSD: this client (clientid %08x/%08x) "
				1364	"will not receive delegations\n",
				1365	clp->cl_clientid.cl_boot, clp->cl_clientid.cl_id);
				1366
				1367	return;
				1368	}
				1369
				1370	/*
				1371	* Cache a reply. nfsd4_check_drc_limit() has bounded the cache size.
				1372	*/
				1373	void
				1374	nfsd4_store_cache_entry(struct nfsd4_compoundres *resp)
				1375	{
				1376	struct nfsd4_slot *slot = resp->cstate.slot;
				1377	unsigned int base;
				1378
				1379	dprintk("--> %s slot %p\n", __func__, slot);
				1380
				1381	slot->sl_opcnt = resp->opcnt;
				1382	slot->sl_status = resp->cstate.status;
				1383
				1384	slot->sl_flags \|= NFSD4_SLOT_INITIALIZED;
				1385	if (nfsd4_not_cached(resp)) {
				1386	slot->sl_datalen = 0;
				1387	return;
				1388	}
				1389	slot->sl_datalen = (char )resp->p - (char )resp->cstate.datap;
				1390	base = (char *)resp->cstate.datap -
				1391	(char *)resp->xbuf->head[0].iov_base;
				1392	if (read_bytes_from_xdr_buf(resp->xbuf, base, slot->sl_data,
				1393	slot->sl_datalen))
				1394	WARN("%s: sessions DRC could not cache compound\n", __func__);
				1395	return;
				1396	}
				1397
				1398	/*
				1399	* Encode the replay sequence operation from the slot values.
				1400	* If cachethis is FALSE encode the uncached rep error on the next
				1401	* operation which sets resp->p and increments resp->opcnt for
				1402	* nfs4svc_encode_compoundres.
				1403	*
				1404	*/
				1405	static __be32
				1406	nfsd4_enc_sequence_replay(struct nfsd4_compoundargs *args,
				1407	struct nfsd4_compoundres *resp)
				1408	{
				1409	struct nfsd4_op *op;
				1410	struct nfsd4_slot *slot = resp->cstate.slot;
				1411
				1412	/* Encode the replayed sequence operation */
				1413	op = &args->ops[resp->opcnt - 1];
				1414	nfsd4_encode_operation(resp, op);
				1415
				1416	/* Return nfserr_retry_uncached_rep in next operation. */
				1417	if (args->opcnt > 1 && !(slot->sl_flags & NFSD4_SLOT_CACHETHIS)) {
				1418	op = &args->ops[resp->opcnt++];
				1419	op->status = nfserr_retry_uncached_rep;
				1420	nfsd4_encode_operation(resp, op);
				1421	}
				1422	return op->status;
				1423	}
				1424
				1425	/*
				1426	* The sequence operation is not cached because we can use the slot and
				1427	* session values.
				1428	*/
				1429	__be32
				1430	nfsd4_replay_cache_entry(struct nfsd4_compoundres *resp,
				1431	struct nfsd4_sequence *seq)
				1432	{
				1433	struct nfsd4_slot *slot = resp->cstate.slot;
				1434	__be32 status;
				1435
				1436	dprintk("--> %s slot %p\n", __func__, slot);
				1437
				1438	/* Either returns 0 or nfserr_retry_uncached */
				1439	status = nfsd4_enc_sequence_replay(resp->rqstp->rq_argp, resp);
				1440	if (status == nfserr_retry_uncached_rep)
				1441	return status;
				1442
				1443	/* The sequence operation has been encoded, cstate->datap set. */
				1444	memcpy(resp->cstate.datap, slot->sl_data, slot->sl_datalen);
				1445
				1446	resp->opcnt = slot->sl_opcnt;
				1447	resp->p = resp->cstate.datap + XDR_QUADLEN(slot->sl_datalen);
				1448	status = slot->sl_status;
				1449
				1450	return status;
				1451	}
				1452
				1453	/*
				1454	* Set the exchange_id flags returned by the server.
				1455	*/
				1456	static void
				1457	nfsd4_set_ex_flags(struct nfs4_client new, struct nfsd4_exchange_id clid)
				1458	{
				1459	/* pNFS is not supported */
				1460	new->cl_exchange_flags \|= EXCHGID4_FLAG_USE_NON_PNFS;
				1461
				1462	/* Referrals are supported, Migration is not. */
				1463	new->cl_exchange_flags \|= EXCHGID4_FLAG_SUPP_MOVED_REFER;
				1464
				1465	/* set the wire flags to return to client. */
				1466	clid->flags = new->cl_exchange_flags;
				1467	}
				1468
				1469	__be32
				1470	nfsd4_exchange_id(struct svc_rqst *rqstp,
				1471	struct nfsd4_compound_state *cstate,
				1472	struct nfsd4_exchange_id *exid)
				1473	{
				1474	struct nfs4_client unconf, conf, *new;
				1475	int status;
				1476	unsigned int strhashval;
				1477	char dname[HEXDIR_LEN];
				1478	char addr_str[INET6_ADDRSTRLEN];
				1479	nfs4_verifier verf = exid->verifier;
				1480	struct sockaddr *sa = svc_addr(rqstp);
				1481
				1482	rpc_ntop(sa, addr_str, sizeof(addr_str));
				1483	dprintk("%s rqstp=%p exid=%p clname.len=%u clname.data=%p "
				1484	"ip_addr=%s flags %x, spa_how %d\n",
				1485	__func__, rqstp, exid, exid->clname.len, exid->clname.data,
				1486	addr_str, exid->flags, exid->spa_how);
				1487
				1488	if (exid->flags & ~EXCHGID4_FLAG_MASK_A)
				1489	return nfserr_inval;
				1490
				1491	/* Currently only support SP4_NONE */
				1492	switch (exid->spa_how) {
				1493	case SP4_NONE:
				1494	break;
				1495	case SP4_SSV:
				1496	return nfserr_serverfault;
				1497	default:
				1498	BUG(); /* checked by xdr code */
				1499	case SP4_MACH_CRED:
				1500	return nfserr_serverfault; /* no excuse :-/ */
				1501	}
				1502
				1503	status = nfs4_make_rec_clidname(dname, &exid->clname);
				1504
				1505	if (status)
				1506	goto error;
				1507
				1508	strhashval = clientstr_hashval(dname);
				1509
				1510	nfs4_lock_state();
				1511	status = nfs_ok;
				1512
				1513	conf = find_confirmed_client_by_str(dname, strhashval);
				1514	if (conf) {
				1515	if (!clp_used_exchangeid(conf)) {
				1516	status = nfserr_clid_inuse; /* XXX: ? */
				1517	goto out;
				1518	}
				1519	if (!same_verf(&verf, &conf->cl_verifier)) {
				1520	/* 18.35.4 case 8 */
				1521	if (exid->flags & EXCHGID4_FLAG_UPD_CONFIRMED_REC_A) {
				1522	status = nfserr_not_same;
				1523	goto out;
				1524	}
				1525	/* Client reboot: destroy old state */
				1526	expire_client(conf);
				1527	goto out_new;
				1528	}
				1529	if (!same_creds(&conf->cl_cred, &rqstp->rq_cred)) {
				1530	/* 18.35.4 case 9 */
				1531	if (exid->flags & EXCHGID4_FLAG_UPD_CONFIRMED_REC_A) {
				1532	status = nfserr_perm;
				1533	goto out;
				1534	}
				1535	expire_client(conf);
				1536	goto out_new;
				1537	}
				1538	/*
				1539	* Set bit when the owner id and verifier map to an already
				1540	* confirmed client id (18.35.3).
				1541	*/
				1542	exid->flags \|= EXCHGID4_FLAG_CONFIRMED_R;
				1543
				1544	/*
				1545	* Falling into 18.35.4 case 2, possible router replay.
				1546	* Leave confirmed record intact and return same result.
				1547	*/
				1548	copy_verf(conf, &verf);
				1549	new = conf;
				1550	goto out_copy;
				1551	}
				1552
				1553	/* 18.35.4 case 7 */
				1554	if (exid->flags & EXCHGID4_FLAG_UPD_CONFIRMED_REC_A) {
				1555	status = nfserr_noent;
				1556	goto out;
				1557	}
				1558
				1559	unconf = find_unconfirmed_client_by_str(dname, strhashval);
				1560	if (unconf) {
				1561	/*
				1562	* Possible retry or client restart. Per 18.35.4 case 4,
				1563	* a new unconfirmed record should be generated regardless
				1564	* of whether any properties have changed.
				1565	*/
				1566	expire_client(unconf);
				1567	}
				1568
				1569	out_new:
				1570	/* Normal case */
				1571	new = create_client(exid->clname, dname, rqstp, &verf);
				1572	if (new == NULL) {
				1573	status = nfserr_jukebox;
				1574	goto out;
				1575	}
				1576
				1577	gen_clid(new);
				1578	add_to_unconfirmed(new, strhashval);
				1579	out_copy:
				1580	exid->clientid.cl_boot = new->cl_clientid.cl_boot;
				1581	exid->clientid.cl_id = new->cl_clientid.cl_id;
				1582
				1583	exid->seqid = 1;
				1584	nfsd4_set_ex_flags(new, exid);
				1585
				1586	dprintk("nfsd4_exchange_id seqid %d flags %x\n",
				1587	new->cl_cs_slot.sl_seqid, new->cl_exchange_flags);
				1588	status = nfs_ok;
				1589
				1590	out:
				1591	nfs4_unlock_state();
				1592	error:
				1593	dprintk("nfsd4_exchange_id returns %d\n", ntohl(status));
				1594	return status;
				1595	}
				1596
				1597	static int
				1598	check_slot_seqid(u32 seqid, u32 slot_seqid, int slot_inuse)
				1599	{
				1600	dprintk("%s enter. seqid %d slot_seqid %d\n", __func__, seqid,
				1601	slot_seqid);
				1602
				1603	/* The slot is in use, and no response has been sent. */
				1604	if (slot_inuse) {
				1605	if (seqid == slot_seqid)
				1606	return nfserr_jukebox;
				1607	else
				1608	return nfserr_seq_misordered;
				1609	}
				1610	/* Note unsigned 32-bit arithmetic handles wraparound: */
				1611	if (likely(seqid == slot_seqid + 1))
				1612	return nfs_ok;
				1613	if (seqid == slot_seqid)
				1614	return nfserr_replay_cache;
				1615	return nfserr_seq_misordered;
				1616	}
				1617
				1618	/*
				1619	* Cache the create session result into the create session single DRC
				1620	* slot cache by saving the xdr structure. sl_seqid has been set.
				1621	* Do this for solo or embedded create session operations.
				1622	*/
				1623	static void
				1624	nfsd4_cache_create_session(struct nfsd4_create_session *cr_ses,
				1625	struct nfsd4_clid_slot *slot, int nfserr)
				1626	{
				1627	slot->sl_status = nfserr;
				1628	memcpy(&slot->sl_cr_ses, cr_ses, sizeof(*cr_ses));
				1629	}
				1630
				1631	static __be32
				1632	nfsd4_replay_create_session(struct nfsd4_create_session *cr_ses,
				1633	struct nfsd4_clid_slot *slot)
				1634	{
				1635	memcpy(cr_ses, &slot->sl_cr_ses, sizeof(*cr_ses));
				1636	return slot->sl_status;
				1637	}
				1638
				1639	#define NFSD_MIN_REQ_HDR_SEQ_SZ ((\
				1640	2 * 2 + /* credential,verifier: AUTH_NULL, length 0 */ \
				1641	1 + /* MIN tag is length with zero, only length */ \
				1642	3 + /* version, opcount, opcode */ \
				1643	XDR_QUADLEN(NFS4_MAX_SESSIONID_LEN) + \
				1644	/* seqid, slotID, slotID, cache */ \
				1645	4 ) * sizeof(__be32))
				1646
				1647	#define NFSD_MIN_RESP_HDR_SEQ_SZ ((\
				1648	2 + /* verifier: AUTH_NULL, length 0 */\
				1649	1 + /* status */ \
				1650	1 + /* MIN tag is length with zero, only length */ \
				1651	3 + /* opcount, opcode, opstatus*/ \
				1652	XDR_QUADLEN(NFS4_MAX_SESSIONID_LEN) + \
				1653	/* seqid, slotID, slotID, slotID, status */ \
				1654	5 ) * sizeof(__be32))
				1655
				1656	static __be32 check_forechannel_attrs(struct nfsd4_channel_attrs fchannel)
				1657	{
				1658	return fchannel.maxreq_sz < NFSD_MIN_REQ_HDR_SEQ_SZ
				1659	\|\| fchannel.maxresp_sz < NFSD_MIN_RESP_HDR_SEQ_SZ;
				1660	}
				1661
				1662	__be32
				1663	nfsd4_create_session(struct svc_rqst *rqstp,
				1664	struct nfsd4_compound_state *cstate,
				1665	struct nfsd4_create_session *cr_ses)
				1666	{
				1667	struct sockaddr *sa = svc_addr(rqstp);
				1668	struct nfs4_client conf, unconf;
				1669	struct nfsd4_session *new;
				1670	struct nfsd4_clid_slot *cs_slot = NULL;
				1671	bool confirm_me = false;
				1672	int status = 0;
				1673
				1674	if (cr_ses->flags & ~SESSION4_FLAG_MASK_A)
				1675	return nfserr_inval;
				1676
				1677	nfs4_lock_state();
				1678	unconf = find_unconfirmed_client(&cr_ses->clientid);
				1679	conf = find_confirmed_client(&cr_ses->clientid);
				1680
				1681	if (conf) {
				1682	cs_slot = &conf->cl_cs_slot;
				1683	status = check_slot_seqid(cr_ses->seqid, cs_slot->sl_seqid, 0);
				1684	if (status == nfserr_replay_cache) {
				1685	dprintk("Got a create_session replay! seqid= %d\n",
				1686	cs_slot->sl_seqid);
				1687	/* Return the cached reply status */
				1688	status = nfsd4_replay_create_session(cr_ses, cs_slot);
				1689	goto out;
				1690	} else if (cr_ses->seqid != cs_slot->sl_seqid + 1) {
				1691	status = nfserr_seq_misordered;
				1692	dprintk("Sequence misordered!\n");
				1693	dprintk("Expected seqid= %d but got seqid= %d\n",
				1694	cs_slot->sl_seqid, cr_ses->seqid);
				1695	goto out;
				1696	}
				1697	} else if (unconf) {
				1698	if (!same_creds(&unconf->cl_cred, &rqstp->rq_cred) \|\|
				1699	!rpc_cmp_addr(sa, (struct sockaddr *) &unconf->cl_addr)) {
				1700	status = nfserr_clid_inuse;
				1701	goto out;
				1702	}
				1703
				1704	cs_slot = &unconf->cl_cs_slot;
				1705	status = check_slot_seqid(cr_ses->seqid, cs_slot->sl_seqid, 0);
				1706	if (status) {
				1707	/* an unconfirmed replay returns misordered */
				1708	status = nfserr_seq_misordered;
				1709	goto out;
				1710	}
				1711
				1712	confirm_me = true;
				1713	conf = unconf;
				1714	} else {
				1715	status = nfserr_stale_clientid;
				1716	goto out;
				1717	}
				1718
				1719	/*
				1720	* XXX: we should probably set this at creation time, and check
				1721	* for consistent minorversion use throughout:
				1722	*/
				1723	conf->cl_minorversion = 1;
				1724	/*
				1725	* We do not support RDMA or persistent sessions
				1726	*/
				1727	cr_ses->flags &= ~SESSION4_PERSIST;
				1728	cr_ses->flags &= ~SESSION4_RDMA;
				1729
				1730	status = nfserr_toosmall;
				1731	if (check_forechannel_attrs(cr_ses->fore_channel))
				1732	goto out;
				1733
				1734	status = nfserr_jukebox;
				1735	new = alloc_init_session(rqstp, conf, cr_ses);
				1736	if (!new)
				1737	goto out;
				1738	status = nfs_ok;
				1739	memcpy(cr_ses->sessionid.data, new->se_sessionid.data,
				1740	NFS4_MAX_SESSIONID_LEN);
				1741	memcpy(&cr_ses->fore_channel, &new->se_fchannel,
				1742	sizeof(struct nfsd4_channel_attrs));
				1743	cs_slot->sl_seqid++;
				1744	cr_ses->seqid = cs_slot->sl_seqid;
				1745
				1746	/* cache solo and embedded create sessions under the state lock */
				1747	nfsd4_cache_create_session(cr_ses, cs_slot, status);
				1748	if (confirm_me)
				1749	move_to_confirmed(conf);
				1750	out:
				1751	nfs4_unlock_state();
				1752	dprintk("%s returns %d\n", __func__, ntohl(status));
				1753	return status;
				1754	}
				1755
				1756	static bool nfsd4_last_compound_op(struct svc_rqst *rqstp)
				1757	{
				1758	struct nfsd4_compoundres *resp = rqstp->rq_resp;
				1759	struct nfsd4_compoundargs *argp = rqstp->rq_argp;
				1760
				1761	return argp->opcnt == resp->opcnt;
				1762	}
				1763
				1764	static __be32 nfsd4_map_bcts_dir(u32 *dir)
				1765	{
				1766	switch (*dir) {
				1767	case NFS4_CDFC4_FORE:
				1768	case NFS4_CDFC4_BACK:
				1769	return nfs_ok;
				1770	case NFS4_CDFC4_FORE_OR_BOTH:
				1771	case NFS4_CDFC4_BACK_OR_BOTH:
				1772	*dir = NFS4_CDFC4_BOTH;
				1773	return nfs_ok;
				1774	};
				1775	return nfserr_inval;
				1776	}
				1777
				1778	__be32 nfsd4_bind_conn_to_session(struct svc_rqst *rqstp,
				1779	struct nfsd4_compound_state *cstate,
				1780	struct nfsd4_bind_conn_to_session *bcts)
				1781	{
				1782	__be32 status;
				1783
				1784	if (!nfsd4_last_compound_op(rqstp))
				1785	return nfserr_not_only_op;
				1786	spin_lock(&client_lock);
				1787	cstate->session = find_in_sessionid_hashtbl(&bcts->sessionid);
				1788	/* Sorta weird: we only need the refcnt'ing because new_conn acquires
				1789	* client_lock iself: */
				1790	if (cstate->session) {
				1791	nfsd4_get_session(cstate->session);
				1792	atomic_inc(&cstate->session->se_client->cl_refcount);
				1793	}
				1794	spin_unlock(&client_lock);
				1795	if (!cstate->session)
				1796	return nfserr_badsession;
				1797
				1798	status = nfsd4_map_bcts_dir(&bcts->dir);
				1799	if (!status)
				1800	nfsd4_new_conn(rqstp, cstate->session, bcts->dir);
				1801	return status;
				1802	}
				1803
				1804	static bool nfsd4_compound_in_session(struct nfsd4_session session, struct nfs4_sessionid sid)
				1805	{
				1806	if (!session)
				1807	return 0;
				1808	return !memcmp(sid, &session->se_sessionid, sizeof(*sid));
				1809	}
				1810
				1811	__be32
				1812	nfsd4_destroy_session(struct svc_rqst *r,
				1813	struct nfsd4_compound_state *cstate,
				1814	struct nfsd4_destroy_session *sessionid)
				1815	{
				1816	struct nfsd4_session *ses;
				1817	u32 status = nfserr_badsession;
				1818
				1819	/* Notes:
				1820	* - The confirmed nfs4_client->cl_sessionid holds destroyed sessinid
				1821	* - Should we return nfserr_back_chan_busy if waiting for
				1822	* callbacks on to-be-destroyed session?
				1823	* - Do we need to clear any callback info from previous session?
				1824	*/
				1825
				1826	if (nfsd4_compound_in_session(cstate->session, &sessionid->sessionid)) {
				1827	if (!nfsd4_last_compound_op(r))
				1828	return nfserr_not_only_op;
				1829	}
				1830	dump_sessionid(__func__, &sessionid->sessionid);
				1831	spin_lock(&client_lock);
				1832	ses = find_in_sessionid_hashtbl(&sessionid->sessionid);
				1833	if (!ses) {
				1834	spin_unlock(&client_lock);
				1835	goto out;
				1836	}
				1837
				1838	unhash_session(ses);
				1839	spin_unlock(&client_lock);
				1840
				1841	nfs4_lock_state();
				1842	nfsd4_probe_callback_sync(ses->se_client);
				1843	nfs4_unlock_state();
				1844
				1845	spin_lock(&client_lock);
				1846	nfsd4_del_conns(ses);
				1847	nfsd4_put_session_locked(ses);
				1848	spin_unlock(&client_lock);
				1849	status = nfs_ok;
				1850	out:
				1851	dprintk("%s returns %d\n", __func__, ntohl(status));
				1852	return status;
				1853	}
				1854
				1855	static struct nfsd4_conn __nfsd4_find_conn(struct svc_xprt xpt, struct nfsd4_session *s)
				1856	{
				1857	struct nfsd4_conn *c;
				1858
				1859	list_for_each_entry(c, &s->se_conns, cn_persession) {
				1860	if (c->cn_xprt == xpt) {
				1861	return c;
				1862	}
				1863	}
				1864	return NULL;
				1865	}
				1866
				1867	static void nfsd4_sequence_check_conn(struct nfsd4_conn new, struct nfsd4_session ses)
				1868	{
				1869	struct nfs4_client *clp = ses->se_client;
				1870	struct nfsd4_conn *c;
				1871	int ret;
				1872
				1873	spin_lock(&clp->cl_lock);
				1874	c = __nfsd4_find_conn(new->cn_xprt, ses);
				1875	if (c) {
				1876	spin_unlock(&clp->cl_lock);
				1877	free_conn(new);
				1878	return;
				1879	}
				1880	__nfsd4_hash_conn(new, ses);
				1881	spin_unlock(&clp->cl_lock);
				1882	ret = nfsd4_register_conn(new);
				1883	if (ret)
				1884	/* oops; xprt is already down: */
				1885	nfsd4_conn_lost(&new->cn_xpt_user);
				1886	return;
				1887	}
				1888
				1889	static bool nfsd4_session_too_many_ops(struct svc_rqst rqstp, struct nfsd4_session session)
				1890	{
				1891	struct nfsd4_compoundargs *args = rqstp->rq_argp;
				1892
				1893	return args->opcnt > session->se_fchannel.maxops;
				1894	}
				1895
				1896	static bool nfsd4_request_too_big(struct svc_rqst *rqstp,
				1897	struct nfsd4_session *session)
				1898	{
				1899	struct xdr_buf *xb = &rqstp->rq_arg;
				1900
				1901	return xb->len > session->se_fchannel.maxreq_sz;
				1902	}
				1903
				1904	__be32
				1905	nfsd4_sequence(struct svc_rqst *rqstp,
				1906	struct nfsd4_compound_state *cstate,
				1907	struct nfsd4_sequence *seq)
				1908	{
				1909	struct nfsd4_compoundres *resp = rqstp->rq_resp;
				1910	struct nfsd4_session *session;
				1911	struct nfsd4_slot *slot;
				1912	struct nfsd4_conn *conn;
				1913	int status;
				1914
				1915	if (resp->opcnt != 1)
				1916	return nfserr_sequence_pos;
				1917
				1918	/*
				1919	* Will be either used or freed by nfsd4_sequence_check_conn
				1920	* below.
				1921	*/
				1922	conn = alloc_conn(rqstp, NFS4_CDFC4_FORE);
				1923	if (!conn)
				1924	return nfserr_jukebox;
				1925
				1926	spin_lock(&client_lock);
				1927	status = nfserr_badsession;
				1928	session = find_in_sessionid_hashtbl(&seq->sessionid);
				1929	if (!session)
				1930	goto out;
				1931
				1932	status = nfserr_too_many_ops;
				1933	if (nfsd4_session_too_many_ops(rqstp, session))
				1934	goto out;
				1935
				1936	status = nfserr_req_too_big;
				1937	if (nfsd4_request_too_big(rqstp, session))
				1938	goto out;
				1939
				1940	status = nfserr_badslot;
				1941	if (seq->slotid >= session->se_fchannel.maxreqs)
				1942	goto out;
				1943
				1944	slot = session->se_slots[seq->slotid];
				1945	dprintk("%s: slotid %d\n", __func__, seq->slotid);
				1946
				1947	/* We do not negotiate the number of slots yet, so set the
				1948	* maxslots to the session maxreqs which is used to encode
				1949	* sr_highest_slotid and the sr_target_slot id to maxslots */
				1950	seq->maxslots = session->se_fchannel.maxreqs;
				1951
				1952	status = check_slot_seqid(seq->seqid, slot->sl_seqid,
				1953	slot->sl_flags & NFSD4_SLOT_INUSE);
				1954	if (status == nfserr_replay_cache) {
				1955	status = nfserr_seq_misordered;
				1956	if (!(slot->sl_flags & NFSD4_SLOT_INITIALIZED))
				1957	goto out;
				1958	cstate->slot = slot;
				1959	cstate->session = session;
				1960	/* Return the cached reply status and set cstate->status
				1961	* for nfsd4_proc_compound processing */
				1962	status = nfsd4_replay_cache_entry(resp, seq);
				1963	cstate->status = nfserr_replay_cache;
				1964	goto out;
				1965	}
				1966	if (status)
				1967	goto out;
				1968
				1969	nfsd4_sequence_check_conn(conn, session);
				1970	conn = NULL;
				1971
				1972	/* Success! bump slot seqid */
				1973	slot->sl_seqid = seq->seqid;
				1974	slot->sl_flags \|= NFSD4_SLOT_INUSE;
				1975	if (seq->cachethis)
				1976	slot->sl_flags \|= NFSD4_SLOT_CACHETHIS;
				1977	else
				1978	slot->sl_flags &= ~NFSD4_SLOT_CACHETHIS;
				1979
				1980	cstate->slot = slot;
				1981	cstate->session = session;
				1982
				1983	out:
				1984	/* Hold a session reference until done processing the compound. */
				1985	if (cstate->session) {
				1986	struct nfs4_client *clp = session->se_client;
				1987
				1988	nfsd4_get_session(cstate->session);
				1989	atomic_inc(&clp->cl_refcount);
				1990	switch (clp->cl_cb_state) {
				1991	case NFSD4_CB_DOWN:
				1992	seq->status_flags = SEQ4_STATUS_CB_PATH_DOWN;
				1993	break;
				1994	case NFSD4_CB_FAULT:
				1995	seq->status_flags = SEQ4_STATUS_BACKCHANNEL_FAULT;
				1996	break;
				1997	default:
				1998	seq->status_flags = 0;
				1999	}
				2000	}
				2001	kfree(conn);
				2002	spin_unlock(&client_lock);
				2003	dprintk("%s: return %d\n", __func__, ntohl(status));
				2004	return status;
				2005	}
				2006
				2007	static inline bool has_resources(struct nfs4_client *clp)
				2008	{
				2009	return !list_empty(&clp->cl_openowners)
				2010	\|\| !list_empty(&clp->cl_delegations)
				2011	\|\| !list_empty(&clp->cl_sessions);
				2012	}
				2013
				2014	__be32
				2015	nfsd4_destroy_clientid(struct svc_rqst rqstp, struct nfsd4_compound_state cstate, struct nfsd4_destroy_clientid *dc)
				2016	{
				2017	struct nfs4_client conf, unconf, *clp;
				2018	int status = 0;
				2019
				2020	nfs4_lock_state();
				2021	unconf = find_unconfirmed_client(&dc->clientid);
				2022	conf = find_confirmed_client(&dc->clientid);
				2023
				2024	if (conf) {
				2025	clp = conf;
				2026
				2027	if (!is_client_expired(conf) && has_resources(conf)) {
				2028	status = nfserr_clientid_busy;
				2029	goto out;
				2030	}
				2031
				2032	/* rfc5661 18.50.3 */
				2033	if (cstate->session && conf == cstate->session->se_client) {
				2034	status = nfserr_clientid_busy;
				2035	goto out;
				2036	}
				2037	} else if (unconf)
				2038	clp = unconf;
				2039	else {
				2040	status = nfserr_stale_clientid;
				2041	goto out;
				2042	}
				2043
				2044	expire_client(clp);
				2045	out:
				2046	nfs4_unlock_state();
				2047	dprintk("%s return %d\n", __func__, ntohl(status));
				2048	return status;
				2049	}
				2050
				2051	__be32
				2052	nfsd4_reclaim_complete(struct svc_rqst rqstp, struct nfsd4_compound_state cstate, struct nfsd4_reclaim_complete *rc)
				2053	{
				2054	int status = 0;
				2055
				2056	if (rc->rca_one_fs) {
				2057	if (!cstate->current_fh.fh_dentry)
				2058	return nfserr_nofilehandle;
				2059	/*
				2060	* We don't take advantage of the rca_one_fs case.
				2061	* That's OK, it's optional, we can safely ignore it.
				2062	*/
				2063	return nfs_ok;
				2064	}
				2065
				2066	nfs4_lock_state();
				2067	status = nfserr_complete_already;
				2068	if (test_and_set_bit(NFSD4_CLIENT_RECLAIM_COMPLETE,
				2069	&cstate->session->se_client->cl_flags))
				2070	goto out;
				2071
				2072	status = nfserr_stale_clientid;
				2073	if (is_client_expired(cstate->session->se_client))
				2074	/*
				2075	* The following error isn't really legal.
				2076	* But we only get here if the client just explicitly
				2077	* destroyed the client. Surely it no longer cares what
				2078	* error it gets back on an operation for the dead
				2079	* client.
				2080	*/
				2081	goto out;
				2082
				2083	status = nfs_ok;
				2084	nfsd4_client_record_create(cstate->session->se_client);
				2085	out:
				2086	nfs4_unlock_state();
				2087	return status;
				2088	}
				2089
				2090	__be32
				2091	nfsd4_setclientid(struct svc_rqst rqstp, struct nfsd4_compound_state cstate,
				2092	struct nfsd4_setclientid *setclid)
				2093	{
				2094	struct xdr_netobj clname = setclid->se_name;
				2095	nfs4_verifier clverifier = setclid->se_verf;
				2096	unsigned int strhashval;
				2097	struct nfs4_client conf, unconf, *new;
				2098	__be32 status;
				2099	char dname[HEXDIR_LEN];
				2100
				2101	status = nfs4_make_rec_clidname(dname, &clname);
				2102	if (status)
				2103	return status;
				2104
				2105	/*
				2106	* XXX The Duplicate Request Cache (DRC) has been checked (??)
				2107	* We get here on a DRC miss.
				2108	*/
				2109
				2110	strhashval = clientstr_hashval(dname);
				2111
				2112	nfs4_lock_state();
				2113	conf = find_confirmed_client_by_str(dname, strhashval);
				2114	if (conf) {
				2115	/* RFC 3530 14.2.33 CASE 0: */
				2116	status = nfserr_clid_inuse;
				2117	if (clp_used_exchangeid(conf))
				2118	goto out;
				2119	if (!same_creds(&conf->cl_cred, &rqstp->rq_cred)) {
				2120	char addr_str[INET6_ADDRSTRLEN];
				2121	rpc_ntop((struct sockaddr *) &conf->cl_addr, addr_str,
				2122	sizeof(addr_str));
				2123	dprintk("NFSD: setclientid: string in use by client "
				2124	"at %s\n", addr_str);
				2125	goto out;
				2126	}
				2127	}
				2128	/*
				2129	* section 14.2.33 of RFC 3530 (under the heading "IMPLEMENTATION")
				2130	* has a description of SETCLIENTID request processing consisting
				2131	* of 5 bullet points, labeled as CASE0 - CASE4 below.
				2132	*/
				2133	unconf = find_unconfirmed_client_by_str(dname, strhashval);
				2134	status = nfserr_jukebox;
				2135	if (!conf) {
				2136	/*
				2137	* RFC 3530 14.2.33 CASE 4:
				2138	* placed first, because it is the normal case
				2139	*/
				2140	if (unconf)
				2141	expire_client(unconf);
				2142	new = create_client(clname, dname, rqstp, &clverifier);
				2143	if (new == NULL)
				2144	goto out;
				2145	gen_clid(new);
				2146	} else if (same_verf(&conf->cl_verifier, &clverifier)) {
				2147	/*
				2148	* RFC 3530 14.2.33 CASE 1:
				2149	* probable callback update
				2150	*/
				2151	if (unconf) {
				2152	/* Note this is removing unconfirmed {x**},
				2153	* which is stronger than RFC recommended {vxc**}.
				2154	* This has the advantage that there is at most
				2155	* one {x**} in either list at any time.
				2156	*/
				2157	expire_client(unconf);
				2158	}
				2159	new = create_client(clname, dname, rqstp, &clverifier);
				2160	if (new == NULL)
				2161	goto out;
				2162	copy_clid(new, conf);
				2163	} else if (!unconf) {
				2164	/*
				2165	* RFC 3530 14.2.33 CASE 2:
				2166	* probable client reboot; state will be removed if
				2167	* confirmed.
				2168	*/
				2169	new = create_client(clname, dname, rqstp, &clverifier);
				2170	if (new == NULL)
				2171	goto out;
				2172	gen_clid(new);
				2173	} else {
				2174	/*
				2175	* RFC 3530 14.2.33 CASE 3:
				2176	* probable client reboot; state will be removed if
				2177	* confirmed.
				2178	*/
				2179	expire_client(unconf);
				2180	new = create_client(clname, dname, rqstp, &clverifier);
				2181	if (new == NULL)
				2182	goto out;
				2183	gen_clid(new);
				2184	}
				2185	/*
				2186	* XXX: we should probably set this at creation time, and check
				2187	* for consistent minorversion use throughout:
				2188	*/
				2189	new->cl_minorversion = 0;
				2190	gen_callback(new, setclid, rqstp);
				2191	add_to_unconfirmed(new, strhashval);
				2192	setclid->se_clientid.cl_boot = new->cl_clientid.cl_boot;
				2193	setclid->se_clientid.cl_id = new->cl_clientid.cl_id;
				2194	memcpy(setclid->se_confirm.data, new->cl_confirm.data, sizeof(setclid->se_confirm.data));
				2195	status = nfs_ok;
				2196	out:
				2197	nfs4_unlock_state();
				2198	return status;
				2199	}
				2200
				2201
				2202	/*
				2203	* Section 14.2.34 of RFC 3530 (under the heading "IMPLEMENTATION") has
				2204	* a description of SETCLIENTID_CONFIRM request processing consisting of 4
				2205	* bullets, labeled as CASE1 - CASE4 below.
				2206	*/
				2207	__be32
				2208	nfsd4_setclientid_confirm(struct svc_rqst *rqstp,
				2209	struct nfsd4_compound_state *cstate,
				2210	struct nfsd4_setclientid_confirm *setclientid_confirm)
				2211	{
				2212	struct sockaddr *sa = svc_addr(rqstp);
				2213	struct nfs4_client conf, unconf;
				2214	nfs4_verifier confirm = setclientid_confirm->sc_confirm;
				2215	clientid_t * clid = &setclientid_confirm->sc_clientid;
				2216	__be32 status;
				2217
				2218	if (STALE_CLIENTID(clid))
				2219	return nfserr_stale_clientid;
				2220	/*
				2221	* XXX The Duplicate Request Cache (DRC) has been checked (??)
				2222	* We get here on a DRC miss.
				2223	*/
				2224
				2225	nfs4_lock_state();
				2226
				2227	conf = find_confirmed_client(clid);
				2228	unconf = find_unconfirmed_client(clid);
				2229
				2230	status = nfserr_clid_inuse;
				2231	if (conf && !rpc_cmp_addr((struct sockaddr *) &conf->cl_addr, sa))
				2232	goto out;
				2233	if (unconf && !rpc_cmp_addr((struct sockaddr *) &unconf->cl_addr, sa))
				2234	goto out;
				2235
				2236	/*
				2237	* section 14.2.34 of RFC 3530 has a description of
				2238	* SETCLIENTID_CONFIRM request processing consisting
				2239	* of 4 bullet points, labeled as CASE1 - CASE4 below.
				2240	*/
				2241	if (conf && unconf && same_verf(&confirm, &unconf->cl_confirm)) {
				2242	/*
				2243	* RFC 3530 14.2.34 CASE 1:
				2244	* callback update
				2245	*/
				2246	if (!same_creds(&conf->cl_cred, &unconf->cl_cred))
				2247	status = nfserr_clid_inuse;
				2248	else {
				2249	nfsd4_change_callback(conf, &unconf->cl_cb_conn);
				2250	nfsd4_probe_callback(conf);
				2251	expire_client(unconf);
				2252	status = nfs_ok;
				2253
				2254	}
				2255	} else if (conf && !unconf) {
				2256	/*
				2257	* RFC 3530 14.2.34 CASE 2:
				2258	* probable retransmitted request; play it safe and
				2259	* do nothing.
				2260	*/
				2261	if (!same_creds(&conf->cl_cred, &rqstp->rq_cred))
				2262	status = nfserr_clid_inuse;
				2263	else
				2264	status = nfs_ok;
				2265	} else if (!conf && unconf
				2266	&& same_verf(&unconf->cl_confirm, &confirm)) {
				2267	/*
				2268	* RFC 3530 14.2.34 CASE 3:
				2269	* Normal case; new or rebooted client:
				2270	*/
				2271	if (!same_creds(&unconf->cl_cred, &rqstp->rq_cred)) {
				2272	status = nfserr_clid_inuse;
				2273	} else {
				2274	unsigned int hash =
				2275	clientstr_hashval(unconf->cl_recdir);
				2276	conf = find_confirmed_client_by_str(unconf->cl_recdir,
				2277	hash);
				2278	if (conf) {
				2279	nfsd4_client_record_remove(conf);
				2280	expire_client(conf);
				2281	}
				2282	move_to_confirmed(unconf);
				2283	conf = unconf;
				2284	nfsd4_probe_callback(conf);
				2285	status = nfs_ok;
				2286	}
				2287	} else if ((!conf \|\| (conf && !same_verf(&conf->cl_confirm, &confirm)))
				2288	&& (!unconf \|\| (unconf && !same_verf(&unconf->cl_confirm,
				2289	&confirm)))) {
				2290	/*
				2291	* RFC 3530 14.2.34 CASE 4:
				2292	* Client probably hasn't noticed that we rebooted yet.
				2293	*/
				2294	status = nfserr_stale_clientid;
				2295	} else {
				2296	/* check that we have hit one of the cases...*/
				2297	status = nfserr_clid_inuse;
				2298	}
				2299	out:
				2300	nfs4_unlock_state();
				2301	return status;
				2302	}
				2303
				2304	static struct nfs4_file *nfsd4_alloc_file(void)
				2305	{
				2306	return kmem_cache_alloc(file_slab, GFP_KERNEL);
				2307	}
				2308
				2309	/* OPEN Share state helper functions */
				2310	static void nfsd4_init_file(struct nfs4_file fp, struct inode ino)
				2311	{
				2312	unsigned int hashval = file_hashval(ino);
				2313
				2314	atomic_set(&fp->fi_ref, 1);
				2315	INIT_LIST_HEAD(&fp->fi_hash);
				2316	INIT_LIST_HEAD(&fp->fi_stateids);
				2317	INIT_LIST_HEAD(&fp->fi_delegations);
				2318	fp->fi_inode = igrab(ino);
				2319	fp->fi_had_conflict = false;
				2320	fp->fi_lease = NULL;
				2321	memset(fp->fi_fds, 0, sizeof(fp->fi_fds));
				2322	memset(fp->fi_access, 0, sizeof(fp->fi_access));
				2323	spin_lock(&recall_lock);
				2324	list_add(&fp->fi_hash, &file_hashtbl[hashval]);
				2325	spin_unlock(&recall_lock);
				2326	}
				2327
				2328	static void
				2329	nfsd4_free_slab(struct kmem_cache **slab)
				2330	{
				2331	if (*slab == NULL)
				2332	return;
				2333	kmem_cache_destroy(*slab);
				2334	*slab = NULL;
				2335	}
				2336
				2337	void
				2338	nfsd4_free_slabs(void)
				2339	{
				2340	nfsd4_free_slab(&openowner_slab);
				2341	nfsd4_free_slab(&lockowner_slab);
				2342	nfsd4_free_slab(&file_slab);
				2343	nfsd4_free_slab(&stateid_slab);
				2344	nfsd4_free_slab(&deleg_slab);
				2345	}
				2346
				2347	int
				2348	nfsd4_init_slabs(void)
				2349	{
				2350	openowner_slab = kmem_cache_create("nfsd4_openowners",
				2351	sizeof(struct nfs4_openowner), 0, 0, NULL);
				2352	if (openowner_slab == NULL)
				2353	goto out_nomem;
				2354	lockowner_slab = kmem_cache_create("nfsd4_lockowners",
				2355	sizeof(struct nfs4_lockowner), 0, 0, NULL);
				2356	if (lockowner_slab == NULL)
				2357	goto out_nomem;
				2358	file_slab = kmem_cache_create("nfsd4_files",
				2359	sizeof(struct nfs4_file), 0, 0, NULL);
				2360	if (file_slab == NULL)
				2361	goto out_nomem;
				2362	stateid_slab = kmem_cache_create("nfsd4_stateids",
				2363	sizeof(struct nfs4_ol_stateid), 0, 0, NULL);
				2364	if (stateid_slab == NULL)
				2365	goto out_nomem;
				2366	deleg_slab = kmem_cache_create("nfsd4_delegations",
				2367	sizeof(struct nfs4_delegation), 0, 0, NULL);
				2368	if (deleg_slab == NULL)
				2369	goto out_nomem;
				2370	return 0;
				2371	out_nomem:
				2372	nfsd4_free_slabs();
				2373	dprintk("nfsd4: out of memory while initializing nfsv4\n");
				2374	return -ENOMEM;
				2375	}
				2376
				2377	void nfs4_free_openowner(struct nfs4_openowner *oo)
				2378	{
				2379	kfree(oo->oo_owner.so_owner.data);
				2380	kmem_cache_free(openowner_slab, oo);
				2381	}
				2382
				2383	void nfs4_free_lockowner(struct nfs4_lockowner *lo)
				2384	{
				2385	kfree(lo->lo_owner.so_owner.data);
				2386	kmem_cache_free(lockowner_slab, lo);
				2387	}
				2388
				2389	static void init_nfs4_replay(struct nfs4_replay *rp)
				2390	{
				2391	rp->rp_status = nfserr_serverfault;
				2392	rp->rp_buflen = 0;
				2393	rp->rp_buf = rp->rp_ibuf;
				2394	}
				2395
				2396	static inline void alloc_stateowner(struct kmem_cache slab, struct xdr_netobj owner, struct nfs4_client clp)
				2397	{
				2398	struct nfs4_stateowner *sop;
				2399
				2400	sop = kmem_cache_alloc(slab, GFP_KERNEL);
				2401	if (!sop)
				2402	return NULL;
				2403
				2404	sop->so_owner.data = kmemdup(owner->data, owner->len, GFP_KERNEL);
				2405	if (!sop->so_owner.data) {
				2406	kmem_cache_free(slab, sop);
				2407	return NULL;
				2408	}
				2409	sop->so_owner.len = owner->len;
				2410
				2411	INIT_LIST_HEAD(&sop->so_stateids);
				2412	sop->so_client = clp;
				2413	init_nfs4_replay(&sop->so_replay);
				2414	return sop;
				2415	}
				2416
				2417	static void hash_openowner(struct nfs4_openowner oo, struct nfs4_client clp, unsigned int strhashval)
				2418	{
				2419	list_add(&oo->oo_owner.so_strhash, &ownerstr_hashtbl[strhashval]);
				2420	list_add(&oo->oo_perclient, &clp->cl_openowners);
				2421	}
				2422
				2423	static struct nfs4_openowner *
				2424	alloc_init_open_stateowner(unsigned int strhashval, struct nfs4_client clp, struct nfsd4_open open) {
				2425	struct nfs4_openowner *oo;
				2426
				2427	oo = alloc_stateowner(openowner_slab, &open->op_owner, clp);
				2428	if (!oo)
				2429	return NULL;
				2430	oo->oo_owner.so_is_open_owner = 1;
				2431	oo->oo_owner.so_seqid = open->op_seqid;
				2432	oo->oo_flags = NFS4_OO_NEW;
				2433	oo->oo_time = 0;
				2434	oo->oo_last_closed_stid = NULL;
				2435	INIT_LIST_HEAD(&oo->oo_close_lru);
				2436	hash_openowner(oo, clp, strhashval);
				2437	return oo;
				2438	}
				2439
				2440	static void init_open_stateid(struct nfs4_ol_stateid stp, struct nfs4_file fp, struct nfsd4_open *open) {
				2441	struct nfs4_openowner *oo = open->op_openowner;
				2442	struct nfs4_client *clp = oo->oo_owner.so_client;
				2443
				2444	init_stid(&stp->st_stid, clp, NFS4_OPEN_STID);
				2445	INIT_LIST_HEAD(&stp->st_lockowners);
				2446	list_add(&stp->st_perstateowner, &oo->oo_owner.so_stateids);
				2447	list_add(&stp->st_perfile, &fp->fi_stateids);
				2448	stp->st_stateowner = &oo->oo_owner;
				2449	get_nfs4_file(fp);
				2450	stp->st_file = fp;
				2451	stp->st_access_bmap = 0;
				2452	stp->st_deny_bmap = 0;
				2453	__set_bit(open->op_share_access, &stp->st_access_bmap);
				2454	__set_bit(open->op_share_deny, &stp->st_deny_bmap);
				2455	stp->st_openstp = NULL;
				2456	}
				2457
				2458	static void
				2459	move_to_close_lru(struct nfs4_openowner *oo)
				2460	{
				2461	dprintk("NFSD: move_to_close_lru nfs4_openowner %p\n", oo);
				2462
				2463	list_move_tail(&oo->oo_close_lru, &close_lru);
				2464	oo->oo_time = get_seconds();
				2465	}
				2466
				2467	static int
				2468	same_owner_str(struct nfs4_stateowner sop, struct xdr_netobj owner,
				2469	clientid_t *clid)
				2470	{
				2471	return (sop->so_owner.len == owner->len) &&
				2472	0 == memcmp(sop->so_owner.data, owner->data, owner->len) &&
				2473	(sop->so_client->cl_clientid.cl_id == clid->cl_id);
				2474	}
				2475
				2476	static struct nfs4_openowner *
				2477	find_openstateowner_str(unsigned int hashval, struct nfsd4_open *open)
				2478	{
				2479	struct nfs4_stateowner *so;
				2480	struct nfs4_openowner *oo;
				2481
				2482	list_for_each_entry(so, &ownerstr_hashtbl[hashval], so_strhash) {
				2483	if (!so->so_is_open_owner)
				2484	continue;
				2485	if (same_owner_str(so, &open->op_owner, &open->op_clientid)) {
				2486	oo = openowner(so);
				2487	renew_client(oo->oo_owner.so_client);
				2488	return oo;
				2489	}
				2490	}
				2491	return NULL;
				2492	}
				2493
				2494	/* search file_hashtbl[] for file */
				2495	static struct nfs4_file *
				2496	find_file(struct inode *ino)
				2497	{
				2498	unsigned int hashval = file_hashval(ino);
				2499	struct nfs4_file *fp;
				2500
				2501	spin_lock(&recall_lock);
				2502	list_for_each_entry(fp, &file_hashtbl[hashval], fi_hash) {
				2503	if (fp->fi_inode == ino) {
				2504	get_nfs4_file(fp);
				2505	spin_unlock(&recall_lock);
				2506	return fp;
				2507	}
				2508	}
				2509	spin_unlock(&recall_lock);
				2510	return NULL;
				2511	}
				2512
				2513	/*
				2514	* Called to check deny when READ with all zero stateid or
				2515	* WRITE with all zero or all one stateid
				2516	*/
				2517	static __be32
				2518	nfs4_share_conflict(struct svc_fh *current_fh, unsigned int deny_type)
				2519	{
				2520	struct inode *ino = current_fh->fh_dentry->d_inode;
				2521	struct nfs4_file *fp;
				2522	struct nfs4_ol_stateid *stp;
				2523	__be32 ret;
				2524
				2525	dprintk("NFSD: nfs4_share_conflict\n");
				2526
				2527	fp = find_file(ino);
				2528	if (!fp)
				2529	return nfs_ok;
				2530	ret = nfserr_locked;
				2531	/* Search for conflicting share reservations */
				2532	list_for_each_entry(stp, &fp->fi_stateids, st_perfile) {
				2533	if (test_bit(deny_type, &stp->st_deny_bmap) \|\|
				2534	test_bit(NFS4_SHARE_DENY_BOTH, &stp->st_deny_bmap))
				2535	goto out;
				2536	}
				2537	ret = nfs_ok;
				2538	out:
				2539	put_nfs4_file(fp);
				2540	return ret;
				2541	}
				2542
				2543	static void nfsd_break_one_deleg(struct nfs4_delegation *dp)
				2544	{
				2545	/* We're assuming the state code never drops its reference
				2546	* without first removing the lease. Since we're in this lease
				2547	* callback (and since the lease code is serialized by the kernel
				2548	* lock) we know the server hasn't removed the lease yet, we know
				2549	* it's safe to take a reference: */
				2550	atomic_inc(&dp->dl_count);
				2551
				2552	list_add_tail(&dp->dl_recall_lru, &del_recall_lru);
				2553
				2554	/* only place dl_time is set. protected by lock_flocks*/
				2555	dp->dl_time = get_seconds();
				2556
				2557	nfsd4_cb_recall(dp);
				2558	}
				2559
				2560	/* Called from break_lease() with lock_flocks() held. */
				2561	static void nfsd_break_deleg_cb(struct file_lock *fl)
				2562	{
				2563	struct nfs4_file fp = (struct nfs4_file )fl->fl_owner;
				2564	struct nfs4_delegation *dp;
				2565
				2566	BUG_ON(!fp);
				2567	/* We assume break_lease is only called once per lease: */
				2568	BUG_ON(fp->fi_had_conflict);
				2569	/*
				2570	* We don't want the locks code to timeout the lease for us;
				2571	* we'll remove it ourself if a delegation isn't returned
				2572	* in time:
				2573	*/
				2574	fl->fl_break_time = 0;
				2575
				2576	spin_lock(&recall_lock);
				2577	fp->fi_had_conflict = true;
				2578	list_for_each_entry(dp, &fp->fi_delegations, dl_perfile)
				2579	nfsd_break_one_deleg(dp);
				2580	spin_unlock(&recall_lock);
				2581	}
				2582
				2583	static
				2584	int nfsd_change_deleg_cb(struct file_lock **onlist, int arg)
				2585	{
				2586	if (arg & F_UNLCK)
				2587	return lease_modify(onlist, arg);
				2588	else
				2589	return -EAGAIN;
				2590	}
				2591
				2592	static const struct lock_manager_operations nfsd_lease_mng_ops = {
				2593	.lm_break = nfsd_break_deleg_cb,
				2594	.lm_change = nfsd_change_deleg_cb,
				2595	};
				2596
				2597	static __be32 nfsd4_check_seqid(struct nfsd4_compound_state cstate, struct nfs4_stateowner so, u32 seqid)
				2598	{
				2599	if (nfsd4_has_session(cstate))
				2600	return nfs_ok;
				2601	if (seqid == so->so_seqid - 1)
				2602	return nfserr_replay_me;
				2603	if (seqid == so->so_seqid)
				2604	return nfs_ok;
				2605	return nfserr_bad_seqid;
				2606	}
				2607
				2608	__be32
				2609	nfsd4_process_open1(struct nfsd4_compound_state *cstate,
				2610	struct nfsd4_open *open)
				2611	{
				2612	clientid_t *clientid = &open->op_clientid;
				2613	struct nfs4_client *clp = NULL;
				2614	unsigned int strhashval;
				2615	struct nfs4_openowner *oo = NULL;
				2616	__be32 status;
				2617
				2618	if (STALE_CLIENTID(&open->op_clientid))
				2619	return nfserr_stale_clientid;
				2620	/*
				2621	* In case we need it later, after we've already created the
				2622	* file and don't want to risk a further failure:
				2623	*/
				2624	open->op_file = nfsd4_alloc_file();
				2625	if (open->op_file == NULL)
				2626	return nfserr_jukebox;
				2627
				2628	strhashval = ownerstr_hashval(clientid->cl_id, &open->op_owner);
				2629	oo = find_openstateowner_str(strhashval, open);
				2630	open->op_openowner = oo;
				2631	if (!oo) {
				2632	clp = find_confirmed_client(clientid);
				2633	if (clp == NULL)
				2634	return nfserr_expired;
				2635	goto new_owner;
				2636	}
				2637	if (!(oo->oo_flags & NFS4_OO_CONFIRMED)) {
				2638	/* Replace unconfirmed owners without checking for replay. */
				2639	clp = oo->oo_owner.so_client;
				2640	release_openowner(oo);
				2641	open->op_openowner = NULL;
				2642	goto new_owner;
				2643	}
				2644	status = nfsd4_check_seqid(cstate, &oo->oo_owner, open->op_seqid);
				2645	if (status)
				2646	return status;
				2647	clp = oo->oo_owner.so_client;
				2648	goto alloc_stateid;
				2649	new_owner:
				2650	oo = alloc_init_open_stateowner(strhashval, clp, open);
				2651	if (oo == NULL)
				2652	return nfserr_jukebox;
				2653	open->op_openowner = oo;
				2654	alloc_stateid:
				2655	open->op_stp = nfs4_alloc_stateid(clp);
				2656	if (!open->op_stp)
				2657	return nfserr_jukebox;
				2658	return nfs_ok;
				2659	}
				2660
				2661	static inline __be32
				2662	nfs4_check_delegmode(struct nfs4_delegation *dp, int flags)
				2663	{
				2664	if ((flags & WR_STATE) && (dp->dl_type == NFS4_OPEN_DELEGATE_READ))
				2665	return nfserr_openmode;
				2666	else
				2667	return nfs_ok;
				2668	}
				2669
				2670	static int share_access_to_flags(u32 share_access)
				2671	{
				2672	return share_access == NFS4_SHARE_ACCESS_READ ? RD_STATE : WR_STATE;
				2673	}
				2674
				2675	static struct nfs4_delegation find_deleg_stateid(struct nfs4_client cl, stateid_t *s)
				2676	{
				2677	struct nfs4_stid *ret;
				2678
				2679	ret = find_stateid_by_type(cl, s, NFS4_DELEG_STID);
				2680	if (!ret)
				2681	return NULL;
				2682	return delegstateid(ret);
				2683	}
				2684
				2685	static bool nfsd4_is_deleg_cur(struct nfsd4_open *open)
				2686	{
				2687	return open->op_claim_type == NFS4_OPEN_CLAIM_DELEGATE_CUR \|\|
				2688	open->op_claim_type == NFS4_OPEN_CLAIM_DELEG_CUR_FH;
				2689	}
				2690
				2691	static __be32
				2692	nfs4_check_deleg(struct nfs4_client cl, struct nfs4_file fp, struct nfsd4_open *open,
				2693	struct nfs4_delegation **dp)
				2694	{
				2695	int flags;
				2696	__be32 status = nfserr_bad_stateid;
				2697
				2698	*dp = find_deleg_stateid(cl, &open->op_delegate_stateid);
				2699	if (*dp == NULL)
				2700	goto out;
				2701	flags = share_access_to_flags(open->op_share_access);
				2702	status = nfs4_check_delegmode(*dp, flags);
				2703	if (status)
				2704	*dp = NULL;
				2705	out:
				2706	if (!nfsd4_is_deleg_cur(open))
				2707	return nfs_ok;
				2708	if (status)
				2709	return status;
				2710	open->op_openowner->oo_flags \|= NFS4_OO_CONFIRMED;
				2711	return nfs_ok;
				2712	}
				2713
				2714	static __be32
				2715	nfs4_check_open(struct nfs4_file fp, struct nfsd4_open open, struct nfs4_ol_stateid **stpp)
				2716	{
				2717	struct nfs4_ol_stateid *local;
				2718	struct nfs4_openowner *oo = open->op_openowner;
				2719
				2720	list_for_each_entry(local, &fp->fi_stateids, st_perfile) {
				2721	/* ignore lock owners */
				2722	if (local->st_stateowner->so_is_open_owner == 0)
				2723	continue;
				2724	/* remember if we have seen this open owner */
				2725	if (local->st_stateowner == &oo->oo_owner)
				2726	*stpp = local;
				2727	/* check for conflicting share reservations */
				2728	if (!test_share(local, open))
				2729	return nfserr_share_denied;
				2730	}
				2731	return nfs_ok;
				2732	}
				2733
				2734	static void nfs4_free_stateid(struct nfs4_ol_stateid *s)
				2735	{
				2736	kmem_cache_free(stateid_slab, s);
				2737	}
				2738
				2739	static inline int nfs4_access_to_access(u32 nfs4_access)
				2740	{
				2741	int flags = 0;
				2742
				2743	if (nfs4_access & NFS4_SHARE_ACCESS_READ)
				2744	flags \|= NFSD_MAY_READ;
				2745	if (nfs4_access & NFS4_SHARE_ACCESS_WRITE)
				2746	flags \|= NFSD_MAY_WRITE;
				2747	return flags;
				2748	}
				2749
				2750	static __be32 nfs4_get_vfs_file(struct svc_rqst rqstp, struct nfs4_file fp,
				2751	struct svc_fh cur_fh, struct nfsd4_open open)
				2752	{
				2753	__be32 status;
				2754	int oflag = nfs4_access_to_omode(open->op_share_access);
				2755	int access = nfs4_access_to_access(open->op_share_access);
				2756
				2757	if (!fp->fi_fds[oflag]) {
				2758	status = nfsd_open(rqstp, cur_fh, S_IFREG, access,
				2759	&fp->fi_fds[oflag]);
				2760	if (status)
				2761	return status;
				2762	}
				2763	nfs4_file_get_access(fp, oflag);
				2764
				2765	return nfs_ok;
				2766	}
				2767
				2768	static inline __be32
				2769	nfsd4_truncate(struct svc_rqst rqstp, struct svc_fh fh,
				2770	struct nfsd4_open *open)
				2771	{
				2772	struct iattr iattr = {
				2773	.ia_valid = ATTR_SIZE,
				2774	.ia_size = 0,
				2775	};
				2776	if (!open->op_truncate)
				2777	return 0;
				2778	if (!(open->op_share_access & NFS4_SHARE_ACCESS_WRITE))
				2779	return nfserr_inval;
				2780	return nfsd_setattr(rqstp, fh, &iattr, 0, (time_t)0);
				2781	}
				2782
				2783	static __be32
				2784	nfs4_upgrade_open(struct svc_rqst rqstp, struct nfs4_file fp, struct svc_fh cur_fh, struct nfs4_ol_stateid stp, struct nfsd4_open *open)
				2785	{
				2786	u32 op_share_access = open->op_share_access;
				2787	bool new_access;
				2788	__be32 status;
				2789
				2790	new_access = !test_bit(op_share_access, &stp->st_access_bmap);
				2791	if (new_access) {
				2792	status = nfs4_get_vfs_file(rqstp, fp, cur_fh, open);
				2793	if (status)
				2794	return status;
				2795	}
				2796	status = nfsd4_truncate(rqstp, cur_fh, open);
				2797	if (status) {
				2798	if (new_access) {
				2799	int oflag = nfs4_access_to_omode(op_share_access);
				2800	nfs4_file_put_access(fp, oflag);
				2801	}
				2802	return status;
				2803	}
				2804	/* remember the open */
				2805	__set_bit(op_share_access, &stp->st_access_bmap);
				2806	__set_bit(open->op_share_deny, &stp->st_deny_bmap);
				2807
				2808	return nfs_ok;
				2809	}
				2810
				2811
				2812	static void
				2813	nfs4_set_claim_prev(struct nfsd4_open *open, bool has_session)
				2814	{
				2815	open->op_openowner->oo_flags \|= NFS4_OO_CONFIRMED;
				2816	}
				2817
				2818	/* Should we give out recallable state?: */
				2819	static bool nfsd4_cb_channel_good(struct nfs4_client *clp)
				2820	{
				2821	if (clp->cl_cb_state == NFSD4_CB_UP)
				2822	return true;
				2823	/*
				2824	* In the sessions case, since we don't have to establish a
				2825	* separate connection for callbacks, we assume it's OK
				2826	* until we hear otherwise:
				2827	*/
				2828	return clp->cl_minorversion && clp->cl_cb_state == NFSD4_CB_UNKNOWN;
				2829	}
				2830
				2831	static struct file_lock nfs4_alloc_init_lease(struct nfs4_delegation dp, int flag)
				2832	{
				2833	struct file_lock *fl;
				2834
				2835	fl = locks_alloc_lock();
				2836	if (!fl)
				2837	return NULL;
				2838	locks_init_lock(fl);
				2839	fl->fl_lmops = &nfsd_lease_mng_ops;
				2840	fl->fl_flags = FL_LEASE;
				2841	fl->fl_type = flag == NFS4_OPEN_DELEGATE_READ? F_RDLCK: F_WRLCK;
				2842	fl->fl_end = OFFSET_MAX;
				2843	fl->fl_owner = (fl_owner_t)(dp->dl_file);
				2844	fl->fl_pid = current->tgid;
				2845	return fl;
				2846	}
				2847
				2848	static int nfs4_setlease(struct nfs4_delegation *dp, int flag)
				2849	{
				2850	struct nfs4_file *fp = dp->dl_file;
				2851	struct file_lock *fl;
				2852	int status;
				2853
				2854	fl = nfs4_alloc_init_lease(dp, flag);
				2855	if (!fl)
				2856	return -ENOMEM;
				2857	fl->fl_file = find_readable_file(fp);
				2858	list_add(&dp->dl_perclnt, &dp->dl_stid.sc_client->cl_delegations);
				2859	status = vfs_setlease(fl->fl_file, fl->fl_type, &fl);
				2860	if (status) {
				2861	list_del_init(&dp->dl_perclnt);
				2862	locks_free_lock(fl);
				2863	return -ENOMEM;
				2864	}
				2865	fp->fi_lease = fl;
				2866	fp->fi_deleg_file = fl->fl_file;
				2867	get_file(fp->fi_deleg_file);
				2868	atomic_set(&fp->fi_delegees, 1);
				2869	list_add(&dp->dl_perfile, &fp->fi_delegations);
				2870	return 0;
				2871	}
				2872
				2873	static int nfs4_set_delegation(struct nfs4_delegation *dp, int flag)
				2874	{
				2875	struct nfs4_file *fp = dp->dl_file;
				2876
				2877	if (!fp->fi_lease)
				2878	return nfs4_setlease(dp, flag);
				2879	spin_lock(&recall_lock);
				2880	if (fp->fi_had_conflict) {
				2881	spin_unlock(&recall_lock);
				2882	return -EAGAIN;
				2883	}
				2884	atomic_inc(&fp->fi_delegees);
				2885	list_add(&dp->dl_perfile, &fp->fi_delegations);
				2886	spin_unlock(&recall_lock);
				2887	list_add(&dp->dl_perclnt, &dp->dl_stid.sc_client->cl_delegations);
				2888	return 0;
				2889	}
				2890
				2891	static void nfsd4_open_deleg_none_ext(struct nfsd4_open *open, int status)
				2892	{
				2893	open->op_delegate_type = NFS4_OPEN_DELEGATE_NONE_EXT;
				2894	if (status == -EAGAIN)
				2895	open->op_why_no_deleg = WND4_CONTENTION;
				2896	else {
				2897	open->op_why_no_deleg = WND4_RESOURCE;
				2898	switch (open->op_deleg_want) {
				2899	case NFS4_SHARE_WANT_READ_DELEG:
				2900	case NFS4_SHARE_WANT_WRITE_DELEG:
				2901	case NFS4_SHARE_WANT_ANY_DELEG:
				2902	break;
				2903	case NFS4_SHARE_WANT_CANCEL:
				2904	open->op_why_no_deleg = WND4_CANCELLED;
				2905	break;
				2906	case NFS4_SHARE_WANT_NO_DELEG:
				2907	BUG(); /* not supposed to get here */
				2908	}
				2909	}
				2910	}
				2911
				2912	/*
				2913	* Attempt to hand out a delegation.
				2914	*/
				2915	static void
				2916	nfs4_open_delegation(struct svc_fh fh, struct nfsd4_open open, struct nfs4_ol_stateid *stp)
				2917	{
				2918	struct nfs4_delegation *dp;
				2919	struct nfs4_openowner *oo = container_of(stp->st_stateowner, struct nfs4_openowner, oo_owner);
				2920	int cb_up;
				2921	int status = 0, flag = 0;
				2922
				2923	cb_up = nfsd4_cb_channel_good(oo->oo_owner.so_client);
				2924	flag = NFS4_OPEN_DELEGATE_NONE;
				2925	open->op_recall = 0;
				2926	switch (open->op_claim_type) {
				2927	case NFS4_OPEN_CLAIM_PREVIOUS:
				2928	if (!cb_up)
				2929	open->op_recall = 1;
				2930	flag = open->op_delegate_type;
				2931	if (flag == NFS4_OPEN_DELEGATE_NONE)
				2932	goto out;
				2933	break;
				2934	case NFS4_OPEN_CLAIM_NULL:
				2935	/* Let's not give out any delegations till everyone's
				2936	* had the chance to reclaim theirs.... */
				2937	if (locks_in_grace())
				2938	goto out;
				2939	if (!cb_up \|\| !(oo->oo_flags & NFS4_OO_CONFIRMED))
				2940	goto out;
				2941	if (open->op_share_access & NFS4_SHARE_ACCESS_WRITE)
				2942	flag = NFS4_OPEN_DELEGATE_WRITE;
				2943	else
				2944	flag = NFS4_OPEN_DELEGATE_READ;
				2945	break;
				2946	default:
				2947	goto out;
				2948	}
				2949
				2950	dp = alloc_init_deleg(oo->oo_owner.so_client, stp, fh, flag);
				2951	if (dp == NULL)
				2952	goto out_no_deleg;
				2953	status = nfs4_set_delegation(dp, flag);
				2954	if (status)
				2955	goto out_free;
				2956
				2957	memcpy(&open->op_delegate_stateid, &dp->dl_stid.sc_stateid, sizeof(dp->dl_stid.sc_stateid));
				2958
				2959	dprintk("NFSD: delegation stateid=" STATEID_FMT "\n",
				2960	STATEID_VAL(&dp->dl_stid.sc_stateid));
				2961	out:
				2962	open->op_delegate_type = flag;
				2963	if (flag == NFS4_OPEN_DELEGATE_NONE) {
				2964	if (open->op_claim_type == NFS4_OPEN_CLAIM_PREVIOUS &&
				2965	open->op_delegate_type != NFS4_OPEN_DELEGATE_NONE)
				2966	dprintk("NFSD: WARNING: refusing delegation reclaim\n");
				2967
				2968	/* 4.1 client asking for a delegation? */
				2969	if (open->op_deleg_want)
				2970	nfsd4_open_deleg_none_ext(open, status);
				2971	}
				2972	return;
				2973	out_free:
				2974	nfs4_put_delegation(dp);
				2975	out_no_deleg:
				2976	flag = NFS4_OPEN_DELEGATE_NONE;
				2977	goto out;
				2978	}
				2979
				2980	static void nfsd4_deleg_xgrade_none_ext(struct nfsd4_open *open,
				2981	struct nfs4_delegation *dp)
				2982	{
				2983	if (open->op_deleg_want == NFS4_SHARE_WANT_READ_DELEG &&
				2984	dp->dl_type == NFS4_OPEN_DELEGATE_WRITE) {
				2985	open->op_delegate_type = NFS4_OPEN_DELEGATE_NONE_EXT;
				2986	open->op_why_no_deleg = WND4_NOT_SUPP_DOWNGRADE;
				2987	} else if (open->op_deleg_want == NFS4_SHARE_WANT_WRITE_DELEG &&
				2988	dp->dl_type == NFS4_OPEN_DELEGATE_WRITE) {
				2989	open->op_delegate_type = NFS4_OPEN_DELEGATE_NONE_EXT;
				2990	open->op_why_no_deleg = WND4_NOT_SUPP_UPGRADE;
				2991	}
				2992	/* Otherwise the client must be confused wanting a delegation
				2993	* it already has, therefore we don't return
				2994	* NFS4_OPEN_DELEGATE_NONE_EXT and reason.
				2995	*/
				2996	}
				2997
				2998	/*
				2999	* called with nfs4_lock_state() held.
				3000	*/
				3001	__be32
				3002	nfsd4_process_open2(struct svc_rqst rqstp, struct svc_fh current_fh, struct nfsd4_open *open)
				3003	{
				3004	struct nfsd4_compoundres *resp = rqstp->rq_resp;
				3005	struct nfs4_client *cl = open->op_openowner->oo_owner.so_client;
				3006	struct nfs4_file *fp = NULL;
				3007	struct inode *ino = current_fh->fh_dentry->d_inode;
				3008	struct nfs4_ol_stateid *stp = NULL;
				3009	struct nfs4_delegation *dp = NULL;
				3010	__be32 status;
				3011
				3012	/*
				3013	* Lookup file; if found, lookup stateid and check open request,
				3014	* and check for delegations in the process of being recalled.
				3015	* If not found, create the nfs4_file struct
				3016	*/
				3017	fp = find_file(ino);
				3018	if (fp) {
				3019	if ((status = nfs4_check_open(fp, open, &stp)))
				3020	goto out;
				3021	status = nfs4_check_deleg(cl, fp, open, &dp);
				3022	if (status)
				3023	goto out;
				3024	} else {
				3025	status = nfserr_bad_stateid;
				3026	if (nfsd4_is_deleg_cur(open))
				3027	goto out;
				3028	status = nfserr_jukebox;
				3029	fp = open->op_file;
				3030	open->op_file = NULL;
				3031	nfsd4_init_file(fp, ino);
				3032	}
				3033
				3034	/*
				3035	* OPEN the file, or upgrade an existing OPEN.
				3036	* If truncate fails, the OPEN fails.
				3037	*/
				3038	if (stp) {
				3039	/* Stateid was found, this is an OPEN upgrade */
				3040	status = nfs4_upgrade_open(rqstp, fp, current_fh, stp, open);
				3041	if (status)
				3042	goto out;
				3043	} else {
				3044	status = nfs4_get_vfs_file(rqstp, fp, current_fh, open);
				3045	if (status)
				3046	goto out;
				3047	stp = open->op_stp;
				3048	open->op_stp = NULL;
				3049	init_open_stateid(stp, fp, open);
				3050	status = nfsd4_truncate(rqstp, current_fh, open);
				3051	if (status) {
				3052	release_open_stateid(stp);
				3053	goto out;
				3054	}
				3055	}
				3056	update_stateid(&stp->st_stid.sc_stateid);
				3057	memcpy(&open->op_stateid, &stp->st_stid.sc_stateid, sizeof(stateid_t));
				3058
				3059	if (nfsd4_has_session(&resp->cstate)) {
				3060	open->op_openowner->oo_flags \|= NFS4_OO_CONFIRMED;
				3061
				3062	if (open->op_deleg_want & NFS4_SHARE_WANT_NO_DELEG) {
				3063	open->op_delegate_type = NFS4_OPEN_DELEGATE_NONE_EXT;
				3064	open->op_why_no_deleg = WND4_NOT_WANTED;
				3065	goto nodeleg;
				3066	}
				3067	}
				3068
				3069	/*
				3070	* Attempt to hand out a delegation. No error return, because the
				3071	* OPEN succeeds even if we fail.
				3072	*/
				3073	nfs4_open_delegation(current_fh, open, stp);
				3074	nodeleg:
				3075	status = nfs_ok;
				3076
				3077	dprintk("%s: stateid=" STATEID_FMT "\n", __func__,
				3078	STATEID_VAL(&stp->st_stid.sc_stateid));
				3079	out:
				3080	/* 4.1 client trying to upgrade/downgrade delegation? */
				3081	if (open->op_delegate_type == NFS4_OPEN_DELEGATE_NONE && dp &&
				3082	open->op_deleg_want)
				3083	nfsd4_deleg_xgrade_none_ext(open, dp);
				3084
				3085	if (fp)
				3086	put_nfs4_file(fp);
				3087	if (status == 0 && open->op_claim_type == NFS4_OPEN_CLAIM_PREVIOUS)
				3088	nfs4_set_claim_prev(open, nfsd4_has_session(&resp->cstate));
				3089	/*
				3090	* To finish the open response, we just need to set the rflags.
				3091	*/
				3092	open->op_rflags = NFS4_OPEN_RESULT_LOCKTYPE_POSIX;
				3093	if (!(open->op_openowner->oo_flags & NFS4_OO_CONFIRMED) &&
				3094	!nfsd4_has_session(&resp->cstate))
				3095	open->op_rflags \|= NFS4_OPEN_RESULT_CONFIRM;
				3096
				3097	return status;
				3098	}
				3099
				3100	void nfsd4_cleanup_open_state(struct nfsd4_open *open, __be32 status)
				3101	{
				3102	if (open->op_openowner) {
				3103	struct nfs4_openowner *oo = open->op_openowner;
				3104
				3105	if (!list_empty(&oo->oo_owner.so_stateids))
				3106	list_del_init(&oo->oo_close_lru);
				3107	if (oo->oo_flags & NFS4_OO_NEW) {
				3108	if (status) {
				3109	release_openowner(oo);
				3110	open->op_openowner = NULL;
				3111	} else
				3112	oo->oo_flags &= ~NFS4_OO_NEW;
				3113	}
				3114	}
				3115	if (open->op_file)
				3116	nfsd4_free_file(open->op_file);
				3117	if (open->op_stp)
				3118	nfs4_free_stateid(open->op_stp);
				3119	}
				3120
				3121	__be32
				3122	nfsd4_renew(struct svc_rqst rqstp, struct nfsd4_compound_state cstate,
				3123	clientid_t *clid)
				3124	{
				3125	struct nfs4_client *clp;
				3126	__be32 status;
				3127
				3128	nfs4_lock_state();
				3129	dprintk("process_renew(%08x/%08x): starting\n",
				3130	clid->cl_boot, clid->cl_id);
				3131	status = nfserr_stale_clientid;
				3132	if (STALE_CLIENTID(clid))
				3133	goto out;
				3134	clp = find_confirmed_client(clid);
				3135	status = nfserr_expired;
				3136	if (clp == NULL) {
				3137	/* We assume the client took too long to RENEW. */
				3138	dprintk("nfsd4_renew: clientid not found!\n");
				3139	goto out;
				3140	}
				3141	status = nfserr_cb_path_down;
				3142	if (!list_empty(&clp->cl_delegations)
				3143	&& clp->cl_cb_state != NFSD4_CB_UP)
				3144	goto out;
				3145	status = nfs_ok;
				3146	out:
				3147	nfs4_unlock_state();
				3148	return status;
				3149	}
				3150
				3151	static struct lock_manager nfsd4_manager = {
				3152	};
				3153
				3154	static void
				3155	nfsd4_end_grace(void)
				3156	{
				3157	dprintk("NFSD: end of grace period\n");
				3158	nfsd4_record_grace_done(&init_net, boot_time);
				3159	locks_end_grace(&nfsd4_manager);
				3160	/*
				3161	* Now that every NFSv4 client has had the chance to recover and
				3162	* to see the (possibly new, possibly shorter) lease time, we
				3163	* can safely set the next grace time to the current lease time:
				3164	*/
				3165	nfsd4_grace = nfsd4_lease;
				3166	}
				3167
				3168	static time_t
				3169	nfs4_laundromat(void)
				3170	{
				3171	struct nfs4_client *clp;
				3172	struct nfs4_openowner *oo;
				3173	struct nfs4_delegation *dp;
				3174	struct list_head pos, next, reaplist;
				3175	time_t cutoff = get_seconds() - nfsd4_lease;
				3176	time_t t, clientid_val = nfsd4_lease;
				3177	time_t u, test_val = nfsd4_lease;
				3178
				3179	nfs4_lock_state();
				3180
				3181	dprintk("NFSD: laundromat service - starting\n");
				3182	if (locks_in_grace())
				3183	nfsd4_end_grace();
				3184	INIT_LIST_HEAD(&reaplist);
				3185	spin_lock(&client_lock);
				3186	list_for_each_safe(pos, next, &client_lru) {
				3187	clp = list_entry(pos, struct nfs4_client, cl_lru);
				3188	if (time_after((unsigned long)clp->cl_time, (unsigned long)cutoff)) {
				3189	t = clp->cl_time - cutoff;
				3190	if (clientid_val > t)
				3191	clientid_val = t;
				3192	break;
				3193	}
				3194	if (atomic_read(&clp->cl_refcount)) {
				3195	dprintk("NFSD: client in use (clientid %08x)\n",
				3196	clp->cl_clientid.cl_id);
				3197	continue;
				3198	}
				3199	unhash_client_locked(clp);
				3200	list_add(&clp->cl_lru, &reaplist);
				3201	}
				3202	spin_unlock(&client_lock);
				3203	list_for_each_safe(pos, next, &reaplist) {
				3204	clp = list_entry(pos, struct nfs4_client, cl_lru);
				3205	dprintk("NFSD: purging unused client (clientid %08x)\n",
				3206	clp->cl_clientid.cl_id);
				3207	nfsd4_client_record_remove(clp);
				3208	expire_client(clp);
				3209	}
				3210	spin_lock(&recall_lock);
				3211	list_for_each_safe(pos, next, &del_recall_lru) {
				3212	dp = list_entry (pos, struct nfs4_delegation, dl_recall_lru);
				3213	if (time_after((unsigned long)dp->dl_time, (unsigned long)cutoff)) {
				3214	u = dp->dl_time - cutoff;
				3215	if (test_val > u)
				3216	test_val = u;
				3217	break;
				3218	}
				3219	list_move(&dp->dl_recall_lru, &reaplist);
				3220	}
				3221	spin_unlock(&recall_lock);
				3222	list_for_each_safe(pos, next, &reaplist) {
				3223	dp = list_entry (pos, struct nfs4_delegation, dl_recall_lru);
				3224	unhash_delegation(dp);
				3225	}
				3226	test_val = nfsd4_lease;
				3227	list_for_each_safe(pos, next, &close_lru) {
				3228	oo = container_of(pos, struct nfs4_openowner, oo_close_lru);
				3229	if (time_after((unsigned long)oo->oo_time, (unsigned long)cutoff)) {
				3230	u = oo->oo_time - cutoff;
				3231	if (test_val > u)
				3232	test_val = u;
				3233	break;
				3234	}
				3235	release_openowner(oo);
				3236	}
				3237	if (clientid_val < NFSD_LAUNDROMAT_MINTIMEOUT)
				3238	clientid_val = NFSD_LAUNDROMAT_MINTIMEOUT;
				3239	nfs4_unlock_state();
				3240	return clientid_val;
				3241	}
				3242
				3243	static struct workqueue_struct *laundry_wq;
				3244	static void laundromat_main(struct work_struct *);
				3245	static DECLARE_DELAYED_WORK(laundromat_work, laundromat_main);
				3246
				3247	static void
				3248	laundromat_main(struct work_struct *not_used)
				3249	{
				3250	time_t t;
				3251
				3252	t = nfs4_laundromat();
				3253	dprintk("NFSD: laundromat_main - sleeping for %ld seconds\n", t);
				3254	queue_delayed_work(laundry_wq, &laundromat_work, t*HZ);
				3255	}
				3256
				3257	static inline __be32 nfs4_check_fh(struct svc_fh fhp, struct nfs4_ol_stateid stp)
				3258	{
				3259	if (fhp->fh_dentry->d_inode != stp->st_file->fi_inode)
				3260	return nfserr_bad_stateid;
				3261	return nfs_ok;
				3262	}
				3263
				3264	static int
				3265	STALE_STATEID(stateid_t *stateid)
				3266	{
				3267	if (stateid->si_opaque.so_clid.cl_boot == boot_time)
				3268	return 0;
				3269	dprintk("NFSD: stale stateid " STATEID_FMT "!\n",
				3270	STATEID_VAL(stateid));
				3271	return 1;
				3272	}
				3273
				3274	static inline int
				3275	access_permit_read(unsigned long access_bmap)
				3276	{
				3277	return test_bit(NFS4_SHARE_ACCESS_READ, &access_bmap) \|\|
				3278	test_bit(NFS4_SHARE_ACCESS_BOTH, &access_bmap) \|\|
				3279	test_bit(NFS4_SHARE_ACCESS_WRITE, &access_bmap);
				3280	}
				3281
				3282	static inline int
				3283	access_permit_write(unsigned long access_bmap)
				3284	{
				3285	return test_bit(NFS4_SHARE_ACCESS_WRITE, &access_bmap) \|\|
				3286	test_bit(NFS4_SHARE_ACCESS_BOTH, &access_bmap);
				3287	}
				3288
				3289	static
				3290	__be32 nfs4_check_openmode(struct nfs4_ol_stateid *stp, int flags)
				3291	{
				3292	__be32 status = nfserr_openmode;
				3293
				3294	/* For lock stateid's, we test the parent open, not the lock: */
				3295	if (stp->st_openstp)
				3296	stp = stp->st_openstp;
				3297	if ((flags & WR_STATE) && (!access_permit_write(stp->st_access_bmap)))
				3298	goto out;
				3299	if ((flags & RD_STATE) && (!access_permit_read(stp->st_access_bmap)))
				3300	goto out;
				3301	status = nfs_ok;
				3302	out:
				3303	return status;
				3304	}
				3305
				3306	static inline __be32
				3307	check_special_stateids(svc_fh current_fh, stateid_t stateid, int flags)
				3308	{
				3309	if (ONE_STATEID(stateid) && (flags & RD_STATE))
				3310	return nfs_ok;
				3311	else if (locks_in_grace()) {
				3312	/* Answer in remaining cases depends on existence of
				3313	* conflicting state; so we must wait out the grace period. */
				3314	return nfserr_grace;
				3315	} else if (flags & WR_STATE)
				3316	return nfs4_share_conflict(current_fh,
				3317	NFS4_SHARE_DENY_WRITE);
				3318	else /* (flags & RD_STATE) && ZERO_STATEID(stateid) */
				3319	return nfs4_share_conflict(current_fh,
				3320	NFS4_SHARE_DENY_READ);
				3321	}
				3322
				3323	/*
				3324	* Allow READ/WRITE during grace period on recovered state only for files
				3325	* that are not able to provide mandatory locking.
				3326	*/
				3327	static inline int
				3328	grace_disallows_io(struct inode *inode)
				3329	{
				3330	return locks_in_grace() && mandatory_lock(inode);
				3331	}
				3332
				3333	/* Returns true iff a is later than b: */
				3334	static bool stateid_generation_after(stateid_t a, stateid_t b)
				3335	{
				3336	return (s32)a->si_generation - (s32)b->si_generation > 0;
				3337	}
				3338
				3339	static int check_stateid_generation(stateid_t in, stateid_t ref, bool has_session)
				3340	{
				3341	/*
				3342	* When sessions are used the stateid generation number is ignored
				3343	* when it is zero.
				3344	*/
				3345	if (has_session && in->si_generation == 0)
				3346	return nfs_ok;
				3347
				3348	if (in->si_generation == ref->si_generation)
				3349	return nfs_ok;
				3350
				3351	/* If the client sends us a stateid from the future, it's buggy: */
				3352	if (stateid_generation_after(in, ref))
				3353	return nfserr_bad_stateid;
				3354	/*
				3355	* However, we could see a stateid from the past, even from a
				3356	* non-buggy client. For example, if the client sends a lock
				3357	* while some IO is outstanding, the lock may bump si_generation
				3358	* while the IO is still in flight. The client could avoid that
				3359	* situation by waiting for responses on all the IO requests,
				3360	* but better performance may result in retrying IO that
				3361	* receives an old_stateid error if requests are rarely
				3362	* reordered in flight:
				3363	*/
				3364	return nfserr_old_stateid;
				3365	}
				3366
				3367	static __be32 nfsd4_check_openowner_confirmed(struct nfs4_ol_stateid *ols)
				3368	{
				3369	if (ols->st_stateowner->so_is_open_owner &&
				3370	!(openowner(ols->st_stateowner)->oo_flags & NFS4_OO_CONFIRMED))
				3371	return nfserr_bad_stateid;
				3372	return nfs_ok;
				3373	}
				3374
				3375	__be32 nfs4_validate_stateid(struct nfs4_client cl, stateid_t stateid)
				3376	{
				3377	struct nfs4_stid *s;
				3378	__be32 status;
				3379
				3380	if (STALE_STATEID(stateid))
				3381	return nfserr_stale_stateid;
				3382
				3383	s = find_stateid(cl, stateid);
				3384	if (!s)
				3385	return nfserr_stale_stateid;
				3386	status = check_stateid_generation(stateid, &s->sc_stateid, 1);
				3387	if (status)
				3388	return status;
				3389	if (!(s->sc_type & (NFS4_OPEN_STID \| NFS4_LOCK_STID)))
				3390	return nfs_ok;
				3391	return nfsd4_check_openowner_confirmed(openlockstateid(s));
				3392	}
				3393
				3394	static __be32 nfsd4_lookup_stateid(stateid_t stateid, unsigned char typemask, struct nfs4_stid *s)
				3395	{
				3396	struct nfs4_client *cl;
				3397
				3398	if (ZERO_STATEID(stateid) \|\| ONE_STATEID(stateid))
				3399	return nfserr_bad_stateid;
				3400	if (STALE_STATEID(stateid))
				3401	return nfserr_stale_stateid;
				3402	cl = find_confirmed_client(&stateid->si_opaque.so_clid);
				3403	if (!cl)
				3404	return nfserr_expired;
				3405	*s = find_stateid_by_type(cl, stateid, typemask);
				3406	if (!*s)
				3407	return nfserr_bad_stateid;
				3408	return nfs_ok;
				3409
				3410	}
				3411
				3412	/*
				3413	* Checks for stateid operations
				3414	*/
				3415	__be32
				3416	nfs4_preprocess_stateid_op(struct nfsd4_compound_state *cstate,
				3417	stateid_t stateid, int flags, struct file *filpp)
				3418	{
				3419	struct nfs4_stid *s;
				3420	struct nfs4_ol_stateid *stp = NULL;
				3421	struct nfs4_delegation *dp = NULL;
				3422	struct svc_fh *current_fh = &cstate->current_fh;
				3423	struct inode *ino = current_fh->fh_dentry->d_inode;
				3424	__be32 status;
				3425
				3426	if (filpp)
				3427	*filpp = NULL;
				3428
				3429	if (grace_disallows_io(ino))
				3430	return nfserr_grace;
				3431
				3432	if (ZERO_STATEID(stateid) \|\| ONE_STATEID(stateid))
				3433	return check_special_stateids(current_fh, stateid, flags);
				3434
				3435	status = nfsd4_lookup_stateid(stateid, NFS4_DELEG_STID\|NFS4_OPEN_STID\|NFS4_LOCK_STID, &s);
				3436	if (status)
				3437	return status;
				3438	status = check_stateid_generation(stateid, &s->sc_stateid, nfsd4_has_session(cstate));
				3439	if (status)
				3440	goto out;
				3441	switch (s->sc_type) {
				3442	case NFS4_DELEG_STID:
				3443	dp = delegstateid(s);
				3444	status = nfs4_check_delegmode(dp, flags);
				3445	if (status)
				3446	goto out;
				3447	if (filpp) {
				3448	*filpp = dp->dl_file->fi_deleg_file;
				3449	BUG_ON(!*filpp);
				3450	}
				3451	break;
				3452	case NFS4_OPEN_STID:
				3453	case NFS4_LOCK_STID:
				3454	stp = openlockstateid(s);
				3455	status = nfs4_check_fh(current_fh, stp);
				3456	if (status)
				3457	goto out;
				3458	status = nfsd4_check_openowner_confirmed(stp);
				3459	if (status)
				3460	goto out;
				3461	status = nfs4_check_openmode(stp, flags);
				3462	if (status)
				3463	goto out;
				3464	if (filpp) {
				3465	if (flags & RD_STATE)
				3466	*filpp = find_readable_file(stp->st_file);
				3467	else
				3468	*filpp = find_writeable_file(stp->st_file);
				3469	}
				3470	break;
				3471	default:
				3472	return nfserr_bad_stateid;
				3473	}
				3474	status = nfs_ok;
				3475	out:
				3476	return status;
				3477	}
				3478
				3479	static __be32
				3480	nfsd4_free_lock_stateid(struct nfs4_ol_stateid *stp)
				3481	{
				3482	struct nfs4_lockowner *lo = lockowner(stp->st_stateowner);
				3483
				3484	if (check_for_locks(stp->st_file, lo))
				3485	return nfserr_locks_held;
				3486	/*
				3487	* Currently there's a 1-1 lock stateid<->lockowner
				3488	* correspondance, and we have to delete the lockowner when we
				3489	* delete the lock stateid:
				3490	*/
				3491	release_lockowner(lo);
				3492	return nfs_ok;
				3493	}
				3494
				3495	/*
				3496	* Test if the stateid is valid
				3497	*/
				3498	__be32
				3499	nfsd4_test_stateid(struct svc_rqst rqstp, struct nfsd4_compound_state cstate,
				3500	struct nfsd4_test_stateid *test_stateid)
				3501	{
				3502	struct nfsd4_test_stateid_id *stateid;
				3503	struct nfs4_client *cl = cstate->session->se_client;
				3504
				3505	nfs4_lock_state();
				3506	list_for_each_entry(stateid, &test_stateid->ts_stateid_list, ts_id_list)
				3507	stateid->ts_id_status = nfs4_validate_stateid(cl, &stateid->ts_id_stateid);
				3508	nfs4_unlock_state();
				3509
				3510	return nfs_ok;
				3511	}
				3512
				3513	__be32
				3514	nfsd4_free_stateid(struct svc_rqst rqstp, struct nfsd4_compound_state cstate,
				3515	struct nfsd4_free_stateid *free_stateid)
				3516	{
				3517	stateid_t *stateid = &free_stateid->fr_stateid;
				3518	struct nfs4_stid *s;
				3519	struct nfs4_client *cl = cstate->session->se_client;
				3520	__be32 ret = nfserr_bad_stateid;
				3521
				3522	nfs4_lock_state();
				3523	s = find_stateid(cl, stateid);
				3524	if (!s)
				3525	goto out;
				3526	switch (s->sc_type) {
				3527	case NFS4_DELEG_STID:
				3528	ret = nfserr_locks_held;
				3529	goto out;
				3530	case NFS4_OPEN_STID:
				3531	case NFS4_LOCK_STID:
				3532	ret = check_stateid_generation(stateid, &s->sc_stateid, 1);
				3533	if (ret)
				3534	goto out;
				3535	if (s->sc_type == NFS4_LOCK_STID)
				3536	ret = nfsd4_free_lock_stateid(openlockstateid(s));
				3537	else
				3538	ret = nfserr_locks_held;
				3539	break;
				3540	default:
				3541	ret = nfserr_bad_stateid;
				3542	}
				3543	out:
				3544	nfs4_unlock_state();
				3545	return ret;
				3546	}
				3547
				3548	static inline int
				3549	setlkflg (int type)
				3550	{
				3551	return (type == NFS4_READW_LT \|\| type == NFS4_READ_LT) ?
				3552	RD_STATE : WR_STATE;
				3553	}
				3554
				3555	static __be32 nfs4_seqid_op_checks(struct nfsd4_compound_state cstate, stateid_t stateid, u32 seqid, struct nfs4_ol_stateid *stp)
				3556	{
				3557	struct svc_fh *current_fh = &cstate->current_fh;
				3558	struct nfs4_stateowner *sop = stp->st_stateowner;
				3559	__be32 status;
				3560
				3561	status = nfsd4_check_seqid(cstate, sop, seqid);
				3562	if (status)
				3563	return status;
				3564	if (stp->st_stid.sc_type == NFS4_CLOSED_STID)
				3565	/*
				3566	* "Closed" stateid's exist only to return
				3567	* nfserr_replay_me from the previous step.
				3568	*/
				3569	return nfserr_bad_stateid;
				3570	status = check_stateid_generation(stateid, &stp->st_stid.sc_stateid, nfsd4_has_session(cstate));
				3571	if (status)
				3572	return status;
				3573	return nfs4_check_fh(current_fh, stp);
				3574	}
				3575
				3576	/*
				3577	* Checks for sequence id mutating operations.
				3578	*/
				3579	static __be32
				3580	nfs4_preprocess_seqid_op(struct nfsd4_compound_state *cstate, u32 seqid,
				3581	stateid_t *stateid, char typemask,
				3582	struct nfs4_ol_stateid **stpp)
				3583	{
				3584	__be32 status;
				3585	struct nfs4_stid *s;
				3586
				3587	dprintk("NFSD: %s: seqid=%d stateid = " STATEID_FMT "\n", __func__,
				3588	seqid, STATEID_VAL(stateid));
				3589
				3590	*stpp = NULL;
				3591	status = nfsd4_lookup_stateid(stateid, typemask, &s);
				3592	if (status)
				3593	return status;
				3594	*stpp = openlockstateid(s);
				3595	cstate->replay_owner = (*stpp)->st_stateowner;
				3596
				3597	return nfs4_seqid_op_checks(cstate, stateid, seqid, *stpp);
				3598	}
				3599
				3600	static __be32 nfs4_preprocess_confirmed_seqid_op(struct nfsd4_compound_state cstate, u32 seqid, stateid_t stateid, struct nfs4_ol_stateid **stpp)
				3601	{
				3602	__be32 status;
				3603	struct nfs4_openowner *oo;
				3604
				3605	status = nfs4_preprocess_seqid_op(cstate, seqid, stateid,
				3606	NFS4_OPEN_STID, stpp);
				3607	if (status)
				3608	return status;
				3609	oo = openowner((*stpp)->st_stateowner);
				3610	if (!(oo->oo_flags & NFS4_OO_CONFIRMED))
				3611	return nfserr_bad_stateid;
				3612	return nfs_ok;
				3613	}
				3614
				3615	__be32
				3616	nfsd4_open_confirm(struct svc_rqst rqstp, struct nfsd4_compound_state cstate,
				3617	struct nfsd4_open_confirm *oc)
				3618	{
				3619	__be32 status;
				3620	struct nfs4_openowner *oo;
				3621	struct nfs4_ol_stateid *stp;
				3622
				3623	dprintk("NFSD: nfsd4_open_confirm on file %.*s\n",
				3624	(int)cstate->current_fh.fh_dentry->d_name.len,
				3625	cstate->current_fh.fh_dentry->d_name.name);
				3626
				3627	status = fh_verify(rqstp, &cstate->current_fh, S_IFREG, 0);
				3628	if (status)
				3629	return status;
				3630
				3631	nfs4_lock_state();
				3632
				3633	status = nfs4_preprocess_seqid_op(cstate,
				3634	oc->oc_seqid, &oc->oc_req_stateid,
				3635	NFS4_OPEN_STID, &stp);
				3636	if (status)
				3637	goto out;
				3638	oo = openowner(stp->st_stateowner);
				3639	status = nfserr_bad_stateid;
				3640	if (oo->oo_flags & NFS4_OO_CONFIRMED)
				3641	goto out;
				3642	oo->oo_flags \|= NFS4_OO_CONFIRMED;
				3643	update_stateid(&stp->st_stid.sc_stateid);
				3644	memcpy(&oc->oc_resp_stateid, &stp->st_stid.sc_stateid, sizeof(stateid_t));
				3645	dprintk("NFSD: %s: success, seqid=%d stateid=" STATEID_FMT "\n",
				3646	__func__, oc->oc_seqid, STATEID_VAL(&stp->st_stid.sc_stateid));
				3647
				3648	nfsd4_client_record_create(oo->oo_owner.so_client);
				3649	status = nfs_ok;
				3650	out:
				3651	if (!cstate->replay_owner)
				3652	nfs4_unlock_state();
				3653	return status;
				3654	}
				3655
				3656	static inline void nfs4_stateid_downgrade_bit(struct nfs4_ol_stateid *stp, u32 access)
				3657	{
				3658	if (!test_bit(access, &stp->st_access_bmap))
				3659	return;
				3660	nfs4_file_put_access(stp->st_file, nfs4_access_to_omode(access));
				3661	__clear_bit(access, &stp->st_access_bmap);
				3662	}
				3663
				3664	static inline void nfs4_stateid_downgrade(struct nfs4_ol_stateid *stp, u32 to_access)
				3665	{
				3666	switch (to_access) {
				3667	case NFS4_SHARE_ACCESS_READ:
				3668	nfs4_stateid_downgrade_bit(stp, NFS4_SHARE_ACCESS_WRITE);
				3669	nfs4_stateid_downgrade_bit(stp, NFS4_SHARE_ACCESS_BOTH);
				3670	break;
				3671	case NFS4_SHARE_ACCESS_WRITE:
				3672	nfs4_stateid_downgrade_bit(stp, NFS4_SHARE_ACCESS_READ);
				3673	nfs4_stateid_downgrade_bit(stp, NFS4_SHARE_ACCESS_BOTH);
				3674	break;
				3675	case NFS4_SHARE_ACCESS_BOTH:
				3676	break;
				3677	default:
				3678	BUG();
				3679	}
				3680	}
				3681
				3682	static void
				3683	reset_union_bmap_deny(unsigned long deny, unsigned long *bmap)
				3684	{
				3685	int i;
				3686	for (i = 0; i < 4; i++) {
				3687	if ((i & deny) != i)
				3688	__clear_bit(i, bmap);
				3689	}
				3690	}
				3691
				3692	__be32
				3693	nfsd4_open_downgrade(struct svc_rqst *rqstp,
				3694	struct nfsd4_compound_state *cstate,
				3695	struct nfsd4_open_downgrade *od)
				3696	{
				3697	__be32 status;
				3698	struct nfs4_ol_stateid *stp;
				3699
				3700	dprintk("NFSD: nfsd4_open_downgrade on file %.*s\n",
				3701	(int)cstate->current_fh.fh_dentry->d_name.len,
				3702	cstate->current_fh.fh_dentry->d_name.name);
				3703
				3704	/* We don't yet support WANT bits: */
				3705	if (od->od_deleg_want)
				3706	dprintk("NFSD: %s: od_deleg_want=0x%x ignored\n", __func__,
				3707	od->od_deleg_want);
				3708
				3709	nfs4_lock_state();
				3710	status = nfs4_preprocess_confirmed_seqid_op(cstate, od->od_seqid,
				3711	&od->od_stateid, &stp);
				3712	if (status)
				3713	goto out;
				3714	status = nfserr_inval;
				3715	if (!test_bit(od->od_share_access, &stp->st_access_bmap)) {
				3716	dprintk("NFSD:access not a subset current bitmap: 0x%lx, input access=%08x\n",
				3717	stp->st_access_bmap, od->od_share_access);
				3718	goto out;
				3719	}
				3720	if (!test_bit(od->od_share_deny, &stp->st_deny_bmap)) {
				3721	dprintk("NFSD:deny not a subset current bitmap: 0x%lx, input deny=%08x\n",
				3722	stp->st_deny_bmap, od->od_share_deny);
				3723	goto out;
				3724	}
				3725	nfs4_stateid_downgrade(stp, od->od_share_access);
				3726
				3727	reset_union_bmap_deny(od->od_share_deny, &stp->st_deny_bmap);
				3728
				3729	update_stateid(&stp->st_stid.sc_stateid);
				3730	memcpy(&od->od_stateid, &stp->st_stid.sc_stateid, sizeof(stateid_t));
				3731	status = nfs_ok;
				3732	out:
				3733	if (!cstate->replay_owner)
				3734	nfs4_unlock_state();
				3735	return status;
				3736	}
				3737
				3738	void nfsd4_purge_closed_stateid(struct nfs4_stateowner *so)
				3739	{
				3740	struct nfs4_openowner *oo;
				3741	struct nfs4_ol_stateid *s;
				3742
				3743	if (!so->so_is_open_owner)
				3744	return;
				3745	oo = openowner(so);
				3746	s = oo->oo_last_closed_stid;
				3747	if (!s)
				3748	return;
				3749	if (!(oo->oo_flags & NFS4_OO_PURGE_CLOSE)) {
				3750	/* Release the last_closed_stid on the next seqid bump: */
				3751	oo->oo_flags \|= NFS4_OO_PURGE_CLOSE;
				3752	return;
				3753	}
				3754	oo->oo_flags &= ~NFS4_OO_PURGE_CLOSE;
				3755	release_last_closed_stateid(oo);
				3756	}
				3757
				3758	static void nfsd4_close_open_stateid(struct nfs4_ol_stateid *s)
				3759	{
				3760	unhash_open_stateid(s);
				3761	s->st_stid.sc_type = NFS4_CLOSED_STID;
				3762	}
				3763
				3764	/*
				3765	* nfs4_unlock_state() called after encode
				3766	*/
				3767	__be32
				3768	nfsd4_close(struct svc_rqst rqstp, struct nfsd4_compound_state cstate,
				3769	struct nfsd4_close *close)
				3770	{
				3771	__be32 status;
				3772	struct nfs4_openowner *oo;
				3773	struct nfs4_ol_stateid *stp;
				3774
				3775	dprintk("NFSD: nfsd4_close on file %.*s\n",
				3776	(int)cstate->current_fh.fh_dentry->d_name.len,
				3777	cstate->current_fh.fh_dentry->d_name.name);
				3778
				3779	nfs4_lock_state();
				3780	status = nfs4_preprocess_seqid_op(cstate, close->cl_seqid,
				3781	&close->cl_stateid,
				3782	NFS4_OPEN_STID\|NFS4_CLOSED_STID,
				3783	&stp);
				3784	if (status)
				3785	goto out;
				3786	oo = openowner(stp->st_stateowner);
				3787	status = nfs_ok;
				3788	update_stateid(&stp->st_stid.sc_stateid);
				3789	memcpy(&close->cl_stateid, &stp->st_stid.sc_stateid, sizeof(stateid_t));
				3790
				3791	nfsd4_close_open_stateid(stp);
				3792	release_last_closed_stateid(oo);
				3793	oo->oo_last_closed_stid = stp;
				3794
				3795	/* place unused nfs4_stateowners on so_close_lru list to be
				3796	* released by the laundromat service after the lease period
				3797	* to enable us to handle CLOSE replay
				3798	*/
				3799	if (list_empty(&oo->oo_owner.so_stateids))
				3800	move_to_close_lru(oo);
				3801	out:
				3802	if (!cstate->replay_owner)
				3803	nfs4_unlock_state();
				3804	return status;
				3805	}
				3806
				3807	__be32
				3808	nfsd4_delegreturn(struct svc_rqst rqstp, struct nfsd4_compound_state cstate,
				3809	struct nfsd4_delegreturn *dr)
				3810	{
				3811	struct nfs4_delegation *dp;
				3812	stateid_t *stateid = &dr->dr_stateid;
				3813	struct nfs4_stid *s;
				3814	struct inode *inode;
				3815	__be32 status;
				3816
				3817	if ((status = fh_verify(rqstp, &cstate->current_fh, S_IFREG, 0)))
				3818	return status;
				3819	inode = cstate->current_fh.fh_dentry->d_inode;
				3820
				3821	nfs4_lock_state();
				3822	status = nfsd4_lookup_stateid(stateid, NFS4_DELEG_STID, &s);
				3823	if (status)
				3824	goto out;
				3825	dp = delegstateid(s);
				3826	status = check_stateid_generation(stateid, &dp->dl_stid.sc_stateid, nfsd4_has_session(cstate));
				3827	if (status)
				3828	goto out;
				3829
				3830	unhash_delegation(dp);
				3831	out:
				3832	nfs4_unlock_state();
				3833
				3834	return status;
				3835	}
				3836
				3837
				3838	#define LOFF_OVERFLOW(start, len) ((u64)(len) > ~(u64)(start))
				3839
				3840	#define LOCKOWNER_INO_HASH_BITS 8
				3841	#define LOCKOWNER_INO_HASH_SIZE (1 << LOCKOWNER_INO_HASH_BITS)
				3842	#define LOCKOWNER_INO_HASH_MASK (LOCKOWNER_INO_HASH_SIZE - 1)
				3843
				3844	static inline u64
				3845	end_offset(u64 start, u64 len)
				3846	{
				3847	u64 end;
				3848
				3849	end = start + len;
				3850	return end >= start ? end: NFS4_MAX_UINT64;
				3851	}
				3852
				3853	/* last octet in a range */
				3854	static inline u64
				3855	last_byte_offset(u64 start, u64 len)
				3856	{
				3857	u64 end;
				3858
				3859	BUG_ON(!len);
				3860	end = start + len;
				3861	return end > start ? end - 1: NFS4_MAX_UINT64;
				3862	}
				3863
				3864	static unsigned int lockowner_ino_hashval(struct inode inode, u32 cl_id, struct xdr_netobj ownername)
				3865	{
				3866	return (file_hashval(inode) + cl_id
				3867	+ opaque_hashval(ownername->data, ownername->len))
				3868	& LOCKOWNER_INO_HASH_MASK;
				3869	}
				3870
				3871	static struct list_head lockowner_ino_hashtbl[LOCKOWNER_INO_HASH_SIZE];
				3872
				3873	/*
				3874	* TODO: Linux file offsets are _signed_ 64-bit quantities, which means that
				3875	* we can't properly handle lock requests that go beyond the (2^63 - 1)-th
				3876	* byte, because of sign extension problems. Since NFSv4 calls for 64-bit
				3877	* locking, this prevents us from being completely protocol-compliant. The
				3878	* real solution to this problem is to start using unsigned file offsets in
				3879	* the VFS, but this is a very deep change!
				3880	*/
				3881	static inline void
				3882	nfs4_transform_lock_offset(struct file_lock *lock)
				3883	{
				3884	if (lock->fl_start < 0)
				3885	lock->fl_start = OFFSET_MAX;
				3886	if (lock->fl_end < 0)
				3887	lock->fl_end = OFFSET_MAX;
				3888	}
				3889
				3890	/* Hack!: For now, we're defining this just so we can use a pointer to it
				3891	* as a unique cookie to identify our (NFSv4's) posix locks. */
				3892	static const struct lock_manager_operations nfsd_posix_mng_ops = {
				3893	};
				3894
				3895	static inline void
				3896	nfs4_set_lock_denied(struct file_lock fl, struct nfsd4_lock_denied deny)
				3897	{
				3898	struct nfs4_lockowner *lo;
				3899
				3900	if (fl->fl_lmops == &nfsd_posix_mng_ops) {
				3901	lo = (struct nfs4_lockowner *) fl->fl_owner;
				3902	deny->ld_owner.data = kmemdup(lo->lo_owner.so_owner.data,
				3903	lo->lo_owner.so_owner.len, GFP_KERNEL);
				3904	if (!deny->ld_owner.data)
				3905	/* We just don't care that much */
				3906	goto nevermind;
				3907	deny->ld_owner.len = lo->lo_owner.so_owner.len;
				3908	deny->ld_clientid = lo->lo_owner.so_client->cl_clientid;
				3909	} else {
				3910	nevermind:
				3911	deny->ld_owner.len = 0;
				3912	deny->ld_owner.data = NULL;
				3913	deny->ld_clientid.cl_boot = 0;
				3914	deny->ld_clientid.cl_id = 0;
				3915	}
				3916	deny->ld_start = fl->fl_start;
				3917	deny->ld_length = NFS4_MAX_UINT64;
				3918	if (fl->fl_end != NFS4_MAX_UINT64)
				3919	deny->ld_length = fl->fl_end - fl->fl_start + 1;
				3920	deny->ld_type = NFS4_READ_LT;
				3921	if (fl->fl_type != F_RDLCK)
				3922	deny->ld_type = NFS4_WRITE_LT;
				3923	}
				3924
				3925	static bool same_lockowner_ino(struct nfs4_lockowner lo, struct inode inode, clientid_t clid, struct xdr_netobj owner)
				3926	{
				3927	struct nfs4_ol_stateid *lst;
				3928
				3929	if (!same_owner_str(&lo->lo_owner, owner, clid))
				3930	return false;
				3931	if (list_empty(&lo->lo_owner.so_stateids)) {
				3932	WARN_ON_ONCE(1);
				3933	return false;
				3934	}
				3935	lst = list_first_entry(&lo->lo_owner.so_stateids,
				3936	struct nfs4_ol_stateid, st_perstateowner);
				3937	return lst->st_file->fi_inode == inode;
				3938	}
				3939
				3940	static struct nfs4_lockowner *
				3941	find_lockowner_str(struct inode inode, clientid_t clid,
				3942	struct xdr_netobj *owner)
				3943	{
				3944	unsigned int hashval = lockowner_ino_hashval(inode, clid->cl_id, owner);
				3945	struct nfs4_lockowner *lo;
				3946
				3947	list_for_each_entry(lo, &lockowner_ino_hashtbl[hashval], lo_owner_ino_hash) {
				3948	if (same_lockowner_ino(lo, inode, clid, owner))
				3949	return lo;
				3950	}
				3951	return NULL;
				3952	}
				3953
				3954	static void hash_lockowner(struct nfs4_lockowner lo, unsigned int strhashval, struct nfs4_client clp, struct nfs4_ol_stateid *open_stp)
				3955	{
				3956	struct inode *inode = open_stp->st_file->fi_inode;
				3957	unsigned int inohash = lockowner_ino_hashval(inode,
				3958	clp->cl_clientid.cl_id, &lo->lo_owner.so_owner);
				3959
				3960	list_add(&lo->lo_owner.so_strhash, &ownerstr_hashtbl[strhashval]);
				3961	list_add(&lo->lo_owner_ino_hash, &lockowner_ino_hashtbl[inohash]);
				3962	list_add(&lo->lo_perstateid, &open_stp->st_lockowners);
				3963	}
				3964
				3965	/*
				3966	* Alloc a lock owner structure.
				3967	* Called in nfsd4_lock - therefore, OPEN and OPEN_CONFIRM (if needed) has
				3968	* occurred.
				3969	*
				3970	* strhashval = ownerstr_hashval
				3971	*/
				3972
				3973	static struct nfs4_lockowner *
				3974	alloc_init_lock_stateowner(unsigned int strhashval, struct nfs4_client clp, struct nfs4_ol_stateid open_stp, struct nfsd4_lock *lock) {
				3975	struct nfs4_lockowner *lo;
				3976
				3977	lo = alloc_stateowner(lockowner_slab, &lock->lk_new_owner, clp);
				3978	if (!lo)
				3979	return NULL;
				3980	INIT_LIST_HEAD(&lo->lo_owner.so_stateids);
				3981	lo->lo_owner.so_is_open_owner = 0;
				3982	/* It is the openowner seqid that will be incremented in encode in the
				3983	* case of new lockowners; so increment the lock seqid manually: */
				3984	lo->lo_owner.so_seqid = lock->lk_new_lock_seqid + 1;
				3985	hash_lockowner(lo, strhashval, clp, open_stp);
				3986	return lo;
				3987	}
				3988
				3989	static struct nfs4_ol_stateid *
				3990	alloc_init_lock_stateid(struct nfs4_lockowner lo, struct nfs4_file fp, struct nfs4_ol_stateid *open_stp)
				3991	{
				3992	struct nfs4_ol_stateid *stp;
				3993	struct nfs4_client *clp = lo->lo_owner.so_client;
				3994
				3995	stp = nfs4_alloc_stateid(clp);
				3996	if (stp == NULL)
				3997	return NULL;
				3998	init_stid(&stp->st_stid, clp, NFS4_LOCK_STID);
				3999	list_add(&stp->st_perfile, &fp->fi_stateids);
				4000	list_add(&stp->st_perstateowner, &lo->lo_owner.so_stateids);
				4001	stp->st_stateowner = &lo->lo_owner;
				4002	get_nfs4_file(fp);
				4003	stp->st_file = fp;
				4004	stp->st_access_bmap = 0;
				4005	stp->st_deny_bmap = open_stp->st_deny_bmap;
				4006	stp->st_openstp = open_stp;
				4007	return stp;
				4008	}
				4009
				4010	static int
				4011	check_lock_length(u64 offset, u64 length)
				4012	{
				4013	return ((length == 0) \|\| ((length != NFS4_MAX_UINT64) &&
				4014	LOFF_OVERFLOW(offset, length)));
				4015	}
				4016
				4017	static void get_lock_access(struct nfs4_ol_stateid *lock_stp, u32 access)
				4018	{
				4019	struct nfs4_file *fp = lock_stp->st_file;
				4020	int oflag = nfs4_access_to_omode(access);
				4021
				4022	if (test_bit(access, &lock_stp->st_access_bmap))
				4023	return;
				4024	nfs4_file_get_access(fp, oflag);
				4025	__set_bit(access, &lock_stp->st_access_bmap);
				4026	}
				4027
				4028	__be32 lookup_or_create_lock_state(struct nfsd4_compound_state cstate, struct nfs4_ol_stateid ost, struct nfsd4_lock lock, struct nfs4_ol_stateid lst, bool new)
				4029	{
				4030	struct nfs4_file *fi = ost->st_file;
				4031	struct nfs4_openowner *oo = openowner(ost->st_stateowner);
				4032	struct nfs4_client *cl = oo->oo_owner.so_client;
				4033	struct nfs4_lockowner *lo;
				4034	unsigned int strhashval;
				4035
				4036	lo = find_lockowner_str(fi->fi_inode, &cl->cl_clientid, &lock->v.new.owner);
				4037	if (lo) {
				4038	if (!cstate->minorversion)
				4039	return nfserr_bad_seqid;
				4040	/* XXX: a lockowner always has exactly one stateid: */
				4041	*lst = list_first_entry(&lo->lo_owner.so_stateids,
				4042	struct nfs4_ol_stateid, st_perstateowner);
				4043	return nfs_ok;
				4044	}
				4045	strhashval = ownerstr_hashval(cl->cl_clientid.cl_id,
				4046	&lock->v.new.owner);
				4047	lo = alloc_init_lock_stateowner(strhashval, cl, ost, lock);
				4048	if (lo == NULL)
				4049	return nfserr_jukebox;
				4050	*lst = alloc_init_lock_stateid(lo, fi, ost);
				4051	if (*lst == NULL) {
				4052	release_lockowner(lo);
				4053	return nfserr_jukebox;
				4054	}
				4055	*new = true;
				4056	return nfs_ok;
				4057	}
				4058
				4059	/*
				4060	* LOCK operation
				4061	*/
				4062	__be32
				4063	nfsd4_lock(struct svc_rqst rqstp, struct nfsd4_compound_state cstate,
				4064	struct nfsd4_lock *lock)
				4065	{
				4066	struct nfs4_openowner *open_sop = NULL;
				4067	struct nfs4_lockowner *lock_sop = NULL;
				4068	struct nfs4_ol_stateid *lock_stp;
				4069	struct nfs4_file *fp;
				4070	struct file *filp = NULL;
				4071	struct file_lock file_lock;
				4072	struct file_lock conflock;
				4073	__be32 status = 0;
				4074	bool new_state = false;
				4075	int lkflg;
				4076	int err;
				4077
				4078	dprintk("NFSD: nfsd4_lock: start=%Ld length=%Ld\n",
				4079	(long long) lock->lk_offset,
				4080	(long long) lock->lk_length);
				4081
				4082	if (check_lock_length(lock->lk_offset, lock->lk_length))
				4083	return nfserr_inval;
				4084
				4085	if ((status = fh_verify(rqstp, &cstate->current_fh,
				4086	S_IFREG, NFSD_MAY_LOCK))) {
				4087	dprintk("NFSD: nfsd4_lock: permission denied!\n");
				4088	return status;
				4089	}
				4090
				4091	nfs4_lock_state();
				4092
				4093	if (lock->lk_is_new) {
				4094	/*
				4095	* Client indicates that this is a new lockowner.
				4096	* Use open owner and open stateid to create lock owner and
				4097	* lock stateid.
				4098	*/
				4099	struct nfs4_ol_stateid *open_stp = NULL;
				4100
				4101	if (nfsd4_has_session(cstate))
				4102	/* See rfc 5661 18.10.3: given clientid is ignored: */
				4103	memcpy(&lock->v.new.clientid,
				4104	&cstate->session->se_client->cl_clientid,
				4105	sizeof(clientid_t));
				4106
				4107	status = nfserr_stale_clientid;
				4108	if (STALE_CLIENTID(&lock->lk_new_clientid))
				4109	goto out;
				4110
				4111	/* validate and update open stateid and open seqid */
				4112	status = nfs4_preprocess_confirmed_seqid_op(cstate,
				4113	lock->lk_new_open_seqid,
				4114	&lock->lk_new_open_stateid,
				4115	&open_stp);
				4116	if (status)
				4117	goto out;
				4118	open_sop = openowner(open_stp->st_stateowner);
				4119	status = nfserr_bad_stateid;
				4120	if (!same_clid(&open_sop->oo_owner.so_client->cl_clientid,
				4121	&lock->v.new.clientid))
				4122	goto out;
				4123	status = lookup_or_create_lock_state(cstate, open_stp, lock,
				4124	&lock_stp, &new_state);
				4125	if (status)
				4126	goto out;
				4127	} else {
				4128	/* lock (lock owner + lock stateid) already exists */
				4129	status = nfs4_preprocess_seqid_op(cstate,
				4130	lock->lk_old_lock_seqid,
				4131	&lock->lk_old_lock_stateid,
				4132	NFS4_LOCK_STID, &lock_stp);
				4133	if (status)
				4134	goto out;
				4135	}
				4136	lock_sop = lockowner(lock_stp->st_stateowner);
				4137	fp = lock_stp->st_file;
				4138
				4139	lkflg = setlkflg(lock->lk_type);
				4140	status = nfs4_check_openmode(lock_stp, lkflg);
				4141	if (status)
				4142	goto out;
				4143
				4144	status = nfserr_grace;
				4145	if (locks_in_grace() && !lock->lk_reclaim)
				4146	goto out;
				4147	status = nfserr_no_grace;
				4148	if (!locks_in_grace() && lock->lk_reclaim)
				4149	goto out;
				4150
				4151	locks_init_lock(&file_lock);
				4152	switch (lock->lk_type) {
				4153	case NFS4_READ_LT:
				4154	case NFS4_READW_LT:
				4155	filp = find_readable_file(lock_stp->st_file);
				4156	if (filp)
				4157	get_lock_access(lock_stp, NFS4_SHARE_ACCESS_READ);
				4158	file_lock.fl_type = F_RDLCK;
				4159	break;
				4160	case NFS4_WRITE_LT:
				4161	case NFS4_WRITEW_LT:
				4162	filp = find_writeable_file(lock_stp->st_file);
				4163	if (filp)
				4164	get_lock_access(lock_stp, NFS4_SHARE_ACCESS_WRITE);
				4165	file_lock.fl_type = F_WRLCK;
				4166	break;
				4167	default:
				4168	status = nfserr_inval;
				4169	goto out;
				4170	}
				4171	if (!filp) {
				4172	status = nfserr_openmode;
				4173	goto out;
				4174	}
				4175	file_lock.fl_owner = (fl_owner_t)lock_sop;
				4176	file_lock.fl_pid = current->tgid;
				4177	file_lock.fl_file = filp;
				4178	file_lock.fl_flags = FL_POSIX;
				4179	file_lock.fl_lmops = &nfsd_posix_mng_ops;
				4180
				4181	file_lock.fl_start = lock->lk_offset;
				4182	file_lock.fl_end = last_byte_offset(lock->lk_offset, lock->lk_length);
				4183	nfs4_transform_lock_offset(&file_lock);
				4184
				4185	/*
				4186	* Try to lock the file in the VFS.
				4187	* Note: locks.c uses the BKL to protect the inode's lock list.
				4188	*/
				4189
				4190	err = vfs_lock_file(filp, F_SETLK, &file_lock, &conflock);
				4191	switch (-err) {
				4192	case 0: /* success! */
				4193	update_stateid(&lock_stp->st_stid.sc_stateid);
				4194	memcpy(&lock->lk_resp_stateid, &lock_stp->st_stid.sc_stateid,
				4195	sizeof(stateid_t));
				4196	status = 0;
				4197	break;
				4198	case (EAGAIN): /* conflock holds conflicting lock */
				4199	status = nfserr_denied;
				4200	dprintk("NFSD: nfsd4_lock: conflicting lock found!\n");
				4201	nfs4_set_lock_denied(&conflock, &lock->lk_denied);
				4202	break;
				4203	case (EDEADLK):
				4204	status = nfserr_deadlock;
				4205	break;
				4206	default:
				4207	dprintk("NFSD: nfsd4_lock: vfs_lock_file() failed! status %d\n",err);
				4208	status = nfserrno(err);
				4209	break;
				4210	}
				4211	out:
				4212	if (status && new_state)
				4213	release_lockowner(lock_sop);
				4214	if (!cstate->replay_owner)
				4215	nfs4_unlock_state();
				4216	return status;
				4217	}
				4218
				4219	/*
				4220	* The NFSv4 spec allows a client to do a LOCKT without holding an OPEN,
				4221	* so we do a temporary open here just to get an open file to pass to
				4222	* vfs_test_lock. (Arguably perhaps test_lock should be done with an
				4223	* inode operation.)
				4224	*/
				4225	static __be32 nfsd_test_lock(struct svc_rqst rqstp, struct svc_fh fhp, struct file_lock *lock)
				4226	{
				4227	struct file *file;
				4228	__be32 err = nfsd_open(rqstp, fhp, S_IFREG, NFSD_MAY_READ, &file);
				4229	if (!err) {
				4230	err = nfserrno(vfs_test_lock(file, lock));
				4231	nfsd_close(file);
				4232	}
				4233	return err;
				4234	}
				4235
				4236	/*
				4237	* LOCKT operation
				4238	*/
				4239	__be32
				4240	nfsd4_lockt(struct svc_rqst rqstp, struct nfsd4_compound_state cstate,
				4241	struct nfsd4_lockt *lockt)
				4242	{
				4243	struct inode *inode;
				4244	struct file_lock file_lock;
				4245	struct nfs4_lockowner *lo;
				4246	__be32 status;
				4247
				4248	if (locks_in_grace())
				4249	return nfserr_grace;
				4250
				4251	if (check_lock_length(lockt->lt_offset, lockt->lt_length))
				4252	return nfserr_inval;
				4253
				4254	nfs4_lock_state();
				4255
				4256	status = nfserr_stale_clientid;
				4257	if (!nfsd4_has_session(cstate) && STALE_CLIENTID(&lockt->lt_clientid))
				4258	goto out;
				4259
				4260	if ((status = fh_verify(rqstp, &cstate->current_fh, S_IFREG, 0)))
				4261	goto out;
				4262
				4263	inode = cstate->current_fh.fh_dentry->d_inode;
				4264	locks_init_lock(&file_lock);
				4265	switch (lockt->lt_type) {
				4266	case NFS4_READ_LT:
				4267	case NFS4_READW_LT:
				4268	file_lock.fl_type = F_RDLCK;
				4269	break;
				4270	case NFS4_WRITE_LT:
				4271	case NFS4_WRITEW_LT:
				4272	file_lock.fl_type = F_WRLCK;
				4273	break;
				4274	default:
				4275	dprintk("NFSD: nfs4_lockt: bad lock type!\n");
				4276	status = nfserr_inval;
				4277	goto out;
				4278	}
				4279
				4280	lo = find_lockowner_str(inode, &lockt->lt_clientid, &lockt->lt_owner);
				4281	if (lo)
				4282	file_lock.fl_owner = (fl_owner_t)lo;
				4283	file_lock.fl_pid = current->tgid;
				4284	file_lock.fl_flags = FL_POSIX;
				4285
				4286	file_lock.fl_start = lockt->lt_offset;
				4287	file_lock.fl_end = last_byte_offset(lockt->lt_offset, lockt->lt_length);
				4288
				4289	nfs4_transform_lock_offset(&file_lock);
				4290
				4291	status = nfsd_test_lock(rqstp, &cstate->current_fh, &file_lock);
				4292	if (status)
				4293	goto out;
				4294
				4295	if (file_lock.fl_type != F_UNLCK) {
				4296	status = nfserr_denied;
				4297	nfs4_set_lock_denied(&file_lock, &lockt->lt_denied);
				4298	}
				4299	out:
				4300	nfs4_unlock_state();
				4301	return status;
				4302	}
				4303
				4304	__be32
				4305	nfsd4_locku(struct svc_rqst rqstp, struct nfsd4_compound_state cstate,
				4306	struct nfsd4_locku *locku)
				4307	{
				4308	struct nfs4_ol_stateid *stp;
				4309	struct file *filp = NULL;
				4310	struct file_lock file_lock;
				4311	__be32 status;
				4312	int err;
				4313
				4314	dprintk("NFSD: nfsd4_locku: start=%Ld length=%Ld\n",
				4315	(long long) locku->lu_offset,
				4316	(long long) locku->lu_length);
				4317
				4318	if (check_lock_length(locku->lu_offset, locku->lu_length))
				4319	return nfserr_inval;
				4320
				4321	nfs4_lock_state();
				4322
				4323	status = nfs4_preprocess_seqid_op(cstate, locku->lu_seqid,
				4324	&locku->lu_stateid, NFS4_LOCK_STID, &stp);
				4325	if (status)
				4326	goto out;
				4327	filp = find_any_file(stp->st_file);
				4328	if (!filp) {
				4329	status = nfserr_lock_range;
				4330	goto out;
				4331	}
				4332	BUG_ON(!filp);
				4333	locks_init_lock(&file_lock);
				4334	file_lock.fl_type = F_UNLCK;
				4335	file_lock.fl_owner = (fl_owner_t)lockowner(stp->st_stateowner);
				4336	file_lock.fl_pid = current->tgid;
				4337	file_lock.fl_file = filp;
				4338	file_lock.fl_flags = FL_POSIX;
				4339	file_lock.fl_lmops = &nfsd_posix_mng_ops;
				4340	file_lock.fl_start = locku->lu_offset;
				4341
				4342	file_lock.fl_end = last_byte_offset(locku->lu_offset, locku->lu_length);
				4343	nfs4_transform_lock_offset(&file_lock);
				4344
				4345	/*
				4346	* Try to unlock the file in the VFS.
				4347	*/
				4348	err = vfs_lock_file(filp, F_SETLK, &file_lock, NULL);
				4349	if (err) {
				4350	dprintk("NFSD: nfs4_locku: vfs_lock_file failed!\n");
				4351	goto out_nfserr;
				4352	}
				4353	/*
				4354	* OK, unlock succeeded; the only thing left to do is update the stateid.
				4355	*/
				4356	update_stateid(&stp->st_stid.sc_stateid);
				4357	memcpy(&locku->lu_stateid, &stp->st_stid.sc_stateid, sizeof(stateid_t));
				4358
				4359	out:
				4360	if (!cstate->replay_owner)
				4361	nfs4_unlock_state();
				4362	return status;
				4363
				4364	out_nfserr:
				4365	status = nfserrno(err);
				4366	goto out;
				4367	}
				4368
				4369	/*
				4370	* returns
				4371	* 1: locks held by lockowner
				4372	* 0: no locks held by lockowner
				4373	*/
				4374	static int
				4375	check_for_locks(struct nfs4_file filp, struct nfs4_lockowner lowner)
				4376	{
				4377	struct file_lock **flpp;
				4378	struct inode *inode = filp->fi_inode;
				4379	int status = 0;
				4380
				4381	lock_flocks();
				4382	for (flpp = &inode->i_flock; flpp != NULL; flpp = &(flpp)->fl_next) {
				4383	if ((*flpp)->fl_owner == (fl_owner_t)lowner) {
				4384	status = 1;
				4385	goto out;
				4386	}
				4387	}
				4388	out:
				4389	unlock_flocks();
				4390	return status;
				4391	}
				4392
				4393	__be32
				4394	nfsd4_release_lockowner(struct svc_rqst *rqstp,
				4395	struct nfsd4_compound_state *cstate,
				4396	struct nfsd4_release_lockowner *rlockowner)
				4397	{
				4398	clientid_t *clid = &rlockowner->rl_clientid;
				4399	struct nfs4_stateowner *sop;
				4400	struct nfs4_lockowner *lo;
				4401	struct nfs4_ol_stateid *stp;
				4402	struct xdr_netobj *owner = &rlockowner->rl_owner;
				4403	struct list_head matches;
				4404	unsigned int hashval = ownerstr_hashval(clid->cl_id, owner);
				4405	__be32 status;
				4406
				4407	dprintk("nfsd4_release_lockowner clientid: (%08x/%08x):\n",
				4408	clid->cl_boot, clid->cl_id);
				4409
				4410	/* XXX check for lease expiration */
				4411
				4412	status = nfserr_stale_clientid;
				4413	if (STALE_CLIENTID(clid))
				4414	return status;
				4415
				4416	nfs4_lock_state();
				4417
				4418	status = nfserr_locks_held;
				4419	INIT_LIST_HEAD(&matches);
				4420
				4421	list_for_each_entry(sop, &ownerstr_hashtbl[hashval], so_strhash) {
				4422	if (sop->so_is_open_owner)
				4423	continue;
				4424	if (!same_owner_str(sop, owner, clid))
				4425	continue;
				4426	list_for_each_entry(stp, &sop->so_stateids,
				4427	st_perstateowner) {
				4428	lo = lockowner(sop);
				4429	if (check_for_locks(stp->st_file, lo))
				4430	goto out;
				4431	list_add(&lo->lo_list, &matches);
				4432	}
				4433	}
				4434	/* Clients probably won't expect us to return with some (but not all)
				4435	* of the lockowner state released; so don't release any until all
				4436	* have been checked. */
				4437	status = nfs_ok;
				4438	while (!list_empty(&matches)) {
				4439	lo = list_entry(matches.next, struct nfs4_lockowner,
				4440	lo_list);
				4441	/* unhash_stateowner deletes so_perclient only
				4442	* for openowners. */
				4443	list_del(&lo->lo_list);
				4444	release_lockowner(lo);
				4445	}
				4446	out:
				4447	nfs4_unlock_state();
				4448	return status;
				4449	}
				4450
				4451	static inline struct nfs4_client_reclaim *
				4452	alloc_reclaim(void)
				4453	{
				4454	return kmalloc(sizeof(struct nfs4_client_reclaim), GFP_KERNEL);
				4455	}
				4456
				4457	int
				4458	nfs4_has_reclaimed_state(const char *name, bool use_exchange_id)
				4459	{
				4460	unsigned int strhashval = clientstr_hashval(name);
				4461	struct nfs4_client *clp;
				4462
				4463	clp = find_confirmed_client_by_str(name, strhashval);
				4464	if (!clp)
				4465	return 0;
				4466	return test_bit(NFSD4_CLIENT_STABLE, &clp->cl_flags);
				4467	}
				4468
				4469	/*
				4470	* failure => all reset bets are off, nfserr_no_grace...
				4471	*/
				4472	int
				4473	nfs4_client_to_reclaim(const char *name)
				4474	{
				4475	unsigned int strhashval;
				4476	struct nfs4_client_reclaim *crp = NULL;
				4477
				4478	dprintk("NFSD nfs4_client_to_reclaim NAME: %.*s\n", HEXDIR_LEN, name);
				4479	crp = alloc_reclaim();
				4480	if (!crp)
				4481	return 0;
				4482	strhashval = clientstr_hashval(name);
				4483	INIT_LIST_HEAD(&crp->cr_strhash);
				4484	list_add(&crp->cr_strhash, &reclaim_str_hashtbl[strhashval]);
				4485	memcpy(crp->cr_recdir, name, HEXDIR_LEN);
				4486	reclaim_str_hashtbl_size++;
				4487	return 1;
				4488	}
				4489
				4490	void
				4491	nfs4_release_reclaim(void)
				4492	{
				4493	struct nfs4_client_reclaim *crp = NULL;
				4494	int i;
				4495
				4496	for (i = 0; i < CLIENT_HASH_SIZE; i++) {
				4497	while (!list_empty(&reclaim_str_hashtbl[i])) {
				4498	crp = list_entry(reclaim_str_hashtbl[i].next,
				4499	struct nfs4_client_reclaim, cr_strhash);
				4500	list_del(&crp->cr_strhash);
				4501	kfree(crp);
				4502	reclaim_str_hashtbl_size--;
				4503	}
				4504	}
				4505	BUG_ON(reclaim_str_hashtbl_size);
				4506	}
				4507
				4508	/*
				4509	* called from OPEN, CLAIM_PREVIOUS with a new clientid. */
				4510	struct nfs4_client_reclaim *
				4511	nfsd4_find_reclaim_client(struct nfs4_client *clp)
				4512	{
				4513	unsigned int strhashval;
				4514	struct nfs4_client_reclaim *crp = NULL;
				4515
				4516	dprintk("NFSD: nfs4_find_reclaim_client for %.*s with recdir %s\n",
				4517	clp->cl_name.len, clp->cl_name.data,
				4518	clp->cl_recdir);
				4519
				4520	/* find clp->cl_name in reclaim_str_hashtbl */
				4521	strhashval = clientstr_hashval(clp->cl_recdir);
				4522	list_for_each_entry(crp, &reclaim_str_hashtbl[strhashval], cr_strhash) {
				4523	if (same_name(crp->cr_recdir, clp->cl_recdir)) {
				4524	return crp;
				4525	}
				4526	}
				4527	return NULL;
				4528	}
				4529
				4530	/*
				4531	* Called from OPEN. Look for clientid in reclaim list.
				4532	*/
				4533	__be32
				4534	nfs4_check_open_reclaim(clientid_t *clid)
				4535	{
				4536	struct nfs4_client *clp;
				4537
				4538	/* find clientid in conf_id_hashtbl */
				4539	clp = find_confirmed_client(clid);
				4540	if (clp == NULL)
				4541	return nfserr_reclaim_bad;
				4542
				4543	return nfsd4_client_record_check(clp) ? nfserr_reclaim_bad : nfs_ok;
				4544	}
				4545
				4546	#ifdef CONFIG_NFSD_FAULT_INJECTION
				4547
				4548	void nfsd_forget_clients(u64 num)
				4549	{
				4550	struct nfs4_client clp, next;
				4551	int count = 0;
				4552
				4553	nfs4_lock_state();
				4554	list_for_each_entry_safe(clp, next, &client_lru, cl_lru) {
				4555	nfsd4_client_record_remove(clp);
				4556	expire_client(clp);
				4557	if (++count == num)
				4558	break;
				4559	}
				4560	nfs4_unlock_state();
				4561
				4562	printk(KERN_INFO "NFSD: Forgot %d clients", count);
				4563	}
				4564
				4565	static void release_lockowner_sop(struct nfs4_stateowner *sop)
				4566	{
				4567	release_lockowner(lockowner(sop));
				4568	}
				4569
				4570	static void release_openowner_sop(struct nfs4_stateowner *sop)
				4571	{
				4572	release_openowner(openowner(sop));
				4573	}
				4574
				4575	static int nfsd_release_n_owners(u64 num, bool is_open_owner,
				4576	void (release_sop)(struct nfs4_stateowner ))
				4577	{
				4578	int i, count = 0;
				4579	struct nfs4_stateowner sop, next;
				4580
				4581	for (i = 0; i < OWNER_HASH_SIZE; i++) {
				4582	list_for_each_entry_safe(sop, next, &ownerstr_hashtbl[i], so_strhash) {
				4583	if (sop->so_is_open_owner != is_open_owner)
				4584	continue;
				4585	release_sop(sop);
				4586	if (++count == num)
				4587	return count;
				4588	}
				4589	}
				4590	return count;
				4591	}
				4592
				4593	void nfsd_forget_locks(u64 num)
				4594	{
				4595	int count;
				4596
				4597	nfs4_lock_state();
				4598	count = nfsd_release_n_owners(num, false, release_lockowner_sop);
				4599	nfs4_unlock_state();
				4600
				4601	printk(KERN_INFO "NFSD: Forgot %d locks", count);
				4602	}
				4603
				4604	void nfsd_forget_openowners(u64 num)
				4605	{
				4606	int count;
				4607
				4608	nfs4_lock_state();
				4609	count = nfsd_release_n_owners(num, true, release_openowner_sop);
				4610	nfs4_unlock_state();
				4611
				4612	printk(KERN_INFO "NFSD: Forgot %d open owners", count);
				4613	}
				4614
				4615	int nfsd_process_n_delegations(u64 num, void (deleg_func)(struct nfs4_delegation ))
				4616	{
				4617	int i, count = 0;
				4618	struct nfs4_file fp, fnext;
				4619	struct nfs4_delegation dp, dnext;
				4620
				4621	for (i = 0; i < FILE_HASH_SIZE; i++) {
				4622	list_for_each_entry_safe(fp, fnext, &file_hashtbl[i], fi_hash) {
				4623	list_for_each_entry_safe(dp, dnext, &fp->fi_delegations, dl_perfile) {
				4624	deleg_func(dp);
				4625	if (++count == num)
				4626	return count;
				4627	}
				4628	}
				4629	}
				4630
				4631	return count;
				4632	}
				4633
				4634	void nfsd_forget_delegations(u64 num)
				4635	{
				4636	unsigned int count;
				4637
				4638	nfs4_lock_state();
				4639	count = nfsd_process_n_delegations(num, unhash_delegation);
				4640	nfs4_unlock_state();
				4641
				4642	printk(KERN_INFO "NFSD: Forgot %d delegations", count);
				4643	}
				4644
				4645	void nfsd_recall_delegations(u64 num)
				4646	{
				4647	unsigned int count;
				4648
				4649	nfs4_lock_state();
				4650	spin_lock(&recall_lock);
				4651	count = nfsd_process_n_delegations(num, nfsd_break_one_deleg);
				4652	spin_unlock(&recall_lock);
				4653	nfs4_unlock_state();
				4654
				4655	printk(KERN_INFO "NFSD: Recalled %d delegations", count);
				4656	}
				4657
				4658	#endif /* CONFIG_NFSD_FAULT_INJECTION */
				4659
				4660	/* initialization to perform at module load time: */
				4661
				4662	void
				4663	nfs4_state_init(void)
				4664	{
				4665	int i;
				4666
				4667	for (i = 0; i < CLIENT_HASH_SIZE; i++) {
				4668	INIT_LIST_HEAD(&conf_id_hashtbl[i]);
				4669	INIT_LIST_HEAD(&conf_str_hashtbl[i]);
				4670	INIT_LIST_HEAD(&unconf_str_hashtbl[i]);
				4671	INIT_LIST_HEAD(&unconf_id_hashtbl[i]);
				4672	INIT_LIST_HEAD(&reclaim_str_hashtbl[i]);
				4673	}
				4674	for (i = 0; i < SESSION_HASH_SIZE; i++)
				4675	INIT_LIST_HEAD(&sessionid_hashtbl[i]);
				4676	for (i = 0; i < FILE_HASH_SIZE; i++) {
				4677	INIT_LIST_HEAD(&file_hashtbl[i]);
				4678	}
				4679	for (i = 0; i < OWNER_HASH_SIZE; i++) {
				4680	INIT_LIST_HEAD(&ownerstr_hashtbl[i]);
				4681	}
				4682	for (i = 0; i < LOCKOWNER_INO_HASH_SIZE; i++)
				4683	INIT_LIST_HEAD(&lockowner_ino_hashtbl[i]);
				4684	INIT_LIST_HEAD(&close_lru);
				4685	INIT_LIST_HEAD(&client_lru);
				4686	INIT_LIST_HEAD(&del_recall_lru);
				4687	reclaim_str_hashtbl_size = 0;
				4688	}
				4689
				4690	/*
				4691	* Since the lifetime of a delegation isn't limited to that of an open, a
				4692	* client may quite reasonably hang on to a delegation as long as it has
				4693	* the inode cached. This becomes an obvious problem the first time a
				4694	* client's inode cache approaches the size of the server's total memory.
				4695	*
				4696	* For now we avoid this problem by imposing a hard limit on the number
				4697	* of delegations, which varies according to the server's memory size.
				4698	*/
				4699	static void
				4700	set_max_delegations(void)
				4701	{
				4702	/*
				4703	* Allow at most 4 delegations per megabyte of RAM. Quick
				4704	* estimates suggest that in the worst case (where every delegation
				4705	* is for a different inode), a delegation could take about 1.5K,
				4706	* giving a worst case usage of about 6% of memory.
				4707	*/
				4708	max_delegations = nr_free_buffer_pages() >> (20 - 2 - PAGE_SHIFT);
				4709	}
				4710
				4711	/* initialization to perform when the nfsd service is started: */
				4712
				4713	int
				4714	nfs4_state_start(void)
				4715	{
				4716	int ret;
				4717
				4718	/*
				4719	* FIXME: For now, we hang most of the pernet global stuff off of
				4720	* init_net until nfsd is fully containerized. Eventually, we'll
				4721	* need to pass a net pointer into this function, take a reference
				4722	* to that instead and then do most of the rest of this on a per-net
				4723	* basis.
				4724	*/
				4725	get_net(&init_net);
				4726	nfsd4_client_tracking_init(&init_net);
				4727	boot_time = get_seconds();
				4728	locks_start_grace(&nfsd4_manager);
				4729	printk(KERN_INFO "NFSD: starting %ld-second grace period\n",
				4730	nfsd4_grace);
				4731	ret = set_callback_cred();
				4732	if (ret) {
				4733	ret = -ENOMEM;
				4734	goto out_recovery;
				4735	}
				4736	laundry_wq = create_singlethread_workqueue("nfsd4");
				4737	if (laundry_wq == NULL) {
				4738	ret = -ENOMEM;
				4739	goto out_recovery;
				4740	}
				4741	ret = nfsd4_create_callback_queue();
				4742	if (ret)
				4743	goto out_free_laundry;
				4744	queue_delayed_work(laundry_wq, &laundromat_work, nfsd4_grace * HZ);
				4745	set_max_delegations();
				4746	return 0;
				4747	out_free_laundry:
				4748	destroy_workqueue(laundry_wq);
				4749	out_recovery:
				4750	nfsd4_client_tracking_exit(&init_net);
				4751	put_net(&init_net);
				4752	return ret;
				4753	}
				4754
				4755	static void
				4756	__nfs4_state_shutdown(void)
				4757	{
				4758	int i;
				4759	struct nfs4_client *clp = NULL;
				4760	struct nfs4_delegation *dp = NULL;
				4761	struct list_head pos, next, reaplist;
				4762
				4763	for (i = 0; i < CLIENT_HASH_SIZE; i++) {
				4764	while (!list_empty(&conf_id_hashtbl[i])) {
				4765	clp = list_entry(conf_id_hashtbl[i].next, struct nfs4_client, cl_idhash);
				4766	expire_client(clp);
				4767	}
				4768	while (!list_empty(&unconf_str_hashtbl[i])) {
				4769	clp = list_entry(unconf_str_hashtbl[i].next, struct nfs4_client, cl_strhash);
				4770	expire_client(clp);
				4771	}
				4772	}
				4773	INIT_LIST_HEAD(&reaplist);
				4774	spin_lock(&recall_lock);
				4775	list_for_each_safe(pos, next, &del_recall_lru) {
				4776	dp = list_entry (pos, struct nfs4_delegation, dl_recall_lru);
				4777	list_move(&dp->dl_recall_lru, &reaplist);
				4778	}
				4779	spin_unlock(&recall_lock);
				4780	list_for_each_safe(pos, next, &reaplist) {
				4781	dp = list_entry (pos, struct nfs4_delegation, dl_recall_lru);
				4782	unhash_delegation(dp);
				4783	}
				4784
				4785	nfsd4_client_tracking_exit(&init_net);
				4786	put_net(&init_net);
				4787	}
				4788
				4789	void
				4790	nfs4_state_shutdown(void)
				4791	{
				4792	cancel_delayed_work_sync(&laundromat_work);
				4793	destroy_workqueue(laundry_wq);
				4794	locks_end_grace(&nfsd4_manager);
				4795	nfs4_lock_state();
				4796	__nfs4_state_shutdown();
				4797	nfs4_unlock_state();
				4798	nfsd4_destroy_callback_queue();
				4799	}
				4800
				4801	static void
				4802	get_stateid(struct nfsd4_compound_state cstate, stateid_t stateid)
				4803	{
				4804	if (HAS_STATE_ID(cstate, CURRENT_STATE_ID_FLAG) && CURRENT_STATEID(stateid))
				4805	memcpy(stateid, &cstate->current_stateid, sizeof(stateid_t));
				4806	}
				4807
				4808	static void
				4809	put_stateid(struct nfsd4_compound_state cstate, stateid_t stateid)
				4810	{
				4811	if (cstate->minorversion) {
				4812	memcpy(&cstate->current_stateid, stateid, sizeof(stateid_t));
				4813	SET_STATE_ID(cstate, CURRENT_STATE_ID_FLAG);
				4814	}
				4815	}
				4816
				4817	void
				4818	clear_current_stateid(struct nfsd4_compound_state *cstate)
				4819	{
				4820	CLEAR_STATE_ID(cstate, CURRENT_STATE_ID_FLAG);
				4821	}
				4822
				4823	/*
				4824	* functions to set current state id
				4825	*/
				4826	void
				4827	nfsd4_set_opendowngradestateid(struct nfsd4_compound_state cstate, struct nfsd4_open_downgrade odp)
				4828	{
				4829	put_stateid(cstate, &odp->od_stateid);
				4830	}
				4831
				4832	void
				4833	nfsd4_set_openstateid(struct nfsd4_compound_state cstate, struct nfsd4_open open)
				4834	{
				4835	put_stateid(cstate, &open->op_stateid);
				4836	}
				4837
				4838	void
				4839	nfsd4_set_closestateid(struct nfsd4_compound_state cstate, struct nfsd4_close close)
				4840	{
				4841	put_stateid(cstate, &close->cl_stateid);
				4842	}
				4843
				4844	void
				4845	nfsd4_set_lockstateid(struct nfsd4_compound_state cstate, struct nfsd4_lock lock)
				4846	{
				4847	put_stateid(cstate, &lock->lk_resp_stateid);
				4848	}
				4849
				4850	/*
				4851	* functions to consume current state id
				4852	*/
				4853
				4854	void
				4855	nfsd4_get_opendowngradestateid(struct nfsd4_compound_state cstate, struct nfsd4_open_downgrade odp)
				4856	{
				4857	get_stateid(cstate, &odp->od_stateid);
				4858	}
				4859
				4860	void
				4861	nfsd4_get_delegreturnstateid(struct nfsd4_compound_state cstate, struct nfsd4_delegreturn drp)
				4862	{
				4863	get_stateid(cstate, &drp->dr_stateid);
				4864	}
				4865
				4866	void
				4867	nfsd4_get_freestateid(struct nfsd4_compound_state cstate, struct nfsd4_free_stateid fsp)
				4868	{
				4869	get_stateid(cstate, &fsp->fr_stateid);
				4870	}
				4871
				4872	void
				4873	nfsd4_get_setattrstateid(struct nfsd4_compound_state cstate, struct nfsd4_setattr setattr)
				4874	{
				4875	get_stateid(cstate, &setattr->sa_stateid);
				4876	}
				4877
				4878	void
				4879	nfsd4_get_closestateid(struct nfsd4_compound_state cstate, struct nfsd4_close close)
				4880	{
				4881	get_stateid(cstate, &close->cl_stateid);
				4882	}
				4883
				4884	void
				4885	nfsd4_get_lockustateid(struct nfsd4_compound_state cstate, struct nfsd4_locku locku)
				4886	{
				4887	get_stateid(cstate, &locku->lu_stateid);
				4888	}
				4889
				4890	void
				4891	nfsd4_get_readstateid(struct nfsd4_compound_state cstate, struct nfsd4_read read)
				4892	{
				4893	get_stateid(cstate, &read->rd_stateid);
				4894	}
				4895
				4896	void
				4897	nfsd4_get_writestateid(struct nfsd4_compound_state cstate, struct nfsd4_write write)
				4898	{
				4899	get_stateid(cstate, &write->wr_stateid);
				4900	}