]> git.proxmox.com Git - mirror_ubuntu-hirsute-kernel.git/blame - fs/nfsd/nfs4state.c
nfsd4: remove unneeded CLAIM_DELEGATE_CUR workaround
[mirror_ubuntu-hirsute-kernel.git] / fs / nfsd / nfs4state.c
CommitLineData
1da177e4 1/*
1da177e4
LT
2* Copyright (c) 2001 The Regents of the University of Michigan.
3* All rights reserved.
4*
5* Kendrick Smith <kmsmith@umich.edu>
6* Andy Adamson <kandros@umich.edu>
7*
8* Redistribution and use in source and binary forms, with or without
9* modification, are permitted provided that the following conditions
10* are met:
11*
12* 1. Redistributions of source code must retain the above copyright
13* notice, this list of conditions and the following disclaimer.
14* 2. Redistributions in binary form must reproduce the above copyright
15* notice, this list of conditions and the following disclaimer in the
16* documentation and/or other materials provided with the distribution.
17* 3. Neither the name of the University nor the names of its
18* contributors may be used to endorse or promote products derived
19* from this software without specific prior written permission.
20*
21* THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED
22* WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
23* MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
24* DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
25* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
26* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
27* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
28* BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
29* LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
30* NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
31* SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
32*
33*/
34
aceaf78d 35#include <linux/file.h>
b89f4321 36#include <linux/fs.h>
5a0e3ad6 37#include <linux/slab.h>
0964a3d3 38#include <linux/namei.h>
c2f1a551 39#include <linux/swap.h>
17456804 40#include <linux/pagemap.h>
68e76ad0 41#include <linux/sunrpc/svcauth_gss.h>
363168b4 42#include <linux/sunrpc/clnt.h>
9a74af21 43#include "xdr4.h"
0a3adade 44#include "vfs.h"
1da177e4
LT
45
46#define NFSDDBG_FACILITY NFSDDBG_PROC
47
48/* Globals */
cf07d2ea 49time_t nfsd4_lease = 90; /* default lease time */
efc4bb4f 50time_t nfsd4_grace = 90;
fd39ca9a 51static time_t boot_time;
fd39ca9a
N
52static stateid_t zerostateid; /* bits all 0 */
53static stateid_t onestateid; /* bits all 1 */
ec6b5d7b 54static u64 current_sessionid = 1;
fd39ca9a
N
55
56#define ZERO_STATEID(stateid) (!memcmp((stateid), &zerostateid, sizeof(stateid_t)))
57#define ONE_STATEID(stateid) (!memcmp((stateid), &onestateid, sizeof(stateid_t)))
1da177e4 58
1da177e4 59/* forward declarations */
fe0750e5 60static int check_for_locks(struct nfs4_file *filp, struct nfs4_lockowner *lowner);
1da177e4 61
8b671b80
BF
62/* Locking: */
63
64/* Currently used for almost all code touching nfsv4 state: */
353ab6e9 65static DEFINE_MUTEX(client_mutex);
1da177e4 66
8b671b80
BF
67/*
68 * Currently used for the del_recall_lru and file hash table. In an
69 * effort to decrease the scope of the client_mutex, this spinlock may
70 * eventually cover more:
71 */
72static DEFINE_SPINLOCK(recall_lock);
73
fe0750e5
BF
74static struct kmem_cache *openowner_slab = NULL;
75static struct kmem_cache *lockowner_slab = NULL;
e18b890b
CL
76static struct kmem_cache *file_slab = NULL;
77static struct kmem_cache *stateid_slab = NULL;
78static struct kmem_cache *deleg_slab = NULL;
e60d4398 79
1da177e4
LT
80void
81nfs4_lock_state(void)
82{
353ab6e9 83 mutex_lock(&client_mutex);
1da177e4
LT
84}
85
86void
87nfs4_unlock_state(void)
88{
353ab6e9 89 mutex_unlock(&client_mutex);
1da177e4
LT
90}
91
92static inline u32
93opaque_hashval(const void *ptr, int nbytes)
94{
95 unsigned char *cptr = (unsigned char *) ptr;
96
97 u32 x = 0;
98 while (nbytes--) {
99 x *= 37;
100 x += *cptr++;
101 }
102 return x;
103}
104
1da177e4
LT
105static struct list_head del_recall_lru;
106
32513b40
BF
107static void nfsd4_free_file(struct nfs4_file *f)
108{
109 kmem_cache_free(file_slab, f);
110}
111
13cd2184
N
112static inline void
113put_nfs4_file(struct nfs4_file *fi)
114{
8b671b80
BF
115 if (atomic_dec_and_lock(&fi->fi_ref, &recall_lock)) {
116 list_del(&fi->fi_hash);
117 spin_unlock(&recall_lock);
118 iput(fi->fi_inode);
32513b40 119 nfsd4_free_file(fi);
8b671b80 120 }
13cd2184
N
121}
122
123static inline void
124get_nfs4_file(struct nfs4_file *fi)
125{
8b671b80 126 atomic_inc(&fi->fi_ref);
13cd2184
N
127}
128
ef0f3390 129static int num_delegations;
c2f1a551 130unsigned int max_delegations;
ef0f3390
N
131
132/*
133 * Open owner state (share locks)
134 */
135
506f275f
BF
136/* hash tables for open owners */
137#define OPEN_OWNER_HASH_BITS 8
138#define OPEN_OWNER_HASH_SIZE (1 << OPEN_OWNER_HASH_BITS)
139#define OPEN_OWNER_HASH_MASK (OPEN_OWNER_HASH_SIZE - 1)
ef0f3390 140
506f275f 141static unsigned int open_ownerstr_hashval(u32 clientid, struct xdr_netobj *ownername)
ddc04c41
BF
142{
143 unsigned int ret;
144
145 ret = opaque_hashval(ownername->data, ownername->len);
146 ret += clientid;
506f275f 147 return ret & OPEN_OWNER_HASH_MASK;
ddc04c41 148}
ef0f3390 149
506f275f 150static struct list_head open_ownerstr_hashtbl[OPEN_OWNER_HASH_SIZE];
ef0f3390
N
151
152/* hash table for nfs4_file */
153#define FILE_HASH_BITS 8
154#define FILE_HASH_SIZE (1 << FILE_HASH_BITS)
35079582 155
ddc04c41
BF
156static unsigned int file_hashval(struct inode *ino)
157{
158 /* XXX: why are we hashing on inode pointer, anyway? */
159 return hash_ptr(ino, FILE_HASH_BITS);
160}
161
ef0f3390 162static struct list_head file_hashtbl[FILE_HASH_SIZE];
ef0f3390 163
998db52c 164static void __nfs4_file_get_access(struct nfs4_file *fp, int oflag)
f9d7562f
BF
165{
166 BUG_ON(!(fp->fi_fds[oflag] || fp->fi_fds[O_RDWR]));
167 atomic_inc(&fp->fi_access[oflag]);
168}
169
998db52c
BF
170static void nfs4_file_get_access(struct nfs4_file *fp, int oflag)
171{
172 if (oflag == O_RDWR) {
173 __nfs4_file_get_access(fp, O_RDONLY);
174 __nfs4_file_get_access(fp, O_WRONLY);
175 } else
176 __nfs4_file_get_access(fp, oflag);
177}
178
179static void nfs4_file_put_fd(struct nfs4_file *fp, int oflag)
f9d7562f
BF
180{
181 if (fp->fi_fds[oflag]) {
182 fput(fp->fi_fds[oflag]);
183 fp->fi_fds[oflag] = NULL;
184 }
185}
186
998db52c 187static void __nfs4_file_put_access(struct nfs4_file *fp, int oflag)
f9d7562f
BF
188{
189 if (atomic_dec_and_test(&fp->fi_access[oflag])) {
f9d7562f 190 nfs4_file_put_fd(fp, oflag);
3d02fa29
BF
191 /*
192 * It's also safe to get rid of the RDWR open *if*
193 * we no longer have need of the other kind of access
194 * or if we already have the other kind of open:
195 */
196 if (fp->fi_fds[1-oflag]
197 || atomic_read(&fp->fi_access[1 - oflag]) == 0)
198 nfs4_file_put_fd(fp, O_RDWR);
f9d7562f
BF
199 }
200}
201
998db52c
BF
202static void nfs4_file_put_access(struct nfs4_file *fp, int oflag)
203{
204 if (oflag == O_RDWR) {
205 __nfs4_file_put_access(fp, O_RDONLY);
206 __nfs4_file_put_access(fp, O_WRONLY);
207 } else
208 __nfs4_file_put_access(fp, oflag);
209}
210
6136d2b4 211static inline int get_new_stid(struct nfs4_stid *stid)
36d44c60 212{
6136d2b4 213 static int min_stateid = 0;
38c2f4b1 214 struct idr *stateids = &stid->sc_client->cl_stateids;
6136d2b4
BF
215 int new_stid;
216 int error;
217
38c2f4b1 218 error = idr_get_new_above(stateids, stid, min_stateid, &new_stid);
6136d2b4 219 /*
996e0938
BF
220 * Note: the necessary preallocation was done in
221 * nfs4_alloc_stateid(). The idr code caps the number of
222 * preallocations that can exist at a time, but the state lock
223 * prevents anyone from using ours before we get here:
6136d2b4
BF
224 */
225 BUG_ON(error);
226 /*
227 * It shouldn't be a problem to reuse an opaque stateid value.
228 * I don't think it is for 4.1. But with 4.0 I worry that, for
229 * example, a stray write retransmission could be accepted by
230 * the server when it should have been rejected. Therefore,
231 * adopt a trick from the sctp code to attempt to maximize the
232 * amount of time until an id is reused, by ensuring they always
233 * "increase" (mod INT_MAX):
234 */
36d44c60 235
6136d2b4
BF
236 min_stateid = new_stid+1;
237 if (min_stateid == INT_MAX)
238 min_stateid = 0;
239 return new_stid;
36d44c60
BF
240}
241
996e0938 242static void init_stid(struct nfs4_stid *stid, struct nfs4_client *cl, unsigned char type)
2a74aba7
BF
243{
244 stateid_t *s = &stid->sc_stateid;
6136d2b4 245 int new_id;
2a74aba7
BF
246
247 stid->sc_type = type;
248 stid->sc_client = cl;
249 s->si_opaque.so_clid = cl->cl_clientid;
6136d2b4 250 new_id = get_new_stid(stid);
6136d2b4 251 s->si_opaque.so_id = (u32)new_id;
2a74aba7
BF
252 /* Will be incremented before return to client: */
253 s->si_generation = 0;
996e0938
BF
254}
255
256static struct nfs4_stid *nfs4_alloc_stid(struct nfs4_client *cl, struct kmem_cache *slab)
257{
258 struct idr *stateids = &cl->cl_stateids;
259
260 if (!idr_pre_get(stateids, GFP_KERNEL))
261 return NULL;
262 /*
263 * Note: if we fail here (or any time between now and the time
264 * we actually get the new idr), we won't need to undo the idr
265 * preallocation, since the idr code caps the number of
266 * preallocated entries.
267 */
268 return kmem_cache_alloc(slab, GFP_KERNEL);
2a74aba7
BF
269}
270
4cdc951b
BF
271static struct nfs4_ol_stateid * nfs4_alloc_stateid(struct nfs4_client *clp)
272{
273 return openlockstateid(nfs4_alloc_stid(clp, stateid_slab));
274}
275
1da177e4 276static struct nfs4_delegation *
dcef0413 277alloc_init_deleg(struct nfs4_client *clp, struct nfs4_ol_stateid *stp, struct svc_fh *current_fh, u32 type)
1da177e4
LT
278{
279 struct nfs4_delegation *dp;
280 struct nfs4_file *fp = stp->st_file;
1da177e4
LT
281
282 dprintk("NFSD alloc_init_deleg\n");
c3e48080
BF
283 /*
284 * Major work on the lease subsystem (for example, to support
285 * calbacks on stat) will be required before we can support
286 * write delegations properly.
287 */
288 if (type != NFS4_OPEN_DELEGATE_READ)
289 return NULL;
47f9940c
MS
290 if (fp->fi_had_conflict)
291 return NULL;
c2f1a551 292 if (num_delegations > max_delegations)
ef0f3390 293 return NULL;
996e0938 294 dp = delegstateid(nfs4_alloc_stid(clp, deleg_slab));
5b2d21c1 295 if (dp == NULL)
1da177e4 296 return dp;
996e0938 297 init_stid(&dp->dl_stid, clp, NFS4_DELEG_STID);
2a74aba7
BF
298 /*
299 * delegation seqid's are never incremented. The 4.1 special
6136d2b4
BF
300 * meaning of seqid 0 isn't meaningful, really, but let's avoid
301 * 0 anyway just for consistency and use 1:
2a74aba7
BF
302 */
303 dp->dl_stid.sc_stateid.si_generation = 1;
ef0f3390 304 num_delegations++;
ea1da636
N
305 INIT_LIST_HEAD(&dp->dl_perfile);
306 INIT_LIST_HEAD(&dp->dl_perclnt);
1da177e4 307 INIT_LIST_HEAD(&dp->dl_recall_lru);
13cd2184 308 get_nfs4_file(fp);
1da177e4 309 dp->dl_file = fp;
1da177e4 310 dp->dl_type = type;
6c02eaa1 311 fh_copy_shallow(&dp->dl_fh, &current_fh->fh_handle);
1da177e4
LT
312 dp->dl_time = 0;
313 atomic_set(&dp->dl_count, 1);
b5a1a81e 314 INIT_WORK(&dp->dl_recall.cb_work, nfsd4_do_callback_rpc);
1da177e4
LT
315 return dp;
316}
317
318void
319nfs4_put_delegation(struct nfs4_delegation *dp)
320{
321 if (atomic_dec_and_test(&dp->dl_count)) {
322 dprintk("NFSD: freeing dp %p\n",dp);
13cd2184 323 put_nfs4_file(dp->dl_file);
5b2d21c1 324 kmem_cache_free(deleg_slab, dp);
ef0f3390 325 num_delegations--;
1da177e4
LT
326 }
327}
328
acfdf5c3 329static void nfs4_put_deleg_lease(struct nfs4_file *fp)
1da177e4 330{
acfdf5c3
BF
331 if (atomic_dec_and_test(&fp->fi_delegees)) {
332 vfs_setlease(fp->fi_deleg_file, F_UNLCK, &fp->fi_lease);
333 fp->fi_lease = NULL;
4ee63624 334 fput(fp->fi_deleg_file);
acfdf5c3
BF
335 fp->fi_deleg_file = NULL;
336 }
1da177e4
LT
337}
338
6136d2b4
BF
339static void unhash_stid(struct nfs4_stid *s)
340{
38c2f4b1
BF
341 struct idr *stateids = &s->sc_client->cl_stateids;
342
343 idr_remove(stateids, s->sc_stateid.si_opaque.so_id);
6136d2b4
BF
344}
345
1da177e4
LT
346/* Called under the state lock. */
347static void
348unhash_delegation(struct nfs4_delegation *dp)
349{
6136d2b4 350 unhash_stid(&dp->dl_stid);
ea1da636 351 list_del_init(&dp->dl_perclnt);
1da177e4 352 spin_lock(&recall_lock);
5d926e8c 353 list_del_init(&dp->dl_perfile);
1da177e4
LT
354 list_del_init(&dp->dl_recall_lru);
355 spin_unlock(&recall_lock);
acfdf5c3 356 nfs4_put_deleg_lease(dp->dl_file);
1da177e4
LT
357 nfs4_put_delegation(dp);
358}
359
360/*
361 * SETCLIENTID state
362 */
363
36acb66b 364/* client_lock protects the client lru list and session hash table */
9089f1b4
BH
365static DEFINE_SPINLOCK(client_lock);
366
1da177e4
LT
367/* Hash tables for nfs4_clientid state */
368#define CLIENT_HASH_BITS 4
369#define CLIENT_HASH_SIZE (1 << CLIENT_HASH_BITS)
370#define CLIENT_HASH_MASK (CLIENT_HASH_SIZE - 1)
371
ddc04c41
BF
372static unsigned int clientid_hashval(u32 id)
373{
374 return id & CLIENT_HASH_MASK;
375}
376
377static unsigned int clientstr_hashval(const char *name)
378{
379 return opaque_hashval(name, 8) & CLIENT_HASH_MASK;
380}
381
1da177e4
LT
382/*
383 * reclaim_str_hashtbl[] holds known client info from previous reset/reboot
384 * used in reboot/reset lease grace period processing
385 *
386 * conf_id_hashtbl[], and conf_str_hashtbl[] hold confirmed
387 * setclientid_confirmed info.
388 *
389 * unconf_str_hashtbl[] and unconf_id_hashtbl[] hold unconfirmed
390 * setclientid info.
391 *
392 * client_lru holds client queue ordered by nfs4_client.cl_time
393 * for lease renewal.
394 *
395 * close_lru holds (open) stateowner queue ordered by nfs4_stateowner.so_time
396 * for last close replay.
397 */
398static struct list_head reclaim_str_hashtbl[CLIENT_HASH_SIZE];
399static int reclaim_str_hashtbl_size = 0;
400static struct list_head conf_id_hashtbl[CLIENT_HASH_SIZE];
401static struct list_head conf_str_hashtbl[CLIENT_HASH_SIZE];
402static struct list_head unconf_str_hashtbl[CLIENT_HASH_SIZE];
403static struct list_head unconf_id_hashtbl[CLIENT_HASH_SIZE];
404static struct list_head client_lru;
405static struct list_head close_lru;
406
f9d7562f
BF
407/*
408 * We store the NONE, READ, WRITE, and BOTH bits separately in the
409 * st_{access,deny}_bmap field of the stateid, in order to track not
410 * only what share bits are currently in force, but also what
411 * combinations of share bits previous opens have used. This allows us
412 * to enforce the recommendation of rfc 3530 14.2.19 that the server
413 * return an error if the client attempts to downgrade to a combination
414 * of share bits not explicable by closing some of its previous opens.
415 *
416 * XXX: This enforcement is actually incomplete, since we don't keep
417 * track of access/deny bit combinations; so, e.g., we allow:
418 *
419 * OPEN allow read, deny write
420 * OPEN allow both, deny none
421 * DOWNGRADE allow read, deny none
422 *
423 * which we should reject.
424 */
/*
 * Collapse an st_access_bmap into a share-access mask: for each of
 * bits 1..3 set in bmap, OR the bit's index into *access.
 */
static void
set_access(unsigned int *access, unsigned long bmap)
{
	unsigned int mask = 0;
	int bit;

	for (bit = 1; bit < 4; bit++)
		if (test_bit(bit, &bmap))
			mask |= bit;
	*access = mask;
}
435
/*
 * Collapse an st_deny_bmap into a share-deny mask: for each of bits
 * 0..3 set in bmap, OR the bit's index into *deny (index 0 contributes
 * nothing).
 */
static void
set_deny(unsigned int *deny, unsigned long bmap)
{
	unsigned int mask = 0;
	int bit;

	for (bit = 0; bit < 4; bit++)
		if (test_bit(bit, &bmap))
			mask |= bit;
	*deny = mask;
}
446
447static int
dcef0413 448test_share(struct nfs4_ol_stateid *stp, struct nfsd4_open *open) {
f9d7562f
BF
449 unsigned int access, deny;
450
451 set_access(&access, stp->st_access_bmap);
452 set_deny(&deny, stp->st_deny_bmap);
453 if ((access & open->op_share_deny) || (deny & open->op_share_access))
454 return 0;
455 return 1;
456}
457
458static int nfs4_access_to_omode(u32 access)
459{
8f34a430 460 switch (access & NFS4_SHARE_ACCESS_BOTH) {
f9d7562f
BF
461 case NFS4_SHARE_ACCESS_READ:
462 return O_RDONLY;
463 case NFS4_SHARE_ACCESS_WRITE:
464 return O_WRONLY;
465 case NFS4_SHARE_ACCESS_BOTH:
466 return O_RDWR;
467 }
468 BUG();
469}
470
dcef0413 471static void unhash_generic_stateid(struct nfs4_ol_stateid *stp)
529d7b2a 472{
529d7b2a
BF
473 list_del(&stp->st_perfile);
474 list_del(&stp->st_perstateowner);
475}
476
dcef0413 477static void close_generic_stateid(struct nfs4_ol_stateid *stp)
529d7b2a 478{
499f3edc 479 int i;
0997b173 480
23fcf2ec 481 if (stp->st_access_bmap) {
499f3edc
BF
482 for (i = 1; i < 4; i++) {
483 if (test_bit(i, &stp->st_access_bmap))
484 nfs4_file_put_access(stp->st_file,
485 nfs4_access_to_omode(i));
4665e2ba 486 __clear_bit(i, &stp->st_access_bmap);
499f3edc 487 }
23fcf2ec 488 }
a96e5b90 489 put_nfs4_file(stp->st_file);
4665e2ba
BF
490 stp->st_file = NULL;
491}
492
dcef0413 493static void free_generic_stateid(struct nfs4_ol_stateid *stp)
4665e2ba 494{
529d7b2a
BF
495 kmem_cache_free(stateid_slab, stp);
496}
497
dcef0413 498static void release_lock_stateid(struct nfs4_ol_stateid *stp)
529d7b2a
BF
499{
500 struct file *file;
501
502 unhash_generic_stateid(stp);
6136d2b4 503 unhash_stid(&stp->st_stid);
529d7b2a
BF
504 file = find_any_file(stp->st_file);
505 if (file)
fe0750e5 506 locks_remove_posix(file, (fl_owner_t)lockowner(stp->st_stateowner));
38c387b5 507 close_generic_stateid(stp);
529d7b2a
BF
508 free_generic_stateid(stp);
509}
510
fe0750e5 511static void unhash_lockowner(struct nfs4_lockowner *lo)
529d7b2a 512{
dcef0413 513 struct nfs4_ol_stateid *stp;
529d7b2a 514
fe0750e5
BF
515 list_del(&lo->lo_owner.so_strhash);
516 list_del(&lo->lo_perstateid);
517 while (!list_empty(&lo->lo_owner.so_stateids)) {
518 stp = list_first_entry(&lo->lo_owner.so_stateids,
dcef0413 519 struct nfs4_ol_stateid, st_perstateowner);
529d7b2a
BF
520 release_lock_stateid(stp);
521 }
522}
523
/* Unhash lo (releasing its stateids) and then free it. */
static void
release_lockowner(struct nfs4_lockowner *lo)
{
	unhash_lockowner(lo);
	nfs4_free_lockowner(lo);
}
529
530static void
dcef0413 531release_stateid_lockowners(struct nfs4_ol_stateid *open_stp)
529d7b2a 532{
fe0750e5 533 struct nfs4_lockowner *lo;
529d7b2a
BF
534
535 while (!list_empty(&open_stp->st_lockowners)) {
fe0750e5
BF
536 lo = list_entry(open_stp->st_lockowners.next,
537 struct nfs4_lockowner, lo_perstateid);
538 release_lockowner(lo);
529d7b2a
BF
539 }
540}
541
/*
 * Unlink an open stateid from its lists, release the lock owners that
 * depend on it, and drop its access and file references.  The stateid
 * itself is not freed here.
 */
static void
unhash_open_stateid(struct nfs4_ol_stateid *stp)
{
	unhash_generic_stateid(stp);
	release_stateid_lockowners(stp);
	close_generic_stateid(stp);
}
548
549static void release_open_stateid(struct nfs4_ol_stateid *stp)
550{
551 unhash_open_stateid(stp);
6136d2b4 552 unhash_stid(&stp->st_stid);
2283963f
BF
553 free_generic_stateid(stp);
554}
555
fe0750e5 556static void unhash_openowner(struct nfs4_openowner *oo)
f1d110ca 557{
dcef0413 558 struct nfs4_ol_stateid *stp;
f1d110ca 559
fe0750e5
BF
560 list_del(&oo->oo_owner.so_strhash);
561 list_del(&oo->oo_perclient);
562 while (!list_empty(&oo->oo_owner.so_stateids)) {
563 stp = list_first_entry(&oo->oo_owner.so_stateids,
dcef0413 564 struct nfs4_ol_stateid, st_perstateowner);
f044ff83 565 release_open_stateid(stp);
f1d110ca
BF
566 }
567}
568
f7a4d872
BF
569static void release_last_closed_stateid(struct nfs4_openowner *oo)
570{
571 struct nfs4_ol_stateid *s = oo->oo_last_closed_stid;
572
573 if (s) {
6136d2b4 574 unhash_stid(&s->st_stid);
f7a4d872
BF
575 free_generic_stateid(s);
576 oo->oo_last_closed_stid = NULL;
577 }
578}
579
fe0750e5 580static void release_openowner(struct nfs4_openowner *oo)
f1d110ca 581{
fe0750e5
BF
582 unhash_openowner(oo);
583 list_del(&oo->oo_close_lru);
f7a4d872 584 release_last_closed_stateid(oo);
fe0750e5 585 nfs4_free_openowner(oo);
f1d110ca
BF
586}
587
5282fd72
ME
588#define SESSION_HASH_SIZE 512
589static struct list_head sessionid_hashtbl[SESSION_HASH_SIZE];
590
591static inline int
592hash_sessionid(struct nfs4_sessionid *sessionid)
593{
594 struct nfsd4_sessionid *sid = (struct nfsd4_sessionid *)sessionid;
595
596 return sid->sequence % SESSION_HASH_SIZE;
597}
598
599static inline void
600dump_sessionid(const char *fn, struct nfs4_sessionid *sessionid)
601{
602 u32 *ptr = (u32 *)(&sessionid->data[0]);
603 dprintk("%s: %u:%u:%u:%u\n", fn, ptr[0], ptr[1], ptr[2], ptr[3]);
604}
605
ec6b5d7b
AA
606static void
607gen_sessionid(struct nfsd4_session *ses)
608{
609 struct nfs4_client *clp = ses->se_client;
610 struct nfsd4_sessionid *sid;
611
612 sid = (struct nfsd4_sessionid *)ses->se_sessionid.data;
613 sid->clientid = clp->cl_clientid;
614 sid->sequence = current_sessionid++;
615 sid->reserved = 0;
616}
617
618/*
a649637c
AA
619 * The protocol defines ca_maxresponsesize_cached to include the size of
620 * the rpc header, but all we need to cache is the data starting after
621 * the end of the initial SEQUENCE operation--the rest we regenerate
622 * each time. Therefore we can advertise a ca_maxresponsesize_cached
623 * value that is the number of bytes in our cache plus a few additional
624 * bytes. In order to stay on the safe side, and not promise more than
625 * we can cache, those additional bytes must be the minimum possible: 24
626 * bytes of rpc header (xid through accept state, with AUTH_NULL
627 * verifier), 12 for the compound header (with zero-length tag), and 44
628 * for the SEQUENCE op response:
629 */
630#define NFSD_MIN_HDR_SEQ_SZ (24 + 12 + 44)
631
557ce264
AA
632static void
633free_session_slots(struct nfsd4_session *ses)
634{
635 int i;
636
637 for (i = 0; i < ses->se_fchannel.maxreqs; i++)
638 kfree(ses->se_slots[i]);
639}
640
a649637c 641/*
efe0cb6d
BF
642 * We don't actually need to cache the rpc and session headers, so we
643 * can allocate a little less for each slot:
644 */
645static inline int slot_bytes(struct nfsd4_channel_attrs *ca)
646{
647 return ca->maxresp_cached - NFSD_MIN_HDR_SEQ_SZ;
648}
649
5b6feee9 650static int nfsd4_sanitize_slot_size(u32 size)
ec6b5d7b 651{
5b6feee9
BF
652 size -= NFSD_MIN_HDR_SEQ_SZ; /* We don't cache the rpc header */
653 size = min_t(u32, size, NFSD_SLOT_CACHE_SIZE);
ec6b5d7b 654
5b6feee9
BF
655 return size;
656}
ec6b5d7b 657
5b6feee9
BF
658/*
659 * XXX: If we run out of reserved DRC memory we could (up to a point)
a649637c
AA
660 * re-negotiate active sessions and reduce their slot usage to make
661 * room for new connections. For now we just fail the create session.
ec6b5d7b 662 */
5b6feee9 663static int nfsd4_get_drc_mem(int slotsize, u32 num)
ec6b5d7b 664{
5b6feee9 665 int avail;
ec6b5d7b 666
5b6feee9 667 num = min_t(u32, num, NFSD_MAX_SLOTS_PER_SESSION);
5d77ddfb 668
5b6feee9
BF
669 spin_lock(&nfsd_drc_lock);
670 avail = min_t(int, NFSD_MAX_MEM_PER_SESSION,
671 nfsd_drc_max_mem - nfsd_drc_mem_used);
672 num = min_t(int, num, avail / slotsize);
673 nfsd_drc_mem_used += num * slotsize;
674 spin_unlock(&nfsd_drc_lock);
ec6b5d7b 675
5b6feee9
BF
676 return num;
677}
ec6b5d7b 678
5b6feee9
BF
679static void nfsd4_put_drc_mem(int slotsize, int num)
680{
4bd9b0f4 681 spin_lock(&nfsd_drc_lock);
5b6feee9 682 nfsd_drc_mem_used -= slotsize * num;
4bd9b0f4 683 spin_unlock(&nfsd_drc_lock);
5b6feee9 684}
ec6b5d7b 685
5b6feee9
BF
686static struct nfsd4_session *alloc_session(int slotsize, int numslots)
687{
688 struct nfsd4_session *new;
689 int mem, i;
a649637c 690
5b6feee9
BF
691 BUILD_BUG_ON(NFSD_MAX_SLOTS_PER_SESSION * sizeof(struct nfsd4_slot *)
692 + sizeof(struct nfsd4_session) > PAGE_SIZE);
693 mem = numslots * sizeof(struct nfsd4_slot *);
ec6b5d7b 694
5b6feee9
BF
695 new = kzalloc(sizeof(*new) + mem, GFP_KERNEL);
696 if (!new)
697 return NULL;
557ce264 698 /* allocate each struct nfsd4_slot and data cache in one piece */
5b6feee9
BF
699 for (i = 0; i < numslots; i++) {
700 mem = sizeof(struct nfsd4_slot) + slotsize;
701 new->se_slots[i] = kzalloc(mem, GFP_KERNEL);
702 if (!new->se_slots[i])
557ce264 703 goto out_free;
557ce264 704 }
5b6feee9
BF
705 return new;
706out_free:
707 while (i--)
708 kfree(new->se_slots[i]);
709 kfree(new);
710 return NULL;
ec6b5d7b
AA
711}
712
5b6feee9 713static void init_forechannel_attrs(struct nfsd4_channel_attrs *new, struct nfsd4_channel_attrs *req, int numslots, int slotsize)
ec6b5d7b 714{
5b6feee9 715 u32 maxrpc = nfsd_serv->sv_max_mesg;
ec6b5d7b 716
5b6feee9 717 new->maxreqs = numslots;
d2b21743
MJ
718 new->maxresp_cached = min_t(u32, req->maxresp_cached,
719 slotsize + NFSD_MIN_HDR_SEQ_SZ);
5b6feee9
BF
720 new->maxreq_sz = min_t(u32, req->maxreq_sz, maxrpc);
721 new->maxresp_sz = min_t(u32, req->maxresp_sz, maxrpc);
722 new->maxops = min_t(u32, req->maxops, NFSD_MAX_OPS_PER_COMPOUND);
723}
ec6b5d7b 724
19cf5c02
BF
725static void free_conn(struct nfsd4_conn *c)
726{
727 svc_xprt_put(c->cn_xprt);
728 kfree(c);
729}
ec6b5d7b 730
19cf5c02
BF
731static void nfsd4_conn_lost(struct svc_xpt_user *u)
732{
733 struct nfsd4_conn *c = container_of(u, struct nfsd4_conn, cn_xpt_user);
734 struct nfs4_client *clp = c->cn_session->se_client;
ec6b5d7b 735
19cf5c02
BF
736 spin_lock(&clp->cl_lock);
737 if (!list_empty(&c->cn_persession)) {
738 list_del(&c->cn_persession);
739 free_conn(c);
740 }
741 spin_unlock(&clp->cl_lock);
eea49806 742 nfsd4_probe_callback(clp);
19cf5c02 743}
ec6b5d7b 744
d29c374c 745static struct nfsd4_conn *alloc_conn(struct svc_rqst *rqstp, u32 flags)
c7662518 746{
c7662518 747 struct nfsd4_conn *conn;
ec6b5d7b 748
c7662518
BF
749 conn = kmalloc(sizeof(struct nfsd4_conn), GFP_KERNEL);
750 if (!conn)
db90681d 751 return NULL;
c7662518
BF
752 svc_xprt_get(rqstp->rq_xprt);
753 conn->cn_xprt = rqstp->rq_xprt;
d29c374c 754 conn->cn_flags = flags;
db90681d
BF
755 INIT_LIST_HEAD(&conn->cn_xpt_user.list);
756 return conn;
757}
a649637c 758
328ead28
BF
759static void __nfsd4_hash_conn(struct nfsd4_conn *conn, struct nfsd4_session *ses)
760{
761 conn->cn_session = ses;
762 list_add(&conn->cn_persession, &ses->se_conns);
ec6b5d7b
AA
763}
764
db90681d 765static void nfsd4_hash_conn(struct nfsd4_conn *conn, struct nfsd4_session *ses)
557ce264 766{
db90681d 767 struct nfs4_client *clp = ses->se_client;
557ce264 768
c7662518 769 spin_lock(&clp->cl_lock);
328ead28 770 __nfsd4_hash_conn(conn, ses);
c7662518 771 spin_unlock(&clp->cl_lock);
557ce264
AA
772}
773
21b75b01 774static int nfsd4_register_conn(struct nfsd4_conn *conn)
efe0cb6d 775{
19cf5c02 776 conn->cn_xpt_user.callback = nfsd4_conn_lost;
21b75b01 777 return register_xpt_user(conn->cn_xprt, &conn->cn_xpt_user);
efe0cb6d
BF
778}
779
1d1bc8f2 780static __be32 nfsd4_new_conn(struct svc_rqst *rqstp, struct nfsd4_session *ses, u32 dir)
ec6b5d7b 781{
db90681d 782 struct nfsd4_conn *conn;
21b75b01 783 int ret;
ec6b5d7b 784
1d1bc8f2 785 conn = alloc_conn(rqstp, dir);
db90681d
BF
786 if (!conn)
787 return nfserr_jukebox;
788 nfsd4_hash_conn(conn, ses);
21b75b01
BF
789 ret = nfsd4_register_conn(conn);
790 if (ret)
791 /* oops; xprt is already down: */
792 nfsd4_conn_lost(&conn->cn_xpt_user);
c7662518
BF
793 return nfs_ok;
794}
ec6b5d7b 795
1d1bc8f2
BF
796static __be32 nfsd4_new_conn_from_crses(struct svc_rqst *rqstp, struct nfsd4_session *ses)
797{
798 u32 dir = NFS4_CDFC4_FORE;
799
800 if (ses->se_flags & SESSION4_BACK_CHAN)
801 dir |= NFS4_CDFC4_BACK;
802
803 return nfsd4_new_conn(rqstp, ses, dir);
804}
805
806/* must be called under client_lock */
19cf5c02 807static void nfsd4_del_conns(struct nfsd4_session *s)
c7662518 808{
19cf5c02
BF
809 struct nfs4_client *clp = s->se_client;
810 struct nfsd4_conn *c;
ec6b5d7b 811
19cf5c02
BF
812 spin_lock(&clp->cl_lock);
813 while (!list_empty(&s->se_conns)) {
814 c = list_first_entry(&s->se_conns, struct nfsd4_conn, cn_persession);
815 list_del_init(&c->cn_persession);
816 spin_unlock(&clp->cl_lock);
557ce264 817
19cf5c02
BF
818 unregister_xpt_user(c->cn_xprt, &c->cn_xpt_user);
819 free_conn(c);
ec6b5d7b 820
19cf5c02
BF
821 spin_lock(&clp->cl_lock);
822 }
823 spin_unlock(&clp->cl_lock);
c7662518 824}
ec6b5d7b 825
c7662518
BF
826void free_session(struct kref *kref)
827{
828 struct nfsd4_session *ses;
829 int mem;
830
831 ses = container_of(kref, struct nfsd4_session, se_ref);
19cf5c02 832 nfsd4_del_conns(ses);
c7662518
BF
833 spin_lock(&nfsd_drc_lock);
834 mem = ses->se_fchannel.maxreqs * slot_bytes(&ses->se_fchannel);
835 nfsd_drc_mem_used -= mem;
836 spin_unlock(&nfsd_drc_lock);
837 free_session_slots(ses);
838 kfree(ses);
839}
840
ac7c46f2 841static struct nfsd4_session *alloc_init_session(struct svc_rqst *rqstp, struct nfs4_client *clp, struct nfsd4_create_session *cses)
5b6feee9
BF
842{
843 struct nfsd4_session *new;
844 struct nfsd4_channel_attrs *fchan = &cses->fore_channel;
845 int numslots, slotsize;
c7662518 846 int status;
5b6feee9
BF
847 int idx;
848
849 /*
850 * Note decreasing slot size below client's request may
851 * make it difficult for client to function correctly, whereas
852 * decreasing the number of slots will (just?) affect
853 * performance. When short on memory we therefore prefer to
854 * decrease number of slots instead of their size.
855 */
856 slotsize = nfsd4_sanitize_slot_size(fchan->maxresp_cached);
857 numslots = nfsd4_get_drc_mem(slotsize, fchan->maxreqs);
ced6dfe9
MJ
858 if (numslots < 1)
859 return NULL;
5b6feee9
BF
860
861 new = alloc_session(slotsize, numslots);
862 if (!new) {
863 nfsd4_put_drc_mem(slotsize, fchan->maxreqs);
ac7c46f2 864 return NULL;
557ce264 865 }
5b6feee9 866 init_forechannel_attrs(&new->se_fchannel, fchan, numslots, slotsize);
557ce264 867
ec6b5d7b
AA
868 new->se_client = clp;
869 gen_sessionid(new);
ec6b5d7b 870
c7662518
BF
871 INIT_LIST_HEAD(&new->se_conns);
872
ac7c46f2 873 new->se_cb_seq_nr = 1;
ec6b5d7b 874 new->se_flags = cses->flags;
8b5ce5cd 875 new->se_cb_prog = cses->callback_prog;
ec6b5d7b 876 kref_init(&new->se_ref);
5b6feee9 877 idx = hash_sessionid(&new->se_sessionid);
9089f1b4 878 spin_lock(&client_lock);
ec6b5d7b 879 list_add(&new->se_hash, &sessionid_hashtbl[idx]);
4c649378 880 spin_lock(&clp->cl_lock);
ec6b5d7b 881 list_add(&new->se_perclnt, &clp->cl_sessions);
4c649378 882 spin_unlock(&clp->cl_lock);
9089f1b4 883 spin_unlock(&client_lock);
ec6b5d7b 884
1d1bc8f2 885 status = nfsd4_new_conn_from_crses(rqstp, new);
ac7c46f2 886 /* whoops: benny points out, status is ignored! (err, or bogus) */
c7662518
BF
887 if (status) {
888 free_session(&new->se_ref);
ac7c46f2 889 return NULL;
c7662518 890 }
dcbeaa68 891 if (cses->flags & SESSION4_BACK_CHAN) {
edd76786 892 struct sockaddr *sa = svc_addr(rqstp);
dcbeaa68
BF
893 /*
894 * This is a little silly; with sessions there's no real
895 * use for the callback address. Use the peer address
896 * as a reasonable default for now, but consider fixing
897 * the rpc client not to require an address in the
898 * future:
899 */
edd76786
BF
900 rpc_copy_addr((struct sockaddr *)&clp->cl_cb_conn.cb_addr, sa);
901 clp->cl_cb_conn.cb_addrlen = svc_addr_len(sa);
edd76786 902 }
dcbeaa68 903 nfsd4_probe_callback(clp);
ac7c46f2 904 return new;
ec6b5d7b
AA
905}
906
9089f1b4 907/* caller must hold client_lock */
5282fd72
ME
908static struct nfsd4_session *
909find_in_sessionid_hashtbl(struct nfs4_sessionid *sessionid)
910{
911 struct nfsd4_session *elem;
912 int idx;
913
914 dump_sessionid(__func__, sessionid);
915 idx = hash_sessionid(sessionid);
5282fd72
ME
916 /* Search in the appropriate list */
917 list_for_each_entry(elem, &sessionid_hashtbl[idx], se_hash) {
5282fd72
ME
918 if (!memcmp(elem->se_sessionid.data, sessionid->data,
919 NFS4_MAX_SESSIONID_LEN)) {
920 return elem;
921 }
922 }
923
924 dprintk("%s: session not found\n", __func__);
925 return NULL;
926}
927
9089f1b4 928/* caller must hold client_lock */
7116ed6b 929static void
5282fd72 930unhash_session(struct nfsd4_session *ses)
7116ed6b
AA
931{
932 list_del(&ses->se_hash);
4c649378 933 spin_lock(&ses->se_client->cl_lock);
7116ed6b 934 list_del(&ses->se_perclnt);
4c649378 935 spin_unlock(&ses->se_client->cl_lock);
5282fd72
ME
936}
937
36acb66b 938/* must be called under the client_lock */
1da177e4 939static inline void
36acb66b 940renew_client_locked(struct nfs4_client *clp)
1da177e4 941{
07cd4909
BH
942 if (is_client_expired(clp)) {
943 dprintk("%s: client (clientid %08x/%08x) already expired\n",
944 __func__,
945 clp->cl_clientid.cl_boot,
946 clp->cl_clientid.cl_id);
947 return;
948 }
949
1da177e4
LT
950 dprintk("renewing client (clientid %08x/%08x)\n",
951 clp->cl_clientid.cl_boot,
952 clp->cl_clientid.cl_id);
953 list_move_tail(&clp->cl_lru, &client_lru);
954 clp->cl_time = get_seconds();
955}
956
36acb66b
BH
957static inline void
958renew_client(struct nfs4_client *clp)
959{
960 spin_lock(&client_lock);
961 renew_client_locked(clp);
962 spin_unlock(&client_lock);
963}
964
1da177e4
LT
965/* SETCLIENTID and SETCLIENTID_CONFIRM Helper functions */
966static int
967STALE_CLIENTID(clientid_t *clid)
968{
969 if (clid->cl_boot == boot_time)
970 return 0;
60adfc50
AA
971 dprintk("NFSD stale clientid (%08x/%08x) boot_time %08lx\n",
972 clid->cl_boot, clid->cl_id, boot_time);
1da177e4
LT
973 return 1;
974}
975
976/*
977 * XXX Should we use a slab cache ?
978 * This type of memory management is somewhat inefficient, but we use it
979 * anyway since SETCLIENTID is not a common operation.
980 */
35bba9a3 981static struct nfs4_client *alloc_client(struct xdr_netobj name)
1da177e4
LT
982{
983 struct nfs4_client *clp;
984
35bba9a3
BF
985 clp = kzalloc(sizeof(struct nfs4_client), GFP_KERNEL);
986 if (clp == NULL)
987 return NULL;
988 clp->cl_name.data = kmalloc(name.len, GFP_KERNEL);
989 if (clp->cl_name.data == NULL) {
990 kfree(clp);
991 return NULL;
1da177e4 992 }
35bba9a3
BF
993 memcpy(clp->cl_name.data, name.data, name.len);
994 clp->cl_name.len = name.len;
1da177e4
LT
995 return clp;
996}
997
998static inline void
999free_client(struct nfs4_client *clp)
1000{
792c95dd
BF
1001 while (!list_empty(&clp->cl_sessions)) {
1002 struct nfsd4_session *ses;
1003 ses = list_entry(clp->cl_sessions.next, struct nfsd4_session,
1004 se_perclnt);
1005 list_del(&ses->se_perclnt);
1006 nfsd4_put_session(ses);
1007 }
1da177e4
LT
1008 if (clp->cl_cred.cr_group_info)
1009 put_group_info(clp->cl_cred.cr_group_info);
68e76ad0 1010 kfree(clp->cl_principal);
1da177e4
LT
1011 kfree(clp->cl_name.data);
1012 kfree(clp);
1013}
1014
d7682988
BH
1015void
1016release_session_client(struct nfsd4_session *session)
1017{
1018 struct nfs4_client *clp = session->se_client;
1019
1020 if (!atomic_dec_and_lock(&clp->cl_refcount, &client_lock))
1021 return;
1022 if (is_client_expired(clp)) {
1023 free_client(clp);
1024 session->se_client = NULL;
1025 } else
1026 renew_client_locked(clp);
1027 spin_unlock(&client_lock);
d7682988
BH
1028}
1029
84d38ac9
BH
1030/* must be called under the client_lock */
1031static inline void
1032unhash_client_locked(struct nfs4_client *clp)
1033{
792c95dd
BF
1034 struct nfsd4_session *ses;
1035
07cd4909 1036 mark_client_expired(clp);
84d38ac9 1037 list_del(&clp->cl_lru);
4c649378 1038 spin_lock(&clp->cl_lock);
792c95dd
BF
1039 list_for_each_entry(ses, &clp->cl_sessions, se_perclnt)
1040 list_del_init(&ses->se_hash);
4c649378 1041 spin_unlock(&clp->cl_lock);
84d38ac9
BH
1042}
1043
1da177e4
LT
1044static void
1045expire_client(struct nfs4_client *clp)
1046{
fe0750e5 1047 struct nfs4_openowner *oo;
1da177e4 1048 struct nfs4_delegation *dp;
1da177e4
LT
1049 struct list_head reaplist;
1050
1da177e4
LT
1051 INIT_LIST_HEAD(&reaplist);
1052 spin_lock(&recall_lock);
ea1da636
N
1053 while (!list_empty(&clp->cl_delegations)) {
1054 dp = list_entry(clp->cl_delegations.next, struct nfs4_delegation, dl_perclnt);
ea1da636 1055 list_del_init(&dp->dl_perclnt);
1da177e4
LT
1056 list_move(&dp->dl_recall_lru, &reaplist);
1057 }
1058 spin_unlock(&recall_lock);
1059 while (!list_empty(&reaplist)) {
1060 dp = list_entry(reaplist.next, struct nfs4_delegation, dl_recall_lru);
1061 list_del_init(&dp->dl_recall_lru);
1062 unhash_delegation(dp);
1063 }
ea1da636 1064 while (!list_empty(&clp->cl_openowners)) {
fe0750e5
BF
1065 oo = list_entry(clp->cl_openowners.next, struct nfs4_openowner, oo_perclient);
1066 release_openowner(oo);
1da177e4 1067 }
6ff8da08 1068 nfsd4_shutdown_callback(clp);
84d38ac9
BH
1069 if (clp->cl_cb_conn.cb_xprt)
1070 svc_xprt_put(clp->cl_cb_conn.cb_xprt);
36acb66b
BH
1071 list_del(&clp->cl_idhash);
1072 list_del(&clp->cl_strhash);
be1fdf6c 1073 spin_lock(&client_lock);
84d38ac9 1074 unhash_client_locked(clp);
46583e25
BH
1075 if (atomic_read(&clp->cl_refcount) == 0)
1076 free_client(clp);
be1fdf6c 1077 spin_unlock(&client_lock);
1da177e4
LT
1078}
1079
35bba9a3
BF
1080static void copy_verf(struct nfs4_client *target, nfs4_verifier *source)
1081{
1082 memcpy(target->cl_verifier.data, source->data,
1083 sizeof(target->cl_verifier.data));
1da177e4
LT
1084}
1085
35bba9a3
BF
1086static void copy_clid(struct nfs4_client *target, struct nfs4_client *source)
1087{
1da177e4
LT
1088 target->cl_clientid.cl_boot = source->cl_clientid.cl_boot;
1089 target->cl_clientid.cl_id = source->cl_clientid.cl_id;
1090}
1091
35bba9a3
BF
1092static void copy_cred(struct svc_cred *target, struct svc_cred *source)
1093{
1da177e4
LT
1094 target->cr_uid = source->cr_uid;
1095 target->cr_gid = source->cr_gid;
1096 target->cr_group_info = source->cr_group_info;
1097 get_group_info(target->cr_group_info);
1098}
1099
35bba9a3 1100static int same_name(const char *n1, const char *n2)
599e0a22 1101{
a55370a3 1102 return 0 == memcmp(n1, n2, HEXDIR_LEN);
1da177e4
LT
1103}
1104
1105static int
599e0a22
BF
1106same_verf(nfs4_verifier *v1, nfs4_verifier *v2)
1107{
1108 return 0 == memcmp(v1->data, v2->data, sizeof(v1->data));
1da177e4
LT
1109}
1110
1111static int
599e0a22
BF
1112same_clid(clientid_t *cl1, clientid_t *cl2)
1113{
1114 return (cl1->cl_boot == cl2->cl_boot) && (cl1->cl_id == cl2->cl_id);
1da177e4
LT
1115}
1116
1117/* XXX what about NGROUP */
1118static int
599e0a22
BF
1119same_creds(struct svc_cred *cr1, struct svc_cred *cr2)
1120{
1121 return cr1->cr_uid == cr2->cr_uid;
1da177e4
LT
1122}
1123
5ec7b46c
BF
1124static void gen_clid(struct nfs4_client *clp)
1125{
1126 static u32 current_clientid = 1;
1127
1da177e4
LT
1128 clp->cl_clientid.cl_boot = boot_time;
1129 clp->cl_clientid.cl_id = current_clientid++;
1130}
1131
deda2faa
BF
1132static void gen_confirm(struct nfs4_client *clp)
1133{
1134 static u32 i;
1135 u32 *p;
1da177e4 1136
1da177e4 1137 p = (u32 *)clp->cl_confirm.data;
deda2faa
BF
1138 *p++ = get_seconds();
1139 *p++ = i++;
1da177e4
LT
1140}
1141
38c2f4b1 1142static struct nfs4_stid *find_stateid(struct nfs4_client *cl, stateid_t *t)
4581d140 1143{
38c2f4b1 1144 return idr_find(&cl->cl_stateids, t->si_opaque.so_id);
4d71ab87
BF
1145}
1146
38c2f4b1 1147static struct nfs4_stid *find_stateid_by_type(struct nfs4_client *cl, stateid_t *t, char typemask)
f459e453
BF
1148{
1149 struct nfs4_stid *s;
4d71ab87 1150
38c2f4b1 1151 s = find_stateid(cl, t);
4d71ab87
BF
1152 if (!s)
1153 return NULL;
f459e453 1154 if (typemask & s->sc_type)
4581d140 1155 return s;
4581d140
BF
1156 return NULL;
1157}
1158
b09333c4
RL
1159static struct nfs4_client *create_client(struct xdr_netobj name, char *recdir,
1160 struct svc_rqst *rqstp, nfs4_verifier *verf)
1161{
1162 struct nfs4_client *clp;
1163 struct sockaddr *sa = svc_addr(rqstp);
1164 char *princ;
1165
1166 clp = alloc_client(name);
1167 if (clp == NULL)
1168 return NULL;
1169
792c95dd
BF
1170 INIT_LIST_HEAD(&clp->cl_sessions);
1171
b09333c4
RL
1172 princ = svc_gss_principal(rqstp);
1173 if (princ) {
1174 clp->cl_principal = kstrdup(princ, GFP_KERNEL);
1175 if (clp->cl_principal == NULL) {
1176 free_client(clp);
1177 return NULL;
1178 }
1179 }
1180
38c2f4b1 1181 idr_init(&clp->cl_stateids);
b09333c4 1182 memcpy(clp->cl_recdir, recdir, HEXDIR_LEN);
46583e25 1183 atomic_set(&clp->cl_refcount, 0);
77a3569d 1184 clp->cl_cb_state = NFSD4_CB_UNKNOWN;
b09333c4
RL
1185 INIT_LIST_HEAD(&clp->cl_idhash);
1186 INIT_LIST_HEAD(&clp->cl_strhash);
1187 INIT_LIST_HEAD(&clp->cl_openowners);
1188 INIT_LIST_HEAD(&clp->cl_delegations);
b09333c4 1189 INIT_LIST_HEAD(&clp->cl_lru);
5ce8ba25 1190 INIT_LIST_HEAD(&clp->cl_callbacks);
6ff8da08 1191 spin_lock_init(&clp->cl_lock);
cee277d9 1192 INIT_WORK(&clp->cl_cb_null.cb_work, nfsd4_do_callback_rpc);
07cd4909 1193 clp->cl_time = get_seconds();
b09333c4
RL
1194 clear_bit(0, &clp->cl_cb_slot_busy);
1195 rpc_init_wait_queue(&clp->cl_cb_waitq, "Backchannel slot table");
1196 copy_verf(clp, verf);
1197 rpc_copy_addr((struct sockaddr *) &clp->cl_addr, sa);
1198 clp->cl_flavor = rqstp->rq_flavor;
1199 copy_cred(&clp->cl_cred, &rqstp->rq_cred);
1200 gen_confirm(clp);
edd76786 1201 clp->cl_cb_session = NULL;
b09333c4
RL
1202 return clp;
1203}
1204
fd39ca9a 1205static void
1da177e4
LT
1206add_to_unconfirmed(struct nfs4_client *clp, unsigned int strhashval)
1207{
1208 unsigned int idhashval;
1209
1210 list_add(&clp->cl_strhash, &unconf_str_hashtbl[strhashval]);
1211 idhashval = clientid_hashval(clp->cl_clientid.cl_id);
1212 list_add(&clp->cl_idhash, &unconf_id_hashtbl[idhashval]);
36acb66b 1213 renew_client(clp);
1da177e4
LT
1214}
1215
fd39ca9a 1216static void
1da177e4
LT
1217move_to_confirmed(struct nfs4_client *clp)
1218{
1219 unsigned int idhashval = clientid_hashval(clp->cl_clientid.cl_id);
1220 unsigned int strhashval;
1221
1222 dprintk("NFSD: move_to_confirm nfs4_client %p\n", clp);
f116629d 1223 list_move(&clp->cl_idhash, &conf_id_hashtbl[idhashval]);
a55370a3 1224 strhashval = clientstr_hashval(clp->cl_recdir);
328efbab 1225 list_move(&clp->cl_strhash, &conf_str_hashtbl[strhashval]);
1da177e4
LT
1226 renew_client(clp);
1227}
1228
1229static struct nfs4_client *
1230find_confirmed_client(clientid_t *clid)
1231{
1232 struct nfs4_client *clp;
1233 unsigned int idhashval = clientid_hashval(clid->cl_id);
1234
1235 list_for_each_entry(clp, &conf_id_hashtbl[idhashval], cl_idhash) {
a50d2ad1
BF
1236 if (same_clid(&clp->cl_clientid, clid)) {
1237 renew_client(clp);
1da177e4 1238 return clp;
a50d2ad1 1239 }
1da177e4
LT
1240 }
1241 return NULL;
1242}
1243
1244static struct nfs4_client *
1245find_unconfirmed_client(clientid_t *clid)
1246{
1247 struct nfs4_client *clp;
1248 unsigned int idhashval = clientid_hashval(clid->cl_id);
1249
1250 list_for_each_entry(clp, &unconf_id_hashtbl[idhashval], cl_idhash) {
599e0a22 1251 if (same_clid(&clp->cl_clientid, clid))
1da177e4
LT
1252 return clp;
1253 }
1254 return NULL;
1255}
1256
6e5f15c9 1257static bool clp_used_exchangeid(struct nfs4_client *clp)
a1bcecd2 1258{
6e5f15c9 1259 return clp->cl_exchange_flags != 0;
e203d506 1260}
a1bcecd2 1261
28ce6054 1262static struct nfs4_client *
e203d506 1263find_confirmed_client_by_str(const char *dname, unsigned int hashval)
28ce6054
N
1264{
1265 struct nfs4_client *clp;
1266
1267 list_for_each_entry(clp, &conf_str_hashtbl[hashval], cl_strhash) {
e203d506 1268 if (same_name(clp->cl_recdir, dname))
28ce6054
N
1269 return clp;
1270 }
1271 return NULL;
1272}
1273
1274static struct nfs4_client *
e203d506 1275find_unconfirmed_client_by_str(const char *dname, unsigned int hashval)
28ce6054
N
1276{
1277 struct nfs4_client *clp;
1278
1279 list_for_each_entry(clp, &unconf_str_hashtbl[hashval], cl_strhash) {
e203d506 1280 if (same_name(clp->cl_recdir, dname))
28ce6054
N
1281 return clp;
1282 }
1283 return NULL;
1284}
1285
fd39ca9a 1286static void
6f3d772f 1287gen_callback(struct nfs4_client *clp, struct nfsd4_setclientid *se, struct svc_rqst *rqstp)
1da177e4 1288{
07263f1e 1289 struct nfs4_cb_conn *conn = &clp->cl_cb_conn;
6f3d772f
TU
1290 struct sockaddr *sa = svc_addr(rqstp);
1291 u32 scopeid = rpc_get_scope_id(sa);
7077ecba
JL
1292 unsigned short expected_family;
1293
1294 /* Currently, we only support tcp and tcp6 for the callback channel */
1295 if (se->se_callback_netid_len == 3 &&
1296 !memcmp(se->se_callback_netid_val, "tcp", 3))
1297 expected_family = AF_INET;
1298 else if (se->se_callback_netid_len == 4 &&
1299 !memcmp(se->se_callback_netid_val, "tcp6", 4))
1300 expected_family = AF_INET6;
1301 else
1da177e4
LT
1302 goto out_err;
1303
07263f1e 1304 conn->cb_addrlen = rpc_uaddr2sockaddr(se->se_callback_addr_val,
aa9a4ec7 1305 se->se_callback_addr_len,
07263f1e
BF
1306 (struct sockaddr *)&conn->cb_addr,
1307 sizeof(conn->cb_addr));
aa9a4ec7 1308
07263f1e 1309 if (!conn->cb_addrlen || conn->cb_addr.ss_family != expected_family)
1da177e4 1310 goto out_err;
aa9a4ec7 1311
07263f1e
BF
1312 if (conn->cb_addr.ss_family == AF_INET6)
1313 ((struct sockaddr_in6 *)&conn->cb_addr)->sin6_scope_id = scopeid;
fbf4665f 1314
07263f1e
BF
1315 conn->cb_prog = se->se_callback_prog;
1316 conn->cb_ident = se->se_callback_ident;
849a1cf1 1317 memcpy(&conn->cb_saddr, &rqstp->rq_daddr, rqstp->rq_daddrlen);
1da177e4
LT
1318 return;
1319out_err:
07263f1e
BF
1320 conn->cb_addr.ss_family = AF_UNSPEC;
1321 conn->cb_addrlen = 0;
849823c5 1322 dprintk(KERN_INFO "NFSD: this client (clientid %08x/%08x) "
1da177e4
LT
1323 "will not receive delegations\n",
1324 clp->cl_clientid.cl_boot, clp->cl_clientid.cl_id);
1325
1da177e4
LT
1326 return;
1327}
1328
074fe897 1329/*
557ce264 1330 * Cache a reply. nfsd4_check_drc_limit() has bounded the cache size.
074fe897 1331 */
074fe897
AA
1332void
1333nfsd4_store_cache_entry(struct nfsd4_compoundres *resp)
074fe897 1334{
557ce264
AA
1335 struct nfsd4_slot *slot = resp->cstate.slot;
1336 unsigned int base;
074fe897 1337
557ce264 1338 dprintk("--> %s slot %p\n", __func__, slot);
074fe897 1339
557ce264
AA
1340 slot->sl_opcnt = resp->opcnt;
1341 slot->sl_status = resp->cstate.status;
074fe897 1342
bf864a31 1343 if (nfsd4_not_cached(resp)) {
557ce264 1344 slot->sl_datalen = 0;
bf864a31 1345 return;
074fe897 1346 }
557ce264
AA
1347 slot->sl_datalen = (char *)resp->p - (char *)resp->cstate.datap;
1348 base = (char *)resp->cstate.datap -
1349 (char *)resp->xbuf->head[0].iov_base;
1350 if (read_bytes_from_xdr_buf(resp->xbuf, base, slot->sl_data,
1351 slot->sl_datalen))
1352 WARN("%s: sessions DRC could not cache compound\n", __func__);
1353 return;
074fe897
AA
1354}
1355
1356/*
abfabf8c
AA
1357 * Encode the replay sequence operation from the slot values.
1358 * If cachethis is FALSE encode the uncached rep error on the next
1359 * operation which sets resp->p and increments resp->opcnt for
1360 * nfs4svc_encode_compoundres.
074fe897 1361 *
074fe897 1362 */
abfabf8c
AA
1363static __be32
1364nfsd4_enc_sequence_replay(struct nfsd4_compoundargs *args,
1365 struct nfsd4_compoundres *resp)
074fe897 1366{
abfabf8c
AA
1367 struct nfsd4_op *op;
1368 struct nfsd4_slot *slot = resp->cstate.slot;
bf864a31 1369
abfabf8c 1370 dprintk("--> %s resp->opcnt %d cachethis %u \n", __func__,
557ce264 1371 resp->opcnt, resp->cstate.slot->sl_cachethis);
bf864a31 1372
abfabf8c
AA
1373 /* Encode the replayed sequence operation */
1374 op = &args->ops[resp->opcnt - 1];
1375 nfsd4_encode_operation(resp, op);
bf864a31 1376
abfabf8c 1377 /* Return nfserr_retry_uncached_rep in next operation. */
557ce264 1378 if (args->opcnt > 1 && slot->sl_cachethis == 0) {
abfabf8c
AA
1379 op = &args->ops[resp->opcnt++];
1380 op->status = nfserr_retry_uncached_rep;
1381 nfsd4_encode_operation(resp, op);
074fe897 1382 }
abfabf8c 1383 return op->status;
074fe897
AA
1384}
1385
1386/*
557ce264
AA
1387 * The sequence operation is not cached because we can use the slot and
1388 * session values.
074fe897
AA
1389 */
1390__be32
bf864a31
AA
1391nfsd4_replay_cache_entry(struct nfsd4_compoundres *resp,
1392 struct nfsd4_sequence *seq)
074fe897 1393{
557ce264 1394 struct nfsd4_slot *slot = resp->cstate.slot;
074fe897
AA
1395 __be32 status;
1396
557ce264 1397 dprintk("--> %s slot %p\n", __func__, slot);
074fe897 1398
abfabf8c
AA
1399 /* Either returns 0 or nfserr_retry_uncached */
1400 status = nfsd4_enc_sequence_replay(resp->rqstp->rq_argp, resp);
1401 if (status == nfserr_retry_uncached_rep)
1402 return status;
074fe897 1403
557ce264
AA
1404 /* The sequence operation has been encoded, cstate->datap set. */
1405 memcpy(resp->cstate.datap, slot->sl_data, slot->sl_datalen);
074fe897 1406
557ce264
AA
1407 resp->opcnt = slot->sl_opcnt;
1408 resp->p = resp->cstate.datap + XDR_QUADLEN(slot->sl_datalen);
1409 status = slot->sl_status;
074fe897
AA
1410
1411 return status;
1412}
1413
0733d213
AA
1414/*
1415 * Set the exchange_id flags returned by the server.
1416 */
1417static void
1418nfsd4_set_ex_flags(struct nfs4_client *new, struct nfsd4_exchange_id *clid)
1419{
1420 /* pNFS is not supported */
1421 new->cl_exchange_flags |= EXCHGID4_FLAG_USE_NON_PNFS;
1422
1423 /* Referrals are supported, Migration is not. */
1424 new->cl_exchange_flags |= EXCHGID4_FLAG_SUPP_MOVED_REFER;
1425
1426 /* set the wire flags to return to client. */
1427 clid->flags = new->cl_exchange_flags;
1428}
1429
069b6ad4
AA
1430__be32
1431nfsd4_exchange_id(struct svc_rqst *rqstp,
1432 struct nfsd4_compound_state *cstate,
1433 struct nfsd4_exchange_id *exid)
1434{
0733d213
AA
1435 struct nfs4_client *unconf, *conf, *new;
1436 int status;
1437 unsigned int strhashval;
1438 char dname[HEXDIR_LEN];
363168b4 1439 char addr_str[INET6_ADDRSTRLEN];
0733d213 1440 nfs4_verifier verf = exid->verifier;
363168b4 1441 struct sockaddr *sa = svc_addr(rqstp);
0733d213 1442
363168b4 1443 rpc_ntop(sa, addr_str, sizeof(addr_str));
0733d213 1444 dprintk("%s rqstp=%p exid=%p clname.len=%u clname.data=%p "
363168b4 1445 "ip_addr=%s flags %x, spa_how %d\n",
0733d213 1446 __func__, rqstp, exid, exid->clname.len, exid->clname.data,
363168b4 1447 addr_str, exid->flags, exid->spa_how);
0733d213 1448
a084daf5 1449 if (exid->flags & ~EXCHGID4_FLAG_MASK_A)
0733d213
AA
1450 return nfserr_inval;
1451
1452 /* Currently only support SP4_NONE */
1453 switch (exid->spa_how) {
1454 case SP4_NONE:
1455 break;
1456 case SP4_SSV:
044bc1d4 1457 return nfserr_serverfault;
0733d213
AA
1458 default:
1459 BUG(); /* checked by xdr code */
1460 case SP4_MACH_CRED:
1461 return nfserr_serverfault; /* no excuse :-/ */
1462 }
1463
1464 status = nfs4_make_rec_clidname(dname, &exid->clname);
1465
1466 if (status)
1467 goto error;
1468
1469 strhashval = clientstr_hashval(dname);
1470
1471 nfs4_lock_state();
1472 status = nfs_ok;
1473
e203d506 1474 conf = find_confirmed_client_by_str(dname, strhashval);
0733d213 1475 if (conf) {
e203d506
BF
1476 if (!clp_used_exchangeid(conf)) {
1477 status = nfserr_clid_inuse; /* XXX: ? */
1478 goto out;
1479 }
0733d213
AA
1480 if (!same_verf(&verf, &conf->cl_verifier)) {
1481 /* 18.35.4 case 8 */
1482 if (exid->flags & EXCHGID4_FLAG_UPD_CONFIRMED_REC_A) {
1483 status = nfserr_not_same;
1484 goto out;
1485 }
1486 /* Client reboot: destroy old state */
1487 expire_client(conf);
1488 goto out_new;
1489 }
1490 if (!same_creds(&conf->cl_cred, &rqstp->rq_cred)) {
1491 /* 18.35.4 case 9 */
1492 if (exid->flags & EXCHGID4_FLAG_UPD_CONFIRMED_REC_A) {
1493 status = nfserr_perm;
1494 goto out;
1495 }
1496 expire_client(conf);
1497 goto out_new;
1498 }
0733d213
AA
1499 /*
1500 * Set bit when the owner id and verifier map to an already
1501 * confirmed client id (18.35.3).
1502 */
1503 exid->flags |= EXCHGID4_FLAG_CONFIRMED_R;
1504
1505 /*
1506 * Falling into 18.35.4 case 2, possible router replay.
1507 * Leave confirmed record intact and return same result.
1508 */
1509 copy_verf(conf, &verf);
1510 new = conf;
1511 goto out_copy;
6ddbbbfe
MS
1512 }
1513
1514 /* 18.35.4 case 7 */
1515 if (exid->flags & EXCHGID4_FLAG_UPD_CONFIRMED_REC_A) {
1516 status = nfserr_noent;
1517 goto out;
0733d213
AA
1518 }
1519
e203d506 1520 unconf = find_unconfirmed_client_by_str(dname, strhashval);
0733d213
AA
1521 if (unconf) {
1522 /*
1523 * Possible retry or client restart. Per 18.35.4 case 4,
1524 * a new unconfirmed record should be generated regardless
1525 * of whether any properties have changed.
1526 */
1527 expire_client(unconf);
1528 }
1529
1530out_new:
1531 /* Normal case */
b09333c4 1532 new = create_client(exid->clname, dname, rqstp, &verf);
0733d213 1533 if (new == NULL) {
4731030d 1534 status = nfserr_jukebox;
0733d213
AA
1535 goto out;
1536 }
1537
0733d213 1538 gen_clid(new);
0733d213
AA
1539 add_to_unconfirmed(new, strhashval);
1540out_copy:
1541 exid->clientid.cl_boot = new->cl_clientid.cl_boot;
1542 exid->clientid.cl_id = new->cl_clientid.cl_id;
1543
38eb76a5 1544 exid->seqid = 1;
0733d213
AA
1545 nfsd4_set_ex_flags(new, exid);
1546
1547 dprintk("nfsd4_exchange_id seqid %d flags %x\n",
49557cc7 1548 new->cl_cs_slot.sl_seqid, new->cl_exchange_flags);
0733d213
AA
1549 status = nfs_ok;
1550
1551out:
1552 nfs4_unlock_state();
1553error:
1554 dprintk("nfsd4_exchange_id returns %d\n", ntohl(status));
1555 return status;
069b6ad4
AA
1556}
1557
b85d4c01 1558static int
88e588d5 1559check_slot_seqid(u32 seqid, u32 slot_seqid, int slot_inuse)
b85d4c01 1560{
88e588d5
AA
1561 dprintk("%s enter. seqid %d slot_seqid %d\n", __func__, seqid,
1562 slot_seqid);
b85d4c01
BH
1563
1564 /* The slot is in use, and no response has been sent. */
88e588d5
AA
1565 if (slot_inuse) {
1566 if (seqid == slot_seqid)
b85d4c01
BH
1567 return nfserr_jukebox;
1568 else
1569 return nfserr_seq_misordered;
1570 }
1571 /* Normal */
88e588d5 1572 if (likely(seqid == slot_seqid + 1))
b85d4c01
BH
1573 return nfs_ok;
1574 /* Replay */
88e588d5 1575 if (seqid == slot_seqid)
b85d4c01
BH
1576 return nfserr_replay_cache;
1577 /* Wraparound */
88e588d5 1578 if (seqid == 1 && (slot_seqid + 1) == 0)
b85d4c01
BH
1579 return nfs_ok;
1580 /* Misordered replay or misordered new request */
1581 return nfserr_seq_misordered;
1582}
1583
49557cc7
AA
1584/*
1585 * Cache the create session result into the create session single DRC
1586 * slot cache by saving the xdr structure. sl_seqid has been set.
1587 * Do this for solo or embedded create session operations.
1588 */
1589static void
1590nfsd4_cache_create_session(struct nfsd4_create_session *cr_ses,
1591 struct nfsd4_clid_slot *slot, int nfserr)
1592{
1593 slot->sl_status = nfserr;
1594 memcpy(&slot->sl_cr_ses, cr_ses, sizeof(*cr_ses));
1595}
1596
1597static __be32
1598nfsd4_replay_create_session(struct nfsd4_create_session *cr_ses,
1599 struct nfsd4_clid_slot *slot)
1600{
1601 memcpy(cr_ses, &slot->sl_cr_ses, sizeof(*cr_ses));
1602 return slot->sl_status;
1603}
1604
1b74c25b
MJ
/*
 * Size in bytes of the smallest request that still carries a
 * SEQUENCE operation.  Terms are counted in 32-bit XDR words and the
 * sum is scaled by sizeof(__be32).
 */
#define NFSD_MIN_REQ_HDR_SEQ_SZ	((\
			2 * 2 + /* credential,verifier: AUTH_NULL, length 0 */ \
			1 +	/* MIN tag is length with zero, only length */ \
			3 +	/* version, opcount, opcode */ \
			XDR_QUADLEN(NFS4_MAX_SESSIONID_LEN) + \
				/* seqid, slotID, slotID, cache */ \
			4 ) * sizeof(__be32))

/*
 * Size in bytes of the smallest reply that still carries a SEQUENCE
 * result, computed the same way as the request size above.
 */
#define NFSD_MIN_RESP_HDR_SEQ_SZ ((\
			2 +	/* verifier: AUTH_NULL, length 0 */\
			1 +	/* status */ \
			1 +	/* MIN tag is length with zero, only length */ \
			3 +	/* opcount, opcode, opstatus*/ \
			XDR_QUADLEN(NFS4_MAX_SESSIONID_LEN) + \
				/* seqid, slotID, slotID, slotID, status */ \
			5 ) * sizeof(__be32))
1621
1622static __be32 check_forechannel_attrs(struct nfsd4_channel_attrs fchannel)
1623{
1624 return fchannel.maxreq_sz < NFSD_MIN_REQ_HDR_SEQ_SZ
1625 || fchannel.maxresp_sz < NFSD_MIN_RESP_HDR_SEQ_SZ;
1626}
1627
069b6ad4
AA
1628__be32
1629nfsd4_create_session(struct svc_rqst *rqstp,
1630 struct nfsd4_compound_state *cstate,
1631 struct nfsd4_create_session *cr_ses)
1632{
363168b4 1633 struct sockaddr *sa = svc_addr(rqstp);
ec6b5d7b 1634 struct nfs4_client *conf, *unconf;
ac7c46f2 1635 struct nfsd4_session *new;
49557cc7 1636 struct nfsd4_clid_slot *cs_slot = NULL;
86c3e16c 1637 bool confirm_me = false;
ec6b5d7b
AA
1638 int status = 0;
1639
a62573dc
MJ
1640 if (cr_ses->flags & ~SESSION4_FLAG_MASK_A)
1641 return nfserr_inval;
1642
ec6b5d7b
AA
1643 nfs4_lock_state();
1644 unconf = find_unconfirmed_client(&cr_ses->clientid);
1645 conf = find_confirmed_client(&cr_ses->clientid);
1646
1647 if (conf) {
49557cc7
AA
1648 cs_slot = &conf->cl_cs_slot;
1649 status = check_slot_seqid(cr_ses->seqid, cs_slot->sl_seqid, 0);
38eb76a5 1650 if (status == nfserr_replay_cache) {
ec6b5d7b 1651 dprintk("Got a create_session replay! seqid= %d\n",
49557cc7 1652 cs_slot->sl_seqid);
38eb76a5 1653 /* Return the cached reply status */
49557cc7 1654 status = nfsd4_replay_create_session(cr_ses, cs_slot);
38eb76a5 1655 goto out;
49557cc7 1656 } else if (cr_ses->seqid != cs_slot->sl_seqid + 1) {
ec6b5d7b
AA
1657 status = nfserr_seq_misordered;
1658 dprintk("Sequence misordered!\n");
1659 dprintk("Expected seqid= %d but got seqid= %d\n",
49557cc7 1660 cs_slot->sl_seqid, cr_ses->seqid);
ec6b5d7b
AA
1661 goto out;
1662 }
ec6b5d7b
AA
1663 } else if (unconf) {
1664 if (!same_creds(&unconf->cl_cred, &rqstp->rq_cred) ||
363168b4 1665 !rpc_cmp_addr(sa, (struct sockaddr *) &unconf->cl_addr)) {
ec6b5d7b
AA
1666 status = nfserr_clid_inuse;
1667 goto out;
1668 }
1669
49557cc7
AA
1670 cs_slot = &unconf->cl_cs_slot;
1671 status = check_slot_seqid(cr_ses->seqid, cs_slot->sl_seqid, 0);
38eb76a5
AA
1672 if (status) {
1673 /* an unconfirmed replay returns misordered */
ec6b5d7b 1674 status = nfserr_seq_misordered;
cd5b8144 1675 goto out;
ec6b5d7b
AA
1676 }
1677
86c3e16c 1678 confirm_me = true;
ec6b5d7b
AA
1679 conf = unconf;
1680 } else {
1681 status = nfserr_stale_clientid;
1682 goto out;
1683 }
1684
8323c3b2
BF
1685 /*
1686 * XXX: we should probably set this at creation time, and check
1687 * for consistent minorversion use throughout:
1688 */
1689 conf->cl_minorversion = 1;
408b79bc
BF
1690 /*
1691 * We do not support RDMA or persistent sessions
1692 */
1693 cr_ses->flags &= ~SESSION4_PERSIST;
1694 cr_ses->flags &= ~SESSION4_RDMA;
1695
1b74c25b
MJ
1696 status = nfserr_toosmall;
1697 if (check_forechannel_attrs(cr_ses->fore_channel))
1698 goto out;
1699
ac7c46f2
BF
1700 status = nfserr_jukebox;
1701 new = alloc_init_session(rqstp, conf, cr_ses);
1702 if (!new)
ec6b5d7b 1703 goto out;
ac7c46f2
BF
1704 status = nfs_ok;
1705 memcpy(cr_ses->sessionid.data, new->se_sessionid.data,
ec6b5d7b 1706 NFS4_MAX_SESSIONID_LEN);
12050657
MJ
1707 memcpy(&cr_ses->fore_channel, &new->se_fchannel,
1708 sizeof(struct nfsd4_channel_attrs));
86c3e16c 1709 cs_slot->sl_seqid++;
49557cc7 1710 cr_ses->seqid = cs_slot->sl_seqid;
ec6b5d7b 1711
49557cc7
AA
1712 /* cache solo and embedded create sessions under the state lock */
1713 nfsd4_cache_create_session(cr_ses, cs_slot, status);
86c3e16c
BF
1714 if (confirm_me)
1715 move_to_confirmed(conf);
ec6b5d7b
AA
1716out:
1717 nfs4_unlock_state();
1718 dprintk("%s returns %d\n", __func__, ntohl(status));
1719 return status;
069b6ad4
AA
1720}
1721
57716355
BF
1722static bool nfsd4_last_compound_op(struct svc_rqst *rqstp)
1723{
1724 struct nfsd4_compoundres *resp = rqstp->rq_resp;
1725 struct nfsd4_compoundargs *argp = rqstp->rq_argp;
1726
1727 return argp->opcnt == resp->opcnt;
1728}
1729
1d1bc8f2
BF
1730static __be32 nfsd4_map_bcts_dir(u32 *dir)
1731{
1732 switch (*dir) {
1733 case NFS4_CDFC4_FORE:
1734 case NFS4_CDFC4_BACK:
1735 return nfs_ok;
1736 case NFS4_CDFC4_FORE_OR_BOTH:
1737 case NFS4_CDFC4_BACK_OR_BOTH:
1738 *dir = NFS4_CDFC4_BOTH;
1739 return nfs_ok;
1740 };
1741 return nfserr_inval;
1742}
1743
1744__be32 nfsd4_bind_conn_to_session(struct svc_rqst *rqstp,
1745 struct nfsd4_compound_state *cstate,
1746 struct nfsd4_bind_conn_to_session *bcts)
1747{
1748 __be32 status;
1749
1750 if (!nfsd4_last_compound_op(rqstp))
1751 return nfserr_not_only_op;
1752 spin_lock(&client_lock);
1753 cstate->session = find_in_sessionid_hashtbl(&bcts->sessionid);
1754 /* Sorta weird: we only need the refcnt'ing because new_conn acquires
1755 * client_lock iself: */
1756 if (cstate->session) {
1757 nfsd4_get_session(cstate->session);
1758 atomic_inc(&cstate->session->se_client->cl_refcount);
1759 }
1760 spin_unlock(&client_lock);
1761 if (!cstate->session)
1762 return nfserr_badsession;
1763
1764 status = nfsd4_map_bcts_dir(&bcts->dir);
1db2b9dd
BS
1765 if (!status)
1766 nfsd4_new_conn(rqstp, cstate->session, bcts->dir);
1767 return status;
1d1bc8f2
BF
1768}
1769
5d4cec2f
BF
1770static bool nfsd4_compound_in_session(struct nfsd4_session *session, struct nfs4_sessionid *sid)
1771{
1772 if (!session)
1773 return 0;
1774 return !memcmp(sid, &session->se_sessionid, sizeof(*sid));
1775}
1776
069b6ad4
AA
1777__be32
1778nfsd4_destroy_session(struct svc_rqst *r,
1779 struct nfsd4_compound_state *cstate,
1780 struct nfsd4_destroy_session *sessionid)
1781{
e10e0cfc
BH
1782 struct nfsd4_session *ses;
1783 u32 status = nfserr_badsession;
1784
1785 /* Notes:
1786 * - The confirmed nfs4_client->cl_sessionid holds destroyed sessinid
1787 * - Should we return nfserr_back_chan_busy if waiting for
1788 * callbacks on to-be-destroyed session?
1789 * - Do we need to clear any callback info from previous session?
1790 */
1791
5d4cec2f 1792 if (nfsd4_compound_in_session(cstate->session, &sessionid->sessionid)) {
57716355
BF
1793 if (!nfsd4_last_compound_op(r))
1794 return nfserr_not_only_op;
1795 }
e10e0cfc 1796 dump_sessionid(__func__, &sessionid->sessionid);
9089f1b4 1797 spin_lock(&client_lock);
e10e0cfc
BH
1798 ses = find_in_sessionid_hashtbl(&sessionid->sessionid);
1799 if (!ses) {
9089f1b4 1800 spin_unlock(&client_lock);
e10e0cfc
BH
1801 goto out;
1802 }
1803
1804 unhash_session(ses);
9089f1b4 1805 spin_unlock(&client_lock);
e10e0cfc 1806
ab707e15 1807 nfs4_lock_state();
84f5f7cc 1808 nfsd4_probe_callback_sync(ses->se_client);
ab707e15 1809 nfs4_unlock_state();
19cf5c02
BF
1810
1811 nfsd4_del_conns(ses);
1812
e10e0cfc
BH
1813 nfsd4_put_session(ses);
1814 status = nfs_ok;
1815out:
1816 dprintk("%s returns %d\n", __func__, ntohl(status));
1817 return status;
069b6ad4
AA
1818}
1819
a663bdd8 1820static struct nfsd4_conn *__nfsd4_find_conn(struct svc_xprt *xpt, struct nfsd4_session *s)
328ead28
BF
1821{
1822 struct nfsd4_conn *c;
1823
1824 list_for_each_entry(c, &s->se_conns, cn_persession) {
a663bdd8 1825 if (c->cn_xprt == xpt) {
328ead28
BF
1826 return c;
1827 }
1828 }
1829 return NULL;
1830}
1831
a663bdd8 1832static void nfsd4_sequence_check_conn(struct nfsd4_conn *new, struct nfsd4_session *ses)
328ead28
BF
1833{
1834 struct nfs4_client *clp = ses->se_client;
a663bdd8 1835 struct nfsd4_conn *c;
21b75b01 1836 int ret;
328ead28
BF
1837
1838 spin_lock(&clp->cl_lock);
a663bdd8 1839 c = __nfsd4_find_conn(new->cn_xprt, ses);
328ead28
BF
1840 if (c) {
1841 spin_unlock(&clp->cl_lock);
1842 free_conn(new);
1843 return;
1844 }
1845 __nfsd4_hash_conn(new, ses);
1846 spin_unlock(&clp->cl_lock);
21b75b01
BF
1847 ret = nfsd4_register_conn(new);
1848 if (ret)
1849 /* oops; xprt is already down: */
1850 nfsd4_conn_lost(&new->cn_xpt_user);
328ead28
BF
1851 return;
1852}
1853
868b89c3
MJ
1854static bool nfsd4_session_too_many_ops(struct svc_rqst *rqstp, struct nfsd4_session *session)
1855{
1856 struct nfsd4_compoundargs *args = rqstp->rq_argp;
1857
1858 return args->opcnt > session->se_fchannel.maxops;
1859}
1860
ae82a8d0
MJ
1861static bool nfsd4_request_too_big(struct svc_rqst *rqstp,
1862 struct nfsd4_session *session)
1863{
1864 struct xdr_buf *xb = &rqstp->rq_arg;
1865
1866 return xb->len > session->se_fchannel.maxreq_sz;
1867}
1868
069b6ad4 1869__be32
b85d4c01 1870nfsd4_sequence(struct svc_rqst *rqstp,
069b6ad4
AA
1871 struct nfsd4_compound_state *cstate,
1872 struct nfsd4_sequence *seq)
1873{
f9bb94c4 1874 struct nfsd4_compoundres *resp = rqstp->rq_resp;
b85d4c01
BH
1875 struct nfsd4_session *session;
1876 struct nfsd4_slot *slot;
a663bdd8 1877 struct nfsd4_conn *conn;
b85d4c01
BH
1878 int status;
1879
f9bb94c4
AA
1880 if (resp->opcnt != 1)
1881 return nfserr_sequence_pos;
1882
a663bdd8
BF
1883 /*
1884 * Will be either used or freed by nfsd4_sequence_check_conn
1885 * below.
1886 */
1887 conn = alloc_conn(rqstp, NFS4_CDFC4_FORE);
1888 if (!conn)
1889 return nfserr_jukebox;
1890
9089f1b4 1891 spin_lock(&client_lock);
b85d4c01
BH
1892 status = nfserr_badsession;
1893 session = find_in_sessionid_hashtbl(&seq->sessionid);
1894 if (!session)
1895 goto out;
1896
868b89c3
MJ
1897 status = nfserr_too_many_ops;
1898 if (nfsd4_session_too_many_ops(rqstp, session))
1899 goto out;
1900
ae82a8d0
MJ
1901 status = nfserr_req_too_big;
1902 if (nfsd4_request_too_big(rqstp, session))
1903 goto out;
1904
b85d4c01 1905 status = nfserr_badslot;
6c18ba9f 1906 if (seq->slotid >= session->se_fchannel.maxreqs)
b85d4c01
BH
1907 goto out;
1908
557ce264 1909 slot = session->se_slots[seq->slotid];
b85d4c01
BH
1910 dprintk("%s: slotid %d\n", __func__, seq->slotid);
1911
a8dfdaeb
AA
1912 /* We do not negotiate the number of slots yet, so set the
1913 * maxslots to the session maxreqs which is used to encode
1914 * sr_highest_slotid and the sr_target_slot id to maxslots */
1915 seq->maxslots = session->se_fchannel.maxreqs;
1916
88e588d5 1917 status = check_slot_seqid(seq->seqid, slot->sl_seqid, slot->sl_inuse);
b85d4c01
BH
1918 if (status == nfserr_replay_cache) {
1919 cstate->slot = slot;
1920 cstate->session = session;
da3846a2 1921 /* Return the cached reply status and set cstate->status
557ce264 1922 * for nfsd4_proc_compound processing */
bf864a31 1923 status = nfsd4_replay_cache_entry(resp, seq);
da3846a2 1924 cstate->status = nfserr_replay_cache;
aaf84eb9 1925 goto out;
b85d4c01
BH
1926 }
1927 if (status)
1928 goto out;
1929
a663bdd8
BF
1930 nfsd4_sequence_check_conn(conn, session);
1931 conn = NULL;
328ead28 1932
b85d4c01
BH
1933 /* Success! bump slot seqid */
1934 slot->sl_inuse = true;
1935 slot->sl_seqid = seq->seqid;
557ce264 1936 slot->sl_cachethis = seq->cachethis;
b85d4c01
BH
1937
1938 cstate->slot = slot;
1939 cstate->session = session;
1940
b85d4c01 1941out:
26c0c75e 1942 /* Hold a session reference until done processing the compound. */
aaf84eb9 1943 if (cstate->session) {
0d7bb719
BF
1944 struct nfs4_client *clp = session->se_client;
1945
36acb66b 1946 nfsd4_get_session(cstate->session);
0d7bb719
BF
1947 atomic_inc(&clp->cl_refcount);
1948 if (clp->cl_cb_state == NFSD4_CB_DOWN)
1949 seq->status_flags |= SEQ4_STATUS_CB_PATH_DOWN;
aaf84eb9 1950 }
a663bdd8 1951 kfree(conn);
36acb66b 1952 spin_unlock(&client_lock);
b85d4c01
BH
1953 dprintk("%s: return %d\n", __func__, ntohl(status));
1954 return status;
069b6ad4
AA
1955}
1956
4dc6ec00
BF
1957__be32
1958nfsd4_reclaim_complete(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate, struct nfsd4_reclaim_complete *rc)
1959{
bcecf1cc
MJ
1960 int status = 0;
1961
4dc6ec00
BF
1962 if (rc->rca_one_fs) {
1963 if (!cstate->current_fh.fh_dentry)
1964 return nfserr_nofilehandle;
1965 /*
1966 * We don't take advantage of the rca_one_fs case.
1967 * That's OK, it's optional, we can safely ignore it.
1968 */
1969 return nfs_ok;
1970 }
bcecf1cc 1971
4dc6ec00 1972 nfs4_lock_state();
bcecf1cc
MJ
1973 status = nfserr_complete_already;
1974 if (cstate->session->se_client->cl_firststate)
1975 goto out;
1976
1977 status = nfserr_stale_clientid;
1978 if (is_client_expired(cstate->session->se_client))
4dc6ec00
BF
1979 /*
1980 * The following error isn't really legal.
1981 * But we only get here if the client just explicitly
1982 * destroyed the client. Surely it no longer cares what
1983 * error it gets back on an operation for the dead
1984 * client.
1985 */
bcecf1cc
MJ
1986 goto out;
1987
1988 status = nfs_ok;
4dc6ec00 1989 nfsd4_create_clid_dir(cstate->session->se_client);
bcecf1cc 1990out:
4dc6ec00 1991 nfs4_unlock_state();
bcecf1cc 1992 return status;
4dc6ec00
BF
1993}
1994
b37ad28b 1995__be32
b591480b
BF
1996nfsd4_setclientid(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
1997 struct nfsd4_setclientid *setclid)
1da177e4 1998{
a084daf5 1999 struct xdr_netobj clname = setclid->se_name;
1da177e4
LT
2000 nfs4_verifier clverifier = setclid->se_verf;
2001 unsigned int strhashval;
28ce6054 2002 struct nfs4_client *conf, *unconf, *new;
b37ad28b 2003 __be32 status;
a55370a3 2004 char dname[HEXDIR_LEN];
1da177e4 2005
a55370a3
N
2006 status = nfs4_make_rec_clidname(dname, &clname);
2007 if (status)
73aea4ec 2008 return status;
a55370a3 2009
1da177e4
LT
2010 /*
2011 * XXX The Duplicate Request Cache (DRC) has been checked (??)
2012 * We get here on a DRC miss.
2013 */
2014
a55370a3 2015 strhashval = clientstr_hashval(dname);
1da177e4 2016
1da177e4 2017 nfs4_lock_state();
e203d506 2018 conf = find_confirmed_client_by_str(dname, strhashval);
28ce6054 2019 if (conf) {
a186e767 2020 /* RFC 3530 14.2.33 CASE 0: */
1da177e4 2021 status = nfserr_clid_inuse;
e203d506
BF
2022 if (clp_used_exchangeid(conf))
2023 goto out;
026722c2 2024 if (!same_creds(&conf->cl_cred, &rqstp->rq_cred)) {
363168b4
JL
2025 char addr_str[INET6_ADDRSTRLEN];
2026 rpc_ntop((struct sockaddr *) &conf->cl_addr, addr_str,
2027 sizeof(addr_str));
2028 dprintk("NFSD: setclientid: string in use by client "
2029 "at %s\n", addr_str);
1da177e4
LT
2030 goto out;
2031 }
1da177e4 2032 }
a186e767
BF
2033 /*
2034 * section 14.2.33 of RFC 3530 (under the heading "IMPLEMENTATION")
2035 * has a description of SETCLIENTID request processing consisting
2036 * of 5 bullet points, labeled as CASE0 - CASE4 below.
2037 */
e203d506 2038 unconf = find_unconfirmed_client_by_str(dname, strhashval);
3e772463 2039 status = nfserr_jukebox;
1da177e4 2040 if (!conf) {
a186e767
BF
2041 /*
2042 * RFC 3530 14.2.33 CASE 4:
2043 * placed first, because it is the normal case
1da177e4
LT
2044 */
2045 if (unconf)
2046 expire_client(unconf);
b09333c4 2047 new = create_client(clname, dname, rqstp, &clverifier);
a55370a3 2048 if (new == NULL)
1da177e4 2049 goto out;
1da177e4 2050 gen_clid(new);
599e0a22 2051 } else if (same_verf(&conf->cl_verifier, &clverifier)) {
1da177e4 2052 /*
a186e767
BF
2053 * RFC 3530 14.2.33 CASE 1:
2054 * probable callback update
1da177e4 2055 */
31f4a6c1
N
2056 if (unconf) {
2057 /* Note this is removing unconfirmed {*x***},
2058 * which is stronger than RFC recommended {vxc**}.
2059 * This has the advantage that there is at most
2060 * one {*x***} in either list at any time.
2061 */
2062 expire_client(unconf);
1da177e4 2063 }
b09333c4 2064 new = create_client(clname, dname, rqstp, &clverifier);
a55370a3 2065 if (new == NULL)
1da177e4 2066 goto out;
1da177e4 2067 copy_clid(new, conf);
1da177e4
LT
2068 } else if (!unconf) {
2069 /*
a186e767
BF
2070 * RFC 3530 14.2.33 CASE 2:
2071 * probable client reboot; state will be removed if
2072 * confirmed.
1da177e4 2073 */
b09333c4 2074 new = create_client(clname, dname, rqstp, &clverifier);
a55370a3 2075 if (new == NULL)
1da177e4 2076 goto out;
1da177e4 2077 gen_clid(new);
49ba8781 2078 } else {
a186e767
BF
2079 /*
2080 * RFC 3530 14.2.33 CASE 3:
2081 * probable client reboot; state will be removed if
2082 * confirmed.
1da177e4
LT
2083 */
2084 expire_client(unconf);
b09333c4 2085 new = create_client(clname, dname, rqstp, &clverifier);
a55370a3 2086 if (new == NULL)
1da177e4 2087 goto out;
1da177e4 2088 gen_clid(new);
1da177e4 2089 }
8323c3b2
BF
2090 /*
2091 * XXX: we should probably set this at creation time, and check
2092 * for consistent minorversion use throughout:
2093 */
2094 new->cl_minorversion = 0;
6f3d772f 2095 gen_callback(new, setclid, rqstp);
c175b83c 2096 add_to_unconfirmed(new, strhashval);
1da177e4
LT
2097 setclid->se_clientid.cl_boot = new->cl_clientid.cl_boot;
2098 setclid->se_clientid.cl_id = new->cl_clientid.cl_id;
2099 memcpy(setclid->se_confirm.data, new->cl_confirm.data, sizeof(setclid->se_confirm.data));
2100 status = nfs_ok;
2101out:
2102 nfs4_unlock_state();
2103 return status;
2104}
2105
2106
2107/*
a186e767
BF
2108 * Section 14.2.34 of RFC 3530 (under the heading "IMPLEMENTATION") has
2109 * a description of SETCLIENTID_CONFIRM request processing consisting of 4
2110 * bullets, labeled as CASE1 - CASE4 below.
1da177e4 2111 */
b37ad28b 2112__be32
b591480b
BF
2113nfsd4_setclientid_confirm(struct svc_rqst *rqstp,
2114 struct nfsd4_compound_state *cstate,
2115 struct nfsd4_setclientid_confirm *setclientid_confirm)
1da177e4 2116{
363168b4 2117 struct sockaddr *sa = svc_addr(rqstp);
21ab45a4 2118 struct nfs4_client *conf, *unconf;
1da177e4
LT
2119 nfs4_verifier confirm = setclientid_confirm->sc_confirm;
2120 clientid_t * clid = &setclientid_confirm->sc_clientid;
b37ad28b 2121 __be32 status;
1da177e4
LT
2122
2123 if (STALE_CLIENTID(clid))
2124 return nfserr_stale_clientid;
2125 /*
2126 * XXX The Duplicate Request Cache (DRC) has been checked (??)
2127 * We get here on a DRC miss.
2128 */
2129
2130 nfs4_lock_state();
21ab45a4
N
2131
2132 conf = find_confirmed_client(clid);
2133 unconf = find_unconfirmed_client(clid);
2134
2135 status = nfserr_clid_inuse;
363168b4 2136 if (conf && !rpc_cmp_addr((struct sockaddr *) &conf->cl_addr, sa))
21ab45a4 2137 goto out;
363168b4 2138 if (unconf && !rpc_cmp_addr((struct sockaddr *) &unconf->cl_addr, sa))
21ab45a4
N
2139 goto out;
2140
a186e767
BF
2141 /*
2142 * section 14.2.34 of RFC 3530 has a description of
2143 * SETCLIENTID_CONFIRM request processing consisting
2144 * of 4 bullet points, labeled as CASE1 - CASE4 below.
2145 */
366e0c1d 2146 if (conf && unconf && same_verf(&confirm, &unconf->cl_confirm)) {
a186e767
BF
2147 /*
2148 * RFC 3530 14.2.34 CASE 1:
2149 * callback update
2150 */
599e0a22 2151 if (!same_creds(&conf->cl_cred, &unconf->cl_cred))
1da177e4
LT
2152 status = nfserr_clid_inuse;
2153 else {
5a3c9d71
BF
2154 nfsd4_change_callback(conf, &unconf->cl_cb_conn);
2155 nfsd4_probe_callback(conf);
1a69c179 2156 expire_client(unconf);
1da177e4 2157 status = nfs_ok;
1a69c179 2158
1da177e4 2159 }
f3aba4e5 2160 } else if (conf && !unconf) {
a186e767
BF
2161 /*
2162 * RFC 3530 14.2.34 CASE 2:
2163 * probable retransmitted request; play it safe and
2164 * do nothing.
7c79f737 2165 */
599e0a22 2166 if (!same_creds(&conf->cl_cred, &rqstp->rq_cred))
1da177e4 2167 status = nfserr_clid_inuse;
21ab45a4 2168 else
1da177e4 2169 status = nfs_ok;
7c79f737 2170 } else if (!conf && unconf
599e0a22 2171 && same_verf(&unconf->cl_confirm, &confirm)) {
a186e767
BF
2172 /*
2173 * RFC 3530 14.2.34 CASE 3:
2174 * Normal case; new or rebooted client:
7c79f737 2175 */
599e0a22 2176 if (!same_creds(&unconf->cl_cred, &rqstp->rq_cred)) {
1da177e4
LT
2177 status = nfserr_clid_inuse;
2178 } else {
1a69c179
N
2179 unsigned int hash =
2180 clientstr_hashval(unconf->cl_recdir);
2181 conf = find_confirmed_client_by_str(unconf->cl_recdir,
e203d506 2182 hash);
1a69c179 2183 if (conf) {
c7b9a459 2184 nfsd4_remove_clid_dir(conf);
1a69c179
N
2185 expire_client(conf);
2186 }
1da177e4 2187 move_to_confirmed(unconf);
21ab45a4 2188 conf = unconf;
5a3c9d71 2189 nfsd4_probe_callback(conf);
1a69c179 2190 status = nfs_ok;
1da177e4 2191 }
599e0a22
BF
2192 } else if ((!conf || (conf && !same_verf(&conf->cl_confirm, &confirm)))
2193 && (!unconf || (unconf && !same_verf(&unconf->cl_confirm,
7c79f737 2194 &confirm)))) {
a186e767
BF
2195 /*
2196 * RFC 3530 14.2.34 CASE 4:
2197 * Client probably hasn't noticed that we rebooted yet.
7c79f737 2198 */
1da177e4 2199 status = nfserr_stale_clientid;
7c79f737 2200 } else {
08e8987c
N
2201 /* check that we have hit one of the cases...*/
2202 status = nfserr_clid_inuse;
2203 }
1da177e4 2204out:
1da177e4
LT
2205 nfs4_unlock_state();
2206 return status;
2207}
2208
32513b40
BF
2209static struct nfs4_file *nfsd4_alloc_file(void)
2210{
2211 return kmem_cache_alloc(file_slab, GFP_KERNEL);
2212}
2213
1da177e4 2214/* OPEN Share state helper functions */
32513b40 2215static void nfsd4_init_file(struct nfs4_file *fp, struct inode *ino)
1da177e4 2216{
1da177e4
LT
2217 unsigned int hashval = file_hashval(ino);
2218
32513b40
BF
2219 atomic_set(&fp->fi_ref, 1);
2220 INIT_LIST_HEAD(&fp->fi_hash);
2221 INIT_LIST_HEAD(&fp->fi_stateids);
2222 INIT_LIST_HEAD(&fp->fi_delegations);
2223 fp->fi_inode = igrab(ino);
2224 fp->fi_had_conflict = false;
2225 fp->fi_lease = NULL;
2226 memset(fp->fi_fds, 0, sizeof(fp->fi_fds));
2227 memset(fp->fi_access, 0, sizeof(fp->fi_access));
2228 spin_lock(&recall_lock);
2229 list_add(&fp->fi_hash, &file_hashtbl[hashval]);
2230 spin_unlock(&recall_lock);
1da177e4
LT
2231}
2232
e60d4398 2233static void
e18b890b 2234nfsd4_free_slab(struct kmem_cache **slab)
1da177e4 2235{
e60d4398
N
2236 if (*slab == NULL)
2237 return;
1a1d92c1 2238 kmem_cache_destroy(*slab);
e60d4398 2239 *slab = NULL;
1da177e4
LT
2240}
2241
e8ff2a84 2242void
1da177e4
LT
2243nfsd4_free_slabs(void)
2244{
fe0750e5
BF
2245 nfsd4_free_slab(&openowner_slab);
2246 nfsd4_free_slab(&lockowner_slab);
e60d4398 2247 nfsd4_free_slab(&file_slab);
5ac049ac 2248 nfsd4_free_slab(&stateid_slab);
5b2d21c1 2249 nfsd4_free_slab(&deleg_slab);
e60d4398 2250}
1da177e4 2251
e60d4398
N
2252static int
2253nfsd4_init_slabs(void)
2254{
fe0750e5
BF
2255 openowner_slab = kmem_cache_create("nfsd4_openowners",
2256 sizeof(struct nfs4_openowner), 0, 0, NULL);
2257 if (openowner_slab == NULL)
2258 goto out_nomem;
2259 lockowner_slab = kmem_cache_create("nfsd4_lockowners",
2260 sizeof(struct nfs4_openowner), 0, 0, NULL);
2261 if (lockowner_slab == NULL)
e60d4398
N
2262 goto out_nomem;
2263 file_slab = kmem_cache_create("nfsd4_files",
20c2df83 2264 sizeof(struct nfs4_file), 0, 0, NULL);
e60d4398
N
2265 if (file_slab == NULL)
2266 goto out_nomem;
5ac049ac 2267 stateid_slab = kmem_cache_create("nfsd4_stateids",
dcef0413 2268 sizeof(struct nfs4_ol_stateid), 0, 0, NULL);
5ac049ac
N
2269 if (stateid_slab == NULL)
2270 goto out_nomem;
5b2d21c1 2271 deleg_slab = kmem_cache_create("nfsd4_delegations",
20c2df83 2272 sizeof(struct nfs4_delegation), 0, 0, NULL);
5b2d21c1
N
2273 if (deleg_slab == NULL)
2274 goto out_nomem;
e60d4398
N
2275 return 0;
2276out_nomem:
2277 nfsd4_free_slabs();
2278 dprintk("nfsd4: out of memory while initializing nfsv4\n");
2279 return -ENOMEM;
1da177e4
LT
2280}
2281
fe0750e5
BF
2282void nfs4_free_openowner(struct nfs4_openowner *oo)
2283{
2284 kfree(oo->oo_owner.so_owner.data);
2285 kmem_cache_free(openowner_slab, oo);
2286}
2287
2288void nfs4_free_lockowner(struct nfs4_lockowner *lo)
1da177e4 2289{
fe0750e5
BF
2290 kfree(lo->lo_owner.so_owner.data);
2291 kmem_cache_free(lockowner_slab, lo);
1da177e4
LT
2292}
2293
ff194bd9 2294static void init_nfs4_replay(struct nfs4_replay *rp)
1da177e4 2295{
ff194bd9
BF
2296 rp->rp_status = nfserr_serverfault;
2297 rp->rp_buflen = 0;
2298 rp->rp_buf = rp->rp_ibuf;
1da177e4
LT
2299}
2300
fe0750e5 2301static inline void *alloc_stateowner(struct kmem_cache *slab, struct xdr_netobj *owner, struct nfs4_client *clp)
ff194bd9 2302{
1da177e4 2303 struct nfs4_stateowner *sop;
1da177e4 2304
fe0750e5 2305 sop = kmem_cache_alloc(slab, GFP_KERNEL);
ff194bd9
BF
2306 if (!sop)
2307 return NULL;
2308
2309 sop->so_owner.data = kmemdup(owner->data, owner->len, GFP_KERNEL);
2310 if (!sop->so_owner.data) {
fe0750e5 2311 kmem_cache_free(slab, sop);
1da177e4 2312 return NULL;
ff194bd9
BF
2313 }
2314 sop->so_owner.len = owner->len;
2315
ea1da636 2316 INIT_LIST_HEAD(&sop->so_stateids);
ff194bd9
BF
2317 sop->so_client = clp;
2318 init_nfs4_replay(&sop->so_replay);
2319 return sop;
2320}
2321
fe0750e5 2322static void hash_openowner(struct nfs4_openowner *oo, struct nfs4_client *clp, unsigned int strhashval)
ff194bd9 2323{
fe0750e5
BF
2324 list_add(&oo->oo_owner.so_strhash, &open_ownerstr_hashtbl[strhashval]);
2325 list_add(&oo->oo_perclient, &clp->cl_openowners);
ff194bd9
BF
2326}
2327
fe0750e5 2328static struct nfs4_openowner *
ff194bd9 2329alloc_init_open_stateowner(unsigned int strhashval, struct nfs4_client *clp, struct nfsd4_open *open) {
fe0750e5 2330 struct nfs4_openowner *oo;
ff194bd9 2331
fe0750e5
BF
2332 oo = alloc_stateowner(openowner_slab, &open->op_owner, clp);
2333 if (!oo)
ff194bd9 2334 return NULL;
fe0750e5
BF
2335 oo->oo_owner.so_is_open_owner = 1;
2336 oo->oo_owner.so_seqid = open->op_seqid;
d29b20cd 2337 oo->oo_flags = NFS4_OO_NEW;
fe0750e5 2338 oo->oo_time = 0;
38c387b5 2339 oo->oo_last_closed_stid = NULL;
fe0750e5
BF
2340 INIT_LIST_HEAD(&oo->oo_close_lru);
2341 hash_openowner(oo, clp, strhashval);
2342 return oo;
1da177e4
LT
2343}
2344
996e0938 2345static void init_open_stateid(struct nfs4_ol_stateid *stp, struct nfs4_file *fp, struct nfsd4_open *open) {
fe0750e5 2346 struct nfs4_openowner *oo = open->op_openowner;
d3b313a4 2347 struct nfs4_client *clp = oo->oo_owner.so_client;
1da177e4 2348
996e0938 2349 init_stid(&stp->st_stid, clp, NFS4_OPEN_STID);
ea1da636 2350 INIT_LIST_HEAD(&stp->st_lockowners);
fe0750e5 2351 list_add(&stp->st_perstateowner, &oo->oo_owner.so_stateids);
8beefa24 2352 list_add(&stp->st_perfile, &fp->fi_stateids);
fe0750e5 2353 stp->st_stateowner = &oo->oo_owner;
13cd2184 2354 get_nfs4_file(fp);
1da177e4 2355 stp->st_file = fp;
1da177e4
LT
2356 stp->st_access_bmap = 0;
2357 stp->st_deny_bmap = 0;
b6d2f1ca 2358 __set_bit(open->op_share_access, &stp->st_access_bmap);
1da177e4 2359 __set_bit(open->op_share_deny, &stp->st_deny_bmap);
4c4cd222 2360 stp->st_openstp = NULL;
1da177e4
LT
2361}
2362
fd39ca9a 2363static void
fe0750e5 2364move_to_close_lru(struct nfs4_openowner *oo)
1da177e4 2365{
fe0750e5 2366 dprintk("NFSD: move_to_close_lru nfs4_openowner %p\n", oo);
1da177e4 2367
fe0750e5
BF
2368 list_move_tail(&oo->oo_close_lru, &close_lru);
2369 oo->oo_time = get_seconds();
1da177e4
LT
2370}
2371
1da177e4 2372static int
599e0a22
BF
2373same_owner_str(struct nfs4_stateowner *sop, struct xdr_netobj *owner,
2374 clientid_t *clid)
2375{
2376 return (sop->so_owner.len == owner->len) &&
2377 0 == memcmp(sop->so_owner.data, owner->data, owner->len) &&
2378 (sop->so_client->cl_clientid.cl_id == clid->cl_id);
1da177e4
LT
2379}
2380
fe0750e5 2381static struct nfs4_openowner *
1da177e4
LT
2382find_openstateowner_str(unsigned int hashval, struct nfsd4_open *open)
2383{
a50d2ad1
BF
2384 struct nfs4_stateowner *so;
2385 struct nfs4_openowner *oo;
1da177e4 2386
506f275f 2387 list_for_each_entry(so, &open_ownerstr_hashtbl[hashval], so_strhash) {
a50d2ad1
BF
2388 if (same_owner_str(so, &open->op_owner, &open->op_clientid)) {
2389 oo = openowner(so);
2390 renew_client(oo->oo_owner.so_client);
2391 return oo;
2392 }
1da177e4
LT
2393 }
2394 return NULL;
2395}
2396
2397/* search file_hashtbl[] for file */
2398static struct nfs4_file *
2399find_file(struct inode *ino)
2400{
2401 unsigned int hashval = file_hashval(ino);
2402 struct nfs4_file *fp;
2403
8b671b80 2404 spin_lock(&recall_lock);
1da177e4 2405 list_for_each_entry(fp, &file_hashtbl[hashval], fi_hash) {
13cd2184
N
2406 if (fp->fi_inode == ino) {
2407 get_nfs4_file(fp);
8b671b80 2408 spin_unlock(&recall_lock);
1da177e4 2409 return fp;
13cd2184 2410 }
1da177e4 2411 }
8b671b80 2412 spin_unlock(&recall_lock);
1da177e4
LT
2413 return NULL;
2414}
2415
1da177e4
LT
2416/*
2417 * Called to check deny when READ with all zero stateid or
2418 * WRITE with all zero or all one stateid
2419 */
b37ad28b 2420static __be32
1da177e4
LT
2421nfs4_share_conflict(struct svc_fh *current_fh, unsigned int deny_type)
2422{
2423 struct inode *ino = current_fh->fh_dentry->d_inode;
2424 struct nfs4_file *fp;
dcef0413 2425 struct nfs4_ol_stateid *stp;
b37ad28b 2426 __be32 ret;
1da177e4
LT
2427
2428 dprintk("NFSD: nfs4_share_conflict\n");
2429
2430 fp = find_file(ino);
13cd2184
N
2431 if (!fp)
2432 return nfs_ok;
b700949b 2433 ret = nfserr_locked;
1da177e4 2434 /* Search for conflicting share reservations */
13cd2184
N
2435 list_for_each_entry(stp, &fp->fi_stateids, st_perfile) {
2436 if (test_bit(deny_type, &stp->st_deny_bmap) ||
2437 test_bit(NFS4_SHARE_DENY_BOTH, &stp->st_deny_bmap))
2438 goto out;
1da177e4 2439 }
13cd2184
N
2440 ret = nfs_ok;
2441out:
2442 put_nfs4_file(fp);
2443 return ret;
1da177e4
LT
2444}
2445
6b57d9c8 2446static void nfsd_break_one_deleg(struct nfs4_delegation *dp)
1da177e4 2447{
1da177e4
LT
2448 /* We're assuming the state code never drops its reference
2449 * without first removing the lease. Since we're in this lease
2450 * callback (and since the lease code is serialized by the kernel
2451 * lock) we know the server hasn't removed the lease yet, we know
2452 * it's safe to take a reference: */
2453 atomic_inc(&dp->dl_count);
2454
1da177e4 2455 list_add_tail(&dp->dl_recall_lru, &del_recall_lru);
1da177e4 2456
460781b5 2457 /* only place dl_time is set. protected by lock_flocks*/
1da177e4
LT
2458 dp->dl_time = get_seconds();
2459
6b57d9c8
BF
2460 nfsd4_cb_recall(dp);
2461}
2462
acfdf5c3 2463/* Called from break_lease() with lock_flocks() held. */
6b57d9c8
BF
2464static void nfsd_break_deleg_cb(struct file_lock *fl)
2465{
acfdf5c3
BF
2466 struct nfs4_file *fp = (struct nfs4_file *)fl->fl_owner;
2467 struct nfs4_delegation *dp;
6b57d9c8 2468
acfdf5c3
BF
2469 BUG_ON(!fp);
2470 /* We assume break_lease is only called once per lease: */
2471 BUG_ON(fp->fi_had_conflict);
0272e1fd
BF
2472 /*
2473 * We don't want the locks code to timeout the lease for us;
acfdf5c3 2474 * we'll remove it ourself if a delegation isn't returned
6b57d9c8 2475 * in time:
0272e1fd
BF
2476 */
2477 fl->fl_break_time = 0;
1da177e4 2478
5d926e8c 2479 spin_lock(&recall_lock);
acfdf5c3
BF
2480 fp->fi_had_conflict = true;
2481 list_for_each_entry(dp, &fp->fi_delegations, dl_perfile)
2482 nfsd_break_one_deleg(dp);
5d926e8c 2483 spin_unlock(&recall_lock);
1da177e4
LT
2484}
2485
1da177e4
LT
2486static
2487int nfsd_change_deleg_cb(struct file_lock **onlist, int arg)
2488{
2489 if (arg & F_UNLCK)
2490 return lease_modify(onlist, arg);
2491 else
2492 return -EAGAIN;
2493}
2494
7b021967 2495static const struct lock_manager_operations nfsd_lease_mng_ops = {
8fb47a4f
BF
2496 .lm_break = nfsd_break_deleg_cb,
2497 .lm_change = nfsd_change_deleg_cb,
1da177e4
LT
2498};
2499
7a8711c9
BF
2500static __be32 nfsd4_check_seqid(struct nfsd4_compound_state *cstate, struct nfs4_stateowner *so, u32 seqid)
2501{
2502 if (nfsd4_has_session(cstate))
2503 return nfs_ok;
2504 if (seqid == so->so_seqid - 1)
2505 return nfserr_replay_me;
2506 if (seqid == so->so_seqid)
2507 return nfs_ok;
2508 return nfserr_bad_seqid;
2509}
1da177e4 2510
b37ad28b 2511__be32
6668958f
AA
2512nfsd4_process_open1(struct nfsd4_compound_state *cstate,
2513 struct nfsd4_open *open)
1da177e4 2514{
1da177e4
LT
2515 clientid_t *clientid = &open->op_clientid;
2516 struct nfs4_client *clp = NULL;
2517 unsigned int strhashval;
fe0750e5 2518 struct nfs4_openowner *oo = NULL;
4cdc951b 2519 __be32 status;
1da177e4 2520
1da177e4
LT
2521 if (STALE_CLIENTID(&open->op_clientid))
2522 return nfserr_stale_clientid;
32513b40
BF
2523 /*
2524 * In case we need it later, after we've already created the
2525 * file and don't want to risk a further failure:
2526 */
2527 open->op_file = nfsd4_alloc_file();
2528 if (open->op_file == NULL)
2529 return nfserr_jukebox;
1da177e4 2530
506f275f 2531 strhashval = open_ownerstr_hashval(clientid->cl_id, &open->op_owner);
fe0750e5
BF
2532 oo = find_openstateowner_str(strhashval, open);
2533 open->op_openowner = oo;
2534 if (!oo) {
1da177e4
LT
2535 clp = find_confirmed_client(clientid);
2536 if (clp == NULL)
0f442aa2 2537 return nfserr_expired;
bcf130f9 2538 goto new_owner;
1da177e4 2539 }
dad1c067 2540 if (!(oo->oo_flags & NFS4_OO_CONFIRMED)) {
0f442aa2 2541 /* Replace unconfirmed owners without checking for replay. */
fe0750e5
BF
2542 clp = oo->oo_owner.so_client;
2543 release_openowner(oo);
2544 open->op_openowner = NULL;
bcf130f9 2545 goto new_owner;
0f442aa2 2546 }
4cdc951b
BF
2547 status = nfsd4_check_seqid(cstate, &oo->oo_owner, open->op_seqid);
2548 if (status)
2549 return status;
2550 clp = oo->oo_owner.so_client;
2551 goto alloc_stateid;
bcf130f9
BF
2552new_owner:
2553 oo = alloc_init_open_stateowner(strhashval, clp, open);
2554 if (oo == NULL)
2555 return nfserr_jukebox;
2556 open->op_openowner = oo;
4cdc951b
BF
2557alloc_stateid:
2558 open->op_stp = nfs4_alloc_stateid(clp);
2559 if (!open->op_stp)
2560 return nfserr_jukebox;
0f442aa2 2561 return nfs_ok;
1da177e4
LT
2562}
2563
b37ad28b 2564static inline __be32
4a6e43e6
N
2565nfs4_check_delegmode(struct nfs4_delegation *dp, int flags)
2566{
2567 if ((flags & WR_STATE) && (dp->dl_type == NFS4_OPEN_DELEGATE_READ))
2568 return nfserr_openmode;
2569 else
2570 return nfs_ok;
2571}
2572
f459e453 2573static int share_access_to_flags(u32 share_access)
52f4fb43 2574{
f459e453 2575 share_access &= ~NFS4_SHARE_WANT_MASK;
52f4fb43 2576
f459e453 2577 return share_access == NFS4_SHARE_ACCESS_READ ? RD_STATE : WR_STATE;
52f4fb43
N
2578}
2579
38c2f4b1 2580static struct nfs4_delegation *find_deleg_stateid(struct nfs4_client *cl, stateid_t *s)
24a0111e 2581{
f459e453 2582 struct nfs4_stid *ret;
24a0111e 2583
38c2f4b1 2584 ret = find_stateid_by_type(cl, s, NFS4_DELEG_STID);
f459e453
BF
2585 if (!ret)
2586 return NULL;
2587 return delegstateid(ret);
24a0111e
BF
2588}
2589
b37ad28b 2590static __be32
38c2f4b1 2591nfs4_check_deleg(struct nfs4_client *cl, struct nfs4_file *fp, struct nfsd4_open *open,
567d9829
N
2592 struct nfs4_delegation **dp)
2593{
2594 int flags;
b37ad28b 2595 __be32 status = nfserr_bad_stateid;
567d9829 2596
38c2f4b1 2597 *dp = find_deleg_stateid(cl, &open->op_delegate_stateid);
567d9829 2598 if (*dp == NULL)
c44c5eeb 2599 goto out;
24a0111e 2600 flags = share_access_to_flags(open->op_share_access);
567d9829
N
2601 status = nfs4_check_delegmode(*dp, flags);
2602 if (status)
2603 *dp = NULL;
c44c5eeb
N
2604out:
2605 if (open->op_claim_type != NFS4_OPEN_CLAIM_DELEGATE_CUR)
2606 return nfs_ok;
2607 if (status)
2608 return status;
dad1c067 2609 open->op_openowner->oo_flags |= NFS4_OO_CONFIRMED;
c44c5eeb 2610 return nfs_ok;
567d9829
N
2611}
2612
b37ad28b 2613static __be32
dcef0413 2614nfs4_check_open(struct nfs4_file *fp, struct nfsd4_open *open, struct nfs4_ol_stateid **stpp)
1da177e4 2615{
dcef0413 2616 struct nfs4_ol_stateid *local;
fe0750e5 2617 struct nfs4_openowner *oo = open->op_openowner;
1da177e4 2618
8beefa24 2619 list_for_each_entry(local, &fp->fi_stateids, st_perfile) {
1da177e4
LT
2620 /* ignore lock owners */
2621 if (local->st_stateowner->so_is_open_owner == 0)
2622 continue;
2623 /* remember if we have seen this open owner */
fe0750e5 2624 if (local->st_stateowner == &oo->oo_owner)
1da177e4
LT
2625 *stpp = local;
2626 /* check for conflicting share reservations */
2627 if (!test_share(local, open))
77eaae8d 2628 return nfserr_share_denied;
1da177e4 2629 }
77eaae8d 2630 return nfs_ok;
1da177e4
LT
2631}
2632
996e0938
BF
2633static void nfs4_free_stateid(struct nfs4_ol_stateid *s)
2634{
2635 kmem_cache_free(stateid_slab, s);
5ac049ac
N
2636}
2637
21fb4016
BF
2638static inline int nfs4_access_to_access(u32 nfs4_access)
2639{
2640 int flags = 0;
2641
2642 if (nfs4_access & NFS4_SHARE_ACCESS_READ)
2643 flags |= NFSD_MAY_READ;
2644 if (nfs4_access & NFS4_SHARE_ACCESS_WRITE)
2645 flags |= NFSD_MAY_WRITE;
2646 return flags;
2647}
2648
0c12eaff
CB
2649static __be32 nfs4_get_vfs_file(struct svc_rqst *rqstp, struct nfs4_file *fp,
2650 struct svc_fh *cur_fh, struct nfsd4_open *open)
f9d7562f
BF
2651{
2652 __be32 status;
0c12eaff
CB
2653 int oflag = nfs4_access_to_omode(open->op_share_access);
2654 int access = nfs4_access_to_access(open->op_share_access);
2655
f9d7562f
BF
2656 if (!fp->fi_fds[oflag]) {
2657 status = nfsd_open(rqstp, cur_fh, S_IFREG, access,
2658 &fp->fi_fds[oflag]);
f9d7562f
BF
2659 if (status)
2660 return status;
2661 }
2662 nfs4_file_get_access(fp, oflag);
2663
2664 return nfs_ok;
2665}
2666
b37ad28b 2667static inline __be32
1da177e4
LT
2668nfsd4_truncate(struct svc_rqst *rqstp, struct svc_fh *fh,
2669 struct nfsd4_open *open)
2670{
2671 struct iattr iattr = {
2672 .ia_valid = ATTR_SIZE,
2673 .ia_size = 0,
2674 };
2675 if (!open->op_truncate)
2676 return 0;
2677 if (!(open->op_share_access & NFS4_SHARE_ACCESS_WRITE))
9246585a 2678 return nfserr_inval;
1da177e4
LT
2679 return nfsd_setattr(rqstp, fh, &iattr, 0, (time_t)0);
2680}
2681
b37ad28b 2682static __be32
dcef0413 2683nfs4_upgrade_open(struct svc_rqst *rqstp, struct nfs4_file *fp, struct svc_fh *cur_fh, struct nfs4_ol_stateid *stp, struct nfsd4_open *open)
1da177e4 2684{
b6d2f1ca 2685 u32 op_share_access = open->op_share_access;
7d947842 2686 bool new_access;
b37ad28b 2687 __be32 status;
1da177e4 2688
7d947842 2689 new_access = !test_bit(op_share_access, &stp->st_access_bmap);
f9d7562f 2690 if (new_access) {
0c12eaff 2691 status = nfs4_get_vfs_file(rqstp, fp, cur_fh, open);
f9d7562f
BF
2692 if (status)
2693 return status;
6c26d08f 2694 }
1da177e4
LT
2695 status = nfsd4_truncate(rqstp, cur_fh, open);
2696 if (status) {
f9d7562f 2697 if (new_access) {
f197c271 2698 int oflag = nfs4_access_to_omode(op_share_access);
f9d7562f
BF
2699 nfs4_file_put_access(fp, oflag);
2700 }
1da177e4
LT
2701 return status;
2702 }
2703 /* remember the open */
24a0111e 2704 __set_bit(op_share_access, &stp->st_access_bmap);
b55e0ba1 2705 __set_bit(open->op_share_deny, &stp->st_deny_bmap);
1da177e4
LT
2706
2707 return nfs_ok;
2708}
2709
2710
1da177e4 2711static void
37515177 2712nfs4_set_claim_prev(struct nfsd4_open *open)
1da177e4 2713{
dad1c067 2714 open->op_openowner->oo_flags |= NFS4_OO_CONFIRMED;
fe0750e5 2715 open->op_openowner->oo_owner.so_client->cl_firststate = 1;
1da177e4
LT
2716}
2717
14a24e99
BF
2718/* Should we give out recallable state?: */
2719static bool nfsd4_cb_channel_good(struct nfs4_client *clp)
2720{
2721 if (clp->cl_cb_state == NFSD4_CB_UP)
2722 return true;
2723 /*
2724 * In the sessions case, since we don't have to establish a
2725 * separate connection for callbacks, we assume it's OK
2726 * until we hear otherwise:
2727 */
2728 return clp->cl_minorversion && clp->cl_cb_state == NFSD4_CB_UNKNOWN;
2729}
2730
22d38c4c
BF
2731static struct file_lock *nfs4_alloc_init_lease(struct nfs4_delegation *dp, int flag)
2732{
2733 struct file_lock *fl;
2734
2735 fl = locks_alloc_lock();
2736 if (!fl)
2737 return NULL;
2738 locks_init_lock(fl);
2739 fl->fl_lmops = &nfsd_lease_mng_ops;
2740 fl->fl_flags = FL_LEASE;
2741 fl->fl_type = flag == NFS4_OPEN_DELEGATE_READ? F_RDLCK: F_WRLCK;
2742 fl->fl_end = OFFSET_MAX;
acfdf5c3 2743 fl->fl_owner = (fl_owner_t)(dp->dl_file);
22d38c4c 2744 fl->fl_pid = current->tgid;
22d38c4c
BF
2745 return fl;
2746}
2747
edab9782
BF
2748static int nfs4_setlease(struct nfs4_delegation *dp, int flag)
2749{
acfdf5c3 2750 struct nfs4_file *fp = dp->dl_file;
edab9782
BF
2751 struct file_lock *fl;
2752 int status;
2753
2754 fl = nfs4_alloc_init_lease(dp, flag);
2755 if (!fl)
2756 return -ENOMEM;
acfdf5c3 2757 fl->fl_file = find_readable_file(fp);
2a74aba7 2758 list_add(&dp->dl_perclnt, &dp->dl_stid.sc_client->cl_delegations);
acfdf5c3 2759 status = vfs_setlease(fl->fl_file, fl->fl_type, &fl);
edab9782 2760 if (status) {
acfdf5c3 2761 list_del_init(&dp->dl_perclnt);
edab9782
BF
2762 locks_free_lock(fl);
2763 return -ENOMEM;
2764 }
acfdf5c3
BF
2765 fp->fi_lease = fl;
2766 fp->fi_deleg_file = fl->fl_file;
2767 get_file(fp->fi_deleg_file);
2768 atomic_set(&fp->fi_delegees, 1);
2769 list_add(&dp->dl_perfile, &fp->fi_delegations);
2770 return 0;
2771}
2772
2773static int nfs4_set_delegation(struct nfs4_delegation *dp, int flag)
2774{
2775 struct nfs4_file *fp = dp->dl_file;
2776
2777 if (!fp->fi_lease)
2778 return nfs4_setlease(dp, flag);
2779 spin_lock(&recall_lock);
2780 if (fp->fi_had_conflict) {
2781 spin_unlock(&recall_lock);
2782 return -EAGAIN;
2783 }
2784 atomic_inc(&fp->fi_delegees);
2785 list_add(&dp->dl_perfile, &fp->fi_delegations);
2786 spin_unlock(&recall_lock);
2a74aba7 2787 list_add(&dp->dl_perclnt, &dp->dl_stid.sc_client->cl_delegations);
edab9782
BF
2788 return 0;
2789}
2790
1da177e4
LT
2791/*
2792 * Attempt to hand out a delegation.
2793 */
2794static void
dcef0413 2795nfs4_open_delegation(struct svc_fh *fh, struct nfsd4_open *open, struct nfs4_ol_stateid *stp)
1da177e4
LT
2796{
2797 struct nfs4_delegation *dp;
fe0750e5 2798 struct nfs4_openowner *oo = container_of(stp->st_stateowner, struct nfs4_openowner, oo_owner);
14a24e99 2799 int cb_up;
1da177e4
LT
2800 int status, flag = 0;
2801
fe0750e5 2802 cb_up = nfsd4_cb_channel_good(oo->oo_owner.so_client);
1da177e4 2803 flag = NFS4_OPEN_DELEGATE_NONE;
7b190fec
N
2804 open->op_recall = 0;
2805 switch (open->op_claim_type) {
2806 case NFS4_OPEN_CLAIM_PREVIOUS:
2bf23875 2807 if (!cb_up)
7b190fec
N
2808 open->op_recall = 1;
2809 flag = open->op_delegate_type;
2810 if (flag == NFS4_OPEN_DELEGATE_NONE)
2811 goto out;
2812 break;
2813 case NFS4_OPEN_CLAIM_NULL:
2814 /* Let's not give out any delegations till everyone's
2815 * had the chance to reclaim theirs.... */
af558e33 2816 if (locks_in_grace())
7b190fec 2817 goto out;
dad1c067 2818 if (!cb_up || !(oo->oo_flags & NFS4_OO_CONFIRMED))
7b190fec
N
2819 goto out;
2820 if (open->op_share_access & NFS4_SHARE_ACCESS_WRITE)
2821 flag = NFS4_OPEN_DELEGATE_WRITE;
2822 else
2823 flag = NFS4_OPEN_DELEGATE_READ;
2824 break;
2825 default:
2826 goto out;
2827 }
1da177e4 2828
fe0750e5 2829 dp = alloc_init_deleg(oo->oo_owner.so_client, stp, fh, flag);
dd239cc0
BF
2830 if (dp == NULL)
2831 goto out_no_deleg;
acfdf5c3 2832 status = nfs4_set_delegation(dp, flag);
edab9782 2833 if (status)
dd239cc0 2834 goto out_free;
1da177e4 2835
d5477a8d 2836 memcpy(&open->op_delegate_stateid, &dp->dl_stid.sc_stateid, sizeof(dp->dl_stid.sc_stateid));
1da177e4 2837
8c10cbdb 2838 dprintk("NFSD: delegation stateid=" STATEID_FMT "\n",
d5477a8d 2839 STATEID_VAL(&dp->dl_stid.sc_stateid));
1da177e4 2840out:
7b190fec
N
2841 if (open->op_claim_type == NFS4_OPEN_CLAIM_PREVIOUS
2842 && flag == NFS4_OPEN_DELEGATE_NONE
2843 && open->op_delegate_type != NFS4_OPEN_DELEGATE_NONE)
2fdada03 2844 dprintk("NFSD: WARNING: refusing delegation reclaim\n");
1da177e4 2845 open->op_delegate_type = flag;
dd239cc0
BF
2846 return;
2847out_free:
acfdf5c3 2848 nfs4_put_delegation(dp);
dd239cc0
BF
2849out_no_deleg:
2850 flag = NFS4_OPEN_DELEGATE_NONE;
2851 goto out;
1da177e4
LT
2852}
2853
2854/*
2855 * called with nfs4_lock_state() held.
2856 */
b37ad28b 2857__be32
1da177e4
LT
2858nfsd4_process_open2(struct svc_rqst *rqstp, struct svc_fh *current_fh, struct nfsd4_open *open)
2859{
6668958f 2860 struct nfsd4_compoundres *resp = rqstp->rq_resp;
38c2f4b1 2861 struct nfs4_client *cl = open->op_openowner->oo_owner.so_client;
1da177e4
LT
2862 struct nfs4_file *fp = NULL;
2863 struct inode *ino = current_fh->fh_dentry->d_inode;
dcef0413 2864 struct nfs4_ol_stateid *stp = NULL;
567d9829 2865 struct nfs4_delegation *dp = NULL;
b37ad28b 2866 __be32 status;
1da177e4 2867
1da177e4
LT
2868 /*
2869 * Lookup file; if found, lookup stateid and check open request,
2870 * and check for delegations in the process of being recalled.
2871 * If not found, create the nfs4_file struct
2872 */
2873 fp = find_file(ino);
2874 if (fp) {
2875 if ((status = nfs4_check_open(fp, open, &stp)))
2876 goto out;
38c2f4b1 2877 status = nfs4_check_deleg(cl, fp, open, &dp);
c44c5eeb
N
2878 if (status)
2879 goto out;
1da177e4 2880 } else {
c44c5eeb
N
2881 status = nfserr_bad_stateid;
2882 if (open->op_claim_type == NFS4_OPEN_CLAIM_DELEGATE_CUR)
2883 goto out;
3e772463 2884 status = nfserr_jukebox;
32513b40
BF
2885 fp = open->op_file;
2886 open->op_file = NULL;
2887 nfsd4_init_file(fp, ino);
1da177e4
LT
2888 }
2889
2890 /*
2891 * OPEN the file, or upgrade an existing OPEN.
2892 * If truncate fails, the OPEN fails.
2893 */
2894 if (stp) {
2895 /* Stateid was found, this is an OPEN upgrade */
f9d7562f 2896 status = nfs4_upgrade_open(rqstp, fp, current_fh, stp, open);
1da177e4
LT
2897 if (status)
2898 goto out;
2899 } else {
4cdc951b 2900 status = nfs4_get_vfs_file(rqstp, fp, current_fh, open);
567d9829 2901 if (status)
1da177e4 2902 goto out;
4cdc951b
BF
2903 stp = open->op_stp;
2904 open->op_stp = NULL;
996e0938 2905 init_open_stateid(stp, fp, open);
1da177e4
LT
2906 status = nfsd4_truncate(rqstp, current_fh, open);
2907 if (status) {
2283963f 2908 release_open_stateid(stp);
1da177e4
LT
2909 goto out;
2910 }
2911 }
dcef0413
BF
2912 update_stateid(&stp->st_stid.sc_stateid);
2913 memcpy(&open->op_stateid, &stp->st_stid.sc_stateid, sizeof(stateid_t));
1da177e4 2914
4dc6ec00 2915 if (nfsd4_has_session(&resp->cstate))
dad1c067 2916 open->op_openowner->oo_flags |= NFS4_OO_CONFIRMED;
6668958f 2917
1da177e4
LT
2918 /*
2919 * Attempt to hand out a delegation. No error return, because the
2920 * OPEN succeeds even if we fail.
2921 */
2922 nfs4_open_delegation(current_fh, open, stp);
2923
2924 status = nfs_ok;
2925
8c10cbdb 2926 dprintk("%s: stateid=" STATEID_FMT "\n", __func__,
dcef0413 2927 STATEID_VAL(&stp->st_stid.sc_stateid));
1da177e4 2928out:
13cd2184
N
2929 if (fp)
2930 put_nfs4_file(fp);
37515177
N
2931 if (status == 0 && open->op_claim_type == NFS4_OPEN_CLAIM_PREVIOUS)
2932 nfs4_set_claim_prev(open);
1da177e4
LT
2933 /*
2934 * To finish the open response, we just need to set the rflags.
2935 */
2936 open->op_rflags = NFS4_OPEN_RESULT_LOCKTYPE_POSIX;
dad1c067 2937 if (!(open->op_openowner->oo_flags & NFS4_OO_CONFIRMED) &&
6668958f 2938 !nfsd4_has_session(&resp->cstate))
1da177e4
LT
2939 open->op_rflags |= NFS4_OPEN_RESULT_CONFIRM;
2940
2941 return status;
2942}
2943
d29b20cd
BF
2944void nfsd4_cleanup_open_state(struct nfsd4_open *open, __be32 status)
2945{
2946 if (open->op_openowner) {
2947 struct nfs4_openowner *oo = open->op_openowner;
2948
2949 if (!list_empty(&oo->oo_owner.so_stateids))
2950 list_del_init(&oo->oo_close_lru);
2951 if (oo->oo_flags & NFS4_OO_NEW) {
2952 if (status) {
2953 release_openowner(oo);
2954 open->op_openowner = NULL;
2955 } else
2956 oo->oo_flags &= ~NFS4_OO_NEW;
2957 }
2958 }
32513b40
BF
2959 if (open->op_file)
2960 nfsd4_free_file(open->op_file);
4cdc951b
BF
2961 if (open->op_stp)
2962 nfs4_free_stateid(open->op_stp);
d29b20cd
BF
2963}
2964
b37ad28b 2965__be32
b591480b
BF
2966nfsd4_renew(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
2967 clientid_t *clid)
1da177e4
LT
2968{
2969 struct nfs4_client *clp;
b37ad28b 2970 __be32 status;
1da177e4
LT
2971
2972 nfs4_lock_state();
2973 dprintk("process_renew(%08x/%08x): starting\n",
2974 clid->cl_boot, clid->cl_id);
2975 status = nfserr_stale_clientid;
2976 if (STALE_CLIENTID(clid))
2977 goto out;
2978 clp = find_confirmed_client(clid);
2979 status = nfserr_expired;
2980 if (clp == NULL) {
2981 /* We assume the client took too long to RENEW. */
2982 dprintk("nfsd4_renew: clientid not found!\n");
2983 goto out;
2984 }
1da177e4 2985 status = nfserr_cb_path_down;
ea1da636 2986 if (!list_empty(&clp->cl_delegations)
77a3569d 2987 && clp->cl_cb_state != NFSD4_CB_UP)
1da177e4
LT
2988 goto out;
2989 status = nfs_ok;
2990out:
2991 nfs4_unlock_state();
2992 return status;
2993}
2994
c47d832b 2995static struct lock_manager nfsd4_manager = {
af558e33
BF
2996};
2997
a76b4319 2998static void
af558e33 2999nfsd4_end_grace(void)
a76b4319
N
3000{
3001 dprintk("NFSD: end of grace period\n");
c7b9a459 3002 nfsd4_recdir_purge_old();
af558e33 3003 locks_end_grace(&nfsd4_manager);
e46b498c
BF
3004 /*
3005 * Now that every NFSv4 client has had the chance to recover and
3006 * to see the (possibly new, possibly shorter) lease time, we
3007 * can safely set the next grace time to the current lease time:
3008 */
3009 nfsd4_grace = nfsd4_lease;
a76b4319
N
3010}
3011
fd39ca9a 3012static time_t
1da177e4
LT
3013nfs4_laundromat(void)
3014{
3015 struct nfs4_client *clp;
fe0750e5 3016 struct nfs4_openowner *oo;
1da177e4
LT
3017 struct nfs4_delegation *dp;
3018 struct list_head *pos, *next, reaplist;
cf07d2ea
BF
3019 time_t cutoff = get_seconds() - nfsd4_lease;
3020 time_t t, clientid_val = nfsd4_lease;
3021 time_t u, test_val = nfsd4_lease;
1da177e4
LT
3022
3023 nfs4_lock_state();
3024
3025 dprintk("NFSD: laundromat service - starting\n");
af558e33
BF
3026 if (locks_in_grace())
3027 nfsd4_end_grace();
36acb66b
BH
3028 INIT_LIST_HEAD(&reaplist);
3029 spin_lock(&client_lock);
1da177e4
LT
3030 list_for_each_safe(pos, next, &client_lru) {
3031 clp = list_entry(pos, struct nfs4_client, cl_lru);
3032 if (time_after((unsigned long)clp->cl_time, (unsigned long)cutoff)) {
3033 t = clp->cl_time - cutoff;
3034 if (clientid_val > t)
3035 clientid_val = t;
3036 break;
3037 }
d7682988
BH
3038 if (atomic_read(&clp->cl_refcount)) {
3039 dprintk("NFSD: client in use (clientid %08x)\n",
3040 clp->cl_clientid.cl_id);
3041 continue;
3042 }
3043 unhash_client_locked(clp);
3044 list_add(&clp->cl_lru, &reaplist);
36acb66b
BH
3045 }
3046 spin_unlock(&client_lock);
3047 list_for_each_safe(pos, next, &reaplist) {
3048 clp = list_entry(pos, struct nfs4_client, cl_lru);
1da177e4
LT
3049 dprintk("NFSD: purging unused client (clientid %08x)\n",
3050 clp->cl_clientid.cl_id);
c7b9a459 3051 nfsd4_remove_clid_dir(clp);
1da177e4
LT
3052 expire_client(clp);
3053 }
1da177e4
LT
3054 spin_lock(&recall_lock);
3055 list_for_each_safe(pos, next, &del_recall_lru) {
3056 dp = list_entry (pos, struct nfs4_delegation, dl_recall_lru);
3057 if (time_after((unsigned long)dp->dl_time, (unsigned long)cutoff)) {
3058 u = dp->dl_time - cutoff;
3059 if (test_val > u)
3060 test_val = u;
3061 break;
3062 }
1da177e4
LT
3063 list_move(&dp->dl_recall_lru, &reaplist);
3064 }
3065 spin_unlock(&recall_lock);
3066 list_for_each_safe(pos, next, &reaplist) {
3067 dp = list_entry (pos, struct nfs4_delegation, dl_recall_lru);
3068 list_del_init(&dp->dl_recall_lru);
3069 unhash_delegation(dp);
3070 }
cf07d2ea 3071 test_val = nfsd4_lease;
1da177e4 3072 list_for_each_safe(pos, next, &close_lru) {
fe0750e5
BF
3073 oo = container_of(pos, struct nfs4_openowner, oo_close_lru);
3074 if (time_after((unsigned long)oo->oo_time, (unsigned long)cutoff)) {
3075 u = oo->oo_time - cutoff;
1da177e4
LT
3076 if (test_val > u)
3077 test_val = u;
3078 break;
3079 }
fe0750e5 3080 release_openowner(oo);
1da177e4
LT
3081 }
3082 if (clientid_val < NFSD_LAUNDROMAT_MINTIMEOUT)
3083 clientid_val = NFSD_LAUNDROMAT_MINTIMEOUT;
3084 nfs4_unlock_state();
3085 return clientid_val;
3086}
3087
a254b246
HH
3088static struct workqueue_struct *laundry_wq;
3089static void laundromat_main(struct work_struct *);
3090static DECLARE_DELAYED_WORK(laundromat_work, laundromat_main);
3091
3092static void
c4028958 3093laundromat_main(struct work_struct *not_used)
1da177e4
LT
3094{
3095 time_t t;
3096
3097 t = nfs4_laundromat();
3098 dprintk("NFSD: laundromat_main - sleeping for %ld seconds\n", t);
58da282b 3099 queue_delayed_work(laundry_wq, &laundromat_work, t*HZ);
1da177e4
LT
3100}
3101
f7a4d872 3102static inline __be32 nfs4_check_fh(struct svc_fh *fhp, struct nfs4_ol_stateid *stp)
1da177e4 3103{
f7a4d872
BF
3104 if (fhp->fh_dentry->d_inode != stp->st_file->fi_inode)
3105 return nfserr_bad_stateid;
3106 return nfs_ok;
1da177e4
LT
3107}
3108
3109static int
3110STALE_STATEID(stateid_t *stateid)
3111{
d3b313a4 3112 if (stateid->si_opaque.so_clid.cl_boot == boot_time)
e4e83ea4
BF
3113 return 0;
3114 dprintk("NFSD: stale stateid " STATEID_FMT "!\n",
8c10cbdb 3115 STATEID_VAL(stateid));
e4e83ea4 3116 return 1;
1da177e4
LT
3117}
3118
3119static inline int
3120access_permit_read(unsigned long access_bmap)
3121{
3122 return test_bit(NFS4_SHARE_ACCESS_READ, &access_bmap) ||
3123 test_bit(NFS4_SHARE_ACCESS_BOTH, &access_bmap) ||
3124 test_bit(NFS4_SHARE_ACCESS_WRITE, &access_bmap);
3125}
3126
3127static inline int
3128access_permit_write(unsigned long access_bmap)
3129{
3130 return test_bit(NFS4_SHARE_ACCESS_WRITE, &access_bmap) ||
3131 test_bit(NFS4_SHARE_ACCESS_BOTH, &access_bmap);
3132}
3133
3134static
dcef0413 3135__be32 nfs4_check_openmode(struct nfs4_ol_stateid *stp, int flags)
1da177e4 3136{
b37ad28b 3137 __be32 status = nfserr_openmode;
1da177e4 3138
02921914
BF
3139 /* For lock stateid's, we test the parent open, not the lock: */
3140 if (stp->st_openstp)
3141 stp = stp->st_openstp;
1da177e4
LT
3142 if ((flags & WR_STATE) && (!access_permit_write(stp->st_access_bmap)))
3143 goto out;
3144 if ((flags & RD_STATE) && (!access_permit_read(stp->st_access_bmap)))
3145 goto out;
3146 status = nfs_ok;
3147out:
3148 return status;
3149}
3150
b37ad28b 3151static inline __be32
1da177e4
LT
3152check_special_stateids(svc_fh *current_fh, stateid_t *stateid, int flags)
3153{
203a8c8e 3154 if (ONE_STATEID(stateid) && (flags & RD_STATE))
1da177e4 3155 return nfs_ok;
af558e33 3156 else if (locks_in_grace()) {
25985edc 3157 /* Answer in remaining cases depends on existence of
1da177e4
LT
3158 * conflicting state; so we must wait out the grace period. */
3159 return nfserr_grace;
3160 } else if (flags & WR_STATE)
3161 return nfs4_share_conflict(current_fh,
3162 NFS4_SHARE_DENY_WRITE);
3163 else /* (flags & RD_STATE) && ZERO_STATEID(stateid) */
3164 return nfs4_share_conflict(current_fh,
3165 NFS4_SHARE_DENY_READ);
3166}
3167
/*
 * During the grace period, READ/WRITE on recovered state is allowed only
 * for files that cannot provide mandatory locking.  Returns 1 when I/O on
 * @inode must be refused for that reason, 0 otherwise.
 */
static inline int
grace_disallows_io(struct inode *inode)
{
	if (!locks_in_grace())
		return 0;
	return mandatory_lock(inode) ? 1 : 0;
}
3177
81b82965
BF
3178/* Returns true iff a is later than b: */
3179static bool stateid_generation_after(stateid_t *a, stateid_t *b)
3180{
3181 return (s32)a->si_generation - (s32)b->si_generation > 0;
3182}
3183
28dde241 3184static int check_stateid_generation(stateid_t *in, stateid_t *ref, bool has_session)
0836f587 3185{
6668958f
AA
3186 /*
3187 * When sessions are used the stateid generation number is ignored
3188 * when it is zero.
3189 */
28dde241 3190 if (has_session && in->si_generation == 0)
81b82965
BF
3191 return nfs_ok;
3192
3193 if (in->si_generation == ref->si_generation)
3194 return nfs_ok;
6668958f 3195
0836f587 3196 /* If the client sends us a stateid from the future, it's buggy: */
81b82965 3197 if (stateid_generation_after(in, ref))
0836f587
BF
3198 return nfserr_bad_stateid;
3199 /*
81b82965
BF
3200 * However, we could see a stateid from the past, even from a
3201 * non-buggy client. For example, if the client sends a lock
3202 * while some IO is outstanding, the lock may bump si_generation
3203 * while the IO is still in flight. The client could avoid that
3204 * situation by waiting for responses on all the IO requests,
3205 * but better performance may result in retrying IO that
3206 * receives an old_stateid error if requests are rarely
3207 * reordered in flight:
0836f587 3208 */
81b82965 3209 return nfserr_old_stateid;
0836f587
BF
3210}
3211
38c2f4b1 3212__be32 nfs4_validate_stateid(struct nfs4_client *cl, stateid_t *stateid)
17456804 3213{
97b7e3b6
BF
3214 struct nfs4_stid *s;
3215 struct nfs4_ol_stateid *ols;
3216 __be32 status;
17456804
BS
3217
3218 if (STALE_STATEID(stateid))
97b7e3b6 3219 return nfserr_stale_stateid;
17456804 3220
38c2f4b1 3221 s = find_stateid(cl, stateid);
97b7e3b6
BF
3222 if (!s)
3223 return nfserr_stale_stateid;
36279ac1 3224 status = check_stateid_generation(stateid, &s->sc_stateid, 1);
17456804 3225 if (status)
97b7e3b6
BF
3226 return status;
3227 if (!(s->sc_type & (NFS4_OPEN_STID | NFS4_LOCK_STID)))
3228 return nfs_ok;
3229 ols = openlockstateid(s);
3230 if (ols->st_stateowner->so_is_open_owner
dad1c067 3231 && !(openowner(ols->st_stateowner)->oo_flags & NFS4_OO_CONFIRMED))
97b7e3b6
BF
3232 return nfserr_bad_stateid;
3233 return nfs_ok;
17456804
BS
3234}
3235
38c2f4b1
BF
3236static __be32 nfsd4_lookup_stateid(stateid_t *stateid, unsigned char typemask, struct nfs4_stid **s)
3237{
3238 struct nfs4_client *cl;
3239
3240 if (ZERO_STATEID(stateid) || ONE_STATEID(stateid))
3241 return nfserr_bad_stateid;
3242 if (STALE_STATEID(stateid))
3243 return nfserr_stale_stateid;
3244 cl = find_confirmed_client(&stateid->si_opaque.so_clid);
3245 if (!cl)
3246 return nfserr_expired;
3247 *s = find_stateid_by_type(cl, stateid, typemask);
3248 if (!*s)
3249 return nfserr_bad_stateid;
3250 return nfs_ok;
3251
3252}
3253
1da177e4
LT
3254/*
3255* Checks for stateid operations
3256*/
b37ad28b 3257__be32
dd453dfd
BH
3258nfs4_preprocess_stateid_op(struct nfsd4_compound_state *cstate,
3259 stateid_t *stateid, int flags, struct file **filpp)
1da177e4 3260{
69064a27 3261 struct nfs4_stid *s;
dcef0413 3262 struct nfs4_ol_stateid *stp = NULL;
1da177e4 3263 struct nfs4_delegation *dp = NULL;
dd453dfd 3264 struct svc_fh *current_fh = &cstate->current_fh;
1da177e4 3265 struct inode *ino = current_fh->fh_dentry->d_inode;
b37ad28b 3266 __be32 status;
1da177e4 3267
1da177e4
LT
3268 if (filpp)
3269 *filpp = NULL;
3270
18f82731 3271 if (grace_disallows_io(ino))
1da177e4
LT
3272 return nfserr_grace;
3273
3274 if (ZERO_STATEID(stateid) || ONE_STATEID(stateid))
3275 return check_special_stateids(current_fh, stateid, flags);
3276
38c2f4b1
BF
3277 status = nfsd4_lookup_stateid(stateid, NFS4_DELEG_STID|NFS4_OPEN_STID|NFS4_LOCK_STID, &s);
3278 if (status)
3279 return status;
69064a27
BF
3280 status = check_stateid_generation(stateid, &s->sc_stateid, nfsd4_has_session(cstate));
3281 if (status)
3282 goto out;
f7a4d872
BF
3283 switch (s->sc_type) {
3284 case NFS4_DELEG_STID:
69064a27 3285 dp = delegstateid(s);
dc9bf700
BF
3286 status = nfs4_check_delegmode(dp, flags);
3287 if (status)
3288 goto out;
43b0178e 3289 if (filpp) {
acfdf5c3 3290 *filpp = dp->dl_file->fi_deleg_file;
43b0178e
DC
3291 BUG_ON(!*filpp);
3292 }
f7a4d872
BF
3293 break;
3294 case NFS4_OPEN_STID:
3295 case NFS4_LOCK_STID:
69064a27 3296 stp = openlockstateid(s);
f7a4d872
BF
3297 status = nfs4_check_fh(current_fh, stp);
3298 if (status)
1da177e4 3299 goto out;
fe0750e5 3300 if (stp->st_stateowner->so_is_open_owner
dad1c067 3301 && !(openowner(stp->st_stateowner)->oo_flags & NFS4_OO_CONFIRMED))
1da177e4 3302 goto out;
a4455be0
BF
3303 status = nfs4_check_openmode(stp, flags);
3304 if (status)
1da177e4 3305 goto out;
f9d7562f
BF
3306 if (filpp) {
3307 if (flags & RD_STATE)
3308 *filpp = find_readable_file(stp->st_file);
3309 else
3310 *filpp = find_writeable_file(stp->st_file);
f9d7562f 3311 }
f7a4d872
BF
3312 break;
3313 default:
3314 return nfserr_bad_stateid;
1da177e4
LT
3315 }
3316 status = nfs_ok;
3317out:
3318 return status;
3319}
3320
e1ca12df 3321static __be32
dcef0413 3322nfsd4_free_lock_stateid(struct nfs4_ol_stateid *stp)
e1ca12df 3323{
fe0750e5 3324 if (check_for_locks(stp->st_file, lockowner(stp->st_stateowner)))
e1ca12df
BS
3325 return nfserr_locks_held;
3326 release_lock_stateid(stp);
3327 return nfs_ok;
3328}
3329
17456804
BS
3330/*
3331 * Test if the stateid is valid
3332 */
3333__be32
3334nfsd4_test_stateid(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
3335 struct nfsd4_test_stateid *test_stateid)
3336{
36279ac1 3337 /* real work is done during encoding */
17456804
BS
3338 return nfs_ok;
3339}
3340
e1ca12df
BS
3341__be32
3342nfsd4_free_stateid(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
3343 struct nfsd4_free_stateid *free_stateid)
3344{
3345 stateid_t *stateid = &free_stateid->fr_stateid;
2da1cec7 3346 struct nfs4_stid *s;
38c2f4b1 3347 struct nfs4_client *cl = cstate->session->se_client;
2da1cec7 3348 __be32 ret = nfserr_bad_stateid;
e1ca12df
BS
3349
3350 nfs4_lock_state();
38c2f4b1 3351 s = find_stateid(cl, stateid);
2da1cec7 3352 if (!s)
81b82965 3353 goto out;
2da1cec7
BF
3354 switch (s->sc_type) {
3355 case NFS4_DELEG_STID:
e1ca12df
BS
3356 ret = nfserr_locks_held;
3357 goto out;
2da1cec7
BF
3358 case NFS4_OPEN_STID:
3359 case NFS4_LOCK_STID:
3360 ret = check_stateid_generation(stateid, &s->sc_stateid, 1);
3361 if (ret)
3362 goto out;
3363 if (s->sc_type == NFS4_LOCK_STID)
3364 ret = nfsd4_free_lock_stateid(openlockstateid(s));
3365 else
3366 ret = nfserr_locks_held;
f7a4d872
BF
3367 break;
3368 default:
3369 ret = nfserr_bad_stateid;
e1ca12df 3370 }
e1ca12df
BS
3371out:
3372 nfs4_unlock_state();
3373 return ret;
3374}
3375
4c4cd222
N
3376static inline int
3377setlkflg (int type)
3378{
3379 return (type == NFS4_READW_LT || type == NFS4_READ_LT) ?
3380 RD_STATE : WR_STATE;
3381}
1da177e4 3382
dcef0413 3383static __be32 nfs4_seqid_op_checks(struct nfsd4_compound_state *cstate, stateid_t *stateid, u32 seqid, struct nfs4_ol_stateid *stp)
c0a5d93e
BF
3384{
3385 struct svc_fh *current_fh = &cstate->current_fh;
3386 struct nfs4_stateowner *sop = stp->st_stateowner;
3387 __be32 status;
3388
c0a5d93e
BF
3389 status = nfsd4_check_seqid(cstate, sop, seqid);
3390 if (status)
3391 return status;
f7a4d872
BF
3392 if (stp->st_stid.sc_type == NFS4_CLOSED_STID)
3393 /*
3394 * "Closed" stateid's exist *only* to return
3395 * nfserr_replay_me from the previous step.
3396 */
3397 return nfserr_bad_stateid;
3398 status = check_stateid_generation(stateid, &stp->st_stid.sc_stateid, nfsd4_has_session(cstate));
3399 if (status)
3400 return status;
3401 return nfs4_check_fh(current_fh, stp);
c0a5d93e
BF
3402}
3403
1da177e4
LT
3404/*
3405 * Checks for sequence id mutating operations.
3406 */
b37ad28b 3407static __be32
dd453dfd 3408nfs4_preprocess_seqid_op(struct nfsd4_compound_state *cstate, u32 seqid,
2288d0e3 3409 stateid_t *stateid, char typemask,
dcef0413 3410 struct nfs4_ol_stateid **stpp)
1da177e4 3411{
0836f587 3412 __be32 status;
38c2f4b1 3413 struct nfs4_stid *s;
1da177e4 3414
8c10cbdb
BH
3415 dprintk("NFSD: %s: seqid=%d stateid = " STATEID_FMT "\n", __func__,
3416 seqid, STATEID_VAL(stateid));
3a4f98bb 3417
1da177e4 3418 *stpp = NULL;
38c2f4b1 3419 status = nfsd4_lookup_stateid(stateid, typemask, &s);
c0a5d93e
BF
3420 if (status)
3421 return status;
38c2f4b1 3422 *stpp = openlockstateid(s);
c0a5d93e 3423 cstate->replay_owner = (*stpp)->st_stateowner;
1da177e4 3424
c0a5d93e
BF
3425 return nfs4_seqid_op_checks(cstate, stateid, seqid, *stpp);
3426}
39325bd0 3427
dcef0413 3428static __be32 nfs4_preprocess_confirmed_seqid_op(struct nfsd4_compound_state *cstate, u32 seqid, stateid_t *stateid, struct nfs4_ol_stateid **stpp)
c0a5d93e
BF
3429{
3430 __be32 status;
3431 struct nfs4_openowner *oo;
1da177e4 3432
c0a5d93e 3433 status = nfs4_preprocess_seqid_op(cstate, seqid, stateid,
2288d0e3 3434 NFS4_OPEN_STID, stpp);
7a8711c9
BF
3435 if (status)
3436 return status;
c0a5d93e 3437 oo = openowner((*stpp)->st_stateowner);
dad1c067 3438 if (!(oo->oo_flags & NFS4_OO_CONFIRMED))
3a4f98bb 3439 return nfserr_bad_stateid;
3a4f98bb 3440 return nfs_ok;
1da177e4
LT
3441}
3442
b37ad28b 3443__be32
ca364317 3444nfsd4_open_confirm(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
a4f1706a 3445 struct nfsd4_open_confirm *oc)
1da177e4 3446{
b37ad28b 3447 __be32 status;
fe0750e5 3448 struct nfs4_openowner *oo;
dcef0413 3449 struct nfs4_ol_stateid *stp;
1da177e4
LT
3450
3451 dprintk("NFSD: nfsd4_open_confirm on file %.*s\n",
ca364317
BF
3452 (int)cstate->current_fh.fh_dentry->d_name.len,
3453 cstate->current_fh.fh_dentry->d_name.name);
1da177e4 3454
ca364317 3455 status = fh_verify(rqstp, &cstate->current_fh, S_IFREG, 0);
a8cddc5d
BF
3456 if (status)
3457 return status;
1da177e4
LT
3458
3459 nfs4_lock_state();
3460
9072d5c6 3461 status = nfs4_preprocess_seqid_op(cstate,
ca364317 3462 oc->oc_seqid, &oc->oc_req_stateid,
2288d0e3 3463 NFS4_OPEN_STID, &stp);
9072d5c6 3464 if (status)
68b66e82 3465 goto out;
fe0750e5 3466 oo = openowner(stp->st_stateowner);
68b66e82 3467 status = nfserr_bad_stateid;
dad1c067 3468 if (oo->oo_flags & NFS4_OO_CONFIRMED)
68b66e82 3469 goto out;
dad1c067 3470 oo->oo_flags |= NFS4_OO_CONFIRMED;
dcef0413
BF
3471 update_stateid(&stp->st_stid.sc_stateid);
3472 memcpy(&oc->oc_resp_stateid, &stp->st_stid.sc_stateid, sizeof(stateid_t));
8c10cbdb 3473 dprintk("NFSD: %s: success, seqid=%d stateid=" STATEID_FMT "\n",
dcef0413 3474 __func__, oc->oc_seqid, STATEID_VAL(&stp->st_stid.sc_stateid));
c7b9a459 3475
fe0750e5 3476 nfsd4_create_clid_dir(oo->oo_owner.so_client);
68b66e82 3477 status = nfs_ok;
1da177e4 3478out:
5ec094c1
BF
3479 if (!cstate->replay_owner)
3480 nfs4_unlock_state();
1da177e4
LT
3481 return status;
3482}
3483
6409a5a6 3484static inline void nfs4_stateid_downgrade_bit(struct nfs4_ol_stateid *stp, u32 access)
1da177e4 3485{
6409a5a6
BF
3486 if (!test_bit(access, &stp->st_access_bmap))
3487 return;
3488 nfs4_file_put_access(stp->st_file, nfs4_access_to_omode(access));
3489 __clear_bit(access, &stp->st_access_bmap);
3490}
f197c271 3491
6409a5a6
BF
3492static inline void nfs4_stateid_downgrade(struct nfs4_ol_stateid *stp, u32 to_access)
3493{
3494 switch (to_access) {
3495 case NFS4_SHARE_ACCESS_READ:
3496 nfs4_stateid_downgrade_bit(stp, NFS4_SHARE_ACCESS_WRITE);
3497 nfs4_stateid_downgrade_bit(stp, NFS4_SHARE_ACCESS_BOTH);
3498 break;
3499 case NFS4_SHARE_ACCESS_WRITE:
3500 nfs4_stateid_downgrade_bit(stp, NFS4_SHARE_ACCESS_READ);
3501 nfs4_stateid_downgrade_bit(stp, NFS4_SHARE_ACCESS_BOTH);
3502 break;
3503 case NFS4_SHARE_ACCESS_BOTH:
3504 break;
3505 default:
3506 BUG();
1da177e4
LT
3507 }
3508}
3509
/*
 * Clear from @bmap every bit number in 0..3 that is not a subset of
 * @deny (i.e. that has a bit set which @deny lacks).
 */
static void
reset_union_bmap_deny(unsigned long deny, unsigned long *bmap)
{
	int mode;

	for (mode = 0; mode < 4; mode++) {
		if ((mode & deny) == mode)
			continue;
		__clear_bit(mode, bmap);
	}
}
3519
b37ad28b 3520__be32
ca364317
BF
3521nfsd4_open_downgrade(struct svc_rqst *rqstp,
3522 struct nfsd4_compound_state *cstate,
a4f1706a 3523 struct nfsd4_open_downgrade *od)
1da177e4 3524{
b37ad28b 3525 __be32 status;
dcef0413 3526 struct nfs4_ol_stateid *stp;
1da177e4
LT
3527
3528 dprintk("NFSD: nfsd4_open_downgrade on file %.*s\n",
ca364317
BF
3529 (int)cstate->current_fh.fh_dentry->d_name.len,
3530 cstate->current_fh.fh_dentry->d_name.name);
1da177e4 3531
c30e92df
BF
3532 /* We don't yet support WANT bits: */
3533 od->od_share_access &= NFS4_SHARE_ACCESS_MASK;
1da177e4
LT
3534
3535 nfs4_lock_state();
c0a5d93e
BF
3536 status = nfs4_preprocess_confirmed_seqid_op(cstate, od->od_seqid,
3537 &od->od_stateid, &stp);
9072d5c6 3538 if (status)
1da177e4 3539 goto out;
1da177e4
LT
3540 status = nfserr_inval;
3541 if (!test_bit(od->od_share_access, &stp->st_access_bmap)) {
3542 dprintk("NFSD:access not a subset current bitmap: 0x%lx, input access=%08x\n",
3543 stp->st_access_bmap, od->od_share_access);
3544 goto out;
3545 }
3546 if (!test_bit(od->od_share_deny, &stp->st_deny_bmap)) {
3547 dprintk("NFSD:deny not a subset current bitmap: 0x%lx, input deny=%08x\n",
3548 stp->st_deny_bmap, od->od_share_deny);
3549 goto out;
3550 }
6409a5a6 3551 nfs4_stateid_downgrade(stp, od->od_share_access);
1da177e4 3552
1da177e4
LT
3553 reset_union_bmap_deny(od->od_share_deny, &stp->st_deny_bmap);
3554
dcef0413
BF
3555 update_stateid(&stp->st_stid.sc_stateid);
3556 memcpy(&od->od_stateid, &stp->st_stid.sc_stateid, sizeof(stateid_t));
1da177e4
LT
3557 status = nfs_ok;
3558out:
5ec094c1
BF
3559 if (!cstate->replay_owner)
3560 nfs4_unlock_state();
1da177e4
LT
3561 return status;
3562}
3563
38c387b5
BF
3564void nfsd4_purge_closed_stateid(struct nfs4_stateowner *so)
3565{
3566 struct nfs4_openowner *oo;
3567 struct nfs4_ol_stateid *s;
3568
3569 if (!so->so_is_open_owner)
3570 return;
3571 oo = openowner(so);
3572 s = oo->oo_last_closed_stid;
3573 if (!s)
3574 return;
3575 if (!(oo->oo_flags & NFS4_OO_PURGE_CLOSE)) {
3576 /* Release the last_closed_stid on the next seqid bump: */
3577 oo->oo_flags |= NFS4_OO_PURGE_CLOSE;
3578 return;
3579 }
3580 oo->oo_flags &= ~NFS4_OO_PURGE_CLOSE;
f7a4d872
BF
3581 release_last_closed_stateid(oo);
3582}
3583
3584static void nfsd4_close_open_stateid(struct nfs4_ol_stateid *s)
3585{
3586 unhash_open_stateid(s);
3587 s->st_stid.sc_type = NFS4_CLOSED_STID;
38c387b5
BF
3588}
3589
1da177e4
LT
3590/*
3591 * nfs4_unlock_state() called after encode
3592 */
b37ad28b 3593__be32
ca364317 3594nfsd4_close(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
a4f1706a 3595 struct nfsd4_close *close)
1da177e4 3596{
b37ad28b 3597 __be32 status;
fe0750e5 3598 struct nfs4_openowner *oo;
dcef0413 3599 struct nfs4_ol_stateid *stp;
1da177e4
LT
3600
3601 dprintk("NFSD: nfsd4_close on file %.*s\n",
ca364317
BF
3602 (int)cstate->current_fh.fh_dentry->d_name.len,
3603 cstate->current_fh.fh_dentry->d_name.name);
1da177e4
LT
3604
3605 nfs4_lock_state();
f7a4d872
BF
3606 status = nfs4_preprocess_seqid_op(cstate, close->cl_seqid,
3607 &close->cl_stateid,
3608 NFS4_OPEN_STID|NFS4_CLOSED_STID,
3609 &stp);
9072d5c6 3610 if (status)
1da177e4 3611 goto out;
fe0750e5 3612 oo = openowner(stp->st_stateowner);
1da177e4 3613 status = nfs_ok;
dcef0413
BF
3614 update_stateid(&stp->st_stid.sc_stateid);
3615 memcpy(&close->cl_stateid, &stp->st_stid.sc_stateid, sizeof(stateid_t));
1da177e4 3616
f7a4d872 3617 nfsd4_close_open_stateid(stp);
38c387b5 3618 oo->oo_last_closed_stid = stp;
04ef5954
BF
3619
3620 /* place unused nfs4_stateowners on so_close_lru list to be
3621 * released by the laundromat service after the lease period
3622 * to enable us to handle CLOSE replay
3623 */
fe0750e5
BF
3624 if (list_empty(&oo->oo_owner.so_stateids))
3625 move_to_close_lru(oo);
1da177e4 3626out:
5ec094c1
BF
3627 if (!cstate->replay_owner)
3628 nfs4_unlock_state();
1da177e4
LT
3629 return status;
3630}
3631
b37ad28b 3632__be32
ca364317
BF
3633nfsd4_delegreturn(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
3634 struct nfsd4_delegreturn *dr)
1da177e4 3635{
203a8c8e
BF
3636 struct nfs4_delegation *dp;
3637 stateid_t *stateid = &dr->dr_stateid;
38c2f4b1 3638 struct nfs4_stid *s;
203a8c8e 3639 struct inode *inode;
b37ad28b 3640 __be32 status;
1da177e4 3641
ca364317 3642 if ((status = fh_verify(rqstp, &cstate->current_fh, S_IFREG, 0)))
203a8c8e
BF
3643 return status;
3644 inode = cstate->current_fh.fh_dentry->d_inode;
1da177e4
LT
3645
3646 nfs4_lock_state();
38c2f4b1
BF
3647 status = nfsd4_lookup_stateid(stateid, NFS4_DELEG_STID, &s);
3648 if (status)
203a8c8e 3649 goto out;
38c2f4b1 3650 dp = delegstateid(s);
d5477a8d 3651 status = check_stateid_generation(stateid, &dp->dl_stid.sc_stateid, nfsd4_has_session(cstate));
203a8c8e
BF
3652 if (status)
3653 goto out;
203a8c8e
BF
3654
3655 unhash_delegation(dp);
1da177e4 3656out:
203a8c8e
BF
3657 nfs4_unlock_state();
3658
1da177e4
LT
3659 return status;
3660}
3661
3662
/*
 * Lock owner state (byte-range locks)
 */

/* True when the range [start, start + len) would run past 2^64 - 1. */
#define LOFF_OVERFLOW(start, len)      ((u64)(len) > ~(u64)(start))

/* Geometry of the lock-owner string hash table. */
#define LOCK_HASH_BITS              8
#define LOCK_HASH_SIZE             (1 << LOCK_HASH_BITS)
#define LOCK_HASH_MASK             (LOCK_HASH_SIZE - 1)
3670
87df4de8
BH
3671static inline u64
3672end_offset(u64 start, u64 len)
3673{
3674 u64 end;
3675
3676 end = start + len;
3677 return end >= start ? end: NFS4_MAX_UINT64;
3678}
3679
3680/* last octet in a range */
3681static inline u64
3682last_byte_offset(u64 start, u64 len)
3683{
3684 u64 end;
3685
3686 BUG_ON(!len);
3687 end = start + len;
3688 return end > start ? end - 1: NFS4_MAX_UINT64;
3689}
3690
1da177e4
LT
3691static inline unsigned int
3692lock_ownerstr_hashval(struct inode *inode, u32 cl_id,
3693 struct xdr_netobj *ownername)
3694{
3695 return (file_hashval(inode) + cl_id
3696 + opaque_hashval(ownername->data, ownername->len))
3697 & LOCK_HASH_MASK;
3698}
3699
1da177e4 3700static struct list_head lock_ownerstr_hashtbl[LOCK_HASH_SIZE];
1da177e4 3701
1da177e4
LT
3702/*
3703 * TODO: Linux file offsets are _signed_ 64-bit quantities, which means that
3704 * we can't properly handle lock requests that go beyond the (2^63 - 1)-th
3705 * byte, because of sign extension problems. Since NFSv4 calls for 64-bit
3706 * locking, this prevents us from being completely protocol-compliant. The
3707 * real solution to this problem is to start using unsigned file offsets in
3708 * the VFS, but this is a very deep change!
3709 */
3710static inline void
3711nfs4_transform_lock_offset(struct file_lock *lock)
3712{
3713 if (lock->fl_start < 0)
3714 lock->fl_start = OFFSET_MAX;
3715 if (lock->fl_end < 0)
3716 lock->fl_end = OFFSET_MAX;
3717}
3718
d5b9026a
N
3719/* Hack!: For now, we're defining this just so we can use a pointer to it
3720 * as a unique cookie to identify our (NFSv4's) posix locks. */
7b021967 3721static const struct lock_manager_operations nfsd_posix_mng_ops = {
d5b9026a 3722};
1da177e4
LT
3723
3724static inline void
3725nfs4_set_lock_denied(struct file_lock *fl, struct nfsd4_lock_denied *deny)
3726{
fe0750e5 3727 struct nfs4_lockowner *lo;
1da177e4 3728
d5b9026a 3729 if (fl->fl_lmops == &nfsd_posix_mng_ops) {
fe0750e5
BF
3730 lo = (struct nfs4_lockowner *) fl->fl_owner;
3731 deny->ld_owner.data = kmemdup(lo->lo_owner.so_owner.data,
3732 lo->lo_owner.so_owner.len, GFP_KERNEL);
7c13f344
BF
3733 if (!deny->ld_owner.data)
3734 /* We just don't care that much */
3735 goto nevermind;
fe0750e5
BF
3736 deny->ld_owner.len = lo->lo_owner.so_owner.len;
3737 deny->ld_clientid = lo->lo_owner.so_client->cl_clientid;
d5b9026a 3738 } else {
7c13f344
BF
3739nevermind:
3740 deny->ld_owner.len = 0;
3741 deny->ld_owner.data = NULL;
d5b9026a
N
3742 deny->ld_clientid.cl_boot = 0;
3743 deny->ld_clientid.cl_id = 0;
1da177e4
LT
3744 }
3745 deny->ld_start = fl->fl_start;
87df4de8
BH
3746 deny->ld_length = NFS4_MAX_UINT64;
3747 if (fl->fl_end != NFS4_MAX_UINT64)
1da177e4
LT
3748 deny->ld_length = fl->fl_end - fl->fl_start + 1;
3749 deny->ld_type = NFS4_READ_LT;
3750 if (fl->fl_type != F_RDLCK)
3751 deny->ld_type = NFS4_WRITE_LT;
3752}
3753
fe0750e5
BF
3754static struct nfs4_lockowner *
3755find_lockowner_str(struct inode *inode, clientid_t *clid,
1da177e4
LT
3756 struct xdr_netobj *owner)
3757{
3758 unsigned int hashval = lock_ownerstr_hashval(inode, clid->cl_id, owner);
3759 struct nfs4_stateowner *op;
3760
3761 list_for_each_entry(op, &lock_ownerstr_hashtbl[hashval], so_strhash) {
599e0a22 3762 if (same_owner_str(op, owner, clid))
fe0750e5 3763 return lockowner(op);
1da177e4
LT
3764 }
3765 return NULL;
3766}
3767
dcef0413 3768static void hash_lockowner(struct nfs4_lockowner *lo, unsigned int strhashval, struct nfs4_client *clp, struct nfs4_ol_stateid *open_stp)
ff194bd9 3769{
fe0750e5
BF
3770 list_add(&lo->lo_owner.so_strhash, &lock_ownerstr_hashtbl[strhashval]);
3771 list_add(&lo->lo_perstateid, &open_stp->st_lockowners);
ff194bd9
BF
3772}
3773
1da177e4
LT
3774/*
3775 * Alloc a lock owner structure.
3776 * Called in nfsd4_lock - therefore, OPEN and OPEN_CONFIRM (if needed) has
25985edc 3777 * occurred.
1da177e4
LT
3778 *
3779 * strhashval = lock_ownerstr_hashval
1da177e4
LT
3780 */
3781
fe0750e5 3782static struct nfs4_lockowner *
dcef0413 3783alloc_init_lock_stateowner(unsigned int strhashval, struct nfs4_client *clp, struct nfs4_ol_stateid *open_stp, struct nfsd4_lock *lock) {
fe0750e5 3784 struct nfs4_lockowner *lo;
1da177e4 3785
fe0750e5
BF
3786 lo = alloc_stateowner(lockowner_slab, &lock->lk_new_owner, clp);
3787 if (!lo)
1da177e4 3788 return NULL;
fe0750e5
BF
3789 INIT_LIST_HEAD(&lo->lo_owner.so_stateids);
3790 lo->lo_owner.so_is_open_owner = 0;
b59e3c0e
NB
3791 /* It is the openowner seqid that will be incremented in encode in the
3792 * case of new lockowners; so increment the lock seqid manually: */
fe0750e5
BF
3793 lo->lo_owner.so_seqid = lock->lk_new_lock_seqid + 1;
3794 hash_lockowner(lo, strhashval, clp, open_stp);
3795 return lo;
1da177e4
LT
3796}
3797
dcef0413
BF
3798static struct nfs4_ol_stateid *
3799alloc_init_lock_stateid(struct nfs4_lockowner *lo, struct nfs4_file *fp, struct nfs4_ol_stateid *open_stp)
1da177e4 3800{
dcef0413 3801 struct nfs4_ol_stateid *stp;
d3b313a4 3802 struct nfs4_client *clp = lo->lo_owner.so_client;
1da177e4 3803
996e0938 3804 stp = nfs4_alloc_stateid(clp);
5ac049ac 3805 if (stp == NULL)
6136d2b4 3806 return NULL;
996e0938 3807 init_stid(&stp->st_stid, clp, NFS4_LOCK_STID);
8beefa24 3808 list_add(&stp->st_perfile, &fp->fi_stateids);
fe0750e5
BF
3809 list_add(&stp->st_perstateowner, &lo->lo_owner.so_stateids);
3810 stp->st_stateowner = &lo->lo_owner;
13cd2184 3811 get_nfs4_file(fp);
1da177e4 3812 stp->st_file = fp;
0997b173 3813 stp->st_access_bmap = 0;
1da177e4 3814 stp->st_deny_bmap = open_stp->st_deny_bmap;
4c4cd222 3815 stp->st_openstp = open_stp;
1da177e4
LT
3816 return stp;
3817}
3818
fd39ca9a 3819static int
1da177e4
LT
3820check_lock_length(u64 offset, u64 length)
3821{
87df4de8 3822 return ((length == 0) || ((length != NFS4_MAX_UINT64) &&
1da177e4
LT
3823 LOFF_OVERFLOW(offset, length)));
3824}
3825
dcef0413 3826static void get_lock_access(struct nfs4_ol_stateid *lock_stp, u32 access)
0997b173
BF
3827{
3828 struct nfs4_file *fp = lock_stp->st_file;
3829 int oflag = nfs4_access_to_omode(access);
3830
3831 if (test_bit(access, &lock_stp->st_access_bmap))
3832 return;
3833 nfs4_file_get_access(fp, oflag);
3834 __set_bit(access, &lock_stp->st_access_bmap);
3835}
3836
1da177e4
LT
3837/*
3838 * LOCK operation
3839 */
b37ad28b 3840__be32
ca364317 3841nfsd4_lock(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
a4f1706a 3842 struct nfsd4_lock *lock)
1da177e4 3843{
fe0750e5
BF
3844 struct nfs4_openowner *open_sop = NULL;
3845 struct nfs4_lockowner *lock_sop = NULL;
dcef0413 3846 struct nfs4_ol_stateid *lock_stp;
7d947842
BF
3847 struct nfs4_file *fp;
3848 struct file *filp = NULL;
1da177e4 3849 struct file_lock file_lock;
8dc7c311 3850 struct file_lock conflock;
b37ad28b 3851 __be32 status = 0;
1da177e4 3852 unsigned int strhashval;
b34f27aa 3853 int lkflg;
b8dd7b9a 3854 int err;
1da177e4
LT
3855
3856 dprintk("NFSD: nfsd4_lock: start=%Ld length=%Ld\n",
3857 (long long) lock->lk_offset,
3858 (long long) lock->lk_length);
3859
1da177e4
LT
3860 if (check_lock_length(lock->lk_offset, lock->lk_length))
3861 return nfserr_inval;
3862
ca364317 3863 if ((status = fh_verify(rqstp, &cstate->current_fh,
8837abca 3864 S_IFREG, NFSD_MAY_LOCK))) {
a6f6ef2f
AA
3865 dprintk("NFSD: nfsd4_lock: permission denied!\n");
3866 return status;
3867 }
3868
1da177e4
LT
3869 nfs4_lock_state();
3870
3871 if (lock->lk_is_new) {
893f8770
N
3872 /*
3873 * Client indicates that this is a new lockowner.
3874 * Use open owner and open stateid to create lock owner and
3875 * lock stateid.
3876 */
dcef0413 3877 struct nfs4_ol_stateid *open_stp = NULL;
1da177e4
LT
3878
3879 status = nfserr_stale_clientid;
60adfc50
AA
3880 if (!nfsd4_has_session(cstate) &&
3881 STALE_CLIENTID(&lock->lk_new_clientid))
1da177e4 3882 goto out;
1da177e4 3883
1da177e4 3884 /* validate and update open stateid and open seqid */
c0a5d93e 3885 status = nfs4_preprocess_confirmed_seqid_op(cstate,
1da177e4
LT
3886 lock->lk_new_open_seqid,
3887 &lock->lk_new_open_stateid,
c0a5d93e 3888 &open_stp);
37515177 3889 if (status)
1da177e4 3890 goto out;
fe0750e5 3891 open_sop = openowner(open_stp->st_stateowner);
b34f27aa 3892 status = nfserr_bad_stateid;
b34f27aa 3893 if (!nfsd4_has_session(cstate) &&
fe0750e5 3894 !same_clid(&open_sop->oo_owner.so_client->cl_clientid,
b34f27aa
BF
3895 &lock->v.new.clientid))
3896 goto out;
1da177e4
LT
3897 /* create lockowner and lock stateid */
3898 fp = open_stp->st_file;
fe0750e5
BF
3899 strhashval = lock_ownerstr_hashval(fp->fi_inode,
3900 open_sop->oo_owner.so_client->cl_clientid.cl_id,
1da177e4 3901 &lock->v.new.owner);
3e9e3dbe
N
3902 /* XXX: Do we need to check for duplicate stateowners on
3903 * the same file, or should they just be allowed (and
3904 * create new stateids)? */
3e772463 3905 status = nfserr_jukebox;
b59e3c0e 3906 lock_sop = alloc_init_lock_stateowner(strhashval,
fe0750e5 3907 open_sop->oo_owner.so_client, open_stp, lock);
b59e3c0e 3908 if (lock_sop == NULL)
1da177e4 3909 goto out;
b59e3c0e 3910 lock_stp = alloc_init_lock_stateid(lock_sop, fp, open_stp);
8a280510 3911 if (lock_stp == NULL)
1da177e4 3912 goto out;
1da177e4
LT
3913 } else {
3914 /* lock (lock owner + lock stateid) already exists */
dd453dfd 3915 status = nfs4_preprocess_seqid_op(cstate,
fe0750e5
BF
3916 lock->lk_old_lock_seqid,
3917 &lock->lk_old_lock_stateid,
2288d0e3 3918 NFS4_LOCK_STID, &lock_stp);
1da177e4
LT
3919 if (status)
3920 goto out;
fe0750e5 3921 lock_sop = lockowner(lock_stp->st_stateowner);
7d947842 3922 fp = lock_stp->st_file;
1da177e4 3923 }
9072d5c6 3924 /* lock_sop and lock_stp have been created or found */
1da177e4 3925
b34f27aa
BF
3926 lkflg = setlkflg(lock->lk_type);
3927 status = nfs4_check_openmode(lock_stp, lkflg);
3928 if (status)
3929 goto out;
3930
0dd395dc 3931 status = nfserr_grace;
af558e33 3932 if (locks_in_grace() && !lock->lk_reclaim)
0dd395dc
N
3933 goto out;
3934 status = nfserr_no_grace;
af558e33 3935 if (!locks_in_grace() && lock->lk_reclaim)
0dd395dc
N
3936 goto out;
3937
1da177e4
LT
3938 locks_init_lock(&file_lock);
3939 switch (lock->lk_type) {
3940 case NFS4_READ_LT:
3941 case NFS4_READW_LT:
0997b173
BF
3942 filp = find_readable_file(lock_stp->st_file);
3943 if (filp)
3944 get_lock_access(lock_stp, NFS4_SHARE_ACCESS_READ);
1da177e4 3945 file_lock.fl_type = F_RDLCK;
529d7b2a 3946 break;
1da177e4
LT
3947 case NFS4_WRITE_LT:
3948 case NFS4_WRITEW_LT:
0997b173
BF
3949 filp = find_writeable_file(lock_stp->st_file);
3950 if (filp)
3951 get_lock_access(lock_stp, NFS4_SHARE_ACCESS_WRITE);
1da177e4 3952 file_lock.fl_type = F_WRLCK;
529d7b2a 3953 break;
1da177e4
LT
3954 default:
3955 status = nfserr_inval;
3956 goto out;
3957 }
f9d7562f
BF
3958 if (!filp) {
3959 status = nfserr_openmode;
3960 goto out;
3961 }
b59e3c0e 3962 file_lock.fl_owner = (fl_owner_t)lock_sop;
1da177e4
LT
3963 file_lock.fl_pid = current->tgid;
3964 file_lock.fl_file = filp;
3965 file_lock.fl_flags = FL_POSIX;
d5b9026a 3966 file_lock.fl_lmops = &nfsd_posix_mng_ops;
1da177e4
LT
3967
3968 file_lock.fl_start = lock->lk_offset;
87df4de8 3969 file_lock.fl_end = last_byte_offset(lock->lk_offset, lock->lk_length);
1da177e4
LT
3970 nfs4_transform_lock_offset(&file_lock);
3971
3972 /*
3973 * Try to lock the file in the VFS.
3974 * Note: locks.c uses the BKL to protect the inode's lock list.
3975 */
3976
529d7b2a 3977 err = vfs_lock_file(filp, F_SETLK, &file_lock, &conflock);
b8dd7b9a 3978 switch (-err) {
1da177e4 3979 case 0: /* success! */
dcef0413
BF
3980 update_stateid(&lock_stp->st_stid.sc_stateid);
3981 memcpy(&lock->lk_resp_stateid, &lock_stp->st_stid.sc_stateid,
1da177e4 3982 sizeof(stateid_t));
b8dd7b9a 3983 status = 0;
eb76b3fd
AA
3984 break;
3985 case (EAGAIN): /* conflock holds conflicting lock */
3986 status = nfserr_denied;
3987 dprintk("NFSD: nfsd4_lock: conflicting lock found!\n");
3988 nfs4_set_lock_denied(&conflock, &lock->lk_denied);
3989 break;
1da177e4
LT
3990 case (EDEADLK):
3991 status = nfserr_deadlock;
eb76b3fd 3992 break;
3e772463 3993 default:
fd85b817 3994 dprintk("NFSD: nfsd4_lock: vfs_lock_file() failed! status %d\n",err);
3e772463 3995 status = nfserrno(err);
eb76b3fd 3996 break;
1da177e4 3997 }
1da177e4 3998out:
8a280510 3999 if (status && lock->lk_is_new && lock_sop)
f044ff83 4000 release_lockowner(lock_sop);
5ec094c1
BF
4001 if (!cstate->replay_owner)
4002 nfs4_unlock_state();
1da177e4
LT
4003 return status;
4004}
4005
55ef1274
BF
4006/*
4007 * The NFSv4 spec allows a client to do a LOCKT without holding an OPEN,
4008 * so we do a temporary open here just to get an open file to pass to
4009 * vfs_test_lock. (Arguably perhaps test_lock should be done with an
4010 * inode operation.)
4011 */
4012static int nfsd_test_lock(struct svc_rqst *rqstp, struct svc_fh *fhp, struct file_lock *lock)
4013{
4014 struct file *file;
4015 int err;
4016
4017 err = nfsd_open(rqstp, fhp, S_IFREG, NFSD_MAY_READ, &file);
4018 if (err)
4019 return err;
4020 err = vfs_test_lock(file, lock);
4021 nfsd_close(file);
4022 return err;
4023}
4024
1da177e4
LT
4025/*
4026 * LOCKT operation
4027 */
b37ad28b 4028__be32
ca364317
BF
4029nfsd4_lockt(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
4030 struct nfsd4_lockt *lockt)
1da177e4
LT
4031{
4032 struct inode *inode;
1da177e4 4033 struct file_lock file_lock;
fe0750e5 4034 struct nfs4_lockowner *lo;
fd85b817 4035 int error;
b37ad28b 4036 __be32 status;
1da177e4 4037
af558e33 4038 if (locks_in_grace())
1da177e4
LT
4039 return nfserr_grace;
4040
4041 if (check_lock_length(lockt->lt_offset, lockt->lt_length))
4042 return nfserr_inval;
4043
1da177e4
LT
4044 nfs4_lock_state();
4045
4046 status = nfserr_stale_clientid;
60adfc50 4047 if (!nfsd4_has_session(cstate) && STALE_CLIENTID(&lockt->lt_clientid))
1da177e4 4048 goto out;
1da177e4 4049
75c096f7 4050 if ((status = fh_verify(rqstp, &cstate->current_fh, S_IFREG, 0)))
1da177e4 4051 goto out;
1da177e4 4052
ca364317 4053 inode = cstate->current_fh.fh_dentry->d_inode;
1da177e4
LT
4054 locks_init_lock(&file_lock);
4055 switch (lockt->lt_type) {
4056 case NFS4_READ_LT:
4057 case NFS4_READW_LT:
4058 file_lock.fl_type = F_RDLCK;
4059 break;
4060 case NFS4_WRITE_LT:
4061 case NFS4_WRITEW_LT:
4062 file_lock.fl_type = F_WRLCK;
4063 break;
4064 default:
2fdada03 4065 dprintk("NFSD: nfs4_lockt: bad lock type!\n");
1da177e4
LT
4066 status = nfserr_inval;
4067 goto out;
4068 }
4069
fe0750e5
BF
4070 lo = find_lockowner_str(inode, &lockt->lt_clientid, &lockt->lt_owner);
4071 if (lo)
4072 file_lock.fl_owner = (fl_owner_t)lo;
1da177e4
LT
4073 file_lock.fl_pid = current->tgid;
4074 file_lock.fl_flags = FL_POSIX;
4075
4076 file_lock.fl_start = lockt->lt_offset;
87df4de8 4077 file_lock.fl_end = last_byte_offset(lockt->lt_offset, lockt->lt_length);
1da177e4
LT
4078
4079 nfs4_transform_lock_offset(&file_lock);
4080
1da177e4 4081 status = nfs_ok;
55ef1274 4082 error = nfsd_test_lock(rqstp, &cstate->current_fh, &file_lock);
fd85b817
ME
4083 if (error) {
4084 status = nfserrno(error);
4085 goto out;
4086 }
9d6a8c5c 4087 if (file_lock.fl_type != F_UNLCK) {
1da177e4 4088 status = nfserr_denied;
9d6a8c5c 4089 nfs4_set_lock_denied(&file_lock, &lockt->lt_denied);
1da177e4
LT
4090 }
4091out:
4092 nfs4_unlock_state();
4093 return status;
4094}
4095
b37ad28b 4096__be32
ca364317 4097nfsd4_locku(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
a4f1706a 4098 struct nfsd4_locku *locku)
1da177e4 4099{
dcef0413 4100 struct nfs4_ol_stateid *stp;
1da177e4
LT
4101 struct file *filp = NULL;
4102 struct file_lock file_lock;
b37ad28b 4103 __be32 status;
b8dd7b9a 4104 int err;
1da177e4
LT
4105
4106 dprintk("NFSD: nfsd4_locku: start=%Ld length=%Ld\n",
4107 (long long) locku->lu_offset,
4108 (long long) locku->lu_length);
4109
4110 if (check_lock_length(locku->lu_offset, locku->lu_length))
4111 return nfserr_inval;
4112
4113 nfs4_lock_state();
4114
9072d5c6 4115 status = nfs4_preprocess_seqid_op(cstate, locku->lu_seqid,
2288d0e3 4116 &locku->lu_stateid, NFS4_LOCK_STID, &stp);
9072d5c6 4117 if (status)
1da177e4 4118 goto out;
f9d7562f
BF
4119 filp = find_any_file(stp->st_file);
4120 if (!filp) {
4121 status = nfserr_lock_range;
4122 goto out;
4123 }
1da177e4
LT
4124 BUG_ON(!filp);
4125 locks_init_lock(&file_lock);
4126 file_lock.fl_type = F_UNLCK;
fe0750e5 4127 file_lock.fl_owner = (fl_owner_t)lockowner(stp->st_stateowner);
1da177e4
LT
4128 file_lock.fl_pid = current->tgid;
4129 file_lock.fl_file = filp;
4130 file_lock.fl_flags = FL_POSIX;
d5b9026a 4131 file_lock.fl_lmops = &nfsd_posix_mng_ops;
1da177e4
LT
4132 file_lock.fl_start = locku->lu_offset;
4133
87df4de8 4134 file_lock.fl_end = last_byte_offset(locku->lu_offset, locku->lu_length);
1da177e4
LT
4135 nfs4_transform_lock_offset(&file_lock);
4136
4137 /*
4138 * Try to unlock the file in the VFS.
4139 */
fd85b817 4140 err = vfs_lock_file(filp, F_SETLK, &file_lock, NULL);
b8dd7b9a 4141 if (err) {
fd85b817 4142 dprintk("NFSD: nfs4_locku: vfs_lock_file failed!\n");
1da177e4
LT
4143 goto out_nfserr;
4144 }
4145 /*
4146 * OK, unlock succeeded; the only thing left to do is update the stateid.
4147 */
dcef0413
BF
4148 update_stateid(&stp->st_stid.sc_stateid);
4149 memcpy(&locku->lu_stateid, &stp->st_stid.sc_stateid, sizeof(stateid_t));
1da177e4
LT
4150
4151out:
71c3bcd7
BF
4152 if (!cstate->replay_owner)
4153 nfs4_unlock_state();
1da177e4
LT
4154 return status;
4155
4156out_nfserr:
b8dd7b9a 4157 status = nfserrno(err);
1da177e4
LT
4158 goto out;
4159}
4160
4161/*
4162 * returns
4163 * 1: locks held by lockowner
4164 * 0: no locks held by lockowner
4165 */
4166static int
fe0750e5 4167check_for_locks(struct nfs4_file *filp, struct nfs4_lockowner *lowner)
1da177e4
LT
4168{
4169 struct file_lock **flpp;
f9d7562f 4170 struct inode *inode = filp->fi_inode;
1da177e4
LT
4171 int status = 0;
4172
b89f4321 4173 lock_flocks();
1da177e4 4174 for (flpp = &inode->i_flock; *flpp != NULL; flpp = &(*flpp)->fl_next) {
796dadfd 4175 if ((*flpp)->fl_owner == (fl_owner_t)lowner) {
1da177e4
LT
4176 status = 1;
4177 goto out;
796dadfd 4178 }
1da177e4
LT
4179 }
4180out:
b89f4321 4181 unlock_flocks();
1da177e4
LT
4182 return status;
4183}
4184
b37ad28b 4185__be32
b591480b
BF
4186nfsd4_release_lockowner(struct svc_rqst *rqstp,
4187 struct nfsd4_compound_state *cstate,
4188 struct nfsd4_release_lockowner *rlockowner)
1da177e4
LT
4189{
4190 clientid_t *clid = &rlockowner->rl_clientid;
3e9e3dbe 4191 struct nfs4_stateowner *sop;
fe0750e5 4192 struct nfs4_lockowner *lo;
dcef0413 4193 struct nfs4_ol_stateid *stp;
1da177e4 4194 struct xdr_netobj *owner = &rlockowner->rl_owner;
3e9e3dbe
N
4195 struct list_head matches;
4196 int i;
b37ad28b 4197 __be32 status;
1da177e4
LT
4198
4199 dprintk("nfsd4_release_lockowner clientid: (%08x/%08x):\n",
4200 clid->cl_boot, clid->cl_id);
4201
4202 /* XXX check for lease expiration */
4203
4204 status = nfserr_stale_clientid;
849823c5 4205 if (STALE_CLIENTID(clid))
1da177e4 4206 return status;
1da177e4
LT
4207
4208 nfs4_lock_state();
4209
3e9e3dbe
N
4210 status = nfserr_locks_held;
4211 /* XXX: we're doing a linear search through all the lockowners.
4212 * Yipes! For now we'll just hope clients aren't really using
4213 * release_lockowner much, but eventually we have to fix these
4214 * data structures. */
4215 INIT_LIST_HEAD(&matches);
4216 for (i = 0; i < LOCK_HASH_SIZE; i++) {
d3b313a4 4217 list_for_each_entry(sop, &lock_ownerstr_hashtbl[i], so_strhash) {
599e0a22 4218 if (!same_owner_str(sop, owner, clid))
3e9e3dbe
N
4219 continue;
4220 list_for_each_entry(stp, &sop->so_stateids,
4221 st_perstateowner) {
fe0750e5
BF
4222 lo = lockowner(sop);
4223 if (check_for_locks(stp->st_file, lo))
3e9e3dbe 4224 goto out;
fe0750e5 4225 list_add(&lo->lo_list, &matches);
3e9e3dbe 4226 }
1da177e4 4227 }
3e9e3dbe
N
4228 }
4229 /* Clients probably won't expect us to return with some (but not all)
4230 * of the lockowner state released; so don't release any until all
4231 * have been checked. */
4232 status = nfs_ok;
0fa822e4 4233 while (!list_empty(&matches)) {
fe0750e5
BF
4234 lo = list_entry(matches.next, struct nfs4_lockowner,
4235 lo_list);
0fa822e4
N
4236 /* unhash_stateowner deletes so_perclient only
4237 * for openowners. */
fe0750e5
BF
4238 list_del(&lo->lo_list);
4239 release_lockowner(lo);
1da177e4
LT
4240 }
4241out:
4242 nfs4_unlock_state();
4243 return status;
4244}
4245
4246static inline struct nfs4_client_reclaim *
a55370a3 4247alloc_reclaim(void)
1da177e4 4248{
a55370a3 4249 return kmalloc(sizeof(struct nfs4_client_reclaim), GFP_KERNEL);
1da177e4
LT
4250}
4251
c7b9a459 4252int
a1bcecd2 4253nfs4_has_reclaimed_state(const char *name, bool use_exchange_id)
c7b9a459
N
4254{
4255 unsigned int strhashval = clientstr_hashval(name);
4256 struct nfs4_client *clp;
4257
e203d506 4258 clp = find_confirmed_client_by_str(name, strhashval);
c7b9a459
N
4259 return clp ? 1 : 0;
4260}
4261
1da177e4
LT
4262/*
4263 * failure => all reset bets are off, nfserr_no_grace...
4264 */
190e4fbf
N
4265int
4266nfs4_client_to_reclaim(const char *name)
1da177e4
LT
4267{
4268 unsigned int strhashval;
4269 struct nfs4_client_reclaim *crp = NULL;
4270
a55370a3
N
4271 dprintk("NFSD nfs4_client_to_reclaim NAME: %.*s\n", HEXDIR_LEN, name);
4272 crp = alloc_reclaim();
1da177e4
LT
4273 if (!crp)
4274 return 0;
a55370a3 4275 strhashval = clientstr_hashval(name);
1da177e4
LT
4276 INIT_LIST_HEAD(&crp->cr_strhash);
4277 list_add(&crp->cr_strhash, &reclaim_str_hashtbl[strhashval]);
a55370a3 4278 memcpy(crp->cr_recdir, name, HEXDIR_LEN);
1da177e4
LT
4279 reclaim_str_hashtbl_size++;
4280 return 1;
4281}
4282
4283static void
4284nfs4_release_reclaim(void)
4285{
4286 struct nfs4_client_reclaim *crp = NULL;
4287 int i;
4288
1da177e4
LT
4289 for (i = 0; i < CLIENT_HASH_SIZE; i++) {
4290 while (!list_empty(&reclaim_str_hashtbl[i])) {
4291 crp = list_entry(reclaim_str_hashtbl[i].next,
4292 struct nfs4_client_reclaim, cr_strhash);
4293 list_del(&crp->cr_strhash);
1da177e4
LT
4294 kfree(crp);
4295 reclaim_str_hashtbl_size--;
4296 }
4297 }
4298 BUG_ON(reclaim_str_hashtbl_size);
4299}
4300
4301/*
4302 * called from OPEN, CLAIM_PREVIOUS with a new clientid. */
fd39ca9a 4303static struct nfs4_client_reclaim *
1da177e4
LT
4304nfs4_find_reclaim_client(clientid_t *clid)
4305{
4306 unsigned int strhashval;
4307 struct nfs4_client *clp;
4308 struct nfs4_client_reclaim *crp = NULL;
4309
4310
4311 /* find clientid in conf_id_hashtbl */
4312 clp = find_confirmed_client(clid);
4313 if (clp == NULL)
4314 return NULL;
4315
a55370a3
N
4316 dprintk("NFSD: nfs4_find_reclaim_client for %.*s with recdir %s\n",
4317 clp->cl_name.len, clp->cl_name.data,
4318 clp->cl_recdir);
1da177e4
LT
4319
4320 /* find clp->cl_name in reclaim_str_hashtbl */
a55370a3 4321 strhashval = clientstr_hashval(clp->cl_recdir);
1da177e4 4322 list_for_each_entry(crp, &reclaim_str_hashtbl[strhashval], cr_strhash) {
a55370a3 4323 if (same_name(crp->cr_recdir, clp->cl_recdir)) {
1da177e4
LT
4324 return crp;
4325 }
4326 }
4327 return NULL;
4328}
4329
4330/*
4331* Called from OPEN. Look for clientid in reclaim list.
4332*/
b37ad28b 4333__be32
1da177e4
LT
4334nfs4_check_open_reclaim(clientid_t *clid)
4335{
dfc83565 4336 return nfs4_find_reclaim_client(clid) ? nfs_ok : nfserr_reclaim_bad;
1da177e4
LT
4337}
4338
ac4d8ff2 4339/* initialization to perform at module load time: */
1da177e4 4340
e8ff2a84 4341int
ac4d8ff2 4342nfs4_state_init(void)
1da177e4 4343{
e8ff2a84 4344 int i, status;
1da177e4 4345
e8ff2a84
BF
4346 status = nfsd4_init_slabs();
4347 if (status)
4348 return status;
1da177e4
LT
4349 for (i = 0; i < CLIENT_HASH_SIZE; i++) {
4350 INIT_LIST_HEAD(&conf_id_hashtbl[i]);
4351 INIT_LIST_HEAD(&conf_str_hashtbl[i]);
4352 INIT_LIST_HEAD(&unconf_str_hashtbl[i]);
4353 INIT_LIST_HEAD(&unconf_id_hashtbl[i]);
02cb2858 4354 INIT_LIST_HEAD(&reclaim_str_hashtbl[i]);
1da177e4 4355 }
5282fd72
ME
4356 for (i = 0; i < SESSION_HASH_SIZE; i++)
4357 INIT_LIST_HEAD(&sessionid_hashtbl[i]);
1da177e4
LT
4358 for (i = 0; i < FILE_HASH_SIZE; i++) {
4359 INIT_LIST_HEAD(&file_hashtbl[i]);
4360 }
506f275f
BF
4361 for (i = 0; i < OPEN_OWNER_HASH_SIZE; i++) {
4362 INIT_LIST_HEAD(&open_ownerstr_hashtbl[i]);
1da177e4 4363 }
1da177e4 4364 for (i = 0; i < LOCK_HASH_SIZE; i++) {
1da177e4
LT
4365 INIT_LIST_HEAD(&lock_ownerstr_hashtbl[i]);
4366 }
1da177e4 4367 memset(&onestateid, ~0, sizeof(stateid_t));
1da177e4
LT
4368 INIT_LIST_HEAD(&close_lru);
4369 INIT_LIST_HEAD(&client_lru);
4370 INIT_LIST_HEAD(&del_recall_lru);
ac4d8ff2 4371 reclaim_str_hashtbl_size = 0;
e8ff2a84 4372 return 0;
ac4d8ff2
N
4373}
4374
190e4fbf
N
/*
 * Initialise the recovery directory and load its contents under the state
 * lock.  A load failure is only logged; nothing is returned to the caller.
 */
static void
nfsd4_load_reboot_recovery_data(void)
{
	int err;

	nfs4_lock_state();
	nfsd4_init_recdir();
	err = nfsd4_recdir_load();
	nfs4_unlock_state();

	if (err != 0)
		printk("NFSD: Failure reading reboot recovery data\n");
}
4387
c2f1a551
MS
4388/*
4389 * Since the lifetime of a delegation isn't limited to that of an open, a
4390 * client may quite reasonably hang on to a delegation as long as it has
4391 * the inode cached. This becomes an obvious problem the first time a
4392 * client's inode cache approaches the size of the server's total memory.
4393 *
4394 * For now we avoid this problem by imposing a hard limit on the number
4395 * of delegations, which varies according to the server's memory size.
4396 */
4397static void
4398set_max_delegations(void)
4399{
4400 /*
4401 * Allow at most 4 delegations per megabyte of RAM. Quick
4402 * estimates suggest that in the worst case (where every delegation
4403 * is for a different inode), a delegation could take about 1.5K,
4404 * giving a worst case usage of about 6% of memory.
4405 */
4406 max_delegations = nr_free_buffer_pages() >> (20 - 2 - PAGE_SHIFT);
4407}
4408
ac4d8ff2
N
4409/* initialization to perform when the nfsd service is started: */
4410
29ab23cc 4411static int
ac4d8ff2
N
4412__nfs4_state_start(void)
4413{
b5a1a81e
BF
4414 int ret;
4415
1da177e4 4416 boot_time = get_seconds();
af558e33 4417 locks_start_grace(&nfsd4_manager);
9a8db97e 4418 printk(KERN_INFO "NFSD: starting %ld-second grace period\n",
e46b498c 4419 nfsd4_grace);
b5a1a81e
BF
4420 ret = set_callback_cred();
4421 if (ret)
4422 return -ENOMEM;
58da282b 4423 laundry_wq = create_singlethread_workqueue("nfsd4");
29ab23cc
BF
4424 if (laundry_wq == NULL)
4425 return -ENOMEM;
b5a1a81e
BF
4426 ret = nfsd4_create_callback_queue();
4427 if (ret)
4428 goto out_free_laundry;
e46b498c 4429 queue_delayed_work(laundry_wq, &laundromat_work, nfsd4_grace * HZ);
c2f1a551 4430 set_max_delegations();
b5a1a81e
BF
4431 return 0;
4432out_free_laundry:
4433 destroy_workqueue(laundry_wq);
4434 return ret;
1da177e4
LT
4435}
4436
/*
 * Start NFSv4 state handling: load the reboot recovery data, then perform
 * the per-start initialisation.  Returns the result of __nfs4_state_start().
 */
int
nfs4_state_start(void)
{
	int ret;

	nfsd4_load_reboot_recovery_data();
	ret = __nfs4_state_start();
	return ret;
}
4443
1da177e4
LT
4444static void
4445__nfs4_state_shutdown(void)
4446{
4447 int i;
4448 struct nfs4_client *clp = NULL;
4449 struct nfs4_delegation *dp = NULL;
1da177e4
LT
4450 struct list_head *pos, *next, reaplist;
4451
1da177e4
LT
4452 for (i = 0; i < CLIENT_HASH_SIZE; i++) {
4453 while (!list_empty(&conf_id_hashtbl[i])) {
4454 clp = list_entry(conf_id_hashtbl[i].next, struct nfs4_client, cl_idhash);
4455 expire_client(clp);
4456 }
4457 while (!list_empty(&unconf_str_hashtbl[i])) {
4458 clp = list_entry(unconf_str_hashtbl[i].next, struct nfs4_client, cl_strhash);
4459 expire_client(clp);
4460 }
4461 }
4462 INIT_LIST_HEAD(&reaplist);
4463 spin_lock(&recall_lock);
4464 list_for_each_safe(pos, next, &del_recall_lru) {
4465 dp = list_entry (pos, struct nfs4_delegation, dl_recall_lru);
4466 list_move(&dp->dl_recall_lru, &reaplist);
4467 }
4468 spin_unlock(&recall_lock);
4469 list_for_each_safe(pos, next, &reaplist) {
4470 dp = list_entry (pos, struct nfs4_delegation, dl_recall_lru);
4471 list_del_init(&dp->dl_recall_lru);
4472 unhash_delegation(dp);
4473 }
4474
190e4fbf 4475 nfsd4_shutdown_recdir();
1da177e4
LT
4476}
4477
4478void
4479nfs4_state_shutdown(void)
4480{
afe2c511 4481 cancel_delayed_work_sync(&laundromat_work);
5e8d5c29 4482 destroy_workqueue(laundry_wq);
2c5e7615 4483 locks_end_grace(&nfsd4_manager);
1da177e4
LT
4484 nfs4_lock_state();
4485 nfs4_release_reclaim();
4486 __nfs4_state_shutdown();
1da177e4 4487 nfs4_unlock_state();
c3935e30 4488 nfsd4_destroy_callback_queue();
1da177e4 4489}