nfsd4: add a separate (lockowner, inode) lookup
[linux-2.6-block.git] / fs / nfsd / nfs4state.c
CommitLineData
1da177e4 1/*
1da177e4
LT
2* Copyright (c) 2001 The Regents of the University of Michigan.
3* All rights reserved.
4*
5* Kendrick Smith <kmsmith@umich.edu>
6* Andy Adamson <kandros@umich.edu>
7*
8* Redistribution and use in source and binary forms, with or without
9* modification, are permitted provided that the following conditions
10* are met:
11*
12* 1. Redistributions of source code must retain the above copyright
13* notice, this list of conditions and the following disclaimer.
14* 2. Redistributions in binary form must reproduce the above copyright
15* notice, this list of conditions and the following disclaimer in the
16* documentation and/or other materials provided with the distribution.
17* 3. Neither the name of the University nor the names of its
18* contributors may be used to endorse or promote products derived
19* from this software without specific prior written permission.
20*
21* THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED
22* WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
23* MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
24* DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
25* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
26* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
27* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
28* BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
29* LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
30* NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
31* SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
32*
33*/
34
aceaf78d 35#include <linux/file.h>
b89f4321 36#include <linux/fs.h>
5a0e3ad6 37#include <linux/slab.h>
0964a3d3 38#include <linux/namei.h>
c2f1a551 39#include <linux/swap.h>
17456804 40#include <linux/pagemap.h>
68e76ad0 41#include <linux/sunrpc/svcauth_gss.h>
363168b4 42#include <linux/sunrpc/clnt.h>
9a74af21 43#include "xdr4.h"
0a3adade 44#include "vfs.h"
1da177e4
LT
45
46#define NFSDDBG_FACILITY NFSDDBG_PROC
47
48/* Globals */
cf07d2ea 49time_t nfsd4_lease = 90; /* default lease time */
efc4bb4f 50time_t nfsd4_grace = 90;
fd39ca9a 51static time_t boot_time;
fd39ca9a
N
52static stateid_t zerostateid; /* bits all 0 */
53static stateid_t onestateid; /* bits all 1 */
ec6b5d7b 54static u64 current_sessionid = 1;
fd39ca9a
N
55
56#define ZERO_STATEID(stateid) (!memcmp((stateid), &zerostateid, sizeof(stateid_t)))
57#define ONE_STATEID(stateid) (!memcmp((stateid), &onestateid, sizeof(stateid_t)))
1da177e4 58
1da177e4 59/* forward declarations */
fe0750e5 60static int check_for_locks(struct nfs4_file *filp, struct nfs4_lockowner *lowner);
1da177e4 61
8b671b80
BF
62/* Locking: */
63
64/* Currently used for almost all code touching nfsv4 state: */
353ab6e9 65static DEFINE_MUTEX(client_mutex);
1da177e4 66
8b671b80
BF
67/*
68 * Currently used for the del_recall_lru and file hash table. In an
69 * effort to decrease the scope of the client_mutex, this spinlock may
70 * eventually cover more:
71 */
72static DEFINE_SPINLOCK(recall_lock);
73
fe0750e5
BF
74static struct kmem_cache *openowner_slab = NULL;
75static struct kmem_cache *lockowner_slab = NULL;
e18b890b
CL
76static struct kmem_cache *file_slab = NULL;
77static struct kmem_cache *stateid_slab = NULL;
78static struct kmem_cache *deleg_slab = NULL;
e60d4398 79
1da177e4
LT
80void
81nfs4_lock_state(void)
82{
353ab6e9 83 mutex_lock(&client_mutex);
1da177e4
LT
84}
85
86void
87nfs4_unlock_state(void)
88{
353ab6e9 89 mutex_unlock(&client_mutex);
1da177e4
LT
90}
91
92static inline u32
93opaque_hashval(const void *ptr, int nbytes)
94{
95 unsigned char *cptr = (unsigned char *) ptr;
96
97 u32 x = 0;
98 while (nbytes--) {
99 x *= 37;
100 x += *cptr++;
101 }
102 return x;
103}
104
1da177e4
LT
105static struct list_head del_recall_lru;
106
32513b40
BF
107static void nfsd4_free_file(struct nfs4_file *f)
108{
109 kmem_cache_free(file_slab, f);
110}
111
13cd2184
N
112static inline void
113put_nfs4_file(struct nfs4_file *fi)
114{
8b671b80
BF
115 if (atomic_dec_and_lock(&fi->fi_ref, &recall_lock)) {
116 list_del(&fi->fi_hash);
117 spin_unlock(&recall_lock);
118 iput(fi->fi_inode);
32513b40 119 nfsd4_free_file(fi);
8b671b80 120 }
13cd2184
N
121}
122
123static inline void
124get_nfs4_file(struct nfs4_file *fi)
125{
8b671b80 126 atomic_inc(&fi->fi_ref);
13cd2184
N
127}
128
ef0f3390 129static int num_delegations;
c2f1a551 130unsigned int max_delegations;
ef0f3390
N
131
132/*
133 * Open owner state (share locks)
134 */
135
16bfdaaf
BF
136/* hash tables for lock and open owners */
137#define OWNER_HASH_BITS 8
138#define OWNER_HASH_SIZE (1 << OWNER_HASH_BITS)
139#define OWNER_HASH_MASK (OWNER_HASH_SIZE - 1)
ef0f3390 140
16bfdaaf 141static unsigned int ownerstr_hashval(u32 clientid, struct xdr_netobj *ownername)
ddc04c41
BF
142{
143 unsigned int ret;
144
145 ret = opaque_hashval(ownername->data, ownername->len);
146 ret += clientid;
16bfdaaf 147 return ret & OWNER_HASH_MASK;
ddc04c41 148}
ef0f3390 149
16bfdaaf 150static struct list_head ownerstr_hashtbl[OWNER_HASH_SIZE];
ef0f3390
N
151
152/* hash table for nfs4_file */
153#define FILE_HASH_BITS 8
154#define FILE_HASH_SIZE (1 << FILE_HASH_BITS)
35079582 155
ddc04c41
BF
156static unsigned int file_hashval(struct inode *ino)
157{
158 /* XXX: why are we hashing on inode pointer, anyway? */
159 return hash_ptr(ino, FILE_HASH_BITS);
160}
161
ef0f3390 162static struct list_head file_hashtbl[FILE_HASH_SIZE];
ef0f3390 163
998db52c 164static void __nfs4_file_get_access(struct nfs4_file *fp, int oflag)
f9d7562f
BF
165{
166 BUG_ON(!(fp->fi_fds[oflag] || fp->fi_fds[O_RDWR]));
167 atomic_inc(&fp->fi_access[oflag]);
168}
169
998db52c
BF
170static void nfs4_file_get_access(struct nfs4_file *fp, int oflag)
171{
172 if (oflag == O_RDWR) {
173 __nfs4_file_get_access(fp, O_RDONLY);
174 __nfs4_file_get_access(fp, O_WRONLY);
175 } else
176 __nfs4_file_get_access(fp, oflag);
177}
178
179static void nfs4_file_put_fd(struct nfs4_file *fp, int oflag)
f9d7562f
BF
180{
181 if (fp->fi_fds[oflag]) {
182 fput(fp->fi_fds[oflag]);
183 fp->fi_fds[oflag] = NULL;
184 }
185}
186
998db52c 187static void __nfs4_file_put_access(struct nfs4_file *fp, int oflag)
f9d7562f
BF
188{
189 if (atomic_dec_and_test(&fp->fi_access[oflag])) {
f9d7562f 190 nfs4_file_put_fd(fp, oflag);
3d02fa29
BF
191 /*
192 * It's also safe to get rid of the RDWR open *if*
193 * we no longer have need of the other kind of access
194 * or if we already have the other kind of open:
195 */
196 if (fp->fi_fds[1-oflag]
197 || atomic_read(&fp->fi_access[1 - oflag]) == 0)
198 nfs4_file_put_fd(fp, O_RDWR);
f9d7562f
BF
199 }
200}
201
998db52c
BF
202static void nfs4_file_put_access(struct nfs4_file *fp, int oflag)
203{
204 if (oflag == O_RDWR) {
205 __nfs4_file_put_access(fp, O_RDONLY);
206 __nfs4_file_put_access(fp, O_WRONLY);
207 } else
208 __nfs4_file_put_access(fp, oflag);
209}
210
6136d2b4 211static inline int get_new_stid(struct nfs4_stid *stid)
36d44c60 212{
6136d2b4 213 static int min_stateid = 0;
38c2f4b1 214 struct idr *stateids = &stid->sc_client->cl_stateids;
6136d2b4
BF
215 int new_stid;
216 int error;
217
38c2f4b1 218 error = idr_get_new_above(stateids, stid, min_stateid, &new_stid);
6136d2b4 219 /*
996e0938
BF
220 * Note: the necessary preallocation was done in
221 * nfs4_alloc_stateid(). The idr code caps the number of
222 * preallocations that can exist at a time, but the state lock
223 * prevents anyone from using ours before we get here:
6136d2b4
BF
224 */
225 BUG_ON(error);
226 /*
227 * It shouldn't be a problem to reuse an opaque stateid value.
228 * I don't think it is for 4.1. But with 4.0 I worry that, for
229 * example, a stray write retransmission could be accepted by
230 * the server when it should have been rejected. Therefore,
231 * adopt a trick from the sctp code to attempt to maximize the
232 * amount of time until an id is reused, by ensuring they always
233 * "increase" (mod INT_MAX):
234 */
36d44c60 235
6136d2b4
BF
236 min_stateid = new_stid+1;
237 if (min_stateid == INT_MAX)
238 min_stateid = 0;
239 return new_stid;
36d44c60
BF
240}
241
996e0938 242static void init_stid(struct nfs4_stid *stid, struct nfs4_client *cl, unsigned char type)
2a74aba7
BF
243{
244 stateid_t *s = &stid->sc_stateid;
6136d2b4 245 int new_id;
2a74aba7
BF
246
247 stid->sc_type = type;
248 stid->sc_client = cl;
249 s->si_opaque.so_clid = cl->cl_clientid;
6136d2b4 250 new_id = get_new_stid(stid);
6136d2b4 251 s->si_opaque.so_id = (u32)new_id;
2a74aba7
BF
252 /* Will be incremented before return to client: */
253 s->si_generation = 0;
996e0938
BF
254}
255
256static struct nfs4_stid *nfs4_alloc_stid(struct nfs4_client *cl, struct kmem_cache *slab)
257{
258 struct idr *stateids = &cl->cl_stateids;
259
260 if (!idr_pre_get(stateids, GFP_KERNEL))
261 return NULL;
262 /*
263 * Note: if we fail here (or any time between now and the time
264 * we actually get the new idr), we won't need to undo the idr
265 * preallocation, since the idr code caps the number of
266 * preallocated entries.
267 */
268 return kmem_cache_alloc(slab, GFP_KERNEL);
2a74aba7
BF
269}
270
4cdc951b
BF
271static struct nfs4_ol_stateid * nfs4_alloc_stateid(struct nfs4_client *clp)
272{
273 return openlockstateid(nfs4_alloc_stid(clp, stateid_slab));
274}
275
1da177e4 276static struct nfs4_delegation *
dcef0413 277alloc_init_deleg(struct nfs4_client *clp, struct nfs4_ol_stateid *stp, struct svc_fh *current_fh, u32 type)
1da177e4
LT
278{
279 struct nfs4_delegation *dp;
280 struct nfs4_file *fp = stp->st_file;
1da177e4
LT
281
282 dprintk("NFSD alloc_init_deleg\n");
c3e48080
BF
283 /*
284 * Major work on the lease subsystem (for example, to support
285 * calbacks on stat) will be required before we can support
286 * write delegations properly.
287 */
288 if (type != NFS4_OPEN_DELEGATE_READ)
289 return NULL;
47f9940c
MS
290 if (fp->fi_had_conflict)
291 return NULL;
c2f1a551 292 if (num_delegations > max_delegations)
ef0f3390 293 return NULL;
996e0938 294 dp = delegstateid(nfs4_alloc_stid(clp, deleg_slab));
5b2d21c1 295 if (dp == NULL)
1da177e4 296 return dp;
996e0938 297 init_stid(&dp->dl_stid, clp, NFS4_DELEG_STID);
2a74aba7
BF
298 /*
299 * delegation seqid's are never incremented. The 4.1 special
6136d2b4
BF
300 * meaning of seqid 0 isn't meaningful, really, but let's avoid
301 * 0 anyway just for consistency and use 1:
2a74aba7
BF
302 */
303 dp->dl_stid.sc_stateid.si_generation = 1;
ef0f3390 304 num_delegations++;
ea1da636
N
305 INIT_LIST_HEAD(&dp->dl_perfile);
306 INIT_LIST_HEAD(&dp->dl_perclnt);
1da177e4 307 INIT_LIST_HEAD(&dp->dl_recall_lru);
13cd2184 308 get_nfs4_file(fp);
1da177e4 309 dp->dl_file = fp;
1da177e4 310 dp->dl_type = type;
6c02eaa1 311 fh_copy_shallow(&dp->dl_fh, &current_fh->fh_handle);
1da177e4
LT
312 dp->dl_time = 0;
313 atomic_set(&dp->dl_count, 1);
b5a1a81e 314 INIT_WORK(&dp->dl_recall.cb_work, nfsd4_do_callback_rpc);
1da177e4
LT
315 return dp;
316}
317
318void
319nfs4_put_delegation(struct nfs4_delegation *dp)
320{
321 if (atomic_dec_and_test(&dp->dl_count)) {
322 dprintk("NFSD: freeing dp %p\n",dp);
13cd2184 323 put_nfs4_file(dp->dl_file);
5b2d21c1 324 kmem_cache_free(deleg_slab, dp);
ef0f3390 325 num_delegations--;
1da177e4
LT
326 }
327}
328
acfdf5c3 329static void nfs4_put_deleg_lease(struct nfs4_file *fp)
1da177e4 330{
acfdf5c3
BF
331 if (atomic_dec_and_test(&fp->fi_delegees)) {
332 vfs_setlease(fp->fi_deleg_file, F_UNLCK, &fp->fi_lease);
333 fp->fi_lease = NULL;
4ee63624 334 fput(fp->fi_deleg_file);
acfdf5c3
BF
335 fp->fi_deleg_file = NULL;
336 }
1da177e4
LT
337}
338
6136d2b4
BF
339static void unhash_stid(struct nfs4_stid *s)
340{
38c2f4b1
BF
341 struct idr *stateids = &s->sc_client->cl_stateids;
342
343 idr_remove(stateids, s->sc_stateid.si_opaque.so_id);
6136d2b4
BF
344}
345
1da177e4
LT
346/* Called under the state lock. */
347static void
348unhash_delegation(struct nfs4_delegation *dp)
349{
6136d2b4 350 unhash_stid(&dp->dl_stid);
ea1da636 351 list_del_init(&dp->dl_perclnt);
1da177e4 352 spin_lock(&recall_lock);
5d926e8c 353 list_del_init(&dp->dl_perfile);
1da177e4
LT
354 list_del_init(&dp->dl_recall_lru);
355 spin_unlock(&recall_lock);
acfdf5c3 356 nfs4_put_deleg_lease(dp->dl_file);
1da177e4
LT
357 nfs4_put_delegation(dp);
358}
359
360/*
361 * SETCLIENTID state
362 */
363
36acb66b 364/* client_lock protects the client lru list and session hash table */
9089f1b4
BH
365static DEFINE_SPINLOCK(client_lock);
366
1da177e4
LT
367/* Hash tables for nfs4_clientid state */
368#define CLIENT_HASH_BITS 4
369#define CLIENT_HASH_SIZE (1 << CLIENT_HASH_BITS)
370#define CLIENT_HASH_MASK (CLIENT_HASH_SIZE - 1)
371
ddc04c41
BF
372static unsigned int clientid_hashval(u32 id)
373{
374 return id & CLIENT_HASH_MASK;
375}
376
377static unsigned int clientstr_hashval(const char *name)
378{
379 return opaque_hashval(name, 8) & CLIENT_HASH_MASK;
380}
381
1da177e4
LT
382/*
383 * reclaim_str_hashtbl[] holds known client info from previous reset/reboot
384 * used in reboot/reset lease grace period processing
385 *
386 * conf_id_hashtbl[], and conf_str_hashtbl[] hold confirmed
387 * setclientid_confirmed info.
388 *
389 * unconf_str_hashtbl[] and unconf_id_hashtbl[] hold unconfirmed
390 * setclientid info.
391 *
392 * client_lru holds client queue ordered by nfs4_client.cl_time
393 * for lease renewal.
394 *
395 * close_lru holds (open) stateowner queue ordered by nfs4_stateowner.so_time
396 * for last close replay.
397 */
398static struct list_head reclaim_str_hashtbl[CLIENT_HASH_SIZE];
399static int reclaim_str_hashtbl_size = 0;
400static struct list_head conf_id_hashtbl[CLIENT_HASH_SIZE];
401static struct list_head conf_str_hashtbl[CLIENT_HASH_SIZE];
402static struct list_head unconf_str_hashtbl[CLIENT_HASH_SIZE];
403static struct list_head unconf_id_hashtbl[CLIENT_HASH_SIZE];
404static struct list_head client_lru;
405static struct list_head close_lru;
406
f9d7562f
BF
407/*
408 * We store the NONE, READ, WRITE, and BOTH bits separately in the
409 * st_{access,deny}_bmap field of the stateid, in order to track not
410 * only what share bits are currently in force, but also what
411 * combinations of share bits previous opens have used. This allows us
412 * to enforce the recommendation of rfc 3530 14.2.19 that the server
413 * return an error if the client attempts to downgrade to a combination
414 * of share bits not explicable by closing some of its previous opens.
415 *
416 * XXX: This enforcement is actually incomplete, since we don't keep
417 * track of access/deny bit combinations; so, e.g., we allow:
418 *
419 * OPEN allow read, deny write
420 * OPEN allow both, deny none
421 * DOWNGRADE allow read, deny none
422 *
423 * which we should reject.
424 */
/*
 * Collapse an access bitmap into a single value: *access becomes the
 * OR of every index i in 1..3 whose bit is set in @bmap.
 */
static void
set_access(unsigned int *access, unsigned long bmap) {
	unsigned int merged = 0;
	int bit;

	for (bit = 1; bit < 4; bit++)
		if (test_bit(bit, &bmap))
			merged |= bit;
	*access = merged;
}
435
/*
 * Collapse a deny bitmap into a single value: *deny becomes the OR of
 * every index i in 0..3 whose bit is set in @bmap (index 0 adds nothing).
 */
static void
set_deny(unsigned int *deny, unsigned long bmap) {
	unsigned int merged = 0;
	int bit;

	for (bit = 0; bit < 4; bit++)
		if (test_bit(bit, &bmap))
			merged |= bit;
	*deny = merged;
}
446
447static int
dcef0413 448test_share(struct nfs4_ol_stateid *stp, struct nfsd4_open *open) {
f9d7562f
BF
449 unsigned int access, deny;
450
451 set_access(&access, stp->st_access_bmap);
452 set_deny(&deny, stp->st_deny_bmap);
453 if ((access & open->op_share_deny) || (deny & open->op_share_access))
454 return 0;
455 return 1;
456}
457
458static int nfs4_access_to_omode(u32 access)
459{
8f34a430 460 switch (access & NFS4_SHARE_ACCESS_BOTH) {
f9d7562f
BF
461 case NFS4_SHARE_ACCESS_READ:
462 return O_RDONLY;
463 case NFS4_SHARE_ACCESS_WRITE:
464 return O_WRONLY;
465 case NFS4_SHARE_ACCESS_BOTH:
466 return O_RDWR;
467 }
468 BUG();
469}
470
dcef0413 471static void unhash_generic_stateid(struct nfs4_ol_stateid *stp)
529d7b2a 472{
529d7b2a
BF
473 list_del(&stp->st_perfile);
474 list_del(&stp->st_perstateowner);
475}
476
dcef0413 477static void close_generic_stateid(struct nfs4_ol_stateid *stp)
529d7b2a 478{
499f3edc 479 int i;
0997b173 480
23fcf2ec 481 if (stp->st_access_bmap) {
499f3edc
BF
482 for (i = 1; i < 4; i++) {
483 if (test_bit(i, &stp->st_access_bmap))
484 nfs4_file_put_access(stp->st_file,
485 nfs4_access_to_omode(i));
4665e2ba 486 __clear_bit(i, &stp->st_access_bmap);
499f3edc 487 }
23fcf2ec 488 }
a96e5b90 489 put_nfs4_file(stp->st_file);
4665e2ba
BF
490 stp->st_file = NULL;
491}
492
dcef0413 493static void free_generic_stateid(struct nfs4_ol_stateid *stp)
4665e2ba 494{
529d7b2a
BF
495 kmem_cache_free(stateid_slab, stp);
496}
497
dcef0413 498static void release_lock_stateid(struct nfs4_ol_stateid *stp)
529d7b2a
BF
499{
500 struct file *file;
501
502 unhash_generic_stateid(stp);
6136d2b4 503 unhash_stid(&stp->st_stid);
529d7b2a
BF
504 file = find_any_file(stp->st_file);
505 if (file)
fe0750e5 506 locks_remove_posix(file, (fl_owner_t)lockowner(stp->st_stateowner));
38c387b5 507 close_generic_stateid(stp);
529d7b2a
BF
508 free_generic_stateid(stp);
509}
510
fe0750e5 511static void unhash_lockowner(struct nfs4_lockowner *lo)
529d7b2a 512{
dcef0413 513 struct nfs4_ol_stateid *stp;
529d7b2a 514
fe0750e5
BF
515 list_del(&lo->lo_owner.so_strhash);
516 list_del(&lo->lo_perstateid);
009673b4 517 list_del(&lo->lo_owner_ino_hash);
fe0750e5
BF
518 while (!list_empty(&lo->lo_owner.so_stateids)) {
519 stp = list_first_entry(&lo->lo_owner.so_stateids,
dcef0413 520 struct nfs4_ol_stateid, st_perstateowner);
529d7b2a
BF
521 release_lock_stateid(stp);
522 }
523}
524
/* Unhash lockowner @lo (releasing its stateids) and free it. */
static void release_lockowner(struct nfs4_lockowner *lo)
{
	unhash_lockowner(lo);
	nfs4_free_lockowner(lo);
}
530
531static void
dcef0413 532release_stateid_lockowners(struct nfs4_ol_stateid *open_stp)
529d7b2a 533{
fe0750e5 534 struct nfs4_lockowner *lo;
529d7b2a
BF
535
536 while (!list_empty(&open_stp->st_lockowners)) {
fe0750e5
BF
537 lo = list_entry(open_stp->st_lockowners.next,
538 struct nfs4_lockowner, lo_perstateid);
539 release_lockowner(lo);
529d7b2a
BF
540 }
541}
542
/*
 * Unlink open stateid @stp from its lists, release the lockowners that
 * depend on it, and give up its file state.  The stateid itself is
 * neither removed from the idr nor freed here.
 */
static void unhash_open_stateid(struct nfs4_ol_stateid *stp)
{
	unhash_generic_stateid(stp);
	release_stateid_lockowners(stp);
	close_generic_stateid(stp);
}
549
550static void release_open_stateid(struct nfs4_ol_stateid *stp)
551{
552 unhash_open_stateid(stp);
6136d2b4 553 unhash_stid(&stp->st_stid);
2283963f
BF
554 free_generic_stateid(stp);
555}
556
fe0750e5 557static void unhash_openowner(struct nfs4_openowner *oo)
f1d110ca 558{
dcef0413 559 struct nfs4_ol_stateid *stp;
f1d110ca 560
fe0750e5
BF
561 list_del(&oo->oo_owner.so_strhash);
562 list_del(&oo->oo_perclient);
563 while (!list_empty(&oo->oo_owner.so_stateids)) {
564 stp = list_first_entry(&oo->oo_owner.so_stateids,
dcef0413 565 struct nfs4_ol_stateid, st_perstateowner);
f044ff83 566 release_open_stateid(stp);
f1d110ca
BF
567 }
568}
569
f7a4d872
BF
570static void release_last_closed_stateid(struct nfs4_openowner *oo)
571{
572 struct nfs4_ol_stateid *s = oo->oo_last_closed_stid;
573
574 if (s) {
6136d2b4 575 unhash_stid(&s->st_stid);
f7a4d872
BF
576 free_generic_stateid(s);
577 oo->oo_last_closed_stid = NULL;
578 }
579}
580
fe0750e5 581static void release_openowner(struct nfs4_openowner *oo)
f1d110ca 582{
fe0750e5
BF
583 unhash_openowner(oo);
584 list_del(&oo->oo_close_lru);
f7a4d872 585 release_last_closed_stateid(oo);
fe0750e5 586 nfs4_free_openowner(oo);
f1d110ca
BF
587}
588
5282fd72
ME
589#define SESSION_HASH_SIZE 512
590static struct list_head sessionid_hashtbl[SESSION_HASH_SIZE];
591
592static inline int
593hash_sessionid(struct nfs4_sessionid *sessionid)
594{
595 struct nfsd4_sessionid *sid = (struct nfsd4_sessionid *)sessionid;
596
597 return sid->sequence % SESSION_HASH_SIZE;
598}
599
600static inline void
601dump_sessionid(const char *fn, struct nfs4_sessionid *sessionid)
602{
603 u32 *ptr = (u32 *)(&sessionid->data[0]);
604 dprintk("%s: %u:%u:%u:%u\n", fn, ptr[0], ptr[1], ptr[2], ptr[3]);
605}
606
ec6b5d7b
AA
607static void
608gen_sessionid(struct nfsd4_session *ses)
609{
610 struct nfs4_client *clp = ses->se_client;
611 struct nfsd4_sessionid *sid;
612
613 sid = (struct nfsd4_sessionid *)ses->se_sessionid.data;
614 sid->clientid = clp->cl_clientid;
615 sid->sequence = current_sessionid++;
616 sid->reserved = 0;
617}
618
619/*
a649637c
AA
620 * The protocol defines ca_maxresponsesize_cached to include the size of
621 * the rpc header, but all we need to cache is the data starting after
622 * the end of the initial SEQUENCE operation--the rest we regenerate
623 * each time. Therefore we can advertise a ca_maxresponsesize_cached
624 * value that is the number of bytes in our cache plus a few additional
625 * bytes. In order to stay on the safe side, and not promise more than
626 * we can cache, those additional bytes must be the minimum possible: 24
627 * bytes of rpc header (xid through accept state, with AUTH_NULL
628 * verifier), 12 for the compound header (with zero-length tag), and 44
629 * for the SEQUENCE op response:
630 */
631#define NFSD_MIN_HDR_SEQ_SZ (24 + 12 + 44)
632
557ce264
AA
633static void
634free_session_slots(struct nfsd4_session *ses)
635{
636 int i;
637
638 for (i = 0; i < ses->se_fchannel.maxreqs; i++)
639 kfree(ses->se_slots[i]);
640}
641
a649637c 642/*
efe0cb6d
BF
643 * We don't actually need to cache the rpc and session headers, so we
644 * can allocate a little less for each slot:
645 */
646static inline int slot_bytes(struct nfsd4_channel_attrs *ca)
647{
648 return ca->maxresp_cached - NFSD_MIN_HDR_SEQ_SZ;
649}
650
5b6feee9 651static int nfsd4_sanitize_slot_size(u32 size)
ec6b5d7b 652{
5b6feee9
BF
653 size -= NFSD_MIN_HDR_SEQ_SZ; /* We don't cache the rpc header */
654 size = min_t(u32, size, NFSD_SLOT_CACHE_SIZE);
ec6b5d7b 655
5b6feee9
BF
656 return size;
657}
ec6b5d7b 658
5b6feee9
BF
659/*
660 * XXX: If we run out of reserved DRC memory we could (up to a point)
a649637c
AA
661 * re-negotiate active sessions and reduce their slot usage to make
662 * rooom for new connections. For now we just fail the create session.
ec6b5d7b 663 */
5b6feee9 664static int nfsd4_get_drc_mem(int slotsize, u32 num)
ec6b5d7b 665{
5b6feee9 666 int avail;
ec6b5d7b 667
5b6feee9 668 num = min_t(u32, num, NFSD_MAX_SLOTS_PER_SESSION);
5d77ddfb 669
5b6feee9
BF
670 spin_lock(&nfsd_drc_lock);
671 avail = min_t(int, NFSD_MAX_MEM_PER_SESSION,
672 nfsd_drc_max_mem - nfsd_drc_mem_used);
673 num = min_t(int, num, avail / slotsize);
674 nfsd_drc_mem_used += num * slotsize;
675 spin_unlock(&nfsd_drc_lock);
ec6b5d7b 676
5b6feee9
BF
677 return num;
678}
ec6b5d7b 679
5b6feee9
BF
680static void nfsd4_put_drc_mem(int slotsize, int num)
681{
4bd9b0f4 682 spin_lock(&nfsd_drc_lock);
5b6feee9 683 nfsd_drc_mem_used -= slotsize * num;
4bd9b0f4 684 spin_unlock(&nfsd_drc_lock);
5b6feee9 685}
ec6b5d7b 686
5b6feee9
BF
687static struct nfsd4_session *alloc_session(int slotsize, int numslots)
688{
689 struct nfsd4_session *new;
690 int mem, i;
a649637c 691
5b6feee9
BF
692 BUILD_BUG_ON(NFSD_MAX_SLOTS_PER_SESSION * sizeof(struct nfsd4_slot *)
693 + sizeof(struct nfsd4_session) > PAGE_SIZE);
694 mem = numslots * sizeof(struct nfsd4_slot *);
ec6b5d7b 695
5b6feee9
BF
696 new = kzalloc(sizeof(*new) + mem, GFP_KERNEL);
697 if (!new)
698 return NULL;
557ce264 699 /* allocate each struct nfsd4_slot and data cache in one piece */
5b6feee9
BF
700 for (i = 0; i < numslots; i++) {
701 mem = sizeof(struct nfsd4_slot) + slotsize;
702 new->se_slots[i] = kzalloc(mem, GFP_KERNEL);
703 if (!new->se_slots[i])
557ce264 704 goto out_free;
557ce264 705 }
5b6feee9
BF
706 return new;
707out_free:
708 while (i--)
709 kfree(new->se_slots[i]);
710 kfree(new);
711 return NULL;
ec6b5d7b
AA
712}
713
5b6feee9 714static void init_forechannel_attrs(struct nfsd4_channel_attrs *new, struct nfsd4_channel_attrs *req, int numslots, int slotsize)
ec6b5d7b 715{
5b6feee9 716 u32 maxrpc = nfsd_serv->sv_max_mesg;
ec6b5d7b 717
5b6feee9 718 new->maxreqs = numslots;
d2b21743
MJ
719 new->maxresp_cached = min_t(u32, req->maxresp_cached,
720 slotsize + NFSD_MIN_HDR_SEQ_SZ);
5b6feee9
BF
721 new->maxreq_sz = min_t(u32, req->maxreq_sz, maxrpc);
722 new->maxresp_sz = min_t(u32, req->maxresp_sz, maxrpc);
723 new->maxops = min_t(u32, req->maxops, NFSD_MAX_OPS_PER_COMPOUND);
724}
ec6b5d7b 725
19cf5c02
BF
726static void free_conn(struct nfsd4_conn *c)
727{
728 svc_xprt_put(c->cn_xprt);
729 kfree(c);
730}
ec6b5d7b 731
19cf5c02
BF
732static void nfsd4_conn_lost(struct svc_xpt_user *u)
733{
734 struct nfsd4_conn *c = container_of(u, struct nfsd4_conn, cn_xpt_user);
735 struct nfs4_client *clp = c->cn_session->se_client;
ec6b5d7b 736
19cf5c02
BF
737 spin_lock(&clp->cl_lock);
738 if (!list_empty(&c->cn_persession)) {
739 list_del(&c->cn_persession);
740 free_conn(c);
741 }
742 spin_unlock(&clp->cl_lock);
eea49806 743 nfsd4_probe_callback(clp);
19cf5c02 744}
ec6b5d7b 745
d29c374c 746static struct nfsd4_conn *alloc_conn(struct svc_rqst *rqstp, u32 flags)
c7662518 747{
c7662518 748 struct nfsd4_conn *conn;
ec6b5d7b 749
c7662518
BF
750 conn = kmalloc(sizeof(struct nfsd4_conn), GFP_KERNEL);
751 if (!conn)
db90681d 752 return NULL;
c7662518
BF
753 svc_xprt_get(rqstp->rq_xprt);
754 conn->cn_xprt = rqstp->rq_xprt;
d29c374c 755 conn->cn_flags = flags;
db90681d
BF
756 INIT_LIST_HEAD(&conn->cn_xpt_user.list);
757 return conn;
758}
a649637c 759
328ead28
BF
760static void __nfsd4_hash_conn(struct nfsd4_conn *conn, struct nfsd4_session *ses)
761{
762 conn->cn_session = ses;
763 list_add(&conn->cn_persession, &ses->se_conns);
ec6b5d7b
AA
764}
765
db90681d 766static void nfsd4_hash_conn(struct nfsd4_conn *conn, struct nfsd4_session *ses)
557ce264 767{
db90681d 768 struct nfs4_client *clp = ses->se_client;
557ce264 769
c7662518 770 spin_lock(&clp->cl_lock);
328ead28 771 __nfsd4_hash_conn(conn, ses);
c7662518 772 spin_unlock(&clp->cl_lock);
557ce264
AA
773}
774
21b75b01 775static int nfsd4_register_conn(struct nfsd4_conn *conn)
efe0cb6d 776{
19cf5c02 777 conn->cn_xpt_user.callback = nfsd4_conn_lost;
21b75b01 778 return register_xpt_user(conn->cn_xprt, &conn->cn_xpt_user);
efe0cb6d
BF
779}
780
1d1bc8f2 781static __be32 nfsd4_new_conn(struct svc_rqst *rqstp, struct nfsd4_session *ses, u32 dir)
ec6b5d7b 782{
db90681d 783 struct nfsd4_conn *conn;
21b75b01 784 int ret;
ec6b5d7b 785
1d1bc8f2 786 conn = alloc_conn(rqstp, dir);
db90681d
BF
787 if (!conn)
788 return nfserr_jukebox;
789 nfsd4_hash_conn(conn, ses);
21b75b01
BF
790 ret = nfsd4_register_conn(conn);
791 if (ret)
792 /* oops; xprt is already down: */
793 nfsd4_conn_lost(&conn->cn_xpt_user);
c7662518
BF
794 return nfs_ok;
795}
ec6b5d7b 796
1d1bc8f2
BF
797static __be32 nfsd4_new_conn_from_crses(struct svc_rqst *rqstp, struct nfsd4_session *ses)
798{
799 u32 dir = NFS4_CDFC4_FORE;
800
801 if (ses->se_flags & SESSION4_BACK_CHAN)
802 dir |= NFS4_CDFC4_BACK;
803
804 return nfsd4_new_conn(rqstp, ses, dir);
805}
806
807/* must be called under client_lock */
19cf5c02 808static void nfsd4_del_conns(struct nfsd4_session *s)
c7662518 809{
19cf5c02
BF
810 struct nfs4_client *clp = s->se_client;
811 struct nfsd4_conn *c;
ec6b5d7b 812
19cf5c02
BF
813 spin_lock(&clp->cl_lock);
814 while (!list_empty(&s->se_conns)) {
815 c = list_first_entry(&s->se_conns, struct nfsd4_conn, cn_persession);
816 list_del_init(&c->cn_persession);
817 spin_unlock(&clp->cl_lock);
557ce264 818
19cf5c02
BF
819 unregister_xpt_user(c->cn_xprt, &c->cn_xpt_user);
820 free_conn(c);
ec6b5d7b 821
19cf5c02
BF
822 spin_lock(&clp->cl_lock);
823 }
824 spin_unlock(&clp->cl_lock);
c7662518 825}
ec6b5d7b 826
c7662518
BF
827void free_session(struct kref *kref)
828{
829 struct nfsd4_session *ses;
830 int mem;
831
832 ses = container_of(kref, struct nfsd4_session, se_ref);
19cf5c02 833 nfsd4_del_conns(ses);
c7662518
BF
834 spin_lock(&nfsd_drc_lock);
835 mem = ses->se_fchannel.maxreqs * slot_bytes(&ses->se_fchannel);
836 nfsd_drc_mem_used -= mem;
837 spin_unlock(&nfsd_drc_lock);
838 free_session_slots(ses);
839 kfree(ses);
840}
841
ac7c46f2 842static struct nfsd4_session *alloc_init_session(struct svc_rqst *rqstp, struct nfs4_client *clp, struct nfsd4_create_session *cses)
5b6feee9
BF
843{
844 struct nfsd4_session *new;
845 struct nfsd4_channel_attrs *fchan = &cses->fore_channel;
846 int numslots, slotsize;
c7662518 847 int status;
5b6feee9
BF
848 int idx;
849
850 /*
851 * Note decreasing slot size below client's request may
852 * make it difficult for client to function correctly, whereas
853 * decreasing the number of slots will (just?) affect
854 * performance. When short on memory we therefore prefer to
855 * decrease number of slots instead of their size.
856 */
857 slotsize = nfsd4_sanitize_slot_size(fchan->maxresp_cached);
858 numslots = nfsd4_get_drc_mem(slotsize, fchan->maxreqs);
ced6dfe9
MJ
859 if (numslots < 1)
860 return NULL;
5b6feee9
BF
861
862 new = alloc_session(slotsize, numslots);
863 if (!new) {
864 nfsd4_put_drc_mem(slotsize, fchan->maxreqs);
ac7c46f2 865 return NULL;
557ce264 866 }
5b6feee9 867 init_forechannel_attrs(&new->se_fchannel, fchan, numslots, slotsize);
557ce264 868
ec6b5d7b
AA
869 new->se_client = clp;
870 gen_sessionid(new);
ec6b5d7b 871
c7662518
BF
872 INIT_LIST_HEAD(&new->se_conns);
873
ac7c46f2 874 new->se_cb_seq_nr = 1;
ec6b5d7b 875 new->se_flags = cses->flags;
8b5ce5cd 876 new->se_cb_prog = cses->callback_prog;
ec6b5d7b 877 kref_init(&new->se_ref);
5b6feee9 878 idx = hash_sessionid(&new->se_sessionid);
9089f1b4 879 spin_lock(&client_lock);
ec6b5d7b 880 list_add(&new->se_hash, &sessionid_hashtbl[idx]);
4c649378 881 spin_lock(&clp->cl_lock);
ec6b5d7b 882 list_add(&new->se_perclnt, &clp->cl_sessions);
4c649378 883 spin_unlock(&clp->cl_lock);
9089f1b4 884 spin_unlock(&client_lock);
ec6b5d7b 885
1d1bc8f2 886 status = nfsd4_new_conn_from_crses(rqstp, new);
ac7c46f2 887 /* whoops: benny points out, status is ignored! (err, or bogus) */
c7662518
BF
888 if (status) {
889 free_session(&new->se_ref);
ac7c46f2 890 return NULL;
c7662518 891 }
dcbeaa68 892 if (cses->flags & SESSION4_BACK_CHAN) {
edd76786 893 struct sockaddr *sa = svc_addr(rqstp);
dcbeaa68
BF
894 /*
895 * This is a little silly; with sessions there's no real
896 * use for the callback address. Use the peer address
897 * as a reasonable default for now, but consider fixing
898 * the rpc client not to require an address in the
899 * future:
900 */
edd76786
BF
901 rpc_copy_addr((struct sockaddr *)&clp->cl_cb_conn.cb_addr, sa);
902 clp->cl_cb_conn.cb_addrlen = svc_addr_len(sa);
edd76786 903 }
dcbeaa68 904 nfsd4_probe_callback(clp);
ac7c46f2 905 return new;
ec6b5d7b
AA
906}
907
9089f1b4 908/* caller must hold client_lock */
5282fd72
ME
909static struct nfsd4_session *
910find_in_sessionid_hashtbl(struct nfs4_sessionid *sessionid)
911{
912 struct nfsd4_session *elem;
913 int idx;
914
915 dump_sessionid(__func__, sessionid);
916 idx = hash_sessionid(sessionid);
5282fd72
ME
917 /* Search in the appropriate list */
918 list_for_each_entry(elem, &sessionid_hashtbl[idx], se_hash) {
5282fd72
ME
919 if (!memcmp(elem->se_sessionid.data, sessionid->data,
920 NFS4_MAX_SESSIONID_LEN)) {
921 return elem;
922 }
923 }
924
925 dprintk("%s: session not found\n", __func__);
926 return NULL;
927}
928
9089f1b4 929/* caller must hold client_lock */
7116ed6b 930static void
5282fd72 931unhash_session(struct nfsd4_session *ses)
7116ed6b
AA
932{
933 list_del(&ses->se_hash);
4c649378 934 spin_lock(&ses->se_client->cl_lock);
7116ed6b 935 list_del(&ses->se_perclnt);
4c649378 936 spin_unlock(&ses->se_client->cl_lock);
5282fd72
ME
937}
938
36acb66b 939/* must be called under the client_lock */
1da177e4 940static inline void
36acb66b 941renew_client_locked(struct nfs4_client *clp)
1da177e4 942{
07cd4909
BH
943 if (is_client_expired(clp)) {
944 dprintk("%s: client (clientid %08x/%08x) already expired\n",
945 __func__,
946 clp->cl_clientid.cl_boot,
947 clp->cl_clientid.cl_id);
948 return;
949 }
950
1da177e4
LT
951 dprintk("renewing client (clientid %08x/%08x)\n",
952 clp->cl_clientid.cl_boot,
953 clp->cl_clientid.cl_id);
954 list_move_tail(&clp->cl_lru, &client_lru);
955 clp->cl_time = get_seconds();
956}
957
36acb66b
BH
958static inline void
959renew_client(struct nfs4_client *clp)
960{
961 spin_lock(&client_lock);
962 renew_client_locked(clp);
963 spin_unlock(&client_lock);
964}
965
1da177e4
LT
966/* SETCLIENTID and SETCLIENTID_CONFIRM Helper functions */
967static int
968STALE_CLIENTID(clientid_t *clid)
969{
970 if (clid->cl_boot == boot_time)
971 return 0;
60adfc50
AA
972 dprintk("NFSD stale clientid (%08x/%08x) boot_time %08lx\n",
973 clid->cl_boot, clid->cl_id, boot_time);
1da177e4
LT
974 return 1;
975}
976
977/*
978 * XXX Should we use a slab cache ?
979 * This type of memory management is somewhat inefficient, but we use it
980 * anyway since SETCLIENTID is not a common operation.
981 */
35bba9a3 982static struct nfs4_client *alloc_client(struct xdr_netobj name)
1da177e4
LT
983{
984 struct nfs4_client *clp;
985
35bba9a3
BF
986 clp = kzalloc(sizeof(struct nfs4_client), GFP_KERNEL);
987 if (clp == NULL)
988 return NULL;
989 clp->cl_name.data = kmalloc(name.len, GFP_KERNEL);
990 if (clp->cl_name.data == NULL) {
991 kfree(clp);
992 return NULL;
1da177e4 993 }
35bba9a3
BF
994 memcpy(clp->cl_name.data, name.data, name.len);
995 clp->cl_name.len = name.len;
1da177e4
LT
996 return clp;
997}
998
999static inline void
1000free_client(struct nfs4_client *clp)
1001{
792c95dd
BF
1002 while (!list_empty(&clp->cl_sessions)) {
1003 struct nfsd4_session *ses;
1004 ses = list_entry(clp->cl_sessions.next, struct nfsd4_session,
1005 se_perclnt);
1006 list_del(&ses->se_perclnt);
1007 nfsd4_put_session(ses);
1008 }
1da177e4
LT
1009 if (clp->cl_cred.cr_group_info)
1010 put_group_info(clp->cl_cred.cr_group_info);
68e76ad0 1011 kfree(clp->cl_principal);
1da177e4
LT
1012 kfree(clp->cl_name.data);
1013 kfree(clp);
1014}
1015
d7682988
BH
1016void
1017release_session_client(struct nfsd4_session *session)
1018{
1019 struct nfs4_client *clp = session->se_client;
1020
1021 if (!atomic_dec_and_lock(&clp->cl_refcount, &client_lock))
1022 return;
1023 if (is_client_expired(clp)) {
1024 free_client(clp);
1025 session->se_client = NULL;
1026 } else
1027 renew_client_locked(clp);
1028 spin_unlock(&client_lock);
d7682988
BH
1029}
1030
84d38ac9
BH
1031/* must be called under the client_lock */
1032static inline void
1033unhash_client_locked(struct nfs4_client *clp)
1034{
792c95dd
BF
1035 struct nfsd4_session *ses;
1036
07cd4909 1037 mark_client_expired(clp);
84d38ac9 1038 list_del(&clp->cl_lru);
4c649378 1039 spin_lock(&clp->cl_lock);
792c95dd
BF
1040 list_for_each_entry(ses, &clp->cl_sessions, se_perclnt)
1041 list_del_init(&ses->se_hash);
4c649378 1042 spin_unlock(&clp->cl_lock);
84d38ac9
BH
1043}
1044
1da177e4
LT
1045static void
1046expire_client(struct nfs4_client *clp)
1047{
fe0750e5 1048 struct nfs4_openowner *oo;
1da177e4 1049 struct nfs4_delegation *dp;
1da177e4
LT
1050 struct list_head reaplist;
1051
1da177e4
LT
1052 INIT_LIST_HEAD(&reaplist);
1053 spin_lock(&recall_lock);
ea1da636
N
1054 while (!list_empty(&clp->cl_delegations)) {
1055 dp = list_entry(clp->cl_delegations.next, struct nfs4_delegation, dl_perclnt);
ea1da636 1056 list_del_init(&dp->dl_perclnt);
1da177e4
LT
1057 list_move(&dp->dl_recall_lru, &reaplist);
1058 }
1059 spin_unlock(&recall_lock);
1060 while (!list_empty(&reaplist)) {
1061 dp = list_entry(reaplist.next, struct nfs4_delegation, dl_recall_lru);
1062 list_del_init(&dp->dl_recall_lru);
1063 unhash_delegation(dp);
1064 }
ea1da636 1065 while (!list_empty(&clp->cl_openowners)) {
fe0750e5
BF
1066 oo = list_entry(clp->cl_openowners.next, struct nfs4_openowner, oo_perclient);
1067 release_openowner(oo);
1da177e4 1068 }
6ff8da08 1069 nfsd4_shutdown_callback(clp);
84d38ac9
BH
1070 if (clp->cl_cb_conn.cb_xprt)
1071 svc_xprt_put(clp->cl_cb_conn.cb_xprt);
36acb66b
BH
1072 list_del(&clp->cl_idhash);
1073 list_del(&clp->cl_strhash);
be1fdf6c 1074 spin_lock(&client_lock);
84d38ac9 1075 unhash_client_locked(clp);
46583e25
BH
1076 if (atomic_read(&clp->cl_refcount) == 0)
1077 free_client(clp);
be1fdf6c 1078 spin_unlock(&client_lock);
1da177e4
LT
1079}
1080
35bba9a3
BF
1081static void copy_verf(struct nfs4_client *target, nfs4_verifier *source)
1082{
1083 memcpy(target->cl_verifier.data, source->data,
1084 sizeof(target->cl_verifier.data));
1da177e4
LT
1085}
1086
35bba9a3
BF
1087static void copy_clid(struct nfs4_client *target, struct nfs4_client *source)
1088{
1da177e4
LT
1089 target->cl_clientid.cl_boot = source->cl_clientid.cl_boot;
1090 target->cl_clientid.cl_id = source->cl_clientid.cl_id;
1091}
1092
35bba9a3
BF
1093static void copy_cred(struct svc_cred *target, struct svc_cred *source)
1094{
1da177e4
LT
1095 target->cr_uid = source->cr_uid;
1096 target->cr_gid = source->cr_gid;
1097 target->cr_group_info = source->cr_group_info;
1098 get_group_info(target->cr_group_info);
1099}
1100
35bba9a3 1101static int same_name(const char *n1, const char *n2)
599e0a22 1102{
a55370a3 1103 return 0 == memcmp(n1, n2, HEXDIR_LEN);
1da177e4
LT
1104}
1105
1106static int
599e0a22
BF
1107same_verf(nfs4_verifier *v1, nfs4_verifier *v2)
1108{
1109 return 0 == memcmp(v1->data, v2->data, sizeof(v1->data));
1da177e4
LT
1110}
1111
1112static int
599e0a22
BF
1113same_clid(clientid_t *cl1, clientid_t *cl2)
1114{
1115 return (cl1->cl_boot == cl2->cl_boot) && (cl1->cl_id == cl2->cl_id);
1da177e4
LT
1116}
1117
1118/* XXX what about NGROUP */
1119static int
599e0a22
BF
1120same_creds(struct svc_cred *cr1, struct svc_cred *cr2)
1121{
1122 return cr1->cr_uid == cr2->cr_uid;
1da177e4
LT
1123}
1124
5ec7b46c
BF
1125static void gen_clid(struct nfs4_client *clp)
1126{
1127 static u32 current_clientid = 1;
1128
1da177e4
LT
1129 clp->cl_clientid.cl_boot = boot_time;
1130 clp->cl_clientid.cl_id = current_clientid++;
1131}
1132
deda2faa
BF
1133static void gen_confirm(struct nfs4_client *clp)
1134{
1135 static u32 i;
1136 u32 *p;
1da177e4 1137
1da177e4 1138 p = (u32 *)clp->cl_confirm.data;
deda2faa
BF
1139 *p++ = get_seconds();
1140 *p++ = i++;
1da177e4
LT
1141}
1142
38c2f4b1 1143static struct nfs4_stid *find_stateid(struct nfs4_client *cl, stateid_t *t)
4581d140 1144{
38c2f4b1 1145 return idr_find(&cl->cl_stateids, t->si_opaque.so_id);
4d71ab87
BF
1146}
1147
38c2f4b1 1148static struct nfs4_stid *find_stateid_by_type(struct nfs4_client *cl, stateid_t *t, char typemask)
f459e453
BF
1149{
1150 struct nfs4_stid *s;
4d71ab87 1151
38c2f4b1 1152 s = find_stateid(cl, t);
4d71ab87
BF
1153 if (!s)
1154 return NULL;
f459e453 1155 if (typemask & s->sc_type)
4581d140 1156 return s;
4581d140
BF
1157 return NULL;
1158}
1159
b09333c4
RL
1160static struct nfs4_client *create_client(struct xdr_netobj name, char *recdir,
1161 struct svc_rqst *rqstp, nfs4_verifier *verf)
1162{
1163 struct nfs4_client *clp;
1164 struct sockaddr *sa = svc_addr(rqstp);
1165 char *princ;
1166
1167 clp = alloc_client(name);
1168 if (clp == NULL)
1169 return NULL;
1170
792c95dd
BF
1171 INIT_LIST_HEAD(&clp->cl_sessions);
1172
b09333c4
RL
1173 princ = svc_gss_principal(rqstp);
1174 if (princ) {
1175 clp->cl_principal = kstrdup(princ, GFP_KERNEL);
1176 if (clp->cl_principal == NULL) {
1177 free_client(clp);
1178 return NULL;
1179 }
1180 }
1181
38c2f4b1 1182 idr_init(&clp->cl_stateids);
b09333c4 1183 memcpy(clp->cl_recdir, recdir, HEXDIR_LEN);
46583e25 1184 atomic_set(&clp->cl_refcount, 0);
77a3569d 1185 clp->cl_cb_state = NFSD4_CB_UNKNOWN;
b09333c4
RL
1186 INIT_LIST_HEAD(&clp->cl_idhash);
1187 INIT_LIST_HEAD(&clp->cl_strhash);
1188 INIT_LIST_HEAD(&clp->cl_openowners);
1189 INIT_LIST_HEAD(&clp->cl_delegations);
b09333c4 1190 INIT_LIST_HEAD(&clp->cl_lru);
5ce8ba25 1191 INIT_LIST_HEAD(&clp->cl_callbacks);
6ff8da08 1192 spin_lock_init(&clp->cl_lock);
cee277d9 1193 INIT_WORK(&clp->cl_cb_null.cb_work, nfsd4_do_callback_rpc);
07cd4909 1194 clp->cl_time = get_seconds();
b09333c4
RL
1195 clear_bit(0, &clp->cl_cb_slot_busy);
1196 rpc_init_wait_queue(&clp->cl_cb_waitq, "Backchannel slot table");
1197 copy_verf(clp, verf);
1198 rpc_copy_addr((struct sockaddr *) &clp->cl_addr, sa);
1199 clp->cl_flavor = rqstp->rq_flavor;
1200 copy_cred(&clp->cl_cred, &rqstp->rq_cred);
1201 gen_confirm(clp);
edd76786 1202 clp->cl_cb_session = NULL;
b09333c4
RL
1203 return clp;
1204}
1205
fd39ca9a 1206static void
1da177e4
LT
1207add_to_unconfirmed(struct nfs4_client *clp, unsigned int strhashval)
1208{
1209 unsigned int idhashval;
1210
1211 list_add(&clp->cl_strhash, &unconf_str_hashtbl[strhashval]);
1212 idhashval = clientid_hashval(clp->cl_clientid.cl_id);
1213 list_add(&clp->cl_idhash, &unconf_id_hashtbl[idhashval]);
36acb66b 1214 renew_client(clp);
1da177e4
LT
1215}
1216
fd39ca9a 1217static void
1da177e4
LT
1218move_to_confirmed(struct nfs4_client *clp)
1219{
1220 unsigned int idhashval = clientid_hashval(clp->cl_clientid.cl_id);
1221 unsigned int strhashval;
1222
1223 dprintk("NFSD: move_to_confirm nfs4_client %p\n", clp);
f116629d 1224 list_move(&clp->cl_idhash, &conf_id_hashtbl[idhashval]);
a55370a3 1225 strhashval = clientstr_hashval(clp->cl_recdir);
328efbab 1226 list_move(&clp->cl_strhash, &conf_str_hashtbl[strhashval]);
1da177e4
LT
1227 renew_client(clp);
1228}
1229
1230static struct nfs4_client *
1231find_confirmed_client(clientid_t *clid)
1232{
1233 struct nfs4_client *clp;
1234 unsigned int idhashval = clientid_hashval(clid->cl_id);
1235
1236 list_for_each_entry(clp, &conf_id_hashtbl[idhashval], cl_idhash) {
a50d2ad1
BF
1237 if (same_clid(&clp->cl_clientid, clid)) {
1238 renew_client(clp);
1da177e4 1239 return clp;
a50d2ad1 1240 }
1da177e4
LT
1241 }
1242 return NULL;
1243}
1244
1245static struct nfs4_client *
1246find_unconfirmed_client(clientid_t *clid)
1247{
1248 struct nfs4_client *clp;
1249 unsigned int idhashval = clientid_hashval(clid->cl_id);
1250
1251 list_for_each_entry(clp, &unconf_id_hashtbl[idhashval], cl_idhash) {
599e0a22 1252 if (same_clid(&clp->cl_clientid, clid))
1da177e4
LT
1253 return clp;
1254 }
1255 return NULL;
1256}
1257
6e5f15c9 1258static bool clp_used_exchangeid(struct nfs4_client *clp)
a1bcecd2 1259{
6e5f15c9 1260 return clp->cl_exchange_flags != 0;
e203d506 1261}
a1bcecd2 1262
28ce6054 1263static struct nfs4_client *
e203d506 1264find_confirmed_client_by_str(const char *dname, unsigned int hashval)
28ce6054
N
1265{
1266 struct nfs4_client *clp;
1267
1268 list_for_each_entry(clp, &conf_str_hashtbl[hashval], cl_strhash) {
e203d506 1269 if (same_name(clp->cl_recdir, dname))
28ce6054
N
1270 return clp;
1271 }
1272 return NULL;
1273}
1274
1275static struct nfs4_client *
e203d506 1276find_unconfirmed_client_by_str(const char *dname, unsigned int hashval)
28ce6054
N
1277{
1278 struct nfs4_client *clp;
1279
1280 list_for_each_entry(clp, &unconf_str_hashtbl[hashval], cl_strhash) {
e203d506 1281 if (same_name(clp->cl_recdir, dname))
28ce6054
N
1282 return clp;
1283 }
1284 return NULL;
1285}
1286
fd39ca9a 1287static void
6f3d772f 1288gen_callback(struct nfs4_client *clp, struct nfsd4_setclientid *se, struct svc_rqst *rqstp)
1da177e4 1289{
07263f1e 1290 struct nfs4_cb_conn *conn = &clp->cl_cb_conn;
6f3d772f
TU
1291 struct sockaddr *sa = svc_addr(rqstp);
1292 u32 scopeid = rpc_get_scope_id(sa);
7077ecba
JL
1293 unsigned short expected_family;
1294
1295 /* Currently, we only support tcp and tcp6 for the callback channel */
1296 if (se->se_callback_netid_len == 3 &&
1297 !memcmp(se->se_callback_netid_val, "tcp", 3))
1298 expected_family = AF_INET;
1299 else if (se->se_callback_netid_len == 4 &&
1300 !memcmp(se->se_callback_netid_val, "tcp6", 4))
1301 expected_family = AF_INET6;
1302 else
1da177e4
LT
1303 goto out_err;
1304
07263f1e 1305 conn->cb_addrlen = rpc_uaddr2sockaddr(se->se_callback_addr_val,
aa9a4ec7 1306 se->se_callback_addr_len,
07263f1e
BF
1307 (struct sockaddr *)&conn->cb_addr,
1308 sizeof(conn->cb_addr));
aa9a4ec7 1309
07263f1e 1310 if (!conn->cb_addrlen || conn->cb_addr.ss_family != expected_family)
1da177e4 1311 goto out_err;
aa9a4ec7 1312
07263f1e
BF
1313 if (conn->cb_addr.ss_family == AF_INET6)
1314 ((struct sockaddr_in6 *)&conn->cb_addr)->sin6_scope_id = scopeid;
fbf4665f 1315
07263f1e
BF
1316 conn->cb_prog = se->se_callback_prog;
1317 conn->cb_ident = se->se_callback_ident;
849a1cf1 1318 memcpy(&conn->cb_saddr, &rqstp->rq_daddr, rqstp->rq_daddrlen);
1da177e4
LT
1319 return;
1320out_err:
07263f1e
BF
1321 conn->cb_addr.ss_family = AF_UNSPEC;
1322 conn->cb_addrlen = 0;
849823c5 1323 dprintk(KERN_INFO "NFSD: this client (clientid %08x/%08x) "
1da177e4
LT
1324 "will not receive delegations\n",
1325 clp->cl_clientid.cl_boot, clp->cl_clientid.cl_id);
1326
1da177e4
LT
1327 return;
1328}
1329
074fe897 1330/*
557ce264 1331 * Cache a reply. nfsd4_check_drc_limit() has bounded the cache size.
074fe897 1332 */
074fe897
AA
1333void
1334nfsd4_store_cache_entry(struct nfsd4_compoundres *resp)
074fe897 1335{
557ce264
AA
1336 struct nfsd4_slot *slot = resp->cstate.slot;
1337 unsigned int base;
074fe897 1338
557ce264 1339 dprintk("--> %s slot %p\n", __func__, slot);
074fe897 1340
557ce264
AA
1341 slot->sl_opcnt = resp->opcnt;
1342 slot->sl_status = resp->cstate.status;
074fe897 1343
bf864a31 1344 if (nfsd4_not_cached(resp)) {
557ce264 1345 slot->sl_datalen = 0;
bf864a31 1346 return;
074fe897 1347 }
557ce264
AA
1348 slot->sl_datalen = (char *)resp->p - (char *)resp->cstate.datap;
1349 base = (char *)resp->cstate.datap -
1350 (char *)resp->xbuf->head[0].iov_base;
1351 if (read_bytes_from_xdr_buf(resp->xbuf, base, slot->sl_data,
1352 slot->sl_datalen))
1353 WARN("%s: sessions DRC could not cache compound\n", __func__);
1354 return;
074fe897
AA
1355}
1356
1357/*
abfabf8c
AA
1358 * Encode the replay sequence operation from the slot values.
1359 * If cachethis is FALSE encode the uncached rep error on the next
1360 * operation which sets resp->p and increments resp->opcnt for
1361 * nfs4svc_encode_compoundres.
074fe897 1362 *
074fe897 1363 */
abfabf8c
AA
1364static __be32
1365nfsd4_enc_sequence_replay(struct nfsd4_compoundargs *args,
1366 struct nfsd4_compoundres *resp)
074fe897 1367{
abfabf8c
AA
1368 struct nfsd4_op *op;
1369 struct nfsd4_slot *slot = resp->cstate.slot;
bf864a31 1370
abfabf8c 1371 dprintk("--> %s resp->opcnt %d cachethis %u \n", __func__,
557ce264 1372 resp->opcnt, resp->cstate.slot->sl_cachethis);
bf864a31 1373
abfabf8c
AA
1374 /* Encode the replayed sequence operation */
1375 op = &args->ops[resp->opcnt - 1];
1376 nfsd4_encode_operation(resp, op);
bf864a31 1377
abfabf8c 1378 /* Return nfserr_retry_uncached_rep in next operation. */
557ce264 1379 if (args->opcnt > 1 && slot->sl_cachethis == 0) {
abfabf8c
AA
1380 op = &args->ops[resp->opcnt++];
1381 op->status = nfserr_retry_uncached_rep;
1382 nfsd4_encode_operation(resp, op);
074fe897 1383 }
abfabf8c 1384 return op->status;
074fe897
AA
1385}
1386
1387/*
557ce264
AA
1388 * The sequence operation is not cached because we can use the slot and
1389 * session values.
074fe897
AA
1390 */
1391__be32
bf864a31
AA
1392nfsd4_replay_cache_entry(struct nfsd4_compoundres *resp,
1393 struct nfsd4_sequence *seq)
074fe897 1394{
557ce264 1395 struct nfsd4_slot *slot = resp->cstate.slot;
074fe897
AA
1396 __be32 status;
1397
557ce264 1398 dprintk("--> %s slot %p\n", __func__, slot);
074fe897 1399
abfabf8c
AA
1400 /* Either returns 0 or nfserr_retry_uncached */
1401 status = nfsd4_enc_sequence_replay(resp->rqstp->rq_argp, resp);
1402 if (status == nfserr_retry_uncached_rep)
1403 return status;
074fe897 1404
557ce264
AA
1405 /* The sequence operation has been encoded, cstate->datap set. */
1406 memcpy(resp->cstate.datap, slot->sl_data, slot->sl_datalen);
074fe897 1407
557ce264
AA
1408 resp->opcnt = slot->sl_opcnt;
1409 resp->p = resp->cstate.datap + XDR_QUADLEN(slot->sl_datalen);
1410 status = slot->sl_status;
074fe897
AA
1411
1412 return status;
1413}
1414
0733d213
AA
1415/*
1416 * Set the exchange_id flags returned by the server.
1417 */
1418static void
1419nfsd4_set_ex_flags(struct nfs4_client *new, struct nfsd4_exchange_id *clid)
1420{
1421 /* pNFS is not supported */
1422 new->cl_exchange_flags |= EXCHGID4_FLAG_USE_NON_PNFS;
1423
1424 /* Referrals are supported, Migration is not. */
1425 new->cl_exchange_flags |= EXCHGID4_FLAG_SUPP_MOVED_REFER;
1426
1427 /* set the wire flags to return to client. */
1428 clid->flags = new->cl_exchange_flags;
1429}
1430
069b6ad4
AA
1431__be32
1432nfsd4_exchange_id(struct svc_rqst *rqstp,
1433 struct nfsd4_compound_state *cstate,
1434 struct nfsd4_exchange_id *exid)
1435{
0733d213
AA
1436 struct nfs4_client *unconf, *conf, *new;
1437 int status;
1438 unsigned int strhashval;
1439 char dname[HEXDIR_LEN];
363168b4 1440 char addr_str[INET6_ADDRSTRLEN];
0733d213 1441 nfs4_verifier verf = exid->verifier;
363168b4 1442 struct sockaddr *sa = svc_addr(rqstp);
0733d213 1443
363168b4 1444 rpc_ntop(sa, addr_str, sizeof(addr_str));
0733d213 1445 dprintk("%s rqstp=%p exid=%p clname.len=%u clname.data=%p "
363168b4 1446 "ip_addr=%s flags %x, spa_how %d\n",
0733d213 1447 __func__, rqstp, exid, exid->clname.len, exid->clname.data,
363168b4 1448 addr_str, exid->flags, exid->spa_how);
0733d213 1449
a084daf5 1450 if (exid->flags & ~EXCHGID4_FLAG_MASK_A)
0733d213
AA
1451 return nfserr_inval;
1452
1453 /* Currently only support SP4_NONE */
1454 switch (exid->spa_how) {
1455 case SP4_NONE:
1456 break;
1457 case SP4_SSV:
044bc1d4 1458 return nfserr_serverfault;
0733d213
AA
1459 default:
1460 BUG(); /* checked by xdr code */
1461 case SP4_MACH_CRED:
1462 return nfserr_serverfault; /* no excuse :-/ */
1463 }
1464
1465 status = nfs4_make_rec_clidname(dname, &exid->clname);
1466
1467 if (status)
1468 goto error;
1469
1470 strhashval = clientstr_hashval(dname);
1471
1472 nfs4_lock_state();
1473 status = nfs_ok;
1474
e203d506 1475 conf = find_confirmed_client_by_str(dname, strhashval);
0733d213 1476 if (conf) {
e203d506
BF
1477 if (!clp_used_exchangeid(conf)) {
1478 status = nfserr_clid_inuse; /* XXX: ? */
1479 goto out;
1480 }
0733d213
AA
1481 if (!same_verf(&verf, &conf->cl_verifier)) {
1482 /* 18.35.4 case 8 */
1483 if (exid->flags & EXCHGID4_FLAG_UPD_CONFIRMED_REC_A) {
1484 status = nfserr_not_same;
1485 goto out;
1486 }
1487 /* Client reboot: destroy old state */
1488 expire_client(conf);
1489 goto out_new;
1490 }
1491 if (!same_creds(&conf->cl_cred, &rqstp->rq_cred)) {
1492 /* 18.35.4 case 9 */
1493 if (exid->flags & EXCHGID4_FLAG_UPD_CONFIRMED_REC_A) {
1494 status = nfserr_perm;
1495 goto out;
1496 }
1497 expire_client(conf);
1498 goto out_new;
1499 }
0733d213
AA
1500 /*
1501 * Set bit when the owner id and verifier map to an already
1502 * confirmed client id (18.35.3).
1503 */
1504 exid->flags |= EXCHGID4_FLAG_CONFIRMED_R;
1505
1506 /*
1507 * Falling into 18.35.4 case 2, possible router replay.
1508 * Leave confirmed record intact and return same result.
1509 */
1510 copy_verf(conf, &verf);
1511 new = conf;
1512 goto out_copy;
6ddbbbfe
MS
1513 }
1514
1515 /* 18.35.4 case 7 */
1516 if (exid->flags & EXCHGID4_FLAG_UPD_CONFIRMED_REC_A) {
1517 status = nfserr_noent;
1518 goto out;
0733d213
AA
1519 }
1520
e203d506 1521 unconf = find_unconfirmed_client_by_str(dname, strhashval);
0733d213
AA
1522 if (unconf) {
1523 /*
1524 * Possible retry or client restart. Per 18.35.4 case 4,
1525 * a new unconfirmed record should be generated regardless
1526 * of whether any properties have changed.
1527 */
1528 expire_client(unconf);
1529 }
1530
1531out_new:
1532 /* Normal case */
b09333c4 1533 new = create_client(exid->clname, dname, rqstp, &verf);
0733d213 1534 if (new == NULL) {
4731030d 1535 status = nfserr_jukebox;
0733d213
AA
1536 goto out;
1537 }
1538
0733d213 1539 gen_clid(new);
0733d213
AA
1540 add_to_unconfirmed(new, strhashval);
1541out_copy:
1542 exid->clientid.cl_boot = new->cl_clientid.cl_boot;
1543 exid->clientid.cl_id = new->cl_clientid.cl_id;
1544
38eb76a5 1545 exid->seqid = 1;
0733d213
AA
1546 nfsd4_set_ex_flags(new, exid);
1547
1548 dprintk("nfsd4_exchange_id seqid %d flags %x\n",
49557cc7 1549 new->cl_cs_slot.sl_seqid, new->cl_exchange_flags);
0733d213
AA
1550 status = nfs_ok;
1551
1552out:
1553 nfs4_unlock_state();
1554error:
1555 dprintk("nfsd4_exchange_id returns %d\n", ntohl(status));
1556 return status;
069b6ad4
AA
1557}
1558
b85d4c01 1559static int
88e588d5 1560check_slot_seqid(u32 seqid, u32 slot_seqid, int slot_inuse)
b85d4c01 1561{
88e588d5
AA
1562 dprintk("%s enter. seqid %d slot_seqid %d\n", __func__, seqid,
1563 slot_seqid);
b85d4c01
BH
1564
1565 /* The slot is in use, and no response has been sent. */
88e588d5
AA
1566 if (slot_inuse) {
1567 if (seqid == slot_seqid)
b85d4c01
BH
1568 return nfserr_jukebox;
1569 else
1570 return nfserr_seq_misordered;
1571 }
1572 /* Normal */
88e588d5 1573 if (likely(seqid == slot_seqid + 1))
b85d4c01
BH
1574 return nfs_ok;
1575 /* Replay */
88e588d5 1576 if (seqid == slot_seqid)
b85d4c01
BH
1577 return nfserr_replay_cache;
1578 /* Wraparound */
88e588d5 1579 if (seqid == 1 && (slot_seqid + 1) == 0)
b85d4c01
BH
1580 return nfs_ok;
1581 /* Misordered replay or misordered new request */
1582 return nfserr_seq_misordered;
1583}
1584
49557cc7
AA
1585/*
1586 * Cache the create session result into the create session single DRC
1587 * slot cache by saving the xdr structure. sl_seqid has been set.
1588 * Do this for solo or embedded create session operations.
1589 */
1590static void
1591nfsd4_cache_create_session(struct nfsd4_create_session *cr_ses,
1592 struct nfsd4_clid_slot *slot, int nfserr)
1593{
1594 slot->sl_status = nfserr;
1595 memcpy(&slot->sl_cr_ses, cr_ses, sizeof(*cr_ses));
1596}
1597
1598static __be32
1599nfsd4_replay_create_session(struct nfsd4_create_session *cr_ses,
1600 struct nfsd4_clid_slot *slot)
1601{
1602 memcpy(cr_ses, &slot->sl_cr_ses, sizeof(*cr_ses));
1603 return slot->sl_status;
1604}
1605
1b74c25b
MJ
/*
 * Minimum request size, in bytes, used to validate a fore channel's
 * maxreq_sz: the listed header words plus a SEQUENCE operation.
 */
#define NFSD_MIN_REQ_HDR_SEQ_SZ	((\
			2 * 2 + /* credential,verifier: AUTH_NULL, length 0 */ \
			1 +	/* MIN tag is length with zero, only length */ \
			3 +	/* version, opcount, opcode */ \
			XDR_QUADLEN(NFS4_MAX_SESSIONID_LEN) + \
				/* seqid, slotID, slotID, cache */ \
			4 ) * sizeof(__be32))

/*
 * Minimum response size, in bytes, used to validate a fore channel's
 * maxresp_sz: the listed header words plus a SEQUENCE result.
 */
#define NFSD_MIN_RESP_HDR_SEQ_SZ ((\
			2 +	/* verifier: AUTH_NULL, length 0 */\
			1 +	/* status */ \
			1 +	/* MIN tag is length with zero, only length */ \
			3 +	/* opcount, opcode, opstatus*/ \
			XDR_QUADLEN(NFS4_MAX_SESSIONID_LEN) + \
				/* seqid, slotID, slotID, slotID, status */ \
			5 ) * sizeof(__be32))
1622
1623static __be32 check_forechannel_attrs(struct nfsd4_channel_attrs fchannel)
1624{
1625 return fchannel.maxreq_sz < NFSD_MIN_REQ_HDR_SEQ_SZ
1626 || fchannel.maxresp_sz < NFSD_MIN_RESP_HDR_SEQ_SZ;
1627}
1628
069b6ad4
AA
1629__be32
1630nfsd4_create_session(struct svc_rqst *rqstp,
1631 struct nfsd4_compound_state *cstate,
1632 struct nfsd4_create_session *cr_ses)
1633{
363168b4 1634 struct sockaddr *sa = svc_addr(rqstp);
ec6b5d7b 1635 struct nfs4_client *conf, *unconf;
ac7c46f2 1636 struct nfsd4_session *new;
49557cc7 1637 struct nfsd4_clid_slot *cs_slot = NULL;
86c3e16c 1638 bool confirm_me = false;
ec6b5d7b
AA
1639 int status = 0;
1640
a62573dc
MJ
1641 if (cr_ses->flags & ~SESSION4_FLAG_MASK_A)
1642 return nfserr_inval;
1643
ec6b5d7b
AA
1644 nfs4_lock_state();
1645 unconf = find_unconfirmed_client(&cr_ses->clientid);
1646 conf = find_confirmed_client(&cr_ses->clientid);
1647
1648 if (conf) {
49557cc7
AA
1649 cs_slot = &conf->cl_cs_slot;
1650 status = check_slot_seqid(cr_ses->seqid, cs_slot->sl_seqid, 0);
38eb76a5 1651 if (status == nfserr_replay_cache) {
ec6b5d7b 1652 dprintk("Got a create_session replay! seqid= %d\n",
49557cc7 1653 cs_slot->sl_seqid);
38eb76a5 1654 /* Return the cached reply status */
49557cc7 1655 status = nfsd4_replay_create_session(cr_ses, cs_slot);
38eb76a5 1656 goto out;
49557cc7 1657 } else if (cr_ses->seqid != cs_slot->sl_seqid + 1) {
ec6b5d7b
AA
1658 status = nfserr_seq_misordered;
1659 dprintk("Sequence misordered!\n");
1660 dprintk("Expected seqid= %d but got seqid= %d\n",
49557cc7 1661 cs_slot->sl_seqid, cr_ses->seqid);
ec6b5d7b
AA
1662 goto out;
1663 }
ec6b5d7b
AA
1664 } else if (unconf) {
1665 if (!same_creds(&unconf->cl_cred, &rqstp->rq_cred) ||
363168b4 1666 !rpc_cmp_addr(sa, (struct sockaddr *) &unconf->cl_addr)) {
ec6b5d7b
AA
1667 status = nfserr_clid_inuse;
1668 goto out;
1669 }
1670
49557cc7
AA
1671 cs_slot = &unconf->cl_cs_slot;
1672 status = check_slot_seqid(cr_ses->seqid, cs_slot->sl_seqid, 0);
38eb76a5
AA
1673 if (status) {
1674 /* an unconfirmed replay returns misordered */
ec6b5d7b 1675 status = nfserr_seq_misordered;
cd5b8144 1676 goto out;
ec6b5d7b
AA
1677 }
1678
86c3e16c 1679 confirm_me = true;
ec6b5d7b
AA
1680 conf = unconf;
1681 } else {
1682 status = nfserr_stale_clientid;
1683 goto out;
1684 }
1685
8323c3b2
BF
1686 /*
1687 * XXX: we should probably set this at creation time, and check
1688 * for consistent minorversion use throughout:
1689 */
1690 conf->cl_minorversion = 1;
408b79bc
BF
1691 /*
1692 * We do not support RDMA or persistent sessions
1693 */
1694 cr_ses->flags &= ~SESSION4_PERSIST;
1695 cr_ses->flags &= ~SESSION4_RDMA;
1696
1b74c25b
MJ
1697 status = nfserr_toosmall;
1698 if (check_forechannel_attrs(cr_ses->fore_channel))
1699 goto out;
1700
ac7c46f2
BF
1701 status = nfserr_jukebox;
1702 new = alloc_init_session(rqstp, conf, cr_ses);
1703 if (!new)
ec6b5d7b 1704 goto out;
ac7c46f2
BF
1705 status = nfs_ok;
1706 memcpy(cr_ses->sessionid.data, new->se_sessionid.data,
ec6b5d7b 1707 NFS4_MAX_SESSIONID_LEN);
12050657
MJ
1708 memcpy(&cr_ses->fore_channel, &new->se_fchannel,
1709 sizeof(struct nfsd4_channel_attrs));
86c3e16c 1710 cs_slot->sl_seqid++;
49557cc7 1711 cr_ses->seqid = cs_slot->sl_seqid;
ec6b5d7b 1712
49557cc7
AA
1713 /* cache solo and embedded create sessions under the state lock */
1714 nfsd4_cache_create_session(cr_ses, cs_slot, status);
86c3e16c
BF
1715 if (confirm_me)
1716 move_to_confirmed(conf);
ec6b5d7b
AA
1717out:
1718 nfs4_unlock_state();
1719 dprintk("%s returns %d\n", __func__, ntohl(status));
1720 return status;
069b6ad4
AA
1721}
1722
57716355
BF
1723static bool nfsd4_last_compound_op(struct svc_rqst *rqstp)
1724{
1725 struct nfsd4_compoundres *resp = rqstp->rq_resp;
1726 struct nfsd4_compoundargs *argp = rqstp->rq_argp;
1727
1728 return argp->opcnt == resp->opcnt;
1729}
1730
1d1bc8f2
BF
1731static __be32 nfsd4_map_bcts_dir(u32 *dir)
1732{
1733 switch (*dir) {
1734 case NFS4_CDFC4_FORE:
1735 case NFS4_CDFC4_BACK:
1736 return nfs_ok;
1737 case NFS4_CDFC4_FORE_OR_BOTH:
1738 case NFS4_CDFC4_BACK_OR_BOTH:
1739 *dir = NFS4_CDFC4_BOTH;
1740 return nfs_ok;
1741 };
1742 return nfserr_inval;
1743}
1744
1745__be32 nfsd4_bind_conn_to_session(struct svc_rqst *rqstp,
1746 struct nfsd4_compound_state *cstate,
1747 struct nfsd4_bind_conn_to_session *bcts)
1748{
1749 __be32 status;
1750
1751 if (!nfsd4_last_compound_op(rqstp))
1752 return nfserr_not_only_op;
1753 spin_lock(&client_lock);
1754 cstate->session = find_in_sessionid_hashtbl(&bcts->sessionid);
1755 /* Sorta weird: we only need the refcnt'ing because new_conn acquires
1756 * client_lock iself: */
1757 if (cstate->session) {
1758 nfsd4_get_session(cstate->session);
1759 atomic_inc(&cstate->session->se_client->cl_refcount);
1760 }
1761 spin_unlock(&client_lock);
1762 if (!cstate->session)
1763 return nfserr_badsession;
1764
1765 status = nfsd4_map_bcts_dir(&bcts->dir);
1db2b9dd
BS
1766 if (!status)
1767 nfsd4_new_conn(rqstp, cstate->session, bcts->dir);
1768 return status;
1d1bc8f2
BF
1769}
1770
5d4cec2f
BF
1771static bool nfsd4_compound_in_session(struct nfsd4_session *session, struct nfs4_sessionid *sid)
1772{
1773 if (!session)
1774 return 0;
1775 return !memcmp(sid, &session->se_sessionid, sizeof(*sid));
1776}
1777
069b6ad4
AA
1778__be32
1779nfsd4_destroy_session(struct svc_rqst *r,
1780 struct nfsd4_compound_state *cstate,
1781 struct nfsd4_destroy_session *sessionid)
1782{
e10e0cfc
BH
1783 struct nfsd4_session *ses;
1784 u32 status = nfserr_badsession;
1785
1786 /* Notes:
1787 * - The confirmed nfs4_client->cl_sessionid holds destroyed sessinid
1788 * - Should we return nfserr_back_chan_busy if waiting for
1789 * callbacks on to-be-destroyed session?
1790 * - Do we need to clear any callback info from previous session?
1791 */
1792
5d4cec2f 1793 if (nfsd4_compound_in_session(cstate->session, &sessionid->sessionid)) {
57716355
BF
1794 if (!nfsd4_last_compound_op(r))
1795 return nfserr_not_only_op;
1796 }
e10e0cfc 1797 dump_sessionid(__func__, &sessionid->sessionid);
9089f1b4 1798 spin_lock(&client_lock);
e10e0cfc
BH
1799 ses = find_in_sessionid_hashtbl(&sessionid->sessionid);
1800 if (!ses) {
9089f1b4 1801 spin_unlock(&client_lock);
e10e0cfc
BH
1802 goto out;
1803 }
1804
1805 unhash_session(ses);
9089f1b4 1806 spin_unlock(&client_lock);
e10e0cfc 1807
ab707e15 1808 nfs4_lock_state();
84f5f7cc 1809 nfsd4_probe_callback_sync(ses->se_client);
ab707e15 1810 nfs4_unlock_state();
19cf5c02
BF
1811
1812 nfsd4_del_conns(ses);
1813
e10e0cfc
BH
1814 nfsd4_put_session(ses);
1815 status = nfs_ok;
1816out:
1817 dprintk("%s returns %d\n", __func__, ntohl(status));
1818 return status;
069b6ad4
AA
1819}
1820
a663bdd8 1821static struct nfsd4_conn *__nfsd4_find_conn(struct svc_xprt *xpt, struct nfsd4_session *s)
328ead28
BF
1822{
1823 struct nfsd4_conn *c;
1824
1825 list_for_each_entry(c, &s->se_conns, cn_persession) {
a663bdd8 1826 if (c->cn_xprt == xpt) {
328ead28
BF
1827 return c;
1828 }
1829 }
1830 return NULL;
1831}
1832
a663bdd8 1833static void nfsd4_sequence_check_conn(struct nfsd4_conn *new, struct nfsd4_session *ses)
328ead28
BF
1834{
1835 struct nfs4_client *clp = ses->se_client;
a663bdd8 1836 struct nfsd4_conn *c;
21b75b01 1837 int ret;
328ead28
BF
1838
1839 spin_lock(&clp->cl_lock);
a663bdd8 1840 c = __nfsd4_find_conn(new->cn_xprt, ses);
328ead28
BF
1841 if (c) {
1842 spin_unlock(&clp->cl_lock);
1843 free_conn(new);
1844 return;
1845 }
1846 __nfsd4_hash_conn(new, ses);
1847 spin_unlock(&clp->cl_lock);
21b75b01
BF
1848 ret = nfsd4_register_conn(new);
1849 if (ret)
1850 /* oops; xprt is already down: */
1851 nfsd4_conn_lost(&new->cn_xpt_user);
328ead28
BF
1852 return;
1853}
1854
868b89c3
MJ
1855static bool nfsd4_session_too_many_ops(struct svc_rqst *rqstp, struct nfsd4_session *session)
1856{
1857 struct nfsd4_compoundargs *args = rqstp->rq_argp;
1858
1859 return args->opcnt > session->se_fchannel.maxops;
1860}
1861
ae82a8d0
MJ
1862static bool nfsd4_request_too_big(struct svc_rqst *rqstp,
1863 struct nfsd4_session *session)
1864{
1865 struct xdr_buf *xb = &rqstp->rq_arg;
1866
1867 return xb->len > session->se_fchannel.maxreq_sz;
1868}
1869
069b6ad4 1870__be32
b85d4c01 1871nfsd4_sequence(struct svc_rqst *rqstp,
069b6ad4
AA
1872 struct nfsd4_compound_state *cstate,
1873 struct nfsd4_sequence *seq)
1874{
f9bb94c4 1875 struct nfsd4_compoundres *resp = rqstp->rq_resp;
b85d4c01
BH
1876 struct nfsd4_session *session;
1877 struct nfsd4_slot *slot;
a663bdd8 1878 struct nfsd4_conn *conn;
b85d4c01
BH
1879 int status;
1880
f9bb94c4
AA
1881 if (resp->opcnt != 1)
1882 return nfserr_sequence_pos;
1883
a663bdd8
BF
1884 /*
1885 * Will be either used or freed by nfsd4_sequence_check_conn
1886 * below.
1887 */
1888 conn = alloc_conn(rqstp, NFS4_CDFC4_FORE);
1889 if (!conn)
1890 return nfserr_jukebox;
1891
9089f1b4 1892 spin_lock(&client_lock);
b85d4c01
BH
1893 status = nfserr_badsession;
1894 session = find_in_sessionid_hashtbl(&seq->sessionid);
1895 if (!session)
1896 goto out;
1897
868b89c3
MJ
1898 status = nfserr_too_many_ops;
1899 if (nfsd4_session_too_many_ops(rqstp, session))
1900 goto out;
1901
ae82a8d0
MJ
1902 status = nfserr_req_too_big;
1903 if (nfsd4_request_too_big(rqstp, session))
1904 goto out;
1905
b85d4c01 1906 status = nfserr_badslot;
6c18ba9f 1907 if (seq->slotid >= session->se_fchannel.maxreqs)
b85d4c01
BH
1908 goto out;
1909
557ce264 1910 slot = session->se_slots[seq->slotid];
b85d4c01
BH
1911 dprintk("%s: slotid %d\n", __func__, seq->slotid);
1912
a8dfdaeb
AA
1913 /* We do not negotiate the number of slots yet, so set the
1914 * maxslots to the session maxreqs which is used to encode
1915 * sr_highest_slotid and the sr_target_slot id to maxslots */
1916 seq->maxslots = session->se_fchannel.maxreqs;
1917
88e588d5 1918 status = check_slot_seqid(seq->seqid, slot->sl_seqid, slot->sl_inuse);
b85d4c01
BH
1919 if (status == nfserr_replay_cache) {
1920 cstate->slot = slot;
1921 cstate->session = session;
da3846a2 1922 /* Return the cached reply status and set cstate->status
557ce264 1923 * for nfsd4_proc_compound processing */
bf864a31 1924 status = nfsd4_replay_cache_entry(resp, seq);
da3846a2 1925 cstate->status = nfserr_replay_cache;
aaf84eb9 1926 goto out;
b85d4c01
BH
1927 }
1928 if (status)
1929 goto out;
1930
a663bdd8
BF
1931 nfsd4_sequence_check_conn(conn, session);
1932 conn = NULL;
328ead28 1933
b85d4c01
BH
1934 /* Success! bump slot seqid */
1935 slot->sl_inuse = true;
1936 slot->sl_seqid = seq->seqid;
557ce264 1937 slot->sl_cachethis = seq->cachethis;
b85d4c01
BH
1938
1939 cstate->slot = slot;
1940 cstate->session = session;
1941
b85d4c01 1942out:
26c0c75e 1943 /* Hold a session reference until done processing the compound. */
aaf84eb9 1944 if (cstate->session) {
0d7bb719
BF
1945 struct nfs4_client *clp = session->se_client;
1946
36acb66b 1947 nfsd4_get_session(cstate->session);
0d7bb719 1948 atomic_inc(&clp->cl_refcount);
5423732a
BH
1949 switch (clp->cl_cb_state) {
1950 case NFSD4_CB_DOWN:
fc0c3dd1 1951 seq->status_flags = SEQ4_STATUS_CB_PATH_DOWN;
5423732a
BH
1952 break;
1953 case NFSD4_CB_FAULT:
fc0c3dd1 1954 seq->status_flags = SEQ4_STATUS_BACKCHANNEL_FAULT;
5423732a 1955 break;
fc0c3dd1
BH
1956 default:
1957 seq->status_flags = 0;
5423732a 1958 }
aaf84eb9 1959 }
a663bdd8 1960 kfree(conn);
36acb66b 1961 spin_unlock(&client_lock);
b85d4c01
BH
1962 dprintk("%s: return %d\n", __func__, ntohl(status));
1963 return status;
069b6ad4
AA
1964}
1965
345c2842
MJ
1966static inline bool has_resources(struct nfs4_client *clp)
1967{
1968 return !list_empty(&clp->cl_openowners)
1969 || !list_empty(&clp->cl_delegations)
1970 || !list_empty(&clp->cl_sessions);
1971}
1972
1973__be32
1974nfsd4_destroy_clientid(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate, struct nfsd4_destroy_clientid *dc)
1975{
1976 struct nfs4_client *conf, *unconf, *clp;
1977 int status = 0;
1978
1979 nfs4_lock_state();
1980 unconf = find_unconfirmed_client(&dc->clientid);
1981 conf = find_confirmed_client(&dc->clientid);
1982
1983 if (conf) {
1984 clp = conf;
1985
1986 if (!is_client_expired(conf) && has_resources(conf)) {
1987 status = nfserr_clientid_busy;
1988 goto out;
1989 }
1990
1991 /* rfc5661 18.50.3 */
1992 if (cstate->session && conf == cstate->session->se_client) {
1993 status = nfserr_clientid_busy;
1994 goto out;
1995 }
1996 } else if (unconf)
1997 clp = unconf;
1998 else {
1999 status = nfserr_stale_clientid;
2000 goto out;
2001 }
2002
2003 expire_client(clp);
2004out:
2005 nfs4_unlock_state();
2006 dprintk("%s return %d\n", __func__, ntohl(status));
2007 return status;
2008}
2009
4dc6ec00
BF
2010__be32
2011nfsd4_reclaim_complete(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate, struct nfsd4_reclaim_complete *rc)
2012{
bcecf1cc
MJ
2013 int status = 0;
2014
4dc6ec00
BF
2015 if (rc->rca_one_fs) {
2016 if (!cstate->current_fh.fh_dentry)
2017 return nfserr_nofilehandle;
2018 /*
2019 * We don't take advantage of the rca_one_fs case.
2020 * That's OK, it's optional, we can safely ignore it.
2021 */
2022 return nfs_ok;
2023 }
bcecf1cc 2024
4dc6ec00 2025 nfs4_lock_state();
bcecf1cc
MJ
2026 status = nfserr_complete_already;
2027 if (cstate->session->se_client->cl_firststate)
2028 goto out;
2029
2030 status = nfserr_stale_clientid;
2031 if (is_client_expired(cstate->session->se_client))
4dc6ec00
BF
2032 /*
2033 * The following error isn't really legal.
2034 * But we only get here if the client just explicitly
2035 * destroyed the client. Surely it no longer cares what
2036 * error it gets back on an operation for the dead
2037 * client.
2038 */
bcecf1cc
MJ
2039 goto out;
2040
2041 status = nfs_ok;
4dc6ec00 2042 nfsd4_create_clid_dir(cstate->session->se_client);
bcecf1cc 2043out:
4dc6ec00 2044 nfs4_unlock_state();
bcecf1cc 2045 return status;
4dc6ec00
BF
2046}
2047
b37ad28b 2048__be32
b591480b
BF
2049nfsd4_setclientid(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
2050 struct nfsd4_setclientid *setclid)
1da177e4 2051{
a084daf5 2052 struct xdr_netobj clname = setclid->se_name;
1da177e4
LT
2053 nfs4_verifier clverifier = setclid->se_verf;
2054 unsigned int strhashval;
28ce6054 2055 struct nfs4_client *conf, *unconf, *new;
b37ad28b 2056 __be32 status;
a55370a3 2057 char dname[HEXDIR_LEN];
1da177e4 2058
a55370a3
N
2059 status = nfs4_make_rec_clidname(dname, &clname);
2060 if (status)
73aea4ec 2061 return status;
a55370a3 2062
1da177e4
LT
2063 /*
2064 * XXX The Duplicate Request Cache (DRC) has been checked (??)
2065 * We get here on a DRC miss.
2066 */
2067
a55370a3 2068 strhashval = clientstr_hashval(dname);
1da177e4 2069
1da177e4 2070 nfs4_lock_state();
e203d506 2071 conf = find_confirmed_client_by_str(dname, strhashval);
28ce6054 2072 if (conf) {
a186e767 2073 /* RFC 3530 14.2.33 CASE 0: */
1da177e4 2074 status = nfserr_clid_inuse;
e203d506
BF
2075 if (clp_used_exchangeid(conf))
2076 goto out;
026722c2 2077 if (!same_creds(&conf->cl_cred, &rqstp->rq_cred)) {
363168b4
JL
2078 char addr_str[INET6_ADDRSTRLEN];
2079 rpc_ntop((struct sockaddr *) &conf->cl_addr, addr_str,
2080 sizeof(addr_str));
2081 dprintk("NFSD: setclientid: string in use by client "
2082 "at %s\n", addr_str);
1da177e4
LT
2083 goto out;
2084 }
1da177e4 2085 }
a186e767
BF
2086 /*
2087 * section 14.2.33 of RFC 3530 (under the heading "IMPLEMENTATION")
2088 * has a description of SETCLIENTID request processing consisting
2089 * of 5 bullet points, labeled as CASE0 - CASE4 below.
2090 */
e203d506 2091 unconf = find_unconfirmed_client_by_str(dname, strhashval);
3e772463 2092 status = nfserr_jukebox;
1da177e4 2093 if (!conf) {
a186e767
BF
2094 /*
2095 * RFC 3530 14.2.33 CASE 4:
2096 * placed first, because it is the normal case
1da177e4
LT
2097 */
2098 if (unconf)
2099 expire_client(unconf);
b09333c4 2100 new = create_client(clname, dname, rqstp, &clverifier);
a55370a3 2101 if (new == NULL)
1da177e4 2102 goto out;
1da177e4 2103 gen_clid(new);
599e0a22 2104 } else if (same_verf(&conf->cl_verifier, &clverifier)) {
1da177e4 2105 /*
a186e767
BF
2106 * RFC 3530 14.2.33 CASE 1:
2107 * probable callback update
1da177e4 2108 */
31f4a6c1
N
2109 if (unconf) {
2110 /* Note this is removing unconfirmed {*x***},
2111 * which is stronger than RFC recommended {vxc**}.
2112 * This has the advantage that there is at most
2113 * one {*x***} in either list at any time.
2114 */
2115 expire_client(unconf);
1da177e4 2116 }
b09333c4 2117 new = create_client(clname, dname, rqstp, &clverifier);
a55370a3 2118 if (new == NULL)
1da177e4 2119 goto out;
1da177e4 2120 copy_clid(new, conf);
1da177e4
LT
2121 } else if (!unconf) {
2122 /*
a186e767
BF
2123 * RFC 3530 14.2.33 CASE 2:
2124 * probable client reboot; state will be removed if
2125 * confirmed.
1da177e4 2126 */
b09333c4 2127 new = create_client(clname, dname, rqstp, &clverifier);
a55370a3 2128 if (new == NULL)
1da177e4 2129 goto out;
1da177e4 2130 gen_clid(new);
49ba8781 2131 } else {
a186e767
BF
2132 /*
2133 * RFC 3530 14.2.33 CASE 3:
2134 * probable client reboot; state will be removed if
2135 * confirmed.
1da177e4
LT
2136 */
2137 expire_client(unconf);
b09333c4 2138 new = create_client(clname, dname, rqstp, &clverifier);
a55370a3 2139 if (new == NULL)
1da177e4 2140 goto out;
1da177e4 2141 gen_clid(new);
1da177e4 2142 }
8323c3b2
BF
2143 /*
2144 * XXX: we should probably set this at creation time, and check
2145 * for consistent minorversion use throughout:
2146 */
2147 new->cl_minorversion = 0;
6f3d772f 2148 gen_callback(new, setclid, rqstp);
c175b83c 2149 add_to_unconfirmed(new, strhashval);
1da177e4
LT
2150 setclid->se_clientid.cl_boot = new->cl_clientid.cl_boot;
2151 setclid->se_clientid.cl_id = new->cl_clientid.cl_id;
2152 memcpy(setclid->se_confirm.data, new->cl_confirm.data, sizeof(setclid->se_confirm.data));
2153 status = nfs_ok;
2154out:
2155 nfs4_unlock_state();
2156 return status;
2157}
2158
2159
2160/*
a186e767
BF
2161 * Section 14.2.34 of RFC 3530 (under the heading "IMPLEMENTATION") has
2162 * a description of SETCLIENTID_CONFIRM request processing consisting of 4
2163 * bullets, labeled as CASE1 - CASE4 below.
1da177e4 2164 */
b37ad28b 2165__be32
b591480b
BF
2166nfsd4_setclientid_confirm(struct svc_rqst *rqstp,
2167 struct nfsd4_compound_state *cstate,
2168 struct nfsd4_setclientid_confirm *setclientid_confirm)
1da177e4 2169{
363168b4 2170 struct sockaddr *sa = svc_addr(rqstp);
21ab45a4 2171 struct nfs4_client *conf, *unconf;
1da177e4
LT
2172 nfs4_verifier confirm = setclientid_confirm->sc_confirm;
2173 clientid_t * clid = &setclientid_confirm->sc_clientid;
b37ad28b 2174 __be32 status;
1da177e4
LT
2175
2176 if (STALE_CLIENTID(clid))
2177 return nfserr_stale_clientid;
2178 /*
2179 * XXX The Duplicate Request Cache (DRC) has been checked (??)
2180 * We get here on a DRC miss.
2181 */
2182
2183 nfs4_lock_state();
21ab45a4
N
2184
2185 conf = find_confirmed_client(clid);
2186 unconf = find_unconfirmed_client(clid);
2187
2188 status = nfserr_clid_inuse;
363168b4 2189 if (conf && !rpc_cmp_addr((struct sockaddr *) &conf->cl_addr, sa))
21ab45a4 2190 goto out;
363168b4 2191 if (unconf && !rpc_cmp_addr((struct sockaddr *) &unconf->cl_addr, sa))
21ab45a4
N
2192 goto out;
2193
a186e767
BF
2194 /*
2195 * section 14.2.34 of RFC 3530 has a description of
2196 * SETCLIENTID_CONFIRM request processing consisting
2197 * of 4 bullet points, labeled as CASE1 - CASE4 below.
2198 */
366e0c1d 2199 if (conf && unconf && same_verf(&confirm, &unconf->cl_confirm)) {
a186e767
BF
2200 /*
2201 * RFC 3530 14.2.34 CASE 1:
2202 * callback update
2203 */
599e0a22 2204 if (!same_creds(&conf->cl_cred, &unconf->cl_cred))
1da177e4
LT
2205 status = nfserr_clid_inuse;
2206 else {
5a3c9d71
BF
2207 nfsd4_change_callback(conf, &unconf->cl_cb_conn);
2208 nfsd4_probe_callback(conf);
1a69c179 2209 expire_client(unconf);
1da177e4 2210 status = nfs_ok;
1a69c179 2211
1da177e4 2212 }
f3aba4e5 2213 } else if (conf && !unconf) {
a186e767
BF
2214 /*
2215 * RFC 3530 14.2.34 CASE 2:
2216 * probable retransmitted request; play it safe and
2217 * do nothing.
7c79f737 2218 */
599e0a22 2219 if (!same_creds(&conf->cl_cred, &rqstp->rq_cred))
1da177e4 2220 status = nfserr_clid_inuse;
21ab45a4 2221 else
1da177e4 2222 status = nfs_ok;
7c79f737 2223 } else if (!conf && unconf
599e0a22 2224 && same_verf(&unconf->cl_confirm, &confirm)) {
a186e767
BF
2225 /*
2226 * RFC 3530 14.2.34 CASE 3:
2227 * Normal case; new or rebooted client:
7c79f737 2228 */
599e0a22 2229 if (!same_creds(&unconf->cl_cred, &rqstp->rq_cred)) {
1da177e4
LT
2230 status = nfserr_clid_inuse;
2231 } else {
1a69c179
N
2232 unsigned int hash =
2233 clientstr_hashval(unconf->cl_recdir);
2234 conf = find_confirmed_client_by_str(unconf->cl_recdir,
e203d506 2235 hash);
1a69c179 2236 if (conf) {
c7b9a459 2237 nfsd4_remove_clid_dir(conf);
1a69c179
N
2238 expire_client(conf);
2239 }
1da177e4 2240 move_to_confirmed(unconf);
21ab45a4 2241 conf = unconf;
5a3c9d71 2242 nfsd4_probe_callback(conf);
1a69c179 2243 status = nfs_ok;
1da177e4 2244 }
599e0a22
BF
2245 } else if ((!conf || (conf && !same_verf(&conf->cl_confirm, &confirm)))
2246 && (!unconf || (unconf && !same_verf(&unconf->cl_confirm,
7c79f737 2247 &confirm)))) {
a186e767
BF
2248 /*
2249 * RFC 3530 14.2.34 CASE 4:
2250 * Client probably hasn't noticed that we rebooted yet.
7c79f737 2251 */
1da177e4 2252 status = nfserr_stale_clientid;
7c79f737 2253 } else {
08e8987c
N
2254 /* check that we have hit one of the cases...*/
2255 status = nfserr_clid_inuse;
2256 }
1da177e4 2257out:
1da177e4
LT
2258 nfs4_unlock_state();
2259 return status;
2260}
2261
32513b40
BF
2262static struct nfs4_file *nfsd4_alloc_file(void)
2263{
2264 return kmem_cache_alloc(file_slab, GFP_KERNEL);
2265}
2266
1da177e4 2267/* OPEN Share state helper functions */
32513b40 2268static void nfsd4_init_file(struct nfs4_file *fp, struct inode *ino)
1da177e4 2269{
1da177e4
LT
2270 unsigned int hashval = file_hashval(ino);
2271
32513b40
BF
2272 atomic_set(&fp->fi_ref, 1);
2273 INIT_LIST_HEAD(&fp->fi_hash);
2274 INIT_LIST_HEAD(&fp->fi_stateids);
2275 INIT_LIST_HEAD(&fp->fi_delegations);
2276 fp->fi_inode = igrab(ino);
2277 fp->fi_had_conflict = false;
2278 fp->fi_lease = NULL;
2279 memset(fp->fi_fds, 0, sizeof(fp->fi_fds));
2280 memset(fp->fi_access, 0, sizeof(fp->fi_access));
2281 spin_lock(&recall_lock);
2282 list_add(&fp->fi_hash, &file_hashtbl[hashval]);
2283 spin_unlock(&recall_lock);
1da177e4
LT
2284}
2285
e60d4398 2286static void
e18b890b 2287nfsd4_free_slab(struct kmem_cache **slab)
1da177e4 2288{
e60d4398
N
2289 if (*slab == NULL)
2290 return;
1a1d92c1 2291 kmem_cache_destroy(*slab);
e60d4398 2292 *slab = NULL;
1da177e4
LT
2293}
2294
e8ff2a84 2295void
1da177e4
LT
2296nfsd4_free_slabs(void)
2297{
fe0750e5
BF
2298 nfsd4_free_slab(&openowner_slab);
2299 nfsd4_free_slab(&lockowner_slab);
e60d4398 2300 nfsd4_free_slab(&file_slab);
5ac049ac 2301 nfsd4_free_slab(&stateid_slab);
5b2d21c1 2302 nfsd4_free_slab(&deleg_slab);
e60d4398 2303}
1da177e4 2304
72083396 2305int
e60d4398
N
2306nfsd4_init_slabs(void)
2307{
fe0750e5
BF
2308 openowner_slab = kmem_cache_create("nfsd4_openowners",
2309 sizeof(struct nfs4_openowner), 0, 0, NULL);
2310 if (openowner_slab == NULL)
2311 goto out_nomem;
2312 lockowner_slab = kmem_cache_create("nfsd4_lockowners",
2313 sizeof(struct nfs4_openowner), 0, 0, NULL);
2314 if (lockowner_slab == NULL)
e60d4398
N
2315 goto out_nomem;
2316 file_slab = kmem_cache_create("nfsd4_files",
20c2df83 2317 sizeof(struct nfs4_file), 0, 0, NULL);
e60d4398
N
2318 if (file_slab == NULL)
2319 goto out_nomem;
5ac049ac 2320 stateid_slab = kmem_cache_create("nfsd4_stateids",
dcef0413 2321 sizeof(struct nfs4_ol_stateid), 0, 0, NULL);
5ac049ac
N
2322 if (stateid_slab == NULL)
2323 goto out_nomem;
5b2d21c1 2324 deleg_slab = kmem_cache_create("nfsd4_delegations",
20c2df83 2325 sizeof(struct nfs4_delegation), 0, 0, NULL);
5b2d21c1
N
2326 if (deleg_slab == NULL)
2327 goto out_nomem;
e60d4398
N
2328 return 0;
2329out_nomem:
2330 nfsd4_free_slabs();
2331 dprintk("nfsd4: out of memory while initializing nfsv4\n");
2332 return -ENOMEM;
1da177e4
LT
2333}
2334
fe0750e5
BF
2335void nfs4_free_openowner(struct nfs4_openowner *oo)
2336{
2337 kfree(oo->oo_owner.so_owner.data);
2338 kmem_cache_free(openowner_slab, oo);
2339}
2340
2341void nfs4_free_lockowner(struct nfs4_lockowner *lo)
1da177e4 2342{
fe0750e5
BF
2343 kfree(lo->lo_owner.so_owner.data);
2344 kmem_cache_free(lockowner_slab, lo);
1da177e4
LT
2345}
2346
ff194bd9 2347static void init_nfs4_replay(struct nfs4_replay *rp)
1da177e4 2348{
ff194bd9
BF
2349 rp->rp_status = nfserr_serverfault;
2350 rp->rp_buflen = 0;
2351 rp->rp_buf = rp->rp_ibuf;
1da177e4
LT
2352}
2353
fe0750e5 2354static inline void *alloc_stateowner(struct kmem_cache *slab, struct xdr_netobj *owner, struct nfs4_client *clp)
ff194bd9 2355{
1da177e4 2356 struct nfs4_stateowner *sop;
1da177e4 2357
fe0750e5 2358 sop = kmem_cache_alloc(slab, GFP_KERNEL);
ff194bd9
BF
2359 if (!sop)
2360 return NULL;
2361
2362 sop->so_owner.data = kmemdup(owner->data, owner->len, GFP_KERNEL);
2363 if (!sop->so_owner.data) {
fe0750e5 2364 kmem_cache_free(slab, sop);
1da177e4 2365 return NULL;
ff194bd9
BF
2366 }
2367 sop->so_owner.len = owner->len;
2368
ea1da636 2369 INIT_LIST_HEAD(&sop->so_stateids);
ff194bd9
BF
2370 sop->so_client = clp;
2371 init_nfs4_replay(&sop->so_replay);
2372 return sop;
2373}
2374
fe0750e5 2375static void hash_openowner(struct nfs4_openowner *oo, struct nfs4_client *clp, unsigned int strhashval)
ff194bd9 2376{
16bfdaaf 2377 list_add(&oo->oo_owner.so_strhash, &ownerstr_hashtbl[strhashval]);
fe0750e5 2378 list_add(&oo->oo_perclient, &clp->cl_openowners);
ff194bd9
BF
2379}
2380
fe0750e5 2381static struct nfs4_openowner *
ff194bd9 2382alloc_init_open_stateowner(unsigned int strhashval, struct nfs4_client *clp, struct nfsd4_open *open) {
fe0750e5 2383 struct nfs4_openowner *oo;
ff194bd9 2384
fe0750e5
BF
2385 oo = alloc_stateowner(openowner_slab, &open->op_owner, clp);
2386 if (!oo)
ff194bd9 2387 return NULL;
fe0750e5
BF
2388 oo->oo_owner.so_is_open_owner = 1;
2389 oo->oo_owner.so_seqid = open->op_seqid;
d29b20cd 2390 oo->oo_flags = NFS4_OO_NEW;
fe0750e5 2391 oo->oo_time = 0;
38c387b5 2392 oo->oo_last_closed_stid = NULL;
fe0750e5
BF
2393 INIT_LIST_HEAD(&oo->oo_close_lru);
2394 hash_openowner(oo, clp, strhashval);
2395 return oo;
1da177e4
LT
2396}
2397
996e0938 2398static void init_open_stateid(struct nfs4_ol_stateid *stp, struct nfs4_file *fp, struct nfsd4_open *open) {
fe0750e5 2399 struct nfs4_openowner *oo = open->op_openowner;
d3b313a4 2400 struct nfs4_client *clp = oo->oo_owner.so_client;
1da177e4 2401
996e0938 2402 init_stid(&stp->st_stid, clp, NFS4_OPEN_STID);
ea1da636 2403 INIT_LIST_HEAD(&stp->st_lockowners);
fe0750e5 2404 list_add(&stp->st_perstateowner, &oo->oo_owner.so_stateids);
8beefa24 2405 list_add(&stp->st_perfile, &fp->fi_stateids);
fe0750e5 2406 stp->st_stateowner = &oo->oo_owner;
13cd2184 2407 get_nfs4_file(fp);
1da177e4 2408 stp->st_file = fp;
1da177e4
LT
2409 stp->st_access_bmap = 0;
2410 stp->st_deny_bmap = 0;
b6d2f1ca 2411 __set_bit(open->op_share_access, &stp->st_access_bmap);
1da177e4 2412 __set_bit(open->op_share_deny, &stp->st_deny_bmap);
4c4cd222 2413 stp->st_openstp = NULL;
1da177e4
LT
2414}
2415
fd39ca9a 2416static void
fe0750e5 2417move_to_close_lru(struct nfs4_openowner *oo)
1da177e4 2418{
fe0750e5 2419 dprintk("NFSD: move_to_close_lru nfs4_openowner %p\n", oo);
1da177e4 2420
fe0750e5
BF
2421 list_move_tail(&oo->oo_close_lru, &close_lru);
2422 oo->oo_time = get_seconds();
1da177e4
LT
2423}
2424
1da177e4 2425static int
599e0a22
BF
2426same_owner_str(struct nfs4_stateowner *sop, struct xdr_netobj *owner,
2427 clientid_t *clid)
2428{
2429 return (sop->so_owner.len == owner->len) &&
2430 0 == memcmp(sop->so_owner.data, owner->data, owner->len) &&
2431 (sop->so_client->cl_clientid.cl_id == clid->cl_id);
1da177e4
LT
2432}
2433
fe0750e5 2434static struct nfs4_openowner *
1da177e4
LT
2435find_openstateowner_str(unsigned int hashval, struct nfsd4_open *open)
2436{
a50d2ad1
BF
2437 struct nfs4_stateowner *so;
2438 struct nfs4_openowner *oo;
1da177e4 2439
16bfdaaf
BF
2440 list_for_each_entry(so, &ownerstr_hashtbl[hashval], so_strhash) {
2441 if (!so->so_is_open_owner)
2442 continue;
a50d2ad1
BF
2443 if (same_owner_str(so, &open->op_owner, &open->op_clientid)) {
2444 oo = openowner(so);
2445 renew_client(oo->oo_owner.so_client);
2446 return oo;
2447 }
1da177e4
LT
2448 }
2449 return NULL;
2450}
2451
2452/* search file_hashtbl[] for file */
2453static struct nfs4_file *
2454find_file(struct inode *ino)
2455{
2456 unsigned int hashval = file_hashval(ino);
2457 struct nfs4_file *fp;
2458
8b671b80 2459 spin_lock(&recall_lock);
1da177e4 2460 list_for_each_entry(fp, &file_hashtbl[hashval], fi_hash) {
13cd2184
N
2461 if (fp->fi_inode == ino) {
2462 get_nfs4_file(fp);
8b671b80 2463 spin_unlock(&recall_lock);
1da177e4 2464 return fp;
13cd2184 2465 }
1da177e4 2466 }
8b671b80 2467 spin_unlock(&recall_lock);
1da177e4
LT
2468 return NULL;
2469}
2470
1da177e4
LT
2471/*
2472 * Called to check deny when READ with all zero stateid or
2473 * WRITE with all zero or all one stateid
2474 */
b37ad28b 2475static __be32
1da177e4
LT
2476nfs4_share_conflict(struct svc_fh *current_fh, unsigned int deny_type)
2477{
2478 struct inode *ino = current_fh->fh_dentry->d_inode;
2479 struct nfs4_file *fp;
dcef0413 2480 struct nfs4_ol_stateid *stp;
b37ad28b 2481 __be32 ret;
1da177e4
LT
2482
2483 dprintk("NFSD: nfs4_share_conflict\n");
2484
2485 fp = find_file(ino);
13cd2184
N
2486 if (!fp)
2487 return nfs_ok;
b700949b 2488 ret = nfserr_locked;
1da177e4 2489 /* Search for conflicting share reservations */
13cd2184
N
2490 list_for_each_entry(stp, &fp->fi_stateids, st_perfile) {
2491 if (test_bit(deny_type, &stp->st_deny_bmap) ||
2492 test_bit(NFS4_SHARE_DENY_BOTH, &stp->st_deny_bmap))
2493 goto out;
1da177e4 2494 }
13cd2184
N
2495 ret = nfs_ok;
2496out:
2497 put_nfs4_file(fp);
2498 return ret;
1da177e4
LT
2499}
2500
6b57d9c8 2501static void nfsd_break_one_deleg(struct nfs4_delegation *dp)
1da177e4 2502{
1da177e4
LT
2503 /* We're assuming the state code never drops its reference
2504 * without first removing the lease. Since we're in this lease
2505 * callback (and since the lease code is serialized by the kernel
2506 * lock) we know the server hasn't removed the lease yet, we know
2507 * it's safe to take a reference: */
2508 atomic_inc(&dp->dl_count);
2509
1da177e4 2510 list_add_tail(&dp->dl_recall_lru, &del_recall_lru);
1da177e4 2511
460781b5 2512 /* only place dl_time is set. protected by lock_flocks*/
1da177e4
LT
2513 dp->dl_time = get_seconds();
2514
6b57d9c8
BF
2515 nfsd4_cb_recall(dp);
2516}
2517
acfdf5c3 2518/* Called from break_lease() with lock_flocks() held. */
6b57d9c8
BF
2519static void nfsd_break_deleg_cb(struct file_lock *fl)
2520{
acfdf5c3
BF
2521 struct nfs4_file *fp = (struct nfs4_file *)fl->fl_owner;
2522 struct nfs4_delegation *dp;
6b57d9c8 2523
acfdf5c3
BF
2524 BUG_ON(!fp);
2525 /* We assume break_lease is only called once per lease: */
2526 BUG_ON(fp->fi_had_conflict);
0272e1fd
BF
2527 /*
2528 * We don't want the locks code to timeout the lease for us;
acfdf5c3 2529 * we'll remove it ourself if a delegation isn't returned
6b57d9c8 2530 * in time:
0272e1fd
BF
2531 */
2532 fl->fl_break_time = 0;
1da177e4 2533
5d926e8c 2534 spin_lock(&recall_lock);
acfdf5c3
BF
2535 fp->fi_had_conflict = true;
2536 list_for_each_entry(dp, &fp->fi_delegations, dl_perfile)
2537 nfsd_break_one_deleg(dp);
5d926e8c 2538 spin_unlock(&recall_lock);
1da177e4
LT
2539}
2540
1da177e4
LT
2541static
2542int nfsd_change_deleg_cb(struct file_lock **onlist, int arg)
2543{
2544 if (arg & F_UNLCK)
2545 return lease_modify(onlist, arg);
2546 else
2547 return -EAGAIN;
2548}
2549
7b021967 2550static const struct lock_manager_operations nfsd_lease_mng_ops = {
8fb47a4f
BF
2551 .lm_break = nfsd_break_deleg_cb,
2552 .lm_change = nfsd_change_deleg_cb,
1da177e4
LT
2553};
2554
7a8711c9
BF
2555static __be32 nfsd4_check_seqid(struct nfsd4_compound_state *cstate, struct nfs4_stateowner *so, u32 seqid)
2556{
2557 if (nfsd4_has_session(cstate))
2558 return nfs_ok;
2559 if (seqid == so->so_seqid - 1)
2560 return nfserr_replay_me;
2561 if (seqid == so->so_seqid)
2562 return nfs_ok;
2563 return nfserr_bad_seqid;
2564}
1da177e4 2565
b37ad28b 2566__be32
6668958f
AA
2567nfsd4_process_open1(struct nfsd4_compound_state *cstate,
2568 struct nfsd4_open *open)
1da177e4 2569{
1da177e4
LT
2570 clientid_t *clientid = &open->op_clientid;
2571 struct nfs4_client *clp = NULL;
2572 unsigned int strhashval;
fe0750e5 2573 struct nfs4_openowner *oo = NULL;
4cdc951b 2574 __be32 status;
1da177e4 2575
1da177e4
LT
2576 if (STALE_CLIENTID(&open->op_clientid))
2577 return nfserr_stale_clientid;
32513b40
BF
2578 /*
2579 * In case we need it later, after we've already created the
2580 * file and don't want to risk a further failure:
2581 */
2582 open->op_file = nfsd4_alloc_file();
2583 if (open->op_file == NULL)
2584 return nfserr_jukebox;
1da177e4 2585
16bfdaaf 2586 strhashval = ownerstr_hashval(clientid->cl_id, &open->op_owner);
fe0750e5
BF
2587 oo = find_openstateowner_str(strhashval, open);
2588 open->op_openowner = oo;
2589 if (!oo) {
1da177e4
LT
2590 clp = find_confirmed_client(clientid);
2591 if (clp == NULL)
0f442aa2 2592 return nfserr_expired;
bcf130f9 2593 goto new_owner;
1da177e4 2594 }
dad1c067 2595 if (!(oo->oo_flags & NFS4_OO_CONFIRMED)) {
0f442aa2 2596 /* Replace unconfirmed owners without checking for replay. */
fe0750e5
BF
2597 clp = oo->oo_owner.so_client;
2598 release_openowner(oo);
2599 open->op_openowner = NULL;
bcf130f9 2600 goto new_owner;
0f442aa2 2601 }
4cdc951b
BF
2602 status = nfsd4_check_seqid(cstate, &oo->oo_owner, open->op_seqid);
2603 if (status)
2604 return status;
2605 clp = oo->oo_owner.so_client;
2606 goto alloc_stateid;
bcf130f9
BF
2607new_owner:
2608 oo = alloc_init_open_stateowner(strhashval, clp, open);
2609 if (oo == NULL)
2610 return nfserr_jukebox;
2611 open->op_openowner = oo;
4cdc951b
BF
2612alloc_stateid:
2613 open->op_stp = nfs4_alloc_stateid(clp);
2614 if (!open->op_stp)
2615 return nfserr_jukebox;
0f442aa2 2616 return nfs_ok;
1da177e4
LT
2617}
2618
b37ad28b 2619static inline __be32
4a6e43e6
N
2620nfs4_check_delegmode(struct nfs4_delegation *dp, int flags)
2621{
2622 if ((flags & WR_STATE) && (dp->dl_type == NFS4_OPEN_DELEGATE_READ))
2623 return nfserr_openmode;
2624 else
2625 return nfs_ok;
2626}
2627
f459e453 2628static int share_access_to_flags(u32 share_access)
52f4fb43 2629{
f459e453 2630 share_access &= ~NFS4_SHARE_WANT_MASK;
52f4fb43 2631
f459e453 2632 return share_access == NFS4_SHARE_ACCESS_READ ? RD_STATE : WR_STATE;
52f4fb43
N
2633}
2634
38c2f4b1 2635static struct nfs4_delegation *find_deleg_stateid(struct nfs4_client *cl, stateid_t *s)
24a0111e 2636{
f459e453 2637 struct nfs4_stid *ret;
24a0111e 2638
38c2f4b1 2639 ret = find_stateid_by_type(cl, s, NFS4_DELEG_STID);
f459e453
BF
2640 if (!ret)
2641 return NULL;
2642 return delegstateid(ret);
24a0111e
BF
2643}
2644
8b289b2c
BF
2645static bool nfsd4_is_deleg_cur(struct nfsd4_open *open)
2646{
2647 return open->op_claim_type == NFS4_OPEN_CLAIM_DELEGATE_CUR ||
2648 open->op_claim_type == NFS4_OPEN_CLAIM_DELEG_CUR_FH;
2649}
2650
b37ad28b 2651static __be32
38c2f4b1 2652nfs4_check_deleg(struct nfs4_client *cl, struct nfs4_file *fp, struct nfsd4_open *open,
567d9829
N
2653 struct nfs4_delegation **dp)
2654{
2655 int flags;
b37ad28b 2656 __be32 status = nfserr_bad_stateid;
567d9829 2657
38c2f4b1 2658 *dp = find_deleg_stateid(cl, &open->op_delegate_stateid);
567d9829 2659 if (*dp == NULL)
c44c5eeb 2660 goto out;
24a0111e 2661 flags = share_access_to_flags(open->op_share_access);
567d9829
N
2662 status = nfs4_check_delegmode(*dp, flags);
2663 if (status)
2664 *dp = NULL;
c44c5eeb 2665out:
8b289b2c 2666 if (!nfsd4_is_deleg_cur(open))
c44c5eeb
N
2667 return nfs_ok;
2668 if (status)
2669 return status;
dad1c067 2670 open->op_openowner->oo_flags |= NFS4_OO_CONFIRMED;
c44c5eeb 2671 return nfs_ok;
567d9829
N
2672}
2673
b37ad28b 2674static __be32
dcef0413 2675nfs4_check_open(struct nfs4_file *fp, struct nfsd4_open *open, struct nfs4_ol_stateid **stpp)
1da177e4 2676{
dcef0413 2677 struct nfs4_ol_stateid *local;
fe0750e5 2678 struct nfs4_openowner *oo = open->op_openowner;
1da177e4 2679
8beefa24 2680 list_for_each_entry(local, &fp->fi_stateids, st_perfile) {
1da177e4
LT
2681 /* ignore lock owners */
2682 if (local->st_stateowner->so_is_open_owner == 0)
2683 continue;
2684 /* remember if we have seen this open owner */
fe0750e5 2685 if (local->st_stateowner == &oo->oo_owner)
1da177e4
LT
2686 *stpp = local;
2687 /* check for conflicting share reservations */
2688 if (!test_share(local, open))
77eaae8d 2689 return nfserr_share_denied;
1da177e4 2690 }
77eaae8d 2691 return nfs_ok;
1da177e4
LT
2692}
2693
996e0938
BF
2694static void nfs4_free_stateid(struct nfs4_ol_stateid *s)
2695{
2696 kmem_cache_free(stateid_slab, s);
5ac049ac
N
2697}
2698
21fb4016
BF
2699static inline int nfs4_access_to_access(u32 nfs4_access)
2700{
2701 int flags = 0;
2702
2703 if (nfs4_access & NFS4_SHARE_ACCESS_READ)
2704 flags |= NFSD_MAY_READ;
2705 if (nfs4_access & NFS4_SHARE_ACCESS_WRITE)
2706 flags |= NFSD_MAY_WRITE;
2707 return flags;
2708}
2709
0c12eaff
CB
2710static __be32 nfs4_get_vfs_file(struct svc_rqst *rqstp, struct nfs4_file *fp,
2711 struct svc_fh *cur_fh, struct nfsd4_open *open)
f9d7562f
BF
2712{
2713 __be32 status;
0c12eaff
CB
2714 int oflag = nfs4_access_to_omode(open->op_share_access);
2715 int access = nfs4_access_to_access(open->op_share_access);
2716
f9d7562f
BF
2717 if (!fp->fi_fds[oflag]) {
2718 status = nfsd_open(rqstp, cur_fh, S_IFREG, access,
2719 &fp->fi_fds[oflag]);
f9d7562f
BF
2720 if (status)
2721 return status;
2722 }
2723 nfs4_file_get_access(fp, oflag);
2724
2725 return nfs_ok;
2726}
2727
b37ad28b 2728static inline __be32
1da177e4
LT
2729nfsd4_truncate(struct svc_rqst *rqstp, struct svc_fh *fh,
2730 struct nfsd4_open *open)
2731{
2732 struct iattr iattr = {
2733 .ia_valid = ATTR_SIZE,
2734 .ia_size = 0,
2735 };
2736 if (!open->op_truncate)
2737 return 0;
2738 if (!(open->op_share_access & NFS4_SHARE_ACCESS_WRITE))
9246585a 2739 return nfserr_inval;
1da177e4
LT
2740 return nfsd_setattr(rqstp, fh, &iattr, 0, (time_t)0);
2741}
2742
b37ad28b 2743static __be32
dcef0413 2744nfs4_upgrade_open(struct svc_rqst *rqstp, struct nfs4_file *fp, struct svc_fh *cur_fh, struct nfs4_ol_stateid *stp, struct nfsd4_open *open)
1da177e4 2745{
b6d2f1ca 2746 u32 op_share_access = open->op_share_access;
7d947842 2747 bool new_access;
b37ad28b 2748 __be32 status;
1da177e4 2749
7d947842 2750 new_access = !test_bit(op_share_access, &stp->st_access_bmap);
f9d7562f 2751 if (new_access) {
0c12eaff 2752 status = nfs4_get_vfs_file(rqstp, fp, cur_fh, open);
f9d7562f
BF
2753 if (status)
2754 return status;
6c26d08f 2755 }
1da177e4
LT
2756 status = nfsd4_truncate(rqstp, cur_fh, open);
2757 if (status) {
f9d7562f 2758 if (new_access) {
f197c271 2759 int oflag = nfs4_access_to_omode(op_share_access);
f9d7562f
BF
2760 nfs4_file_put_access(fp, oflag);
2761 }
1da177e4
LT
2762 return status;
2763 }
2764 /* remember the open */
24a0111e 2765 __set_bit(op_share_access, &stp->st_access_bmap);
b55e0ba1 2766 __set_bit(open->op_share_deny, &stp->st_deny_bmap);
1da177e4
LT
2767
2768 return nfs_ok;
2769}
2770
2771
1da177e4 2772static void
37515177 2773nfs4_set_claim_prev(struct nfsd4_open *open)
1da177e4 2774{
dad1c067 2775 open->op_openowner->oo_flags |= NFS4_OO_CONFIRMED;
fe0750e5 2776 open->op_openowner->oo_owner.so_client->cl_firststate = 1;
1da177e4
LT
2777}
2778
14a24e99
BF
2779/* Should we give out recallable state?: */
2780static bool nfsd4_cb_channel_good(struct nfs4_client *clp)
2781{
2782 if (clp->cl_cb_state == NFSD4_CB_UP)
2783 return true;
2784 /*
2785 * In the sessions case, since we don't have to establish a
2786 * separate connection for callbacks, we assume it's OK
2787 * until we hear otherwise:
2788 */
2789 return clp->cl_minorversion && clp->cl_cb_state == NFSD4_CB_UNKNOWN;
2790}
2791
22d38c4c
BF
2792static struct file_lock *nfs4_alloc_init_lease(struct nfs4_delegation *dp, int flag)
2793{
2794 struct file_lock *fl;
2795
2796 fl = locks_alloc_lock();
2797 if (!fl)
2798 return NULL;
2799 locks_init_lock(fl);
2800 fl->fl_lmops = &nfsd_lease_mng_ops;
2801 fl->fl_flags = FL_LEASE;
2802 fl->fl_type = flag == NFS4_OPEN_DELEGATE_READ? F_RDLCK: F_WRLCK;
2803 fl->fl_end = OFFSET_MAX;
acfdf5c3 2804 fl->fl_owner = (fl_owner_t)(dp->dl_file);
22d38c4c 2805 fl->fl_pid = current->tgid;
22d38c4c
BF
2806 return fl;
2807}
2808
edab9782
BF
2809static int nfs4_setlease(struct nfs4_delegation *dp, int flag)
2810{
acfdf5c3 2811 struct nfs4_file *fp = dp->dl_file;
edab9782
BF
2812 struct file_lock *fl;
2813 int status;
2814
2815 fl = nfs4_alloc_init_lease(dp, flag);
2816 if (!fl)
2817 return -ENOMEM;
acfdf5c3 2818 fl->fl_file = find_readable_file(fp);
2a74aba7 2819 list_add(&dp->dl_perclnt, &dp->dl_stid.sc_client->cl_delegations);
acfdf5c3 2820 status = vfs_setlease(fl->fl_file, fl->fl_type, &fl);
edab9782 2821 if (status) {
acfdf5c3 2822 list_del_init(&dp->dl_perclnt);
edab9782
BF
2823 locks_free_lock(fl);
2824 return -ENOMEM;
2825 }
acfdf5c3
BF
2826 fp->fi_lease = fl;
2827 fp->fi_deleg_file = fl->fl_file;
2828 get_file(fp->fi_deleg_file);
2829 atomic_set(&fp->fi_delegees, 1);
2830 list_add(&dp->dl_perfile, &fp->fi_delegations);
2831 return 0;
2832}
2833
2834static int nfs4_set_delegation(struct nfs4_delegation *dp, int flag)
2835{
2836 struct nfs4_file *fp = dp->dl_file;
2837
2838 if (!fp->fi_lease)
2839 return nfs4_setlease(dp, flag);
2840 spin_lock(&recall_lock);
2841 if (fp->fi_had_conflict) {
2842 spin_unlock(&recall_lock);
2843 return -EAGAIN;
2844 }
2845 atomic_inc(&fp->fi_delegees);
2846 list_add(&dp->dl_perfile, &fp->fi_delegations);
2847 spin_unlock(&recall_lock);
2a74aba7 2848 list_add(&dp->dl_perclnt, &dp->dl_stid.sc_client->cl_delegations);
edab9782
BF
2849 return 0;
2850}
2851
1da177e4
LT
2852/*
2853 * Attempt to hand out a delegation.
2854 */
2855static void
dcef0413 2856nfs4_open_delegation(struct svc_fh *fh, struct nfsd4_open *open, struct nfs4_ol_stateid *stp)
1da177e4
LT
2857{
2858 struct nfs4_delegation *dp;
fe0750e5 2859 struct nfs4_openowner *oo = container_of(stp->st_stateowner, struct nfs4_openowner, oo_owner);
14a24e99 2860 int cb_up;
1da177e4
LT
2861 int status, flag = 0;
2862
fe0750e5 2863 cb_up = nfsd4_cb_channel_good(oo->oo_owner.so_client);
1da177e4 2864 flag = NFS4_OPEN_DELEGATE_NONE;
7b190fec
N
2865 open->op_recall = 0;
2866 switch (open->op_claim_type) {
2867 case NFS4_OPEN_CLAIM_PREVIOUS:
2bf23875 2868 if (!cb_up)
7b190fec
N
2869 open->op_recall = 1;
2870 flag = open->op_delegate_type;
2871 if (flag == NFS4_OPEN_DELEGATE_NONE)
2872 goto out;
2873 break;
2874 case NFS4_OPEN_CLAIM_NULL:
2875 /* Let's not give out any delegations till everyone's
2876 * had the chance to reclaim theirs.... */
af558e33 2877 if (locks_in_grace())
7b190fec 2878 goto out;
dad1c067 2879 if (!cb_up || !(oo->oo_flags & NFS4_OO_CONFIRMED))
7b190fec
N
2880 goto out;
2881 if (open->op_share_access & NFS4_SHARE_ACCESS_WRITE)
2882 flag = NFS4_OPEN_DELEGATE_WRITE;
2883 else
2884 flag = NFS4_OPEN_DELEGATE_READ;
2885 break;
2886 default:
2887 goto out;
2888 }
1da177e4 2889
fe0750e5 2890 dp = alloc_init_deleg(oo->oo_owner.so_client, stp, fh, flag);
dd239cc0
BF
2891 if (dp == NULL)
2892 goto out_no_deleg;
acfdf5c3 2893 status = nfs4_set_delegation(dp, flag);
edab9782 2894 if (status)
dd239cc0 2895 goto out_free;
1da177e4 2896
d5477a8d 2897 memcpy(&open->op_delegate_stateid, &dp->dl_stid.sc_stateid, sizeof(dp->dl_stid.sc_stateid));
1da177e4 2898
8c10cbdb 2899 dprintk("NFSD: delegation stateid=" STATEID_FMT "\n",
d5477a8d 2900 STATEID_VAL(&dp->dl_stid.sc_stateid));
1da177e4 2901out:
7b190fec
N
2902 if (open->op_claim_type == NFS4_OPEN_CLAIM_PREVIOUS
2903 && flag == NFS4_OPEN_DELEGATE_NONE
2904 && open->op_delegate_type != NFS4_OPEN_DELEGATE_NONE)
2fdada03 2905 dprintk("NFSD: WARNING: refusing delegation reclaim\n");
1da177e4 2906 open->op_delegate_type = flag;
dd239cc0
BF
2907 return;
2908out_free:
acfdf5c3 2909 nfs4_put_delegation(dp);
dd239cc0
BF
2910out_no_deleg:
2911 flag = NFS4_OPEN_DELEGATE_NONE;
2912 goto out;
1da177e4
LT
2913}
2914
2915/*
2916 * called with nfs4_lock_state() held.
2917 */
b37ad28b 2918__be32
1da177e4
LT
2919nfsd4_process_open2(struct svc_rqst *rqstp, struct svc_fh *current_fh, struct nfsd4_open *open)
2920{
6668958f 2921 struct nfsd4_compoundres *resp = rqstp->rq_resp;
38c2f4b1 2922 struct nfs4_client *cl = open->op_openowner->oo_owner.so_client;
1da177e4
LT
2923 struct nfs4_file *fp = NULL;
2924 struct inode *ino = current_fh->fh_dentry->d_inode;
dcef0413 2925 struct nfs4_ol_stateid *stp = NULL;
567d9829 2926 struct nfs4_delegation *dp = NULL;
b37ad28b 2927 __be32 status;
1da177e4 2928
1da177e4
LT
2929 /*
2930 * Lookup file; if found, lookup stateid and check open request,
2931 * and check for delegations in the process of being recalled.
2932 * If not found, create the nfs4_file struct
2933 */
2934 fp = find_file(ino);
2935 if (fp) {
2936 if ((status = nfs4_check_open(fp, open, &stp)))
2937 goto out;
38c2f4b1 2938 status = nfs4_check_deleg(cl, fp, open, &dp);
c44c5eeb
N
2939 if (status)
2940 goto out;
1da177e4 2941 } else {
c44c5eeb 2942 status = nfserr_bad_stateid;
8b289b2c 2943 if (nfsd4_is_deleg_cur(open))
c44c5eeb 2944 goto out;
3e772463 2945 status = nfserr_jukebox;
32513b40
BF
2946 fp = open->op_file;
2947 open->op_file = NULL;
2948 nfsd4_init_file(fp, ino);
1da177e4
LT
2949 }
2950
2951 /*
2952 * OPEN the file, or upgrade an existing OPEN.
2953 * If truncate fails, the OPEN fails.
2954 */
2955 if (stp) {
2956 /* Stateid was found, this is an OPEN upgrade */
f9d7562f 2957 status = nfs4_upgrade_open(rqstp, fp, current_fh, stp, open);
1da177e4
LT
2958 if (status)
2959 goto out;
2960 } else {
4cdc951b 2961 status = nfs4_get_vfs_file(rqstp, fp, current_fh, open);
567d9829 2962 if (status)
1da177e4 2963 goto out;
4cdc951b
BF
2964 stp = open->op_stp;
2965 open->op_stp = NULL;
996e0938 2966 init_open_stateid(stp, fp, open);
1da177e4
LT
2967 status = nfsd4_truncate(rqstp, current_fh, open);
2968 if (status) {
2283963f 2969 release_open_stateid(stp);
1da177e4
LT
2970 goto out;
2971 }
2972 }
dcef0413
BF
2973 update_stateid(&stp->st_stid.sc_stateid);
2974 memcpy(&open->op_stateid, &stp->st_stid.sc_stateid, sizeof(stateid_t));
1da177e4 2975
4dc6ec00 2976 if (nfsd4_has_session(&resp->cstate))
dad1c067 2977 open->op_openowner->oo_flags |= NFS4_OO_CONFIRMED;
6668958f 2978
1da177e4
LT
2979 /*
2980 * Attempt to hand out a delegation. No error return, because the
2981 * OPEN succeeds even if we fail.
2982 */
2983 nfs4_open_delegation(current_fh, open, stp);
2984
2985 status = nfs_ok;
2986
8c10cbdb 2987 dprintk("%s: stateid=" STATEID_FMT "\n", __func__,
dcef0413 2988 STATEID_VAL(&stp->st_stid.sc_stateid));
1da177e4 2989out:
13cd2184
N
2990 if (fp)
2991 put_nfs4_file(fp);
37515177
N
2992 if (status == 0 && open->op_claim_type == NFS4_OPEN_CLAIM_PREVIOUS)
2993 nfs4_set_claim_prev(open);
1da177e4
LT
2994 /*
2995 * To finish the open response, we just need to set the rflags.
2996 */
2997 open->op_rflags = NFS4_OPEN_RESULT_LOCKTYPE_POSIX;
dad1c067 2998 if (!(open->op_openowner->oo_flags & NFS4_OO_CONFIRMED) &&
6668958f 2999 !nfsd4_has_session(&resp->cstate))
1da177e4
LT
3000 open->op_rflags |= NFS4_OPEN_RESULT_CONFIRM;
3001
3002 return status;
3003}
3004
d29b20cd
BF
3005void nfsd4_cleanup_open_state(struct nfsd4_open *open, __be32 status)
3006{
3007 if (open->op_openowner) {
3008 struct nfs4_openowner *oo = open->op_openowner;
3009
3010 if (!list_empty(&oo->oo_owner.so_stateids))
3011 list_del_init(&oo->oo_close_lru);
3012 if (oo->oo_flags & NFS4_OO_NEW) {
3013 if (status) {
3014 release_openowner(oo);
3015 open->op_openowner = NULL;
3016 } else
3017 oo->oo_flags &= ~NFS4_OO_NEW;
3018 }
3019 }
32513b40
BF
3020 if (open->op_file)
3021 nfsd4_free_file(open->op_file);
4cdc951b
BF
3022 if (open->op_stp)
3023 nfs4_free_stateid(open->op_stp);
d29b20cd
BF
3024}
3025
b37ad28b 3026__be32
b591480b
BF
3027nfsd4_renew(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
3028 clientid_t *clid)
1da177e4
LT
3029{
3030 struct nfs4_client *clp;
b37ad28b 3031 __be32 status;
1da177e4
LT
3032
3033 nfs4_lock_state();
3034 dprintk("process_renew(%08x/%08x): starting\n",
3035 clid->cl_boot, clid->cl_id);
3036 status = nfserr_stale_clientid;
3037 if (STALE_CLIENTID(clid))
3038 goto out;
3039 clp = find_confirmed_client(clid);
3040 status = nfserr_expired;
3041 if (clp == NULL) {
3042 /* We assume the client took too long to RENEW. */
3043 dprintk("nfsd4_renew: clientid not found!\n");
3044 goto out;
3045 }
1da177e4 3046 status = nfserr_cb_path_down;
ea1da636 3047 if (!list_empty(&clp->cl_delegations)
77a3569d 3048 && clp->cl_cb_state != NFSD4_CB_UP)
1da177e4
LT
3049 goto out;
3050 status = nfs_ok;
3051out:
3052 nfs4_unlock_state();
3053 return status;
3054}
3055
c47d832b 3056static struct lock_manager nfsd4_manager = {
af558e33
BF
3057};
3058
a76b4319 3059static void
af558e33 3060nfsd4_end_grace(void)
a76b4319
N
3061{
3062 dprintk("NFSD: end of grace period\n");
c7b9a459 3063 nfsd4_recdir_purge_old();
af558e33 3064 locks_end_grace(&nfsd4_manager);
e46b498c
BF
3065 /*
3066 * Now that every NFSv4 client has had the chance to recover and
3067 * to see the (possibly new, possibly shorter) lease time, we
3068 * can safely set the next grace time to the current lease time:
3069 */
3070 nfsd4_grace = nfsd4_lease;
a76b4319
N
3071}
3072
fd39ca9a 3073static time_t
1da177e4
LT
3074nfs4_laundromat(void)
3075{
3076 struct nfs4_client *clp;
fe0750e5 3077 struct nfs4_openowner *oo;
1da177e4
LT
3078 struct nfs4_delegation *dp;
3079 struct list_head *pos, *next, reaplist;
cf07d2ea
BF
3080 time_t cutoff = get_seconds() - nfsd4_lease;
3081 time_t t, clientid_val = nfsd4_lease;
3082 time_t u, test_val = nfsd4_lease;
1da177e4
LT
3083
3084 nfs4_lock_state();
3085
3086 dprintk("NFSD: laundromat service - starting\n");
af558e33
BF
3087 if (locks_in_grace())
3088 nfsd4_end_grace();
36acb66b
BH
3089 INIT_LIST_HEAD(&reaplist);
3090 spin_lock(&client_lock);
1da177e4
LT
3091 list_for_each_safe(pos, next, &client_lru) {
3092 clp = list_entry(pos, struct nfs4_client, cl_lru);
3093 if (time_after((unsigned long)clp->cl_time, (unsigned long)cutoff)) {
3094 t = clp->cl_time - cutoff;
3095 if (clientid_val > t)
3096 clientid_val = t;
3097 break;
3098 }
d7682988
BH
3099 if (atomic_read(&clp->cl_refcount)) {
3100 dprintk("NFSD: client in use (clientid %08x)\n",
3101 clp->cl_clientid.cl_id);
3102 continue;
3103 }
3104 unhash_client_locked(clp);
3105 list_add(&clp->cl_lru, &reaplist);
36acb66b
BH
3106 }
3107 spin_unlock(&client_lock);
3108 list_for_each_safe(pos, next, &reaplist) {
3109 clp = list_entry(pos, struct nfs4_client, cl_lru);
1da177e4
LT
3110 dprintk("NFSD: purging unused client (clientid %08x)\n",
3111 clp->cl_clientid.cl_id);
c7b9a459 3112 nfsd4_remove_clid_dir(clp);
1da177e4
LT
3113 expire_client(clp);
3114 }
1da177e4
LT
3115 spin_lock(&recall_lock);
3116 list_for_each_safe(pos, next, &del_recall_lru) {
3117 dp = list_entry (pos, struct nfs4_delegation, dl_recall_lru);
3118 if (time_after((unsigned long)dp->dl_time, (unsigned long)cutoff)) {
3119 u = dp->dl_time - cutoff;
3120 if (test_val > u)
3121 test_val = u;
3122 break;
3123 }
1da177e4
LT
3124 list_move(&dp->dl_recall_lru, &reaplist);
3125 }
3126 spin_unlock(&recall_lock);
3127 list_for_each_safe(pos, next, &reaplist) {
3128 dp = list_entry (pos, struct nfs4_delegation, dl_recall_lru);
3129 list_del_init(&dp->dl_recall_lru);
3130 unhash_delegation(dp);
3131 }
cf07d2ea 3132 test_val = nfsd4_lease;
1da177e4 3133 list_for_each_safe(pos, next, &close_lru) {
fe0750e5
BF
3134 oo = container_of(pos, struct nfs4_openowner, oo_close_lru);
3135 if (time_after((unsigned long)oo->oo_time, (unsigned long)cutoff)) {
3136 u = oo->oo_time - cutoff;
1da177e4
LT
3137 if (test_val > u)
3138 test_val = u;
3139 break;
3140 }
fe0750e5 3141 release_openowner(oo);
1da177e4
LT
3142 }
3143 if (clientid_val < NFSD_LAUNDROMAT_MINTIMEOUT)
3144 clientid_val = NFSD_LAUNDROMAT_MINTIMEOUT;
3145 nfs4_unlock_state();
3146 return clientid_val;
3147}
3148
a254b246
HH
3149static struct workqueue_struct *laundry_wq;
3150static void laundromat_main(struct work_struct *);
3151static DECLARE_DELAYED_WORK(laundromat_work, laundromat_main);
3152
3153static void
c4028958 3154laundromat_main(struct work_struct *not_used)
1da177e4
LT
3155{
3156 time_t t;
3157
3158 t = nfs4_laundromat();
3159 dprintk("NFSD: laundromat_main - sleeping for %ld seconds\n", t);
58da282b 3160 queue_delayed_work(laundry_wq, &laundromat_work, t*HZ);
1da177e4
LT
3161}
3162
f7a4d872 3163static inline __be32 nfs4_check_fh(struct svc_fh *fhp, struct nfs4_ol_stateid *stp)
1da177e4 3164{
f7a4d872
BF
3165 if (fhp->fh_dentry->d_inode != stp->st_file->fi_inode)
3166 return nfserr_bad_stateid;
3167 return nfs_ok;
1da177e4
LT
3168}
3169
3170static int
3171STALE_STATEID(stateid_t *stateid)
3172{
d3b313a4 3173 if (stateid->si_opaque.so_clid.cl_boot == boot_time)
e4e83ea4
BF
3174 return 0;
3175 dprintk("NFSD: stale stateid " STATEID_FMT "!\n",
8c10cbdb 3176 STATEID_VAL(stateid));
e4e83ea4 3177 return 1;
1da177e4
LT
3178}
3179
3180static inline int
3181access_permit_read(unsigned long access_bmap)
3182{
3183 return test_bit(NFS4_SHARE_ACCESS_READ, &access_bmap) ||
3184 test_bit(NFS4_SHARE_ACCESS_BOTH, &access_bmap) ||
3185 test_bit(NFS4_SHARE_ACCESS_WRITE, &access_bmap);
3186}
3187
3188static inline int
3189access_permit_write(unsigned long access_bmap)
3190{
3191 return test_bit(NFS4_SHARE_ACCESS_WRITE, &access_bmap) ||
3192 test_bit(NFS4_SHARE_ACCESS_BOTH, &access_bmap);
3193}
3194
3195static
dcef0413 3196__be32 nfs4_check_openmode(struct nfs4_ol_stateid *stp, int flags)
1da177e4 3197{
b37ad28b 3198 __be32 status = nfserr_openmode;
1da177e4 3199
02921914
BF
3200 /* For lock stateid's, we test the parent open, not the lock: */
3201 if (stp->st_openstp)
3202 stp = stp->st_openstp;
1da177e4
LT
3203 if ((flags & WR_STATE) && (!access_permit_write(stp->st_access_bmap)))
3204 goto out;
3205 if ((flags & RD_STATE) && (!access_permit_read(stp->st_access_bmap)))
3206 goto out;
3207 status = nfs_ok;
3208out:
3209 return status;
3210}
3211
b37ad28b 3212static inline __be32
1da177e4
LT
3213check_special_stateids(svc_fh *current_fh, stateid_t *stateid, int flags)
3214{
203a8c8e 3215 if (ONE_STATEID(stateid) && (flags & RD_STATE))
1da177e4 3216 return nfs_ok;
af558e33 3217 else if (locks_in_grace()) {
25985edc 3218 /* Answer in remaining cases depends on existence of
1da177e4
LT
3219 * conflicting state; so we must wait out the grace period. */
3220 return nfserr_grace;
3221 } else if (flags & WR_STATE)
3222 return nfs4_share_conflict(current_fh,
3223 NFS4_SHARE_DENY_WRITE);
3224 else /* (flags & RD_STATE) && ZERO_STATEID(stateid) */
3225 return nfs4_share_conflict(current_fh,
3226 NFS4_SHARE_DENY_READ);
3227}
3228
/*
 * Allow READ/WRITE during grace period on recovered state only for files
 * that are not able to provide mandatory locking.
 *
 * Returns 1 when I/O on the inode must be refused for now, 0 otherwise.
 */
static inline int
grace_disallows_io(struct inode *inode)
{
	if (!locks_in_grace())
		return 0;
	return mandatory_lock(inode) != 0;
}
3238
81b82965
BF
3239/* Returns true iff a is later than b: */
3240static bool stateid_generation_after(stateid_t *a, stateid_t *b)
3241{
3242 return (s32)a->si_generation - (s32)b->si_generation > 0;
3243}
3244
28dde241 3245static int check_stateid_generation(stateid_t *in, stateid_t *ref, bool has_session)
0836f587 3246{
6668958f
AA
3247 /*
3248 * When sessions are used the stateid generation number is ignored
3249 * when it is zero.
3250 */
28dde241 3251 if (has_session && in->si_generation == 0)
81b82965
BF
3252 return nfs_ok;
3253
3254 if (in->si_generation == ref->si_generation)
3255 return nfs_ok;
6668958f 3256
0836f587 3257 /* If the client sends us a stateid from the future, it's buggy: */
81b82965 3258 if (stateid_generation_after(in, ref))
0836f587
BF
3259 return nfserr_bad_stateid;
3260 /*
81b82965
BF
3261 * However, we could see a stateid from the past, even from a
3262 * non-buggy client. For example, if the client sends a lock
3263 * while some IO is outstanding, the lock may bump si_generation
3264 * while the IO is still in flight. The client could avoid that
3265 * situation by waiting for responses on all the IO requests,
3266 * but better performance may result in retrying IO that
3267 * receives an old_stateid error if requests are rarely
3268 * reordered in flight:
0836f587 3269 */
81b82965 3270 return nfserr_old_stateid;
0836f587
BF
3271}
3272
38c2f4b1 3273__be32 nfs4_validate_stateid(struct nfs4_client *cl, stateid_t *stateid)
17456804 3274{
97b7e3b6
BF
3275 struct nfs4_stid *s;
3276 struct nfs4_ol_stateid *ols;
3277 __be32 status;
17456804
BS
3278
3279 if (STALE_STATEID(stateid))
97b7e3b6 3280 return nfserr_stale_stateid;
17456804 3281
38c2f4b1 3282 s = find_stateid(cl, stateid);
97b7e3b6
BF
3283 if (!s)
3284 return nfserr_stale_stateid;
36279ac1 3285 status = check_stateid_generation(stateid, &s->sc_stateid, 1);
17456804 3286 if (status)
97b7e3b6
BF
3287 return status;
3288 if (!(s->sc_type & (NFS4_OPEN_STID | NFS4_LOCK_STID)))
3289 return nfs_ok;
3290 ols = openlockstateid(s);
3291 if (ols->st_stateowner->so_is_open_owner
dad1c067 3292 && !(openowner(ols->st_stateowner)->oo_flags & NFS4_OO_CONFIRMED))
97b7e3b6
BF
3293 return nfserr_bad_stateid;
3294 return nfs_ok;
17456804
BS
3295}
3296
38c2f4b1
BF
3297static __be32 nfsd4_lookup_stateid(stateid_t *stateid, unsigned char typemask, struct nfs4_stid **s)
3298{
3299 struct nfs4_client *cl;
3300
3301 if (ZERO_STATEID(stateid) || ONE_STATEID(stateid))
3302 return nfserr_bad_stateid;
3303 if (STALE_STATEID(stateid))
3304 return nfserr_stale_stateid;
3305 cl = find_confirmed_client(&stateid->si_opaque.so_clid);
3306 if (!cl)
3307 return nfserr_expired;
3308 *s = find_stateid_by_type(cl, stateid, typemask);
3309 if (!*s)
3310 return nfserr_bad_stateid;
3311 return nfs_ok;
3312
3313}
3314
1da177e4
LT
3315/*
3316* Checks for stateid operations
3317*/
b37ad28b 3318__be32
dd453dfd
BH
3319nfs4_preprocess_stateid_op(struct nfsd4_compound_state *cstate,
3320 stateid_t *stateid, int flags, struct file **filpp)
1da177e4 3321{
69064a27 3322 struct nfs4_stid *s;
dcef0413 3323 struct nfs4_ol_stateid *stp = NULL;
1da177e4 3324 struct nfs4_delegation *dp = NULL;
dd453dfd 3325 struct svc_fh *current_fh = &cstate->current_fh;
1da177e4 3326 struct inode *ino = current_fh->fh_dentry->d_inode;
b37ad28b 3327 __be32 status;
1da177e4 3328
1da177e4
LT
3329 if (filpp)
3330 *filpp = NULL;
3331
18f82731 3332 if (grace_disallows_io(ino))
1da177e4
LT
3333 return nfserr_grace;
3334
3335 if (ZERO_STATEID(stateid) || ONE_STATEID(stateid))
3336 return check_special_stateids(current_fh, stateid, flags);
3337
38c2f4b1
BF
3338 status = nfsd4_lookup_stateid(stateid, NFS4_DELEG_STID|NFS4_OPEN_STID|NFS4_LOCK_STID, &s);
3339 if (status)
3340 return status;
69064a27
BF
3341 status = check_stateid_generation(stateid, &s->sc_stateid, nfsd4_has_session(cstate));
3342 if (status)
3343 goto out;
f7a4d872
BF
3344 switch (s->sc_type) {
3345 case NFS4_DELEG_STID:
69064a27 3346 dp = delegstateid(s);
dc9bf700
BF
3347 status = nfs4_check_delegmode(dp, flags);
3348 if (status)
3349 goto out;
43b0178e 3350 if (filpp) {
acfdf5c3 3351 *filpp = dp->dl_file->fi_deleg_file;
43b0178e
DC
3352 BUG_ON(!*filpp);
3353 }
f7a4d872
BF
3354 break;
3355 case NFS4_OPEN_STID:
3356 case NFS4_LOCK_STID:
69064a27 3357 stp = openlockstateid(s);
f7a4d872
BF
3358 status = nfs4_check_fh(current_fh, stp);
3359 if (status)
1da177e4 3360 goto out;
fe0750e5 3361 if (stp->st_stateowner->so_is_open_owner
dad1c067 3362 && !(openowner(stp->st_stateowner)->oo_flags & NFS4_OO_CONFIRMED))
1da177e4 3363 goto out;
a4455be0
BF
3364 status = nfs4_check_openmode(stp, flags);
3365 if (status)
1da177e4 3366 goto out;
f9d7562f
BF
3367 if (filpp) {
3368 if (flags & RD_STATE)
3369 *filpp = find_readable_file(stp->st_file);
3370 else
3371 *filpp = find_writeable_file(stp->st_file);
f9d7562f 3372 }
f7a4d872
BF
3373 break;
3374 default:
3375 return nfserr_bad_stateid;
1da177e4
LT
3376 }
3377 status = nfs_ok;
3378out:
3379 return status;
3380}
3381
e1ca12df 3382static __be32
dcef0413 3383nfsd4_free_lock_stateid(struct nfs4_ol_stateid *stp)
e1ca12df 3384{
fe0750e5 3385 if (check_for_locks(stp->st_file, lockowner(stp->st_stateowner)))
e1ca12df
BS
3386 return nfserr_locks_held;
3387 release_lock_stateid(stp);
3388 return nfs_ok;
3389}
3390
17456804
BS
3391/*
3392 * Test if the stateid is valid
3393 */
3394__be32
3395nfsd4_test_stateid(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
3396 struct nfsd4_test_stateid *test_stateid)
3397{
36279ac1 3398 /* real work is done during encoding */
17456804
BS
3399 return nfs_ok;
3400}
3401
e1ca12df
BS
3402__be32
3403nfsd4_free_stateid(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
3404 struct nfsd4_free_stateid *free_stateid)
3405{
3406 stateid_t *stateid = &free_stateid->fr_stateid;
2da1cec7 3407 struct nfs4_stid *s;
38c2f4b1 3408 struct nfs4_client *cl = cstate->session->se_client;
2da1cec7 3409 __be32 ret = nfserr_bad_stateid;
e1ca12df
BS
3410
3411 nfs4_lock_state();
38c2f4b1 3412 s = find_stateid(cl, stateid);
2da1cec7 3413 if (!s)
81b82965 3414 goto out;
2da1cec7
BF
3415 switch (s->sc_type) {
3416 case NFS4_DELEG_STID:
e1ca12df
BS
3417 ret = nfserr_locks_held;
3418 goto out;
2da1cec7
BF
3419 case NFS4_OPEN_STID:
3420 case NFS4_LOCK_STID:
3421 ret = check_stateid_generation(stateid, &s->sc_stateid, 1);
3422 if (ret)
3423 goto out;
3424 if (s->sc_type == NFS4_LOCK_STID)
3425 ret = nfsd4_free_lock_stateid(openlockstateid(s));
3426 else
3427 ret = nfserr_locks_held;
f7a4d872
BF
3428 break;
3429 default:
3430 ret = nfserr_bad_stateid;
e1ca12df 3431 }
e1ca12df
BS
3432out:
3433 nfs4_unlock_state();
3434 return ret;
3435}
3436
4c4cd222
N
3437static inline int
3438setlkflg (int type)
3439{
3440 return (type == NFS4_READW_LT || type == NFS4_READ_LT) ?
3441 RD_STATE : WR_STATE;
3442}
1da177e4 3443
dcef0413 3444static __be32 nfs4_seqid_op_checks(struct nfsd4_compound_state *cstate, stateid_t *stateid, u32 seqid, struct nfs4_ol_stateid *stp)
c0a5d93e
BF
3445{
3446 struct svc_fh *current_fh = &cstate->current_fh;
3447 struct nfs4_stateowner *sop = stp->st_stateowner;
3448 __be32 status;
3449
c0a5d93e
BF
3450 status = nfsd4_check_seqid(cstate, sop, seqid);
3451 if (status)
3452 return status;
f7a4d872
BF
3453 if (stp->st_stid.sc_type == NFS4_CLOSED_STID)
3454 /*
3455 * "Closed" stateid's exist *only* to return
3456 * nfserr_replay_me from the previous step.
3457 */
3458 return nfserr_bad_stateid;
3459 status = check_stateid_generation(stateid, &stp->st_stid.sc_stateid, nfsd4_has_session(cstate));
3460 if (status)
3461 return status;
3462 return nfs4_check_fh(current_fh, stp);
c0a5d93e
BF
3463}
3464
1da177e4
LT
3465/*
3466 * Checks for sequence id mutating operations.
3467 */
b37ad28b 3468static __be32
dd453dfd 3469nfs4_preprocess_seqid_op(struct nfsd4_compound_state *cstate, u32 seqid,
2288d0e3 3470 stateid_t *stateid, char typemask,
dcef0413 3471 struct nfs4_ol_stateid **stpp)
1da177e4 3472{
0836f587 3473 __be32 status;
38c2f4b1 3474 struct nfs4_stid *s;
1da177e4 3475
8c10cbdb
BH
3476 dprintk("NFSD: %s: seqid=%d stateid = " STATEID_FMT "\n", __func__,
3477 seqid, STATEID_VAL(stateid));
3a4f98bb 3478
1da177e4 3479 *stpp = NULL;
38c2f4b1 3480 status = nfsd4_lookup_stateid(stateid, typemask, &s);
c0a5d93e
BF
3481 if (status)
3482 return status;
38c2f4b1 3483 *stpp = openlockstateid(s);
c0a5d93e 3484 cstate->replay_owner = (*stpp)->st_stateowner;
1da177e4 3485
c0a5d93e
BF
3486 return nfs4_seqid_op_checks(cstate, stateid, seqid, *stpp);
3487}
39325bd0 3488
dcef0413 3489static __be32 nfs4_preprocess_confirmed_seqid_op(struct nfsd4_compound_state *cstate, u32 seqid, stateid_t *stateid, struct nfs4_ol_stateid **stpp)
c0a5d93e
BF
3490{
3491 __be32 status;
3492 struct nfs4_openowner *oo;
1da177e4 3493
c0a5d93e 3494 status = nfs4_preprocess_seqid_op(cstate, seqid, stateid,
2288d0e3 3495 NFS4_OPEN_STID, stpp);
7a8711c9
BF
3496 if (status)
3497 return status;
c0a5d93e 3498 oo = openowner((*stpp)->st_stateowner);
dad1c067 3499 if (!(oo->oo_flags & NFS4_OO_CONFIRMED))
3a4f98bb 3500 return nfserr_bad_stateid;
3a4f98bb 3501 return nfs_ok;
1da177e4
LT
3502}
3503
b37ad28b 3504__be32
ca364317 3505nfsd4_open_confirm(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
a4f1706a 3506 struct nfsd4_open_confirm *oc)
1da177e4 3507{
b37ad28b 3508 __be32 status;
fe0750e5 3509 struct nfs4_openowner *oo;
dcef0413 3510 struct nfs4_ol_stateid *stp;
1da177e4
LT
3511
3512 dprintk("NFSD: nfsd4_open_confirm on file %.*s\n",
ca364317
BF
3513 (int)cstate->current_fh.fh_dentry->d_name.len,
3514 cstate->current_fh.fh_dentry->d_name.name);
1da177e4 3515
ca364317 3516 status = fh_verify(rqstp, &cstate->current_fh, S_IFREG, 0);
a8cddc5d
BF
3517 if (status)
3518 return status;
1da177e4
LT
3519
3520 nfs4_lock_state();
3521
9072d5c6 3522 status = nfs4_preprocess_seqid_op(cstate,
ca364317 3523 oc->oc_seqid, &oc->oc_req_stateid,
2288d0e3 3524 NFS4_OPEN_STID, &stp);
9072d5c6 3525 if (status)
68b66e82 3526 goto out;
fe0750e5 3527 oo = openowner(stp->st_stateowner);
68b66e82 3528 status = nfserr_bad_stateid;
dad1c067 3529 if (oo->oo_flags & NFS4_OO_CONFIRMED)
68b66e82 3530 goto out;
dad1c067 3531 oo->oo_flags |= NFS4_OO_CONFIRMED;
dcef0413
BF
3532 update_stateid(&stp->st_stid.sc_stateid);
3533 memcpy(&oc->oc_resp_stateid, &stp->st_stid.sc_stateid, sizeof(stateid_t));
8c10cbdb 3534 dprintk("NFSD: %s: success, seqid=%d stateid=" STATEID_FMT "\n",
dcef0413 3535 __func__, oc->oc_seqid, STATEID_VAL(&stp->st_stid.sc_stateid));
c7b9a459 3536
fe0750e5 3537 nfsd4_create_clid_dir(oo->oo_owner.so_client);
68b66e82 3538 status = nfs_ok;
1da177e4 3539out:
5ec094c1
BF
3540 if (!cstate->replay_owner)
3541 nfs4_unlock_state();
1da177e4
LT
3542 return status;
3543}
3544
6409a5a6 3545static inline void nfs4_stateid_downgrade_bit(struct nfs4_ol_stateid *stp, u32 access)
1da177e4 3546{
6409a5a6
BF
3547 if (!test_bit(access, &stp->st_access_bmap))
3548 return;
3549 nfs4_file_put_access(stp->st_file, nfs4_access_to_omode(access));
3550 __clear_bit(access, &stp->st_access_bmap);
3551}
f197c271 3552
6409a5a6
BF
3553static inline void nfs4_stateid_downgrade(struct nfs4_ol_stateid *stp, u32 to_access)
3554{
3555 switch (to_access) {
3556 case NFS4_SHARE_ACCESS_READ:
3557 nfs4_stateid_downgrade_bit(stp, NFS4_SHARE_ACCESS_WRITE);
3558 nfs4_stateid_downgrade_bit(stp, NFS4_SHARE_ACCESS_BOTH);
3559 break;
3560 case NFS4_SHARE_ACCESS_WRITE:
3561 nfs4_stateid_downgrade_bit(stp, NFS4_SHARE_ACCESS_READ);
3562 nfs4_stateid_downgrade_bit(stp, NFS4_SHARE_ACCESS_BOTH);
3563 break;
3564 case NFS4_SHARE_ACCESS_BOTH:
3565 break;
3566 default:
3567 BUG();
1da177e4
LT
3568 }
3569}
3570
/*
 * Clear from bmap every bit index in 1..3 that has a bit set outside
 * deny.  Index 0 is never cleared, since it has no bits that could fall
 * outside deny.
 */
static void
reset_union_bmap_deny(unsigned long deny, unsigned long *bmap)
{
	int bit;

	for (bit = 1; bit <= 3; bit++) {
		if ((bit & ~deny) != 0)
			__clear_bit(bit, bmap);
	}
}
3580
b37ad28b 3581__be32
ca364317
BF
3582nfsd4_open_downgrade(struct svc_rqst *rqstp,
3583 struct nfsd4_compound_state *cstate,
a4f1706a 3584 struct nfsd4_open_downgrade *od)
1da177e4 3585{
b37ad28b 3586 __be32 status;
dcef0413 3587 struct nfs4_ol_stateid *stp;
1da177e4
LT
3588
3589 dprintk("NFSD: nfsd4_open_downgrade on file %.*s\n",
ca364317
BF
3590 (int)cstate->current_fh.fh_dentry->d_name.len,
3591 cstate->current_fh.fh_dentry->d_name.name);
1da177e4 3592
c30e92df
BF
3593 /* We don't yet support WANT bits: */
3594 od->od_share_access &= NFS4_SHARE_ACCESS_MASK;
1da177e4
LT
3595
3596 nfs4_lock_state();
c0a5d93e
BF
3597 status = nfs4_preprocess_confirmed_seqid_op(cstate, od->od_seqid,
3598 &od->od_stateid, &stp);
9072d5c6 3599 if (status)
1da177e4 3600 goto out;
1da177e4
LT
3601 status = nfserr_inval;
3602 if (!test_bit(od->od_share_access, &stp->st_access_bmap)) {
3603 dprintk("NFSD:access not a subset current bitmap: 0x%lx, input access=%08x\n",
3604 stp->st_access_bmap, od->od_share_access);
3605 goto out;
3606 }
3607 if (!test_bit(od->od_share_deny, &stp->st_deny_bmap)) {
3608 dprintk("NFSD:deny not a subset current bitmap: 0x%lx, input deny=%08x\n",
3609 stp->st_deny_bmap, od->od_share_deny);
3610 goto out;
3611 }
6409a5a6 3612 nfs4_stateid_downgrade(stp, od->od_share_access);
1da177e4 3613
1da177e4
LT
3614 reset_union_bmap_deny(od->od_share_deny, &stp->st_deny_bmap);
3615
dcef0413
BF
3616 update_stateid(&stp->st_stid.sc_stateid);
3617 memcpy(&od->od_stateid, &stp->st_stid.sc_stateid, sizeof(stateid_t));
1da177e4
LT
3618 status = nfs_ok;
3619out:
5ec094c1
BF
3620 if (!cstate->replay_owner)
3621 nfs4_unlock_state();
1da177e4
LT
3622 return status;
3623}
3624
38c387b5
BF
3625void nfsd4_purge_closed_stateid(struct nfs4_stateowner *so)
3626{
3627 struct nfs4_openowner *oo;
3628 struct nfs4_ol_stateid *s;
3629
3630 if (!so->so_is_open_owner)
3631 return;
3632 oo = openowner(so);
3633 s = oo->oo_last_closed_stid;
3634 if (!s)
3635 return;
3636 if (!(oo->oo_flags & NFS4_OO_PURGE_CLOSE)) {
3637 /* Release the last_closed_stid on the next seqid bump: */
3638 oo->oo_flags |= NFS4_OO_PURGE_CLOSE;
3639 return;
3640 }
3641 oo->oo_flags &= ~NFS4_OO_PURGE_CLOSE;
f7a4d872
BF
3642 release_last_closed_stateid(oo);
3643}
3644
3645static void nfsd4_close_open_stateid(struct nfs4_ol_stateid *s)
3646{
3647 unhash_open_stateid(s);
3648 s->st_stid.sc_type = NFS4_CLOSED_STID;
38c387b5
BF
3649}
3650
1da177e4
LT
3651/*
3652 * nfs4_unlock_state() called after encode
3653 */
b37ad28b 3654__be32
ca364317 3655nfsd4_close(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
a4f1706a 3656 struct nfsd4_close *close)
1da177e4 3657{
b37ad28b 3658 __be32 status;
fe0750e5 3659 struct nfs4_openowner *oo;
dcef0413 3660 struct nfs4_ol_stateid *stp;
1da177e4
LT
3661
3662 dprintk("NFSD: nfsd4_close on file %.*s\n",
ca364317
BF
3663 (int)cstate->current_fh.fh_dentry->d_name.len,
3664 cstate->current_fh.fh_dentry->d_name.name);
1da177e4
LT
3665
3666 nfs4_lock_state();
f7a4d872
BF
3667 status = nfs4_preprocess_seqid_op(cstate, close->cl_seqid,
3668 &close->cl_stateid,
3669 NFS4_OPEN_STID|NFS4_CLOSED_STID,
3670 &stp);
9072d5c6 3671 if (status)
1da177e4 3672 goto out;
fe0750e5 3673 oo = openowner(stp->st_stateowner);
1da177e4 3674 status = nfs_ok;
dcef0413
BF
3675 update_stateid(&stp->st_stid.sc_stateid);
3676 memcpy(&close->cl_stateid, &stp->st_stid.sc_stateid, sizeof(stateid_t));
1da177e4 3677
f7a4d872 3678 nfsd4_close_open_stateid(stp);
38c387b5 3679 oo->oo_last_closed_stid = stp;
04ef5954
BF
3680
3681 /* place unused nfs4_stateowners on so_close_lru list to be
3682 * released by the laundromat service after the lease period
3683 * to enable us to handle CLOSE replay
3684 */
fe0750e5
BF
3685 if (list_empty(&oo->oo_owner.so_stateids))
3686 move_to_close_lru(oo);
1da177e4 3687out:
5ec094c1
BF
3688 if (!cstate->replay_owner)
3689 nfs4_unlock_state();
1da177e4
LT
3690 return status;
3691}
3692
b37ad28b 3693__be32
ca364317
BF
3694nfsd4_delegreturn(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
3695 struct nfsd4_delegreturn *dr)
1da177e4 3696{
203a8c8e
BF
3697 struct nfs4_delegation *dp;
3698 stateid_t *stateid = &dr->dr_stateid;
38c2f4b1 3699 struct nfs4_stid *s;
203a8c8e 3700 struct inode *inode;
b37ad28b 3701 __be32 status;
1da177e4 3702
ca364317 3703 if ((status = fh_verify(rqstp, &cstate->current_fh, S_IFREG, 0)))
203a8c8e
BF
3704 return status;
3705 inode = cstate->current_fh.fh_dentry->d_inode;
1da177e4
LT
3706
3707 nfs4_lock_state();
38c2f4b1
BF
3708 status = nfsd4_lookup_stateid(stateid, NFS4_DELEG_STID, &s);
3709 if (status)
203a8c8e 3710 goto out;
38c2f4b1 3711 dp = delegstateid(s);
d5477a8d 3712 status = check_stateid_generation(stateid, &dp->dl_stid.sc_stateid, nfsd4_has_session(cstate));
203a8c8e
BF
3713 if (status)
3714 goto out;
203a8c8e
BF
3715
3716 unhash_delegation(dp);
1da177e4 3717out:
203a8c8e
BF
3718 nfs4_unlock_state();
3719
1da177e4
LT
3720 return status;
3721}
3722
3723
1da177e4 3724#define LOFF_OVERFLOW(start, len) ((u64)(len) > ~(u64)(start))
1da177e4 3725
009673b4
BF
3726#define LOCKOWNER_INO_HASH_BITS 8
3727#define LOCKOWNER_INO_HASH_SIZE (1 << LOCKOWNER_INO_HASH_BITS)
3728#define LOCKOWNER_INO_HASH_MASK (LOCKOWNER_INO_HASH_SIZE - 1)
3729
87df4de8
BH
3730static inline u64
3731end_offset(u64 start, u64 len)
3732{
3733 u64 end;
3734
3735 end = start + len;
3736 return end >= start ? end: NFS4_MAX_UINT64;
3737}
3738
3739/* last octet in a range */
3740static inline u64
3741last_byte_offset(u64 start, u64 len)
3742{
3743 u64 end;
3744
3745 BUG_ON(!len);
3746 end = start + len;
3747 return end > start ? end - 1: NFS4_MAX_UINT64;
3748}
3749
009673b4
BF
3750static unsigned int lockowner_ino_hashval(struct inode *inode, u32 cl_id, struct xdr_netobj *ownername)
3751{
3752 return (file_hashval(inode) + cl_id
3753 + opaque_hashval(ownername->data, ownername->len))
3754 & LOCKOWNER_INO_HASH_MASK;
3755}
3756
3757static struct list_head lockowner_ino_hashtbl[LOCKOWNER_INO_HASH_SIZE];
3758
1da177e4
LT
3759/*
3760 * TODO: Linux file offsets are _signed_ 64-bit quantities, which means that
3761 * we can't properly handle lock requests that go beyond the (2^63 - 1)-th
3762 * byte, because of sign extension problems. Since NFSv4 calls for 64-bit
3763 * locking, this prevents us from being completely protocol-compliant. The
3764 * real solution to this problem is to start using unsigned file offsets in
3765 * the VFS, but this is a very deep change!
3766 */
3767static inline void
3768nfs4_transform_lock_offset(struct file_lock *lock)
3769{
3770 if (lock->fl_start < 0)
3771 lock->fl_start = OFFSET_MAX;
3772 if (lock->fl_end < 0)
3773 lock->fl_end = OFFSET_MAX;
3774}
3775
d5b9026a
N
3776/* Hack!: For now, we're defining this just so we can use a pointer to it
3777 * as a unique cookie to identify our (NFSv4's) posix locks. */
7b021967 3778static const struct lock_manager_operations nfsd_posix_mng_ops = {
d5b9026a 3779};
1da177e4
LT
3780
3781static inline void
3782nfs4_set_lock_denied(struct file_lock *fl, struct nfsd4_lock_denied *deny)
3783{
fe0750e5 3784 struct nfs4_lockowner *lo;
1da177e4 3785
d5b9026a 3786 if (fl->fl_lmops == &nfsd_posix_mng_ops) {
fe0750e5
BF
3787 lo = (struct nfs4_lockowner *) fl->fl_owner;
3788 deny->ld_owner.data = kmemdup(lo->lo_owner.so_owner.data,
3789 lo->lo_owner.so_owner.len, GFP_KERNEL);
7c13f344
BF
3790 if (!deny->ld_owner.data)
3791 /* We just don't care that much */
3792 goto nevermind;
fe0750e5
BF
3793 deny->ld_owner.len = lo->lo_owner.so_owner.len;
3794 deny->ld_clientid = lo->lo_owner.so_client->cl_clientid;
d5b9026a 3795 } else {
7c13f344
BF
3796nevermind:
3797 deny->ld_owner.len = 0;
3798 deny->ld_owner.data = NULL;
d5b9026a
N
3799 deny->ld_clientid.cl_boot = 0;
3800 deny->ld_clientid.cl_id = 0;
1da177e4
LT
3801 }
3802 deny->ld_start = fl->fl_start;
87df4de8
BH
3803 deny->ld_length = NFS4_MAX_UINT64;
3804 if (fl->fl_end != NFS4_MAX_UINT64)
1da177e4
LT
3805 deny->ld_length = fl->fl_end - fl->fl_start + 1;
3806 deny->ld_type = NFS4_READ_LT;
3807 if (fl->fl_type != F_RDLCK)
3808 deny->ld_type = NFS4_WRITE_LT;
3809}
3810
b93d87c1
BF
3811static bool same_lockowner_ino(struct nfs4_lockowner *lo, struct inode *inode, clientid_t *clid, struct xdr_netobj *owner)
3812{
3813 struct nfs4_ol_stateid *lst;
3814
3815 if (!same_owner_str(&lo->lo_owner, owner, clid))
3816 return false;
3817 lst = list_first_entry(&lo->lo_owner.so_stateids,
3818 struct nfs4_ol_stateid, st_perstateowner);
3819 return lst->st_file->fi_inode == inode;
3820}
3821
fe0750e5
BF
3822static struct nfs4_lockowner *
3823find_lockowner_str(struct inode *inode, clientid_t *clid,
1da177e4
LT
3824 struct xdr_netobj *owner)
3825{
009673b4 3826 unsigned int hashval = lockowner_ino_hashval(inode, clid->cl_id, owner);
b93d87c1 3827 struct nfs4_lockowner *lo;
1da177e4 3828
009673b4 3829 list_for_each_entry(lo, &lockowner_ino_hashtbl[hashval], lo_owner_ino_hash) {
b93d87c1
BF
3830 if (same_lockowner_ino(lo, inode, clid, owner))
3831 return lo;
1da177e4
LT
3832 }
3833 return NULL;
3834}
3835
dcef0413 3836static void hash_lockowner(struct nfs4_lockowner *lo, unsigned int strhashval, struct nfs4_client *clp, struct nfs4_ol_stateid *open_stp)
ff194bd9 3837{
009673b4
BF
3838 struct inode *inode = open_stp->st_file->fi_inode;
3839 unsigned int inohash = lockowner_ino_hashval(inode,
3840 clp->cl_clientid.cl_id, &lo->lo_owner.so_owner);
3841
16bfdaaf 3842 list_add(&lo->lo_owner.so_strhash, &ownerstr_hashtbl[strhashval]);
009673b4 3843 list_add(&lo->lo_owner_ino_hash, &lockowner_ino_hashtbl[inohash]);
fe0750e5 3844 list_add(&lo->lo_perstateid, &open_stp->st_lockowners);
ff194bd9
BF
3845}
3846
1da177e4
LT
3847/*
3848 * Alloc a lock owner structure.
3849 * Called in nfsd4_lock - therefore, OPEN and OPEN_CONFIRM (if needed) has
25985edc 3850 * occurred.
1da177e4 3851 *
16bfdaaf 3852 * strhashval = ownerstr_hashval
1da177e4
LT
3853 */
3854
fe0750e5 3855static struct nfs4_lockowner *
dcef0413 3856alloc_init_lock_stateowner(unsigned int strhashval, struct nfs4_client *clp, struct nfs4_ol_stateid *open_stp, struct nfsd4_lock *lock) {
fe0750e5 3857 struct nfs4_lockowner *lo;
1da177e4 3858
fe0750e5
BF
3859 lo = alloc_stateowner(lockowner_slab, &lock->lk_new_owner, clp);
3860 if (!lo)
1da177e4 3861 return NULL;
fe0750e5
BF
3862 INIT_LIST_HEAD(&lo->lo_owner.so_stateids);
3863 lo->lo_owner.so_is_open_owner = 0;
b59e3c0e
NB
3864 /* It is the openowner seqid that will be incremented in encode in the
3865 * case of new lockowners; so increment the lock seqid manually: */
fe0750e5
BF
3866 lo->lo_owner.so_seqid = lock->lk_new_lock_seqid + 1;
3867 hash_lockowner(lo, strhashval, clp, open_stp);
3868 return lo;
1da177e4
LT
3869}
3870
dcef0413
BF
3871static struct nfs4_ol_stateid *
3872alloc_init_lock_stateid(struct nfs4_lockowner *lo, struct nfs4_file *fp, struct nfs4_ol_stateid *open_stp)
1da177e4 3873{
dcef0413 3874 struct nfs4_ol_stateid *stp;
d3b313a4 3875 struct nfs4_client *clp = lo->lo_owner.so_client;
1da177e4 3876
996e0938 3877 stp = nfs4_alloc_stateid(clp);
5ac049ac 3878 if (stp == NULL)
6136d2b4 3879 return NULL;
996e0938 3880 init_stid(&stp->st_stid, clp, NFS4_LOCK_STID);
8beefa24 3881 list_add(&stp->st_perfile, &fp->fi_stateids);
fe0750e5
BF
3882 list_add(&stp->st_perstateowner, &lo->lo_owner.so_stateids);
3883 stp->st_stateowner = &lo->lo_owner;
13cd2184 3884 get_nfs4_file(fp);
1da177e4 3885 stp->st_file = fp;
0997b173 3886 stp->st_access_bmap = 0;
1da177e4 3887 stp->st_deny_bmap = open_stp->st_deny_bmap;
4c4cd222 3888 stp->st_openstp = open_stp;
1da177e4
LT
3889 return stp;
3890}
3891
fd39ca9a 3892static int
1da177e4
LT
3893check_lock_length(u64 offset, u64 length)
3894{
87df4de8 3895 return ((length == 0) || ((length != NFS4_MAX_UINT64) &&
1da177e4
LT
3896 LOFF_OVERFLOW(offset, length)));
3897}
3898
dcef0413 3899static void get_lock_access(struct nfs4_ol_stateid *lock_stp, u32 access)
0997b173
BF
3900{
3901 struct nfs4_file *fp = lock_stp->st_file;
3902 int oflag = nfs4_access_to_omode(access);
3903
3904 if (test_bit(access, &lock_stp->st_access_bmap))
3905 return;
3906 nfs4_file_get_access(fp, oflag);
3907 __set_bit(access, &lock_stp->st_access_bmap);
3908}
3909
64a284d0
BF
3910__be32 lookup_or_create_lock_state(struct nfsd4_compound_state *cstate, struct nfs4_ol_stateid *ost, struct nfsd4_lock *lock, struct nfs4_ol_stateid **lst, bool *new)
3911{
3912 struct nfs4_file *fi = ost->st_file;
3913 struct nfs4_openowner *oo = openowner(ost->st_stateowner);
3914 struct nfs4_client *cl = oo->oo_owner.so_client;
3915 struct nfs4_lockowner *lo;
3916 unsigned int strhashval;
3917
3918 lo = find_lockowner_str(fi->fi_inode, &cl->cl_clientid, &lock->v.new.owner);
3919 if (lo) {
3920 if (!cstate->minorversion)
3921 return nfserr_bad_seqid;
3922 /* XXX: a lockowner always has exactly one stateid: */
3923 *lst = list_first_entry(&lo->lo_owner.so_stateids,
3924 struct nfs4_ol_stateid, st_perstateowner);
3925 return nfs_ok;
3926 }
16bfdaaf 3927 strhashval = ownerstr_hashval(cl->cl_clientid.cl_id,
64a284d0
BF
3928 &lock->v.new.owner);
3929 lo = alloc_init_lock_stateowner(strhashval, cl, ost, lock);
3930 if (lo == NULL)
3931 return nfserr_jukebox;
3932 *lst = alloc_init_lock_stateid(lo, fi, ost);
3933 if (*lst == NULL) {
3934 release_lockowner(lo);
3935 return nfserr_jukebox;
3936 }
3937 *new = true;
3938 return nfs_ok;
3939}
3940
1da177e4
LT
3941/*
3942 * LOCK operation
3943 */
b37ad28b 3944__be32
ca364317 3945nfsd4_lock(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
a4f1706a 3946 struct nfsd4_lock *lock)
1da177e4 3947{
fe0750e5
BF
3948 struct nfs4_openowner *open_sop = NULL;
3949 struct nfs4_lockowner *lock_sop = NULL;
dcef0413 3950 struct nfs4_ol_stateid *lock_stp;
7d947842
BF
3951 struct nfs4_file *fp;
3952 struct file *filp = NULL;
1da177e4 3953 struct file_lock file_lock;
8dc7c311 3954 struct file_lock conflock;
b37ad28b 3955 __be32 status = 0;
64a284d0 3956 bool new_state = false;
b34f27aa 3957 int lkflg;
b8dd7b9a 3958 int err;
1da177e4
LT
3959
3960 dprintk("NFSD: nfsd4_lock: start=%Ld length=%Ld\n",
3961 (long long) lock->lk_offset,
3962 (long long) lock->lk_length);
3963
1da177e4
LT
3964 if (check_lock_length(lock->lk_offset, lock->lk_length))
3965 return nfserr_inval;
3966
ca364317 3967 if ((status = fh_verify(rqstp, &cstate->current_fh,
8837abca 3968 S_IFREG, NFSD_MAY_LOCK))) {
a6f6ef2f
AA
3969 dprintk("NFSD: nfsd4_lock: permission denied!\n");
3970 return status;
3971 }
3972
1da177e4
LT
3973 nfs4_lock_state();
3974
3975 if (lock->lk_is_new) {
893f8770
N
3976 /*
3977 * Client indicates that this is a new lockowner.
3978 * Use open owner and open stateid to create lock owner and
3979 * lock stateid.
3980 */
dcef0413 3981 struct nfs4_ol_stateid *open_stp = NULL;
684e5638
BF
3982
3983 if (nfsd4_has_session(cstate))
3984 /* See rfc 5661 18.10.3: given clientid is ignored: */
3985 memcpy(&lock->v.new.clientid,
3986 &cstate->session->se_client->cl_clientid,
3987 sizeof(clientid_t));
3988
1da177e4 3989 status = nfserr_stale_clientid;
684e5638 3990 if (STALE_CLIENTID(&lock->lk_new_clientid))
1da177e4 3991 goto out;
1da177e4 3992
1da177e4 3993 /* validate and update open stateid and open seqid */
c0a5d93e 3994 status = nfs4_preprocess_confirmed_seqid_op(cstate,
1da177e4
LT
3995 lock->lk_new_open_seqid,
3996 &lock->lk_new_open_stateid,
c0a5d93e 3997 &open_stp);
37515177 3998 if (status)
1da177e4 3999 goto out;
fe0750e5 4000 open_sop = openowner(open_stp->st_stateowner);
b34f27aa 4001 status = nfserr_bad_stateid;
684e5638 4002 if (!same_clid(&open_sop->oo_owner.so_client->cl_clientid,
b34f27aa
BF
4003 &lock->v.new.clientid))
4004 goto out;
64a284d0
BF
4005 status = lookup_or_create_lock_state(cstate, open_stp, lock,
4006 &lock_stp, &new_state);
4007 if (status)
1da177e4 4008 goto out;
1da177e4
LT
4009 } else {
4010 /* lock (lock owner + lock stateid) already exists */
dd453dfd 4011 status = nfs4_preprocess_seqid_op(cstate,
fe0750e5
BF
4012 lock->lk_old_lock_seqid,
4013 &lock->lk_old_lock_stateid,
2288d0e3 4014 NFS4_LOCK_STID, &lock_stp);
1da177e4
LT
4015 if (status)
4016 goto out;
4017 }
64a284d0
BF
4018 lock_sop = lockowner(lock_stp->st_stateowner);
4019 fp = lock_stp->st_file;
1da177e4 4020
b34f27aa
BF
4021 lkflg = setlkflg(lock->lk_type);
4022 status = nfs4_check_openmode(lock_stp, lkflg);
4023 if (status)
4024 goto out;
4025
0dd395dc 4026 status = nfserr_grace;
af558e33 4027 if (locks_in_grace() && !lock->lk_reclaim)
0dd395dc
N
4028 goto out;
4029 status = nfserr_no_grace;
af558e33 4030 if (!locks_in_grace() && lock->lk_reclaim)
0dd395dc
N
4031 goto out;
4032
1da177e4
LT
4033 locks_init_lock(&file_lock);
4034 switch (lock->lk_type) {
4035 case NFS4_READ_LT:
4036 case NFS4_READW_LT:
0997b173
BF
4037 filp = find_readable_file(lock_stp->st_file);
4038 if (filp)
4039 get_lock_access(lock_stp, NFS4_SHARE_ACCESS_READ);
1da177e4 4040 file_lock.fl_type = F_RDLCK;
529d7b2a 4041 break;
1da177e4
LT
4042 case NFS4_WRITE_LT:
4043 case NFS4_WRITEW_LT:
0997b173
BF
4044 filp = find_writeable_file(lock_stp->st_file);
4045 if (filp)
4046 get_lock_access(lock_stp, NFS4_SHARE_ACCESS_WRITE);
1da177e4 4047 file_lock.fl_type = F_WRLCK;
529d7b2a 4048 break;
1da177e4
LT
4049 default:
4050 status = nfserr_inval;
4051 goto out;
4052 }
f9d7562f
BF
4053 if (!filp) {
4054 status = nfserr_openmode;
4055 goto out;
4056 }
b59e3c0e 4057 file_lock.fl_owner = (fl_owner_t)lock_sop;
1da177e4
LT
4058 file_lock.fl_pid = current->tgid;
4059 file_lock.fl_file = filp;
4060 file_lock.fl_flags = FL_POSIX;
d5b9026a 4061 file_lock.fl_lmops = &nfsd_posix_mng_ops;
1da177e4
LT
4062
4063 file_lock.fl_start = lock->lk_offset;
87df4de8 4064 file_lock.fl_end = last_byte_offset(lock->lk_offset, lock->lk_length);
1da177e4
LT
4065 nfs4_transform_lock_offset(&file_lock);
4066
4067 /*
4068 * Try to lock the file in the VFS.
4069 * Note: locks.c uses the BKL to protect the inode's lock list.
4070 */
4071
529d7b2a 4072 err = vfs_lock_file(filp, F_SETLK, &file_lock, &conflock);
b8dd7b9a 4073 switch (-err) {
1da177e4 4074 case 0: /* success! */
dcef0413
BF
4075 update_stateid(&lock_stp->st_stid.sc_stateid);
4076 memcpy(&lock->lk_resp_stateid, &lock_stp->st_stid.sc_stateid,
1da177e4 4077 sizeof(stateid_t));
b8dd7b9a 4078 status = 0;
eb76b3fd
AA
4079 break;
4080 case (EAGAIN): /* conflock holds conflicting lock */
4081 status = nfserr_denied;
4082 dprintk("NFSD: nfsd4_lock: conflicting lock found!\n");
4083 nfs4_set_lock_denied(&conflock, &lock->lk_denied);
4084 break;
1da177e4
LT
4085 case (EDEADLK):
4086 status = nfserr_deadlock;
eb76b3fd 4087 break;
3e772463 4088 default:
fd85b817 4089 dprintk("NFSD: nfsd4_lock: vfs_lock_file() failed! status %d\n",err);
3e772463 4090 status = nfserrno(err);
eb76b3fd 4091 break;
1da177e4 4092 }
1da177e4 4093out:
64a284d0 4094 if (status && new_state)
f044ff83 4095 release_lockowner(lock_sop);
5ec094c1
BF
4096 if (!cstate->replay_owner)
4097 nfs4_unlock_state();
1da177e4
LT
4098 return status;
4099}
4100
55ef1274
BF
4101/*
4102 * The NFSv4 spec allows a client to do a LOCKT without holding an OPEN,
4103 * so we do a temporary open here just to get an open file to pass to
4104 * vfs_test_lock. (Arguably perhaps test_lock should be done with an
4105 * inode operation.)
4106 */
4107static int nfsd_test_lock(struct svc_rqst *rqstp, struct svc_fh *fhp, struct file_lock *lock)
4108{
4109 struct file *file;
4110 int err;
4111
4112 err = nfsd_open(rqstp, fhp, S_IFREG, NFSD_MAY_READ, &file);
4113 if (err)
4114 return err;
4115 err = vfs_test_lock(file, lock);
4116 nfsd_close(file);
4117 return err;
4118}
4119
1da177e4
LT
4120/*
4121 * LOCKT operation
4122 */
b37ad28b 4123__be32
ca364317
BF
4124nfsd4_lockt(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
4125 struct nfsd4_lockt *lockt)
1da177e4
LT
4126{
4127 struct inode *inode;
1da177e4 4128 struct file_lock file_lock;
fe0750e5 4129 struct nfs4_lockowner *lo;
fd85b817 4130 int error;
b37ad28b 4131 __be32 status;
1da177e4 4132
af558e33 4133 if (locks_in_grace())
1da177e4
LT
4134 return nfserr_grace;
4135
4136 if (check_lock_length(lockt->lt_offset, lockt->lt_length))
4137 return nfserr_inval;
4138
1da177e4
LT
4139 nfs4_lock_state();
4140
4141 status = nfserr_stale_clientid;
60adfc50 4142 if (!nfsd4_has_session(cstate) && STALE_CLIENTID(&lockt->lt_clientid))
1da177e4 4143 goto out;
1da177e4 4144
75c096f7 4145 if ((status = fh_verify(rqstp, &cstate->current_fh, S_IFREG, 0)))
1da177e4 4146 goto out;
1da177e4 4147
ca364317 4148 inode = cstate->current_fh.fh_dentry->d_inode;
1da177e4
LT
4149 locks_init_lock(&file_lock);
4150 switch (lockt->lt_type) {
4151 case NFS4_READ_LT:
4152 case NFS4_READW_LT:
4153 file_lock.fl_type = F_RDLCK;
4154 break;
4155 case NFS4_WRITE_LT:
4156 case NFS4_WRITEW_LT:
4157 file_lock.fl_type = F_WRLCK;
4158 break;
4159 default:
2fdada03 4160 dprintk("NFSD: nfs4_lockt: bad lock type!\n");
1da177e4
LT
4161 status = nfserr_inval;
4162 goto out;
4163 }
4164
fe0750e5
BF
4165 lo = find_lockowner_str(inode, &lockt->lt_clientid, &lockt->lt_owner);
4166 if (lo)
4167 file_lock.fl_owner = (fl_owner_t)lo;
1da177e4
LT
4168 file_lock.fl_pid = current->tgid;
4169 file_lock.fl_flags = FL_POSIX;
4170
4171 file_lock.fl_start = lockt->lt_offset;
87df4de8 4172 file_lock.fl_end = last_byte_offset(lockt->lt_offset, lockt->lt_length);
1da177e4
LT
4173
4174 nfs4_transform_lock_offset(&file_lock);
4175
1da177e4 4176 status = nfs_ok;
55ef1274 4177 error = nfsd_test_lock(rqstp, &cstate->current_fh, &file_lock);
fd85b817
ME
4178 if (error) {
4179 status = nfserrno(error);
4180 goto out;
4181 }
9d6a8c5c 4182 if (file_lock.fl_type != F_UNLCK) {
1da177e4 4183 status = nfserr_denied;
9d6a8c5c 4184 nfs4_set_lock_denied(&file_lock, &lockt->lt_denied);
1da177e4
LT
4185 }
4186out:
4187 nfs4_unlock_state();
4188 return status;
4189}
4190
b37ad28b 4191__be32
ca364317 4192nfsd4_locku(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
a4f1706a 4193 struct nfsd4_locku *locku)
1da177e4 4194{
dcef0413 4195 struct nfs4_ol_stateid *stp;
1da177e4
LT
4196 struct file *filp = NULL;
4197 struct file_lock file_lock;
b37ad28b 4198 __be32 status;
b8dd7b9a 4199 int err;
1da177e4
LT
4200
4201 dprintk("NFSD: nfsd4_locku: start=%Ld length=%Ld\n",
4202 (long long) locku->lu_offset,
4203 (long long) locku->lu_length);
4204
4205 if (check_lock_length(locku->lu_offset, locku->lu_length))
4206 return nfserr_inval;
4207
4208 nfs4_lock_state();
4209
9072d5c6 4210 status = nfs4_preprocess_seqid_op(cstate, locku->lu_seqid,
2288d0e3 4211 &locku->lu_stateid, NFS4_LOCK_STID, &stp);
9072d5c6 4212 if (status)
1da177e4 4213 goto out;
f9d7562f
BF
4214 filp = find_any_file(stp->st_file);
4215 if (!filp) {
4216 status = nfserr_lock_range;
4217 goto out;
4218 }
1da177e4
LT
4219 BUG_ON(!filp);
4220 locks_init_lock(&file_lock);
4221 file_lock.fl_type = F_UNLCK;
fe0750e5 4222 file_lock.fl_owner = (fl_owner_t)lockowner(stp->st_stateowner);
1da177e4
LT
4223 file_lock.fl_pid = current->tgid;
4224 file_lock.fl_file = filp;
4225 file_lock.fl_flags = FL_POSIX;
d5b9026a 4226 file_lock.fl_lmops = &nfsd_posix_mng_ops;
1da177e4
LT
4227 file_lock.fl_start = locku->lu_offset;
4228
87df4de8 4229 file_lock.fl_end = last_byte_offset(locku->lu_offset, locku->lu_length);
1da177e4
LT
4230 nfs4_transform_lock_offset(&file_lock);
4231
4232 /*
4233 * Try to unlock the file in the VFS.
4234 */
fd85b817 4235 err = vfs_lock_file(filp, F_SETLK, &file_lock, NULL);
b8dd7b9a 4236 if (err) {
fd85b817 4237 dprintk("NFSD: nfs4_locku: vfs_lock_file failed!\n");
1da177e4
LT
4238 goto out_nfserr;
4239 }
4240 /*
4241 * OK, unlock succeeded; the only thing left to do is update the stateid.
4242 */
dcef0413
BF
4243 update_stateid(&stp->st_stid.sc_stateid);
4244 memcpy(&locku->lu_stateid, &stp->st_stid.sc_stateid, sizeof(stateid_t));
1da177e4
LT
4245
4246out:
71c3bcd7
BF
4247 if (!cstate->replay_owner)
4248 nfs4_unlock_state();
1da177e4
LT
4249 return status;
4250
4251out_nfserr:
b8dd7b9a 4252 status = nfserrno(err);
1da177e4
LT
4253 goto out;
4254}
4255
4256/*
4257 * returns
4258 * 1: locks held by lockowner
4259 * 0: no locks held by lockowner
4260 */
4261static int
fe0750e5 4262check_for_locks(struct nfs4_file *filp, struct nfs4_lockowner *lowner)
1da177e4
LT
4263{
4264 struct file_lock **flpp;
f9d7562f 4265 struct inode *inode = filp->fi_inode;
1da177e4
LT
4266 int status = 0;
4267
b89f4321 4268 lock_flocks();
1da177e4 4269 for (flpp = &inode->i_flock; *flpp != NULL; flpp = &(*flpp)->fl_next) {
796dadfd 4270 if ((*flpp)->fl_owner == (fl_owner_t)lowner) {
1da177e4
LT
4271 status = 1;
4272 goto out;
796dadfd 4273 }
1da177e4
LT
4274 }
4275out:
b89f4321 4276 unlock_flocks();
1da177e4
LT
4277 return status;
4278}
4279
b37ad28b 4280__be32
b591480b
BF
4281nfsd4_release_lockowner(struct svc_rqst *rqstp,
4282 struct nfsd4_compound_state *cstate,
4283 struct nfsd4_release_lockowner *rlockowner)
1da177e4
LT
4284{
4285 clientid_t *clid = &rlockowner->rl_clientid;
3e9e3dbe 4286 struct nfs4_stateowner *sop;
fe0750e5 4287 struct nfs4_lockowner *lo;
dcef0413 4288 struct nfs4_ol_stateid *stp;
1da177e4 4289 struct xdr_netobj *owner = &rlockowner->rl_owner;
3e9e3dbe 4290 struct list_head matches;
16bfdaaf 4291 unsigned int hashval = ownerstr_hashval(clid->cl_id, owner);
b37ad28b 4292 __be32 status;
1da177e4
LT
4293
4294 dprintk("nfsd4_release_lockowner clientid: (%08x/%08x):\n",
4295 clid->cl_boot, clid->cl_id);
4296
4297 /* XXX check for lease expiration */
4298
4299 status = nfserr_stale_clientid;
849823c5 4300 if (STALE_CLIENTID(clid))
1da177e4 4301 return status;
1da177e4
LT
4302
4303 nfs4_lock_state();
4304
3e9e3dbe 4305 status = nfserr_locks_held;
3e9e3dbe 4306 INIT_LIST_HEAD(&matches);
06f1f864 4307
16bfdaaf
BF
4308 list_for_each_entry(sop, &ownerstr_hashtbl[hashval], so_strhash) {
4309 if (sop->so_is_open_owner)
4310 continue;
06f1f864
BF
4311 if (!same_owner_str(sop, owner, clid))
4312 continue;
4313 list_for_each_entry(stp, &sop->so_stateids,
4314 st_perstateowner) {
4315 lo = lockowner(sop);
4316 if (check_for_locks(stp->st_file, lo))
4317 goto out;
4318 list_add(&lo->lo_list, &matches);
1da177e4 4319 }
3e9e3dbe
N
4320 }
4321 /* Clients probably won't expect us to return with some (but not all)
4322 * of the lockowner state released; so don't release any until all
4323 * have been checked. */
4324 status = nfs_ok;
0fa822e4 4325 while (!list_empty(&matches)) {
fe0750e5
BF
4326 lo = list_entry(matches.next, struct nfs4_lockowner,
4327 lo_list);
0fa822e4
N
4328 /* unhash_stateowner deletes so_perclient only
4329 * for openowners. */
fe0750e5
BF
4330 list_del(&lo->lo_list);
4331 release_lockowner(lo);
1da177e4
LT
4332 }
4333out:
4334 nfs4_unlock_state();
4335 return status;
4336}
4337
4338static inline struct nfs4_client_reclaim *
a55370a3 4339alloc_reclaim(void)
1da177e4 4340{
a55370a3 4341 return kmalloc(sizeof(struct nfs4_client_reclaim), GFP_KERNEL);
1da177e4
LT
4342}
4343
c7b9a459 4344int
a1bcecd2 4345nfs4_has_reclaimed_state(const char *name, bool use_exchange_id)
c7b9a459
N
4346{
4347 unsigned int strhashval = clientstr_hashval(name);
4348 struct nfs4_client *clp;
4349
e203d506 4350 clp = find_confirmed_client_by_str(name, strhashval);
c7b9a459
N
4351 return clp ? 1 : 0;
4352}
4353
1da177e4
LT
4354/*
4355 * failure => all reset bets are off, nfserr_no_grace...
4356 */
190e4fbf
N
4357int
4358nfs4_client_to_reclaim(const char *name)
1da177e4
LT
4359{
4360 unsigned int strhashval;
4361 struct nfs4_client_reclaim *crp = NULL;
4362
a55370a3
N
4363 dprintk("NFSD nfs4_client_to_reclaim NAME: %.*s\n", HEXDIR_LEN, name);
4364 crp = alloc_reclaim();
1da177e4
LT
4365 if (!crp)
4366 return 0;
a55370a3 4367 strhashval = clientstr_hashval(name);
1da177e4
LT
4368 INIT_LIST_HEAD(&crp->cr_strhash);
4369 list_add(&crp->cr_strhash, &reclaim_str_hashtbl[strhashval]);
a55370a3 4370 memcpy(crp->cr_recdir, name, HEXDIR_LEN);
1da177e4
LT
4371 reclaim_str_hashtbl_size++;
4372 return 1;
4373}
4374
4375static void
4376nfs4_release_reclaim(void)
4377{
4378 struct nfs4_client_reclaim *crp = NULL;
4379 int i;
4380
1da177e4
LT
4381 for (i = 0; i < CLIENT_HASH_SIZE; i++) {
4382 while (!list_empty(&reclaim_str_hashtbl[i])) {
4383 crp = list_entry(reclaim_str_hashtbl[i].next,
4384 struct nfs4_client_reclaim, cr_strhash);
4385 list_del(&crp->cr_strhash);
1da177e4
LT
4386 kfree(crp);
4387 reclaim_str_hashtbl_size--;
4388 }
4389 }
4390 BUG_ON(reclaim_str_hashtbl_size);
4391}
4392
4393/*
4394 * called from OPEN, CLAIM_PREVIOUS with a new clientid. */
fd39ca9a 4395static struct nfs4_client_reclaim *
1da177e4
LT
4396nfs4_find_reclaim_client(clientid_t *clid)
4397{
4398 unsigned int strhashval;
4399 struct nfs4_client *clp;
4400 struct nfs4_client_reclaim *crp = NULL;
4401
4402
4403 /* find clientid in conf_id_hashtbl */
4404 clp = find_confirmed_client(clid);
4405 if (clp == NULL)
4406 return NULL;
4407
a55370a3
N
4408 dprintk("NFSD: nfs4_find_reclaim_client for %.*s with recdir %s\n",
4409 clp->cl_name.len, clp->cl_name.data,
4410 clp->cl_recdir);
1da177e4
LT
4411
4412 /* find clp->cl_name in reclaim_str_hashtbl */
a55370a3 4413 strhashval = clientstr_hashval(clp->cl_recdir);
1da177e4 4414 list_for_each_entry(crp, &reclaim_str_hashtbl[strhashval], cr_strhash) {
a55370a3 4415 if (same_name(crp->cr_recdir, clp->cl_recdir)) {
1da177e4
LT
4416 return crp;
4417 }
4418 }
4419 return NULL;
4420}
4421
4422/*
4423* Called from OPEN. Look for clientid in reclaim list.
4424*/
b37ad28b 4425__be32
1da177e4
LT
4426nfs4_check_open_reclaim(clientid_t *clid)
4427{
dfc83565 4428 return nfs4_find_reclaim_client(clid) ? nfs_ok : nfserr_reclaim_bad;
1da177e4
LT
4429}
4430
65178db4
BS
4431#ifdef CONFIG_NFSD_FAULT_INJECTION
4432
4433void nfsd_forget_clients(u64 num)
4434{
4435 struct nfs4_client *clp, *next;
4436 int count = 0;
4437
4438 nfs4_lock_state();
4439 list_for_each_entry_safe(clp, next, &client_lru, cl_lru) {
4440 nfsd4_remove_clid_dir(clp);
4441 expire_client(clp);
4442 if (++count == num)
4443 break;
4444 }
4445 nfs4_unlock_state();
4446
4447 printk(KERN_INFO "NFSD: Forgot %d clients", count);
4448}
4449
/* Adapter: release a stateowner that is known to be a lockowner. */
static void release_lockowner_sop(struct nfs4_stateowner *sop)
{
	struct nfs4_lockowner *lo = lockowner(sop);

	release_lockowner(lo);
}
4454
/* Adapter: release a stateowner that is known to be an openowner. */
static void release_openowner_sop(struct nfs4_stateowner *sop)
{
	struct nfs4_openowner *oo = openowner(sop);

	release_openowner(oo);
}
4459
353de31b 4460static int nfsd_release_n_owners(u64 num, bool is_open_owner,
65178db4
BS
4461 void (*release_sop)(struct nfs4_stateowner *))
4462{
4463 int i, count = 0;
4464 struct nfs4_stateowner *sop, *next;
4465
16bfdaaf
BF
4466 for (i = 0; i < OWNER_HASH_SIZE; i++) {
4467 list_for_each_entry_safe(sop, next, &ownerstr_hashtbl[i], so_strhash) {
4468 if (sop->so_is_open_owner != is_open_owner)
4469 continue;
65178db4
BS
4470 release_sop(sop);
4471 if (++count == num)
4472 return count;
4473 }
4474 }
4475 return count;
4476}
4477
4478void nfsd_forget_locks(u64 num)
4479{
4480 int count;
4481
4482 nfs4_lock_state();
16bfdaaf 4483 count = nfsd_release_n_owners(num, false, release_lockowner_sop);
65178db4
BS
4484 nfs4_unlock_state();
4485
4486 printk(KERN_INFO "NFSD: Forgot %d locks", count);
4487}
4488
4489void nfsd_forget_openowners(u64 num)
4490{
4491 int count;
4492
4493 nfs4_lock_state();
16bfdaaf 4494 count = nfsd_release_n_owners(num, true, release_openowner_sop);
65178db4
BS
4495 nfs4_unlock_state();
4496
4497 printk(KERN_INFO "NFSD: Forgot %d open owners", count);
4498}
4499
4500int nfsd_process_n_delegations(u64 num, void (*deleg_func)(struct nfs4_delegation *))
4501{
4502 int i, count = 0;
4503 struct nfs4_file *fp;
4504 struct nfs4_delegation *dp, *next;
4505
4506 for (i = 0; i < FILE_HASH_SIZE; i++) {
4507 list_for_each_entry(fp, &file_hashtbl[i], fi_hash) {
4508 list_for_each_entry_safe(dp, next, &fp->fi_delegations, dl_perfile) {
4509 deleg_func(dp);
4510 if (++count == num)
4511 return count;
4512 }
4513 }
4514 }
4515 return count;
4516}
4517
4518void nfsd_forget_delegations(u64 num)
4519{
4520 unsigned int count;
4521
4522 nfs4_lock_state();
4523 count = nfsd_process_n_delegations(num, unhash_delegation);
4524 nfs4_unlock_state();
4525
4526 printk(KERN_INFO "NFSD: Forgot %d delegations", count);
4527}
4528
4529void nfsd_recall_delegations(u64 num)
4530{
4531 unsigned int count;
4532
4533 nfs4_lock_state();
4534 spin_lock(&recall_lock);
4535 count = nfsd_process_n_delegations(num, nfsd_break_one_deleg);
4536 spin_unlock(&recall_lock);
4537 nfs4_unlock_state();
4538
4539 printk(KERN_INFO "NFSD: Recalled %d delegations", count);
4540}
4541
4542#endif /* CONFIG_NFSD_FAULT_INJECTION */
4543
ac4d8ff2 4544/* initialization to perform at module load time: */
1da177e4 4545
72083396 4546void
ac4d8ff2 4547nfs4_state_init(void)
1da177e4 4548{
72083396 4549 int i;
1da177e4 4550
1da177e4
LT
4551 for (i = 0; i < CLIENT_HASH_SIZE; i++) {
4552 INIT_LIST_HEAD(&conf_id_hashtbl[i]);
4553 INIT_LIST_HEAD(&conf_str_hashtbl[i]);
4554 INIT_LIST_HEAD(&unconf_str_hashtbl[i]);
4555 INIT_LIST_HEAD(&unconf_id_hashtbl[i]);
02cb2858 4556 INIT_LIST_HEAD(&reclaim_str_hashtbl[i]);
1da177e4 4557 }
5282fd72
ME
4558 for (i = 0; i < SESSION_HASH_SIZE; i++)
4559 INIT_LIST_HEAD(&sessionid_hashtbl[i]);
1da177e4
LT
4560 for (i = 0; i < FILE_HASH_SIZE; i++) {
4561 INIT_LIST_HEAD(&file_hashtbl[i]);
4562 }
16bfdaaf
BF
4563 for (i = 0; i < OWNER_HASH_SIZE; i++) {
4564 INIT_LIST_HEAD(&ownerstr_hashtbl[i]);
1da177e4 4565 }
009673b4
BF
4566 for (i = 0; i < LOCKOWNER_INO_HASH_SIZE; i++)
4567 INIT_LIST_HEAD(&lockowner_ino_hashtbl[i]);
1da177e4 4568 memset(&onestateid, ~0, sizeof(stateid_t));
1da177e4
LT
4569 INIT_LIST_HEAD(&close_lru);
4570 INIT_LIST_HEAD(&client_lru);
4571 INIT_LIST_HEAD(&del_recall_lru);
ac4d8ff2 4572 reclaim_str_hashtbl_size = 0;
ac4d8ff2
N
4573}
4574
/*
 * Initialize the recovery directory and load the recorded clients, all
 * under the state lock.  A load failure is logged but not propagated.
 */
static void
nfsd4_load_reboot_recovery_data(void)
{
	int load_err;

	nfs4_lock_state();
	nfsd4_init_recdir();
	load_err = nfsd4_recdir_load();
	nfs4_unlock_state();

	if (load_err != 0)
		printk("NFSD: Failure reading reboot recovery data\n");
}
4587
c2f1a551
MS
4588/*
4589 * Since the lifetime of a delegation isn't limited to that of an open, a
4590 * client may quite reasonably hang on to a delegation as long as it has
4591 * the inode cached. This becomes an obvious problem the first time a
4592 * client's inode cache approaches the size of the server's total memory.
4593 *
4594 * For now we avoid this problem by imposing a hard limit on the number
4595 * of delegations, which varies according to the server's memory size.
4596 */
4597static void
4598set_max_delegations(void)
4599{
4600 /*
4601 * Allow at most 4 delegations per megabyte of RAM. Quick
4602 * estimates suggest that in the worst case (where every delegation
4603 * is for a different inode), a delegation could take about 1.5K,
4604 * giving a worst case usage of about 6% of memory.
4605 */
4606 max_delegations = nr_free_buffer_pages() >> (20 - 2 - PAGE_SHIFT);
4607}
4608
ac4d8ff2
N
4609/* initialization to perform when the nfsd service is started: */
4610
29ab23cc 4611static int
ac4d8ff2
N
4612__nfs4_state_start(void)
4613{
b5a1a81e
BF
4614 int ret;
4615
1da177e4 4616 boot_time = get_seconds();
af558e33 4617 locks_start_grace(&nfsd4_manager);
9a8db97e 4618 printk(KERN_INFO "NFSD: starting %ld-second grace period\n",
e46b498c 4619 nfsd4_grace);
b5a1a81e
BF
4620 ret = set_callback_cred();
4621 if (ret)
4622 return -ENOMEM;
58da282b 4623 laundry_wq = create_singlethread_workqueue("nfsd4");
29ab23cc
BF
4624 if (laundry_wq == NULL)
4625 return -ENOMEM;
b5a1a81e
BF
4626 ret = nfsd4_create_callback_queue();
4627 if (ret)
4628 goto out_free_laundry;
e46b498c 4629 queue_delayed_work(laundry_wq, &laundromat_work, nfsd4_grace * HZ);
c2f1a551 4630 set_max_delegations();
b5a1a81e
BF
4631 return 0;
4632out_free_laundry:
4633 destroy_workqueue(laundry_wq);
4634 return ret;
1da177e4
LT
4635}
4636
/*
 * Bring up NFSv4 state handling: load reboot recovery data, then run the
 * per-start initialization.  Returns that initialization's result.
 */
int
nfs4_state_start(void)
{
	int ret;

	nfsd4_load_reboot_recovery_data();
	ret = __nfs4_state_start();
	return ret;
}
4643
1da177e4
LT
4644static void
4645__nfs4_state_shutdown(void)
4646{
4647 int i;
4648 struct nfs4_client *clp = NULL;
4649 struct nfs4_delegation *dp = NULL;
1da177e4
LT
4650 struct list_head *pos, *next, reaplist;
4651
1da177e4
LT
4652 for (i = 0; i < CLIENT_HASH_SIZE; i++) {
4653 while (!list_empty(&conf_id_hashtbl[i])) {
4654 clp = list_entry(conf_id_hashtbl[i].next, struct nfs4_client, cl_idhash);
4655 expire_client(clp);
4656 }
4657 while (!list_empty(&unconf_str_hashtbl[i])) {
4658 clp = list_entry(unconf_str_hashtbl[i].next, struct nfs4_client, cl_strhash);
4659 expire_client(clp);
4660 }
4661 }
4662 INIT_LIST_HEAD(&reaplist);
4663 spin_lock(&recall_lock);
4664 list_for_each_safe(pos, next, &del_recall_lru) {
4665 dp = list_entry (pos, struct nfs4_delegation, dl_recall_lru);
4666 list_move(&dp->dl_recall_lru, &reaplist);
4667 }
4668 spin_unlock(&recall_lock);
4669 list_for_each_safe(pos, next, &reaplist) {
4670 dp = list_entry (pos, struct nfs4_delegation, dl_recall_lru);
4671 list_del_init(&dp->dl_recall_lru);
4672 unhash_delegation(dp);
4673 }
4674
190e4fbf 4675 nfsd4_shutdown_recdir();
1da177e4
LT
4676}
4677
4678void
4679nfs4_state_shutdown(void)
4680{
afe2c511 4681 cancel_delayed_work_sync(&laundromat_work);
5e8d5c29 4682 destroy_workqueue(laundry_wq);
2c5e7615 4683 locks_end_grace(&nfsd4_manager);
1da177e4
LT
4684 nfs4_lock_state();
4685 nfs4_release_reclaim();
4686 __nfs4_state_shutdown();
1da177e4 4687 nfs4_unlock_state();
c3935e30 4688 nfsd4_destroy_callback_queue();
1da177e4 4689}