NFS: Treat NFS4ERR_CLID_INUSE as a fatal error
[linux-2.6-block.git] / fs / nfs / nfs4proc.c
1 /*
2  *  fs/nfs/nfs4proc.c
3  *
4  *  Client-side procedure declarations for NFSv4.
5  *
6  *  Copyright (c) 2002 The Regents of the University of Michigan.
7  *  All rights reserved.
8  *
9  *  Kendrick Smith <kmsmith@umich.edu>
10  *  Andy Adamson   <andros@umich.edu>
11  *
12  *  Redistribution and use in source and binary forms, with or without
13  *  modification, are permitted provided that the following conditions
14  *  are met:
15  *
16  *  1. Redistributions of source code must retain the above copyright
17  *     notice, this list of conditions and the following disclaimer.
18  *  2. Redistributions in binary form must reproduce the above copyright
19  *     notice, this list of conditions and the following disclaimer in the
20  *     documentation and/or other materials provided with the distribution.
21  *  3. Neither the name of the University nor the names of its
22  *     contributors may be used to endorse or promote products derived
23  *     from this software without specific prior written permission.
24  *
25  *  THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED
26  *  WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
27  *  MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
28  *  DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
29  *  FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
30  *  CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
31  *  SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
32  *  BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
33  *  LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
34  *  NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
35  *  SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
36  */
37
38 #include <linux/mm.h>
39 #include <linux/delay.h>
40 #include <linux/errno.h>
41 #include <linux/string.h>
42 #include <linux/ratelimit.h>
43 #include <linux/printk.h>
44 #include <linux/slab.h>
45 #include <linux/sunrpc/clnt.h>
46 #include <linux/nfs.h>
47 #include <linux/nfs4.h>
48 #include <linux/nfs_fs.h>
49 #include <linux/nfs_page.h>
50 #include <linux/nfs_mount.h>
51 #include <linux/namei.h>
52 #include <linux/mount.h>
53 #include <linux/module.h>
54 #include <linux/nfs_idmap.h>
55 #include <linux/sunrpc/bc_xprt.h>
56 #include <linux/xattr.h>
57 #include <linux/utsname.h>
58 #include <linux/freezer.h>
59
60 #include "nfs4_fs.h"
61 #include "delegation.h"
62 #include "internal.h"
63 #include "iostat.h"
64 #include "callback.h"
65 #include "pnfs.h"
66 #include "netns.h"
67
/* Debug facility selected for the dprintk() calls in this file */
#define NFSDBG_FACILITY         NFSDBG_PROC

/*
 * Bounds for the retry back-off, expressed as multiples of HZ.
 * nfs4_delay() clamps its timeout to this range, and
 * nfs41_sequence_done() uses the maximum as its rpc_delay() interval.
 */
#define NFS4_POLL_RETRY_MIN     (HZ/10)
#define NFS4_POLL_RETRY_MAX     (15*HZ)

#define NFS4_MAX_LOOP_ON_RECOVER (10)

static unsigned short max_session_slots = NFS4_DEF_SLOT_TABLE_SIZE;
76
/*
 * Forward declarations for types and static helpers that are referenced
 * before their definitions appear in this file.
 */
struct nfs4_opendata;
static int _nfs4_proc_open(struct nfs4_opendata *data);
static int _nfs4_recover_proc_open(struct nfs4_opendata *data);
static int nfs4_do_fsinfo(struct nfs_server *, struct nfs_fh *, struct nfs_fsinfo *);
static int nfs4_async_handle_error(struct rpc_task *, const struct nfs_server *, struct nfs4_state *);
static void nfs_fixup_referral_attributes(struct nfs_fattr *fattr);
static int nfs4_proc_getattr(struct nfs_server *, struct nfs_fh *, struct nfs_fattr *);
static int _nfs4_proc_getattr(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fattr *fattr);
static int nfs4_do_setattr(struct inode *inode, struct rpc_cred *cred,
                            struct nfs_fattr *fattr, struct iattr *sattr,
                            struct nfs4_state *state);
/* The stateid helpers below are only declared when NFSv4.1 is configured */
#ifdef CONFIG_NFS_V4_1
static int nfs41_test_stateid(struct nfs_server *, nfs4_stateid *);
static int nfs41_free_stateid(struct nfs_server *, nfs4_stateid *);
#endif
92 /* Prevent leaks of NFSv4 errors into userland */
93 static int nfs4_map_errors(int err)
94 {
95         if (err >= -1000)
96                 return err;
97         switch (err) {
98         case -NFS4ERR_RESOURCE:
99                 return -EREMOTEIO;
100         case -NFS4ERR_WRONGSEC:
101                 return -EPERM;
102         case -NFS4ERR_BADOWNER:
103         case -NFS4ERR_BADNAME:
104                 return -EINVAL;
105         case -NFS4ERR_SHARE_DENIED:
106                 return -EACCES;
107         case -NFS4ERR_MINOR_VERS_MISMATCH:
108                 return -EPROTONOSUPPORT;
109         default:
110                 dprintk("%s could not handle NFSv4 error %d\n",
111                                 __func__, -err);
112                 break;
113         }
114         return -EIO;
115 }
116
117 /*
118  * This is our standard bitmap for GETATTR requests.
119  */
120 const u32 nfs4_fattr_bitmap[3] = {
121         FATTR4_WORD0_TYPE
122         | FATTR4_WORD0_CHANGE
123         | FATTR4_WORD0_SIZE
124         | FATTR4_WORD0_FSID
125         | FATTR4_WORD0_FILEID,
126         FATTR4_WORD1_MODE
127         | FATTR4_WORD1_NUMLINKS
128         | FATTR4_WORD1_OWNER
129         | FATTR4_WORD1_OWNER_GROUP
130         | FATTR4_WORD1_RAWDEV
131         | FATTR4_WORD1_SPACE_USED
132         | FATTR4_WORD1_TIME_ACCESS
133         | FATTR4_WORD1_TIME_METADATA
134         | FATTR4_WORD1_TIME_MODIFY
135 };
136
137 static const u32 nfs4_pnfs_open_bitmap[3] = {
138         FATTR4_WORD0_TYPE
139         | FATTR4_WORD0_CHANGE
140         | FATTR4_WORD0_SIZE
141         | FATTR4_WORD0_FSID
142         | FATTR4_WORD0_FILEID,
143         FATTR4_WORD1_MODE
144         | FATTR4_WORD1_NUMLINKS
145         | FATTR4_WORD1_OWNER
146         | FATTR4_WORD1_OWNER_GROUP
147         | FATTR4_WORD1_RAWDEV
148         | FATTR4_WORD1_SPACE_USED
149         | FATTR4_WORD1_TIME_ACCESS
150         | FATTR4_WORD1_TIME_METADATA
151         | FATTR4_WORD1_TIME_MODIFY,
152         FATTR4_WORD2_MDSTHRESHOLD
153 };
154
155 const u32 nfs4_statfs_bitmap[2] = {
156         FATTR4_WORD0_FILES_AVAIL
157         | FATTR4_WORD0_FILES_FREE
158         | FATTR4_WORD0_FILES_TOTAL,
159         FATTR4_WORD1_SPACE_AVAIL
160         | FATTR4_WORD1_SPACE_FREE
161         | FATTR4_WORD1_SPACE_TOTAL
162 };
163
164 const u32 nfs4_pathconf_bitmap[2] = {
165         FATTR4_WORD0_MAXLINK
166         | FATTR4_WORD0_MAXNAME,
167         0
168 };
169
170 const u32 nfs4_fsinfo_bitmap[3] = { FATTR4_WORD0_MAXFILESIZE
171                         | FATTR4_WORD0_MAXREAD
172                         | FATTR4_WORD0_MAXWRITE
173                         | FATTR4_WORD0_LEASE_TIME,
174                         FATTR4_WORD1_TIME_DELTA
175                         | FATTR4_WORD1_FS_LAYOUT_TYPES,
176                         FATTR4_WORD2_LAYOUT_BLKSIZE
177 };
178
179 const u32 nfs4_fs_locations_bitmap[2] = {
180         FATTR4_WORD0_TYPE
181         | FATTR4_WORD0_CHANGE
182         | FATTR4_WORD0_SIZE
183         | FATTR4_WORD0_FSID
184         | FATTR4_WORD0_FILEID
185         | FATTR4_WORD0_FS_LOCATIONS,
186         FATTR4_WORD1_MODE
187         | FATTR4_WORD1_NUMLINKS
188         | FATTR4_WORD1_OWNER
189         | FATTR4_WORD1_OWNER_GROUP
190         | FATTR4_WORD1_RAWDEV
191         | FATTR4_WORD1_SPACE_USED
192         | FATTR4_WORD1_TIME_ACCESS
193         | FATTR4_WORD1_TIME_METADATA
194         | FATTR4_WORD1_TIME_MODIFY
195         | FATTR4_WORD1_MOUNTED_ON_FILEID
196 };
197
198 static void nfs4_setup_readdir(u64 cookie, __be32 *verifier, struct dentry *dentry,
199                 struct nfs4_readdir_arg *readdir)
200 {
201         __be32 *start, *p;
202
203         BUG_ON(readdir->count < 80);
204         if (cookie > 2) {
205                 readdir->cookie = cookie;
206                 memcpy(&readdir->verifier, verifier, sizeof(readdir->verifier));
207                 return;
208         }
209
210         readdir->cookie = 0;
211         memset(&readdir->verifier, 0, sizeof(readdir->verifier));
212         if (cookie == 2)
213                 return;
214         
215         /*
216          * NFSv4 servers do not return entries for '.' and '..'
217          * Therefore, we fake these entries here.  We let '.'
218          * have cookie 0 and '..' have cookie 1.  Note that
219          * when talking to the server, we always send cookie 0
220          * instead of 1 or 2.
221          */
222         start = p = kmap_atomic(*readdir->pages);
223         
224         if (cookie == 0) {
225                 *p++ = xdr_one;                                  /* next */
226                 *p++ = xdr_zero;                   /* cookie, first word */
227                 *p++ = xdr_one;                   /* cookie, second word */
228                 *p++ = xdr_one;                             /* entry len */
229                 memcpy(p, ".\0\0\0", 4);                        /* entry */
230                 p++;
231                 *p++ = xdr_one;                         /* bitmap length */
232                 *p++ = htonl(FATTR4_WORD0_FILEID);             /* bitmap */
233                 *p++ = htonl(8);              /* attribute buffer length */
234                 p = xdr_encode_hyper(p, NFS_FILEID(dentry->d_inode));
235         }
236         
237         *p++ = xdr_one;                                  /* next */
238         *p++ = xdr_zero;                   /* cookie, first word */
239         *p++ = xdr_two;                   /* cookie, second word */
240         *p++ = xdr_two;                             /* entry len */
241         memcpy(p, "..\0\0", 4);                         /* entry */
242         p++;
243         *p++ = xdr_one;                         /* bitmap length */
244         *p++ = htonl(FATTR4_WORD0_FILEID);             /* bitmap */
245         *p++ = htonl(8);              /* attribute buffer length */
246         p = xdr_encode_hyper(p, NFS_FILEID(dentry->d_parent->d_inode));
247
248         readdir->pgbase = (char *)p - (char *)start;
249         readdir->count -= readdir->pgbase;
250         kunmap_atomic(start);
251 }
252
253 static int nfs4_wait_clnt_recover(struct nfs_client *clp)
254 {
255         int res;
256
257         might_sleep();
258
259         res = wait_on_bit(&clp->cl_state, NFS4CLNT_MANAGER_RUNNING,
260                         nfs_wait_bit_killable, TASK_KILLABLE);
261         if (res)
262                 return res;
263
264         if (clp->cl_cons_state < 0)
265                 return clp->cl_cons_state;
266         return 0;
267 }
268
269 static int nfs4_delay(struct rpc_clnt *clnt, long *timeout)
270 {
271         int res = 0;
272
273         might_sleep();
274
275         if (*timeout <= 0)
276                 *timeout = NFS4_POLL_RETRY_MIN;
277         if (*timeout > NFS4_POLL_RETRY_MAX)
278                 *timeout = NFS4_POLL_RETRY_MAX;
279         freezable_schedule_timeout_killable(*timeout);
280         if (fatal_signal_pending(current))
281                 res = -ERESTARTSYS;
282         *timeout <<= 1;
283         return res;
284 }
285
286 /* This is the error handling routine for processes that are allowed
287  * to sleep.
288  */
289 static int nfs4_handle_exception(struct nfs_server *server, int errorcode, struct nfs4_exception *exception)
290 {
291         struct nfs_client *clp = server->nfs_client;
292         struct nfs4_state *state = exception->state;
293         struct inode *inode = exception->inode;
294         int ret = errorcode;
295
296         exception->retry = 0;
297         switch(errorcode) {
298                 case 0:
299                         return 0;
300                 case -NFS4ERR_OPENMODE:
301                         if (inode && nfs4_have_delegation(inode, FMODE_READ)) {
302                                 nfs4_inode_return_delegation(inode);
303                                 exception->retry = 1;
304                                 return 0;
305                         }
306                         if (state == NULL)
307                                 break;
308                         nfs4_schedule_stateid_recovery(server, state);
309                         goto wait_on_recovery;
310                 case -NFS4ERR_DELEG_REVOKED:
311                 case -NFS4ERR_ADMIN_REVOKED:
312                 case -NFS4ERR_BAD_STATEID:
313                         if (state == NULL)
314                                 break;
315                         nfs_remove_bad_delegation(state->inode);
316                         nfs4_schedule_stateid_recovery(server, state);
317                         goto wait_on_recovery;
318                 case -NFS4ERR_EXPIRED:
319                         if (state != NULL)
320                                 nfs4_schedule_stateid_recovery(server, state);
321                 case -NFS4ERR_STALE_STATEID:
322                 case -NFS4ERR_STALE_CLIENTID:
323                         nfs4_schedule_lease_recovery(clp);
324                         goto wait_on_recovery;
325 #if defined(CONFIG_NFS_V4_1)
326                 case -NFS4ERR_BADSESSION:
327                 case -NFS4ERR_BADSLOT:
328                 case -NFS4ERR_BAD_HIGH_SLOT:
329                 case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION:
330                 case -NFS4ERR_DEADSESSION:
331                 case -NFS4ERR_SEQ_FALSE_RETRY:
332                 case -NFS4ERR_SEQ_MISORDERED:
333                         dprintk("%s ERROR: %d Reset session\n", __func__,
334                                 errorcode);
335                         nfs4_schedule_session_recovery(clp->cl_session, errorcode);
336                         exception->retry = 1;
337                         break;
338 #endif /* defined(CONFIG_NFS_V4_1) */
339                 case -NFS4ERR_FILE_OPEN:
340                         if (exception->timeout > HZ) {
341                                 /* We have retried a decent amount, time to
342                                  * fail
343                                  */
344                                 ret = -EBUSY;
345                                 break;
346                         }
347                 case -NFS4ERR_GRACE:
348                 case -NFS4ERR_DELAY:
349                 case -EKEYEXPIRED:
350                         ret = nfs4_delay(server->client, &exception->timeout);
351                         if (ret != 0)
352                                 break;
353                 case -NFS4ERR_RETRY_UNCACHED_REP:
354                 case -NFS4ERR_OLD_STATEID:
355                         exception->retry = 1;
356                         break;
357                 case -NFS4ERR_BADOWNER:
358                         /* The following works around a Linux server bug! */
359                 case -NFS4ERR_BADNAME:
360                         if (server->caps & NFS_CAP_UIDGID_NOMAP) {
361                                 server->caps &= ~NFS_CAP_UIDGID_NOMAP;
362                                 exception->retry = 1;
363                                 printk(KERN_WARNING "NFS: v4 server %s "
364                                                 "does not accept raw "
365                                                 "uid/gids. "
366                                                 "Reenabling the idmapper.\n",
367                                                 server->nfs_client->cl_hostname);
368                         }
369         }
370         /* We failed to handle the error */
371         return nfs4_map_errors(ret);
372 wait_on_recovery:
373         ret = nfs4_wait_clnt_recover(clp);
374         if (ret == 0)
375                 exception->retry = 1;
376         return ret;
377 }
378
379
380 static void do_renew_lease(struct nfs_client *clp, unsigned long timestamp)
381 {
382         spin_lock(&clp->cl_lock);
383         if (time_before(clp->cl_last_renewal,timestamp))
384                 clp->cl_last_renewal = timestamp;
385         spin_unlock(&clp->cl_lock);
386 }
387
388 static void renew_lease(const struct nfs_server *server, unsigned long timestamp)
389 {
390         do_renew_lease(server->nfs_client, timestamp);
391 }
392
393 #if defined(CONFIG_NFS_V4_1)
394
395 /*
396  * nfs4_free_slot - free a slot and efficiently update slot table.
397  *
398  * freeing a slot is trivially done by clearing its respective bit
399  * in the bitmap.
400  * If the freed slotid equals highest_used_slotid we want to update it
401  * so that the server would be able to size down the slot table if needed,
402  * otherwise we know that the highest_used_slotid is still in use.
403  * When updating highest_used_slotid there may be "holes" in the bitmap
404  * so we need to scan down from highest_used_slotid to 0 looking for the now
405  * highest slotid in use.
406  * If none found, highest_used_slotid is set to NFS4_NO_SLOT.
407  *
408  * Must be called while holding tbl->slot_tbl_lock
409  */
410 static void
411 nfs4_free_slot(struct nfs4_slot_table *tbl, u32 slotid)
412 {
413         BUG_ON(slotid >= NFS4_MAX_SLOT_TABLE);
414         /* clear used bit in bitmap */
415         __clear_bit(slotid, tbl->used_slots);
416
417         /* update highest_used_slotid when it is freed */
418         if (slotid == tbl->highest_used_slotid) {
419                 slotid = find_last_bit(tbl->used_slots, tbl->max_slots);
420                 if (slotid < tbl->max_slots)
421                         tbl->highest_used_slotid = slotid;
422                 else
423                         tbl->highest_used_slotid = NFS4_NO_SLOT;
424         }
425         dprintk("%s: slotid %u highest_used_slotid %d\n", __func__,
426                 slotid, tbl->highest_used_slotid);
427 }
428
429 bool nfs4_set_task_privileged(struct rpc_task *task, void *dummy)
430 {
431         rpc_task_set_priority(task, RPC_PRIORITY_PRIVILEGED);
432         return true;
433 }
434
435 /*
436  * Signal state manager thread if session fore channel is drained
437  */
438 static void nfs4_check_drain_fc_complete(struct nfs4_session *ses)
439 {
440         if (!test_bit(NFS4_SESSION_DRAINING, &ses->session_state)) {
441                 rpc_wake_up_first(&ses->fc_slot_table.slot_tbl_waitq,
442                                 nfs4_set_task_privileged, NULL);
443                 return;
444         }
445
446         if (ses->fc_slot_table.highest_used_slotid != NFS4_NO_SLOT)
447                 return;
448
449         dprintk("%s COMPLETE: Session Fore Channel Drained\n", __func__);
450         complete(&ses->fc_slot_table.complete);
451 }
452
453 /*
454  * Signal state manager thread if session back channel is drained
455  */
456 void nfs4_check_drain_bc_complete(struct nfs4_session *ses)
457 {
458         if (!test_bit(NFS4_SESSION_DRAINING, &ses->session_state) ||
459             ses->bc_slot_table.highest_used_slotid != NFS4_NO_SLOT)
460                 return;
461         dprintk("%s COMPLETE: Session Back Channel Drained\n", __func__);
462         complete(&ses->bc_slot_table.complete);
463 }
464
465 static void nfs41_sequence_free_slot(struct nfs4_sequence_res *res)
466 {
467         struct nfs4_slot_table *tbl;
468
469         tbl = &res->sr_session->fc_slot_table;
470         if (!res->sr_slot) {
471                 /* just wake up the next guy waiting since
472                  * we may have not consumed a slot after all */
473                 dprintk("%s: No slot\n", __func__);
474                 return;
475         }
476
477         spin_lock(&tbl->slot_tbl_lock);
478         nfs4_free_slot(tbl, res->sr_slot - tbl->slots);
479         nfs4_check_drain_fc_complete(res->sr_session);
480         spin_unlock(&tbl->slot_tbl_lock);
481         res->sr_slot = NULL;
482 }
483
484 static int nfs41_sequence_done(struct rpc_task *task, struct nfs4_sequence_res *res)
485 {
486         unsigned long timestamp;
487         struct nfs_client *clp;
488
489         /*
490          * sr_status remains 1 if an RPC level error occurred. The server
491          * may or may not have processed the sequence operation..
492          * Proceed as if the server received and processed the sequence
493          * operation.
494          */
495         if (res->sr_status == 1)
496                 res->sr_status = NFS_OK;
497
498         /* don't increment the sequence number if the task wasn't sent */
499         if (!RPC_WAS_SENT(task))
500                 goto out;
501
502         /* Check the SEQUENCE operation status */
503         switch (res->sr_status) {
504         case 0:
505                 /* Update the slot's sequence and clientid lease timer */
506                 ++res->sr_slot->seq_nr;
507                 timestamp = res->sr_renewal_time;
508                 clp = res->sr_session->clp;
509                 do_renew_lease(clp, timestamp);
510                 /* Check sequence flags */
511                 if (res->sr_status_flags != 0)
512                         nfs4_schedule_lease_recovery(clp);
513                 break;
514         case -NFS4ERR_DELAY:
515                 /* The server detected a resend of the RPC call and
516                  * returned NFS4ERR_DELAY as per Section 2.10.6.2
517                  * of RFC5661.
518                  */
519                 dprintk("%s: slot=%td seq=%d: Operation in progress\n",
520                         __func__,
521                         res->sr_slot - res->sr_session->fc_slot_table.slots,
522                         res->sr_slot->seq_nr);
523                 goto out_retry;
524         default:
525                 /* Just update the slot sequence no. */
526                 ++res->sr_slot->seq_nr;
527         }
528 out:
529         /* The session may be reset by one of the error handlers. */
530         dprintk("%s: Error %d free the slot \n", __func__, res->sr_status);
531         nfs41_sequence_free_slot(res);
532         return 1;
533 out_retry:
534         if (!rpc_restart_call(task))
535                 goto out;
536         rpc_delay(task, NFS4_POLL_RETRY_MAX);
537         return 0;
538 }
539
540 static int nfs4_sequence_done(struct rpc_task *task,
541                                struct nfs4_sequence_res *res)
542 {
543         if (res->sr_session == NULL)
544                 return 1;
545         return nfs41_sequence_done(task, res);
546 }
547
548 /*
549  * nfs4_find_slot - efficiently look for a free slot
550  *
551  * nfs4_find_slot looks for an unset bit in the used_slots bitmap.
552  * If found, we mark the slot as used, update the highest_used_slotid,
553  * and respectively set up the sequence operation args.
554  * The slot number is returned if found, or NFS4_NO_SLOT otherwise.
555  *
556  * Note: must be called with under the slot_tbl_lock.
557  */
558 static u32
559 nfs4_find_slot(struct nfs4_slot_table *tbl)
560 {
561         u32 slotid;
562         u32 ret_id = NFS4_NO_SLOT;
563
564         dprintk("--> %s used_slots=%04lx highest_used=%u max_slots=%u\n",
565                 __func__, tbl->used_slots[0], tbl->highest_used_slotid,
566                 tbl->max_slots);
567         slotid = find_first_zero_bit(tbl->used_slots, tbl->max_slots);
568         if (slotid >= tbl->max_slots)
569                 goto out;
570         __set_bit(slotid, tbl->used_slots);
571         if (slotid > tbl->highest_used_slotid ||
572                         tbl->highest_used_slotid == NFS4_NO_SLOT)
573                 tbl->highest_used_slotid = slotid;
574         ret_id = slotid;
575 out:
576         dprintk("<-- %s used_slots=%04lx highest_used=%d slotid=%d \n",
577                 __func__, tbl->used_slots[0], tbl->highest_used_slotid, ret_id);
578         return ret_id;
579 }
580
581 static void nfs41_init_sequence(struct nfs4_sequence_args *args,
582                 struct nfs4_sequence_res *res, int cache_reply)
583 {
584         args->sa_session = NULL;
585         args->sa_cache_this = 0;
586         if (cache_reply)
587                 args->sa_cache_this = 1;
588         res->sr_session = NULL;
589         res->sr_slot = NULL;
590 }
591
592 int nfs41_setup_sequence(struct nfs4_session *session,
593                                 struct nfs4_sequence_args *args,
594                                 struct nfs4_sequence_res *res,
595                                 struct rpc_task *task)
596 {
597         struct nfs4_slot *slot;
598         struct nfs4_slot_table *tbl;
599         u32 slotid;
600
601         dprintk("--> %s\n", __func__);
602         /* slot already allocated? */
603         if (res->sr_slot != NULL)
604                 return 0;
605
606         tbl = &session->fc_slot_table;
607
608         spin_lock(&tbl->slot_tbl_lock);
609         if (test_bit(NFS4_SESSION_DRAINING, &session->session_state) &&
610             !rpc_task_has_priority(task, RPC_PRIORITY_PRIVILEGED)) {
611                 /* The state manager will wait until the slot table is empty */
612                 rpc_sleep_on(&tbl->slot_tbl_waitq, task, NULL);
613                 spin_unlock(&tbl->slot_tbl_lock);
614                 dprintk("%s session is draining\n", __func__);
615                 return -EAGAIN;
616         }
617
618         if (!rpc_queue_empty(&tbl->slot_tbl_waitq) &&
619             !rpc_task_has_priority(task, RPC_PRIORITY_PRIVILEGED)) {
620                 rpc_sleep_on(&tbl->slot_tbl_waitq, task, NULL);
621                 spin_unlock(&tbl->slot_tbl_lock);
622                 dprintk("%s enforce FIFO order\n", __func__);
623                 return -EAGAIN;
624         }
625
626         slotid = nfs4_find_slot(tbl);
627         if (slotid == NFS4_NO_SLOT) {
628                 rpc_sleep_on(&tbl->slot_tbl_waitq, task, NULL);
629                 spin_unlock(&tbl->slot_tbl_lock);
630                 dprintk("<-- %s: no free slots\n", __func__);
631                 return -EAGAIN;
632         }
633         spin_unlock(&tbl->slot_tbl_lock);
634
635         rpc_task_set_priority(task, RPC_PRIORITY_NORMAL);
636         slot = tbl->slots + slotid;
637         args->sa_session = session;
638         args->sa_slotid = slotid;
639
640         dprintk("<-- %s slotid=%d seqid=%d\n", __func__, slotid, slot->seq_nr);
641
642         res->sr_session = session;
643         res->sr_slot = slot;
644         res->sr_renewal_time = jiffies;
645         res->sr_status_flags = 0;
646         /*
647          * sr_status is only set in decode_sequence, and so will remain
648          * set to 1 if an rpc level failure occurs.
649          */
650         res->sr_status = 1;
651         return 0;
652 }
653 EXPORT_SYMBOL_GPL(nfs41_setup_sequence);
654
655 int nfs4_setup_sequence(const struct nfs_server *server,
656                         struct nfs4_sequence_args *args,
657                         struct nfs4_sequence_res *res,
658                         struct rpc_task *task)
659 {
660         struct nfs4_session *session = nfs4_get_session(server);
661         int ret = 0;
662
663         if (session == NULL)
664                 goto out;
665
666         dprintk("--> %s clp %p session %p sr_slot %td\n",
667                 __func__, session->clp, session, res->sr_slot ?
668                         res->sr_slot - session->fc_slot_table.slots : -1);
669
670         ret = nfs41_setup_sequence(session, args, res, task);
671 out:
672         dprintk("<-- %s status=%d\n", __func__, ret);
673         return ret;
674 }
675
/*
 * Callback data for the nfs41_call_sync_* RPC callbacks: the server
 * and the sequence argument/result pair that are handed to
 * nfs4_setup_sequence() and nfs41_sequence_done().
 */
struct nfs41_call_sync_data {
        const struct nfs_server *seq_server;
        struct nfs4_sequence_args *seq_args;
        struct nfs4_sequence_res *seq_res;
};
681
682 static void nfs41_call_sync_prepare(struct rpc_task *task, void *calldata)
683 {
684         struct nfs41_call_sync_data *data = calldata;
685
686         dprintk("--> %s data->seq_server %p\n", __func__, data->seq_server);
687
688         if (nfs4_setup_sequence(data->seq_server, data->seq_args,
689                                 data->seq_res, task))
690                 return;
691         rpc_call_start(task);
692 }
693
694 static void nfs41_call_priv_sync_prepare(struct rpc_task *task, void *calldata)
695 {
696         rpc_task_set_priority(task, RPC_PRIORITY_PRIVILEGED);
697         nfs41_call_sync_prepare(task, calldata);
698 }
699
700 static void nfs41_call_sync_done(struct rpc_task *task, void *calldata)
701 {
702         struct nfs41_call_sync_data *data = calldata;
703
704         nfs41_sequence_done(task, data->seq_res);
705 }
706
/* RPC callbacks used by nfs4_call_sync_sequence() for ordinary calls */
static const struct rpc_call_ops nfs41_call_sync_ops = {
        .rpc_call_prepare = nfs41_call_sync_prepare,
        .rpc_call_done = nfs41_call_sync_done,
};
711
/*
 * RPC callbacks used by nfs4_call_sync_sequence() when the caller asks
 * for a privileged call; only the prepare step differs.
 */
static const struct rpc_call_ops nfs41_call_priv_sync_ops = {
        .rpc_call_prepare = nfs41_call_priv_sync_prepare,
        .rpc_call_done = nfs41_call_sync_done,
};
716
717 static int nfs4_call_sync_sequence(struct rpc_clnt *clnt,
718                                    struct nfs_server *server,
719                                    struct rpc_message *msg,
720                                    struct nfs4_sequence_args *args,
721                                    struct nfs4_sequence_res *res,
722                                    int privileged)
723 {
724         int ret;
725         struct rpc_task *task;
726         struct nfs41_call_sync_data data = {
727                 .seq_server = server,
728                 .seq_args = args,
729                 .seq_res = res,
730         };
731         struct rpc_task_setup task_setup = {
732                 .rpc_client = clnt,
733                 .rpc_message = msg,
734                 .callback_ops = &nfs41_call_sync_ops,
735                 .callback_data = &data
736         };
737
738         if (privileged)
739                 task_setup.callback_ops = &nfs41_call_priv_sync_ops;
740         task = rpc_run_task(&task_setup);
741         if (IS_ERR(task))
742                 ret = PTR_ERR(task);
743         else {
744                 ret = task->tk_status;
745                 rpc_put_task(task);
746         }
747         return ret;
748 }
749
/*
 * Session-aware synchronous call: reset the sequence state and issue
 * @msg through nfs4_call_sync_sequence() as a non-privileged call.
 */
int _nfs4_call_sync_session(struct rpc_clnt *clnt,
			    struct nfs_server *server,
			    struct rpc_message *msg,
			    struct nfs4_sequence_args *args,
			    struct nfs4_sequence_res *res,
			    int cache_reply)
{
	const int privileged = 0;

	nfs41_init_sequence(args, res, cache_reply);
	return nfs4_call_sync_sequence(clnt, server, msg, args, res,
				       privileged);
}
760
761 #else
/* Stub used when CONFIG_NFS_V4_1 is not defined: nothing to initialise */
static inline
void nfs41_init_sequence(struct nfs4_sequence_args *args,
                struct nfs4_sequence_res *res, int cache_reply)
{
}
767
/* Stub used when CONFIG_NFS_V4_1 is not defined: always returns 1 */
static int nfs4_sequence_done(struct rpc_task *task,
                               struct nfs4_sequence_res *res)
{
        return 1;
}
773 #endif /* CONFIG_NFS_V4_1 */
774
/*
 * Plain synchronous call: reset the sequence state and issue @msg
 * with rpc_call_sync().  @server is not used on this path.
 */
int _nfs4_call_sync(struct rpc_clnt *clnt,
		    struct nfs_server *server,
		    struct rpc_message *msg,
		    struct nfs4_sequence_args *args,
		    struct nfs4_sequence_res *res,
		    int cache_reply)
{
	int status;

	nfs41_init_sequence(args, res, cache_reply);
	status = rpc_call_sync(clnt, msg, 0);
	return status;
}
785
786 static inline
787 int nfs4_call_sync(struct rpc_clnt *clnt,
788                    struct nfs_server *server,
789                    struct rpc_message *msg,
790                    struct nfs4_sequence_args *args,
791                    struct nfs4_sequence_res *res,
792                    int cache_reply)
793 {
794         return server->nfs_client->cl_mvops->call_sync(clnt, server, msg,
795                                                 args, res, cache_reply);
796 }
797
798 static void update_changeattr(struct inode *dir, struct nfs4_change_info *cinfo)
799 {
800         struct nfs_inode *nfsi = NFS_I(dir);
801
802         spin_lock(&dir->i_lock);
803         nfsi->cache_validity |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_DATA;
804         if (!cinfo->atomic || cinfo->before != dir->i_version)
805                 nfs_force_lookup_revalidate(dir);
806         dir->i_version = cinfo->after;
807         spin_unlock(&dir->i_lock);
808 }
809
810 struct nfs4_opendata {
811         struct kref kref;
812         struct nfs_openargs o_arg;
813         struct nfs_openres o_res;
814         struct nfs_open_confirmargs c_arg;
815         struct nfs_open_confirmres c_res;
816         struct nfs4_string owner_name;
817         struct nfs4_string group_name;
818         struct nfs_fattr f_attr;
819         struct dentry *dir;
820         struct dentry *dentry;
821         struct nfs4_state_owner *owner;
822         struct nfs4_state *state;
823         struct iattr attrs;
824         unsigned long timestamp;
825         unsigned int rpc_done : 1;
826         int rpc_status;
827         int cancelled;
828 };
829
830
831 static void nfs4_init_opendata_res(struct nfs4_opendata *p)
832 {
833         p->o_res.f_attr = &p->f_attr;
834         p->o_res.seqid = p->o_arg.seqid;
835         p->c_res.seqid = p->c_arg.seqid;
836         p->o_res.server = p->o_arg.server;
837         nfs_fattr_init(&p->f_attr);
838         nfs_fattr_init_names(&p->f_attr, &p->owner_name, &p->group_name);
839 }
840
841 static struct nfs4_opendata *nfs4_opendata_alloc(struct dentry *dentry,
842                 struct nfs4_state_owner *sp, fmode_t fmode, int flags,
843                 const struct iattr *attrs,
844                 gfp_t gfp_mask)
845 {
846         struct dentry *parent = dget_parent(dentry);
847         struct inode *dir = parent->d_inode;
848         struct nfs_server *server = NFS_SERVER(dir);
849         struct nfs4_opendata *p;
850
851         p = kzalloc(sizeof(*p), gfp_mask);
852         if (p == NULL)
853                 goto err;
854         p->o_arg.seqid = nfs_alloc_seqid(&sp->so_seqid, gfp_mask);
855         if (p->o_arg.seqid == NULL)
856                 goto err_free;
857         nfs_sb_active(dentry->d_sb);
858         p->dentry = dget(dentry);
859         p->dir = parent;
860         p->owner = sp;
861         atomic_inc(&sp->so_count);
862         p->o_arg.fh = NFS_FH(dir);
863         p->o_arg.open_flags = flags;
864         p->o_arg.fmode = fmode & (FMODE_READ|FMODE_WRITE);
865         p->o_arg.clientid = server->nfs_client->cl_clientid;
866         p->o_arg.id.create_time = ktime_to_ns(sp->so_seqid.create_time);
867         p->o_arg.id.uniquifier = sp->so_seqid.owner_id;
868         p->o_arg.name = &dentry->d_name;
869         p->o_arg.server = server;
870         p->o_arg.bitmask = server->attr_bitmask;
871         p->o_arg.open_bitmap = &nfs4_fattr_bitmap[0];
872         p->o_arg.claim = NFS4_OPEN_CLAIM_NULL;
873         if (attrs != NULL && attrs->ia_valid != 0) {
874                 __be32 verf[2];
875
876                 p->o_arg.u.attrs = &p->attrs;
877                 memcpy(&p->attrs, attrs, sizeof(p->attrs));
878
879                 verf[0] = jiffies;
880                 verf[1] = current->pid;
881                 memcpy(p->o_arg.u.verifier.data, verf,
882                                 sizeof(p->o_arg.u.verifier.data));
883         }
884         p->c_arg.fh = &p->o_res.fh;
885         p->c_arg.stateid = &p->o_res.stateid;
886         p->c_arg.seqid = p->o_arg.seqid;
887         nfs4_init_opendata_res(p);
888         kref_init(&p->kref);
889         return p;
890 err_free:
891         kfree(p);
892 err:
893         dput(parent);
894         return NULL;
895 }
896
897 static void nfs4_opendata_free(struct kref *kref)
898 {
899         struct nfs4_opendata *p = container_of(kref,
900                         struct nfs4_opendata, kref);
901         struct super_block *sb = p->dentry->d_sb;
902
903         nfs_free_seqid(p->o_arg.seqid);
904         if (p->state != NULL)
905                 nfs4_put_open_state(p->state);
906         nfs4_put_state_owner(p->owner);
907         dput(p->dir);
908         dput(p->dentry);
909         nfs_sb_deactive(sb);
910         nfs_fattr_free_names(&p->f_attr);
911         kfree(p);
912 }
913
914 static void nfs4_opendata_put(struct nfs4_opendata *p)
915 {
916         if (p != NULL)
917                 kref_put(&p->kref, nfs4_opendata_free);
918 }
919
/* Thin wrapper: returns the result of rpc_wait_for_completion_task(). */
static int nfs4_wait_for_completion_rpc_task(struct rpc_task *task)
{
	return rpc_wait_for_completion_task(task);
}
927
928 static int can_open_cached(struct nfs4_state *state, fmode_t mode, int open_mode)
929 {
930         int ret = 0;
931
932         if (open_mode & (O_EXCL|O_TRUNC))
933                 goto out;
934         switch (mode & (FMODE_READ|FMODE_WRITE)) {
935                 case FMODE_READ:
936                         ret |= test_bit(NFS_O_RDONLY_STATE, &state->flags) != 0
937                                 && state->n_rdonly != 0;
938                         break;
939                 case FMODE_WRITE:
940                         ret |= test_bit(NFS_O_WRONLY_STATE, &state->flags) != 0
941                                 && state->n_wronly != 0;
942                         break;
943                 case FMODE_READ|FMODE_WRITE:
944                         ret |= test_bit(NFS_O_RDWR_STATE, &state->flags) != 0
945                                 && state->n_rdwr != 0;
946         }
947 out:
948         return ret;
949 }
950
951 static int can_open_delegated(struct nfs_delegation *delegation, fmode_t fmode)
952 {
953         if (delegation == NULL)
954                 return 0;
955         if ((delegation->type & fmode) != fmode)
956                 return 0;
957         if (test_bit(NFS_DELEGATION_NEED_RECLAIM, &delegation->flags))
958                 return 0;
959         nfs_mark_delegation_referenced(delegation);
960         return 1;
961 }
962
963 static void update_open_stateflags(struct nfs4_state *state, fmode_t fmode)
964 {
965         switch (fmode) {
966                 case FMODE_WRITE:
967                         state->n_wronly++;
968                         break;
969                 case FMODE_READ:
970                         state->n_rdonly++;
971                         break;
972                 case FMODE_READ|FMODE_WRITE:
973                         state->n_rdwr++;
974         }
975         nfs4_state_set_mode_locked(state, state->state | fmode);
976 }
977
978 static void nfs_set_open_stateid_locked(struct nfs4_state *state, nfs4_stateid *stateid, fmode_t fmode)
979 {
980         if (test_bit(NFS_DELEGATED_STATE, &state->flags) == 0)
981                 nfs4_stateid_copy(&state->stateid, stateid);
982         nfs4_stateid_copy(&state->open_stateid, stateid);
983         switch (fmode) {
984                 case FMODE_READ:
985                         set_bit(NFS_O_RDONLY_STATE, &state->flags);
986                         break;
987                 case FMODE_WRITE:
988                         set_bit(NFS_O_WRONLY_STATE, &state->flags);
989                         break;
990                 case FMODE_READ|FMODE_WRITE:
991                         set_bit(NFS_O_RDWR_STATE, &state->flags);
992         }
993 }
994
995 static void nfs_set_open_stateid(struct nfs4_state *state, nfs4_stateid *stateid, fmode_t fmode)
996 {
997         write_seqlock(&state->seqlock);
998         nfs_set_open_stateid_locked(state, stateid, fmode);
999         write_sequnlock(&state->seqlock);
1000 }
1001
1002 static void __update_open_stateid(struct nfs4_state *state, nfs4_stateid *open_stateid, const nfs4_stateid *deleg_stateid, fmode_t fmode)
1003 {
1004         /*
1005          * Protect the call to nfs4_state_set_mode_locked and
1006          * serialise the stateid update
1007          */
1008         write_seqlock(&state->seqlock);
1009         if (deleg_stateid != NULL) {
1010                 nfs4_stateid_copy(&state->stateid, deleg_stateid);
1011                 set_bit(NFS_DELEGATED_STATE, &state->flags);
1012         }
1013         if (open_stateid != NULL)
1014                 nfs_set_open_stateid_locked(state, open_stateid, fmode);
1015         write_sequnlock(&state->seqlock);
1016         spin_lock(&state->owner->so_lock);
1017         update_open_stateflags(state, fmode);
1018         spin_unlock(&state->owner->so_lock);
1019 }
1020
1021 static int update_open_stateid(struct nfs4_state *state, nfs4_stateid *open_stateid, nfs4_stateid *delegation, fmode_t fmode)
1022 {
1023         struct nfs_inode *nfsi = NFS_I(state->inode);
1024         struct nfs_delegation *deleg_cur;
1025         int ret = 0;
1026
1027         fmode &= (FMODE_READ|FMODE_WRITE);
1028
1029         rcu_read_lock();
1030         deleg_cur = rcu_dereference(nfsi->delegation);
1031         if (deleg_cur == NULL)
1032                 goto no_delegation;
1033
1034         spin_lock(&deleg_cur->lock);
1035         if (nfsi->delegation != deleg_cur ||
1036             (deleg_cur->type & fmode) != fmode)
1037                 goto no_delegation_unlock;
1038
1039         if (delegation == NULL)
1040                 delegation = &deleg_cur->stateid;
1041         else if (!nfs4_stateid_match(&deleg_cur->stateid, delegation))
1042                 goto no_delegation_unlock;
1043
1044         nfs_mark_delegation_referenced(deleg_cur);
1045         __update_open_stateid(state, open_stateid, &deleg_cur->stateid, fmode);
1046         ret = 1;
1047 no_delegation_unlock:
1048         spin_unlock(&deleg_cur->lock);
1049 no_delegation:
1050         rcu_read_unlock();
1051
1052         if (!ret && open_stateid != NULL) {
1053                 __update_open_stateid(state, open_stateid, NULL, fmode);
1054                 ret = 1;
1055         }
1056
1057         return ret;
1058 }
1059
1060
1061 static void nfs4_return_incompatible_delegation(struct inode *inode, fmode_t fmode)
1062 {
1063         struct nfs_delegation *delegation;
1064
1065         rcu_read_lock();
1066         delegation = rcu_dereference(NFS_I(inode)->delegation);
1067         if (delegation == NULL || (delegation->type & fmode) == fmode) {
1068                 rcu_read_unlock();
1069                 return;
1070         }
1071         rcu_read_unlock();
1072         nfs4_inode_return_delegation(inode);
1073 }
1074
1075 static struct nfs4_state *nfs4_try_open_cached(struct nfs4_opendata *opendata)
1076 {
1077         struct nfs4_state *state = opendata->state;
1078         struct nfs_inode *nfsi = NFS_I(state->inode);
1079         struct nfs_delegation *delegation;
1080         int open_mode = opendata->o_arg.open_flags & (O_EXCL|O_TRUNC);
1081         fmode_t fmode = opendata->o_arg.fmode;
1082         nfs4_stateid stateid;
1083         int ret = -EAGAIN;
1084
1085         for (;;) {
1086                 if (can_open_cached(state, fmode, open_mode)) {
1087                         spin_lock(&state->owner->so_lock);
1088                         if (can_open_cached(state, fmode, open_mode)) {
1089                                 update_open_stateflags(state, fmode);
1090                                 spin_unlock(&state->owner->so_lock);
1091                                 goto out_return_state;
1092                         }
1093                         spin_unlock(&state->owner->so_lock);
1094                 }
1095                 rcu_read_lock();
1096                 delegation = rcu_dereference(nfsi->delegation);
1097                 if (!can_open_delegated(delegation, fmode)) {
1098                         rcu_read_unlock();
1099                         break;
1100                 }
1101                 /* Save the delegation */
1102                 nfs4_stateid_copy(&stateid, &delegation->stateid);
1103                 rcu_read_unlock();
1104                 ret = nfs_may_open(state->inode, state->owner->so_cred, open_mode);
1105                 if (ret != 0)
1106                         goto out;
1107                 ret = -EAGAIN;
1108
1109                 /* Try to update the stateid using the delegation */
1110                 if (update_open_stateid(state, NULL, &stateid, fmode))
1111                         goto out_return_state;
1112         }
1113 out:
1114         return ERR_PTR(ret);
1115 out_return_state:
1116         atomic_inc(&state->count);
1117         return state;
1118 }
1119
1120 static struct nfs4_state *nfs4_opendata_to_nfs4_state(struct nfs4_opendata *data)
1121 {
1122         struct inode *inode;
1123         struct nfs4_state *state = NULL;
1124         struct nfs_delegation *delegation;
1125         int ret;
1126
1127         if (!data->rpc_done) {
1128                 state = nfs4_try_open_cached(data);
1129                 goto out;
1130         }
1131
1132         ret = -EAGAIN;
1133         if (!(data->f_attr.valid & NFS_ATTR_FATTR))
1134                 goto err;
1135         inode = nfs_fhget(data->dir->d_sb, &data->o_res.fh, &data->f_attr);
1136         ret = PTR_ERR(inode);
1137         if (IS_ERR(inode))
1138                 goto err;
1139         ret = -ENOMEM;
1140         state = nfs4_get_open_state(inode, data->owner);
1141         if (state == NULL)
1142                 goto err_put_inode;
1143         if (data->o_res.delegation_type != 0) {
1144                 struct nfs_client *clp = NFS_SERVER(inode)->nfs_client;
1145                 int delegation_flags = 0;
1146
1147                 rcu_read_lock();
1148                 delegation = rcu_dereference(NFS_I(inode)->delegation);
1149                 if (delegation)
1150                         delegation_flags = delegation->flags;
1151                 rcu_read_unlock();
1152                 if (data->o_arg.claim == NFS4_OPEN_CLAIM_DELEGATE_CUR) {
1153                         pr_err_ratelimited("NFS: Broken NFSv4 server %s is "
1154                                         "returning a delegation for "
1155                                         "OPEN(CLAIM_DELEGATE_CUR)\n",
1156                                         clp->cl_hostname);
1157                 } else if ((delegation_flags & 1UL<<NFS_DELEGATION_NEED_RECLAIM) == 0)
1158                         nfs_inode_set_delegation(state->inode,
1159                                         data->owner->so_cred,
1160                                         &data->o_res);
1161                 else
1162                         nfs_inode_reclaim_delegation(state->inode,
1163                                         data->owner->so_cred,
1164                                         &data->o_res);
1165         }
1166
1167         update_open_stateid(state, &data->o_res.stateid, NULL,
1168                         data->o_arg.fmode);
1169         iput(inode);
1170 out:
1171         return state;
1172 err_put_inode:
1173         iput(inode);
1174 err:
1175         return ERR_PTR(ret);
1176 }
1177
1178 static struct nfs_open_context *nfs4_state_find_open_context(struct nfs4_state *state)
1179 {
1180         struct nfs_inode *nfsi = NFS_I(state->inode);
1181         struct nfs_open_context *ctx;
1182
1183         spin_lock(&state->inode->i_lock);
1184         list_for_each_entry(ctx, &nfsi->open_files, list) {
1185                 if (ctx->state != state)
1186                         continue;
1187                 get_nfs_open_context(ctx);
1188                 spin_unlock(&state->inode->i_lock);
1189                 return ctx;
1190         }
1191         spin_unlock(&state->inode->i_lock);
1192         return ERR_PTR(-ENOENT);
1193 }
1194
1195 static struct nfs4_opendata *nfs4_open_recoverdata_alloc(struct nfs_open_context *ctx, struct nfs4_state *state)
1196 {
1197         struct nfs4_opendata *opendata;
1198
1199         opendata = nfs4_opendata_alloc(ctx->dentry, state->owner, 0, 0, NULL, GFP_NOFS);
1200         if (opendata == NULL)
1201                 return ERR_PTR(-ENOMEM);
1202         opendata->state = state;
1203         atomic_inc(&state->count);
1204         return opendata;
1205 }
1206
1207 static int nfs4_open_recover_helper(struct nfs4_opendata *opendata, fmode_t fmode, struct nfs4_state **res)
1208 {
1209         struct nfs4_state *newstate;
1210         int ret;
1211
1212         opendata->o_arg.open_flags = 0;
1213         opendata->o_arg.fmode = fmode;
1214         memset(&opendata->o_res, 0, sizeof(opendata->o_res));
1215         memset(&opendata->c_res, 0, sizeof(opendata->c_res));
1216         nfs4_init_opendata_res(opendata);
1217         ret = _nfs4_recover_proc_open(opendata);
1218         if (ret != 0)
1219                 return ret; 
1220         newstate = nfs4_opendata_to_nfs4_state(opendata);
1221         if (IS_ERR(newstate))
1222                 return PTR_ERR(newstate);
1223         nfs4_close_state(newstate, fmode);
1224         *res = newstate;
1225         return 0;
1226 }
1227
1228 static int nfs4_open_recover(struct nfs4_opendata *opendata, struct nfs4_state *state)
1229 {
1230         struct nfs4_state *newstate;
1231         int ret;
1232
1233         /* memory barrier prior to reading state->n_* */
1234         clear_bit(NFS_DELEGATED_STATE, &state->flags);
1235         smp_rmb();
1236         if (state->n_rdwr != 0) {
1237                 clear_bit(NFS_O_RDWR_STATE, &state->flags);
1238                 ret = nfs4_open_recover_helper(opendata, FMODE_READ|FMODE_WRITE, &newstate);
1239                 if (ret != 0)
1240                         return ret;
1241                 if (newstate != state)
1242                         return -ESTALE;
1243         }
1244         if (state->n_wronly != 0) {
1245                 clear_bit(NFS_O_WRONLY_STATE, &state->flags);
1246                 ret = nfs4_open_recover_helper(opendata, FMODE_WRITE, &newstate);
1247                 if (ret != 0)
1248                         return ret;
1249                 if (newstate != state)
1250                         return -ESTALE;
1251         }
1252         if (state->n_rdonly != 0) {
1253                 clear_bit(NFS_O_RDONLY_STATE, &state->flags);
1254                 ret = nfs4_open_recover_helper(opendata, FMODE_READ, &newstate);
1255                 if (ret != 0)
1256                         return ret;
1257                 if (newstate != state)
1258                         return -ESTALE;
1259         }
1260         /*
1261          * We may have performed cached opens for all three recoveries.
1262          * Check if we need to update the current stateid.
1263          */
1264         if (test_bit(NFS_DELEGATED_STATE, &state->flags) == 0 &&
1265             !nfs4_stateid_match(&state->stateid, &state->open_stateid)) {
1266                 write_seqlock(&state->seqlock);
1267                 if (test_bit(NFS_DELEGATED_STATE, &state->flags) == 0)
1268                         nfs4_stateid_copy(&state->stateid, &state->open_stateid);
1269                 write_sequnlock(&state->seqlock);
1270         }
1271         return 0;
1272 }
1273
1274 /*
1275  * OPEN_RECLAIM:
1276  *      reclaim state on the server after a reboot.
1277  */
1278 static int _nfs4_do_open_reclaim(struct nfs_open_context *ctx, struct nfs4_state *state)
1279 {
1280         struct nfs_delegation *delegation;
1281         struct nfs4_opendata *opendata;
1282         fmode_t delegation_type = 0;
1283         int status;
1284
1285         opendata = nfs4_open_recoverdata_alloc(ctx, state);
1286         if (IS_ERR(opendata))
1287                 return PTR_ERR(opendata);
1288         opendata->o_arg.claim = NFS4_OPEN_CLAIM_PREVIOUS;
1289         opendata->o_arg.fh = NFS_FH(state->inode);
1290         rcu_read_lock();
1291         delegation = rcu_dereference(NFS_I(state->inode)->delegation);
1292         if (delegation != NULL && test_bit(NFS_DELEGATION_NEED_RECLAIM, &delegation->flags) != 0)
1293                 delegation_type = delegation->type;
1294         rcu_read_unlock();
1295         opendata->o_arg.u.delegation_type = delegation_type;
1296         status = nfs4_open_recover(opendata, state);
1297         nfs4_opendata_put(opendata);
1298         return status;
1299 }
1300
1301 static int nfs4_do_open_reclaim(struct nfs_open_context *ctx, struct nfs4_state *state)
1302 {
1303         struct nfs_server *server = NFS_SERVER(state->inode);
1304         struct nfs4_exception exception = { };
1305         int err;
1306         do {
1307                 err = _nfs4_do_open_reclaim(ctx, state);
1308                 if (err != -NFS4ERR_DELAY)
1309                         break;
1310                 nfs4_handle_exception(server, err, &exception);
1311         } while (exception.retry);
1312         return err;
1313 }
1314
/*
 * Reclaim the open @state using an open context that refers to it.
 * Returns the lookup error if no such context exists, otherwise the result
 * of nfs4_do_open_reclaim().  @sp is not used by this function.
 */
static int nfs4_open_reclaim(struct nfs4_state_owner *sp, struct nfs4_state *state)
{
	struct nfs_open_context *ctx = nfs4_state_find_open_context(state);
	int status;

	if (IS_ERR(ctx))
		return PTR_ERR(ctx);

	status = nfs4_do_open_reclaim(ctx, state);
	put_nfs_open_context(ctx);
	return status;
}
1327
1328 static int _nfs4_open_delegation_recall(struct nfs_open_context *ctx, struct nfs4_state *state, const nfs4_stateid *stateid)
1329 {
1330         struct nfs4_opendata *opendata;
1331         int ret;
1332
1333         opendata = nfs4_open_recoverdata_alloc(ctx, state);
1334         if (IS_ERR(opendata))
1335                 return PTR_ERR(opendata);
1336         opendata->o_arg.claim = NFS4_OPEN_CLAIM_DELEGATE_CUR;
1337         nfs4_stateid_copy(&opendata->o_arg.u.delegation, stateid);
1338         ret = nfs4_open_recover(opendata, state);
1339         nfs4_opendata_put(opendata);
1340         return ret;
1341 }
1342
1343 int nfs4_open_delegation_recall(struct nfs_open_context *ctx, struct nfs4_state *state, const nfs4_stateid *stateid)
1344 {
1345         struct nfs4_exception exception = { };
1346         struct nfs_server *server = NFS_SERVER(state->inode);
1347         int err;
1348         do {
1349                 err = _nfs4_open_delegation_recall(ctx, state, stateid);
1350                 switch (err) {
1351                         case 0:
1352                         case -ENOENT:
1353                         case -ESTALE:
1354                                 goto out;
1355                         case -NFS4ERR_BADSESSION:
1356                         case -NFS4ERR_BADSLOT:
1357                         case -NFS4ERR_BAD_HIGH_SLOT:
1358                         case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION:
1359                         case -NFS4ERR_DEADSESSION:
1360                                 nfs4_schedule_session_recovery(server->nfs_client->cl_session, err);
1361                                 goto out;
1362                         case -NFS4ERR_STALE_CLIENTID:
1363                         case -NFS4ERR_STALE_STATEID:
1364                         case -NFS4ERR_EXPIRED:
1365                                 /* Don't recall a delegation if it was lost */
1366                                 nfs4_schedule_lease_recovery(server->nfs_client);
1367                                 goto out;
1368                         case -ERESTARTSYS:
1369                                 /*
1370                                  * The show must go on: exit, but mark the
1371                                  * stateid as needing recovery.
1372                                  */
1373                         case -NFS4ERR_DELEG_REVOKED:
1374                         case -NFS4ERR_ADMIN_REVOKED:
1375                         case -NFS4ERR_BAD_STATEID:
1376                                 nfs_inode_find_state_and_recover(state->inode,
1377                                                 stateid);
1378                                 nfs4_schedule_stateid_recovery(server, state);
1379                         case -EKEYEXPIRED:
1380                                 /*
1381                                  * User RPCSEC_GSS context has expired.
1382                                  * We cannot recover this stateid now, so
1383                                  * skip it and allow recovery thread to
1384                                  * proceed.
1385                                  */
1386                         case -ENOMEM:
1387                                 err = 0;
1388                                 goto out;
1389                 }
1390                 err = nfs4_handle_exception(server, err, &exception);
1391         } while (exception.retry);
1392 out:
1393         return err;
1394 }
1395
1396 static void nfs4_open_confirm_done(struct rpc_task *task, void *calldata)
1397 {
1398         struct nfs4_opendata *data = calldata;
1399
1400         data->rpc_status = task->tk_status;
1401         if (data->rpc_status == 0) {
1402                 nfs4_stateid_copy(&data->o_res.stateid, &data->c_res.stateid);
1403                 nfs_confirm_seqid(&data->owner->so_seqid, 0);
1404                 renew_lease(data->o_res.server, data->timestamp);
1405                 data->rpc_done = 1;
1406         }
1407 }
1408
1409 static void nfs4_open_confirm_release(void *calldata)
1410 {
1411         struct nfs4_opendata *data = calldata;
1412         struct nfs4_state *state = NULL;
1413
1414         /* If this request hasn't been cancelled, do nothing */
1415         if (data->cancelled == 0)
1416                 goto out_free;
1417         /* In case of error, no cleanup! */
1418         if (!data->rpc_done)
1419                 goto out_free;
1420         state = nfs4_opendata_to_nfs4_state(data);
1421         if (!IS_ERR(state))
1422                 nfs4_close_state(state, data->o_arg.fmode);
1423 out_free:
1424         nfs4_opendata_put(data);
1425 }
1426
1427 static const struct rpc_call_ops nfs4_open_confirm_ops = {
1428         .rpc_call_done = nfs4_open_confirm_done,
1429         .rpc_release = nfs4_open_confirm_release,
1430 };
1431
1432 /*
1433  * Note: On error, nfs4_proc_open_confirm will free the struct nfs4_opendata
1434  */
1435 static int _nfs4_proc_open_confirm(struct nfs4_opendata *data)
1436 {
1437         struct nfs_server *server = NFS_SERVER(data->dir->d_inode);
1438         struct rpc_task *task;
1439         struct  rpc_message msg = {
1440                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_OPEN_CONFIRM],
1441                 .rpc_argp = &data->c_arg,
1442                 .rpc_resp = &data->c_res,
1443                 .rpc_cred = data->owner->so_cred,
1444         };
1445         struct rpc_task_setup task_setup_data = {
1446                 .rpc_client = server->client,
1447                 .rpc_message = &msg,
1448                 .callback_ops = &nfs4_open_confirm_ops,
1449                 .callback_data = data,
1450                 .workqueue = nfsiod_workqueue,
1451                 .flags = RPC_TASK_ASYNC,
1452         };
1453         int status;
1454
1455         kref_get(&data->kref);
1456         data->rpc_done = 0;
1457         data->rpc_status = 0;
1458         data->timestamp = jiffies;
1459         task = rpc_run_task(&task_setup_data);
1460         if (IS_ERR(task))
1461                 return PTR_ERR(task);
1462         status = nfs4_wait_for_completion_rpc_task(task);
1463         if (status != 0) {
1464                 data->cancelled = 1;
1465                 smp_wmb();
1466         } else
1467                 status = data->rpc_status;
1468         rpc_put_task(task);
1469         return status;
1470 }
1471
1472 static void nfs4_open_prepare(struct rpc_task *task, void *calldata)
1473 {
1474         struct nfs4_opendata *data = calldata;
1475         struct nfs4_state_owner *sp = data->owner;
1476
1477         if (nfs_wait_on_sequence(data->o_arg.seqid, task) != 0)
1478                 return;
1479         /*
1480          * Check if we still need to send an OPEN call, or if we can use
1481          * a delegation instead.
1482          */
1483         if (data->state != NULL) {
1484                 struct nfs_delegation *delegation;
1485
1486                 if (can_open_cached(data->state, data->o_arg.fmode, data->o_arg.open_flags))
1487                         goto out_no_action;
1488                 rcu_read_lock();
1489                 delegation = rcu_dereference(NFS_I(data->state->inode)->delegation);
1490                 if (data->o_arg.claim != NFS4_OPEN_CLAIM_DELEGATE_CUR &&
1491                     can_open_delegated(delegation, data->o_arg.fmode))
1492                         goto unlock_no_action;
1493                 rcu_read_unlock();
1494         }
1495         /* Update client id. */
1496         data->o_arg.clientid = sp->so_server->nfs_client->cl_clientid;
1497         if (data->o_arg.claim == NFS4_OPEN_CLAIM_PREVIOUS) {
1498                 task->tk_msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_OPEN_NOATTR];
1499                 nfs_copy_fh(&data->o_res.fh, data->o_arg.fh);
1500         }
1501         data->timestamp = jiffies;
1502         if (nfs4_setup_sequence(data->o_arg.server,
1503                                 &data->o_arg.seq_args,
1504                                 &data->o_res.seq_res, task))
1505                 return;
1506         rpc_call_start(task);
1507         return;
1508 unlock_no_action:
1509         rcu_read_unlock();
1510 out_no_action:
1511         task->tk_action = NULL;
1512
1513 }
1514
1515 static void nfs4_recover_open_prepare(struct rpc_task *task, void *calldata)
1516 {
1517         rpc_task_set_priority(task, RPC_PRIORITY_PRIVILEGED);
1518         nfs4_open_prepare(task, calldata);
1519 }
1520
1521 static void nfs4_open_done(struct rpc_task *task, void *calldata)
1522 {
1523         struct nfs4_opendata *data = calldata;
1524
1525         data->rpc_status = task->tk_status;
1526
1527         if (!nfs4_sequence_done(task, &data->o_res.seq_res))
1528                 return;
1529
1530         if (task->tk_status == 0) {
1531                 switch (data->o_res.f_attr->mode & S_IFMT) {
1532                         case S_IFREG:
1533                                 break;
1534                         case S_IFLNK:
1535                                 data->rpc_status = -ELOOP;
1536                                 break;
1537                         case S_IFDIR:
1538                                 data->rpc_status = -EISDIR;
1539                                 break;
1540                         default:
1541                                 data->rpc_status = -ENOTDIR;
1542                 }
1543                 renew_lease(data->o_res.server, data->timestamp);
1544                 if (!(data->o_res.rflags & NFS4_OPEN_RESULT_CONFIRM))
1545                         nfs_confirm_seqid(&data->owner->so_seqid, 0);
1546         }
1547         data->rpc_done = 1;
1548 }
1549
1550 static void nfs4_open_release(void *calldata)
1551 {
1552         struct nfs4_opendata *data = calldata;
1553         struct nfs4_state *state = NULL;
1554
1555         /* If this request hasn't been cancelled, do nothing */
1556         if (data->cancelled == 0)
1557                 goto out_free;
1558         /* In case of error, no cleanup! */
1559         if (data->rpc_status != 0 || !data->rpc_done)
1560                 goto out_free;
1561         /* In case we need an open_confirm, no cleanup! */
1562         if (data->o_res.rflags & NFS4_OPEN_RESULT_CONFIRM)
1563                 goto out_free;
1564         state = nfs4_opendata_to_nfs4_state(data);
1565         if (!IS_ERR(state))
1566                 nfs4_close_state(state, data->o_arg.fmode);
1567 out_free:
1568         nfs4_opendata_put(data);
1569 }
1570
1571 static const struct rpc_call_ops nfs4_open_ops = {
1572         .rpc_call_prepare = nfs4_open_prepare,
1573         .rpc_call_done = nfs4_open_done,
1574         .rpc_release = nfs4_open_release,
1575 };
1576
1577 static const struct rpc_call_ops nfs4_recover_open_ops = {
1578         .rpc_call_prepare = nfs4_recover_open_prepare,
1579         .rpc_call_done = nfs4_open_done,
1580         .rpc_release = nfs4_open_release,
1581 };
1582
1583 static int nfs4_run_open_task(struct nfs4_opendata *data, int isrecover)
1584 {
1585         struct inode *dir = data->dir->d_inode;
1586         struct nfs_server *server = NFS_SERVER(dir);
1587         struct nfs_openargs *o_arg = &data->o_arg;
1588         struct nfs_openres *o_res = &data->o_res;
1589         struct rpc_task *task;
1590         struct rpc_message msg = {
1591                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_OPEN],
1592                 .rpc_argp = o_arg,
1593                 .rpc_resp = o_res,
1594                 .rpc_cred = data->owner->so_cred,
1595         };
1596         struct rpc_task_setup task_setup_data = {
1597                 .rpc_client = server->client,
1598                 .rpc_message = &msg,
1599                 .callback_ops = &nfs4_open_ops,
1600                 .callback_data = data,
1601                 .workqueue = nfsiod_workqueue,
1602                 .flags = RPC_TASK_ASYNC,
1603         };
1604         int status;
1605
1606         nfs41_init_sequence(&o_arg->seq_args, &o_res->seq_res, 1);
1607         kref_get(&data->kref);
1608         data->rpc_done = 0;
1609         data->rpc_status = 0;
1610         data->cancelled = 0;
1611         if (isrecover)
1612                 task_setup_data.callback_ops = &nfs4_recover_open_ops;
1613         task = rpc_run_task(&task_setup_data);
1614         if (IS_ERR(task))
1615                 return PTR_ERR(task);
1616         status = nfs4_wait_for_completion_rpc_task(task);
1617         if (status != 0) {
1618                 data->cancelled = 1;
1619                 smp_wmb();
1620         } else
1621                 status = data->rpc_status;
1622         rpc_put_task(task);
1623
1624         return status;
1625 }
1626
1627 static int _nfs4_recover_proc_open(struct nfs4_opendata *data)
1628 {
1629         struct inode *dir = data->dir->d_inode;
1630         struct nfs_openres *o_res = &data->o_res;
1631         int status;
1632
1633         status = nfs4_run_open_task(data, 1);
1634         if (status != 0 || !data->rpc_done)
1635                 return status;
1636
1637         nfs_fattr_map_and_free_names(NFS_SERVER(dir), &data->f_attr);
1638
1639         if (o_res->rflags & NFS4_OPEN_RESULT_CONFIRM) {
1640                 status = _nfs4_proc_open_confirm(data);
1641                 if (status != 0)
1642                         return status;
1643         }
1644
1645         return status;
1646 }
1647
1648 /*
1649  * Note: On error, nfs4_proc_open will free the struct nfs4_opendata
1650  */
1651 static int _nfs4_proc_open(struct nfs4_opendata *data)
1652 {
1653         struct inode *dir = data->dir->d_inode;
1654         struct nfs_server *server = NFS_SERVER(dir);
1655         struct nfs_openargs *o_arg = &data->o_arg;
1656         struct nfs_openres *o_res = &data->o_res;
1657         int status;
1658
1659         status = nfs4_run_open_task(data, 0);
1660         if (!data->rpc_done)
1661                 return status;
1662         if (status != 0) {
1663                 if (status == -NFS4ERR_BADNAME &&
1664                                 !(o_arg->open_flags & O_CREAT))
1665                         return -ENOENT;
1666                 return status;
1667         }
1668
1669         nfs_fattr_map_and_free_names(server, &data->f_attr);
1670
1671         if (o_arg->open_flags & O_CREAT)
1672                 update_changeattr(dir, &o_res->cinfo);
1673         if ((o_res->rflags & NFS4_OPEN_RESULT_LOCKTYPE_POSIX) == 0)
1674                 server->caps &= ~NFS_CAP_POSIX_LOCK;
1675         if(o_res->rflags & NFS4_OPEN_RESULT_CONFIRM) {
1676                 status = _nfs4_proc_open_confirm(data);
1677                 if (status != 0)
1678                         return status;
1679         }
1680         if (!(o_res->f_attr->valid & NFS_ATTR_FATTR))
1681                 _nfs4_proc_getattr(server, &o_res->fh, o_res->f_attr);
1682         return 0;
1683 }
1684
1685 static int nfs4_client_recover_expired_lease(struct nfs_client *clp)
1686 {
1687         unsigned int loop;
1688         int ret;
1689
1690         for (loop = NFS4_MAX_LOOP_ON_RECOVER; loop != 0; loop--) {
1691                 ret = nfs4_wait_clnt_recover(clp);
1692                 if (ret != 0)
1693                         break;
1694                 if (!test_bit(NFS4CLNT_LEASE_EXPIRED, &clp->cl_state) &&
1695                     !test_bit(NFS4CLNT_CHECK_LEASE,&clp->cl_state))
1696                         break;
1697                 nfs4_schedule_state_manager(clp);
1698                 ret = -EIO;
1699         }
1700         return ret;
1701 }
1702
1703 static int nfs4_recover_expired_lease(struct nfs_server *server)
1704 {
1705         return nfs4_client_recover_expired_lease(server->nfs_client);
1706 }
1707
1708 /*
1709  * OPEN_EXPIRED:
1710  *      reclaim state on the server after a network partition.
1711  *      Assumes caller holds the appropriate lock
1712  */
1713 static int _nfs4_open_expired(struct nfs_open_context *ctx, struct nfs4_state *state)
1714 {
1715         struct nfs4_opendata *opendata;
1716         int ret;
1717
1718         opendata = nfs4_open_recoverdata_alloc(ctx, state);
1719         if (IS_ERR(opendata))
1720                 return PTR_ERR(opendata);
1721         ret = nfs4_open_recover(opendata, state);
1722         if (ret == -ESTALE)
1723                 d_drop(ctx->dentry);
1724         nfs4_opendata_put(opendata);
1725         return ret;
1726 }
1727
1728 static int nfs4_do_open_expired(struct nfs_open_context *ctx, struct nfs4_state *state)
1729 {
1730         struct nfs_server *server = NFS_SERVER(state->inode);
1731         struct nfs4_exception exception = { };
1732         int err;
1733
1734         do {
1735                 err = _nfs4_open_expired(ctx, state);
1736                 switch (err) {
1737                 default:
1738                         goto out;
1739                 case -NFS4ERR_GRACE:
1740                 case -NFS4ERR_DELAY:
1741                         nfs4_handle_exception(server, err, &exception);
1742                         err = 0;
1743                 }
1744         } while (exception.retry);
1745 out:
1746         return err;
1747 }
1748
/*
 * Look up an open context for @state and run expired-open recovery with it.
 * Returns the lookup error if no context can be found, otherwise the
 * result of nfs4_do_open_expired().
 */
static int nfs4_open_expired(struct nfs4_state_owner *sp, struct nfs4_state *state)
{
	struct nfs_open_context *ctx = nfs4_state_find_open_context(state);
	int ret;

	if (IS_ERR(ctx))
		return PTR_ERR(ctx);

	ret = nfs4_do_open_expired(ctx, state);
	put_nfs_open_context(ctx);
	return ret;
}
1761
1762 #if defined(CONFIG_NFS_V4_1)
1763 static void nfs41_clear_delegation_stateid(struct nfs4_state *state)
1764 {
1765         struct nfs_server *server = NFS_SERVER(state->inode);
1766         nfs4_stateid *stateid = &state->stateid;
1767         int status;
1768
1769         /* If a state reset has been done, test_stateid is unneeded */
1770         if (test_bit(NFS_DELEGATED_STATE, &state->flags) == 0)
1771                 return;
1772
1773         status = nfs41_test_stateid(server, stateid);
1774         if (status != NFS_OK) {
1775                 /* Free the stateid unless the server explicitly
1776                  * informs us the stateid is unrecognized. */
1777                 if (status != -NFS4ERR_BAD_STATEID)
1778                         nfs41_free_stateid(server, stateid);
1779
1780                 clear_bit(NFS_DELEGATED_STATE, &state->flags);
1781         }
1782 }
1783
1784 /**
1785  * nfs41_check_open_stateid - possibly free an open stateid
1786  *
1787  * @state: NFSv4 state for an inode
1788  *
1789  * Returns NFS_OK if recovery for this stateid is now finished.
1790  * Otherwise a negative NFS4ERR value is returned.
1791  */
1792 static int nfs41_check_open_stateid(struct nfs4_state *state)
1793 {
1794         struct nfs_server *server = NFS_SERVER(state->inode);
1795         nfs4_stateid *stateid = &state->stateid;
1796         int status;
1797
1798         /* If a state reset has been done, test_stateid is unneeded */
1799         if ((test_bit(NFS_O_RDONLY_STATE, &state->flags) == 0) &&
1800             (test_bit(NFS_O_WRONLY_STATE, &state->flags) == 0) &&
1801             (test_bit(NFS_O_RDWR_STATE, &state->flags) == 0))
1802                 return -NFS4ERR_BAD_STATEID;
1803
1804         status = nfs41_test_stateid(server, stateid);
1805         if (status != NFS_OK) {
1806                 /* Free the stateid unless the server explicitly
1807                  * informs us the stateid is unrecognized. */
1808                 if (status != -NFS4ERR_BAD_STATEID)
1809                         nfs41_free_stateid(server, stateid);
1810
1811                 clear_bit(NFS_O_RDONLY_STATE, &state->flags);
1812                 clear_bit(NFS_O_WRONLY_STATE, &state->flags);
1813                 clear_bit(NFS_O_RDWR_STATE, &state->flags);
1814         }
1815         return status;
1816 }
1817
1818 static int nfs41_open_expired(struct nfs4_state_owner *sp, struct nfs4_state *state)
1819 {
1820         int status;
1821
1822         nfs41_clear_delegation_stateid(state);
1823         status = nfs41_check_open_stateid(state);
1824         if (status != NFS_OK)
1825                 status = nfs4_open_expired(sp, state);
1826         return status;
1827 }
1828 #endif
1829
1830 /*
1831  * on an EXCLUSIVE create, the server should send back a bitmask with FATTR4-*
1832  * fields corresponding to attributes that were used to store the verifier.
1833  * Make sure we clobber those fields in the later setattr call
1834  */
1835 static inline void nfs4_exclusive_attrset(struct nfs4_opendata *opendata, struct iattr *sattr)
1836 {
1837         if ((opendata->o_res.attrset[1] & FATTR4_WORD1_TIME_ACCESS) &&
1838             !(sattr->ia_valid & ATTR_ATIME_SET))
1839                 sattr->ia_valid |= ATTR_ATIME;
1840
1841         if ((opendata->o_res.attrset[1] & FATTR4_WORD1_TIME_MODIFY) &&
1842             !(sattr->ia_valid & ATTR_MTIME_SET))
1843                 sattr->ia_valid |= ATTR_MTIME;
1844 }
1845
1846 /*
1847  * Returns a referenced nfs4_state
1848  */
1849 static int _nfs4_do_open(struct inode *dir,
1850                         struct dentry *dentry,
1851                         fmode_t fmode,
1852                         int flags,
1853                         struct iattr *sattr,
1854                         struct rpc_cred *cred,
1855                         struct nfs4_state **res,
1856                         struct nfs4_threshold **ctx_th)
1857 {
1858         struct nfs4_state_owner  *sp;
1859         struct nfs4_state     *state = NULL;
1860         struct nfs_server       *server = NFS_SERVER(dir);
1861         struct nfs4_opendata *opendata;
1862         int status;
1863
1864         /* Protect against reboot recovery conflicts */
1865         status = -ENOMEM;
1866         sp = nfs4_get_state_owner(server, cred, GFP_KERNEL);
1867         if (sp == NULL) {
1868                 dprintk("nfs4_do_open: nfs4_get_state_owner failed!\n");
1869                 goto out_err;
1870         }
1871         status = nfs4_recover_expired_lease(server);
1872         if (status != 0)
1873                 goto err_put_state_owner;
1874         if (dentry->d_inode != NULL)
1875                 nfs4_return_incompatible_delegation(dentry->d_inode, fmode);
1876         status = -ENOMEM;
1877         opendata = nfs4_opendata_alloc(dentry, sp, fmode, flags, sattr, GFP_KERNEL);
1878         if (opendata == NULL)
1879                 goto err_put_state_owner;
1880
1881         if (ctx_th && server->attr_bitmask[2] & FATTR4_WORD2_MDSTHRESHOLD) {
1882                 opendata->f_attr.mdsthreshold = pnfs_mdsthreshold_alloc();
1883                 if (!opendata->f_attr.mdsthreshold)
1884                         goto err_opendata_put;
1885                 opendata->o_arg.open_bitmap = &nfs4_pnfs_open_bitmap[0];
1886         }
1887         if (dentry->d_inode != NULL)
1888                 opendata->state = nfs4_get_open_state(dentry->d_inode, sp);
1889
1890         status = _nfs4_proc_open(opendata);
1891         if (status != 0)
1892                 goto err_opendata_put;
1893
1894         state = nfs4_opendata_to_nfs4_state(opendata);
1895         status = PTR_ERR(state);
1896         if (IS_ERR(state))
1897                 goto err_opendata_put;
1898         if (server->caps & NFS_CAP_POSIX_LOCK)
1899                 set_bit(NFS_STATE_POSIX_LOCKS, &state->flags);
1900
1901         if (opendata->o_arg.open_flags & O_EXCL) {
1902                 nfs4_exclusive_attrset(opendata, sattr);
1903
1904                 nfs_fattr_init(opendata->o_res.f_attr);
1905                 status = nfs4_do_setattr(state->inode, cred,
1906                                 opendata->o_res.f_attr, sattr,
1907                                 state);
1908                 if (status == 0)
1909                         nfs_setattr_update_inode(state->inode, sattr);
1910                 nfs_post_op_update_inode(state->inode, opendata->o_res.f_attr);
1911         }
1912
1913         if (pnfs_use_threshold(ctx_th, opendata->f_attr.mdsthreshold, server))
1914                 *ctx_th = opendata->f_attr.mdsthreshold;
1915         else
1916                 kfree(opendata->f_attr.mdsthreshold);
1917         opendata->f_attr.mdsthreshold = NULL;
1918
1919         nfs4_opendata_put(opendata);
1920         nfs4_put_state_owner(sp);
1921         *res = state;
1922         return 0;
1923 err_opendata_put:
1924         kfree(opendata->f_attr.mdsthreshold);
1925         nfs4_opendata_put(opendata);
1926 err_put_state_owner:
1927         nfs4_put_state_owner(sp);
1928 out_err:
1929         *res = NULL;
1930         return status;
1931 }
1932
1933
1934 static struct nfs4_state *nfs4_do_open(struct inode *dir,
1935                                         struct dentry *dentry,
1936                                         fmode_t fmode,
1937                                         int flags,
1938                                         struct iattr *sattr,
1939                                         struct rpc_cred *cred,
1940                                         struct nfs4_threshold **ctx_th)
1941 {
1942         struct nfs4_exception exception = { };
1943         struct nfs4_state *res;
1944         int status;
1945
1946         fmode &= FMODE_READ|FMODE_WRITE;
1947         do {
1948                 status = _nfs4_do_open(dir, dentry, fmode, flags, sattr, cred,
1949                                        &res, ctx_th);
1950                 if (status == 0)
1951                         break;
1952                 /* NOTE: BAD_SEQID means the server and client disagree about the
1953                  * book-keeping w.r.t. state-changing operations
1954                  * (OPEN/CLOSE/LOCK/LOCKU...)
1955                  * It is actually a sign of a bug on the client or on the server.
1956                  *
1957                  * If we receive a BAD_SEQID error in the particular case of
1958                  * doing an OPEN, we assume that nfs_increment_open_seqid() will
1959                  * have unhashed the old state_owner for us, and that we can
1960                  * therefore safely retry using a new one. We should still warn
1961                  * the user though...
1962                  */
1963                 if (status == -NFS4ERR_BAD_SEQID) {
1964                         pr_warn_ratelimited("NFS: v4 server %s "
1965                                         " returned a bad sequence-id error!\n",
1966                                         NFS_SERVER(dir)->nfs_client->cl_hostname);
1967                         exception.retry = 1;
1968                         continue;
1969                 }
1970                 /*
1971                  * BAD_STATEID on OPEN means that the server cancelled our
1972                  * state before it received the OPEN_CONFIRM.
1973                  * Recover by retrying the request as per the discussion
1974                  * on Page 181 of RFC3530.
1975                  */
1976                 if (status == -NFS4ERR_BAD_STATEID) {
1977                         exception.retry = 1;
1978                         continue;
1979                 }
1980                 if (status == -EAGAIN) {
1981                         /* We must have found a delegation */
1982                         exception.retry = 1;
1983                         continue;
1984                 }
1985                 res = ERR_PTR(nfs4_handle_exception(NFS_SERVER(dir),
1986                                         status, &exception));
1987         } while (exception.retry);
1988         return res;
1989 }
1990
1991 static int _nfs4_do_setattr(struct inode *inode, struct rpc_cred *cred,
1992                             struct nfs_fattr *fattr, struct iattr *sattr,
1993                             struct nfs4_state *state)
1994 {
1995         struct nfs_server *server = NFS_SERVER(inode);
1996         struct nfs_setattrargs  arg = {
1997                 .fh             = NFS_FH(inode),
1998                 .iap            = sattr,
1999                 .server         = server,
2000                 .bitmask = server->attr_bitmask,
2001         };
2002         struct nfs_setattrres  res = {
2003                 .fattr          = fattr,
2004                 .server         = server,
2005         };
2006         struct rpc_message msg = {
2007                 .rpc_proc       = &nfs4_procedures[NFSPROC4_CLNT_SETATTR],
2008                 .rpc_argp       = &arg,
2009                 .rpc_resp       = &res,
2010                 .rpc_cred       = cred,
2011         };
2012         unsigned long timestamp = jiffies;
2013         int status;
2014
2015         nfs_fattr_init(fattr);
2016
2017         if (state != NULL) {
2018                 nfs4_select_rw_stateid(&arg.stateid, state, FMODE_WRITE,
2019                                 current->files, current->tgid);
2020         } else if (nfs4_copy_delegation_stateid(&arg.stateid, inode,
2021                                 FMODE_WRITE)) {
2022                 /* Use that stateid */
2023         } else
2024                 nfs4_stateid_copy(&arg.stateid, &zero_stateid);
2025
2026         status = nfs4_call_sync(server->client, server, &msg, &arg.seq_args, &res.seq_res, 1);
2027         if (status == 0 && state != NULL)
2028                 renew_lease(server, timestamp);
2029         return status;
2030 }
2031
2032 static int nfs4_do_setattr(struct inode *inode, struct rpc_cred *cred,
2033                            struct nfs_fattr *fattr, struct iattr *sattr,
2034                            struct nfs4_state *state)
2035 {
2036         struct nfs_server *server = NFS_SERVER(inode);
2037         struct nfs4_exception exception = {
2038                 .state = state,
2039                 .inode = inode,
2040         };
2041         int err;
2042         do {
2043                 err = _nfs4_do_setattr(inode, cred, fattr, sattr, state);
2044                 switch (err) {
2045                 case -NFS4ERR_OPENMODE:
2046                         if (state && !(state->state & FMODE_WRITE)) {
2047                                 err = -EBADF;
2048                                 if (sattr->ia_valid & ATTR_OPEN)
2049                                         err = -EACCES;
2050                                 goto out;
2051                         }
2052                 }
2053                 err = nfs4_handle_exception(server, err, &exception);
2054         } while (exception.retry);
2055 out:
2056         return err;
2057 }
2058
2059 struct nfs4_closedata {
2060         struct inode *inode;
2061         struct nfs4_state *state;
2062         struct nfs_closeargs arg;
2063         struct nfs_closeres res;
2064         struct nfs_fattr fattr;
2065         unsigned long timestamp;
2066         bool roc;
2067         u32 roc_barrier;
2068 };
2069
2070 static void nfs4_free_closedata(void *data)
2071 {
2072         struct nfs4_closedata *calldata = data;
2073         struct nfs4_state_owner *sp = calldata->state->owner;
2074         struct super_block *sb = calldata->state->inode->i_sb;
2075
2076         if (calldata->roc)
2077                 pnfs_roc_release(calldata->state->inode);
2078         nfs4_put_open_state(calldata->state);
2079         nfs_free_seqid(calldata->arg.seqid);
2080         nfs4_put_state_owner(sp);
2081         nfs_sb_deactive(sb);
2082         kfree(calldata);
2083 }
2084
2085 static void nfs4_close_clear_stateid_flags(struct nfs4_state *state,
2086                 fmode_t fmode)
2087 {
2088         spin_lock(&state->owner->so_lock);
2089         if (!(fmode & FMODE_READ))
2090                 clear_bit(NFS_O_RDONLY_STATE, &state->flags);
2091         if (!(fmode & FMODE_WRITE))
2092                 clear_bit(NFS_O_WRONLY_STATE, &state->flags);
2093         clear_bit(NFS_O_RDWR_STATE, &state->flags);
2094         spin_unlock(&state->owner->so_lock);
2095 }
2096
2097 static void nfs4_close_done(struct rpc_task *task, void *data)
2098 {
2099         struct nfs4_closedata *calldata = data;
2100         struct nfs4_state *state = calldata->state;
2101         struct nfs_server *server = NFS_SERVER(calldata->inode);
2102
2103         dprintk("%s: begin!\n", __func__);
2104         if (!nfs4_sequence_done(task, &calldata->res.seq_res))
2105                 return;
2106         /* hmm. we are done with the inode, and in the process of freeing
2107          * the state_owner. we keep this around to process errors
2108          */
2109         switch (task->tk_status) {
2110                 case 0:
2111                         if (calldata->roc)
2112                                 pnfs_roc_set_barrier(state->inode,
2113                                                      calldata->roc_barrier);
2114                         nfs_set_open_stateid(state, &calldata->res.stateid, 0);
2115                         renew_lease(server, calldata->timestamp);
2116                         nfs4_close_clear_stateid_flags(state,
2117                                         calldata->arg.fmode);
2118                         break;
2119                 case -NFS4ERR_STALE_STATEID:
2120                 case -NFS4ERR_OLD_STATEID:
2121                 case -NFS4ERR_BAD_STATEID:
2122                 case -NFS4ERR_EXPIRED:
2123                         if (calldata->arg.fmode == 0)
2124                                 break;
2125                 default:
2126                         if (nfs4_async_handle_error(task, server, state) == -EAGAIN)
2127                                 rpc_restart_call_prepare(task);
2128         }
2129         nfs_release_seqid(calldata->arg.seqid);
2130         nfs_refresh_inode(calldata->inode, calldata->res.fattr);
2131         dprintk("%s: done, ret = %d!\n", __func__, task->tk_status);
2132 }
2133
2134 static void nfs4_close_prepare(struct rpc_task *task, void *data)
2135 {
2136         struct nfs4_closedata *calldata = data;
2137         struct nfs4_state *state = calldata->state;
2138         int call_close = 0;
2139
2140         dprintk("%s: begin!\n", __func__);
2141         if (nfs_wait_on_sequence(calldata->arg.seqid, task) != 0)
2142                 return;
2143
2144         task->tk_msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_OPEN_DOWNGRADE];
2145         calldata->arg.fmode = FMODE_READ|FMODE_WRITE;
2146         spin_lock(&state->owner->so_lock);
2147         /* Calculate the change in open mode */
2148         if (state->n_rdwr == 0) {
2149                 if (state->n_rdonly == 0) {
2150                         call_close |= test_bit(NFS_O_RDONLY_STATE, &state->flags);
2151                         call_close |= test_bit(NFS_O_RDWR_STATE, &state->flags);
2152                         calldata->arg.fmode &= ~FMODE_READ;
2153                 }
2154                 if (state->n_wronly == 0) {
2155                         call_close |= test_bit(NFS_O_WRONLY_STATE, &state->flags);
2156                         call_close |= test_bit(NFS_O_RDWR_STATE, &state->flags);
2157                         calldata->arg.fmode &= ~FMODE_WRITE;
2158                 }
2159         }
2160         spin_unlock(&state->owner->so_lock);
2161
2162         if (!call_close) {
2163                 /* Note: exit _without_ calling nfs4_close_done */
2164                 task->tk_action = NULL;
2165                 goto out;
2166         }
2167
2168         if (calldata->arg.fmode == 0) {
2169                 task->tk_msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_CLOSE];
2170                 if (calldata->roc &&
2171                     pnfs_roc_drain(calldata->inode, &calldata->roc_barrier)) {
2172                         rpc_sleep_on(&NFS_SERVER(calldata->inode)->roc_rpcwaitq,
2173                                      task, NULL);
2174                         goto out;
2175                 }
2176         }
2177
2178         nfs_fattr_init(calldata->res.fattr);
2179         calldata->timestamp = jiffies;
2180         if (nfs4_setup_sequence(NFS_SERVER(calldata->inode),
2181                                 &calldata->arg.seq_args,
2182                                 &calldata->res.seq_res,
2183                                 task))
2184                 goto out;
2185         rpc_call_start(task);
2186 out:
2187         dprintk("%s: done!\n", __func__);
2188 }
2189
2190 static const struct rpc_call_ops nfs4_close_ops = {
2191         .rpc_call_prepare = nfs4_close_prepare,
2192         .rpc_call_done = nfs4_close_done,
2193         .rpc_release = nfs4_free_closedata,
2194 };
2195
2196 /* 
2197  * It is possible for data to be read/written from a mem-mapped file 
2198  * after the sys_close call (which hits the vfs layer as a flush).
2199  * This means that we can't safely call nfsv4 close on a file until 
2200  * the inode is cleared. This in turn means that we are not good
2201  * NFSv4 citizens - we do not indicate to the server to update the file's 
2202  * share state even when we are done with one of the three share 
2203  * stateid's in the inode.
2204  *
2205  * NOTE: Caller must be holding the sp->so_owner semaphore!
2206  */
2207 int nfs4_do_close(struct nfs4_state *state, gfp_t gfp_mask, int wait, bool roc)
2208 {
2209         struct nfs_server *server = NFS_SERVER(state->inode);
2210         struct nfs4_closedata *calldata;
2211         struct nfs4_state_owner *sp = state->owner;
2212         struct rpc_task *task;
2213         struct rpc_message msg = {
2214                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_CLOSE],
2215                 .rpc_cred = state->owner->so_cred,
2216         };
2217         struct rpc_task_setup task_setup_data = {
2218                 .rpc_client = server->client,
2219                 .rpc_message = &msg,
2220                 .callback_ops = &nfs4_close_ops,
2221                 .workqueue = nfsiod_workqueue,
2222                 .flags = RPC_TASK_ASYNC,
2223         };
2224         int status = -ENOMEM;
2225
2226         calldata = kzalloc(sizeof(*calldata), gfp_mask);
2227         if (calldata == NULL)
2228                 goto out;
2229         nfs41_init_sequence(&calldata->arg.seq_args, &calldata->res.seq_res, 1);
2230         calldata->inode = state->inode;
2231         calldata->state = state;
2232         calldata->arg.fh = NFS_FH(state->inode);
2233         calldata->arg.stateid = &state->open_stateid;
2234         /* Serialization for the sequence id */
2235         calldata->arg.seqid = nfs_alloc_seqid(&state->owner->so_seqid, gfp_mask);
2236         if (calldata->arg.seqid == NULL)
2237                 goto out_free_calldata;
2238         calldata->arg.fmode = 0;
2239         calldata->arg.bitmask = server->cache_consistency_bitmask;
2240         calldata->res.fattr = &calldata->fattr;
2241         calldata->res.seqid = calldata->arg.seqid;
2242         calldata->res.server = server;
2243         calldata->roc = roc;
2244         nfs_sb_active(calldata->inode->i_sb);
2245
2246         msg.rpc_argp = &calldata->arg;
2247         msg.rpc_resp = &calldata->res;
2248         task_setup_data.callback_data = calldata;
2249         task = rpc_run_task(&task_setup_data);
2250         if (IS_ERR(task))
2251                 return PTR_ERR(task);
2252         status = 0;
2253         if (wait)
2254                 status = rpc_wait_for_completion_task(task);
2255         rpc_put_task(task);
2256         return status;
2257 out_free_calldata:
2258         kfree(calldata);
2259 out:
2260         if (roc)
2261                 pnfs_roc_release(state->inode);
2262         nfs4_put_open_state(state);
2263         nfs4_put_state_owner(sp);
2264         return status;
2265 }
2266
2267 static struct inode *
2268 nfs4_atomic_open(struct inode *dir, struct nfs_open_context *ctx, int open_flags, struct iattr *attr)
2269 {
2270         struct nfs4_state *state;
2271
2272         /* Protect against concurrent sillydeletes */
2273         state = nfs4_do_open(dir, ctx->dentry, ctx->mode, open_flags, attr,
2274                              ctx->cred, &ctx->mdsthreshold);
2275         if (IS_ERR(state))
2276                 return ERR_CAST(state);
2277         ctx->state = state;
2278         return igrab(state->inode);
2279 }
2280
2281 static void nfs4_close_context(struct nfs_open_context *ctx, int is_sync)
2282 {
2283         if (ctx->state == NULL)
2284                 return;
2285         if (is_sync)
2286                 nfs4_close_sync(ctx->state, ctx->mode);
2287         else
2288                 nfs4_close_state(ctx->state, ctx->mode);
2289 }
2290
2291 static int _nfs4_server_capabilities(struct nfs_server *server, struct nfs_fh *fhandle)
2292 {
2293         struct nfs4_server_caps_arg args = {
2294                 .fhandle = fhandle,
2295         };
2296         struct nfs4_server_caps_res res = {};
2297         struct rpc_message msg = {
2298                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SERVER_CAPS],
2299                 .rpc_argp = &args,
2300                 .rpc_resp = &res,
2301         };
2302         int status;
2303
2304         status = nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
2305         if (status == 0) {
2306                 memcpy(server->attr_bitmask, res.attr_bitmask, sizeof(server->attr_bitmask));
2307                 server->caps &= ~(NFS_CAP_ACLS|NFS_CAP_HARDLINKS|
2308                                 NFS_CAP_SYMLINKS|NFS_CAP_FILEID|
2309                                 NFS_CAP_MODE|NFS_CAP_NLINK|NFS_CAP_OWNER|
2310                                 NFS_CAP_OWNER_GROUP|NFS_CAP_ATIME|
2311                                 NFS_CAP_CTIME|NFS_CAP_MTIME);
2312                 if (res.attr_bitmask[0] & FATTR4_WORD0_ACL)
2313                         server->caps |= NFS_CAP_ACLS;
2314                 if (res.has_links != 0)
2315                         server->caps |= NFS_CAP_HARDLINKS;
2316                 if (res.has_symlinks != 0)
2317                         server->caps |= NFS_CAP_SYMLINKS;
2318                 if (res.attr_bitmask[0] & FATTR4_WORD0_FILEID)
2319                         server->caps |= NFS_CAP_FILEID;
2320                 if (res.attr_bitmask[1] & FATTR4_WORD1_MODE)
2321                         server->caps |= NFS_CAP_MODE;
2322                 if (res.attr_bitmask[1] & FATTR4_WORD1_NUMLINKS)
2323                         server->caps |= NFS_CAP_NLINK;
2324                 if (res.attr_bitmask[1] & FATTR4_WORD1_OWNER)
2325                         server->caps |= NFS_CAP_OWNER;
2326                 if (res.attr_bitmask[1] & FATTR4_WORD1_OWNER_GROUP)
2327                         server->caps |= NFS_CAP_OWNER_GROUP;
2328                 if (res.attr_bitmask[1] & FATTR4_WORD1_TIME_ACCESS)
2329                         server->caps |= NFS_CAP_ATIME;
2330                 if (res.attr_bitmask[1] & FATTR4_WORD1_TIME_METADATA)
2331                         server->caps |= NFS_CAP_CTIME;
2332                 if (res.attr_bitmask[1] & FATTR4_WORD1_TIME_MODIFY)
2333                         server->caps |= NFS_CAP_MTIME;
2334
2335                 memcpy(server->cache_consistency_bitmask, res.attr_bitmask, sizeof(server->cache_consistency_bitmask));
2336                 server->cache_consistency_bitmask[0] &= FATTR4_WORD0_CHANGE|FATTR4_WORD0_SIZE;
2337                 server->cache_consistency_bitmask[1] &= FATTR4_WORD1_TIME_METADATA|FATTR4_WORD1_TIME_MODIFY;
2338                 server->acl_bitmask = res.acl_bitmask;
2339                 server->fh_expire_type = res.fh_expire_type;
2340         }
2341
2342         return status;
2343 }
2344
2345 int nfs4_server_capabilities(struct nfs_server *server, struct nfs_fh *fhandle)
2346 {
2347         struct nfs4_exception exception = { };
2348         int err;
2349         do {
2350                 err = nfs4_handle_exception(server,
2351                                 _nfs4_server_capabilities(server, fhandle),
2352                                 &exception);
2353         } while (exception.retry);
2354         return err;
2355 }
2356
2357 static int _nfs4_lookup_root(struct nfs_server *server, struct nfs_fh *fhandle,
2358                 struct nfs_fsinfo *info)
2359 {
2360         struct nfs4_lookup_root_arg args = {
2361                 .bitmask = nfs4_fattr_bitmap,
2362         };
2363         struct nfs4_lookup_res res = {
2364                 .server = server,
2365                 .fattr = info->fattr,
2366                 .fh = fhandle,
2367         };
2368         struct rpc_message msg = {
2369                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LOOKUP_ROOT],
2370                 .rpc_argp = &args,
2371                 .rpc_resp = &res,
2372         };
2373
2374         nfs_fattr_init(info->fattr);
2375         return nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
2376 }
2377
2378 static int nfs4_lookup_root(struct nfs_server *server, struct nfs_fh *fhandle,
2379                 struct nfs_fsinfo *info)
2380 {
2381         struct nfs4_exception exception = { };
2382         int err;
2383         do {
2384                 err = _nfs4_lookup_root(server, fhandle, info);
2385                 switch (err) {
2386                 case 0:
2387                 case -NFS4ERR_WRONGSEC:
2388                         goto out;
2389                 default:
2390                         err = nfs4_handle_exception(server, err, &exception);
2391                 }
2392         } while (exception.retry);
2393 out:
2394         return err;
2395 }
2396
2397 static int nfs4_lookup_root_sec(struct nfs_server *server, struct nfs_fh *fhandle,
2398                                 struct nfs_fsinfo *info, rpc_authflavor_t flavor)
2399 {
2400         struct rpc_auth *auth;
2401         int ret;
2402
2403         auth = rpcauth_create(flavor, server->client);
2404         if (!auth) {
2405                 ret = -EIO;
2406                 goto out;
2407         }
2408         ret = nfs4_lookup_root(server, fhandle, info);
2409 out:
2410         return ret;
2411 }
2412
2413 static int nfs4_find_root_sec(struct nfs_server *server, struct nfs_fh *fhandle,
2414                               struct nfs_fsinfo *info)
2415 {
2416         int i, len, status = 0;
2417         rpc_authflavor_t flav_array[NFS_MAX_SECFLAVORS];
2418
2419         len = rpcauth_list_flavors(flav_array, ARRAY_SIZE(flav_array));
2420         BUG_ON(len < 0);
2421
2422         for (i = 0; i < len; i++) {
2423                 /* AUTH_UNIX is the default flavor if none was specified,
2424                  * thus has already been tried. */
2425                 if (flav_array[i] == RPC_AUTH_UNIX)
2426                         continue;
2427
2428                 status = nfs4_lookup_root_sec(server, fhandle, info, flav_array[i]);
2429                 if (status == -NFS4ERR_WRONGSEC || status == -EACCES)
2430                         continue;
2431                 break;
2432         }
2433         /*
2434          * -EACCESS could mean that the user doesn't have correct permissions
2435          * to access the mount.  It could also mean that we tried to mount
2436          * with a gss auth flavor, but rpc.gssd isn't running.  Either way,
2437          * existing mount programs don't handle -EACCES very well so it should
2438          * be mapped to -EPERM instead.
2439          */
2440         if (status == -EACCES)
2441                 status = -EPERM;
2442         return status;
2443 }
2444
2445 /*
2446  * get the file handle for the "/" directory on the server
2447  */
2448 int nfs4_proc_get_rootfh(struct nfs_server *server, struct nfs_fh *fhandle,
2449                          struct nfs_fsinfo *info)
2450 {
2451         int minor_version = server->nfs_client->cl_minorversion;
2452         int status = nfs4_lookup_root(server, fhandle, info);
2453         if ((status == -NFS4ERR_WRONGSEC) && !(server->flags & NFS_MOUNT_SECFLAVOUR))
2454                 /*
2455                  * A status of -NFS4ERR_WRONGSEC will be mapped to -EPERM
2456                  * by nfs4_map_errors() as this function exits.
2457                  */
2458                 status = nfs_v4_minor_ops[minor_version]->find_root_sec(server, fhandle, info);
2459         if (status == 0)
2460                 status = nfs4_server_capabilities(server, fhandle);
2461         if (status == 0)
2462                 status = nfs4_do_fsinfo(server, fhandle, info);
2463         return nfs4_map_errors(status);
2464 }
2465
2466 static int nfs4_proc_get_root(struct nfs_server *server, struct nfs_fh *mntfh,
2467                               struct nfs_fsinfo *info)
2468 {
2469         int error;
2470         struct nfs_fattr *fattr = info->fattr;
2471
2472         error = nfs4_server_capabilities(server, mntfh);
2473         if (error < 0) {
2474                 dprintk("nfs4_get_root: getcaps error = %d\n", -error);
2475                 return error;
2476         }
2477
2478         error = nfs4_proc_getattr(server, mntfh, fattr);
2479         if (error < 0) {
2480                 dprintk("nfs4_get_root: getattr error = %d\n", -error);
2481                 return error;
2482         }
2483
2484         if (fattr->valid & NFS_ATTR_FATTR_FSID &&
2485             !nfs_fsid_equal(&server->fsid, &fattr->fsid))
2486                 memcpy(&server->fsid, &fattr->fsid, sizeof(server->fsid));
2487
2488         return error;
2489 }
2490
2491 /*
2492  * Get locations and (maybe) other attributes of a referral.
2493  * Note that we'll actually follow the referral later when
2494  * we detect fsid mismatch in inode revalidation
2495  */
2496 static int nfs4_get_referral(struct rpc_clnt *client, struct inode *dir,
2497                              const struct qstr *name, struct nfs_fattr *fattr,
2498                              struct nfs_fh *fhandle)
2499 {
2500         int status = -ENOMEM;
2501         struct page *page = NULL;
2502         struct nfs4_fs_locations *locations = NULL;
2503
2504         page = alloc_page(GFP_KERNEL);
2505         if (page == NULL)
2506                 goto out;
2507         locations = kmalloc(sizeof(struct nfs4_fs_locations), GFP_KERNEL);
2508         if (locations == NULL)
2509                 goto out;
2510
2511         status = nfs4_proc_fs_locations(client, dir, name, locations, page);
2512         if (status != 0)
2513                 goto out;
2514         /* Make sure server returned a different fsid for the referral */
2515         if (nfs_fsid_equal(&NFS_SERVER(dir)->fsid, &locations->fattr.fsid)) {
2516                 dprintk("%s: server did not return a different fsid for"
2517                         " a referral at %s\n", __func__, name->name);
2518                 status = -EIO;
2519                 goto out;
2520         }
2521         /* Fixup attributes for the nfs_lookup() call to nfs_fhget() */
2522         nfs_fixup_referral_attributes(&locations->fattr);
2523
2524         /* replace the lookup nfs_fattr with the locations nfs_fattr */
2525         memcpy(fattr, &locations->fattr, sizeof(struct nfs_fattr));
2526         memset(fhandle, 0, sizeof(struct nfs_fh));
2527 out:
2528         if (page)
2529                 __free_page(page);
2530         kfree(locations);
2531         return status;
2532 }
2533
2534 static int _nfs4_proc_getattr(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fattr *fattr)
2535 {
2536         struct nfs4_getattr_arg args = {
2537                 .fh = fhandle,
2538                 .bitmask = server->attr_bitmask,
2539         };
2540         struct nfs4_getattr_res res = {
2541                 .fattr = fattr,
2542                 .server = server,
2543         };
2544         struct rpc_message msg = {
2545                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_GETATTR],
2546                 .rpc_argp = &args,
2547                 .rpc_resp = &res,
2548         };
2549         
2550         nfs_fattr_init(fattr);
2551         return nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
2552 }
2553
2554 static int nfs4_proc_getattr(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fattr *fattr)
2555 {
2556         struct nfs4_exception exception = { };
2557         int err;
2558         do {
2559                 err = nfs4_handle_exception(server,
2560                                 _nfs4_proc_getattr(server, fhandle, fattr),
2561                                 &exception);
2562         } while (exception.retry);
2563         return err;
2564 }
2565
2566 /* 
2567  * The file is not closed if it is opened due to the a request to change
2568  * the size of the file. The open call will not be needed once the
2569  * VFS layer lookup-intents are implemented.
2570  *
2571  * Close is called when the inode is destroyed.
2572  * If we haven't opened the file for O_WRONLY, we
2573  * need to in the size_change case to obtain a stateid.
2574  *
2575  * Got race?
2576  * Because OPEN is always done by name in nfsv4, it is
2577  * possible that we opened a different file by the same
2578  * name.  We can recognize this race condition, but we
2579  * can't do anything about it besides returning an error.
2580  *
2581  * This will be fixed with VFS changes (lookup-intent).
2582  */
2583 static int
2584 nfs4_proc_setattr(struct dentry *dentry, struct nfs_fattr *fattr,
2585                   struct iattr *sattr)
2586 {
2587         struct inode *inode = dentry->d_inode;
2588         struct rpc_cred *cred = NULL;
2589         struct nfs4_state *state = NULL;
2590         int status;
2591
2592         if (pnfs_ld_layoutret_on_setattr(inode))
2593                 pnfs_return_layout(inode);
2594
2595         nfs_fattr_init(fattr);
2596         
2597         /* Deal with open(O_TRUNC) */
2598         if (sattr->ia_valid & ATTR_OPEN)
2599                 sattr->ia_valid &= ~(ATTR_MTIME|ATTR_CTIME|ATTR_OPEN);
2600
2601         /* Optimization: if the end result is no change, don't RPC */
2602         if ((sattr->ia_valid & ~(ATTR_FILE)) == 0)
2603                 return 0;
2604
2605         /* Search for an existing open(O_WRITE) file */
2606         if (sattr->ia_valid & ATTR_FILE) {
2607                 struct nfs_open_context *ctx;
2608
2609                 ctx = nfs_file_open_context(sattr->ia_file);
2610                 if (ctx) {
2611                         cred = ctx->cred;
2612                         state = ctx->state;
2613                 }
2614         }
2615
2616         status = nfs4_do_setattr(inode, cred, fattr, sattr, state);
2617         if (status == 0)
2618                 nfs_setattr_update_inode(inode, sattr);
2619         return status;
2620 }
2621
2622 static int _nfs4_proc_lookup(struct rpc_clnt *clnt, struct inode *dir,
2623                 const struct qstr *name, struct nfs_fh *fhandle,
2624                 struct nfs_fattr *fattr)
2625 {
2626         struct nfs_server *server = NFS_SERVER(dir);
2627         int                    status;
2628         struct nfs4_lookup_arg args = {
2629                 .bitmask = server->attr_bitmask,
2630                 .dir_fh = NFS_FH(dir),
2631                 .name = name,
2632         };
2633         struct nfs4_lookup_res res = {
2634                 .server = server,
2635                 .fattr = fattr,
2636                 .fh = fhandle,
2637         };
2638         struct rpc_message msg = {
2639                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LOOKUP],
2640                 .rpc_argp = &args,
2641                 .rpc_resp = &res,
2642         };
2643
2644         nfs_fattr_init(fattr);
2645
2646         dprintk("NFS call  lookup %s\n", name->name);
2647         status = nfs4_call_sync(clnt, server, &msg, &args.seq_args, &res.seq_res, 0);
2648         dprintk("NFS reply lookup: %d\n", status);
2649         return status;
2650 }
2651
2652 static void nfs_fixup_secinfo_attributes(struct nfs_fattr *fattr)
2653 {
2654         fattr->valid |= NFS_ATTR_FATTR_TYPE | NFS_ATTR_FATTR_MODE |
2655                 NFS_ATTR_FATTR_NLINK | NFS_ATTR_FATTR_MOUNTPOINT;
2656         fattr->mode = S_IFDIR | S_IRUGO | S_IXUGO;
2657         fattr->nlink = 2;
2658 }
2659
2660 static int nfs4_proc_lookup_common(struct rpc_clnt **clnt, struct inode *dir,
2661                                    struct qstr *name, struct nfs_fh *fhandle,
2662                                    struct nfs_fattr *fattr)
2663 {
2664         struct nfs4_exception exception = { };
2665         struct rpc_clnt *client = *clnt;
2666         int err;
2667         do {
2668                 err = _nfs4_proc_lookup(client, dir, name, fhandle, fattr);
2669                 switch (err) {
2670                 case -NFS4ERR_BADNAME:
2671                         err = -ENOENT;
2672                         goto out;
2673                 case -NFS4ERR_MOVED:
2674                         err = nfs4_get_referral(client, dir, name, fattr, fhandle);
2675                         goto out;
2676                 case -NFS4ERR_WRONGSEC:
2677                         err = -EPERM;
2678                         if (client != *clnt)
2679                                 goto out;
2680
2681                         client = nfs4_create_sec_client(client, dir, name);
2682                         if (IS_ERR(client))
2683                                 return PTR_ERR(client);
2684
2685                         exception.retry = 1;
2686                         break;
2687                 default:
2688                         err = nfs4_handle_exception(NFS_SERVER(dir), err, &exception);
2689                 }
2690         } while (exception.retry);
2691
2692 out:
2693         if (err == 0)
2694                 *clnt = client;
2695         else if (client != *clnt)
2696                 rpc_shutdown_client(client);
2697
2698         return err;
2699 }
2700
/*
 * Look up @name in @dir using the directory's RPC client.
 *
 * If nfs4_proc_lookup_common() hands back a different client, that client
 * is shut down again and @fattr is rewritten by
 * nfs_fixup_secinfo_attributes().
 *
 * Returns the status of nfs4_proc_lookup_common().
 */
static int nfs4_proc_lookup(struct inode *dir, struct qstr *name,
			    struct nfs_fh *fhandle, struct nfs_fattr *fattr)
{
	struct rpc_clnt *used = NFS_CLIENT(dir);
	int rc;

	rc = nfs4_proc_lookup_common(&used, dir, name, fhandle, fattr);
	if (used == NFS_CLIENT(dir))
		return rc;

	rpc_shutdown_client(used);
	nfs_fixup_secinfo_attributes(fattr);
	return rc;
}
2714
/*
 * Look up @name in @dir and return an RPC client for the caller to use
 * with the result.
 *
 * The lookup itself runs on the directory's own client.  If
 * nfs4_proc_lookup_common() switched to a client it created, that client
 * is returned as is; otherwise a clone of the directory's client is
 * returned.  Cloning only after the lookup avoids two problems of cloning
 * up front: an ERR_PTR() result from rpc_clone_client() being used for the
 * lookup, and the clone being leaked whenever the lookup replaced it.
 *
 * On failure nfs4_proc_lookup_common() leaves the directory's client in
 * place and has already shut down any client it created, so nothing needs
 * to be released here.
 *
 * Returns the client, or an ERR_PTR() if the lookup or the clone fails.
 */
struct rpc_clnt *
nfs4_proc_lookup_mountpoint(struct inode *dir, struct qstr *name,
			    struct nfs_fh *fhandle, struct nfs_fattr *fattr)
{
	struct rpc_clnt *client = NFS_CLIENT(dir);
	int status;

	status = nfs4_proc_lookup_common(&client, dir, name, fhandle, fattr);
	if (status < 0)
		return ERR_PTR(status);

	if (client != NFS_CLIENT(dir))
		return client;

	/* May itself be an ERR_PTR(); passed on to the caller unchanged */
	return rpc_clone_client(client);
}
2729
2730 static int _nfs4_proc_access(struct inode *inode, struct nfs_access_entry *entry)
2731 {
2732         struct nfs_server *server = NFS_SERVER(inode);
2733         struct nfs4_accessargs args = {
2734                 .fh = NFS_FH(inode),
2735                 .bitmask = server->cache_consistency_bitmask,
2736         };
2737         struct nfs4_accessres res = {
2738                 .server = server,
2739         };
2740         struct rpc_message msg = {
2741                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_ACCESS],
2742                 .rpc_argp = &args,
2743                 .rpc_resp = &res,
2744                 .rpc_cred = entry->cred,
2745         };
2746         int mode = entry->mask;
2747         int status;
2748
2749         /*
2750          * Determine which access bits we want to ask for...
2751          */
2752         if (mode & MAY_READ)
2753                 args.access |= NFS4_ACCESS_READ;
2754         if (S_ISDIR(inode->i_mode)) {
2755                 if (mode & MAY_WRITE)
2756                         args.access |= NFS4_ACCESS_MODIFY | NFS4_ACCESS_EXTEND | NFS4_ACCESS_DELETE;
2757                 if (mode & MAY_EXEC)
2758                         args.access |= NFS4_ACCESS_LOOKUP;
2759         } else {
2760                 if (mode & MAY_WRITE)
2761                         args.access |= NFS4_ACCESS_MODIFY | NFS4_ACCESS_EXTEND;
2762                 if (mode & MAY_EXEC)
2763                         args.access |= NFS4_ACCESS_EXECUTE;
2764         }
2765
2766         res.fattr = nfs_alloc_fattr();
2767         if (res.fattr == NULL)
2768                 return -ENOMEM;
2769
2770         status = nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
2771         if (!status) {
2772                 entry->mask = 0;
2773                 if (res.access & NFS4_ACCESS_READ)
2774                         entry->mask |= MAY_READ;
2775                 if (res.access & (NFS4_ACCESS_MODIFY | NFS4_ACCESS_EXTEND | NFS4_ACCESS_DELETE))
2776                         entry->mask |= MAY_WRITE;
2777                 if (res.access & (NFS4_ACCESS_LOOKUP|NFS4_ACCESS_EXECUTE))
2778                         entry->mask |= MAY_EXEC;
2779                 nfs_refresh_inode(inode, res.fattr);
2780         }
2781         nfs_free_fattr(res.fattr);
2782         return status;
2783 }
2784
2785 static int nfs4_proc_access(struct inode *inode, struct nfs_access_entry *entry)
2786 {
2787         struct nfs4_exception exception = { };
2788         int err;
2789         do {
2790                 err = nfs4_handle_exception(NFS_SERVER(inode),
2791                                 _nfs4_proc_access(inode, entry),
2792                                 &exception);
2793         } while (exception.retry);
2794         return err;
2795 }
2796
2797 /*
2798  * TODO: For the time being, we don't try to get any attributes
2799  * along with any of the zero-copy operations READ, READDIR,
2800  * READLINK, WRITE.
2801  *
2802  * In the case of the first three, we want to put the GETATTR
2803  * after the read-type operation -- this is because it is hard
2804  * to predict the length of a GETATTR response in v4, and thus
2805  * align the READ data correctly.  This means that the GETATTR
2806  * may end up partially falling into the page cache, and we should
2807  * shift it into the 'tail' of the xdr_buf before processing.
2808  * To do this efficiently, we need to know the total length
2809  * of data received, which doesn't seem to be available outside
2810  * of the RPC layer.
2811  *
2812  * In the case of WRITE, we also want to put the GETATTR after
2813  * the operation -- in this case because we want to make sure
2814  * we get the post-operation mtime and size.
2815  *
2816  * Both of these changes to the XDR layer would in fact be quite
2817  * minor, but I decided to leave them for a subsequent patch.
2818  */
2819 static int _nfs4_proc_readlink(struct inode *inode, struct page *page,
2820                 unsigned int pgbase, unsigned int pglen)
2821 {
2822         struct nfs4_readlink args = {
2823                 .fh       = NFS_FH(inode),
2824                 .pgbase   = pgbase,
2825                 .pglen    = pglen,
2826                 .pages    = &page,
2827         };
2828         struct nfs4_readlink_res res;
2829         struct rpc_message msg = {
2830                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_READLINK],
2831                 .rpc_argp = &args,
2832                 .rpc_resp = &res,
2833         };
2834
2835         return nfs4_call_sync(NFS_SERVER(inode)->client, NFS_SERVER(inode), &msg, &args.seq_args, &res.seq_res, 0);
2836 }
2837
2838 static int nfs4_proc_readlink(struct inode *inode, struct page *page,
2839                 unsigned int pgbase, unsigned int pglen)
2840 {
2841         struct nfs4_exception exception = { };
2842         int err;
2843         do {
2844                 err = nfs4_handle_exception(NFS_SERVER(inode),
2845                                 _nfs4_proc_readlink(inode, page, pgbase, pglen),
2846                                 &exception);
2847         } while (exception.retry);
2848         return err;
2849 }
2850
2851 /*
2852  * This is just for mknod.  open(O_CREAT) will always do ->open_context().
2853  */
2854 static int
2855 nfs4_proc_create(struct inode *dir, struct dentry *dentry, struct iattr *sattr,
2856                  int flags)
2857 {
2858         struct nfs_open_context *ctx;
2859         struct nfs4_state *state;
2860         int status = 0;
2861
2862         ctx = alloc_nfs_open_context(dentry, FMODE_READ);
2863         if (IS_ERR(ctx))
2864                 return PTR_ERR(ctx);
2865
2866         sattr->ia_mode &= ~current_umask();
2867         state = nfs4_do_open(dir, dentry, ctx->mode,
2868                         flags, sattr, ctx->cred,
2869                         &ctx->mdsthreshold);
2870         d_drop(dentry);
2871         if (IS_ERR(state)) {
2872                 status = PTR_ERR(state);
2873                 goto out;
2874         }
2875         d_add(dentry, igrab(state->inode));
2876         nfs_set_verifier(dentry, nfs_save_change_attribute(dir));
2877         ctx->state = state;
2878 out:
2879         put_nfs_open_context(ctx);
2880         return status;
2881 }
2882
2883 static int _nfs4_proc_remove(struct inode *dir, struct qstr *name)
2884 {
2885         struct nfs_server *server = NFS_SERVER(dir);
2886         struct nfs_removeargs args = {
2887                 .fh = NFS_FH(dir),
2888                 .name = *name,
2889         };
2890         struct nfs_removeres res = {
2891                 .server = server,
2892         };
2893         struct rpc_message msg = {
2894                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_REMOVE],
2895                 .rpc_argp = &args,
2896                 .rpc_resp = &res,
2897         };
2898         int status;
2899
2900         status = nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 1);
2901         if (status == 0)
2902                 update_changeattr(dir, &res.cinfo);
2903         return status;
2904 }
2905
2906 static int nfs4_proc_remove(struct inode *dir, struct qstr *name)
2907 {
2908         struct nfs4_exception exception = { };
2909         int err;
2910         do {
2911                 err = nfs4_handle_exception(NFS_SERVER(dir),
2912                                 _nfs4_proc_remove(dir, name),
2913                                 &exception);
2914         } while (exception.retry);
2915         return err;
2916 }
2917
2918 static void nfs4_proc_unlink_setup(struct rpc_message *msg, struct inode *dir)
2919 {
2920         struct nfs_server *server = NFS_SERVER(dir);
2921         struct nfs_removeargs *args = msg->rpc_argp;
2922         struct nfs_removeres *res = msg->rpc_resp;
2923
2924         res->server = server;
2925         msg->rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_REMOVE];
2926         nfs41_init_sequence(&args->seq_args, &res->seq_res, 1);
2927 }
2928
2929 static void nfs4_proc_unlink_rpc_prepare(struct rpc_task *task, struct nfs_unlinkdata *data)
2930 {
2931         if (nfs4_setup_sequence(NFS_SERVER(data->dir),
2932                                 &data->args.seq_args,
2933                                 &data->res.seq_res,
2934                                 task))
2935                 return;
2936         rpc_call_start(task);
2937 }
2938
2939 static int nfs4_proc_unlink_done(struct rpc_task *task, struct inode *dir)
2940 {
2941         struct nfs_removeres *res = task->tk_msg.rpc_resp;
2942
2943         if (!nfs4_sequence_done(task, &res->seq_res))
2944                 return 0;
2945         if (nfs4_async_handle_error(task, res->server, NULL) == -EAGAIN)
2946                 return 0;
2947         update_changeattr(dir, &res->cinfo);
2948         return 1;
2949 }
2950
2951 static void nfs4_proc_rename_setup(struct rpc_message *msg, struct inode *dir)
2952 {
2953         struct nfs_server *server = NFS_SERVER(dir);
2954         struct nfs_renameargs *arg = msg->rpc_argp;
2955         struct nfs_renameres *res = msg->rpc_resp;
2956
2957         msg->rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_RENAME];
2958         res->server = server;
2959         nfs41_init_sequence(&arg->seq_args, &res->seq_res, 1);
2960 }
2961
2962 static void nfs4_proc_rename_rpc_prepare(struct rpc_task *task, struct nfs_renamedata *data)
2963 {
2964         if (nfs4_setup_sequence(NFS_SERVER(data->old_dir),
2965                                 &data->args.seq_args,
2966                                 &data->res.seq_res,
2967                                 task))
2968                 return;
2969         rpc_call_start(task);
2970 }
2971
2972 static int nfs4_proc_rename_done(struct rpc_task *task, struct inode *old_dir,
2973                                  struct inode *new_dir)
2974 {
2975         struct nfs_renameres *res = task->tk_msg.rpc_resp;
2976
2977         if (!nfs4_sequence_done(task, &res->seq_res))
2978                 return 0;
2979         if (nfs4_async_handle_error(task, res->server, NULL) == -EAGAIN)
2980                 return 0;
2981
2982         update_changeattr(old_dir, &res->old_cinfo);
2983         update_changeattr(new_dir, &res->new_cinfo);
2984         return 1;
2985 }
2986
2987 static int _nfs4_proc_rename(struct inode *old_dir, struct qstr *old_name,
2988                 struct inode *new_dir, struct qstr *new_name)
2989 {
2990         struct nfs_server *server = NFS_SERVER(old_dir);
2991         struct nfs_renameargs arg = {
2992                 .old_dir = NFS_FH(old_dir),
2993                 .new_dir = NFS_FH(new_dir),
2994                 .old_name = old_name,
2995                 .new_name = new_name,
2996         };
2997         struct nfs_renameres res = {
2998                 .server = server,
2999         };
3000         struct rpc_message msg = {
3001                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_RENAME],
3002                 .rpc_argp = &arg,
3003                 .rpc_resp = &res,
3004         };
3005         int status = -ENOMEM;
3006         
3007         status = nfs4_call_sync(server->client, server, &msg, &arg.seq_args, &res.seq_res, 1);
3008         if (!status) {
3009                 update_changeattr(old_dir, &res.old_cinfo);
3010                 update_changeattr(new_dir, &res.new_cinfo);
3011         }
3012         return status;
3013 }
3014
3015 static int nfs4_proc_rename(struct inode *old_dir, struct qstr *old_name,
3016                 struct inode *new_dir, struct qstr *new_name)
3017 {
3018         struct nfs4_exception exception = { };
3019         int err;
3020         do {
3021                 err = nfs4_handle_exception(NFS_SERVER(old_dir),
3022                                 _nfs4_proc_rename(old_dir, old_name,
3023                                         new_dir, new_name),
3024                                 &exception);
3025         } while (exception.retry);
3026         return err;
3027 }
3028
3029 static int _nfs4_proc_link(struct inode *inode, struct inode *dir, struct qstr *name)
3030 {
3031         struct nfs_server *server = NFS_SERVER(inode);
3032         struct nfs4_link_arg arg = {
3033                 .fh     = NFS_FH(inode),
3034                 .dir_fh = NFS_FH(dir),
3035                 .name   = name,
3036                 .bitmask = server->attr_bitmask,
3037         };
3038         struct nfs4_link_res res = {
3039                 .server = server,
3040         };
3041         struct rpc_message msg = {
3042                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LINK],
3043                 .rpc_argp = &arg,
3044                 .rpc_resp = &res,
3045         };
3046         int status = -ENOMEM;
3047
3048         res.fattr = nfs_alloc_fattr();
3049         if (res.fattr == NULL)
3050                 goto out;
3051
3052         status = nfs4_call_sync(server->client, server, &msg, &arg.seq_args, &res.seq_res, 1);
3053         if (!status) {
3054                 update_changeattr(dir, &res.cinfo);
3055                 nfs_post_op_update_inode(inode, res.fattr);
3056         }
3057 out:
3058         nfs_free_fattr(res.fattr);
3059         return status;
3060 }
3061
3062 static int nfs4_proc_link(struct inode *inode, struct inode *dir, struct qstr *name)
3063 {
3064         struct nfs4_exception exception = { };
3065         int err;
3066         do {
3067                 err = nfs4_handle_exception(NFS_SERVER(inode),
3068                                 _nfs4_proc_link(inode, dir, name),
3069                                 &exception);
3070         } while (exception.retry);
3071         return err;
3072 }
3073
/*
 * Everything needed for one CREATE-style request, bundled in a single
 * allocation (see nfs4_alloc_createdata() / nfs4_free_createdata()).
 */
struct nfs4_createdata {
	struct rpc_message msg;		/* rpc_argp/rpc_resp point at arg/res below */
	struct nfs4_create_arg arg;	/* request arguments */
	struct nfs4_create_res res;	/* reply; res.fh/res.fattr point at fh/fattr below */
	struct nfs_fh fh;		/* storage for the file handle in the reply */
	struct nfs_fattr fattr;		/* storage for the attributes in the reply */
};
3081
3082 static struct nfs4_createdata *nfs4_alloc_createdata(struct inode *dir,
3083                 struct qstr *name, struct iattr *sattr, u32 ftype)
3084 {
3085         struct nfs4_createdata *data;
3086
3087         data = kzalloc(sizeof(*data), GFP_KERNEL);
3088         if (data != NULL) {
3089                 struct nfs_server *server = NFS_SERVER(dir);
3090
3091                 data->msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_CREATE];
3092                 data->msg.rpc_argp = &data->arg;
3093                 data->msg.rpc_resp = &data->res;
3094                 data->arg.dir_fh = NFS_FH(dir);
3095                 data->arg.server = server;
3096                 data->arg.name = name;
3097                 data->arg.attrs = sattr;
3098                 data->arg.ftype = ftype;
3099                 data->arg.bitmask = server->attr_bitmask;
3100                 data->res.server = server;
3101                 data->res.fh = &data->fh;
3102                 data->res.fattr = &data->fattr;
3103                 nfs_fattr_init(data->res.fattr);
3104         }
3105         return data;
3106 }
3107
3108 static int nfs4_do_create(struct inode *dir, struct dentry *dentry, struct nfs4_createdata *data)
3109 {
3110         int status = nfs4_call_sync(NFS_SERVER(dir)->client, NFS_SERVER(dir), &data->msg,
3111                                     &data->arg.seq_args, &data->res.seq_res, 1);
3112         if (status == 0) {
3113                 update_changeattr(dir, &data->res.dir_cinfo);
3114                 status = nfs_instantiate(dentry, data->res.fh, data->res.fattr);
3115         }
3116         return status;
3117 }
3118
/* Release a request object with kfree(); pairs with nfs4_alloc_createdata(). */
static void nfs4_free_createdata(struct nfs4_createdata *data)
{
	kfree(data);
}
3123
3124 static int _nfs4_proc_symlink(struct inode *dir, struct dentry *dentry,
3125                 struct page *page, unsigned int len, struct iattr *sattr)
3126 {
3127         struct nfs4_createdata *data;
3128         int status = -ENAMETOOLONG;
3129
3130         if (len > NFS4_MAXPATHLEN)
3131                 goto out;
3132
3133         status = -ENOMEM;
3134         data = nfs4_alloc_createdata(dir, &dentry->d_name, sattr, NF4LNK);
3135         if (data == NULL)
3136                 goto out;
3137
3138         data->msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SYMLINK];
3139         data->arg.u.symlink.pages = &page;
3140         data->arg.u.symlink.len = len;
3141         
3142         status = nfs4_do_create(dir, dentry, data);
3143
3144         nfs4_free_createdata(data);
3145 out:
3146         return status;
3147 }
3148
3149 static int nfs4_proc_symlink(struct inode *dir, struct dentry *dentry,
3150                 struct page *page, unsigned int len, struct iattr *sattr)
3151 {
3152         struct nfs4_exception exception = { };
3153         int err;
3154         do {
3155                 err = nfs4_handle_exception(NFS_SERVER(dir),
3156                                 _nfs4_proc_symlink(dir, dentry, page,
3157                                                         len, sattr),
3158                                 &exception);
3159         } while (exception.retry);
3160         return err;
3161 }
3162
3163 static int _nfs4_proc_mkdir(struct inode *dir, struct dentry *dentry,
3164                 struct iattr *sattr)
3165 {
3166         struct nfs4_createdata *data;
3167         int status = -ENOMEM;
3168
3169         data = nfs4_alloc_createdata(dir, &dentry->d_name, sattr, NF4DIR);
3170         if (data == NULL)
3171                 goto out;
3172
3173         status = nfs4_do_create(dir, dentry, data);
3174
3175         nfs4_free_createdata(data);
3176 out:
3177         return status;
3178 }
3179
3180 static int nfs4_proc_mkdir(struct inode *dir, struct dentry *dentry,
3181                 struct iattr *sattr)
3182 {
3183         struct nfs4_exception exception = { };
3184         int err;
3185
3186         sattr->ia_mode &= ~current_umask();
3187         do {
3188                 err = nfs4_handle_exception(NFS_SERVER(dir),
3189                                 _nfs4_proc_mkdir(dir, dentry, sattr),
3190                                 &exception);
3191         } while (exception.retry);
3192         return err;
3193 }
3194
3195 static int _nfs4_proc_readdir(struct dentry *dentry, struct rpc_cred *cred,
3196                 u64 cookie, struct page **pages, unsigned int count, int plus)
3197 {
3198         struct inode            *dir = dentry->d_inode;
3199         struct nfs4_readdir_arg args = {
3200                 .fh = NFS_FH(dir),
3201                 .pages = pages,
3202                 .pgbase = 0,
3203                 .count = count,
3204                 .bitmask = NFS_SERVER(dentry->d_inode)->attr_bitmask,
3205                 .plus = plus,
3206         };
3207         struct nfs4_readdir_res res;
3208         struct rpc_message msg = {
3209                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_READDIR],
3210                 .rpc_argp = &args,
3211                 .rpc_resp = &res,
3212                 .rpc_cred = cred,
3213         };
3214         int                     status;
3215
3216         dprintk("%s: dentry = %s/%s, cookie = %Lu\n", __func__,
3217                         dentry->d_parent->d_name.name,
3218                         dentry->d_name.name,
3219                         (unsigned long long)cookie);
3220         nfs4_setup_readdir(cookie, NFS_COOKIEVERF(dir), dentry, &args);
3221         res.pgbase = args.pgbase;
3222         status = nfs4_call_sync(NFS_SERVER(dir)->client, NFS_SERVER(dir), &msg, &args.seq_args, &res.seq_res, 0);
3223         if (status >= 0) {
3224                 memcpy(NFS_COOKIEVERF(dir), res.verifier.data, NFS4_VERIFIER_SIZE);
3225                 status += args.pgbase;
3226         }
3227
3228         nfs_invalidate_atime(dir);
3229
3230         dprintk("%s: returns %d\n", __func__, status);
3231         return status;
3232 }
3233
3234 static int nfs4_proc_readdir(struct dentry *dentry, struct rpc_cred *cred,
3235                 u64 cookie, struct page **pages, unsigned int count, int plus)
3236 {
3237         struct nfs4_exception exception = { };
3238         int err;
3239         do {
3240                 err = nfs4_handle_exception(NFS_SERVER(dentry->d_inode),
3241                                 _nfs4_proc_readdir(dentry, cred, cookie,
3242                                         pages, count, plus),
3243                                 &exception);
3244         } while (exception.retry);
3245         return err;
3246 }
3247
3248 static int _nfs4_proc_mknod(struct inode *dir, struct dentry *dentry,
3249                 struct iattr *sattr, dev_t rdev)
3250 {
3251         struct nfs4_createdata *data;
3252         int mode = sattr->ia_mode;
3253         int status = -ENOMEM;
3254
3255         BUG_ON(!(sattr->ia_valid & ATTR_MODE));
3256         BUG_ON(!S_ISFIFO(mode) && !S_ISBLK(mode) && !S_ISCHR(mode) && !S_ISSOCK(mode));
3257
3258         data = nfs4_alloc_createdata(dir, &dentry->d_name, sattr, NF4SOCK);
3259         if (data == NULL)
3260                 goto out;
3261
3262         if (S_ISFIFO(mode))
3263                 data->arg.ftype = NF4FIFO;
3264         else if (S_ISBLK(mode)) {
3265                 data->arg.ftype = NF4BLK;
3266                 data->arg.u.device.specdata1 = MAJOR(rdev);
3267                 data->arg.u.device.specdata2 = MINOR(rdev);
3268         }
3269         else if (S_ISCHR(mode)) {
3270                 data->arg.ftype = NF4CHR;
3271                 data->arg.u.device.specdata1 = MAJOR(rdev);
3272                 data->arg.u.device.specdata2 = MINOR(rdev);
3273         }
3274         
3275         status = nfs4_do_create(dir, dentry, data);
3276
3277         nfs4_free_createdata(data);
3278 out:
3279         return status;
3280 }
3281
3282 static int nfs4_proc_mknod(struct inode *dir, struct dentry *dentry,
3283                 struct iattr *sattr, dev_t rdev)
3284 {
3285         struct nfs4_exception exception = { };
3286         int err;
3287
3288         sattr->ia_mode &= ~current_umask();
3289         do {
3290                 err = nfs4_handle_exception(NFS_SERVER(dir),
3291                                 _nfs4_proc_mknod(dir, dentry, sattr, rdev),
3292                                 &exception);
3293         } while (exception.retry);
3294         return err;
3295 }
3296
3297 static int _nfs4_proc_statfs(struct nfs_server *server, struct nfs_fh *fhandle,
3298                  struct nfs_fsstat *fsstat)
3299 {
3300         struct nfs4_statfs_arg args = {
3301                 .fh = fhandle,
3302                 .bitmask = server->attr_bitmask,
3303         };
3304         struct nfs4_statfs_res res = {
3305                 .fsstat = fsstat,
3306         };
3307         struct rpc_message msg = {
3308                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_STATFS],
3309                 .rpc_argp = &args,
3310                 .rpc_resp = &res,
3311         };
3312
3313         nfs_fattr_init(fsstat->fattr);
3314         return  nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
3315 }
3316
3317 static int nfs4_proc_statfs(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fsstat *fsstat)
3318 {
3319         struct nfs4_exception exception = { };
3320         int err;
3321         do {
3322                 err = nfs4_handle_exception(server,
3323                                 _nfs4_proc_statfs(server, fhandle, fsstat),
3324                                 &exception);
3325         } while (exception.retry);
3326         return err;
3327 }
3328
3329 static int _nfs4_do_fsinfo(struct nfs_server *server, struct nfs_fh *fhandle,
3330                 struct nfs_fsinfo *fsinfo)
3331 {
3332         struct nfs4_fsinfo_arg args = {
3333                 .fh = fhandle,
3334                 .bitmask = server->attr_bitmask,
3335         };
3336         struct nfs4_fsinfo_res res = {
3337                 .fsinfo = fsinfo,
3338         };
3339         struct rpc_message msg = {
3340                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_FSINFO],
3341                 .rpc_argp = &args,
3342                 .rpc_resp = &res,
3343         };
3344
3345         return nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
3346 }
3347
3348 static int nfs4_do_fsinfo(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fsinfo *fsinfo)
3349 {
3350         struct nfs4_exception exception = { };
3351         int err;
3352
3353         do {
3354                 err = nfs4_handle_exception(server,
3355                                 _nfs4_do_fsinfo(server, fhandle, fsinfo),
3356                                 &exception);
3357         } while (exception.retry);
3358         return err;
3359 }
3360
3361 static int nfs4_proc_fsinfo(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fsinfo *fsinfo)
3362 {
3363         int error;
3364
3365         nfs_fattr_init(fsinfo->fattr);
3366         error = nfs4_do_fsinfo(server, fhandle, fsinfo);
3367         if (error == 0)
3368                 set_pnfs_layoutdriver(server, fhandle, fsinfo->layouttype);
3369
3370         return error;
3371 }
3372
3373 static int _nfs4_proc_pathconf(struct nfs_server *server, struct nfs_fh *fhandle,
3374                 struct nfs_pathconf *pathconf)
3375 {
3376         struct nfs4_pathconf_arg args = {
3377                 .fh = fhandle,
3378                 .bitmask = server->attr_bitmask,
3379         };
3380         struct nfs4_pathconf_res res = {
3381                 .pathconf = pathconf,
3382         };
3383         struct rpc_message msg = {
3384                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_PATHCONF],
3385                 .rpc_argp = &args,
3386                 .rpc_resp = &res,
3387         };
3388
3389         /* None of the pathconf attributes are mandatory to implement */
3390         if ((args.bitmask[0] & nfs4_pathconf_bitmap[0]) == 0) {
3391                 memset(pathconf, 0, sizeof(*pathconf));
3392                 return 0;
3393         }
3394
3395         nfs_fattr_init(pathconf->fattr);
3396         return nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
3397 }
3398
3399 static int nfs4_proc_pathconf(struct nfs_server *server, struct nfs_fh *fhandle,
3400                 struct nfs_pathconf *pathconf)
3401 {
3402         struct nfs4_exception exception = { };
3403         int err;
3404
3405         do {
3406                 err = nfs4_handle_exception(server,
3407                                 _nfs4_proc_pathconf(server, fhandle, pathconf),
3408                                 &exception);
3409         } while (exception.retry);
3410         return err;
3411 }
3412
3413 void __nfs4_read_done_cb(struct nfs_read_data *data)
3414 {
3415         nfs_invalidate_atime(data->header->inode);
3416 }
3417
3418 static int nfs4_read_done_cb(struct rpc_task *task, struct nfs_read_data *data)
3419 {
3420         struct nfs_server *server = NFS_SERVER(data->header->inode);
3421
3422         if (nfs4_async_handle_error(task, server, data->args.context->state) == -EAGAIN) {
3423                 rpc_restart_call_prepare(task);
3424                 return -EAGAIN;
3425         }
3426
3427         __nfs4_read_done_cb(data);
3428         if (task->tk_status > 0)
3429                 renew_lease(server, data->timestamp);
3430         return 0;
3431 }
3432
3433 static int nfs4_read_done(struct rpc_task *task, struct nfs_read_data *data)
3434 {
3435
3436         dprintk("--> %s\n", __func__);
3437
3438         if (!nfs4_sequence_done(task, &data->res.seq_res))
3439                 return -EAGAIN;
3440
3441         return data->read_done_cb ? data->read_done_cb(task, data) :
3442                                     nfs4_read_done_cb(task, data);
3443 }
3444
3445 static void nfs4_proc_read_setup(struct nfs_read_data *data, struct rpc_message *msg)
3446 {
3447         data->timestamp   = jiffies;
3448         data->read_done_cb = nfs4_read_done_cb;
3449         msg->rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_READ];
3450         nfs41_init_sequence(&data->args.seq_args, &data->res.seq_res, 0);
3451 }
3452
3453 static void nfs4_proc_read_rpc_prepare(struct rpc_task *task, struct nfs_read_data *data)
3454 {
3455         if (nfs4_setup_sequence(NFS_SERVER(data->header->inode),
3456                                 &data->args.seq_args,
3457                                 &data->res.seq_res,
3458                                 task))
3459                 return;
3460         rpc_call_start(task);
3461 }
3462
3463 static int nfs4_write_done_cb(struct rpc_task *task, struct nfs_write_data *data)
3464 {
3465         struct inode *inode = data->header->inode;
3466         
3467         if (nfs4_async_handle_error(task, NFS_SERVER(inode), data->args.context->state) == -EAGAIN) {
3468                 rpc_restart_call_prepare(task);
3469                 return -EAGAIN;
3470         }
3471         if (task->tk_status >= 0) {
3472                 renew_lease(NFS_SERVER(inode), data->timestamp);
3473                 nfs_post_op_update_inode_force_wcc(inode, &data->fattr);
3474         }
3475         return 0;
3476 }
3477
3478 static int nfs4_write_done(struct rpc_task *task, struct nfs_write_data *data)
3479 {
3480         if (!nfs4_sequence_done(task, &data->res.seq_res))
3481                 return -EAGAIN;
3482         return data->write_done_cb ? data->write_done_cb(task, data) :
3483                 nfs4_write_done_cb(task, data);
3484 }
3485
3486 static
3487 bool nfs4_write_need_cache_consistency_data(const struct nfs_write_data *data)
3488 {
3489         const struct nfs_pgio_header *hdr = data->header;
3490
3491         /* Don't request attributes for pNFS or O_DIRECT writes */
3492         if (data->ds_clp != NULL || hdr->dreq != NULL)
3493                 return false;
3494         /* Otherwise, request attributes if and only if we don't hold
3495          * a delegation
3496          */
3497         return nfs4_have_delegation(hdr->inode, FMODE_READ) == 0;
3498 }
3499
3500 static void nfs4_proc_write_setup(struct nfs_write_data *data, struct rpc_message *msg)
3501 {
3502         struct nfs_server *server = NFS_SERVER(data->header->inode);
3503
3504         if (!nfs4_write_need_cache_consistency_data(data)) {
3505                 data->args.bitmask = NULL;
3506                 data->res.fattr = NULL;
3507         } else
3508                 data->args.bitmask = server->cache_consistency_bitmask;
3509
3510         if (!data->write_done_cb)
3511                 data->write_done_cb = nfs4_write_done_cb;
3512         data->res.server = server;
3513         data->timestamp   = jiffies;
3514
3515         msg->rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_WRITE];
3516         nfs41_init_sequence(&data->args.seq_args, &data->res.seq_res, 1);
3517 }
3518
3519 static void nfs4_proc_write_rpc_prepare(struct rpc_task *task, struct nfs_write_data *data)
3520 {
3521         if (nfs4_setup_sequence(NFS_SERVER(data->header->inode),
3522                                 &data->args.seq_args,
3523                                 &data->res.seq_res,
3524                                 task))
3525                 return;
3526         rpc_call_start(task);
3527 }
3528
3529 static void nfs4_proc_commit_rpc_prepare(struct rpc_task *task, struct nfs_commit_data *data)
3530 {
3531         if (nfs4_setup_sequence(NFS_SERVER(data->inode),
3532                                 &data->args.seq_args,
3533                                 &data->res.seq_res,
3534                                 task))
3535                 return;
3536         rpc_call_start(task);
3537 }
3538
3539 static int nfs4_commit_done_cb(struct rpc_task *task, struct nfs_commit_data *data)
3540 {
3541         struct inode *inode = data->inode;
3542
3543         if (nfs4_async_handle_error(task, NFS_SERVER(inode), NULL) == -EAGAIN) {
3544                 rpc_restart_call_prepare(task);
3545                 return -EAGAIN;
3546         }
3547         return 0;
3548 }
3549
3550 static int nfs4_commit_done(struct rpc_task *task, struct nfs_commit_data *data)
3551 {
3552         if (!nfs4_sequence_done(task, &data->res.seq_res))
3553                 return -EAGAIN;
3554         return data->commit_done_cb(task, data);
3555 }
3556
3557 static void nfs4_proc_commit_setup(struct nfs_commit_data *data, struct rpc_message *msg)
3558 {
3559         struct nfs_server *server = NFS_SERVER(data->inode);
3560
3561         if (data->commit_done_cb == NULL)
3562                 data->commit_done_cb = nfs4_commit_done_cb;
3563         data->res.server = server;
3564         msg->rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_COMMIT];
3565         nfs41_init_sequence(&data->args.seq_args, &data->res.seq_res, 1);
3566 }
3567
/* Per-call state carried by an asynchronous RENEW. */
struct nfs4_renewdata {
	/* Client being renewed; the async path holds a reference on it. */
	struct nfs_client *client;
	/* jiffies value sampled when the RENEW was queued. */
	unsigned long timestamp;
};
3572
3573 /*
3574  * nfs4_proc_async_renew(): This is not one of the nfs_rpc_ops; it is a special
3575  * standalone procedure for queueing an asynchronous RENEW.
3576  */
3577 static void nfs4_renew_release(void *calldata)
3578 {
3579         struct nfs4_renewdata *data = calldata;
3580         struct nfs_client *clp = data->client;
3581
3582         if (atomic_read(&clp->cl_count) > 1)
3583                 nfs4_schedule_state_renewal(clp);
3584         nfs_put_client(clp);
3585         kfree(data);
3586 }
3587
3588 static void nfs4_renew_done(struct rpc_task *task, void *calldata)
3589 {
3590         struct nfs4_renewdata *data = calldata;
3591         struct nfs_client *clp = data->client;
3592         unsigned long timestamp = data->timestamp;
3593
3594         if (task->tk_status < 0) {
3595                 /* Unless we're shutting down, schedule state recovery! */
3596                 if (test_bit(NFS_CS_RENEWD, &clp->cl_res_state) == 0)
3597                         return;
3598                 if (task->tk_status != NFS4ERR_CB_PATH_DOWN) {
3599                         nfs4_schedule_lease_recovery(clp);
3600                         return;
3601                 }
3602                 nfs4_schedule_path_down_recovery(clp);
3603         }
3604         do_renew_lease(clp, timestamp);
3605 }
3606
3607 static const struct rpc_call_ops nfs4_renew_ops = {
3608         .rpc_call_done = nfs4_renew_done,
3609         .rpc_release = nfs4_renew_release,
3610 };
3611
3612 static int nfs4_proc_async_renew(struct nfs_client *clp, struct rpc_cred *cred, unsigned renew_flags)
3613 {
3614         struct rpc_message msg = {
3615                 .rpc_proc       = &nfs4_procedures[NFSPROC4_CLNT_RENEW],
3616                 .rpc_argp       = clp,
3617                 .rpc_cred       = cred,
3618         };
3619         struct nfs4_renewdata *data;
3620
3621         if (renew_flags == 0)
3622                 return 0;
3623         if (!atomic_inc_not_zero(&clp->cl_count))
3624                 return -EIO;
3625         data = kmalloc(sizeof(*data), GFP_NOFS);
3626         if (data == NULL)
3627                 return -ENOMEM;
3628         data->client = clp;
3629         data->timestamp = jiffies;
3630         return rpc_call_async(clp->cl_rpcclient, &msg, RPC_TASK_SOFT,
3631                         &nfs4_renew_ops, data);
3632 }
3633
3634 static int nfs4_proc_renew(struct nfs_client *clp, struct rpc_cred *cred)
3635 {
3636         struct rpc_message msg = {
3637                 .rpc_proc       = &nfs4_procedures[NFSPROC4_CLNT_RENEW],
3638                 .rpc_argp       = clp,
3639                 .rpc_cred       = cred,
3640         };
3641         unsigned long now = jiffies;
3642         int status;
3643
3644         status = rpc_call_sync(clp->cl_rpcclient, &msg, 0);
3645         if (status < 0)
3646                 return status;
3647         do_renew_lease(clp, now);
3648         return 0;
3649 }
3650
3651 static inline int nfs4_server_supports_acls(struct nfs_server *server)
3652 {
3653         return (server->caps & NFS_CAP_ACLS)
3654                 && (server->acl_bitmask & ACL4_SUPPORT_ALLOW_ACL)
3655                 && (server->acl_bitmask & ACL4_SUPPORT_DENY_ACL);
3656 }
3657
/* Assuming that XATTR_SIZE_MAX is a multiple of PAGE_CACHE_SIZE, and that
 * it's OK to put sizeof(void *) * (XATTR_SIZE_MAX/PAGE_CACHE_SIZE) bytes on
 * the stack.
 */
3662 #define NFS4ACL_MAXPAGES (XATTR_SIZE_MAX >> PAGE_CACHE_SHIFT)
3663
3664 static int buf_to_pages_noslab(const void *buf, size_t buflen,
3665                 struct page **pages, unsigned int *pgbase)
3666 {
3667         struct page *newpage, **spages;
3668         int rc = 0;
3669         size_t len;
3670         spages = pages;
3671
3672         do {
3673                 len = min_t(size_t, PAGE_CACHE_SIZE, buflen);
3674                 newpage = alloc_page(GFP_KERNEL);
3675
3676                 if (newpage == NULL)
3677                         goto unwind;
3678                 memcpy(page_address(newpage), buf, len);
3679                 buf += len;
3680                 buflen -= len;
3681                 *pages++ = newpage;
3682                 rc++;
3683         } while (buflen != 0);
3684
3685         return rc;
3686
3687 unwind:
3688         for(; rc > 0; rc--)
3689                 __free_page(spages[rc-1]);
3690         return -ENOMEM;
3691 }
3692
/*
 * Per-inode cached ACL.
 *
 * @cached: non-zero when @data holds the ACL bytes; zero when only the
 *          length is remembered.
 * @len:    ACL length in bytes.
 * @data:   ACL bytes, allocated together with the header.  Declared as
 *          a C99 flexible array member rather than a GNU zero-length
 *          array; the structure layout and size are unchanged.
 */
struct nfs4_cached_acl {
	int cached;
	size_t len;
	char data[];
};
3698
3699 static void nfs4_set_cached_acl(struct inode *inode, struct nfs4_cached_acl *acl)
3700 {
3701         struct nfs_inode *nfsi = NFS_I(inode);
3702
3703         spin_lock(&inode->i_lock);
3704         kfree(nfsi->nfs4_acl);
3705         nfsi->nfs4_acl = acl;
3706         spin_unlock(&inode->i_lock);
3707 }
3708
3709 static void nfs4_zap_acl_attr(struct inode *inode)
3710 {
3711         nfs4_set_cached_acl(inode, NULL);
3712 }
3713
3714 static inline ssize_t nfs4_read_cached_acl(struct inode *inode, char *buf, size_t buflen)
3715 {
3716         struct nfs_inode *nfsi = NFS_I(inode);
3717         struct nfs4_cached_acl *acl;
3718         int ret = -ENOENT;
3719
3720         spin_lock(&inode->i_lock);
3721         acl = nfsi->nfs4_acl;
3722         if (acl == NULL)
3723                 goto out;
3724         if (buf == NULL) /* user is just asking for length */
3725                 goto out_len;
3726         if (acl->cached == 0)
3727                 goto out;
3728         ret = -ERANGE; /* see getxattr(2) man page */
3729         if (acl->len > buflen)
3730                 goto out;
3731         memcpy(buf, acl->data, acl->len);
3732 out_len:
3733         ret = acl->len;
3734 out:
3735         spin_unlock(&inode->i_lock);
3736         return ret;
3737 }
3738
3739 static void nfs4_write_cached_acl(struct inode *inode, struct page **pages, size_t pgbase, size_t acl_len)
3740 {
3741         struct nfs4_cached_acl *acl;
3742
3743         if (pages && acl_len <= PAGE_SIZE) {
3744                 acl = kmalloc(sizeof(*acl) + acl_len, GFP_KERNEL);
3745                 if (acl == NULL)
3746                         goto out;
3747                 acl->cached = 1;
3748                 _copy_from_pages(acl->data, pages, pgbase, acl_len);
3749         } else {
3750                 acl = kmalloc(sizeof(*acl), GFP_KERNEL);
3751                 if (acl == NULL)
3752                         goto out;
3753                 acl->cached = 0;
3754         }
3755         acl->len = acl_len;
3756 out:
3757         nfs4_set_cached_acl(inode, acl);
3758 }
3759
3760 /*
3761  * The getxattr API returns the required buffer length when called with a
3762  * NULL buf. The NFSv4 acl tool then calls getxattr again after allocating
3763  * the required buf.  On a NULL buf, we send a page of data to the server
3764  * guessing that the ACL request can be serviced by a page. If so, we cache
3765  * up to the page of ACL data, and the 2nd call to getxattr is serviced by
3766  * the cache. If not so, we throw away the page, and cache the required
3767  * length. The next getxattr call will then produce another round trip to
3768  * the server, this time with the input buf of the required size.
3769  */
3770 static ssize_t __nfs4_get_acl_uncached(struct inode *inode, void *buf, size_t buflen)
3771 {
3772         struct page *pages[NFS4ACL_MAXPAGES] = {NULL, };
3773         struct nfs_getaclargs args = {
3774                 .fh = NFS_FH(inode),
3775                 .acl_pages = pages,
3776                 .acl_len = buflen,
3777         };
3778         struct nfs_getaclres res = {
3779                 .acl_len = buflen,
3780         };
3781         struct rpc_message msg = {
3782                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_GETACL],
3783                 .rpc_argp = &args,
3784                 .rpc_resp = &res,
3785         };
3786         int ret = -ENOMEM, npages, i;
3787         size_t acl_len = 0;
3788
3789         npages = (buflen + PAGE_SIZE - 1) >> PAGE_SHIFT;
3790         /* As long as we're doing a round trip to the server anyway,
3791          * let's be prepared for a page of acl data. */
3792         if (npages == 0)
3793                 npages = 1;
3794
3795         /* Add an extra page to handle the bitmap returned */
3796         npages++;
3797
3798         for (i = 0; i < npages; i++) {
3799                 pages[i] = alloc_page(GFP_KERNEL);
3800                 if (!pages[i])
3801                         goto out_free;
3802         }
3803
3804         /* for decoding across pages */
3805         res.acl_scratch = alloc_page(GFP_KERNEL);
3806         if (!res.acl_scratch)
3807                 goto out_free;
3808
3809         args.acl_len = npages * PAGE_SIZE;
3810         args.acl_pgbase = 0;
3811
3812         /* Let decode_getfacl know not to fail if the ACL data is larger than
3813          * the page we send as a guess */
3814         if (buf == NULL)
3815                 res.acl_flags |= NFS4_ACL_LEN_REQUEST;
3816
3817         dprintk("%s  buf %p buflen %zu npages %d args.acl_len %zu\n",
3818                 __func__, buf, buflen, npages, args.acl_len);
3819         ret = nfs4_call_sync(NFS_SERVER(inode)->client, NFS_SERVER(inode),
3820                              &msg, &args.seq_args, &res.seq_res, 0);
3821         if (ret)
3822                 goto out_free;
3823
3824         acl_len = res.acl_len - res.acl_data_offset;
3825         if (acl_len > args.acl_len)
3826                 nfs4_write_cached_acl(inode, NULL, 0, acl_len);
3827         else
3828                 nfs4_write_cached_acl(inode, pages, res.acl_data_offset,
3829                                       acl_len);
3830         if (buf) {
3831                 ret = -ERANGE;
3832                 if (acl_len > buflen)
3833                         goto out_free;
3834                 _copy_from_pages(buf, pages, res.acl_data_offset,
3835                                 acl_len);
3836         }
3837         ret = acl_len;
3838 out_free:
3839         for (i = 0; i < npages; i++)
3840                 if (pages[i])
3841                         __free_page(pages[i]);
3842         if (res.acl_scratch)
3843                 __free_page(res.acl_scratch);
3844         return ret;
3845 }
3846
3847 static ssize_t nfs4_get_acl_uncached(struct inode *inode, void *buf, size_t buflen)
3848 {
3849         struct nfs4_exception exception = { };
3850         ssize_t ret;
3851         do {
3852                 ret = __nfs4_get_acl_uncached(inode, buf, buflen);
3853                 if (ret >= 0)
3854                         break;
3855                 ret = nfs4_handle_exception(NFS_SERVER(inode), ret, &exception);
3856         } while (exception.retry);
3857         return ret;
3858 }
3859
3860 static ssize_t nfs4_proc_get_acl(struct inode *inode, void *buf, size_t buflen)
3861 {
3862         struct nfs_server *server = NFS_SERVER(inode);
3863         int ret;
3864
3865         if (!nfs4_server_supports_acls(server))
3866                 return -EOPNOTSUPP;
3867         ret = nfs_revalidate_inode(server, inode);
3868         if (ret < 0)
3869                 return ret;
3870         if (NFS_I(inode)->cache_validity & NFS_INO_INVALID_ACL)
3871                 nfs_zap_acl_cache(inode);
3872         ret = nfs4_read_cached_acl(inode, buf, buflen);
3873         if (ret != -ENOENT)
3874                 /* -ENOENT is returned if there is no ACL or if there is an ACL
3875                  * but no cached acl data, just the acl length */
3876                 return ret;
3877         return nfs4_get_acl_uncached(inode, buf, buflen);
3878 }
3879
3880 static int __nfs4_proc_set_acl(struct inode *inode, const void *buf, size_t buflen)
3881 {
3882         struct nfs_server *server = NFS_SERVER(inode);
3883         struct page *pages[NFS4ACL_MAXPAGES];
3884         struct nfs_setaclargs arg = {
3885                 .fh             = NFS_FH(inode),
3886                 .acl_pages      = pages,
3887                 .acl_len        = buflen,
3888         };
3889         struct nfs_setaclres res;
3890         struct rpc_message msg = {
3891                 .rpc_proc       = &nfs4_procedures[NFSPROC4_CLNT_SETACL],
3892                 .rpc_argp       = &arg,
3893                 .rpc_resp       = &res,
3894         };
3895         int ret, i;
3896
3897         if (!nfs4_server_supports_acls(server))
3898                 return -EOPNOTSUPP;
3899         i = buf_to_pages_noslab(buf, buflen, arg.acl_pages, &arg.acl_pgbase);
3900         if (i < 0)
3901                 return i;
3902         nfs4_inode_return_delegation(inode);
3903         ret = nfs4_call_sync(server->client, server, &msg, &arg.seq_args, &res.seq_res, 1);
3904
3905         /*
3906          * Free each page after tx, so the only ref left is
3907          * held by the network stack
3908          */
3909         for (; i > 0; i--)
3910                 put_page(pages[i-1]);
3911
3912         /*
3913          * Acl update can result in inode attribute update.
3914          * so mark the attribute cache invalid.
3915          */
3916         spin_lock(&inode->i_lock);
3917         NFS_I(inode)->cache_validity |= NFS_INO_INVALID_ATTR;
3918         spin_unlock(&inode->i_lock);
3919         nfs_access_zap_cache(inode);
3920         nfs_zap_acl_cache(inode);
3921         return ret;
3922 }
3923
3924 static int nfs4_proc_set_acl(struct inode *inode, const void *buf, size_t buflen)
3925 {
3926         struct nfs4_exception exception = { };
3927         int err;
3928         do {
3929                 err = nfs4_handle_exception(NFS_SERVER(inode),
3930                                 __nfs4_proc_set_acl(inode, buf, buflen),
3931                                 &exception);
3932         } while (exception.retry);
3933         return err;
3934 }
3935
3936 static int
3937 nfs4_async_handle_error(struct rpc_task *task, const struct nfs_server *server, struct nfs4_state *state)
3938 {
3939         struct nfs_client *clp = server->nfs_client;
3940
3941         if (task->tk_status >= 0)
3942                 return 0;
3943         switch(task->tk_status) {
3944                 case -NFS4ERR_DELEG_REVOKED:
3945                 case -NFS4ERR_ADMIN_REVOKED:
3946                 case -NFS4ERR_BAD_STATEID:
3947                         if (state == NULL)
3948                                 break;
3949                         nfs_remove_bad_delegation(state->inode);
3950                 case -NFS4ERR_OPENMODE:
3951                         if (state == NULL)
3952                                 break;
3953                         nfs4_schedule_stateid_recovery(server, state);
3954                         goto wait_on_recovery;
3955                 case -NFS4ERR_EXPIRED:
3956                         if (state != NULL)
3957                                 nfs4_schedule_stateid_recovery(server, state);
3958                 case -NFS4ERR_STALE_STATEID:
3959                 case -NFS4ERR_STALE_CLIENTID:
3960                         nfs4_schedule_lease_recovery(clp);
3961                         goto wait_on_recovery;
3962 #if defined(CONFIG_NFS_V4_1)
3963                 case -NFS4ERR_BADSESSION:
3964                 case -NFS4ERR_BADSLOT:
3965                 case -NFS4ERR_BAD_HIGH_SLOT:
3966                 case -NFS4ERR_DEADSESSION:
3967                 case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION:
3968                 case -NFS4ERR_SEQ_FALSE_RETRY:
3969                 case -NFS4ERR_SEQ_MISORDERED:
3970                         dprintk("%s ERROR %d, Reset session\n", __func__,
3971                                 task->tk_status);
3972                         nfs4_schedule_session_recovery(clp->cl_session, task->tk_status);
3973                         task->tk_status = 0;
3974                         return -EAGAIN;
3975 #endif /* CONFIG_NFS_V4_1 */
3976                 case -NFS4ERR_DELAY:
3977                         nfs_inc_server_stats(server, NFSIOS_DELAY);
3978                 case -NFS4ERR_GRACE:
3979                 case -EKEYEXPIRED:
3980                         rpc_delay(task, NFS4_POLL_RETRY_MAX);
3981                         task->tk_status = 0;
3982                         return -EAGAIN;
3983                 case -NFS4ERR_RETRY_UNCACHED_REP:
3984                 case -NFS4ERR_OLD_STATEID:
3985                         task->tk_status = 0;
3986                         return -EAGAIN;
3987         }
3988         task->tk_status = nfs4_map_errors(task->tk_status);
3989         return 0;
3990 wait_on_recovery:
3991         rpc_sleep_on(&clp->cl_rpcwaitq, task, NULL);
3992         if (test_bit(NFS4CLNT_MANAGER_RUNNING, &clp->cl_state) == 0)
3993                 rpc_wake_up_queued_task(&clp->cl_rpcwaitq, task);
3994         task->tk_status = 0;
3995         return -EAGAIN;
3996 }
3997
3998 static void nfs4_init_boot_verifier(const struct nfs_client *clp,
3999                                     nfs4_verifier *bootverf)
4000 {
4001         __be32 verf[2];
4002
4003         if (test_bit(NFS4CLNT_PURGE_STATE, &clp->cl_state)) {
4004                 /* An impossible timestamp guarantees this value
4005                  * will never match a generated boot time. */
4006                 verf[0] = 0;
4007                 verf[1] = (__be32)(NSEC_PER_SEC + 1);
4008         } else {
4009                 struct nfs_net *nn = net_generic(clp->cl_net, nfs_net_id);
4010                 verf[0] = (__be32)nn->boot_time.tv_sec;
4011                 verf[1] = (__be32)nn->boot_time.tv_nsec;
4012         }
4013         memcpy(bootverf->data, verf, sizeof(bootverf->data));
4014 }
4015
4016 int nfs4_proc_setclientid(struct nfs_client *clp, u32 program,
4017                 unsigned short port, struct rpc_cred *cred,
4018                 struct nfs4_setclientid_res *res)
4019 {
4020         nfs4_verifier sc_verifier;
4021         struct nfs4_setclientid setclientid = {
4022                 .sc_verifier = &sc_verifier,
4023                 .sc_prog = program,
4024                 .sc_cb_ident = clp->cl_cb_ident,
4025         };
4026         struct rpc_message msg = {
4027                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SETCLIENTID],
4028                 .rpc_argp = &setclientid,
4029                 .rpc_resp = res,
4030                 .rpc_cred = cred,
4031         };
4032
4033         /* nfs_client_id4 */
4034         nfs4_init_boot_verifier(clp, &sc_verifier);
4035         rcu_read_lock();
4036         setclientid.sc_name_len = scnprintf(setclientid.sc_name,
4037                         sizeof(setclientid.sc_name), "%s/%s %s",
4038                         clp->cl_ipaddr,
4039                         rpc_peeraddr2str(clp->cl_rpcclient,
4040                                                 RPC_DISPLAY_ADDR),
4041                         rpc_peeraddr2str(clp->cl_rpcclient,
4042                                                 RPC_DISPLAY_PROTO));
4043         /* cb_client4 */
4044         setclientid.sc_netid_len = scnprintf(setclientid.sc_netid,
4045                                 sizeof(setclientid.sc_netid),
4046                                 rpc_peeraddr2str(clp->cl_rpcclient,
4047                                                         RPC_DISPLAY_NETID));
4048         rcu_read_unlock();
4049         setclientid.sc_uaddr_len = scnprintf(setclientid.sc_uaddr,
4050                                 sizeof(setclientid.sc_uaddr), "%s.%u.%u",
4051                                 clp->cl_ipaddr, port >> 8, port & 255);
4052
4053         return rpc_call_sync(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
4054 }
4055
4056 int nfs4_proc_setclientid_confirm(struct nfs_client *clp,
4057                 struct nfs4_setclientid_res *arg,
4058                 struct rpc_cred *cred)
4059 {
4060         struct nfs_fsinfo fsinfo;
4061         struct rpc_message msg = {
4062                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SETCLIENTID_CONFIRM],
4063                 .rpc_argp = arg,
4064                 .rpc_resp = &fsinfo,
4065                 .rpc_cred = cred,
4066         };
4067         unsigned long now;
4068         int status;
4069
4070         now = jiffies;
4071         status = rpc_call_sync(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
4072         if (status == 0) {
4073                 spin_lock(&clp->cl_lock);
4074                 clp->cl_lease_time = fsinfo.lease_time * HZ;
4075                 clp->cl_last_renewal = now;
4076                 spin_unlock(&clp->cl_lock);
4077         }
4078         return status;
4079 }
4080
4081 struct nfs4_delegreturndata {
4082         struct nfs4_delegreturnargs args;
4083         struct nfs4_delegreturnres res;
4084         struct nfs_fh fh;
4085         nfs4_stateid stateid;
4086         unsigned long timestamp;
4087         struct nfs_fattr fattr;
4088         int rpc_status;
4089 };
4090
4091 static void nfs4_delegreturn_done(struct rpc_task *task, void *calldata)
4092 {
4093         struct nfs4_delegreturndata *data = calldata;
4094
4095         if (!nfs4_sequence_done(task, &data->res.seq_res))
4096                 return;
4097
4098         switch (task->tk_status) {
4099         case -NFS4ERR_STALE_STATEID:
4100         case -NFS4ERR_EXPIRED:
4101         case 0:
4102                 renew_lease(data->res.server, data->timestamp);
4103                 break;
4104         default:
4105                 if (nfs4_async_handle_error(task, data->res.server, NULL) ==
4106                                 -EAGAIN) {
4107                         rpc_restart_call_prepare(task);
4108                         return;
4109                 }
4110         }
4111         data->rpc_status = task->tk_status;
4112 }
4113
/* rpc_release callback for DELEGRETURN: free the per-call data. */
static void nfs4_delegreturn_release(void *calldata)
{
	struct nfs4_delegreturndata *data = calldata;

	kfree(data);
}
4118
#if defined(CONFIG_NFS_V4_1)
/*
 * rpc_call_prepare callback for DELEGRETURN: set up the sequence
 * arguments and start the call only if that setup returned zero.
 */
static void nfs4_delegreturn_prepare(struct rpc_task *task, void *data)
{
	struct nfs4_delegreturndata *d_data = data;

	if (nfs4_setup_sequence(d_data->res.server,
				&d_data->args.seq_args,
				&d_data->res.seq_res, task) == 0)
		rpc_call_start(task);
}
#endif /* CONFIG_NFS_V4_1 */
4133
4134 static const struct rpc_call_ops nfs4_delegreturn_ops = {
4135 #if defined(CONFIG_NFS_V4_1)
4136         .rpc_call_prepare = nfs4_delegreturn_prepare,
4137 #endif /* CONFIG_NFS_V4_1 */
4138         .rpc_call_done = nfs4_delegreturn_done,
4139         .rpc_release = nfs4_delegreturn_release,
4140 };
4141
4142 static int _nfs4_proc_delegreturn(struct inode *inode, struct rpc_cred *cred, const nfs4_stateid *stateid, int issync)
4143 {
4144         struct nfs4_delegreturndata *data;
4145         struct nfs_server *server = NFS_SERVER(inode);
4146         struct rpc_task *task;
4147         struct rpc_message msg = {
4148                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_DELEGRETURN],
4149                 .rpc_cred = cred,
4150         };
4151         struct rpc_task_setup task_setup_data = {
4152                 .rpc_client = server->client,
4153                 .rpc_message = &msg,
4154                 .callback_ops = &nfs4_delegreturn_ops,
4155                 .flags = RPC_TASK_ASYNC,
4156         };
4157         int status = 0;
4158
4159         data = kzalloc(sizeof(*data), GFP_NOFS);
4160         if (data == NULL)
4161                 return -ENOMEM;
4162         nfs41_init_sequence(&data->args.seq_args, &data->res.seq_res, 1);
4163         data->args.fhandle = &data->fh;
4164         data->args.stateid = &data->stateid;
4165         data->args.bitmask = server->cache_consistency_bitmask;
4166         nfs_copy_fh(&data->fh, NFS_FH(inode));
4167         nfs4_stateid_copy(&data->stateid, stateid);
4168         data->res.fattr = &data->fattr;
4169         data->res.server = server;
4170         nfs_fattr_init(data->res.fattr);
4171         data->timestamp = jiffies;
4172         data->rpc_status = 0;
4173
4174         task_setup_data.callback_data = data;
4175         msg.rpc_argp = &data->args;
4176         msg.rpc_resp = &data->res;
4177         task = rpc_run_task(&task_setup_data);
4178         if (IS_ERR(task))
4179                 return PTR_ERR(task);
4180         if (!issync)
4181                 goto out;
4182         status = nfs4_wait_for_completion_rpc_task(task);
4183         if (status != 0)
4184                 goto out;
4185         status = data->rpc_status;
4186         if (status == 0)
4187                 nfs_post_op_update_inode_force_wcc(inode, &data->fattr);
4188         else
4189                 nfs_refresh_inode(inode, &data->fattr);
4190 out:
4191         rpc_put_task(task);
4192         return status;
4193 }
4194
4195 int nfs4_proc_delegreturn(struct inode *inode, struct rpc_cred *cred, const nfs4_stateid *stateid, int issync)
4196 {
4197         struct nfs_server *server = NFS_SERVER(inode);
4198         struct nfs4_exception exception = { };
4199         int err;
4200         do {
4201                 err = _nfs4_proc_delegreturn(inode, cred, stateid, issync);
4202                 switch (err) {
4203                         case -NFS4ERR_STALE_STATEID:
4204                         case -NFS4ERR_EXPIRED:
4205                         case 0:
4206                                 return 0;
4207                 }
4208                 err = nfs4_handle_exception(server, err, &exception);
4209         } while (exception.retry);
4210         return err;
4211 }
4212
4213 #define NFS4_LOCK_MINTIMEOUT (1 * HZ)
4214 #define NFS4_LOCK_MAXTIMEOUT (30 * HZ)
4215
4216 /* 
4217  * sleep, with exponential backoff, and retry the LOCK operation. 
4218  */
4219 static unsigned long
4220 nfs4_set_lock_task_retry(unsigned long timeout)
4221 {
4222         freezable_schedule_timeout_killable(timeout);
4223         timeout <<= 1;
4224         if (timeout > NFS4_LOCK_MAXTIMEOUT)
4225                 return NFS4_LOCK_MAXTIMEOUT;
4226         return timeout;
4227 }
4228
4229 static int _nfs4_proc_getlk(struct nfs4_state *state, int cmd, struct file_lock *request)
4230 {
4231         struct inode *inode = state->inode;
4232         struct nfs_server *server = NFS_SERVER(inode);
4233         struct nfs_client *clp = server->nfs_client;
4234         struct nfs_lockt_args arg = {
4235                 .fh = NFS_FH(inode),
4236                 .fl = request,
4237         };
4238         struct nfs_lockt_res res = {
4239                 .denied = request,
4240         };
4241         struct rpc_message msg = {
4242                 .rpc_proc       = &nfs4_procedures[NFSPROC4_CLNT_LOCKT],
4243                 .rpc_argp       = &arg,
4244                 .rpc_resp       = &res,
4245                 .rpc_cred       = state->owner->so_cred,
4246         };
4247         struct nfs4_lock_state *lsp;
4248         int status;
4249
4250         arg.lock_owner.clientid = clp->cl_clientid;
4251         status = nfs4_set_lock_state(state, request);
4252         if (status != 0)
4253                 goto out;
4254         lsp = request->fl_u.nfs4_fl.owner;
4255         arg.lock_owner.id = lsp->ls_seqid.owner_id;
4256         arg.lock_owner.s_dev = server->s_dev;
4257         status = nfs4_call_sync(server->client, server, &msg, &arg.seq_args, &res.seq_res, 1);
4258         switch (status) {
4259                 case 0:
4260                         request->fl_type = F_UNLCK;
4261                         break;
4262                 case -NFS4ERR_DENIED:
4263                         status = 0;
4264         }
4265         request->fl_ops->fl_release_private(request);
4266 out:
4267         return status;
4268 }
4269
4270 static int nfs4_proc_getlk(struct nfs4_state *state, int cmd, struct file_lock *request)
4271 {
4272         struct nfs4_exception exception = { };
4273         int err;
4274
4275         do {
4276                 err = nfs4_handle_exception(NFS_SERVER(state->inode),
4277                                 _nfs4_proc_getlk(state, cmd, request),
4278                                 &exception);
4279         } while (exception.retry);
4280         return err;
4281 }
4282
4283 static int do_vfs_lock(struct file *file, struct file_lock *fl)
4284 {
4285         int res = 0;
4286         switch (fl->fl_flags & (FL_POSIX|FL_FLOCK)) {
4287                 case FL_POSIX:
4288                         res = posix_lock_file_wait(file, fl);
4289                         break;
4290                 case FL_FLOCK:
4291                         res = flock_lock_file_wait(file, fl);
4292                         break;
4293                 default:
4294                         BUG();
4295         }
4296         return res;
4297 }
4298
4299 struct nfs4_unlockdata {
4300         struct nfs_locku_args arg;
4301         struct nfs_locku_res res;
4302         struct nfs4_lock_state *lsp;
4303         struct nfs_open_context *ctx;
4304         struct file_lock fl;
4305         const struct nfs_server *server;
4306         unsigned long timestamp;
4307 };
4308
4309 static struct nfs4_unlockdata *nfs4_alloc_unlockdata(struct file_lock *fl,
4310                 struct nfs_open_context *ctx,
4311                 struct nfs4_lock_state *lsp,
4312                 struct nfs_seqid *seqid)
4313 {
4314         struct nfs4_unlockdata *p;
4315         struct inode *inode = lsp->ls_state->inode;
4316
4317         p = kzalloc(sizeof(*p), GFP_NOFS);
4318         if (p == NULL)
4319                 return NULL;
4320         p->arg.fh = NFS_FH(inode);
4321         p->arg.fl = &p->fl;
4322         p->arg.seqid = seqid;
4323         p->res.seqid = seqid;
4324         p->arg.stateid = &lsp->ls_stateid;
4325         p->lsp = lsp;
4326         atomic_inc(&lsp->ls_count);
4327         /* Ensure we don't close file until we're done freeing locks! */
4328         p->ctx = get_nfs_open_context(ctx);
4329         memcpy(&p->fl, fl, sizeof(p->fl));
4330         p->server = NFS_SERVER(inode);
4331         return p;
4332 }
4333
4334 static void nfs4_locku_release_calldata(void *data)
4335 {
4336         struct nfs4_unlockdata *calldata = data;
4337         nfs_free_seqid(calldata->arg.seqid);
4338         nfs4_put_lock_state(calldata->lsp);
4339         put_nfs_open_context(calldata->ctx);
4340         kfree(calldata);
4341 }
4342
4343 static void nfs4_locku_done(struct rpc_task *task, void *data)
4344 {
4345         struct nfs4_unlockdata *calldata = data;
4346
4347         if (!nfs4_sequence_done(task, &calldata->res.seq_res))
4348                 return;
4349         switch (task->tk_status) {
4350                 case 0:
4351                         nfs4_stateid_copy(&calldata->lsp->ls_stateid,
4352                                         &calldata->res.stateid);
4353                         renew_lease(calldata->server, calldata->timestamp);
4354                         break;
4355                 case -NFS4ERR_BAD_STATEID:
4356                 case -NFS4ERR_OLD_STATEID:
4357                 case -NFS4ERR_STALE_STATEID:
4358                 case -NFS4ERR_EXPIRED:
4359                         break;
4360                 default:
4361                         if (nfs4_async_handle_error(task, calldata->server, NULL) == -EAGAIN)
4362                                 rpc_restart_call_prepare(task);
4363         }
4364 }
4365
4366 static void nfs4_locku_prepare(struct rpc_task *task, void *data)
4367 {
4368         struct nfs4_unlockdata *calldata = data;
4369
4370         if (nfs_wait_on_sequence(calldata->arg.seqid, task) != 0)
4371                 return;
4372         if ((calldata->lsp->ls_flags & NFS_LOCK_INITIALIZED) == 0) {
4373                 /* Note: exit _without_ running nfs4_locku_done */
4374                 task->tk_action = NULL;
4375                 return;
4376         }
4377         calldata->timestamp = jiffies;
4378         if (nfs4_setup_sequence(calldata->server,
4379                                 &calldata->arg.seq_args,
4380                                 &calldata->res.seq_res, task))
4381                 return;
4382         rpc_call_start(task);
4383 }
4384
4385 static const struct rpc_call_ops nfs4_locku_ops = {
4386         .rpc_call_prepare = nfs4_locku_prepare,
4387         .rpc_call_done = nfs4_locku_done,
4388         .rpc_release = nfs4_locku_release_calldata,
4389 };
4390
4391 static struct rpc_task *nfs4_do_unlck(struct file_lock *fl,
4392                 struct nfs_open_context *ctx,
4393                 struct nfs4_lock_state *lsp,
4394                 struct nfs_seqid *seqid)
4395 {
4396         struct nfs4_unlockdata *data;
4397         struct rpc_message msg = {
4398                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LOCKU],
4399                 .rpc_cred = ctx->cred,
4400         };
4401         struct rpc_task_setup task_setup_data = {
4402                 .rpc_client = NFS_CLIENT(lsp->ls_state->inode),
4403                 .rpc_message = &msg,
4404                 .callback_ops = &nfs4_locku_ops,
4405                 .workqueue = nfsiod_workqueue,
4406                 .flags = RPC_TASK_ASYNC,
4407         };
4408
4409         /* Ensure this is an unlock - when canceling a lock, the
4410          * canceled lock is passed in, and it won't be an unlock.
4411          */
4412         fl->fl_type = F_UNLCK;
4413
4414         data = nfs4_alloc_unlockdata(fl, ctx, lsp, seqid);
4415         if (data == NULL) {
4416                 nfs_free_seqid(seqid);
4417                 return ERR_PTR(-ENOMEM);
4418         }
4419
4420         nfs41_init_sequence(&data->arg.seq_args, &data->res.seq_res, 1);
4421         msg.rpc_argp = &data->arg;
4422         msg.rpc_resp = &data->res;
4423         task_setup_data.callback_data = data;
4424         return rpc_run_task(&task_setup_data);
4425 }
4426
4427 static int nfs4_proc_unlck(struct nfs4_state *state, int cmd, struct file_lock *request)
4428 {
4429         struct nfs_inode *nfsi = NFS_I(state->inode);
4430         struct nfs_seqid *seqid;
4431         struct nfs4_lock_state *lsp;
4432         struct rpc_task *task;
4433         int status = 0;
4434         unsigned char fl_flags = request->fl_flags;
4435
4436         status = nfs4_set_lock_state(state, request);
4437         /* Unlock _before_ we do the RPC call */
4438         request->fl_flags |= FL_EXISTS;
4439         down_read(&nfsi->rwsem);
4440         if (do_vfs_lock(request->fl_file, request) == -ENOENT) {
4441                 up_read(&nfsi->rwsem);
4442                 goto out;
4443         }
4444         up_read(&nfsi->rwsem);
4445         if (status != 0)
4446                 goto out;
4447         /* Is this a delegated lock? */
4448         if (test_bit(NFS_DELEGATED_STATE, &state->flags))
4449                 goto out;
4450         lsp = request->fl_u.nfs4_fl.owner;
4451         seqid = nfs_alloc_seqid(&lsp->ls_seqid, GFP_KERNEL);
4452         status = -ENOMEM;
4453         if (seqid == NULL)
4454                 goto out;
4455         task = nfs4_do_unlck(request, nfs_file_open_context(request->fl_file), lsp, seqid);
4456         status = PTR_ERR(task);
4457         if (IS_ERR(task))
4458                 goto out;
4459         status = nfs4_wait_for_completion_rpc_task(task);
4460         rpc_put_task(task);
4461 out:
4462         request->fl_flags = fl_flags;
4463         return status;
4464 }
4465
4466 struct nfs4_lockdata {
4467         struct nfs_lock_args arg;
4468         struct nfs_lock_res res;
4469         struct nfs4_lock_state *lsp;
4470         struct nfs_open_context *ctx;
4471         struct file_lock fl;
4472         unsigned long timestamp;
4473         int rpc_status;
4474         int cancelled;
4475         struct nfs_server *server;
4476 };
4477
4478 static struct nfs4_lockdata *nfs4_alloc_lockdata(struct file_lock *fl,
4479                 struct nfs_open_context *ctx, struct nfs4_lock_state *lsp,
4480                 gfp_t gfp_mask)
4481 {
4482         struct nfs4_lockdata *p;
4483         struct inode *inode = lsp->ls_state->inode;
4484         struct nfs_server *server = NFS_SERVER(inode);
4485
4486         p = kzalloc(sizeof(*p), gfp_mask);
4487         if (p == NULL)
4488                 return NULL;
4489
4490         p->arg.fh = NFS_FH(inode);
4491         p->arg.fl = &p->fl;
4492         p->arg.open_seqid = nfs_alloc_seqid(&lsp->ls_state->owner->so_seqid, gfp_mask);
4493         if (p->arg.open_seqid == NULL)
4494                 goto out_free;
4495         p->arg.lock_seqid = nfs_alloc_seqid(&lsp->ls_seqid, gfp_mask);
4496         if (p->arg.lock_seqid == NULL)
4497                 goto out_free_seqid;
4498         p->arg.lock_stateid = &lsp->ls_stateid;
4499         p->arg.lock_owner.clientid = server->nfs_client->cl_clientid;
4500         p->arg.lock_owner.id = lsp->ls_seqid.owner_id;
4501         p->arg.lock_owner.s_dev = server->s_dev;
4502         p->res.lock_seqid = p->arg.lock_seqid;
4503         p->lsp = lsp;
4504         p->server = server;
4505         atomic_inc(&lsp->ls_count);
4506         p->ctx = get_nfs_open_context(ctx);
4507         memcpy(&p->fl, fl, sizeof(p->fl));
4508         return p;
4509 out_free_seqid:
4510         nfs_free_seqid(p->arg.open_seqid);
4511 out_free:
4512         kfree(p);
4513         return NULL;
4514 }
4515
4516 static void nfs4_lock_prepare(struct rpc_task *task, void *calldata)
4517 {
4518         struct nfs4_lockdata *data = calldata;
4519         struct nfs4_state *state = data->lsp->ls_state;
4520
4521         dprintk("%s: begin!\n", __func__);
4522         if (nfs_wait_on_sequence(data->arg.lock_seqid, task) != 0)
4523                 return;
4524         /* Do we need to do an open_to_lock_owner? */
4525         if (!(data->arg.lock_seqid->sequence->flags & NFS_SEQID_CONFIRMED)) {
4526                 if (nfs_wait_on_sequence(data->arg.open_seqid, task) != 0)
4527                         return;
4528                 data->arg.open_stateid = &state->stateid;
4529                 data->arg.new_lock_owner = 1;
4530                 data->res.open_seqid = data->arg.open_seqid;
4531         } else
4532                 data->arg.new_lock_owner = 0;
4533         data->timestamp = jiffies;
4534         if (nfs4_setup_sequence(data->server,
4535                                 &data->arg.seq_args,
4536                                 &data->res.seq_res, task))
4537                 return;
4538         rpc_call_start(task);
4539         dprintk("%s: done!, ret = %d\n", __func__, data->rpc_status);
4540 }
4541
4542 static void nfs4_recover_lock_prepare(struct rpc_task *task, void *calldata)
4543 {
4544         rpc_task_set_priority(task, RPC_PRIORITY_PRIVILEGED);
4545         nfs4_lock_prepare(task, calldata);
4546 }
4547
4548 static void nfs4_lock_done(struct rpc_task *task, void *calldata)
4549 {
4550         struct nfs4_lockdata *data = calldata;
4551
4552         dprintk("%s: begin!\n", __func__);
4553
4554         if (!nfs4_sequence_done(task, &data->res.seq_res))
4555                 return;
4556
4557         data->rpc_status = task->tk_status;
4558         if (data->arg.new_lock_owner != 0) {
4559                 if (data->rpc_status == 0)
4560                         nfs_confirm_seqid(&data->lsp->ls_seqid, 0);
4561                 else
4562                         goto out;
4563         }
4564         if (data->rpc_status == 0) {
4565                 nfs4_stateid_copy(&data->lsp->ls_stateid, &data->res.stateid);
4566                 data->lsp->ls_flags |= NFS_LOCK_INITIALIZED;
4567                 renew_lease(NFS_SERVER(data->ctx->dentry->d_inode), data->timestamp);
4568         }
4569 out:
4570         dprintk("%s: done, ret = %d!\n", __func__, data->rpc_status);
4571 }
4572
4573 static void nfs4_lock_release(void *calldata)
4574 {
4575         struct nfs4_lockdata *data = calldata;
4576
4577         dprintk("%s: begin!\n", __func__);
4578         nfs_free_seqid(data->arg.open_seqid);
4579         if (data->cancelled != 0) {
4580                 struct rpc_task *task;
4581                 task = nfs4_do_unlck(&data->fl, data->ctx, data->lsp,
4582                                 data->arg.lock_seqid);
4583                 if (!IS_ERR(task))
4584                         rpc_put_task_async(task);
4585                 dprintk("%s: cancelling lock!\n", __func__);
4586         } else
4587                 nfs_free_seqid(data->arg.lock_seqid);
4588         nfs4_put_lock_state(data->lsp);
4589         put_nfs_open_context(data->ctx);
4590         kfree(data);
4591         dprintk("%s: done!\n", __func__);
4592 }
4593
4594 static const struct rpc_call_ops nfs4_lock_ops = {
4595         .rpc_call_prepare = nfs4_lock_prepare,
4596         .rpc_call_done = nfs4_lock_done,
4597         .rpc_release = nfs4_lock_release,
4598 };
4599
4600 static const struct rpc_call_ops nfs4_recover_lock_ops = {
4601         .rpc_call_prepare = nfs4_recover_lock_prepare,
4602         .rpc_call_done = nfs4_lock_done,
4603         .rpc_release = nfs4_lock_release,
4604 };
4605
4606 static void nfs4_handle_setlk_error(struct nfs_server *server, struct nfs4_lock_state *lsp, int new_lock_owner, int error)
4607 {
4608         switch (error) {
4609         case -NFS4ERR_ADMIN_REVOKED:
4610         case -NFS4ERR_BAD_STATEID:
4611                 lsp->ls_seqid.flags &= ~NFS_SEQID_CONFIRMED;
4612                 if (new_lock_owner != 0 ||
4613                    (lsp->ls_flags & NFS_LOCK_INITIALIZED) != 0)
4614                         nfs4_schedule_stateid_recovery(server, lsp->ls_state);
4615                 break;
4616         case -NFS4ERR_STALE_STATEID:
4617                 lsp->ls_seqid.flags &= ~NFS_SEQID_CONFIRMED;
4618         case -NFS4ERR_EXPIRED:
4619                 nfs4_schedule_lease_recovery(server->nfs_client);
4620         };
4621 }
4622
4623 static int _nfs4_do_setlk(struct nfs4_state *state, int cmd, struct file_lock *fl, int recovery_type)
4624 {
4625         struct nfs4_lockdata *data;
4626         struct rpc_task *task;
4627         struct rpc_message msg = {
4628                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LOCK],
4629                 .rpc_cred = state->owner->so_cred,
4630         };
4631         struct rpc_task_setup task_setup_data = {
4632                 .rpc_client = NFS_CLIENT(state->inode),
4633                 .rpc_message = &msg,
4634                 .callback_ops = &nfs4_lock_ops,
4635                 .workqueue = nfsiod_workqueue,
4636                 .flags = RPC_TASK_ASYNC,
4637         };
4638         int ret;
4639
4640         dprintk("%s: begin!\n", __func__);
4641         data = nfs4_alloc_lockdata(fl, nfs_file_open_context(fl->fl_file),
4642                         fl->fl_u.nfs4_fl.owner,
4643                         recovery_type == NFS_LOCK_NEW ? GFP_KERNEL : GFP_NOFS);
4644         if (data == NULL)
4645                 return -ENOMEM;
4646         if (IS_SETLKW(cmd))
4647                 data->arg.block = 1;
4648         if (recovery_type > NFS_LOCK_NEW) {
4649                 if (recovery_type == NFS_LOCK_RECLAIM)
4650                         data->arg.reclaim = NFS_LOCK_RECLAIM;
4651                 task_setup_data.callback_ops = &nfs4_recover_lock_ops;
4652         }
4653         nfs41_init_sequence(&data->arg.seq_args, &data->res.seq_res, 1);
4654         msg.rpc_argp = &data->arg;
4655         msg.rpc_resp = &data->res;
4656         task_setup_data.callback_data = data;
4657         task = rpc_run_task(&task_setup_data);
4658         if (IS_ERR(task))
4659                 return PTR_ERR(task);
4660         ret = nfs4_wait_for_completion_rpc_task(task);
4661         if (ret == 0) {
4662                 ret = data->rpc_status;
4663                 if (ret)
4664                         nfs4_handle_setlk_error(data->server, data->lsp,
4665                                         data->arg.new_lock_owner, ret);
4666         } else
4667                 data->cancelled = 1;
4668         rpc_put_task(task);
4669         dprintk("%s: done, ret = %d!\n", __func__, ret);
4670         return ret;
4671 }
4672
4673 static int nfs4_lock_reclaim(struct nfs4_state *state, struct file_lock *request)
4674 {
4675         struct nfs_server *server = NFS_SERVER(state->inode);
4676         struct nfs4_exception exception = {
4677                 .inode = state->inode,
4678         };
4679         int err;
4680
4681         do {
4682                 /* Cache the lock if possible... */
4683                 if (test_bit(NFS_DELEGATED_STATE, &state->flags) != 0)
4684                         return 0;
4685                 err = _nfs4_do_setlk(state, F_SETLK, request, NFS_LOCK_RECLAIM);
4686                 if (err != -NFS4ERR_DELAY)
4687                         break;
4688                 nfs4_handle_exception(server, err, &exception);
4689         } while (exception.retry);
4690         return err;
4691 }
4692
4693 static int nfs4_lock_expired(struct nfs4_state *state, struct file_lock *request)
4694 {
4695         struct nfs_server *server = NFS_SERVER(state->inode);
4696         struct nfs4_exception exception = {
4697                 .inode = state->inode,
4698         };
4699         int err;
4700
4701         err = nfs4_set_lock_state(state, request);
4702         if (err != 0)
4703                 return err;
4704         do {
4705                 if (test_bit(NFS_DELEGATED_STATE, &state->flags) != 0)
4706                         return 0;
4707                 err = _nfs4_do_setlk(state, F_SETLK, request, NFS_LOCK_EXPIRED);
4708                 switch (err) {
4709                 default:
4710                         goto out;
4711                 case -NFS4ERR_GRACE:
4712                 case -NFS4ERR_DELAY:
4713                         nfs4_handle_exception(server, err, &exception);
4714                         err = 0;
4715                 }
4716         } while (exception.retry);
4717 out:
4718         return err;
4719 }
4720
4721 #if defined(CONFIG_NFS_V4_1)
4722 /**
4723  * nfs41_check_expired_locks - possibly free a lock stateid
4724  *
4725  * @state: NFSv4 state for an inode
4726  *
4727  * Returns NFS_OK if recovery for this stateid is now finished.
4728  * Otherwise a negative NFS4ERR value is returned.
4729  */
4730 static int nfs41_check_expired_locks(struct nfs4_state *state)
4731 {
4732         int status, ret = -NFS4ERR_BAD_STATEID;
4733         struct nfs4_lock_state *lsp;
4734         struct nfs_server *server = NFS_SERVER(state->inode);
4735
4736         list_for_each_entry(lsp, &state->lock_states, ls_locks) {
4737                 if (lsp->ls_flags & NFS_LOCK_INITIALIZED) {
4738                         status = nfs41_test_stateid(server, &lsp->ls_stateid);
4739                         if (status != NFS_OK) {
4740                                 /* Free the stateid unless the server
4741                                  * informs us the stateid is unrecognized. */
4742                                 if (status != -NFS4ERR_BAD_STATEID)
4743                                         nfs41_free_stateid(server,
4744                                                         &lsp->ls_stateid);
4745                                 lsp->ls_flags &= ~NFS_LOCK_INITIALIZED;
4746                                 ret = status;
4747                         }
4748                 }
4749         };
4750
4751         return ret;
4752 }
4753
4754 static int nfs41_lock_expired(struct nfs4_state *state, struct file_lock *request)
4755 {
4756         int status = NFS_OK;
4757
4758         if (test_bit(LK_STATE_IN_USE, &state->flags))
4759                 status = nfs41_check_expired_locks(state);
4760         if (status != NFS_OK)
4761                 status = nfs4_lock_expired(state, request);
4762         return status;
4763 }
4764 #endif
4765
4766 static int _nfs4_proc_setlk(struct nfs4_state *state, int cmd, struct file_lock *request)
4767 {
4768         struct nfs_inode *nfsi = NFS_I(state->inode);
4769         unsigned char fl_flags = request->fl_flags;
4770         int status = -ENOLCK;
4771
4772         if ((fl_flags & FL_POSIX) &&
4773                         !test_bit(NFS_STATE_POSIX_LOCKS, &state->flags))
4774                 goto out;
4775         /* Is this a delegated open? */
4776         status = nfs4_set_lock_state(state, request);
4777         if (status != 0)
4778                 goto out;
4779         request->fl_flags |= FL_ACCESS;
4780         status = do_vfs_lock(request->fl_file, request);
4781         if (status < 0)
4782                 goto out;
4783         down_read(&nfsi->rwsem);
4784         if (test_bit(NFS_DELEGATED_STATE, &state->flags)) {
4785                 /* Yes: cache locks! */
4786                 /* ...but avoid races with delegation recall... */
4787                 request->fl_flags = fl_flags & ~FL_SLEEP;
4788                 status = do_vfs_lock(request->fl_file, request);
4789                 goto out_unlock;
4790         }
4791         status = _nfs4_do_setlk(state, cmd, request, NFS_LOCK_NEW);
4792         if (status != 0)
4793                 goto out_unlock;
4794         /* Note: we always want to sleep here! */
4795         request->fl_flags = fl_flags | FL_SLEEP;
4796         if (do_vfs_lock(request->fl_file, request) < 0)
4797                 printk(KERN_WARNING "NFS: %s: VFS is out of sync with lock "
4798                         "manager!\n", __func__);
4799 out_unlock:
4800         up_read(&nfsi->rwsem);
4801 out:
4802         request->fl_flags = fl_flags;
4803         return status;
4804 }
4805
4806 static int nfs4_proc_setlk(struct nfs4_state *state, int cmd, struct file_lock *request)
4807 {
4808         struct nfs4_exception exception = {
4809                 .state = state,
4810                 .inode = state->inode,
4811         };
4812         int err;
4813
4814         do {
4815                 err = _nfs4_proc_setlk(state, cmd, request);
4816                 if (err == -NFS4ERR_DENIED)
4817                         err = -EAGAIN;
4818                 err = nfs4_handle_exception(NFS_SERVER(state->inode),
4819                                 err, &exception);
4820         } while (exception.retry);
4821         return err;
4822 }
4823
4824 static int
4825 nfs4_proc_lock(struct file *filp, int cmd, struct file_lock *request)
4826 {
4827         struct nfs_open_context *ctx;
4828         struct nfs4_state *state;
4829         unsigned long timeout = NFS4_LOCK_MINTIMEOUT;
4830         int status;
4831
4832         /* verify open state */
4833         ctx = nfs_file_open_context(filp);
4834         state = ctx->state;
4835
4836         if (request->fl_start < 0 || request->fl_end < 0)
4837                 return -EINVAL;
4838
4839         if (IS_GETLK(cmd)) {
4840                 if (state != NULL)
4841                         return nfs4_proc_getlk(state, F_GETLK, request);
4842                 return 0;
4843         }
4844
4845         if (!(IS_SETLK(cmd) || IS_SETLKW(cmd)))
4846                 return -EINVAL;
4847
4848         if (request->fl_type == F_UNLCK) {
4849                 if (state != NULL)
4850                         return nfs4_proc_unlck(state, cmd, request);
4851                 return 0;
4852         }
4853
4854         if (state == NULL)
4855                 return -ENOLCK;
4856         /*
4857          * Don't rely on the VFS having checked the file open mode,
4858          * since it won't do this for flock() locks.
4859          */
4860         switch (request->fl_type & (F_RDLCK|F_WRLCK|F_UNLCK)) {
4861         case F_RDLCK:
4862                 if (!(filp->f_mode & FMODE_READ))
4863                         return -EBADF;
4864                 break;
4865         case F_WRLCK:
4866                 if (!(filp->f_mode & FMODE_WRITE))
4867                         return -EBADF;
4868         }
4869
4870         do {
4871                 status = nfs4_proc_setlk(state, cmd, request);
4872                 if ((status != -EAGAIN) || IS_SETLK(cmd))
4873                         break;
4874                 timeout = nfs4_set_lock_task_retry(timeout);
4875                 status = -ERESTARTSYS;
4876                 if (signalled())
4877                         break;
4878         } while(status < 0);
4879         return status;
4880 }
4881
4882 int nfs4_lock_delegation_recall(struct nfs4_state *state, struct file_lock *fl)
4883 {
4884         struct nfs_server *server = NFS_SERVER(state->inode);
4885         struct nfs4_exception exception = { };
4886         int err;
4887
4888         err = nfs4_set_lock_state(state, fl);
4889         if (err != 0)
4890                 goto out;
4891         do {
4892                 err = _nfs4_do_setlk(state, F_SETLK, fl, NFS_LOCK_NEW);
4893                 switch (err) {
4894                         default:
4895                                 printk(KERN_ERR "NFS: %s: unhandled error "
4896                                         "%d.\n", __func__, err);
4897                         case 0:
4898                         case -ESTALE:
4899                                 goto out;
4900                         case -NFS4ERR_EXPIRED:
4901                                 nfs4_schedule_stateid_recovery(server, state);
4902                         case -NFS4ERR_STALE_CLIENTID:
4903                         case -NFS4ERR_STALE_STATEID:
4904                                 nfs4_schedule_lease_recovery(server->nfs_client);
4905                                 goto out;
4906                         case -NFS4ERR_BADSESSION:
4907                         case -NFS4ERR_BADSLOT:
4908                         case -NFS4ERR_BAD_HIGH_SLOT:
4909                         case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION:
4910                         case -NFS4ERR_DEADSESSION:
4911                                 nfs4_schedule_session_recovery(server->nfs_client->cl_session, err);
4912                                 goto out;
4913                         case -ERESTARTSYS:
4914                                 /*
4915                                  * The show must go on: exit, but mark the
4916                                  * stateid as needing recovery.
4917                                  */
4918                         case -NFS4ERR_DELEG_REVOKED:
4919                         case -NFS4ERR_ADMIN_REVOKED:
4920                         case -NFS4ERR_BAD_STATEID:
4921                         case -NFS4ERR_OPENMODE:
4922                                 nfs4_schedule_stateid_recovery(server, state);
4923                                 err = 0;
4924                                 goto out;
4925                         case -EKEYEXPIRED:
4926                                 /*
4927                                  * User RPCSEC_GSS context has expired.
4928                                  * We cannot recover this stateid now, so
4929                                  * skip it and allow recovery thread to
4930                                  * proceed.
4931                                  */
4932                                 err = 0;
4933                                 goto out;
4934                         case -ENOMEM:
4935                         case -NFS4ERR_DENIED:
4936                                 /* kill_proc(fl->fl_pid, SIGLOST, 1); */
4937                                 err = 0;
4938                                 goto out;
4939                         case -NFS4ERR_DELAY:
4940                                 break;
4941                 }
4942                 err = nfs4_handle_exception(server, err, &exception);
4943         } while (exception.retry);
4944 out:
4945         return err;
4946 }
4947
/*
 * Call data for the asynchronous RELEASE_LOCKOWNER request.  It is
 * allocated in nfs4_release_lockowner() and freed, together with the
 * lock state it refers to, in nfs4_release_lockowner_release().
 */
4948 struct nfs_release_lockowner_data {
        /* lock state passed to nfs4_free_lock_state() on release */
4949         struct nfs4_lock_state *lsp;
        /* server passed to nfs4_free_lock_state() on release */
4950         struct nfs_server *server;
        /* RPC arguments; used as msg.rpc_argp */
4951         struct nfs_release_lockowner_args args;
4952 };
4953
4954 static void nfs4_release_lockowner_release(void *calldata)
4955 {
4956         struct nfs_release_lockowner_data *data = calldata;
4957         nfs4_free_lock_state(data->server, data->lsp);
4958         kfree(calldata);
4959 }
4960
/*
 * RPC callbacks for RELEASE_LOCKOWNER: only a release hook is installed,
 * which frees the lock state and the call data.
 */
4961 static const struct rpc_call_ops nfs4_release_lockowner_ops = {
4962         .rpc_release = nfs4_release_lockowner_release,
4963 };
4964
4965 int nfs4_release_lockowner(struct nfs4_lock_state *lsp)
4966 {
4967         struct nfs_server *server = lsp->ls_state->owner->so_server;
4968         struct nfs_release_lockowner_data *data;
4969         struct rpc_message msg = {
4970                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_RELEASE_LOCKOWNER],
4971         };
4972
4973         if (server->nfs_client->cl_mvops->minor_version != 0)
4974                 return -EINVAL;
4975         data = kmalloc(sizeof(*data), GFP_NOFS);
4976         if (!data)
4977                 return -ENOMEM;
4978         data->lsp = lsp;
4979         data->server = server;
4980         data->args.lock_owner.clientid = server->nfs_client->cl_clientid;
4981         data->args.lock_owner.id = lsp->ls_seqid.owner_id;
4982         data->args.lock_owner.s_dev = server->s_dev;
4983         msg.rpc_argp = &data->args;
4984         rpc_call_async(server->client, &msg, 0, &nfs4_release_lockowner_ops, data);
4985         return 0;
4986 }
4987
/* Name of the NFSv4 ACL extended attribute, as reported by the list handler. */
4988 #define XATTR_NAME_NFSV4_ACL "system.nfs4_acl"
4989
4990 static int nfs4_xattr_set_nfs4_acl(struct dentry *dentry, const char *key,
4991                                    const void *buf, size_t buflen,
4992                                    int flags, int type)
4993 {
4994         if (strcmp(key, "") != 0)
4995                 return -EINVAL;
4996
4997         return nfs4_proc_set_acl(dentry->d_inode, buf, buflen);
4998 }
4999
5000 static int nfs4_xattr_get_nfs4_acl(struct dentry *dentry, const char *key,
5001                                    void *buf, size_t buflen, int type)
5002 {
5003         if (strcmp(key, "") != 0)
5004                 return -EINVAL;
5005
5006         return nfs4_proc_get_acl(dentry->d_inode, buf, buflen);
5007 }
5008
5009 static size_t nfs4_xattr_list_nfs4_acl(struct dentry *dentry, char *list,
5010                                        size_t list_len, const char *name,
5011                                        size_t name_len, int type)
5012 {
5013         size_t len = sizeof(XATTR_NAME_NFSV4_ACL);
5014
5015         if (!nfs4_server_supports_acls(NFS_SERVER(dentry->d_inode)))
5016                 return 0;
5017
5018         if (list && len <= list_len)
5019                 memcpy(list, XATTR_NAME_NFSV4_ACL, len);
5020         return len;
5021 }
5022
5023 /*
5024  * nfs_fhget will use either the mounted_on_fileid or the fileid
5025  */
5026 static void nfs_fixup_referral_attributes(struct nfs_fattr *fattr)
5027 {
5028         if (!(((fattr->valid & NFS_ATTR_FATTR_MOUNTED_ON_FILEID) ||
5029                (fattr->valid & NFS_ATTR_FATTR_FILEID)) &&
5030               (fattr->valid & NFS_ATTR_FATTR_FSID) &&
5031               (fattr->valid & NFS_ATTR_FATTR_V4_LOCATIONS)))
5032                 return;
5033
5034         fattr->valid |= NFS_ATTR_FATTR_TYPE | NFS_ATTR_FATTR_MODE |
5035                 NFS_ATTR_FATTR_NLINK | NFS_ATTR_FATTR_V4_REFERRAL;
5036         fattr->mode = S_IFDIR | S_IRUGO | S_IXUGO;
5037         fattr->nlink = 2;
5038 }
5039
5040 static int _nfs4_proc_fs_locations(struct rpc_clnt *client, struct inode *dir,
5041                                    const struct qstr *name,
5042                                    struct nfs4_fs_locations *fs_locations,
5043                                    struct page *page)
5044 {
5045         struct nfs_server *server = NFS_SERVER(dir);
5046         u32 bitmask[2] = {
5047                 [0] = FATTR4_WORD0_FSID | FATTR4_WORD0_FS_LOCATIONS,
5048         };
5049         struct nfs4_fs_locations_arg args = {
5050                 .dir_fh = NFS_FH(dir),
5051                 .name = name,
5052                 .page = page,
5053                 .bitmask = bitmask,
5054         };
5055         struct nfs4_fs_locations_res res = {
5056                 .fs_locations = fs_locations,
5057         };
5058         struct rpc_message msg = {
5059                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_FS_LOCATIONS],
5060                 .rpc_argp = &args,
5061                 .rpc_resp = &res,
5062         };
5063         int status;
5064
5065         dprintk("%s: start\n", __func__);
5066
5067         /* Ask for the fileid of the absent filesystem if mounted_on_fileid
5068          * is not supported */
5069         if (NFS_SERVER(dir)->attr_bitmask[1] & FATTR4_WORD1_MOUNTED_ON_FILEID)
5070                 bitmask[1] |= FATTR4_WORD1_MOUNTED_ON_FILEID;
5071         else
5072                 bitmask[0] |= FATTR4_WORD0_FILEID;
5073
5074         nfs_fattr_init(&fs_locations->fattr);
5075         fs_locations->server = server;
5076         fs_locations->nlocations = 0;
5077         status = nfs4_call_sync(client, server, &msg, &args.seq_args, &res.seq_res, 0);
5078         dprintk("%s: returned status = %d\n", __func__, status);
5079         return status;
5080 }
5081
5082 int nfs4_proc_fs_locations(struct rpc_clnt *client, struct inode *dir,
5083                            const struct qstr *name,
5084                            struct nfs4_fs_locations *fs_locations,
5085                            struct page *page)
5086 {
5087         struct nfs4_exception exception = { };
5088         int err;
5089         do {
5090                 err = nfs4_handle_exception(NFS_SERVER(dir),
5091                                 _nfs4_proc_fs_locations(client, dir, name, fs_locations, page),
5092                                 &exception);
5093         } while (exception.retry);
5094         return err;
5095 }
5096
5097 static int _nfs4_proc_secinfo(struct inode *dir, const struct qstr *name, struct nfs4_secinfo_flavors *flavors)
5098 {
5099         int status;
5100         struct nfs4_secinfo_arg args = {
5101                 .dir_fh = NFS_FH(dir),
5102                 .name   = name,
5103         };
5104         struct nfs4_secinfo_res res = {
5105                 .flavors     = flavors,
5106         };
5107         struct rpc_message msg = {
5108                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SECINFO],
5109                 .rpc_argp = &args,
5110                 .rpc_resp = &res,
5111         };
5112
5113         dprintk("NFS call  secinfo %s\n", name->name);
5114         status = nfs4_call_sync(NFS_SERVER(dir)->client, NFS_SERVER(dir), &msg, &args.seq_args, &res.seq_res, 0);
5115         dprintk("NFS reply  secinfo: %d\n", status);
5116         return status;
5117 }
5118
5119 int nfs4_proc_secinfo(struct inode *dir, const struct qstr *name,
5120                       struct nfs4_secinfo_flavors *flavors)
5121 {
5122         struct nfs4_exception exception = { };
5123         int err;
5124         do {
5125                 err = nfs4_handle_exception(NFS_SERVER(dir),
5126                                 _nfs4_proc_secinfo(dir, name, flavors),
5127                                 &exception);
5128         } while (exception.retry);
5129         return err;
5130 }
5131
5132 #ifdef CONFIG_NFS_V4_1
5133 /*
5134  * Check the exchange flags returned by the server for invalid flags, having
5135  * both PNFS and NON_PNFS flags set, and not having one of NON_PNFS, PNFS, or
5136  * DS flags set.
5137  */
5138 static int nfs4_check_cl_exchange_flags(u32 flags)
5139 {
5140         if (flags & ~EXCHGID4_FLAG_MASK_R)
5141                 goto out_inval;
5142         if ((flags & EXCHGID4_FLAG_USE_PNFS_MDS) &&
5143             (flags & EXCHGID4_FLAG_USE_NON_PNFS))
5144                 goto out_inval;
5145         if (!(flags & (EXCHGID4_FLAG_MASK_PNFS)))
5146                 goto out_inval;
5147         return NFS_OK;
5148 out_inval:
5149         return -NFS4ERR_INVAL;
5150 }
5151
5152 static bool
5153 nfs41_same_server_scope(struct nfs41_server_scope *a,
5154                         struct nfs41_server_scope *b)
5155 {
5156         if (a->server_scope_sz == b->server_scope_sz &&
5157             memcmp(a->server_scope, b->server_scope, a->server_scope_sz) == 0)
5158                 return true;
5159
5160         return false;
5161 }
5162
5163 /*
5164  * nfs4_proc_bind_conn_to_session()
5165  *
5166  * The 4.1 client currently uses the same TCP connection for the
5167  * fore and backchannel.
5168  */
5169 int nfs4_proc_bind_conn_to_session(struct nfs_client *clp, struct rpc_cred *cred)
5170 {
5171         int status;
5172         struct nfs41_bind_conn_to_session_res res;
5173         struct rpc_message msg = {
5174                 .rpc_proc =
5175                         &nfs4_procedures[NFSPROC4_CLNT_BIND_CONN_TO_SESSION],
5176                 .rpc_argp = clp,
5177                 .rpc_resp = &res,
5178                 .rpc_cred = cred,
5179         };
5180
5181         dprintk("--> %s\n", __func__);
5182         BUG_ON(clp == NULL);
5183
5184         res.session = kzalloc(sizeof(struct nfs4_session), GFP_NOFS);
5185         if (unlikely(res.session == NULL)) {
5186                 status = -ENOMEM;
5187                 goto out;
5188         }
5189
5190         status = rpc_call_sync(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
5191         if (status == 0) {
5192                 if (memcmp(res.session->sess_id.data,
5193                     clp->cl_session->sess_id.data, NFS4_MAX_SESSIONID_LEN)) {
5194                         dprintk("NFS: %s: Session ID mismatch\n", __func__);
5195                         status = -EIO;
5196                         goto out_session;
5197                 }
5198                 if (res.dir != NFS4_CDFS4_BOTH) {
5199                         dprintk("NFS: %s: Unexpected direction from server\n",
5200                                 __func__);
5201                         status = -EIO;
5202                         goto out_session;
5203                 }
5204                 if (res.use_conn_in_rdma_mode) {
5205                         dprintk("NFS: %s: Server returned RDMA mode = true\n",
5206                                 __func__);
5207                         status = -EIO;
5208                         goto out_session;
5209                 }
5210         }
5211 out_session:
5212         kfree(res.session);
5213 out:
5214         dprintk("<-- %s status= %d\n", __func__, status);
5215         return status;
5216 }
5217
5218 /*
5219  * nfs4_proc_exchange_id()
5220  *
5221  * Since the clientid has expired, all compounds using sessions
5222  * associated with the stale clientid will be returning
5223  * NFS4ERR_BADSESSION in the sequence operation, and will therefore
5224  * be in some phase of session reset.
5225  */
5226 int nfs4_proc_exchange_id(struct nfs_client *clp, struct rpc_cred *cred)
5227 {
5228         nfs4_verifier verifier;
5229         struct nfs41_exchange_id_args args = {
5230                 .verifier = &verifier,
5231                 .client = clp,
5232                 .flags = EXCHGID4_FLAG_SUPP_MOVED_REFER,
5233         };
5234         struct nfs41_exchange_id_res res = {
5235                 0
5236         };
5237         int status;
5238         struct rpc_message msg = {
5239                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_EXCHANGE_ID],
5240                 .rpc_argp = &args,
5241                 .rpc_resp = &res,
5242                 .rpc_cred = cred,
5243         };
5244
5245         dprintk("--> %s\n", __func__);
5246         BUG_ON(clp == NULL);
5247
5248         nfs4_init_boot_verifier(clp, &verifier);
5249
5250         args.id_len = scnprintf(args.id, sizeof(args.id),
5251                                 "%s/%s",
5252                                 clp->cl_ipaddr,
5253                                 clp->cl_rpcclient->cl_nodename);
5254
5255         res.server_owner = kzalloc(sizeof(struct nfs41_server_owner),
5256                                         GFP_NOFS);
5257         if (unlikely(res.server_owner == NULL)) {
5258                 status = -ENOMEM;
5259                 goto out;
5260         }
5261
5262         res.server_scope = kzalloc(sizeof(struct nfs41_server_scope),
5263                                         GFP_NOFS);
5264         if (unlikely(res.server_scope == NULL)) {
5265                 status = -ENOMEM;
5266                 goto out_server_owner;
5267         }
5268
5269         res.impl_id = kzalloc(sizeof(struct nfs41_impl_id), GFP_NOFS);
5270         if (unlikely(res.impl_id == NULL)) {
5271                 status = -ENOMEM;
5272                 goto out_server_scope;
5273         }
5274
5275         status = rpc_call_sync(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
5276         if (status == 0)
5277                 status = nfs4_check_cl_exchange_flags(res.flags);
5278
5279         if (status == 0) {
5280                 clp->cl_clientid = res.clientid;
5281                 clp->cl_exchange_flags = (res.flags & ~EXCHGID4_FLAG_CONFIRMED_R);
5282                 if (!(res.flags & EXCHGID4_FLAG_CONFIRMED_R))
5283                         clp->cl_seqid = res.seqid;
5284
5285                 kfree(clp->cl_serverowner);
5286                 clp->cl_serverowner = res.server_owner;
5287                 res.server_owner = NULL;
5288
5289                 /* use the most recent implementation id */
5290                 kfree(clp->cl_implid);
5291                 clp->cl_implid = res.impl_id;
5292
5293                 if (clp->cl_serverscope != NULL &&
5294                     !nfs41_same_server_scope(clp->cl_serverscope,
5295                                              res.server_scope)) {
5296                         dprintk("%s: server_scope mismatch detected\n",
5297                                 __func__);
5298                         set_bit(NFS4CLNT_SERVER_SCOPE_MISMATCH, &clp->cl_state);
5299                         kfree(clp->cl_serverscope);
5300                         clp->cl_serverscope = NULL;
5301                 }
5302
5303                 if (clp->cl_serverscope == NULL) {
5304                         clp->cl_serverscope = res.server_scope;
5305                         goto out;
5306                 }
5307         } else
5308                 kfree(res.impl_id);
5309
5310 out_server_owner:
5311         kfree(res.server_owner);
5312 out_server_scope:
5313         kfree(res.server_scope);
5314 out:
5315         if (clp->cl_implid != NULL)
5316                 dprintk("%s: Server Implementation ID: "
5317                         "domain: %s, name: %s, date: %llu,%u\n",
5318                         __func__, clp->cl_implid->domain, clp->cl_implid->name,
5319                         clp->cl_implid->date.seconds,
5320                         clp->cl_implid->date.nseconds);
5321         dprintk("<-- %s status= %d\n", __func__, status);
5322         return status;
5323 }
5324
5325 static int _nfs4_proc_destroy_clientid(struct nfs_client *clp,
5326                 struct rpc_cred *cred)
5327 {
5328         struct rpc_message msg = {
5329                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_DESTROY_CLIENTID],
5330                 .rpc_argp = clp,
5331                 .rpc_cred = cred,
5332         };
5333         int status;
5334
5335         status = rpc_call_sync(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
5336         if (status)
5337                 dprintk("NFS: Got error %d from the server %s on "
5338                         "DESTROY_CLIENTID.", status, clp->cl_hostname);
5339         return status;
5340 }
5341
5342 static int nfs4_proc_destroy_clientid(struct nfs_client *clp,
5343                 struct rpc_cred *cred)
5344 {
5345         unsigned int loop;
5346         int ret;
5347
5348         for (loop = NFS4_MAX_LOOP_ON_RECOVER; loop != 0; loop--) {
5349                 ret = _nfs4_proc_destroy_clientid(clp, cred);
5350                 switch (ret) {
5351                 case -NFS4ERR_DELAY:
5352                 case -NFS4ERR_CLIENTID_BUSY:
5353                         ssleep(1);
5354                         break;
5355                 default:
5356                         return ret;
5357                 }
5358         }
5359         return 0;
5360 }
5361
5362 int nfs4_destroy_clientid(struct nfs_client *clp)
5363 {
5364         struct rpc_cred *cred;
5365         int ret = 0;
5366
5367         if (clp->cl_mvops->minor_version < 1)
5368                 goto out;
5369         if (clp->cl_exchange_flags == 0)
5370                 goto out;
5371         cred = nfs4_get_exchange_id_cred(clp);
5372         ret = nfs4_proc_destroy_clientid(clp, cred);
5373         if (cred)
5374                 put_rpccred(cred);
5375         switch (ret) {
5376         case 0:
5377         case -NFS4ERR_STALE_CLIENTID:
5378                 clp->cl_exchange_flags = 0;
5379         }
5380 out:
5381         return ret;
5382 }
5383
/*
 * Call data shared by the GET_LEASE_TIME prepare and done callbacks.
 */
5384 struct nfs4_get_lease_time_data {
        /* request arguments; the prepare callback uses la_seq_args */
5385         struct nfs4_get_lease_time_args *args;
        /* reply; both callbacks use lr_seq_res */
5386         struct nfs4_get_lease_time_res *res;
        /* client whose session is used to set up the sequence */
5387         struct nfs_client *clp;
5388 };
5389
5390 static void nfs4_get_lease_time_prepare(struct rpc_task *task,
5391                                         void *calldata)
5392 {
5393         int ret;
5394         struct nfs4_get_lease_time_data *data =
5395                         (struct nfs4_get_lease_time_data *)calldata;
5396
5397         dprintk("--> %s\n", __func__);
5398         rpc_task_set_priority(task, RPC_PRIORITY_PRIVILEGED);
5399         /* just setup sequence, do not trigger session recovery
5400            since we're invoked within one */
5401         ret = nfs41_setup_sequence(data->clp->cl_session,
5402                                    &data->args->la_seq_args,
5403                                    &data->res->lr_seq_res, task);
5404
5405         BUG_ON(ret == -EAGAIN);
5406         rpc_call_start(task);
5407         dprintk("<-- %s\n", __func__);
5408 }
5409
5410 /*
5411  * Called from nfs4_state_manager thread for session setup, so don't recover
5412  * from sequence operation or clientid errors.
5413  */
5414 static void nfs4_get_lease_time_done(struct rpc_task *task, void *calldata)
5415 {
5416         struct nfs4_get_lease_time_data *data =
5417                         (struct nfs4_get_lease_time_data *)calldata;
5418
5419         dprintk("--> %s\n", __func__);
5420         if (!nfs41_sequence_done(task, &data->res->lr_seq_res))
5421                 return;
5422         switch (task->tk_status) {
5423         case -NFS4ERR_DELAY:
5424         case -NFS4ERR_GRACE:
5425                 dprintk("%s Retry: tk_status %d\n", __func__, task->tk_status);
5426                 rpc_delay(task, NFS4_POLL_RETRY_MIN);
5427                 task->tk_status = 0;
5428                 /* fall through */
5429         case -NFS4ERR_RETRY_UNCACHED_REP:
5430                 rpc_restart_call_prepare(task);
5431                 return;
5432         }
5433         dprintk("<-- %s\n", __func__);
5434 }
5435
/*
 * RPC callbacks for GET_LEASE_TIME: the prepare hook sets up the sequence
 * and starts the call, the done hook handles the retryable errors.
 */
5436 static const struct rpc_call_ops nfs4_get_lease_time_ops = {
5437         .rpc_call_prepare = nfs4_get_lease_time_prepare,
5438         .rpc_call_done = nfs4_get_lease_time_done,
5439 };
5440
5441 int nfs4_proc_get_lease_time(struct nfs_client *clp, struct nfs_fsinfo *fsinfo)
5442 {
5443         struct rpc_task *task;
5444         struct nfs4_get_lease_time_args args;
5445         struct nfs4_get_lease_time_res res = {
5446                 .lr_fsinfo = fsinfo,
5447         };
5448         struct nfs4_get_lease_time_data data = {
5449                 .args = &args,
5450                 .res = &res,
5451                 .clp = clp,
5452         };
5453         struct rpc_message msg = {
5454                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_GET_LEASE_TIME],
5455                 .rpc_argp = &args,
5456                 .rpc_resp = &res,
5457         };
5458         struct rpc_task_setup task_setup = {
5459                 .rpc_client = clp->cl_rpcclient,
5460                 .rpc_message = &msg,
5461                 .callback_ops = &nfs4_get_lease_time_ops,
5462                 .callback_data = &data,
5463                 .flags = RPC_TASK_TIMEOUT,
5464         };
5465         int status;
5466
5467         nfs41_init_sequence(&args.la_seq_args, &res.lr_seq_res, 0);
5468         dprintk("--> %s\n", __func__);
5469         task = rpc_run_task(&task_setup);
5470
5471         if (IS_ERR(task))
5472                 status = PTR_ERR(task);
5473         else {
5474                 status = task->tk_status;
5475                 rpc_put_task(task);
5476         }
5477         dprintk("<-- %s return %d\n", __func__, status);
5478
5479         return status;
5480 }
5481
5482 static struct nfs4_slot *nfs4_alloc_slots(u32 max_slots, gfp_t gfp_flags)
5483 {
5484         return kcalloc(max_slots, sizeof(struct nfs4_slot), gfp_flags);
5485 }
5486
5487 static void nfs4_add_and_init_slots(struct nfs4_slot_table *tbl,
5488                 struct nfs4_slot *new,
5489                 u32 max_slots,
5490                 u32 ivalue)
5491 {
5492         struct nfs4_slot *old = NULL;
5493         u32 i;
5494
5495         spin_lock(&tbl->slot_tbl_lock);
5496         if (new) {
5497                 old = tbl->slots;
5498                 tbl->slots = new;
5499                 tbl->max_slots = max_slots;
5500         }
5501         tbl->highest_used_slotid = -1;  /* no slot is currently used */
5502         for (i = 0; i < tbl->max_slots; i++)
5503                 tbl->slots[i].seq_nr = ivalue;
5504         spin_unlock(&tbl->slot_tbl_lock);
5505         kfree(old);
5506 }
5507
5508 /*
5509  * (re)Initialise a slot table
5510  */
5511 static int nfs4_realloc_slot_table(struct nfs4_slot_table *tbl, u32 max_reqs,
5512                                  u32 ivalue)
5513 {
5514         struct nfs4_slot *new = NULL;
5515         int ret = -ENOMEM;
5516
5517         dprintk("--> %s: max_reqs=%u, tbl->max_slots %d\n", __func__,
5518                 max_reqs, tbl->max_slots);
5519
5520         /* Does the newly negotiated max_reqs match the existing slot table? */
5521         if (max_reqs != tbl->max_slots) {
5522                 new = nfs4_alloc_slots(max_reqs, GFP_NOFS);
5523                 if (!new)
5524                         goto out;
5525         }
5526         ret = 0;
5527
5528         nfs4_add_and_init_slots(tbl, new, max_reqs, ivalue);
5529         dprintk("%s: tbl=%p slots=%p max_slots=%d\n", __func__,
5530                 tbl, tbl->slots, tbl->max_slots);
5531 out:
5532         dprintk("<-- %s: return %d\n", __func__, ret);
5533         return ret;
5534 }
5535
5536 /* Destroy the slot table */
5537 static void nfs4_destroy_slot_tables(struct nfs4_session *session)
5538 {
5539         if (session->fc_slot_table.slots != NULL) {
5540                 kfree(session->fc_slot_table.slots);
5541                 session->fc_slot_table.slots = NULL;
5542         }
5543         if (session->bc_slot_table.slots != NULL) {
5544                 kfree(session->bc_slot_table.slots);
5545                 session->bc_slot_table.slots = NULL;
5546         }
5547         return;
5548 }
5549
5550 /*
5551  * Initialize or reset the forechannel and backchannel tables
5552  */
5553 static int nfs4_setup_session_slot_tables(struct nfs4_session *ses)
5554 {
5555         struct nfs4_slot_table *tbl;
5556         int status;
5557
5558         dprintk("--> %s\n", __func__);
5559         /* Fore channel */
5560         tbl = &ses->fc_slot_table;
5561         status = nfs4_realloc_slot_table(tbl, ses->fc_attrs.max_reqs, 1);
5562         if (status) /* -ENOMEM */
5563                 return status;
5564         /* Back channel */
5565         tbl = &ses->bc_slot_table;
5566         status = nfs4_realloc_slot_table(tbl, ses->bc_attrs.max_reqs, 0);
5567         if (status && tbl->slots == NULL)
5568                 /* Fore and back channel share a connection so get
5569                  * both slot tables or neither */
5570                 nfs4_destroy_slot_tables(ses);
5571         return status;
5572 }
5573
5574 struct nfs4_session *nfs4_alloc_session(struct nfs_client *clp)
5575 {
5576         struct nfs4_session *session;
5577         struct nfs4_slot_table *tbl;
5578
5579         session = kzalloc(sizeof(struct nfs4_session), GFP_NOFS);
5580         if (!session)
5581                 return NULL;
5582
5583         tbl = &session->fc_slot_table;
5584         tbl->highest_used_slotid = NFS4_NO_SLOT;
5585         spin_lock_init(&tbl->slot_tbl_lock);
5586         rpc_init_priority_wait_queue(&tbl->slot_tbl_waitq, "ForeChannel Slot table");
5587         init_completion(&tbl->complete);
5588
5589         tbl = &session->bc_slot_table;
5590         tbl->highest_used_slotid = NFS4_NO_SLOT;
5591         spin_lock_init(&tbl->slot_tbl_lock);
5592         rpc_init_wait_queue(&tbl->slot_tbl_waitq, "BackChannel Slot table");
5593         init_completion(&tbl->complete);
5594
5595         session->session_state = 1<<NFS4_SESSION_INITING;
5596
5597         session->clp = clp;
5598         return session;
5599 }
5600
5601 void nfs4_destroy_session(struct nfs4_session *session)
5602 {
5603         struct rpc_xprt *xprt;
5604         struct rpc_cred *cred;
5605
5606         cred = nfs4_get_exchange_id_cred(session->clp);
5607         nfs4_proc_destroy_session(session, cred);
5608         if (cred)
5609                 put_rpccred(cred);
5610
5611         rcu_read_lock();
5612         xprt = rcu_dereference(session->clp->cl_rpcclient->cl_xprt);
5613         rcu_read_unlock();
5614         dprintk("%s Destroy backchannel for xprt %p\n",
5615                 __func__, xprt);
5616         xprt_destroy_backchannel(xprt, NFS41_BC_MIN_CALLBACKS);
5617         nfs4_destroy_slot_tables(session);
5618         kfree(session);
5619 }
5620
5621 /*
5622  * Initialize the values to be used by the client in CREATE_SESSION
5623  * If nfs4_init_session set the fore channel request and response sizes,
5624  * use them.
5625  *
5626  * Set the back channel max_resp_sz_cached to zero to force the client to
5627  * always set csa_cachethis to FALSE because the current implementation
5628  * of the back channel DRC only supports caching the CB_SEQUENCE operation.
5629  */
5630 static void nfs4_init_channel_attrs(struct nfs41_create_session_args *args)
5631 {
5632         struct nfs4_session *session = args->client->cl_session;
5633         unsigned int mxrqst_sz = session->fc_attrs.max_rqst_sz,
5634                      mxresp_sz = session->fc_attrs.max_resp_sz;
5635
5636         if (mxrqst_sz == 0)
5637                 mxrqst_sz = NFS_MAX_FILE_IO_SIZE;
5638         if (mxresp_sz == 0)
5639                 mxresp_sz = NFS_MAX_FILE_IO_SIZE;
5640         /* Fore channel attributes */
5641         args->fc_attrs.max_rqst_sz = mxrqst_sz;
5642         args->fc_attrs.max_resp_sz = mxresp_sz;
5643         args->fc_attrs.max_ops = NFS4_MAX_OPS;
5644         args->fc_attrs.max_reqs = max_session_slots;
5645
5646         dprintk("%s: Fore Channel : max_rqst_sz=%u max_resp_sz=%u "
5647                 "max_ops=%u max_reqs=%u\n",
5648                 __func__,
5649                 args->fc_attrs.max_rqst_sz, args->fc_attrs.max_resp_sz,
5650                 args->fc_attrs.max_ops, args->fc_attrs.max_reqs);
5651
5652         /* Back channel attributes */
5653         args->bc_attrs.max_rqst_sz = PAGE_SIZE;
5654         args->bc_attrs.max_resp_sz = PAGE_SIZE;
5655         args->bc_attrs.max_resp_sz_cached = 0;
5656         args->bc_attrs.max_ops = NFS4_MAX_BACK_CHANNEL_OPS;
5657         args->bc_attrs.max_reqs = 1;
5658
5659         dprintk("%s: Back Channel : max_rqst_sz=%u max_resp_sz=%u "
5660                 "max_resp_sz_cached=%u max_ops=%u max_reqs=%u\n",
5661                 __func__,
5662                 args->bc_attrs.max_rqst_sz, args->bc_attrs.max_resp_sz,
5663                 args->bc_attrs.max_resp_sz_cached, args->bc_attrs.max_ops,
5664                 args->bc_attrs.max_reqs);
5665 }
5666
5667 static int nfs4_verify_fore_channel_attrs(struct nfs41_create_session_args *args, struct nfs4_session *session)
5668 {
5669         struct nfs4_channel_attrs *sent = &args->fc_attrs;
5670         struct nfs4_channel_attrs *rcvd = &session->fc_attrs;
5671
5672         if (rcvd->max_resp_sz > sent->max_resp_sz)
5673                 return -EINVAL;
5674         /*
5675          * Our requested max_ops is the minimum we need; we're not
5676          * prepared to break up compounds into smaller pieces than that.
5677          * So, no point even trying to continue if the server won't
5678          * cooperate:
5679          */
5680         if (rcvd->max_ops < sent->max_ops)
5681                 return -EINVAL;
5682         if (rcvd->max_reqs == 0)
5683                 return -EINVAL;
5684         if (rcvd->max_reqs > NFS4_MAX_SLOT_TABLE)
5685                 rcvd->max_reqs = NFS4_MAX_SLOT_TABLE;
5686         return 0;
5687 }
5688
5689 static int nfs4_verify_back_channel_attrs(struct nfs41_create_session_args *args, struct nfs4_session *session)
5690 {
5691         struct nfs4_channel_attrs *sent = &args->bc_attrs;
5692         struct nfs4_channel_attrs *rcvd = &session->bc_attrs;
5693
5694         if (rcvd->max_rqst_sz > sent->max_rqst_sz)
5695                 return -EINVAL;
5696         if (rcvd->max_resp_sz < sent->max_resp_sz)
5697                 return -EINVAL;
5698         if (rcvd->max_resp_sz_cached > sent->max_resp_sz_cached)
5699                 return -EINVAL;
5700         /* These would render the backchannel useless: */
5701         if (rcvd->max_ops != sent->max_ops)
5702                 return -EINVAL;
5703         if (rcvd->max_reqs != sent->max_reqs)
5704                 return -EINVAL;
5705         return 0;
5706 }
5707
/*
 * Verify the fore channel attributes and, only if those pass, the back
 * channel attributes. Returns the first non-zero result, or 0.
 */
static int nfs4_verify_channel_attrs(struct nfs41_create_session_args *args,
				     struct nfs4_session *session)
{
	int err = nfs4_verify_fore_channel_attrs(args, session);

	if (err == 0)
		err = nfs4_verify_back_channel_attrs(args, session);
	return err;
}
5718
5719 static int _nfs4_proc_create_session(struct nfs_client *clp,
5720                 struct rpc_cred *cred)
5721 {
5722         struct nfs4_session *session = clp->cl_session;
5723         struct nfs41_create_session_args args = {
5724                 .client = clp,
5725                 .cb_program = NFS4_CALLBACK,
5726         };
5727         struct nfs41_create_session_res res = {
5728                 .client = clp,
5729         };
5730         struct rpc_message msg = {
5731                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_CREATE_SESSION],
5732                 .rpc_argp = &args,
5733                 .rpc_resp = &res,
5734                 .rpc_cred = cred,
5735         };
5736         int status;
5737
5738         nfs4_init_channel_attrs(&args);
5739         args.flags = (SESSION4_PERSIST | SESSION4_BACK_CHAN);
5740
5741         status = rpc_call_sync(session->clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
5742
5743         if (!status)
5744                 /* Verify the session's negotiated channel_attrs values */
5745                 status = nfs4_verify_channel_attrs(&args, session);
5746         if (!status) {
5747                 /* Increment the clientid slot sequence id */
5748                 clp->cl_seqid++;
5749         }
5750
5751         return status;
5752 }
5753
5754 /*
5755  * Issues a CREATE_SESSION operation to the server.
5756  * It is the responsibility of the caller to verify the session is
5757  * expired before calling this routine.
5758  */
5759 int nfs4_proc_create_session(struct nfs_client *clp, struct rpc_cred *cred)
5760 {
5761         int status;
5762         unsigned *ptr;
5763         struct nfs4_session *session = clp->cl_session;
5764
5765         dprintk("--> %s clp=%p session=%p\n", __func__, clp, session);
5766
5767         status = _nfs4_proc_create_session(clp, cred);
5768         if (status)
5769                 goto out;
5770
5771         /* Init or reset the session slot tables */
5772         status = nfs4_setup_session_slot_tables(session);
5773         dprintk("slot table setup returned %d\n", status);
5774         if (status)
5775                 goto out;
5776
5777         ptr = (unsigned *)&session->sess_id.data[0];
5778         dprintk("%s client>seqid %d sessionid %u:%u:%u:%u\n", __func__,
5779                 clp->cl_seqid, ptr[0], ptr[1], ptr[2], ptr[3]);
5780 out:
5781         dprintk("<-- %s\n", __func__);
5782         return status;
5783 }
5784
5785 /*
5786  * Issue the over-the-wire RPC DESTROY_SESSION.
5787  * The caller must serialize access to this routine.
5788  */
5789 int nfs4_proc_destroy_session(struct nfs4_session *session,
5790                 struct rpc_cred *cred)
5791 {
5792         struct rpc_message msg = {
5793                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_DESTROY_SESSION],
5794                 .rpc_argp = session,
5795                 .rpc_cred = cred,
5796         };
5797         int status = 0;
5798
5799         dprintk("--> nfs4_proc_destroy_session\n");
5800
5801         /* session is still being setup */
5802         if (session->clp->cl_cons_state != NFS_CS_READY)
5803                 return status;
5804
5805         status = rpc_call_sync(session->clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
5806
5807         if (status)
5808                 dprintk("NFS: Got error %d from the server on DESTROY_SESSION. "
5809                         "Session has been destroyed regardless...\n", status);
5810
5811         dprintk("<-- nfs4_proc_destroy_session\n");
5812         return status;
5813 }
5814
5815 /*
5816  * With sessions, the client is not marked ready until after a
5817  * successful EXCHANGE_ID and CREATE_SESSION.
5818  *
5819  * Map errors cl_cons_state errors to EPROTONOSUPPORT to indicate
5820  * other versions of NFS can be tried.
5821  */
5822 static int nfs41_check_session_ready(struct nfs_client *clp)
5823 {
5824         int ret;
5825         
5826         if (clp->cl_cons_state == NFS_CS_SESSION_INITING) {
5827                 ret = nfs4_client_recover_expired_lease(clp);
5828                 if (ret)
5829                         return ret;
5830         }
5831         if (clp->cl_cons_state < NFS_CS_READY)
5832                 return -EPROTONOSUPPORT;
5833         smp_rmb();
5834         return 0;
5835 }
5836
5837 int nfs4_init_session(struct nfs_server *server)
5838 {
5839         struct nfs_client *clp = server->nfs_client;
5840         struct nfs4_session *session;
5841         unsigned int rsize, wsize;
5842
5843         if (!nfs4_has_session(clp))
5844                 return 0;
5845
5846         session = clp->cl_session;
5847         spin_lock(&clp->cl_lock);
5848         if (test_and_clear_bit(NFS4_SESSION_INITING, &session->session_state)) {
5849
5850                 rsize = server->rsize;
5851                 if (rsize == 0)
5852                         rsize = NFS_MAX_FILE_IO_SIZE;
5853                 wsize = server->wsize;
5854                 if (wsize == 0)
5855                         wsize = NFS_MAX_FILE_IO_SIZE;
5856
5857                 session->fc_attrs.max_rqst_sz = wsize + nfs41_maxwrite_overhead;
5858                 session->fc_attrs.max_resp_sz = rsize + nfs41_maxread_overhead;
5859         }
5860         spin_unlock(&clp->cl_lock);
5861
5862         return nfs41_check_session_ready(clp);
5863 }
5864
5865 int nfs4_init_ds_session(struct nfs_client *clp, unsigned long lease_time)
5866 {
5867         struct nfs4_session *session = clp->cl_session;
5868         int ret;
5869
5870         spin_lock(&clp->cl_lock);
5871         if (test_and_clear_bit(NFS4_SESSION_INITING, &session->session_state)) {
5872                 /*
5873                  * Do not set NFS_CS_CHECK_LEASE_TIME instead set the
5874                  * DS lease to be equal to the MDS lease.
5875                  */
5876                 clp->cl_lease_time = lease_time;
5877                 clp->cl_last_renewal = jiffies;
5878         }
5879         spin_unlock(&clp->cl_lock);
5880
5881         ret = nfs41_check_session_ready(clp);
5882         if (ret)
5883                 return ret;
5884         /* Test for the DS role */
5885         if (!is_ds_client(clp))
5886                 return -ENODEV;
5887         return 0;
5888 }
5889 EXPORT_SYMBOL_GPL(nfs4_init_ds_session);
5890
5891
5892 /*
5893  * Renew the cl_session lease.
5894  */
5895 struct nfs4_sequence_data { /* callback data of the SEQUENCE task built by _nfs41_proc_sequence() */
5896         struct nfs_client *clp; /* client referenced for the task; put in nfs41_sequence_release() */
5897         struct nfs4_sequence_args args; /* passed to the RPC as rpc_argp */
5898         struct nfs4_sequence_res res; /* passed to the RPC as rpc_resp */
5899 };
5900
5901 static void nfs41_sequence_release(void *data)
5902 {
5903         struct nfs4_sequence_data *calldata = data;
5904         struct nfs_client *clp = calldata->clp;
5905
5906         if (atomic_read(&clp->cl_count) > 1)
5907                 nfs4_schedule_state_renewal(clp);
5908         nfs_put_client(clp);
5909         kfree(calldata);
5910 }
5911
5912 static int nfs41_sequence_handle_errors(struct rpc_task *task, struct nfs_client *clp)
5913 {
5914         switch(task->tk_status) {
5915         case -NFS4ERR_DELAY:
5916                 rpc_delay(task, NFS4_POLL_RETRY_MAX);
5917                 return -EAGAIN;
5918         default:
5919                 nfs4_schedule_lease_recovery(clp);
5920         }
5921         return 0;
5922 }
5923
5924 static void nfs41_sequence_call_done(struct rpc_task *task, void *data)
5925 {
5926         struct nfs4_sequence_data *calldata = data;
5927         struct nfs_client *clp = calldata->clp;
5928
5929         if (!nfs41_sequence_done(task, task->tk_msg.rpc_resp))
5930                 return;
5931
5932         if (task->tk_status < 0) {
5933                 dprintk("%s ERROR %d\n", __func__, task->tk_status);
5934                 if (atomic_read(&clp->cl_count) == 1)
5935                         goto out;
5936
5937                 if (nfs41_sequence_handle_errors(task, clp) == -EAGAIN) {
5938                         rpc_restart_call_prepare(task);
5939                         return;
5940                 }
5941         }
5942         dprintk("%s rpc_cred %p\n", __func__, task->tk_msg.rpc_cred);
5943 out:
5944         dprintk("<-- %s\n", __func__);
5945 }
5946
5947 static void nfs41_sequence_prepare(struct rpc_task *task, void *data)
5948 {
5949         struct nfs4_sequence_data *calldata = data;
5950         struct nfs_client *clp = calldata->clp;
5951         struct nfs4_sequence_args *args;
5952         struct nfs4_sequence_res *res;
5953
5954         args = task->tk_msg.rpc_argp;
5955         res = task->tk_msg.rpc_resp;
5956
5957         if (nfs41_setup_sequence(clp->cl_session, args, res, task))
5958                 return;
5959         rpc_call_start(task);
5960 }
5961
5962 static const struct rpc_call_ops nfs41_sequence_ops = {
5963         .rpc_call_done = nfs41_sequence_call_done,
5964         .rpc_call_prepare = nfs41_sequence_prepare,
5965         .rpc_release = nfs41_sequence_release,
5966 };
5967
5968 static struct rpc_task *_nfs41_proc_sequence(struct nfs_client *clp, struct rpc_cred *cred)
5969 {
5970         struct nfs4_sequence_data *calldata;
5971         struct rpc_message msg = {
5972                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SEQUENCE],
5973                 .rpc_cred = cred,
5974         };
5975         struct rpc_task_setup task_setup_data = {
5976                 .rpc_client = clp->cl_rpcclient,
5977                 .rpc_message = &msg,
5978                 .callback_ops = &nfs41_sequence_ops,
5979                 .flags = RPC_TASK_ASYNC | RPC_TASK_SOFT,
5980         };
5981
5982         if (!atomic_inc_not_zero(&clp->cl_count))
5983                 return ERR_PTR(-EIO);
5984         calldata = kzalloc(sizeof(*calldata), GFP_NOFS);
5985         if (calldata == NULL) {
5986                 nfs_put_client(clp);
5987                 return ERR_PTR(-ENOMEM);
5988         }
5989         nfs41_init_sequence(&calldata->args, &calldata->res, 0);
5990         msg.rpc_argp = &calldata->args;
5991         msg.rpc_resp = &calldata->res;
5992         calldata->clp = clp;
5993         task_setup_data.callback_data = calldata;
5994
5995         return rpc_run_task(&task_setup_data);
5996 }
5997
5998 static int nfs41_proc_async_sequence(struct nfs_client *clp, struct rpc_cred *cred, unsigned renew_flags)
5999 {
6000         struct rpc_task *task;
6001         int ret = 0;
6002
6003         if ((renew_flags & NFS4_RENEW_TIMEOUT) == 0)
6004                 return 0;
6005         task = _nfs41_proc_sequence(clp, cred);
6006         if (IS_ERR(task))
6007                 ret = PTR_ERR(task);
6008         else
6009                 rpc_put_task_async(task);
6010         dprintk("<-- %s status=%d\n", __func__, ret);
6011         return ret;
6012 }
6013
6014 static int nfs4_proc_sequence(struct nfs_client *clp, struct rpc_cred *cred)
6015 {
6016         struct rpc_task *task;
6017         int ret;
6018
6019         task = _nfs41_proc_sequence(clp, cred);
6020         if (IS_ERR(task)) {
6021                 ret = PTR_ERR(task);
6022                 goto out;
6023         }
6024         ret = rpc_wait_for_completion_task(task);
6025         if (!ret) {
6026                 struct nfs4_sequence_res *res = task->tk_msg.rpc_resp;
6027
6028                 if (task->tk_status == 0)
6029                         nfs41_handle_sequence_flag_errors(clp, res->sr_status_flags);
6030                 ret = task->tk_status;
6031         }
6032         rpc_put_task(task);
6033 out:
6034         dprintk("<-- %s status=%d\n", __func__, ret);
6035         return ret;
6036 }
6037
6038 struct nfs4_reclaim_complete_data { /* callback data of the RECLAIM_COMPLETE task */
6039         struct nfs_client *clp; /* client whose session the call is sequenced on */
6040         struct nfs41_reclaim_complete_args arg; /* passed to the RPC as rpc_argp */
6041         struct nfs41_reclaim_complete_res res; /* passed to the RPC as rpc_resp */
6042 };
6043
6044 static void nfs4_reclaim_complete_prepare(struct rpc_task *task, void *data)
6045 {
6046         struct nfs4_reclaim_complete_data *calldata = data;
6047
6048         rpc_task_set_priority(task, RPC_PRIORITY_PRIVILEGED);
6049         if (nfs41_setup_sequence(calldata->clp->cl_session,
6050                                 &calldata->arg.seq_args,
6051                                 &calldata->res.seq_res, task))
6052                 return;
6053
6054         rpc_call_start(task);
6055 }
6056
6057 static int nfs41_reclaim_complete_handle_errors(struct rpc_task *task, struct nfs_client *clp)
6058 {
6059         switch(task->tk_status) {
6060         case 0:
6061         case -NFS4ERR_COMPLETE_ALREADY:
6062         case -NFS4ERR_WRONG_CRED: /* What to do here? */
6063                 break;
6064         case -NFS4ERR_DELAY:
6065                 rpc_delay(task, NFS4_POLL_RETRY_MAX);
6066                 /* fall through */
6067         case -NFS4ERR_RETRY_UNCACHED_REP:
6068                 return -EAGAIN;
6069         default:
6070                 nfs4_schedule_lease_recovery(clp);
6071         }
6072         return 0;
6073 }
6074
6075 static void nfs4_reclaim_complete_done(struct rpc_task *task, void *data)
6076 {
6077         struct nfs4_reclaim_complete_data *calldata = data;
6078         struct nfs_client *clp = calldata->clp;
6079         struct nfs4_sequence_res *res = &calldata->res.seq_res;
6080
6081         dprintk("--> %s\n", __func__);
6082         if (!nfs41_sequence_done(task, res))
6083                 return;
6084
6085         if (nfs41_reclaim_complete_handle_errors(task, clp) == -EAGAIN) {
6086                 rpc_restart_call_prepare(task);
6087                 return;
6088         }
6089         dprintk("<-- %s\n", __func__);
6090 }
6091
/* rpc_release callback of RECLAIM_COMPLETE: free the call data */
static void nfs4_free_reclaim_complete_data(void *data)
{
	struct nfs4_reclaim_complete_data *rc = data;

	kfree(rc);
}
6098
6099 static const struct rpc_call_ops nfs4_reclaim_complete_call_ops = {
6100         .rpc_call_prepare = nfs4_reclaim_complete_prepare,
6101         .rpc_call_done = nfs4_reclaim_complete_done,
6102         .rpc_release = nfs4_free_reclaim_complete_data,
6103 };
6104
6105 /*
6106  * Issue a global reclaim complete.
6107  */
6108 static int nfs41_proc_reclaim_complete(struct nfs_client *clp)
6109 {
6110         struct nfs4_reclaim_complete_data *calldata;
6111         struct rpc_task *task;
6112         struct rpc_message msg = {
6113                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_RECLAIM_COMPLETE],
6114         };
6115         struct rpc_task_setup task_setup_data = {
6116                 .rpc_client = clp->cl_rpcclient,
6117                 .rpc_message = &msg,
6118                 .callback_ops = &nfs4_reclaim_complete_call_ops,
6119                 .flags = RPC_TASK_ASYNC,
6120         };
6121         int status = -ENOMEM;
6122
6123         dprintk("--> %s\n", __func__);
6124         calldata = kzalloc(sizeof(*calldata), GFP_NOFS);
6125         if (calldata == NULL)
6126                 goto out;
6127         calldata->clp = clp;
6128         calldata->arg.one_fs = 0;
6129
6130         nfs41_init_sequence(&calldata->arg.seq_args, &calldata->res.seq_res, 0);
6131         msg.rpc_argp = &calldata->arg;
6132         msg.rpc_resp = &calldata->res;
6133         task_setup_data.callback_data = calldata;
6134         task = rpc_run_task(&task_setup_data);
6135         if (IS_ERR(task)) {
6136                 status = PTR_ERR(task);
6137                 goto out;
6138         }
6139         status = nfs4_wait_for_completion_rpc_task(task);
6140         if (status == 0)
6141                 status = task->tk_status;
6142         rpc_put_task(task);
6143         return 0;
6144 out:
6145         dprintk("<-- %s status=%d\n", __func__, status);
6146         return status;
6147 }
6148
6149 static void
6150 nfs4_layoutget_prepare(struct rpc_task *task, void *calldata)
6151 {
6152         struct nfs4_layoutget *lgp = calldata;
6153         struct nfs_server *server = NFS_SERVER(lgp->args.inode);
6154
6155         dprintk("--> %s\n", __func__);
6156         /* Note the is a race here, where a CB_LAYOUTRECALL can come in
6157          * right now covering the LAYOUTGET we are about to send.
6158          * However, that is not so catastrophic, and there seems
6159          * to be no way to prevent it completely.
6160          */
6161         if (nfs4_setup_sequence(server, &lgp->args.seq_args,
6162                                 &lgp->res.seq_res, task))
6163                 return;
6164         if (pnfs_choose_layoutget_stateid(&lgp->args.stateid,
6165                                           NFS_I(lgp->args.inode)->layout,
6166                                           lgp->args.ctx->state)) {
6167                 rpc_exit(task, NFS4_OK);
6168                 return;
6169         }
6170         rpc_call_start(task);
6171 }
6172
6173 static void nfs4_layoutget_done(struct rpc_task *task, void *calldata)
6174 {
6175         struct nfs4_layoutget *lgp = calldata;
6176         struct nfs_server *server = NFS_SERVER(lgp->args.inode);
6177
6178         dprintk("--> %s\n", __func__);
6179
6180         if (!nfs4_sequence_done(task, &lgp->res.seq_res))
6181                 return;
6182
6183         switch (task->tk_status) {
6184         case 0:
6185                 break;
6186         case -NFS4ERR_LAYOUTTRYLATER:
6187         case -NFS4ERR_RECALLCONFLICT:
6188                 task->tk_status = -NFS4ERR_DELAY;
6189                 /* Fall through */
6190         default:
6191                 if (nfs4_async_handle_error(task, server, NULL) == -EAGAIN) {
6192                         rpc_restart_call_prepare(task);
6193                         return;
6194                 }
6195         }
6196         dprintk("<-- %s\n", __func__);
6197 }
6198
6199 static void nfs4_layoutget_release(void *calldata)
6200 {
6201         struct nfs4_layoutget *lgp = calldata;
6202
6203         dprintk("--> %s\n", __func__);
6204         put_nfs_open_context(lgp->args.ctx);
6205         kfree(calldata);
6206         dprintk("<-- %s\n", __func__);
6207 }
6208
6209 static const struct rpc_call_ops nfs4_layoutget_call_ops = {
6210         .rpc_call_prepare = nfs4_layoutget_prepare,
6211         .rpc_call_done = nfs4_layoutget_done,
6212         .rpc_release = nfs4_layoutget_release,
6213 };
6214
6215 int nfs4_proc_layoutget(struct nfs4_layoutget *lgp)
6216 {
6217         struct nfs_server *server = NFS_SERVER(lgp->args.inode);
6218         struct rpc_task *task;
6219         struct rpc_message msg = {
6220                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LAYOUTGET],
6221                 .rpc_argp = &lgp->args,
6222                 .rpc_resp = &lgp->res,
6223         };
6224         struct rpc_task_setup task_setup_data = {
6225                 .rpc_client = server->client,
6226                 .rpc_message = &msg,
6227                 .callback_ops = &nfs4_layoutget_call_ops,
6228                 .callback_data = lgp,
6229                 .flags = RPC_TASK_ASYNC,
6230         };
6231         int status = 0;
6232
6233         dprintk("--> %s\n", __func__);
6234
6235         lgp->res.layoutp = &lgp->args.layout;
6236         lgp->res.seq_res.sr_slot = NULL;
6237         nfs41_init_sequence(&lgp->args.seq_args, &lgp->res.seq_res, 0);
6238         task = rpc_run_task(&task_setup_data);
6239         if (IS_ERR(task))
6240                 return PTR_ERR(task);
6241         status = nfs4_wait_for_completion_rpc_task(task);
6242         if (status == 0)
6243                 status = task->tk_status;
6244         if (status == 0)
6245                 status = pnfs_layout_process(lgp);
6246         rpc_put_task(task);
6247         dprintk("<-- %s status=%d\n", __func__, status);
6248         return status;
6249 }
6250
6251 static void
6252 nfs4_layoutreturn_prepare(struct rpc_task *task, void *calldata)
6253 {
6254         struct nfs4_layoutreturn *lrp = calldata;
6255
6256         dprintk("--> %s\n", __func__);
6257         if (nfs41_setup_sequence(lrp->clp->cl_session, &lrp->args.seq_args,
6258                                 &lrp->res.seq_res, task))
6259                 return;
6260         rpc_call_start(task);
6261 }
6262
6263 static void nfs4_layoutreturn_done(struct rpc_task *task, void *calldata)
6264 {
6265         struct nfs4_layoutreturn *lrp = calldata;
6266         struct nfs_server *server;
6267         struct pnfs_layout_hdr *lo = lrp->args.layout;
6268
6269         dprintk("--> %s\n", __func__);
6270
6271         if (!nfs4_sequence_done(task, &lrp->res.seq_res))
6272                 return;
6273
6274         server = NFS_SERVER(lrp->args.inode);
6275         if (nfs4_async_handle_error(task, server, NULL) == -EAGAIN) {
6276                 rpc_restart_call_prepare(task);
6277                 return;
6278         }
6279         spin_lock(&lo->plh_inode->i_lock);
6280         if (task->tk_status == 0) {
6281                 if (lrp->res.lrs_present) {
6282                         pnfs_set_layout_stateid(lo, &lrp->res.stateid, true);
6283                 } else
6284                         BUG_ON(!list_empty(&lo->plh_segs));
6285         }
6286         lo->plh_block_lgets--;
6287         spin_unlock(&lo->plh_inode->i_lock);
6288         dprintk("<-- %s\n", __func__);
6289 }
6290
6291 static void nfs4_layoutreturn_release(void *calldata)
6292 {
6293         struct nfs4_layoutreturn *lrp = calldata;
6294
6295         dprintk("--> %s\n", __func__);
6296         put_layout_hdr(lrp->args.layout);
6297         kfree(calldata);
6298         dprintk("<-- %s\n", __func__);
6299 }
6300
6301 static const struct rpc_call_ops nfs4_layoutreturn_call_ops = {
6302         .rpc_call_prepare = nfs4_layoutreturn_prepare,
6303         .rpc_call_done = nfs4_layoutreturn_done,
6304         .rpc_release = nfs4_layoutreturn_release,
6305 };
6306
6307 int nfs4_proc_layoutreturn(struct nfs4_layoutreturn *lrp)
6308 {
6309         struct rpc_task *task;
6310         struct rpc_message msg = {
6311                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LAYOUTRETURN],
6312                 .rpc_argp = &lrp->args,
6313                 .rpc_resp = &lrp->res,
6314         };
6315         struct rpc_task_setup task_setup_data = {
6316                 .rpc_client = lrp->clp->cl_rpcclient,
6317                 .rpc_message = &msg,
6318                 .callback_ops = &nfs4_layoutreturn_call_ops,
6319                 .callback_data = lrp,
6320         };
6321         int status;
6322
6323         dprintk("--> %s\n", __func__);
6324         nfs41_init_sequence(&lrp->args.seq_args, &lrp->res.seq_res, 1);
6325         task = rpc_run_task(&task_setup_data);
6326         if (IS_ERR(task))
6327                 return PTR_ERR(task);
6328         status = task->tk_status;
6329         dprintk("<-- %s status=%d\n", __func__, status);
6330         rpc_put_task(task);
6331         return status;
6332 }
6333
6334 /*
6335  * Retrieve the list of Data Server devices from the MDS.
6336  */
6337 static int _nfs4_getdevicelist(struct nfs_server *server,
6338                                     const struct nfs_fh *fh,
6339                                     struct pnfs_devicelist *devlist)
6340 {
6341         struct nfs4_getdevicelist_args args = {
6342                 .fh = fh,
6343                 .layoutclass = server->pnfs_curr_ld->id,
6344         };
6345         struct nfs4_getdevicelist_res res = {
6346                 .devlist = devlist,
6347         };
6348         struct rpc_message msg = {
6349                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_GETDEVICELIST],
6350                 .rpc_argp = &args,
6351                 .rpc_resp = &res,
6352         };
6353         int status;
6354
6355         dprintk("--> %s\n", __func__);
6356         status = nfs4_call_sync(server->client, server, &msg, &args.seq_args,
6357                                 &res.seq_res, 0);
6358         dprintk("<-- %s status=%d\n", __func__, status);
6359         return status;
6360 }
6361
6362 int nfs4_proc_getdevicelist(struct nfs_server *server,
6363                             const struct nfs_fh *fh,
6364                             struct pnfs_devicelist *devlist)
6365 {
6366         struct nfs4_exception exception = { };
6367         int err;
6368
6369         do {
6370                 err = nfs4_handle_exception(server,
6371                                 _nfs4_getdevicelist(server, fh, devlist),
6372                                 &exception);
6373         } while (exception.retry);
6374
6375         dprintk("%s: err=%d, num_devs=%u\n", __func__,
6376                 err, devlist->num_devs);
6377
6378         return err;
6379 }
6380 EXPORT_SYMBOL_GPL(nfs4_proc_getdevicelist);
6381
6382 static int
6383 _nfs4_proc_getdeviceinfo(struct nfs_server *server, struct pnfs_device *pdev)
6384 {
6385         struct nfs4_getdeviceinfo_args args = {
6386                 .pdev = pdev,
6387         };
6388         struct nfs4_getdeviceinfo_res res = {
6389                 .pdev = pdev,
6390         };
6391         struct rpc_message msg = {
6392                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_GETDEVICEINFO],
6393                 .rpc_argp = &args,
6394                 .rpc_resp = &res,
6395         };
6396         int status;
6397
6398         dprintk("--> %s\n", __func__);
6399         status = nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
6400         dprintk("<-- %s status=%d\n", __func__, status);
6401
6402         return status;
6403 }
6404
6405 int nfs4_proc_getdeviceinfo(struct nfs_server *server, struct pnfs_device *pdev)
6406 {
6407         struct nfs4_exception exception = { };
6408         int err;
6409
6410         do {
6411                 err = nfs4_handle_exception(server,
6412                                         _nfs4_proc_getdeviceinfo(server, pdev),
6413                                         &exception);
6414         } while (exception.retry);
6415         return err;
6416 }
6417 EXPORT_SYMBOL_GPL(nfs4_proc_getdeviceinfo);
6418
6419 static void nfs4_layoutcommit_prepare(struct rpc_task *task, void *calldata)
6420 {
6421         struct nfs4_layoutcommit_data *data = calldata;
6422         struct nfs_server *server = NFS_SERVER(data->args.inode);
6423
6424         if (nfs4_setup_sequence(server, &data->args.seq_args,
6425                                 &data->res.seq_res, task))
6426                 return;
6427         rpc_call_start(task);
6428 }
6429
6430 static void
6431 nfs4_layoutcommit_done(struct rpc_task *task, void *calldata)
6432 {
6433         struct nfs4_layoutcommit_data *data = calldata;
6434         struct nfs_server *server = NFS_SERVER(data->args.inode);
6435
6436         if (!nfs4_sequence_done(task, &data->res.seq_res))
6437                 return;
6438
6439         switch (task->tk_status) { /* Just ignore these failures */
6440         case -NFS4ERR_DELEG_REVOKED: /* layout was recalled */
6441         case -NFS4ERR_BADIOMODE:     /* no IOMODE_RW layout for range */
6442         case -NFS4ERR_BADLAYOUT:     /* no layout */
6443         case -NFS4ERR_GRACE:        /* loca_recalim always false */
6444                 task->tk_status = 0;
6445                 break;
6446         case 0:
6447                 nfs_post_op_update_inode_force_wcc(data->args.inode,
6448                                                    data->res.fattr);
6449                 break;
6450         default:
6451                 if (nfs4_async_handle_error(task, server, NULL) == -EAGAIN) {
6452                         rpc_restart_call_prepare(task);
6453                         return;
6454                 }
6455         }
6456 }
6457
6458 static void nfs4_layoutcommit_release(void *calldata)
6459 {
6460         struct nfs4_layoutcommit_data *data = calldata;
6461         struct pnfs_layout_segment *lseg, *tmp;
6462         unsigned long *bitlock = &NFS_I(data->args.inode)->flags;
6463
6464         pnfs_cleanup_layoutcommit(data);
6465         /* Matched by references in pnfs_set_layoutcommit */
6466         list_for_each_entry_safe(lseg, tmp, &data->lseg_list, pls_lc_list) {
6467                 list_del_init(&lseg->pls_lc_list);
6468                 if (test_and_clear_bit(NFS_LSEG_LAYOUTCOMMIT,
6469                                        &lseg->pls_flags))
6470                         put_lseg(lseg);
6471         }
6472
6473         clear_bit_unlock(NFS_INO_LAYOUTCOMMITTING, bitlock);
6474         smp_mb__after_clear_bit();
6475         wake_up_bit(bitlock, NFS_INO_LAYOUTCOMMITTING);
6476
6477         put_rpccred(data->cred);
6478         kfree(data);
6479 }
6480
6481 static const struct rpc_call_ops nfs4_layoutcommit_ops = {
6482         .rpc_call_prepare = nfs4_layoutcommit_prepare,
6483         .rpc_call_done = nfs4_layoutcommit_done,
6484         .rpc_release = nfs4_layoutcommit_release,
6485 };
6486
6487 int
6488 nfs4_proc_layoutcommit(struct nfs4_layoutcommit_data *data, bool sync)
6489 {
6490         struct rpc_message msg = {
6491                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LAYOUTCOMMIT],
6492                 .rpc_argp = &data->args,
6493                 .rpc_resp = &data->res,
6494                 .rpc_cred = data->cred,
6495         };
6496         struct rpc_task_setup task_setup_data = {
6497                 .task = &data->task,
6498                 .rpc_client = NFS_CLIENT(data->args.inode),
6499                 .rpc_message = &msg,
6500                 .callback_ops = &nfs4_layoutcommit_ops,
6501                 .callback_data = data,
6502                 .flags = RPC_TASK_ASYNC,
6503         };
6504         struct rpc_task *task;
6505         int status = 0;
6506
6507         dprintk("NFS: %4d initiating layoutcommit call. sync %d "
6508                 "lbw: %llu inode %lu\n",
6509                 data->task.tk_pid, sync,
6510                 data->args.lastbytewritten,
6511                 data->args.inode->i_ino);
6512
6513         nfs41_init_sequence(&data->args.seq_args, &data->res.seq_res, 1);
6514         task = rpc_run_task(&task_setup_data);
6515         if (IS_ERR(task))
6516                 return PTR_ERR(task);
6517         if (sync == false)
6518                 goto out;
6519         status = nfs4_wait_for_completion_rpc_task(task);
6520         if (status != 0)
6521                 goto out;
6522         status = task->tk_status;
6523 out:
6524         dprintk("%s: status %d\n", __func__, status);
6525         rpc_put_task(task);
6526         return status;
6527 }
6528
6529 static int
6530 _nfs41_proc_secinfo_no_name(struct nfs_server *server, struct nfs_fh *fhandle,
6531                     struct nfs_fsinfo *info, struct nfs4_secinfo_flavors *flavors)
6532 {
6533         struct nfs41_secinfo_no_name_args args = {
6534                 .style = SECINFO_STYLE_CURRENT_FH,
6535         };
6536         struct nfs4_secinfo_res res = {
6537                 .flavors = flavors,
6538         };
6539         struct rpc_message msg = {
6540                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SECINFO_NO_NAME],
6541                 .rpc_argp = &args,
6542                 .rpc_resp = &res,
6543         };
6544         return nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
6545 }
6546
6547 static int
6548 nfs41_proc_secinfo_no_name(struct nfs_server *server, struct nfs_fh *fhandle,
6549                            struct nfs_fsinfo *info, struct nfs4_secinfo_flavors *flavors)
6550 {
6551         struct nfs4_exception exception = { };
6552         int err;
6553         do {
6554                 err = _nfs41_proc_secinfo_no_name(server, fhandle, info, flavors);
6555                 switch (err) {
6556                 case 0:
6557                 case -NFS4ERR_WRONGSEC:
6558                 case -NFS4ERR_NOTSUPP:
6559                         goto out;
6560                 default:
6561                         err = nfs4_handle_exception(server, err, &exception);
6562                 }
6563         } while (exception.retry);
6564 out:
6565         return err;
6566 }
6567
6568 static int
6569 nfs41_find_root_sec(struct nfs_server *server, struct nfs_fh *fhandle,
6570                     struct nfs_fsinfo *info)
6571 {
6572         int err;
6573         struct page *page;
6574         rpc_authflavor_t flavor;
6575         struct nfs4_secinfo_flavors *flavors;
6576
6577         page = alloc_page(GFP_KERNEL);
6578         if (!page) {
6579                 err = -ENOMEM;
6580                 goto out;
6581         }
6582
6583         flavors = page_address(page);
6584         err = nfs41_proc_secinfo_no_name(server, fhandle, info, flavors);
6585
6586         /*
6587          * Fall back on "guess and check" method if
6588          * the server doesn't support SECINFO_NO_NAME
6589          */
6590         if (err == -NFS4ERR_WRONGSEC || err == -NFS4ERR_NOTSUPP) {
6591                 err = nfs4_find_root_sec(server, fhandle, info);
6592                 goto out_freepage;
6593         }
6594         if (err)
6595                 goto out_freepage;
6596
6597         flavor = nfs_find_best_sec(flavors);
6598         if (err == 0)
6599                 err = nfs4_lookup_root_sec(server, fhandle, info, flavor);
6600
6601 out_freepage:
6602         put_page(page);
6603         if (err == -EACCES)
6604                 return -EPERM;
6605 out:
6606         return err;
6607 }
6608
6609 static int _nfs41_test_stateid(struct nfs_server *server, nfs4_stateid *stateid)
6610 {
6611         int status;
6612         struct nfs41_test_stateid_args args = {
6613                 .stateid = stateid,
6614         };
6615         struct nfs41_test_stateid_res res;
6616         struct rpc_message msg = {
6617                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_TEST_STATEID],
6618                 .rpc_argp = &args,
6619                 .rpc_resp = &res,
6620         };
6621
6622         dprintk("NFS call  test_stateid %p\n", stateid);
6623         nfs41_init_sequence(&args.seq_args, &res.seq_res, 0);
6624         status = nfs4_call_sync_sequence(server->client, server, &msg, &args.seq_args, &res.seq_res, 1);
6625         if (status != NFS_OK) {
6626                 dprintk("NFS reply test_stateid: failed, %d\n", status);
6627                 return status;
6628         }
6629         dprintk("NFS reply test_stateid: succeeded, %d\n", -res.status);
6630         return -res.status;
6631 }
6632
6633 /**
6634  * nfs41_test_stateid - perform a TEST_STATEID operation
6635  *
6636  * @server: server / transport on which to perform the operation
6637  * @stateid: state ID to test
6638  *
6639  * Returns NFS_OK if the server recognizes that "stateid" is valid.
6640  * Otherwise a negative NFS4ERR value is returned if the operation
6641  * failed or the state ID is not currently valid.
6642  */
6643 static int nfs41_test_stateid(struct nfs_server *server, nfs4_stateid *stateid)
6644 {
6645         struct nfs4_exception exception = { };
6646         int err;
6647         do {
6648                 err = _nfs41_test_stateid(server, stateid);
6649                 if (err != -NFS4ERR_DELAY)
6650                         break;
6651                 nfs4_handle_exception(server, err, &exception);
6652         } while (exception.retry);
6653         return err;
6654 }
6655
6656 static int _nfs4_free_stateid(struct nfs_server *server, nfs4_stateid *stateid)
6657 {
6658         struct nfs41_free_stateid_args args = {
6659                 .stateid = stateid,
6660         };
6661         struct nfs41_free_stateid_res res;
6662         struct rpc_message msg = {
6663                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_FREE_STATEID],
6664                 .rpc_argp = &args,
6665                 .rpc_resp = &res,
6666         };
6667         int status;
6668
6669         dprintk("NFS call  free_stateid %p\n", stateid);
6670         nfs41_init_sequence(&args.seq_args, &res.seq_res, 0);
6671         status = nfs4_call_sync_sequence(server->client, server, &msg,
6672                                          &args.seq_args, &res.seq_res, 1);
6673         dprintk("NFS reply free_stateid: %d\n", status);
6674         return status;
6675 }
6676
6677 /**
6678  * nfs41_free_stateid - perform a FREE_STATEID operation
6679  *
6680  * @server: server / transport on which to perform the operation
6681  * @stateid: state ID to release
6682  *
6683  * Returns NFS_OK if the server freed "stateid".  Otherwise a
6684  * negative NFS4ERR value is returned.
6685  */
6686 static int nfs41_free_stateid(struct nfs_server *server, nfs4_stateid *stateid)
6687 {
6688         struct nfs4_exception exception = { };
6689         int err;
6690         do {
6691                 err = _nfs4_free_stateid(server, stateid);
6692                 if (err != -NFS4ERR_DELAY)
6693                         break;
6694                 nfs4_handle_exception(server, err, &exception);
6695         } while (exception.retry);
6696         return err;
6697 }
6698
6699 static bool nfs41_match_stateid(const nfs4_stateid *s1,
6700                 const nfs4_stateid *s2)
6701 {
6702         if (memcmp(s1->other, s2->other, sizeof(s1->other)) != 0)
6703                 return false;
6704
6705         if (s1->seqid == s2->seqid)
6706                 return true;
6707         if (s1->seqid == 0 || s2->seqid == 0)
6708                 return true;
6709
6710         return false;
6711 }
6712
6713 #endif /* CONFIG_NFS_V4_1 */
6714
6715 static bool nfs4_match_stateid(const nfs4_stateid *s1,
6716                 const nfs4_stateid *s2)
6717 {
6718         return nfs4_stateid_match(s1, s2);
6719 }
6720
6721
6722 static const struct nfs4_state_recovery_ops nfs40_reboot_recovery_ops = {
6723         .owner_flag_bit = NFS_OWNER_RECLAIM_REBOOT,
6724         .state_flag_bit = NFS_STATE_RECLAIM_REBOOT,
6725         .recover_open   = nfs4_open_reclaim,
6726         .recover_lock   = nfs4_lock_reclaim,
6727         .establish_clid = nfs4_init_clientid,
6728         .get_clid_cred  = nfs4_get_setclientid_cred,
6729 };
6730
6731 #if defined(CONFIG_NFS_V4_1)
6732 static const struct nfs4_state_recovery_ops nfs41_reboot_recovery_ops = {
6733         .owner_flag_bit = NFS_OWNER_RECLAIM_REBOOT,
6734         .state_flag_bit = NFS_STATE_RECLAIM_REBOOT,
6735         .recover_open   = nfs4_open_reclaim,
6736         .recover_lock   = nfs4_lock_reclaim,
6737         .establish_clid = nfs41_init_clientid,
6738         .get_clid_cred  = nfs4_get_exchange_id_cred,
6739         .reclaim_complete = nfs41_proc_reclaim_complete,
6740 };
6741 #endif /* CONFIG_NFS_V4_1 */
6742
6743 static const struct nfs4_state_recovery_ops nfs40_nograce_recovery_ops = {
6744         .owner_flag_bit = NFS_OWNER_RECLAIM_NOGRACE,
6745         .state_flag_bit = NFS_STATE_RECLAIM_NOGRACE,
6746         .recover_open   = nfs4_open_expired,
6747         .recover_lock   = nfs4_lock_expired,
6748         .establish_clid = nfs4_init_clientid,
6749         .get_clid_cred  = nfs4_get_setclientid_cred,
6750 };
6751
6752 #if defined(CONFIG_NFS_V4_1)
6753 static const struct nfs4_state_recovery_ops nfs41_nograce_recovery_ops = {
6754         .owner_flag_bit = NFS_OWNER_RECLAIM_NOGRACE,
6755         .state_flag_bit = NFS_STATE_RECLAIM_NOGRACE,
6756         .recover_open   = nfs41_open_expired,
6757         .recover_lock   = nfs41_lock_expired,
6758         .establish_clid = nfs41_init_clientid,
6759         .get_clid_cred  = nfs4_get_exchange_id_cred,
6760 };
6761 #endif /* CONFIG_NFS_V4_1 */
6762
6763 static const struct nfs4_state_maintenance_ops nfs40_state_renewal_ops = {
6764         .sched_state_renewal = nfs4_proc_async_renew,
6765         .get_state_renewal_cred_locked = nfs4_get_renew_cred_locked,
6766         .renew_lease = nfs4_proc_renew,
6767 };
6768
6769 #if defined(CONFIG_NFS_V4_1)
6770 static const struct nfs4_state_maintenance_ops nfs41_state_renewal_ops = {
6771         .sched_state_renewal = nfs41_proc_async_sequence,
6772         .get_state_renewal_cred_locked = nfs4_get_machine_cred_locked,
6773         .renew_lease = nfs4_proc_sequence,
6774 };
6775 #endif
6776
6777 static const struct nfs4_minor_version_ops nfs_v4_0_minor_ops = {
6778         .minor_version = 0,
6779         .call_sync = _nfs4_call_sync,
6780         .match_stateid = nfs4_match_stateid,
6781         .find_root_sec = nfs4_find_root_sec,
6782         .reboot_recovery_ops = &nfs40_reboot_recovery_ops,
6783         .nograce_recovery_ops = &nfs40_nograce_recovery_ops,
6784         .state_renewal_ops = &nfs40_state_renewal_ops,
6785 };
6786
6787 #if defined(CONFIG_NFS_V4_1)
6788 static const struct nfs4_minor_version_ops nfs_v4_1_minor_ops = {
6789         .minor_version = 1,
6790         .call_sync = _nfs4_call_sync_session,
6791         .match_stateid = nfs41_match_stateid,
6792         .find_root_sec = nfs41_find_root_sec,
6793         .reboot_recovery_ops = &nfs41_reboot_recovery_ops,
6794         .nograce_recovery_ops = &nfs41_nograce_recovery_ops,
6795         .state_renewal_ops = &nfs41_state_renewal_ops,
6796 };
6797 #endif
6798
6799 const struct nfs4_minor_version_ops *nfs_v4_minor_ops[] = {
6800         [0] = &nfs_v4_0_minor_ops,
6801 #if defined(CONFIG_NFS_V4_1)
6802         [1] = &nfs_v4_1_minor_ops,
6803 #endif
6804 };
6805
6806 static const struct inode_operations nfs4_file_inode_operations = {
6807         .permission     = nfs_permission,
6808         .getattr        = nfs_getattr,
6809         .setattr        = nfs_setattr,
6810         .getxattr       = generic_getxattr,
6811         .setxattr       = generic_setxattr,
6812         .listxattr      = generic_listxattr,
6813         .removexattr    = generic_removexattr,
6814 };
6815
6816 const struct nfs_rpc_ops nfs_v4_clientops = {
6817         .version        = 4,                    /* protocol version */
6818         .dentry_ops     = &nfs4_dentry_operations,
6819         .dir_inode_ops  = &nfs4_dir_inode_operations,
6820         .file_inode_ops = &nfs4_file_inode_operations,
6821         .file_ops       = &nfs4_file_operations,
6822         .getroot        = nfs4_proc_get_root,
6823         .submount       = nfs4_submount,
6824         .getattr        = nfs4_proc_getattr,
6825         .setattr        = nfs4_proc_setattr,
6826         .lookup         = nfs4_proc_lookup,
6827         .access         = nfs4_proc_access,
6828         .readlink       = nfs4_proc_readlink,
6829         .create         = nfs4_proc_create,
6830         .remove         = nfs4_proc_remove,
6831         .unlink_setup   = nfs4_proc_unlink_setup,
6832         .unlink_rpc_prepare = nfs4_proc_unlink_rpc_prepare,
6833         .unlink_done    = nfs4_proc_unlink_done,
6834         .rename         = nfs4_proc_rename,
6835         .rename_setup   = nfs4_proc_rename_setup,
6836         .rename_rpc_prepare = nfs4_proc_rename_rpc_prepare,
6837         .rename_done    = nfs4_proc_rename_done,
6838         .link           = nfs4_proc_link,
6839         .symlink        = nfs4_proc_symlink,
6840         .mkdir          = nfs4_proc_mkdir,
6841         .rmdir          = nfs4_proc_remove,
6842         .readdir        = nfs4_proc_readdir,
6843         .mknod          = nfs4_proc_mknod,
6844         .statfs         = nfs4_proc_statfs,
6845         .fsinfo         = nfs4_proc_fsinfo,
6846         .pathconf       = nfs4_proc_pathconf,
6847         .set_capabilities = nfs4_server_capabilities,
6848         .decode_dirent  = nfs4_decode_dirent,
6849         .read_setup     = nfs4_proc_read_setup,
6850         .read_pageio_init = pnfs_pageio_init_read,
6851         .read_rpc_prepare = nfs4_proc_read_rpc_prepare,
6852         .read_done      = nfs4_read_done,
6853         .write_setup    = nfs4_proc_write_setup,
6854         .write_pageio_init = pnfs_pageio_init_write,
6855         .write_rpc_prepare = nfs4_proc_write_rpc_prepare,
6856         .write_done     = nfs4_write_done,
6857         .commit_setup   = nfs4_proc_commit_setup,
6858         .commit_rpc_prepare = nfs4_proc_commit_rpc_prepare,
6859         .commit_done    = nfs4_commit_done,
6860         .lock           = nfs4_proc_lock,
6861         .clear_acl_cache = nfs4_zap_acl_attr,
6862         .close_context  = nfs4_close_context,
6863         .open_context   = nfs4_atomic_open,
6864         .have_delegation = nfs4_have_delegation,
6865         .return_delegation = nfs4_inode_return_delegation,
6866         .alloc_client   = nfs4_alloc_client,
6867         .init_client    = nfs4_init_client,
6868         .free_client    = nfs4_free_client,
6869 };
6870
6871 static const struct xattr_handler nfs4_xattr_nfs4_acl_handler = {
6872         .prefix = XATTR_NAME_NFSV4_ACL,
6873         .list   = nfs4_xattr_list_nfs4_acl,
6874         .get    = nfs4_xattr_get_nfs4_acl,
6875         .set    = nfs4_xattr_set_nfs4_acl,
6876 };
6877
6878 const struct xattr_handler *nfs4_xattr_handlers[] = {
6879         &nfs4_xattr_nfs4_acl_handler,
6880         NULL
6881 };
6882
6883 module_param(max_session_slots, ushort, 0644);
6884 MODULE_PARM_DESC(max_session_slots, "Maximum number of outstanding NFSv4.1 "
6885                 "requests the client will negotiate");
6886
6887 /*
6888  * Local variables:
6889  *  c-basic-offset: 8
6890  * End:
6891  */