]> rtime.felk.cvut.cz Git - linux-imx.git/blob - fs/nfs/nfs4proc.c
NFSv4.1: Use layout credentials for get_deviceinfo calls
[linux-imx.git] / fs / nfs / nfs4proc.c
1 /*
2  *  fs/nfs/nfs4proc.c
3  *
4  *  Client-side procedure declarations for NFSv4.
5  *
6  *  Copyright (c) 2002 The Regents of the University of Michigan.
7  *  All rights reserved.
8  *
9  *  Kendrick Smith <kmsmith@umich.edu>
10  *  Andy Adamson   <andros@umich.edu>
11  *
12  *  Redistribution and use in source and binary forms, with or without
13  *  modification, are permitted provided that the following conditions
14  *  are met:
15  *
16  *  1. Redistributions of source code must retain the above copyright
17  *     notice, this list of conditions and the following disclaimer.
18  *  2. Redistributions in binary form must reproduce the above copyright
19  *     notice, this list of conditions and the following disclaimer in the
20  *     documentation and/or other materials provided with the distribution.
21  *  3. Neither the name of the University nor the names of its
22  *     contributors may be used to endorse or promote products derived
23  *     from this software without specific prior written permission.
24  *
25  *  THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED
26  *  WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
27  *  MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
28  *  DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
29  *  FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
30  *  CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
31  *  SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
32  *  BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
33  *  LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
34  *  NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
35  *  SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
36  */
37
38 #include <linux/mm.h>
39 #include <linux/delay.h>
40 #include <linux/errno.h>
41 #include <linux/string.h>
42 #include <linux/ratelimit.h>
43 #include <linux/printk.h>
44 #include <linux/slab.h>
45 #include <linux/sunrpc/clnt.h>
46 #include <linux/nfs.h>
47 #include <linux/nfs4.h>
48 #include <linux/nfs_fs.h>
49 #include <linux/nfs_page.h>
50 #include <linux/nfs_mount.h>
51 #include <linux/namei.h>
52 #include <linux/mount.h>
53 #include <linux/module.h>
54 #include <linux/nfs_idmap.h>
55 #include <linux/xattr.h>
56 #include <linux/utsname.h>
57 #include <linux/freezer.h>
58
59 #include "nfs4_fs.h"
60 #include "delegation.h"
61 #include "internal.h"
62 #include "iostat.h"
63 #include "callback.h"
64 #include "pnfs.h"
65 #include "netns.h"
66 #include "nfs4session.h"
67 #include "fscache.h"
68
69 #define NFSDBG_FACILITY         NFSDBG_PROC
70
71 #define NFS4_POLL_RETRY_MIN     (HZ/10)
72 #define NFS4_POLL_RETRY_MAX     (15*HZ)
73
74 struct nfs4_opendata;
75 static int _nfs4_proc_open(struct nfs4_opendata *data);
76 static int _nfs4_recover_proc_open(struct nfs4_opendata *data);
77 static int nfs4_do_fsinfo(struct nfs_server *, struct nfs_fh *, struct nfs_fsinfo *);
78 static int nfs4_async_handle_error(struct rpc_task *, const struct nfs_server *, struct nfs4_state *);
79 static void nfs_fixup_referral_attributes(struct nfs_fattr *fattr);
80 static int nfs4_proc_getattr(struct nfs_server *, struct nfs_fh *, struct nfs_fattr *);
81 static int _nfs4_proc_getattr(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fattr *fattr);
82 static int nfs4_do_setattr(struct inode *inode, struct rpc_cred *cred,
83                             struct nfs_fattr *fattr, struct iattr *sattr,
84                             struct nfs4_state *state);
85 #ifdef CONFIG_NFS_V4_1
86 static int nfs41_test_stateid(struct nfs_server *, nfs4_stateid *,
87                 struct rpc_cred *);
88 static int nfs41_free_stateid(struct nfs_server *, nfs4_stateid *,
89                 struct rpc_cred *);
90 #endif
91 /* Prevent leaks of NFSv4 errors into userland */
92 static int nfs4_map_errors(int err)
93 {
94         if (err >= -1000)
95                 return err;
96         switch (err) {
97         case -NFS4ERR_RESOURCE:
98         case -NFS4ERR_LAYOUTTRYLATER:
99         case -NFS4ERR_RECALLCONFLICT:
100                 return -EREMOTEIO;
101         case -NFS4ERR_WRONGSEC:
102                 return -EPERM;
103         case -NFS4ERR_BADOWNER:
104         case -NFS4ERR_BADNAME:
105                 return -EINVAL;
106         case -NFS4ERR_SHARE_DENIED:
107                 return -EACCES;
108         case -NFS4ERR_MINOR_VERS_MISMATCH:
109                 return -EPROTONOSUPPORT;
110         case -NFS4ERR_ACCESS:
111                 return -EACCES;
112         case -NFS4ERR_FILE_OPEN:
113                 return -EBUSY;
114         default:
115                 dprintk("%s could not handle NFSv4 error %d\n",
116                                 __func__, -err);
117                 break;
118         }
119         return -EIO;
120 }
121
122 /*
123  * This is our standard bitmap for GETATTR requests.
124  */
125 const u32 nfs4_fattr_bitmap[3] = {
126         FATTR4_WORD0_TYPE
127         | FATTR4_WORD0_CHANGE
128         | FATTR4_WORD0_SIZE
129         | FATTR4_WORD0_FSID
130         | FATTR4_WORD0_FILEID,
131         FATTR4_WORD1_MODE
132         | FATTR4_WORD1_NUMLINKS
133         | FATTR4_WORD1_OWNER
134         | FATTR4_WORD1_OWNER_GROUP
135         | FATTR4_WORD1_RAWDEV
136         | FATTR4_WORD1_SPACE_USED
137         | FATTR4_WORD1_TIME_ACCESS
138         | FATTR4_WORD1_TIME_METADATA
139         | FATTR4_WORD1_TIME_MODIFY
140 };
141
142 static const u32 nfs4_pnfs_open_bitmap[3] = {
143         FATTR4_WORD0_TYPE
144         | FATTR4_WORD0_CHANGE
145         | FATTR4_WORD0_SIZE
146         | FATTR4_WORD0_FSID
147         | FATTR4_WORD0_FILEID,
148         FATTR4_WORD1_MODE
149         | FATTR4_WORD1_NUMLINKS
150         | FATTR4_WORD1_OWNER
151         | FATTR4_WORD1_OWNER_GROUP
152         | FATTR4_WORD1_RAWDEV
153         | FATTR4_WORD1_SPACE_USED
154         | FATTR4_WORD1_TIME_ACCESS
155         | FATTR4_WORD1_TIME_METADATA
156         | FATTR4_WORD1_TIME_MODIFY,
157         FATTR4_WORD2_MDSTHRESHOLD
158 };
159
160 static const u32 nfs4_open_noattr_bitmap[3] = {
161         FATTR4_WORD0_TYPE
162         | FATTR4_WORD0_CHANGE
163         | FATTR4_WORD0_FILEID,
164 };
165
166 const u32 nfs4_statfs_bitmap[2] = {
167         FATTR4_WORD0_FILES_AVAIL
168         | FATTR4_WORD0_FILES_FREE
169         | FATTR4_WORD0_FILES_TOTAL,
170         FATTR4_WORD1_SPACE_AVAIL
171         | FATTR4_WORD1_SPACE_FREE
172         | FATTR4_WORD1_SPACE_TOTAL
173 };
174
175 const u32 nfs4_pathconf_bitmap[2] = {
176         FATTR4_WORD0_MAXLINK
177         | FATTR4_WORD0_MAXNAME,
178         0
179 };
180
181 const u32 nfs4_fsinfo_bitmap[3] = { FATTR4_WORD0_MAXFILESIZE
182                         | FATTR4_WORD0_MAXREAD
183                         | FATTR4_WORD0_MAXWRITE
184                         | FATTR4_WORD0_LEASE_TIME,
185                         FATTR4_WORD1_TIME_DELTA
186                         | FATTR4_WORD1_FS_LAYOUT_TYPES,
187                         FATTR4_WORD2_LAYOUT_BLKSIZE
188 };
189
190 const u32 nfs4_fs_locations_bitmap[2] = {
191         FATTR4_WORD0_TYPE
192         | FATTR4_WORD0_CHANGE
193         | FATTR4_WORD0_SIZE
194         | FATTR4_WORD0_FSID
195         | FATTR4_WORD0_FILEID
196         | FATTR4_WORD0_FS_LOCATIONS,
197         FATTR4_WORD1_MODE
198         | FATTR4_WORD1_NUMLINKS
199         | FATTR4_WORD1_OWNER
200         | FATTR4_WORD1_OWNER_GROUP
201         | FATTR4_WORD1_RAWDEV
202         | FATTR4_WORD1_SPACE_USED
203         | FATTR4_WORD1_TIME_ACCESS
204         | FATTR4_WORD1_TIME_METADATA
205         | FATTR4_WORD1_TIME_MODIFY
206         | FATTR4_WORD1_MOUNTED_ON_FILEID
207 };
208
209 static void nfs4_setup_readdir(u64 cookie, __be32 *verifier, struct dentry *dentry,
210                 struct nfs4_readdir_arg *readdir)
211 {
212         __be32 *start, *p;
213
214         if (cookie > 2) {
215                 readdir->cookie = cookie;
216                 memcpy(&readdir->verifier, verifier, sizeof(readdir->verifier));
217                 return;
218         }
219
220         readdir->cookie = 0;
221         memset(&readdir->verifier, 0, sizeof(readdir->verifier));
222         if (cookie == 2)
223                 return;
224         
225         /*
226          * NFSv4 servers do not return entries for '.' and '..'
227          * Therefore, we fake these entries here.  We let '.'
228          * have cookie 0 and '..' have cookie 1.  Note that
229          * when talking to the server, we always send cookie 0
230          * instead of 1 or 2.
231          */
232         start = p = kmap_atomic(*readdir->pages);
233         
234         if (cookie == 0) {
235                 *p++ = xdr_one;                                  /* next */
236                 *p++ = xdr_zero;                   /* cookie, first word */
237                 *p++ = xdr_one;                   /* cookie, second word */
238                 *p++ = xdr_one;                             /* entry len */
239                 memcpy(p, ".\0\0\0", 4);                        /* entry */
240                 p++;
241                 *p++ = xdr_one;                         /* bitmap length */
242                 *p++ = htonl(FATTR4_WORD0_FILEID);             /* bitmap */
243                 *p++ = htonl(8);              /* attribute buffer length */
244                 p = xdr_encode_hyper(p, NFS_FILEID(dentry->d_inode));
245         }
246         
247         *p++ = xdr_one;                                  /* next */
248         *p++ = xdr_zero;                   /* cookie, first word */
249         *p++ = xdr_two;                   /* cookie, second word */
250         *p++ = xdr_two;                             /* entry len */
251         memcpy(p, "..\0\0", 4);                         /* entry */
252         p++;
253         *p++ = xdr_one;                         /* bitmap length */
254         *p++ = htonl(FATTR4_WORD0_FILEID);             /* bitmap */
255         *p++ = htonl(8);              /* attribute buffer length */
256         p = xdr_encode_hyper(p, NFS_FILEID(dentry->d_parent->d_inode));
257
258         readdir->pgbase = (char *)p - (char *)start;
259         readdir->count -= readdir->pgbase;
260         kunmap_atomic(start);
261 }
262
263 static int nfs4_delay(struct rpc_clnt *clnt, long *timeout)
264 {
265         int res = 0;
266
267         might_sleep();
268
269         if (*timeout <= 0)
270                 *timeout = NFS4_POLL_RETRY_MIN;
271         if (*timeout > NFS4_POLL_RETRY_MAX)
272                 *timeout = NFS4_POLL_RETRY_MAX;
273         freezable_schedule_timeout_killable(*timeout);
274         if (fatal_signal_pending(current))
275                 res = -ERESTARTSYS;
276         *timeout <<= 1;
277         return res;
278 }
279
280 /* This is the error handling routine for processes that are allowed
281  * to sleep.
282  */
283 static int nfs4_handle_exception(struct nfs_server *server, int errorcode, struct nfs4_exception *exception)
284 {
285         struct nfs_client *clp = server->nfs_client;
286         struct nfs4_state *state = exception->state;
287         struct inode *inode = exception->inode;
288         int ret = errorcode;
289
290         exception->retry = 0;
291         switch(errorcode) {
292                 case 0:
293                         return 0;
294                 case -NFS4ERR_OPENMODE:
295                         if (inode && nfs4_have_delegation(inode, FMODE_READ)) {
296                                 nfs4_inode_return_delegation(inode);
297                                 exception->retry = 1;
298                                 return 0;
299                         }
300                         if (state == NULL)
301                                 break;
302                         ret = nfs4_schedule_stateid_recovery(server, state);
303                         if (ret < 0)
304                                 break;
305                         goto wait_on_recovery;
306                 case -NFS4ERR_DELEG_REVOKED:
307                 case -NFS4ERR_ADMIN_REVOKED:
308                 case -NFS4ERR_BAD_STATEID:
309                         if (inode != NULL && nfs4_have_delegation(inode, FMODE_READ)) {
310                                 nfs_remove_bad_delegation(inode);
311                                 exception->retry = 1;
312                                 break;
313                         }
314                         if (state == NULL)
315                                 break;
316                         ret = nfs4_schedule_stateid_recovery(server, state);
317                         if (ret < 0)
318                                 break;
319                         goto wait_on_recovery;
320                 case -NFS4ERR_EXPIRED:
321                         if (state != NULL) {
322                                 ret = nfs4_schedule_stateid_recovery(server, state);
323                                 if (ret < 0)
324                                         break;
325                         }
326                 case -NFS4ERR_STALE_STATEID:
327                 case -NFS4ERR_STALE_CLIENTID:
328                         nfs4_schedule_lease_recovery(clp);
329                         goto wait_on_recovery;
330 #if defined(CONFIG_NFS_V4_1)
331                 case -NFS4ERR_BADSESSION:
332                 case -NFS4ERR_BADSLOT:
333                 case -NFS4ERR_BAD_HIGH_SLOT:
334                 case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION:
335                 case -NFS4ERR_DEADSESSION:
336                 case -NFS4ERR_SEQ_FALSE_RETRY:
337                 case -NFS4ERR_SEQ_MISORDERED:
338                         dprintk("%s ERROR: %d Reset session\n", __func__,
339                                 errorcode);
340                         nfs4_schedule_session_recovery(clp->cl_session, errorcode);
341                         goto wait_on_recovery;
342 #endif /* defined(CONFIG_NFS_V4_1) */
343                 case -NFS4ERR_FILE_OPEN:
344                         if (exception->timeout > HZ) {
345                                 /* We have retried a decent amount, time to
346                                  * fail
347                                  */
348                                 ret = -EBUSY;
349                                 break;
350                         }
351                 case -NFS4ERR_GRACE:
352                 case -NFS4ERR_DELAY:
353                         ret = nfs4_delay(server->client, &exception->timeout);
354                         if (ret != 0)
355                                 break;
356                 case -NFS4ERR_RETRY_UNCACHED_REP:
357                 case -NFS4ERR_OLD_STATEID:
358                         exception->retry = 1;
359                         break;
360                 case -NFS4ERR_BADOWNER:
361                         /* The following works around a Linux server bug! */
362                 case -NFS4ERR_BADNAME:
363                         if (server->caps & NFS_CAP_UIDGID_NOMAP) {
364                                 server->caps &= ~NFS_CAP_UIDGID_NOMAP;
365                                 exception->retry = 1;
366                                 printk(KERN_WARNING "NFS: v4 server %s "
367                                                 "does not accept raw "
368                                                 "uid/gids. "
369                                                 "Reenabling the idmapper.\n",
370                                                 server->nfs_client->cl_hostname);
371                         }
372         }
373         /* We failed to handle the error */
374         return nfs4_map_errors(ret);
375 wait_on_recovery:
376         ret = nfs4_wait_clnt_recover(clp);
377         if (ret == 0)
378                 exception->retry = 1;
379         return ret;
380 }
381
382
383 static void do_renew_lease(struct nfs_client *clp, unsigned long timestamp)
384 {
385         spin_lock(&clp->cl_lock);
386         if (time_before(clp->cl_last_renewal,timestamp))
387                 clp->cl_last_renewal = timestamp;
388         spin_unlock(&clp->cl_lock);
389 }
390
391 static void renew_lease(const struct nfs_server *server, unsigned long timestamp)
392 {
393         do_renew_lease(server->nfs_client, timestamp);
394 }
395
396 #if defined(CONFIG_NFS_V4_1)
397
398 static void nfs41_sequence_free_slot(struct nfs4_sequence_res *res)
399 {
400         struct nfs4_session *session;
401         struct nfs4_slot_table *tbl;
402         bool send_new_highest_used_slotid = false;
403
404         if (!res->sr_slot) {
405                 /* just wake up the next guy waiting since
406                  * we may have not consumed a slot after all */
407                 dprintk("%s: No slot\n", __func__);
408                 return;
409         }
410         tbl = res->sr_slot->table;
411         session = tbl->session;
412
413         spin_lock(&tbl->slot_tbl_lock);
414         /* Be nice to the server: try to ensure that the last transmitted
415          * value for highest_user_slotid <= target_highest_slotid
416          */
417         if (tbl->highest_used_slotid > tbl->target_highest_slotid)
418                 send_new_highest_used_slotid = true;
419
420         if (nfs41_wake_and_assign_slot(tbl, res->sr_slot)) {
421                 send_new_highest_used_slotid = false;
422                 goto out_unlock;
423         }
424         nfs4_free_slot(tbl, res->sr_slot);
425
426         if (tbl->highest_used_slotid != NFS4_NO_SLOT)
427                 send_new_highest_used_slotid = false;
428 out_unlock:
429         spin_unlock(&tbl->slot_tbl_lock);
430         res->sr_slot = NULL;
431         if (send_new_highest_used_slotid)
432                 nfs41_server_notify_highest_slotid_update(session->clp);
433 }
434
435 static int nfs41_sequence_done(struct rpc_task *task, struct nfs4_sequence_res *res)
436 {
437         struct nfs4_session *session;
438         struct nfs4_slot *slot;
439         struct nfs_client *clp;
440         bool interrupted = false;
441         int ret = 1;
442
443         /* don't increment the sequence number if the task wasn't sent */
444         if (!RPC_WAS_SENT(task))
445                 goto out;
446
447         slot = res->sr_slot;
448         session = slot->table->session;
449
450         if (slot->interrupted) {
451                 slot->interrupted = 0;
452                 interrupted = true;
453         }
454
455         /* Check the SEQUENCE operation status */
456         switch (res->sr_status) {
457         case 0:
458                 /* Update the slot's sequence and clientid lease timer */
459                 ++slot->seq_nr;
460                 clp = session->clp;
461                 do_renew_lease(clp, res->sr_timestamp);
462                 /* Check sequence flags */
463                 if (res->sr_status_flags != 0)
464                         nfs4_schedule_lease_recovery(clp);
465                 nfs41_update_target_slotid(slot->table, slot, res);
466                 break;
467         case 1:
468                 /*
469                  * sr_status remains 1 if an RPC level error occurred.
470                  * The server may or may not have processed the sequence
471                  * operation..
472                  * Mark the slot as having hosted an interrupted RPC call.
473                  */
474                 slot->interrupted = 1;
475                 goto out;
476         case -NFS4ERR_DELAY:
477                 /* The server detected a resend of the RPC call and
478                  * returned NFS4ERR_DELAY as per Section 2.10.6.2
479                  * of RFC5661.
480                  */
481                 dprintk("%s: slot=%u seq=%u: Operation in progress\n",
482                         __func__,
483                         slot->slot_nr,
484                         slot->seq_nr);
485                 goto out_retry;
486         case -NFS4ERR_BADSLOT:
487                 /*
488                  * The slot id we used was probably retired. Try again
489                  * using a different slot id.
490                  */
491                 goto retry_nowait;
492         case -NFS4ERR_SEQ_MISORDERED:
493                 /*
494                  * Was the last operation on this sequence interrupted?
495                  * If so, retry after bumping the sequence number.
496                  */
497                 if (interrupted) {
498                         ++slot->seq_nr;
499                         goto retry_nowait;
500                 }
501                 /*
502                  * Could this slot have been previously retired?
503                  * If so, then the server may be expecting seq_nr = 1!
504                  */
505                 if (slot->seq_nr != 1) {
506                         slot->seq_nr = 1;
507                         goto retry_nowait;
508                 }
509                 break;
510         case -NFS4ERR_SEQ_FALSE_RETRY:
511                 ++slot->seq_nr;
512                 goto retry_nowait;
513         default:
514                 /* Just update the slot sequence no. */
515                 ++slot->seq_nr;
516         }
517 out:
518         /* The session may be reset by one of the error handlers. */
519         dprintk("%s: Error %d free the slot \n", __func__, res->sr_status);
520         nfs41_sequence_free_slot(res);
521         return ret;
522 retry_nowait:
523         if (rpc_restart_call_prepare(task)) {
524                 task->tk_status = 0;
525                 ret = 0;
526         }
527         goto out;
528 out_retry:
529         if (!rpc_restart_call(task))
530                 goto out;
531         rpc_delay(task, NFS4_POLL_RETRY_MAX);
532         return 0;
533 }
534
535 static int nfs4_sequence_done(struct rpc_task *task,
536                                struct nfs4_sequence_res *res)
537 {
538         if (res->sr_slot == NULL)
539                 return 1;
540         return nfs41_sequence_done(task, res);
541 }
542
543 static void nfs41_init_sequence(struct nfs4_sequence_args *args,
544                 struct nfs4_sequence_res *res, int cache_reply)
545 {
546         args->sa_slot = NULL;
547         args->sa_cache_this = 0;
548         args->sa_privileged = 0;
549         if (cache_reply)
550                 args->sa_cache_this = 1;
551         res->sr_slot = NULL;
552 }
553
554 static void nfs4_set_sequence_privileged(struct nfs4_sequence_args *args)
555 {
556         args->sa_privileged = 1;
557 }
558
559 int nfs41_setup_sequence(struct nfs4_session *session,
560                                 struct nfs4_sequence_args *args,
561                                 struct nfs4_sequence_res *res,
562                                 struct rpc_task *task)
563 {
564         struct nfs4_slot *slot;
565         struct nfs4_slot_table *tbl;
566
567         dprintk("--> %s\n", __func__);
568         /* slot already allocated? */
569         if (res->sr_slot != NULL)
570                 goto out_success;
571
572         tbl = &session->fc_slot_table;
573
574         task->tk_timeout = 0;
575
576         spin_lock(&tbl->slot_tbl_lock);
577         if (test_bit(NFS4_SLOT_TBL_DRAINING, &tbl->slot_tbl_state) &&
578             !args->sa_privileged) {
579                 /* The state manager will wait until the slot table is empty */
580                 dprintk("%s session is draining\n", __func__);
581                 goto out_sleep;
582         }
583
584         slot = nfs4_alloc_slot(tbl);
585         if (IS_ERR(slot)) {
586                 /* If out of memory, try again in 1/4 second */
587                 if (slot == ERR_PTR(-ENOMEM))
588                         task->tk_timeout = HZ >> 2;
589                 dprintk("<-- %s: no free slots\n", __func__);
590                 goto out_sleep;
591         }
592         spin_unlock(&tbl->slot_tbl_lock);
593
594         args->sa_slot = slot;
595
596         dprintk("<-- %s slotid=%d seqid=%d\n", __func__,
597                         slot->slot_nr, slot->seq_nr);
598
599         res->sr_slot = slot;
600         res->sr_timestamp = jiffies;
601         res->sr_status_flags = 0;
602         /*
603          * sr_status is only set in decode_sequence, and so will remain
604          * set to 1 if an rpc level failure occurs.
605          */
606         res->sr_status = 1;
607 out_success:
608         rpc_call_start(task);
609         return 0;
610 out_sleep:
611         /* Privileged tasks are queued with top priority */
612         if (args->sa_privileged)
613                 rpc_sleep_on_priority(&tbl->slot_tbl_waitq, task,
614                                 NULL, RPC_PRIORITY_PRIVILEGED);
615         else
616                 rpc_sleep_on(&tbl->slot_tbl_waitq, task, NULL);
617         spin_unlock(&tbl->slot_tbl_lock);
618         return -EAGAIN;
619 }
620 EXPORT_SYMBOL_GPL(nfs41_setup_sequence);
621
622 int nfs4_setup_sequence(const struct nfs_server *server,
623                         struct nfs4_sequence_args *args,
624                         struct nfs4_sequence_res *res,
625                         struct rpc_task *task)
626 {
627         struct nfs4_session *session = nfs4_get_session(server);
628         int ret = 0;
629
630         if (session == NULL) {
631                 rpc_call_start(task);
632                 goto out;
633         }
634
635         dprintk("--> %s clp %p session %p sr_slot %d\n",
636                 __func__, session->clp, session, res->sr_slot ?
637                         res->sr_slot->slot_nr : -1);
638
639         ret = nfs41_setup_sequence(session, args, res, task);
640 out:
641         dprintk("<-- %s status=%d\n", __func__, ret);
642         return ret;
643 }
644
645 struct nfs41_call_sync_data {
646         const struct nfs_server *seq_server;
647         struct nfs4_sequence_args *seq_args;
648         struct nfs4_sequence_res *seq_res;
649 };
650
651 static void nfs41_call_sync_prepare(struct rpc_task *task, void *calldata)
652 {
653         struct nfs41_call_sync_data *data = calldata;
654         struct nfs4_session *session = nfs4_get_session(data->seq_server);
655
656         dprintk("--> %s data->seq_server %p\n", __func__, data->seq_server);
657
658         nfs41_setup_sequence(session, data->seq_args, data->seq_res, task);
659 }
660
661 static void nfs41_call_sync_done(struct rpc_task *task, void *calldata)
662 {
663         struct nfs41_call_sync_data *data = calldata;
664
665         nfs41_sequence_done(task, data->seq_res);
666 }
667
668 static const struct rpc_call_ops nfs41_call_sync_ops = {
669         .rpc_call_prepare = nfs41_call_sync_prepare,
670         .rpc_call_done = nfs41_call_sync_done,
671 };
672
673 static int nfs4_call_sync_sequence(struct rpc_clnt *clnt,
674                                    struct nfs_server *server,
675                                    struct rpc_message *msg,
676                                    struct nfs4_sequence_args *args,
677                                    struct nfs4_sequence_res *res)
678 {
679         int ret;
680         struct rpc_task *task;
681         struct nfs41_call_sync_data data = {
682                 .seq_server = server,
683                 .seq_args = args,
684                 .seq_res = res,
685         };
686         struct rpc_task_setup task_setup = {
687                 .rpc_client = clnt,
688                 .rpc_message = msg,
689                 .callback_ops = &nfs41_call_sync_ops,
690                 .callback_data = &data
691         };
692
693         task = rpc_run_task(&task_setup);
694         if (IS_ERR(task))
695                 ret = PTR_ERR(task);
696         else {
697                 ret = task->tk_status;
698                 rpc_put_task(task);
699         }
700         return ret;
701 }
702
703 #else
704 static
705 void nfs41_init_sequence(struct nfs4_sequence_args *args,
706                 struct nfs4_sequence_res *res, int cache_reply)
707 {
708 }
709
710 static void nfs4_set_sequence_privileged(struct nfs4_sequence_args *args)
711 {
712 }
713
714
715 static int nfs4_sequence_done(struct rpc_task *task,
716                                struct nfs4_sequence_res *res)
717 {
718         return 1;
719 }
720 #endif /* CONFIG_NFS_V4_1 */
721
722 static
723 int _nfs4_call_sync(struct rpc_clnt *clnt,
724                     struct nfs_server *server,
725                     struct rpc_message *msg,
726                     struct nfs4_sequence_args *args,
727                     struct nfs4_sequence_res *res)
728 {
729         return rpc_call_sync(clnt, msg, 0);
730 }
731
732 static
733 int nfs4_call_sync(struct rpc_clnt *clnt,
734                    struct nfs_server *server,
735                    struct rpc_message *msg,
736                    struct nfs4_sequence_args *args,
737                    struct nfs4_sequence_res *res,
738                    int cache_reply)
739 {
740         nfs41_init_sequence(args, res, cache_reply);
741         return server->nfs_client->cl_mvops->call_sync(clnt, server, msg,
742                                                 args, res);
743 }
744
745 static void update_changeattr(struct inode *dir, struct nfs4_change_info *cinfo)
746 {
747         struct nfs_inode *nfsi = NFS_I(dir);
748
749         spin_lock(&dir->i_lock);
750         nfsi->cache_validity |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_DATA;
751         if (!cinfo->atomic || cinfo->before != dir->i_version)
752                 nfs_force_lookup_revalidate(dir);
753         dir->i_version = cinfo->after;
754         nfs_fscache_invalidate(dir);
755         spin_unlock(&dir->i_lock);
756 }
757
758 struct nfs4_opendata {
759         struct kref kref;
760         struct nfs_openargs o_arg;
761         struct nfs_openres o_res;
762         struct nfs_open_confirmargs c_arg;
763         struct nfs_open_confirmres c_res;
764         struct nfs4_string owner_name;
765         struct nfs4_string group_name;
766         struct nfs_fattr f_attr;
767         struct dentry *dir;
768         struct dentry *dentry;
769         struct nfs4_state_owner *owner;
770         struct nfs4_state *state;
771         struct iattr attrs;
772         unsigned long timestamp;
773         unsigned int rpc_done : 1;
774         unsigned int is_recover : 1;
775         int rpc_status;
776         int cancelled;
777 };
778
779 static bool nfs4_clear_cap_atomic_open_v1(struct nfs_server *server,
780                 int err, struct nfs4_exception *exception)
781 {
782         if (err != -EINVAL)
783                 return false;
784         if (!(server->caps & NFS_CAP_ATOMIC_OPEN_V1))
785                 return false;
786         server->caps &= ~NFS_CAP_ATOMIC_OPEN_V1;
787         exception->retry = 1;
788         return true;
789 }
790
791 static enum open_claim_type4
792 nfs4_map_atomic_open_claim(struct nfs_server *server,
793                 enum open_claim_type4 claim)
794 {
795         if (server->caps & NFS_CAP_ATOMIC_OPEN_V1)
796                 return claim;
797         switch (claim) {
798         default:
799                 return claim;
800         case NFS4_OPEN_CLAIM_FH:
801                 return NFS4_OPEN_CLAIM_NULL;
802         case NFS4_OPEN_CLAIM_DELEG_CUR_FH:
803                 return NFS4_OPEN_CLAIM_DELEGATE_CUR;
804         case NFS4_OPEN_CLAIM_DELEG_PREV_FH:
805                 return NFS4_OPEN_CLAIM_DELEGATE_PREV;
806         }
807 }
808
809 static void nfs4_init_opendata_res(struct nfs4_opendata *p)
810 {
811         p->o_res.f_attr = &p->f_attr;
812         p->o_res.seqid = p->o_arg.seqid;
813         p->c_res.seqid = p->c_arg.seqid;
814         p->o_res.server = p->o_arg.server;
815         p->o_res.access_request = p->o_arg.access;
816         nfs_fattr_init(&p->f_attr);
817         nfs_fattr_init_names(&p->f_attr, &p->owner_name, &p->group_name);
818 }
819
820 static struct nfs4_opendata *nfs4_opendata_alloc(struct dentry *dentry,
821                 struct nfs4_state_owner *sp, fmode_t fmode, int flags,
822                 const struct iattr *attrs,
823                 enum open_claim_type4 claim,
824                 gfp_t gfp_mask)
825 {
826         struct dentry *parent = dget_parent(dentry);
827         struct inode *dir = parent->d_inode;
828         struct nfs_server *server = NFS_SERVER(dir);
829         struct nfs4_opendata *p;
830
831         p = kzalloc(sizeof(*p), gfp_mask);
832         if (p == NULL)
833                 goto err;
834         p->o_arg.seqid = nfs_alloc_seqid(&sp->so_seqid, gfp_mask);
835         if (p->o_arg.seqid == NULL)
836                 goto err_free;
837         nfs_sb_active(dentry->d_sb);
838         p->dentry = dget(dentry);
839         p->dir = parent;
840         p->owner = sp;
841         atomic_inc(&sp->so_count);
842         p->o_arg.open_flags = flags;
843         p->o_arg.fmode = fmode & (FMODE_READ|FMODE_WRITE);
844         /* don't put an ACCESS op in OPEN compound if O_EXCL, because ACCESS
845          * will return permission denied for all bits until close */
846         if (!(flags & O_EXCL)) {
847                 /* ask server to check for all possible rights as results
848                  * are cached */
849                 p->o_arg.access = NFS4_ACCESS_READ | NFS4_ACCESS_MODIFY |
850                                   NFS4_ACCESS_EXTEND | NFS4_ACCESS_EXECUTE;
851         }
852         p->o_arg.clientid = server->nfs_client->cl_clientid;
853         p->o_arg.id.create_time = ktime_to_ns(sp->so_seqid.create_time);
854         p->o_arg.id.uniquifier = sp->so_seqid.owner_id;
855         p->o_arg.name = &dentry->d_name;
856         p->o_arg.server = server;
857         p->o_arg.bitmask = server->attr_bitmask;
858         p->o_arg.open_bitmap = &nfs4_fattr_bitmap[0];
859         p->o_arg.claim = nfs4_map_atomic_open_claim(server, claim);
860         switch (p->o_arg.claim) {
861         case NFS4_OPEN_CLAIM_NULL:
862         case NFS4_OPEN_CLAIM_DELEGATE_CUR:
863         case NFS4_OPEN_CLAIM_DELEGATE_PREV:
864                 p->o_arg.fh = NFS_FH(dir);
865                 break;
866         case NFS4_OPEN_CLAIM_PREVIOUS:
867         case NFS4_OPEN_CLAIM_FH:
868         case NFS4_OPEN_CLAIM_DELEG_CUR_FH:
869         case NFS4_OPEN_CLAIM_DELEG_PREV_FH:
870                 p->o_arg.fh = NFS_FH(dentry->d_inode);
871         }
872         if (attrs != NULL && attrs->ia_valid != 0) {
873                 __be32 verf[2];
874
875                 p->o_arg.u.attrs = &p->attrs;
876                 memcpy(&p->attrs, attrs, sizeof(p->attrs));
877
878                 verf[0] = jiffies;
879                 verf[1] = current->pid;
880                 memcpy(p->o_arg.u.verifier.data, verf,
881                                 sizeof(p->o_arg.u.verifier.data));
882         }
883         p->c_arg.fh = &p->o_res.fh;
884         p->c_arg.stateid = &p->o_res.stateid;
885         p->c_arg.seqid = p->o_arg.seqid;
886         nfs4_init_opendata_res(p);
887         kref_init(&p->kref);
888         return p;
889 err_free:
890         kfree(p);
891 err:
892         dput(parent);
893         return NULL;
894 }
895
896 static void nfs4_opendata_free(struct kref *kref)
897 {
898         struct nfs4_opendata *p = container_of(kref,
899                         struct nfs4_opendata, kref);
900         struct super_block *sb = p->dentry->d_sb;
901
902         nfs_free_seqid(p->o_arg.seqid);
903         if (p->state != NULL)
904                 nfs4_put_open_state(p->state);
905         nfs4_put_state_owner(p->owner);
906         dput(p->dir);
907         dput(p->dentry);
908         nfs_sb_deactive(sb);
909         nfs_fattr_free_names(&p->f_attr);
910         kfree(p);
911 }
912
913 static void nfs4_opendata_put(struct nfs4_opendata *p)
914 {
915         if (p != NULL)
916                 kref_put(&p->kref, nfs4_opendata_free);
917 }
918
919 static int nfs4_wait_for_completion_rpc_task(struct rpc_task *task)
920 {
921         int ret;
922
923         ret = rpc_wait_for_completion_task(task);
924         return ret;
925 }
926
927 static int can_open_cached(struct nfs4_state *state, fmode_t mode, int open_mode)
928 {
929         int ret = 0;
930
931         if (open_mode & (O_EXCL|O_TRUNC))
932                 goto out;
933         switch (mode & (FMODE_READ|FMODE_WRITE)) {
934                 case FMODE_READ:
935                         ret |= test_bit(NFS_O_RDONLY_STATE, &state->flags) != 0
936                                 && state->n_rdonly != 0;
937                         break;
938                 case FMODE_WRITE:
939                         ret |= test_bit(NFS_O_WRONLY_STATE, &state->flags) != 0
940                                 && state->n_wronly != 0;
941                         break;
942                 case FMODE_READ|FMODE_WRITE:
943                         ret |= test_bit(NFS_O_RDWR_STATE, &state->flags) != 0
944                                 && state->n_rdwr != 0;
945         }
946 out:
947         return ret;
948 }
949
950 static int can_open_delegated(struct nfs_delegation *delegation, fmode_t fmode)
951 {
952         if (delegation == NULL)
953                 return 0;
954         if ((delegation->type & fmode) != fmode)
955                 return 0;
956         if (test_bit(NFS_DELEGATION_NEED_RECLAIM, &delegation->flags))
957                 return 0;
958         if (test_bit(NFS_DELEGATION_RETURNING, &delegation->flags))
959                 return 0;
960         nfs_mark_delegation_referenced(delegation);
961         return 1;
962 }
963
964 static void update_open_stateflags(struct nfs4_state *state, fmode_t fmode)
965 {
966         switch (fmode) {
967                 case FMODE_WRITE:
968                         state->n_wronly++;
969                         break;
970                 case FMODE_READ:
971                         state->n_rdonly++;
972                         break;
973                 case FMODE_READ|FMODE_WRITE:
974                         state->n_rdwr++;
975         }
976         nfs4_state_set_mode_locked(state, state->state | fmode);
977 }
978
979 static void nfs_set_open_stateid_locked(struct nfs4_state *state, nfs4_stateid *stateid, fmode_t fmode)
980 {
981         if (test_bit(NFS_DELEGATED_STATE, &state->flags) == 0)
982                 nfs4_stateid_copy(&state->stateid, stateid);
983         nfs4_stateid_copy(&state->open_stateid, stateid);
984         set_bit(NFS_OPEN_STATE, &state->flags);
985         switch (fmode) {
986                 case FMODE_READ:
987                         set_bit(NFS_O_RDONLY_STATE, &state->flags);
988                         break;
989                 case FMODE_WRITE:
990                         set_bit(NFS_O_WRONLY_STATE, &state->flags);
991                         break;
992                 case FMODE_READ|FMODE_WRITE:
993                         set_bit(NFS_O_RDWR_STATE, &state->flags);
994         }
995 }
996
997 static void nfs_set_open_stateid(struct nfs4_state *state, nfs4_stateid *stateid, fmode_t fmode)
998 {
999         write_seqlock(&state->seqlock);
1000         nfs_set_open_stateid_locked(state, stateid, fmode);
1001         write_sequnlock(&state->seqlock);
1002 }
1003
1004 static void __update_open_stateid(struct nfs4_state *state, nfs4_stateid *open_stateid, const nfs4_stateid *deleg_stateid, fmode_t fmode)
1005 {
1006         /*
1007          * Protect the call to nfs4_state_set_mode_locked and
1008          * serialise the stateid update
1009          */
1010         write_seqlock(&state->seqlock);
1011         if (deleg_stateid != NULL) {
1012                 nfs4_stateid_copy(&state->stateid, deleg_stateid);
1013                 set_bit(NFS_DELEGATED_STATE, &state->flags);
1014         }
1015         if (open_stateid != NULL)
1016                 nfs_set_open_stateid_locked(state, open_stateid, fmode);
1017         write_sequnlock(&state->seqlock);
1018         spin_lock(&state->owner->so_lock);
1019         update_open_stateflags(state, fmode);
1020         spin_unlock(&state->owner->so_lock);
1021 }
1022
1023 static int update_open_stateid(struct nfs4_state *state, nfs4_stateid *open_stateid, nfs4_stateid *delegation, fmode_t fmode)
1024 {
1025         struct nfs_inode *nfsi = NFS_I(state->inode);
1026         struct nfs_delegation *deleg_cur;
1027         int ret = 0;
1028
1029         fmode &= (FMODE_READ|FMODE_WRITE);
1030
1031         rcu_read_lock();
1032         deleg_cur = rcu_dereference(nfsi->delegation);
1033         if (deleg_cur == NULL)
1034                 goto no_delegation;
1035
1036         spin_lock(&deleg_cur->lock);
1037         if (nfsi->delegation != deleg_cur ||
1038            test_bit(NFS_DELEGATION_RETURNING, &deleg_cur->flags) ||
1039             (deleg_cur->type & fmode) != fmode)
1040                 goto no_delegation_unlock;
1041
1042         if (delegation == NULL)
1043                 delegation = &deleg_cur->stateid;
1044         else if (!nfs4_stateid_match(&deleg_cur->stateid, delegation))
1045                 goto no_delegation_unlock;
1046
1047         nfs_mark_delegation_referenced(deleg_cur);
1048         __update_open_stateid(state, open_stateid, &deleg_cur->stateid, fmode);
1049         ret = 1;
1050 no_delegation_unlock:
1051         spin_unlock(&deleg_cur->lock);
1052 no_delegation:
1053         rcu_read_unlock();
1054
1055         if (!ret && open_stateid != NULL) {
1056                 __update_open_stateid(state, open_stateid, NULL, fmode);
1057                 ret = 1;
1058         }
1059
1060         return ret;
1061 }
1062
1063
1064 static void nfs4_return_incompatible_delegation(struct inode *inode, fmode_t fmode)
1065 {
1066         struct nfs_delegation *delegation;
1067
1068         rcu_read_lock();
1069         delegation = rcu_dereference(NFS_I(inode)->delegation);
1070         if (delegation == NULL || (delegation->type & fmode) == fmode) {
1071                 rcu_read_unlock();
1072                 return;
1073         }
1074         rcu_read_unlock();
1075         nfs4_inode_return_delegation(inode);
1076 }
1077
1078 static struct nfs4_state *nfs4_try_open_cached(struct nfs4_opendata *opendata)
1079 {
1080         struct nfs4_state *state = opendata->state;
1081         struct nfs_inode *nfsi = NFS_I(state->inode);
1082         struct nfs_delegation *delegation;
1083         int open_mode = opendata->o_arg.open_flags;
1084         fmode_t fmode = opendata->o_arg.fmode;
1085         nfs4_stateid stateid;
1086         int ret = -EAGAIN;
1087
1088         for (;;) {
1089                 if (can_open_cached(state, fmode, open_mode)) {
1090                         spin_lock(&state->owner->so_lock);
1091                         if (can_open_cached(state, fmode, open_mode)) {
1092                                 update_open_stateflags(state, fmode);
1093                                 spin_unlock(&state->owner->so_lock);
1094                                 goto out_return_state;
1095                         }
1096                         spin_unlock(&state->owner->so_lock);
1097                 }
1098                 rcu_read_lock();
1099                 delegation = rcu_dereference(nfsi->delegation);
1100                 if (!can_open_delegated(delegation, fmode)) {
1101                         rcu_read_unlock();
1102                         break;
1103                 }
1104                 /* Save the delegation */
1105                 nfs4_stateid_copy(&stateid, &delegation->stateid);
1106                 rcu_read_unlock();
1107                 nfs_release_seqid(opendata->o_arg.seqid);
1108                 if (!opendata->is_recover) {
1109                         ret = nfs_may_open(state->inode, state->owner->so_cred, open_mode);
1110                         if (ret != 0)
1111                                 goto out;
1112                 }
1113                 ret = -EAGAIN;
1114
1115                 /* Try to update the stateid using the delegation */
1116                 if (update_open_stateid(state, NULL, &stateid, fmode))
1117                         goto out_return_state;
1118         }
1119 out:
1120         return ERR_PTR(ret);
1121 out_return_state:
1122         atomic_inc(&state->count);
1123         return state;
1124 }
1125
1126 static void
1127 nfs4_opendata_check_deleg(struct nfs4_opendata *data, struct nfs4_state *state)
1128 {
1129         struct nfs_client *clp = NFS_SERVER(state->inode)->nfs_client;
1130         struct nfs_delegation *delegation;
1131         int delegation_flags = 0;
1132
1133         rcu_read_lock();
1134         delegation = rcu_dereference(NFS_I(state->inode)->delegation);
1135         if (delegation)
1136                 delegation_flags = delegation->flags;
1137         rcu_read_unlock();
1138         if (data->o_arg.claim == NFS4_OPEN_CLAIM_DELEGATE_CUR) {
1139                 pr_err_ratelimited("NFS: Broken NFSv4 server %s is "
1140                                    "returning a delegation for "
1141                                    "OPEN(CLAIM_DELEGATE_CUR)\n",
1142                                    clp->cl_hostname);
1143         } else if ((delegation_flags & 1UL<<NFS_DELEGATION_NEED_RECLAIM) == 0)
1144                 nfs_inode_set_delegation(state->inode,
1145                                          data->owner->so_cred,
1146                                          &data->o_res);
1147         else
1148                 nfs_inode_reclaim_delegation(state->inode,
1149                                              data->owner->so_cred,
1150                                              &data->o_res);
1151 }
1152
1153 /*
1154  * Check the inode attributes against the CLAIM_PREVIOUS returned attributes
1155  * and update the nfs4_state.
1156  */
1157 static struct nfs4_state *
1158 _nfs4_opendata_reclaim_to_nfs4_state(struct nfs4_opendata *data)
1159 {
1160         struct inode *inode = data->state->inode;
1161         struct nfs4_state *state = data->state;
1162         int ret;
1163
1164         if (!data->rpc_done) {
1165                 ret = data->rpc_status;
1166                 goto err;
1167         }
1168
1169         ret = -ESTALE;
1170         if (!(data->f_attr.valid & NFS_ATTR_FATTR_TYPE) ||
1171             !(data->f_attr.valid & NFS_ATTR_FATTR_FILEID) ||
1172             !(data->f_attr.valid & NFS_ATTR_FATTR_CHANGE))
1173                 goto err;
1174
1175         ret = -ENOMEM;
1176         state = nfs4_get_open_state(inode, data->owner);
1177         if (state == NULL)
1178                 goto err;
1179
1180         ret = nfs_refresh_inode(inode, &data->f_attr);
1181         if (ret)
1182                 goto err;
1183
1184         if (data->o_res.delegation_type != 0)
1185                 nfs4_opendata_check_deleg(data, state);
1186         update_open_stateid(state, &data->o_res.stateid, NULL,
1187                             data->o_arg.fmode);
1188
1189         return state;
1190 err:
1191         return ERR_PTR(ret);
1192
1193 }
1194
1195 static struct nfs4_state *
1196 _nfs4_opendata_to_nfs4_state(struct nfs4_opendata *data)
1197 {
1198         struct inode *inode;
1199         struct nfs4_state *state = NULL;
1200         int ret;
1201
1202         if (!data->rpc_done) {
1203                 state = nfs4_try_open_cached(data);
1204                 goto out;
1205         }
1206
1207         ret = -EAGAIN;
1208         if (!(data->f_attr.valid & NFS_ATTR_FATTR))
1209                 goto err;
1210         inode = nfs_fhget(data->dir->d_sb, &data->o_res.fh, &data->f_attr);
1211         ret = PTR_ERR(inode);
1212         if (IS_ERR(inode))
1213                 goto err;
1214         ret = -ENOMEM;
1215         state = nfs4_get_open_state(inode, data->owner);
1216         if (state == NULL)
1217                 goto err_put_inode;
1218         if (data->o_res.delegation_type != 0)
1219                 nfs4_opendata_check_deleg(data, state);
1220         update_open_stateid(state, &data->o_res.stateid, NULL,
1221                         data->o_arg.fmode);
1222         iput(inode);
1223 out:
1224         nfs_release_seqid(data->o_arg.seqid);
1225         return state;
1226 err_put_inode:
1227         iput(inode);
1228 err:
1229         return ERR_PTR(ret);
1230 }
1231
1232 static struct nfs4_state *
1233 nfs4_opendata_to_nfs4_state(struct nfs4_opendata *data)
1234 {
1235         if (data->o_arg.claim == NFS4_OPEN_CLAIM_PREVIOUS)
1236                 return _nfs4_opendata_reclaim_to_nfs4_state(data);
1237         return _nfs4_opendata_to_nfs4_state(data);
1238 }
1239
1240 static struct nfs_open_context *nfs4_state_find_open_context(struct nfs4_state *state)
1241 {
1242         struct nfs_inode *nfsi = NFS_I(state->inode);
1243         struct nfs_open_context *ctx;
1244
1245         spin_lock(&state->inode->i_lock);
1246         list_for_each_entry(ctx, &nfsi->open_files, list) {
1247                 if (ctx->state != state)
1248                         continue;
1249                 get_nfs_open_context(ctx);
1250                 spin_unlock(&state->inode->i_lock);
1251                 return ctx;
1252         }
1253         spin_unlock(&state->inode->i_lock);
1254         return ERR_PTR(-ENOENT);
1255 }
1256
1257 static struct nfs4_opendata *nfs4_open_recoverdata_alloc(struct nfs_open_context *ctx,
1258                 struct nfs4_state *state, enum open_claim_type4 claim)
1259 {
1260         struct nfs4_opendata *opendata;
1261
1262         opendata = nfs4_opendata_alloc(ctx->dentry, state->owner, 0, 0,
1263                         NULL, claim, GFP_NOFS);
1264         if (opendata == NULL)
1265                 return ERR_PTR(-ENOMEM);
1266         opendata->state = state;
1267         atomic_inc(&state->count);
1268         return opendata;
1269 }
1270
1271 static int nfs4_open_recover_helper(struct nfs4_opendata *opendata, fmode_t fmode, struct nfs4_state **res)
1272 {
1273         struct nfs4_state *newstate;
1274         int ret;
1275
1276         opendata->o_arg.open_flags = 0;
1277         opendata->o_arg.fmode = fmode;
1278         memset(&opendata->o_res, 0, sizeof(opendata->o_res));
1279         memset(&opendata->c_res, 0, sizeof(opendata->c_res));
1280         nfs4_init_opendata_res(opendata);
1281         ret = _nfs4_recover_proc_open(opendata);
1282         if (ret != 0)
1283                 return ret; 
1284         newstate = nfs4_opendata_to_nfs4_state(opendata);
1285         if (IS_ERR(newstate))
1286                 return PTR_ERR(newstate);
1287         nfs4_close_state(newstate, fmode);
1288         *res = newstate;
1289         return 0;
1290 }
1291
1292 static int nfs4_open_recover(struct nfs4_opendata *opendata, struct nfs4_state *state)
1293 {
1294         struct nfs4_state *newstate;
1295         int ret;
1296
1297         /* memory barrier prior to reading state->n_* */
1298         clear_bit(NFS_DELEGATED_STATE, &state->flags);
1299         clear_bit(NFS_OPEN_STATE, &state->flags);
1300         smp_rmb();
1301         if (state->n_rdwr != 0) {
1302                 clear_bit(NFS_O_RDWR_STATE, &state->flags);
1303                 ret = nfs4_open_recover_helper(opendata, FMODE_READ|FMODE_WRITE, &newstate);
1304                 if (ret != 0)
1305                         return ret;
1306                 if (newstate != state)
1307                         return -ESTALE;
1308         }
1309         if (state->n_wronly != 0) {
1310                 clear_bit(NFS_O_WRONLY_STATE, &state->flags);
1311                 ret = nfs4_open_recover_helper(opendata, FMODE_WRITE, &newstate);
1312                 if (ret != 0)
1313                         return ret;
1314                 if (newstate != state)
1315                         return -ESTALE;
1316         }
1317         if (state->n_rdonly != 0) {
1318                 clear_bit(NFS_O_RDONLY_STATE, &state->flags);
1319                 ret = nfs4_open_recover_helper(opendata, FMODE_READ, &newstate);
1320                 if (ret != 0)
1321                         return ret;
1322                 if (newstate != state)
1323                         return -ESTALE;
1324         }
1325         /*
1326          * We may have performed cached opens for all three recoveries.
1327          * Check if we need to update the current stateid.
1328          */
1329         if (test_bit(NFS_DELEGATED_STATE, &state->flags) == 0 &&
1330             !nfs4_stateid_match(&state->stateid, &state->open_stateid)) {
1331                 write_seqlock(&state->seqlock);
1332                 if (test_bit(NFS_DELEGATED_STATE, &state->flags) == 0)
1333                         nfs4_stateid_copy(&state->stateid, &state->open_stateid);
1334                 write_sequnlock(&state->seqlock);
1335         }
1336         return 0;
1337 }
1338
1339 /*
1340  * OPEN_RECLAIM:
1341  *      reclaim state on the server after a reboot.
1342  */
1343 static int _nfs4_do_open_reclaim(struct nfs_open_context *ctx, struct nfs4_state *state)
1344 {
1345         struct nfs_delegation *delegation;
1346         struct nfs4_opendata *opendata;
1347         fmode_t delegation_type = 0;
1348         int status;
1349
1350         opendata = nfs4_open_recoverdata_alloc(ctx, state,
1351                         NFS4_OPEN_CLAIM_PREVIOUS);
1352         if (IS_ERR(opendata))
1353                 return PTR_ERR(opendata);
1354         rcu_read_lock();
1355         delegation = rcu_dereference(NFS_I(state->inode)->delegation);
1356         if (delegation != NULL && test_bit(NFS_DELEGATION_NEED_RECLAIM, &delegation->flags) != 0)
1357                 delegation_type = delegation->type;
1358         rcu_read_unlock();
1359         opendata->o_arg.u.delegation_type = delegation_type;
1360         status = nfs4_open_recover(opendata, state);
1361         nfs4_opendata_put(opendata);
1362         return status;
1363 }
1364
1365 static int nfs4_do_open_reclaim(struct nfs_open_context *ctx, struct nfs4_state *state)
1366 {
1367         struct nfs_server *server = NFS_SERVER(state->inode);
1368         struct nfs4_exception exception = { };
1369         int err;
1370         do {
1371                 err = _nfs4_do_open_reclaim(ctx, state);
1372                 if (nfs4_clear_cap_atomic_open_v1(server, err, &exception))
1373                         continue;
1374                 if (err != -NFS4ERR_DELAY)
1375                         break;
1376                 nfs4_handle_exception(server, err, &exception);
1377         } while (exception.retry);
1378         return err;
1379 }
1380
1381 static int nfs4_open_reclaim(struct nfs4_state_owner *sp, struct nfs4_state *state)
1382 {
1383         struct nfs_open_context *ctx;
1384         int ret;
1385
1386         ctx = nfs4_state_find_open_context(state);
1387         if (IS_ERR(ctx))
1388                 return -EAGAIN;
1389         ret = nfs4_do_open_reclaim(ctx, state);
1390         put_nfs_open_context(ctx);
1391         return ret;
1392 }
1393
1394 static int nfs4_handle_delegation_recall_error(struct nfs_server *server, struct nfs4_state *state, const nfs4_stateid *stateid, int err)
1395 {
1396         switch (err) {
1397                 default:
1398                         printk(KERN_ERR "NFS: %s: unhandled error "
1399                                         "%d.\n", __func__, err);
1400                 case 0:
1401                 case -ENOENT:
1402                 case -ESTALE:
1403                         break;
1404                 case -NFS4ERR_BADSESSION:
1405                 case -NFS4ERR_BADSLOT:
1406                 case -NFS4ERR_BAD_HIGH_SLOT:
1407                 case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION:
1408                 case -NFS4ERR_DEADSESSION:
1409                         set_bit(NFS_DELEGATED_STATE, &state->flags);
1410                         nfs4_schedule_session_recovery(server->nfs_client->cl_session, err);
1411                         return -EAGAIN;
1412                 case -NFS4ERR_STALE_CLIENTID:
1413                 case -NFS4ERR_STALE_STATEID:
1414                         set_bit(NFS_DELEGATED_STATE, &state->flags);
1415                 case -NFS4ERR_EXPIRED:
1416                         /* Don't recall a delegation if it was lost */
1417                         nfs4_schedule_lease_recovery(server->nfs_client);
1418                         return -EAGAIN;
1419                 case -NFS4ERR_DELEG_REVOKED:
1420                 case -NFS4ERR_ADMIN_REVOKED:
1421                 case -NFS4ERR_BAD_STATEID:
1422                 case -NFS4ERR_OPENMODE:
1423                         nfs_inode_find_state_and_recover(state->inode,
1424                                         stateid);
1425                         nfs4_schedule_stateid_recovery(server, state);
1426                         return 0;
1427                 case -NFS4ERR_DELAY:
1428                 case -NFS4ERR_GRACE:
1429                         set_bit(NFS_DELEGATED_STATE, &state->flags);
1430                         ssleep(1);
1431                         return -EAGAIN;
1432                 case -ENOMEM:
1433                 case -NFS4ERR_DENIED:
1434                         /* kill_proc(fl->fl_pid, SIGLOST, 1); */
1435                         return 0;
1436         }
1437         return err;
1438 }
1439
1440 int nfs4_open_delegation_recall(struct nfs_open_context *ctx, struct nfs4_state *state, const nfs4_stateid *stateid)
1441 {
1442         struct nfs_server *server = NFS_SERVER(state->inode);
1443         struct nfs4_opendata *opendata;
1444         int err;
1445
1446         opendata = nfs4_open_recoverdata_alloc(ctx, state,
1447                         NFS4_OPEN_CLAIM_DELEG_CUR_FH);
1448         if (IS_ERR(opendata))
1449                 return PTR_ERR(opendata);
1450         nfs4_stateid_copy(&opendata->o_arg.u.delegation, stateid);
1451         err = nfs4_open_recover(opendata, state);
1452         nfs4_opendata_put(opendata);
1453         return nfs4_handle_delegation_recall_error(server, state, stateid, err);
1454 }
1455
1456 static void nfs4_open_confirm_done(struct rpc_task *task, void *calldata)
1457 {
1458         struct nfs4_opendata *data = calldata;
1459
1460         data->rpc_status = task->tk_status;
1461         if (data->rpc_status == 0) {
1462                 nfs4_stateid_copy(&data->o_res.stateid, &data->c_res.stateid);
1463                 nfs_confirm_seqid(&data->owner->so_seqid, 0);
1464                 renew_lease(data->o_res.server, data->timestamp);
1465                 data->rpc_done = 1;
1466         }
1467 }
1468
1469 static void nfs4_open_confirm_release(void *calldata)
1470 {
1471         struct nfs4_opendata *data = calldata;
1472         struct nfs4_state *state = NULL;
1473
1474         /* If this request hasn't been cancelled, do nothing */
1475         if (data->cancelled == 0)
1476                 goto out_free;
1477         /* In case of error, no cleanup! */
1478         if (!data->rpc_done)
1479                 goto out_free;
1480         state = nfs4_opendata_to_nfs4_state(data);
1481         if (!IS_ERR(state))
1482                 nfs4_close_state(state, data->o_arg.fmode);
1483 out_free:
1484         nfs4_opendata_put(data);
1485 }
1486
1487 static const struct rpc_call_ops nfs4_open_confirm_ops = {
1488         .rpc_call_done = nfs4_open_confirm_done,
1489         .rpc_release = nfs4_open_confirm_release,
1490 };
1491
1492 /*
1493  * Note: On error, nfs4_proc_open_confirm will free the struct nfs4_opendata
1494  */
1495 static int _nfs4_proc_open_confirm(struct nfs4_opendata *data)
1496 {
1497         struct nfs_server *server = NFS_SERVER(data->dir->d_inode);
1498         struct rpc_task *task;
1499         struct  rpc_message msg = {
1500                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_OPEN_CONFIRM],
1501                 .rpc_argp = &data->c_arg,
1502                 .rpc_resp = &data->c_res,
1503                 .rpc_cred = data->owner->so_cred,
1504         };
1505         struct rpc_task_setup task_setup_data = {
1506                 .rpc_client = server->client,
1507                 .rpc_message = &msg,
1508                 .callback_ops = &nfs4_open_confirm_ops,
1509                 .callback_data = data,
1510                 .workqueue = nfsiod_workqueue,
1511                 .flags = RPC_TASK_ASYNC,
1512         };
1513         int status;
1514
1515         kref_get(&data->kref);
1516         data->rpc_done = 0;
1517         data->rpc_status = 0;
1518         data->timestamp = jiffies;
1519         task = rpc_run_task(&task_setup_data);
1520         if (IS_ERR(task))
1521                 return PTR_ERR(task);
1522         status = nfs4_wait_for_completion_rpc_task(task);
1523         if (status != 0) {
1524                 data->cancelled = 1;
1525                 smp_wmb();
1526         } else
1527                 status = data->rpc_status;
1528         rpc_put_task(task);
1529         return status;
1530 }
1531
1532 static void nfs4_open_prepare(struct rpc_task *task, void *calldata)
1533 {
1534         struct nfs4_opendata *data = calldata;
1535         struct nfs4_state_owner *sp = data->owner;
1536         struct nfs_client *clp = sp->so_server->nfs_client;
1537
1538         if (nfs_wait_on_sequence(data->o_arg.seqid, task) != 0)
1539                 goto out_wait;
1540         /*
1541          * Check if we still need to send an OPEN call, or if we can use
1542          * a delegation instead.
1543          */
1544         if (data->state != NULL) {
1545                 struct nfs_delegation *delegation;
1546
1547                 if (can_open_cached(data->state, data->o_arg.fmode, data->o_arg.open_flags))
1548                         goto out_no_action;
1549                 rcu_read_lock();
1550                 delegation = rcu_dereference(NFS_I(data->state->inode)->delegation);
1551                 if (data->o_arg.claim != NFS4_OPEN_CLAIM_DELEGATE_CUR &&
1552                     data->o_arg.claim != NFS4_OPEN_CLAIM_DELEG_CUR_FH &&
1553                     can_open_delegated(delegation, data->o_arg.fmode))
1554                         goto unlock_no_action;
1555                 rcu_read_unlock();
1556         }
1557         /* Update client id. */
1558         data->o_arg.clientid = clp->cl_clientid;
1559         switch (data->o_arg.claim) {
1560         case NFS4_OPEN_CLAIM_PREVIOUS:
1561         case NFS4_OPEN_CLAIM_DELEG_CUR_FH:
1562         case NFS4_OPEN_CLAIM_DELEG_PREV_FH:
1563                 data->o_arg.open_bitmap = &nfs4_open_noattr_bitmap[0];
1564         case NFS4_OPEN_CLAIM_FH:
1565                 task->tk_msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_OPEN_NOATTR];
1566                 nfs_copy_fh(&data->o_res.fh, data->o_arg.fh);
1567         }
1568         data->timestamp = jiffies;
1569         if (nfs4_setup_sequence(data->o_arg.server,
1570                                 &data->o_arg.seq_args,
1571                                 &data->o_res.seq_res,
1572                                 task) != 0)
1573                 nfs_release_seqid(data->o_arg.seqid);
1574
1575         /* Set the create mode (note dependency on the session type) */
1576         data->o_arg.createmode = NFS4_CREATE_UNCHECKED;
1577         if (data->o_arg.open_flags & O_EXCL) {
1578                 data->o_arg.createmode = NFS4_CREATE_EXCLUSIVE;
1579                 if (nfs4_has_persistent_session(clp))
1580                         data->o_arg.createmode = NFS4_CREATE_GUARDED;
1581                 else if (clp->cl_mvops->minor_version > 0)
1582                         data->o_arg.createmode = NFS4_CREATE_EXCLUSIVE4_1;
1583         }
1584         return;
1585 unlock_no_action:
1586         rcu_read_unlock();
1587 out_no_action:
1588         task->tk_action = NULL;
1589 out_wait:
1590         nfs4_sequence_done(task, &data->o_res.seq_res);
1591 }
1592
1593 static void nfs4_open_done(struct rpc_task *task, void *calldata)
1594 {
1595         struct nfs4_opendata *data = calldata;
1596
1597         data->rpc_status = task->tk_status;
1598
1599         if (!nfs4_sequence_done(task, &data->o_res.seq_res))
1600                 return;
1601
1602         if (task->tk_status == 0) {
1603                 if (data->o_res.f_attr->valid & NFS_ATTR_FATTR_TYPE) {
1604                         switch (data->o_res.f_attr->mode & S_IFMT) {
1605                         case S_IFREG:
1606                                 break;
1607                         case S_IFLNK:
1608                                 data->rpc_status = -ELOOP;
1609                                 break;
1610                         case S_IFDIR:
1611                                 data->rpc_status = -EISDIR;
1612                                 break;
1613                         default:
1614                                 data->rpc_status = -ENOTDIR;
1615                         }
1616                 }
1617                 renew_lease(data->o_res.server, data->timestamp);
1618                 if (!(data->o_res.rflags & NFS4_OPEN_RESULT_CONFIRM))
1619                         nfs_confirm_seqid(&data->owner->so_seqid, 0);
1620         }
1621         data->rpc_done = 1;
1622 }
1623
1624 static void nfs4_open_release(void *calldata)
1625 {
1626         struct nfs4_opendata *data = calldata;
1627         struct nfs4_state *state = NULL;
1628
1629         /* If this request hasn't been cancelled, do nothing */
1630         if (data->cancelled == 0)
1631                 goto out_free;
1632         /* In case of error, no cleanup! */
1633         if (data->rpc_status != 0 || !data->rpc_done)
1634                 goto out_free;
1635         /* In case we need an open_confirm, no cleanup! */
1636         if (data->o_res.rflags & NFS4_OPEN_RESULT_CONFIRM)
1637                 goto out_free;
1638         state = nfs4_opendata_to_nfs4_state(data);
1639         if (!IS_ERR(state))
1640                 nfs4_close_state(state, data->o_arg.fmode);
1641 out_free:
1642         nfs4_opendata_put(data);
1643 }
1644
1645 static const struct rpc_call_ops nfs4_open_ops = {
1646         .rpc_call_prepare = nfs4_open_prepare,
1647         .rpc_call_done = nfs4_open_done,
1648         .rpc_release = nfs4_open_release,
1649 };
1650
1651 static int nfs4_run_open_task(struct nfs4_opendata *data, int isrecover)
1652 {
1653         struct inode *dir = data->dir->d_inode;
1654         struct nfs_server *server = NFS_SERVER(dir);
1655         struct nfs_openargs *o_arg = &data->o_arg;
1656         struct nfs_openres *o_res = &data->o_res;
1657         struct rpc_task *task;
1658         struct rpc_message msg = {
1659                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_OPEN],
1660                 .rpc_argp = o_arg,
1661                 .rpc_resp = o_res,
1662                 .rpc_cred = data->owner->so_cred,
1663         };
1664         struct rpc_task_setup task_setup_data = {
1665                 .rpc_client = server->client,
1666                 .rpc_message = &msg,
1667                 .callback_ops = &nfs4_open_ops,
1668                 .callback_data = data,
1669                 .workqueue = nfsiod_workqueue,
1670                 .flags = RPC_TASK_ASYNC,
1671         };
1672         int status;
1673
1674         nfs41_init_sequence(&o_arg->seq_args, &o_res->seq_res, 1);
1675         kref_get(&data->kref);
1676         data->rpc_done = 0;
1677         data->rpc_status = 0;
1678         data->cancelled = 0;
1679         data->is_recover = 0;
1680         if (isrecover) {
1681                 nfs4_set_sequence_privileged(&o_arg->seq_args);
1682                 data->is_recover = 1;
1683         }
1684         task = rpc_run_task(&task_setup_data);
1685         if (IS_ERR(task))
1686                 return PTR_ERR(task);
1687         status = nfs4_wait_for_completion_rpc_task(task);
1688         if (status != 0) {
1689                 data->cancelled = 1;
1690                 smp_wmb();
1691         } else
1692                 status = data->rpc_status;
1693         rpc_put_task(task);
1694
1695         return status;
1696 }
1697
1698 static int _nfs4_recover_proc_open(struct nfs4_opendata *data)
1699 {
1700         struct inode *dir = data->dir->d_inode;
1701         struct nfs_openres *o_res = &data->o_res;
1702         int status;
1703
1704         status = nfs4_run_open_task(data, 1);
1705         if (status != 0 || !data->rpc_done)
1706                 return status;
1707
1708         nfs_fattr_map_and_free_names(NFS_SERVER(dir), &data->f_attr);
1709
1710         if (o_res->rflags & NFS4_OPEN_RESULT_CONFIRM) {
1711                 status = _nfs4_proc_open_confirm(data);
1712                 if (status != 0)
1713                         return status;
1714         }
1715
1716         return status;
1717 }
1718
1719 static int nfs4_opendata_access(struct rpc_cred *cred,
1720                                 struct nfs4_opendata *opendata,
1721                                 struct nfs4_state *state, fmode_t fmode,
1722                                 int openflags)
1723 {
1724         struct nfs_access_entry cache;
1725         u32 mask;
1726
1727         /* access call failed or for some reason the server doesn't
1728          * support any access modes -- defer access call until later */
1729         if (opendata->o_res.access_supported == 0)
1730                 return 0;
1731
1732         mask = 0;
1733         /* don't check MAY_WRITE - a newly created file may not have
1734          * write mode bits, but POSIX allows the creating process to write.
1735          * use openflags to check for exec, because fmode won't
1736          * always have FMODE_EXEC set when file open for exec. */
1737         if (openflags & __FMODE_EXEC) {
1738                 /* ONLY check for exec rights */
1739                 mask = MAY_EXEC;
1740         } else if (fmode & FMODE_READ)
1741                 mask = MAY_READ;
1742
1743         cache.cred = cred;
1744         cache.jiffies = jiffies;
1745         nfs_access_set_mask(&cache, opendata->o_res.access_result);
1746         nfs_access_add_cache(state->inode, &cache);
1747
1748         if ((mask & ~cache.mask & (MAY_READ | MAY_EXEC)) == 0)
1749                 return 0;
1750
1751         /* even though OPEN succeeded, access is denied. Close the file */
1752         nfs4_close_state(state, fmode);
1753         return -EACCES;
1754 }
1755
1756 /*
1757  * Note: On error, nfs4_proc_open will free the struct nfs4_opendata
1758  */
1759 static int _nfs4_proc_open(struct nfs4_opendata *data)
1760 {
1761         struct inode *dir = data->dir->d_inode;
1762         struct nfs_server *server = NFS_SERVER(dir);
1763         struct nfs_openargs *o_arg = &data->o_arg;
1764         struct nfs_openres *o_res = &data->o_res;
1765         int status;
1766
1767         status = nfs4_run_open_task(data, 0);
1768         if (!data->rpc_done)
1769                 return status;
1770         if (status != 0) {
1771                 if (status == -NFS4ERR_BADNAME &&
1772                                 !(o_arg->open_flags & O_CREAT))
1773                         return -ENOENT;
1774                 return status;
1775         }
1776
1777         nfs_fattr_map_and_free_names(server, &data->f_attr);
1778
1779         if (o_arg->open_flags & O_CREAT)
1780                 update_changeattr(dir, &o_res->cinfo);
1781         if ((o_res->rflags & NFS4_OPEN_RESULT_LOCKTYPE_POSIX) == 0)
1782                 server->caps &= ~NFS_CAP_POSIX_LOCK;
1783         if(o_res->rflags & NFS4_OPEN_RESULT_CONFIRM) {
1784                 status = _nfs4_proc_open_confirm(data);
1785                 if (status != 0)
1786                         return status;
1787         }
1788         if (!(o_res->f_attr->valid & NFS_ATTR_FATTR))
1789                 _nfs4_proc_getattr(server, &o_res->fh, o_res->f_attr);
1790         return 0;
1791 }
1792
1793 static int nfs4_recover_expired_lease(struct nfs_server *server)
1794 {
1795         return nfs4_client_recover_expired_lease(server->nfs_client);
1796 }
1797
1798 /*
1799  * OPEN_EXPIRED:
1800  *      reclaim state on the server after a network partition.
1801  *      Assumes caller holds the appropriate lock
1802  */
1803 static int _nfs4_open_expired(struct nfs_open_context *ctx, struct nfs4_state *state)
1804 {
1805         struct nfs4_opendata *opendata;
1806         int ret;
1807
1808         opendata = nfs4_open_recoverdata_alloc(ctx, state,
1809                         NFS4_OPEN_CLAIM_FH);
1810         if (IS_ERR(opendata))
1811                 return PTR_ERR(opendata);
1812         ret = nfs4_open_recover(opendata, state);
1813         if (ret == -ESTALE)
1814                 d_drop(ctx->dentry);
1815         nfs4_opendata_put(opendata);
1816         return ret;
1817 }
1818
1819 static int nfs4_do_open_expired(struct nfs_open_context *ctx, struct nfs4_state *state)
1820 {
1821         struct nfs_server *server = NFS_SERVER(state->inode);
1822         struct nfs4_exception exception = { };
1823         int err;
1824
1825         do {
1826                 err = _nfs4_open_expired(ctx, state);
1827                 if (nfs4_clear_cap_atomic_open_v1(server, err, &exception))
1828                         continue;
1829                 switch (err) {
1830                 default:
1831                         goto out;
1832                 case -NFS4ERR_GRACE:
1833                 case -NFS4ERR_DELAY:
1834                         nfs4_handle_exception(server, err, &exception);
1835                         err = 0;
1836                 }
1837         } while (exception.retry);
1838 out:
1839         return err;
1840 }
1841
1842 static int nfs4_open_expired(struct nfs4_state_owner *sp, struct nfs4_state *state)
1843 {
1844         struct nfs_open_context *ctx;
1845         int ret;
1846
1847         ctx = nfs4_state_find_open_context(state);
1848         if (IS_ERR(ctx))
1849                 return -EAGAIN;
1850         ret = nfs4_do_open_expired(ctx, state);
1851         put_nfs_open_context(ctx);
1852         return ret;
1853 }
1854
1855 #if defined(CONFIG_NFS_V4_1)
1856 static void nfs41_clear_delegation_stateid(struct nfs4_state *state)
1857 {
1858         struct nfs_server *server = NFS_SERVER(state->inode);
1859         nfs4_stateid *stateid = &state->stateid;
1860         struct nfs_delegation *delegation;
1861         struct rpc_cred *cred = NULL;
1862         int status = -NFS4ERR_BAD_STATEID;
1863
1864         /* If a state reset has been done, test_stateid is unneeded */
1865         if (test_bit(NFS_DELEGATED_STATE, &state->flags) == 0)
1866                 return;
1867
1868         /* Get the delegation credential for use by test/free_stateid */
1869         rcu_read_lock();
1870         delegation = rcu_dereference(NFS_I(state->inode)->delegation);
1871         if (delegation != NULL &&
1872             nfs4_stateid_match(&delegation->stateid, stateid)) {
1873                 cred = get_rpccred(delegation->cred);
1874                 rcu_read_unlock();
1875                 status = nfs41_test_stateid(server, stateid, cred);
1876         } else
1877                 rcu_read_unlock();
1878
1879         if (status != NFS_OK) {
1880                 /* Free the stateid unless the server explicitly
1881                  * informs us the stateid is unrecognized. */
1882                 if (status != -NFS4ERR_BAD_STATEID)
1883                         nfs41_free_stateid(server, stateid, cred);
1884                 nfs_remove_bad_delegation(state->inode);
1885
1886                 write_seqlock(&state->seqlock);
1887                 nfs4_stateid_copy(&state->stateid, &state->open_stateid);
1888                 write_sequnlock(&state->seqlock);
1889                 clear_bit(NFS_DELEGATED_STATE, &state->flags);
1890         }
1891
1892         if (cred != NULL)
1893                 put_rpccred(cred);
1894 }
1895
1896 /**
1897  * nfs41_check_open_stateid - possibly free an open stateid
1898  *
1899  * @state: NFSv4 state for an inode
1900  *
1901  * Returns NFS_OK if recovery for this stateid is now finished.
1902  * Otherwise a negative NFS4ERR value is returned.
1903  */
1904 static int nfs41_check_open_stateid(struct nfs4_state *state)
1905 {
1906         struct nfs_server *server = NFS_SERVER(state->inode);
1907         nfs4_stateid *stateid = &state->open_stateid;
1908         struct rpc_cred *cred = state->owner->so_cred;
1909         int status;
1910
1911         /* If a state reset has been done, test_stateid is unneeded */
1912         if ((test_bit(NFS_O_RDONLY_STATE, &state->flags) == 0) &&
1913             (test_bit(NFS_O_WRONLY_STATE, &state->flags) == 0) &&
1914             (test_bit(NFS_O_RDWR_STATE, &state->flags) == 0))
1915                 return -NFS4ERR_BAD_STATEID;
1916
1917         status = nfs41_test_stateid(server, stateid, cred);
1918         if (status != NFS_OK) {
1919                 /* Free the stateid unless the server explicitly
1920                  * informs us the stateid is unrecognized. */
1921                 if (status != -NFS4ERR_BAD_STATEID)
1922                         nfs41_free_stateid(server, stateid, cred);
1923
1924                 clear_bit(NFS_O_RDONLY_STATE, &state->flags);
1925                 clear_bit(NFS_O_WRONLY_STATE, &state->flags);
1926                 clear_bit(NFS_O_RDWR_STATE, &state->flags);
1927                 clear_bit(NFS_OPEN_STATE, &state->flags);
1928         }
1929         return status;
1930 }
1931
1932 static int nfs41_open_expired(struct nfs4_state_owner *sp, struct nfs4_state *state)
1933 {
1934         int status;
1935
1936         nfs41_clear_delegation_stateid(state);
1937         status = nfs41_check_open_stateid(state);
1938         if (status != NFS_OK)
1939                 status = nfs4_open_expired(sp, state);
1940         return status;
1941 }
1942 #endif
1943
1944 /*
1945  * on an EXCLUSIVE create, the server should send back a bitmask with FATTR4-*
1946  * fields corresponding to attributes that were used to store the verifier.
1947  * Make sure we clobber those fields in the later setattr call
1948  */
1949 static inline void nfs4_exclusive_attrset(struct nfs4_opendata *opendata, struct iattr *sattr)
1950 {
1951         if ((opendata->o_res.attrset[1] & FATTR4_WORD1_TIME_ACCESS) &&
1952             !(sattr->ia_valid & ATTR_ATIME_SET))
1953                 sattr->ia_valid |= ATTR_ATIME;
1954
1955         if ((opendata->o_res.attrset[1] & FATTR4_WORD1_TIME_MODIFY) &&
1956             !(sattr->ia_valid & ATTR_MTIME_SET))
1957                 sattr->ia_valid |= ATTR_MTIME;
1958 }
1959
1960 static int _nfs4_open_and_get_state(struct nfs4_opendata *opendata,
1961                 fmode_t fmode,
1962                 int flags,
1963                 struct nfs4_state **res)
1964 {
1965         struct nfs4_state_owner *sp = opendata->owner;
1966         struct nfs_server *server = sp->so_server;
1967         struct nfs4_state *state;
1968         unsigned int seq;
1969         int ret;
1970
1971         seq = raw_seqcount_begin(&sp->so_reclaim_seqcount);
1972
1973         ret = _nfs4_proc_open(opendata);
1974         if (ret != 0)
1975                 goto out;
1976
1977         state = nfs4_opendata_to_nfs4_state(opendata);
1978         ret = PTR_ERR(state);
1979         if (IS_ERR(state))
1980                 goto out;
1981         if (server->caps & NFS_CAP_POSIX_LOCK)
1982                 set_bit(NFS_STATE_POSIX_LOCKS, &state->flags);
1983
1984         ret = nfs4_opendata_access(sp->so_cred, opendata, state, fmode, flags);
1985         if (ret != 0)
1986                 goto out;
1987
1988         if (read_seqcount_retry(&sp->so_reclaim_seqcount, seq))
1989                 nfs4_schedule_stateid_recovery(server, state);
1990         *res = state;
1991 out:
1992         return ret;
1993 }
1994
1995 /*
1996  * Returns a referenced nfs4_state
1997  */
1998 static int _nfs4_do_open(struct inode *dir,
1999                         struct dentry *dentry,
2000                         fmode_t fmode,
2001                         int flags,
2002                         struct iattr *sattr,
2003                         struct rpc_cred *cred,
2004                         struct nfs4_state **res,
2005                         struct nfs4_threshold **ctx_th)
2006 {
2007         struct nfs4_state_owner  *sp;
2008         struct nfs4_state     *state = NULL;
2009         struct nfs_server       *server = NFS_SERVER(dir);
2010         struct nfs4_opendata *opendata;
2011         enum open_claim_type4 claim = NFS4_OPEN_CLAIM_NULL;
2012         int status;
2013
2014         /* Protect against reboot recovery conflicts */
2015         status = -ENOMEM;
2016         sp = nfs4_get_state_owner(server, cred, GFP_KERNEL);
2017         if (sp == NULL) {
2018                 dprintk("nfs4_do_open: nfs4_get_state_owner failed!\n");
2019                 goto out_err;
2020         }
2021         status = nfs4_recover_expired_lease(server);
2022         if (status != 0)
2023                 goto err_put_state_owner;
2024         if (dentry->d_inode != NULL)
2025                 nfs4_return_incompatible_delegation(dentry->d_inode, fmode);
2026         status = -ENOMEM;
2027         if (dentry->d_inode)
2028                 claim = NFS4_OPEN_CLAIM_FH;
2029         opendata = nfs4_opendata_alloc(dentry, sp, fmode, flags, sattr,
2030                         claim, GFP_KERNEL);
2031         if (opendata == NULL)
2032                 goto err_put_state_owner;
2033
2034         if (ctx_th && server->attr_bitmask[2] & FATTR4_WORD2_MDSTHRESHOLD) {
2035                 opendata->f_attr.mdsthreshold = pnfs_mdsthreshold_alloc();
2036                 if (!opendata->f_attr.mdsthreshold)
2037                         goto err_opendata_put;
2038                 opendata->o_arg.open_bitmap = &nfs4_pnfs_open_bitmap[0];
2039         }
2040         if (dentry->d_inode != NULL)
2041                 opendata->state = nfs4_get_open_state(dentry->d_inode, sp);
2042
2043         status = _nfs4_open_and_get_state(opendata, fmode, flags, &state);
2044         if (status != 0)
2045                 goto err_opendata_put;
2046
2047         if ((opendata->o_arg.open_flags & O_EXCL) &&
2048             (opendata->o_arg.createmode != NFS4_CREATE_GUARDED)) {
2049                 nfs4_exclusive_attrset(opendata, sattr);
2050
2051                 nfs_fattr_init(opendata->o_res.f_attr);
2052                 status = nfs4_do_setattr(state->inode, cred,
2053                                 opendata->o_res.f_attr, sattr,
2054                                 state);
2055                 if (status == 0)
2056                         nfs_setattr_update_inode(state->inode, sattr);
2057                 nfs_post_op_update_inode(state->inode, opendata->o_res.f_attr);
2058         }
2059
2060         if (pnfs_use_threshold(ctx_th, opendata->f_attr.mdsthreshold, server))
2061                 *ctx_th = opendata->f_attr.mdsthreshold;
2062         else
2063                 kfree(opendata->f_attr.mdsthreshold);
2064         opendata->f_attr.mdsthreshold = NULL;
2065
2066         nfs4_opendata_put(opendata);
2067         nfs4_put_state_owner(sp);
2068         *res = state;
2069         return 0;
2070 err_opendata_put:
2071         kfree(opendata->f_attr.mdsthreshold);
2072         nfs4_opendata_put(opendata);
2073 err_put_state_owner:
2074         nfs4_put_state_owner(sp);
2075 out_err:
2076         *res = NULL;
2077         return status;
2078 }
2079
2080
2081 static struct nfs4_state *nfs4_do_open(struct inode *dir,
2082                                         struct dentry *dentry,
2083                                         fmode_t fmode,
2084                                         int flags,
2085                                         struct iattr *sattr,
2086                                         struct rpc_cred *cred,
2087                                         struct nfs4_threshold **ctx_th)
2088 {
2089         struct nfs_server *server = NFS_SERVER(dir);
2090         struct nfs4_exception exception = { };
2091         struct nfs4_state *res;
2092         int status;
2093
2094         fmode &= FMODE_READ|FMODE_WRITE|FMODE_EXEC;
2095         do {
2096                 status = _nfs4_do_open(dir, dentry, fmode, flags, sattr, cred,
2097                                        &res, ctx_th);
2098                 if (status == 0)
2099                         break;
2100                 /* NOTE: BAD_SEQID means the server and client disagree about the
2101                  * book-keeping w.r.t. state-changing operations
2102                  * (OPEN/CLOSE/LOCK/LOCKU...)
2103                  * It is actually a sign of a bug on the client or on the server.
2104                  *
2105                  * If we receive a BAD_SEQID error in the particular case of
2106                  * doing an OPEN, we assume that nfs_increment_open_seqid() will
2107                  * have unhashed the old state_owner for us, and that we can
2108                  * therefore safely retry using a new one. We should still warn
2109                  * the user though...
2110                  */
2111                 if (status == -NFS4ERR_BAD_SEQID) {
2112                         pr_warn_ratelimited("NFS: v4 server %s "
2113                                         " returned a bad sequence-id error!\n",
2114                                         NFS_SERVER(dir)->nfs_client->cl_hostname);
2115                         exception.retry = 1;
2116                         continue;
2117                 }
2118                 /*
2119                  * BAD_STATEID on OPEN means that the server cancelled our
2120                  * state before it received the OPEN_CONFIRM.
2121                  * Recover by retrying the request as per the discussion
2122                  * on Page 181 of RFC3530.
2123                  */
2124                 if (status == -NFS4ERR_BAD_STATEID) {
2125                         exception.retry = 1;
2126                         continue;
2127                 }
2128                 if (status == -EAGAIN) {
2129                         /* We must have found a delegation */
2130                         exception.retry = 1;
2131                         continue;
2132                 }
2133                 if (nfs4_clear_cap_atomic_open_v1(server, status, &exception))
2134                         continue;
2135                 res = ERR_PTR(nfs4_handle_exception(server,
2136                                         status, &exception));
2137         } while (exception.retry);
2138         return res;
2139 }
2140
2141 static int _nfs4_do_setattr(struct inode *inode, struct rpc_cred *cred,
2142                             struct nfs_fattr *fattr, struct iattr *sattr,
2143                             struct nfs4_state *state)
2144 {
2145         struct nfs_server *server = NFS_SERVER(inode);
2146         struct nfs_setattrargs  arg = {
2147                 .fh             = NFS_FH(inode),
2148                 .iap            = sattr,
2149                 .server         = server,
2150                 .bitmask = server->attr_bitmask,
2151         };
2152         struct nfs_setattrres  res = {
2153                 .fattr          = fattr,
2154                 .server         = server,
2155         };
2156         struct rpc_message msg = {
2157                 .rpc_proc       = &nfs4_procedures[NFSPROC4_CLNT_SETATTR],
2158                 .rpc_argp       = &arg,
2159                 .rpc_resp       = &res,
2160                 .rpc_cred       = cred,
2161         };
2162         unsigned long timestamp = jiffies;
2163         fmode_t fmode;
2164         bool truncate;
2165         int status;
2166
2167         nfs_fattr_init(fattr);
2168
2169         /* Servers should only apply open mode checks for file size changes */
2170         truncate = (sattr->ia_valid & ATTR_SIZE) ? true : false;
2171         fmode = truncate ? FMODE_WRITE : FMODE_READ;
2172
2173         if (nfs4_copy_delegation_stateid(&arg.stateid, inode, fmode)) {
2174                 /* Use that stateid */
2175         } else if (truncate && state != NULL && nfs4_valid_open_stateid(state)) {
2176                 struct nfs_lockowner lockowner = {
2177                         .l_owner = current->files,
2178                         .l_pid = current->tgid,
2179                 };
2180                 nfs4_select_rw_stateid(&arg.stateid, state, FMODE_WRITE,
2181                                 &lockowner);
2182         } else
2183                 nfs4_stateid_copy(&arg.stateid, &zero_stateid);
2184
2185         status = nfs4_call_sync(server->client, server, &msg, &arg.seq_args, &res.seq_res, 1);
2186         if (status == 0 && state != NULL)
2187                 renew_lease(server, timestamp);
2188         return status;
2189 }
2190
2191 static int nfs4_do_setattr(struct inode *inode, struct rpc_cred *cred,
2192                            struct nfs_fattr *fattr, struct iattr *sattr,
2193                            struct nfs4_state *state)
2194 {
2195         struct nfs_server *server = NFS_SERVER(inode);
2196         struct nfs4_exception exception = {
2197                 .state = state,
2198                 .inode = inode,
2199         };
2200         int err;
2201         do {
2202                 err = _nfs4_do_setattr(inode, cred, fattr, sattr, state);
2203                 switch (err) {
2204                 case -NFS4ERR_OPENMODE:
2205                         if (!(sattr->ia_valid & ATTR_SIZE)) {
2206                                 pr_warn_once("NFSv4: server %s is incorrectly "
2207                                                 "applying open mode checks to "
2208                                                 "a SETATTR that is not "
2209                                                 "changing file size.\n",
2210                                                 server->nfs_client->cl_hostname);
2211                         }
2212                         if (state && !(state->state & FMODE_WRITE)) {
2213                                 err = -EBADF;
2214                                 if (sattr->ia_valid & ATTR_OPEN)
2215                                         err = -EACCES;
2216                                 goto out;
2217                         }
2218                 }
2219                 err = nfs4_handle_exception(server, err, &exception);
2220         } while (exception.retry);
2221 out:
2222         return err;
2223 }
2224
2225 struct nfs4_closedata {
2226         struct inode *inode;
2227         struct nfs4_state *state;
2228         struct nfs_closeargs arg;
2229         struct nfs_closeres res;
2230         struct nfs_fattr fattr;
2231         unsigned long timestamp;
2232         bool roc;
2233         u32 roc_barrier;
2234 };
2235
2236 static void nfs4_free_closedata(void *data)
2237 {
2238         struct nfs4_closedata *calldata = data;
2239         struct nfs4_state_owner *sp = calldata->state->owner;
2240         struct super_block *sb = calldata->state->inode->i_sb;
2241
2242         if (calldata->roc)
2243                 pnfs_roc_release(calldata->state->inode);
2244         nfs4_put_open_state(calldata->state);
2245         nfs_free_seqid(calldata->arg.seqid);
2246         nfs4_put_state_owner(sp);
2247         nfs_sb_deactive(sb);
2248         kfree(calldata);
2249 }
2250
2251 static void nfs4_close_clear_stateid_flags(struct nfs4_state *state,
2252                 fmode_t fmode)
2253 {
2254         spin_lock(&state->owner->so_lock);
2255         clear_bit(NFS_O_RDWR_STATE, &state->flags);
2256         switch (fmode & (FMODE_READ|FMODE_WRITE)) {
2257         case FMODE_WRITE:
2258                 clear_bit(NFS_O_RDONLY_STATE, &state->flags);
2259                 break;
2260         case FMODE_READ:
2261                 clear_bit(NFS_O_WRONLY_STATE, &state->flags);
2262                 break;
2263         case 0:
2264                 clear_bit(NFS_O_RDONLY_STATE, &state->flags);
2265                 clear_bit(NFS_O_WRONLY_STATE, &state->flags);
2266                 clear_bit(NFS_OPEN_STATE, &state->flags);
2267         }
2268         spin_unlock(&state->owner->so_lock);
2269 }
2270
2271 static void nfs4_close_done(struct rpc_task *task, void *data)
2272 {
2273         struct nfs4_closedata *calldata = data;
2274         struct nfs4_state *state = calldata->state;
2275         struct nfs_server *server = NFS_SERVER(calldata->inode);
2276
2277         dprintk("%s: begin!\n", __func__);
2278         if (!nfs4_sequence_done(task, &calldata->res.seq_res))
2279                 return;
2280         /* hmm. we are done with the inode, and in the process of freeing
2281          * the state_owner. we keep this around to process errors
2282          */
2283         switch (task->tk_status) {
2284                 case 0:
2285                         if (calldata->roc)
2286                                 pnfs_roc_set_barrier(state->inode,
2287                                                      calldata->roc_barrier);
2288                         nfs_set_open_stateid(state, &calldata->res.stateid, 0);
2289                         renew_lease(server, calldata->timestamp);
2290                         nfs4_close_clear_stateid_flags(state,
2291                                         calldata->arg.fmode);
2292                         break;
2293                 case -NFS4ERR_STALE_STATEID:
2294                 case -NFS4ERR_OLD_STATEID:
2295                 case -NFS4ERR_BAD_STATEID:
2296                 case -NFS4ERR_EXPIRED:
2297                         if (calldata->arg.fmode == 0)
2298                                 break;
2299                 default:
2300                         if (nfs4_async_handle_error(task, server, state) == -EAGAIN)
2301                                 rpc_restart_call_prepare(task);
2302         }
2303         nfs_release_seqid(calldata->arg.seqid);
2304         nfs_refresh_inode(calldata->inode, calldata->res.fattr);
2305         dprintk("%s: done, ret = %d!\n", __func__, task->tk_status);
2306 }
2307
2308 static void nfs4_close_prepare(struct rpc_task *task, void *data)
2309 {
2310         struct nfs4_closedata *calldata = data;
2311         struct nfs4_state *state = calldata->state;
2312         struct inode *inode = calldata->inode;
2313         int call_close = 0;
2314
2315         dprintk("%s: begin!\n", __func__);
2316         if (nfs_wait_on_sequence(calldata->arg.seqid, task) != 0)
2317                 goto out_wait;
2318
2319         task->tk_msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_OPEN_DOWNGRADE];
2320         calldata->arg.fmode = FMODE_READ|FMODE_WRITE;
2321         spin_lock(&state->owner->so_lock);
2322         /* Calculate the change in open mode */
2323         if (state->n_rdwr == 0) {
2324                 if (state->n_rdonly == 0) {
2325                         call_close |= test_bit(NFS_O_RDONLY_STATE, &state->flags);
2326                         call_close |= test_bit(NFS_O_RDWR_STATE, &state->flags);
2327                         calldata->arg.fmode &= ~FMODE_READ;
2328                 }
2329                 if (state->n_wronly == 0) {
2330                         call_close |= test_bit(NFS_O_WRONLY_STATE, &state->flags);
2331                         call_close |= test_bit(NFS_O_RDWR_STATE, &state->flags);
2332                         calldata->arg.fmode &= ~FMODE_WRITE;
2333                 }
2334         }
2335         if (!nfs4_valid_open_stateid(state))
2336                 call_close = 0;
2337         spin_unlock(&state->owner->so_lock);
2338
2339         if (!call_close) {
2340                 /* Note: exit _without_ calling nfs4_close_done */
2341                 goto out_no_action;
2342         }
2343
2344         if (calldata->arg.fmode == 0) {
2345                 task->tk_msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_CLOSE];
2346                 if (calldata->roc &&
2347                     pnfs_roc_drain(inode, &calldata->roc_barrier, task)) {
2348                         nfs_release_seqid(calldata->arg.seqid);
2349                         goto out_wait;
2350                     }
2351         }
2352
2353         nfs_fattr_init(calldata->res.fattr);
2354         calldata->timestamp = jiffies;
2355         if (nfs4_setup_sequence(NFS_SERVER(inode),
2356                                 &calldata->arg.seq_args,
2357                                 &calldata->res.seq_res,
2358                                 task) != 0)
2359                 nfs_release_seqid(calldata->arg.seqid);
2360         dprintk("%s: done!\n", __func__);
2361         return;
2362 out_no_action:
2363         task->tk_action = NULL;
2364 out_wait:
2365         nfs4_sequence_done(task, &calldata->res.seq_res);
2366 }
2367
2368 static const struct rpc_call_ops nfs4_close_ops = {
2369         .rpc_call_prepare = nfs4_close_prepare,
2370         .rpc_call_done = nfs4_close_done,
2371         .rpc_release = nfs4_free_closedata,
2372 };
2373
2374 /* 
2375  * It is possible for data to be read/written from a mem-mapped file 
2376  * after the sys_close call (which hits the vfs layer as a flush).
2377  * This means that we can't safely call nfsv4 close on a file until 
2378  * the inode is cleared. This in turn means that we are not good
2379  * NFSv4 citizens - we do not indicate to the server to update the file's 
2380  * share state even when we are done with one of the three share 
2381  * stateid's in the inode.
2382  *
2383  * NOTE: Caller must be holding the sp->so_owner semaphore!
2384  */
2385 int nfs4_do_close(struct nfs4_state *state, gfp_t gfp_mask, int wait)
2386 {
2387         struct nfs_server *server = NFS_SERVER(state->inode);
2388         struct nfs4_closedata *calldata;
2389         struct nfs4_state_owner *sp = state->owner;
2390         struct rpc_task *task;
2391         struct rpc_message msg = {
2392                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_CLOSE],
2393                 .rpc_cred = state->owner->so_cred,
2394         };
2395         struct rpc_task_setup task_setup_data = {
2396                 .rpc_client = server->client,
2397                 .rpc_message = &msg,
2398                 .callback_ops = &nfs4_close_ops,
2399                 .workqueue = nfsiod_workqueue,
2400                 .flags = RPC_TASK_ASYNC,
2401         };
2402         int status = -ENOMEM;
2403
2404         calldata = kzalloc(sizeof(*calldata), gfp_mask);
2405         if (calldata == NULL)
2406                 goto out;
2407         nfs41_init_sequence(&calldata->arg.seq_args, &calldata->res.seq_res, 1);
2408         calldata->inode = state->inode;
2409         calldata->state = state;
2410         calldata->arg.fh = NFS_FH(state->inode);
2411         calldata->arg.stateid = &state->open_stateid;
2412         /* Serialization for the sequence id */
2413         calldata->arg.seqid = nfs_alloc_seqid(&state->owner->so_seqid, gfp_mask);
2414         if (calldata->arg.seqid == NULL)
2415                 goto out_free_calldata;
2416         calldata->arg.fmode = 0;
2417         calldata->arg.bitmask = server->cache_consistency_bitmask;
2418         calldata->res.fattr = &calldata->fattr;
2419         calldata->res.seqid = calldata->arg.seqid;
2420         calldata->res.server = server;
2421         calldata->roc = pnfs_roc(state->inode);
2422         nfs_sb_active(calldata->inode->i_sb);
2423
2424         msg.rpc_argp = &calldata->arg;
2425         msg.rpc_resp = &calldata->res;
2426         task_setup_data.callback_data = calldata;
2427         task = rpc_run_task(&task_setup_data);
2428         if (IS_ERR(task))
2429                 return PTR_ERR(task);
2430         status = 0;
2431         if (wait)
2432                 status = rpc_wait_for_completion_task(task);
2433         rpc_put_task(task);
2434         return status;
2435 out_free_calldata:
2436         kfree(calldata);
2437 out:
2438         nfs4_put_open_state(state);
2439         nfs4_put_state_owner(sp);
2440         return status;
2441 }
2442
2443 static struct inode *
2444 nfs4_atomic_open(struct inode *dir, struct nfs_open_context *ctx, int open_flags, struct iattr *attr)
2445 {
2446         struct nfs4_state *state;
2447
2448         /* Protect against concurrent sillydeletes */
2449         state = nfs4_do_open(dir, ctx->dentry, ctx->mode, open_flags, attr,
2450                              ctx->cred, &ctx->mdsthreshold);
2451         if (IS_ERR(state))
2452                 return ERR_CAST(state);
2453         ctx->state = state;
2454         return igrab(state->inode);
2455 }
2456
2457 static void nfs4_close_context(struct nfs_open_context *ctx, int is_sync)
2458 {
2459         if (ctx->state == NULL)
2460                 return;
2461         if (is_sync)
2462                 nfs4_close_sync(ctx->state, ctx->mode);
2463         else
2464                 nfs4_close_state(ctx->state, ctx->mode);
2465 }
2466
2467 static int _nfs4_server_capabilities(struct nfs_server *server, struct nfs_fh *fhandle)
2468 {
2469         struct nfs4_server_caps_arg args = {
2470                 .fhandle = fhandle,
2471         };
2472         struct nfs4_server_caps_res res = {};
2473         struct rpc_message msg = {
2474                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SERVER_CAPS],
2475                 .rpc_argp = &args,
2476                 .rpc_resp = &res,
2477         };
2478         int status;
2479
2480         status = nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
2481         if (status == 0) {
2482                 memcpy(server->attr_bitmask, res.attr_bitmask, sizeof(server->attr_bitmask));
2483                 server->caps &= ~(NFS_CAP_ACLS|NFS_CAP_HARDLINKS|
2484                                 NFS_CAP_SYMLINKS|NFS_CAP_FILEID|
2485                                 NFS_CAP_MODE|NFS_CAP_NLINK|NFS_CAP_OWNER|
2486                                 NFS_CAP_OWNER_GROUP|NFS_CAP_ATIME|
2487                                 NFS_CAP_CTIME|NFS_CAP_MTIME);
2488                 if (res.attr_bitmask[0] & FATTR4_WORD0_ACL)
2489                         server->caps |= NFS_CAP_ACLS;
2490                 if (res.has_links != 0)
2491                         server->caps |= NFS_CAP_HARDLINKS;
2492                 if (res.has_symlinks != 0)
2493                         server->caps |= NFS_CAP_SYMLINKS;
2494                 if (res.attr_bitmask[0] & FATTR4_WORD0_FILEID)
2495                         server->caps |= NFS_CAP_FILEID;
2496                 if (res.attr_bitmask[1] & FATTR4_WORD1_MODE)
2497                         server->caps |= NFS_CAP_MODE;
2498                 if (res.attr_bitmask[1] & FATTR4_WORD1_NUMLINKS)
2499                         server->caps |= NFS_CAP_NLINK;
2500                 if (res.attr_bitmask[1] & FATTR4_WORD1_OWNER)
2501                         server->caps |= NFS_CAP_OWNER;
2502                 if (res.attr_bitmask[1] & FATTR4_WORD1_OWNER_GROUP)
2503                         server->caps |= NFS_CAP_OWNER_GROUP;
2504                 if (res.attr_bitmask[1] & FATTR4_WORD1_TIME_ACCESS)
2505                         server->caps |= NFS_CAP_ATIME;
2506                 if (res.attr_bitmask[1] & FATTR4_WORD1_TIME_METADATA)
2507                         server->caps |= NFS_CAP_CTIME;
2508                 if (res.attr_bitmask[1] & FATTR4_WORD1_TIME_MODIFY)
2509                         server->caps |= NFS_CAP_MTIME;
2510
2511                 memcpy(server->cache_consistency_bitmask, res.attr_bitmask, sizeof(server->cache_consistency_bitmask));
2512                 server->cache_consistency_bitmask[0] &= FATTR4_WORD0_CHANGE|FATTR4_WORD0_SIZE;
2513                 server->cache_consistency_bitmask[1] &= FATTR4_WORD1_TIME_METADATA|FATTR4_WORD1_TIME_MODIFY;
2514                 server->acl_bitmask = res.acl_bitmask;
2515                 server->fh_expire_type = res.fh_expire_type;
2516         }
2517
2518         return status;
2519 }
2520
2521 int nfs4_server_capabilities(struct nfs_server *server, struct nfs_fh *fhandle)
2522 {
2523         struct nfs4_exception exception = { };
2524         int err;
2525         do {
2526                 err = nfs4_handle_exception(server,
2527                                 _nfs4_server_capabilities(server, fhandle),
2528                                 &exception);
2529         } while (exception.retry);
2530         return err;
2531 }
2532
2533 static int _nfs4_lookup_root(struct nfs_server *server, struct nfs_fh *fhandle,
2534                 struct nfs_fsinfo *info)
2535 {
2536         struct nfs4_lookup_root_arg args = {
2537                 .bitmask = nfs4_fattr_bitmap,
2538         };
2539         struct nfs4_lookup_res res = {
2540                 .server = server,
2541                 .fattr = info->fattr,
2542                 .fh = fhandle,
2543         };
2544         struct rpc_message msg = {
2545                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LOOKUP_ROOT],
2546                 .rpc_argp = &args,
2547                 .rpc_resp = &res,
2548         };
2549
2550         nfs_fattr_init(info->fattr);
2551         return nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
2552 }
2553
2554 static int nfs4_lookup_root(struct nfs_server *server, struct nfs_fh *fhandle,
2555                 struct nfs_fsinfo *info)
2556 {
2557         struct nfs4_exception exception = { };
2558         int err;
2559         do {
2560                 err = _nfs4_lookup_root(server, fhandle, info);
2561                 switch (err) {
2562                 case 0:
2563                 case -NFS4ERR_WRONGSEC:
2564                         goto out;
2565                 default:
2566                         err = nfs4_handle_exception(server, err, &exception);
2567                 }
2568         } while (exception.retry);
2569 out:
2570         return err;
2571 }
2572
2573 static int nfs4_lookup_root_sec(struct nfs_server *server, struct nfs_fh *fhandle,
2574                                 struct nfs_fsinfo *info, rpc_authflavor_t flavor)
2575 {
2576         struct rpc_auth *auth;
2577         int ret;
2578
2579         auth = rpcauth_create(flavor, server->client);
2580         if (IS_ERR(auth)) {
2581                 ret = -EACCES;
2582                 goto out;
2583         }
2584         ret = nfs4_lookup_root(server, fhandle, info);
2585 out:
2586         return ret;
2587 }
2588
2589 /*
2590  * Retry pseudoroot lookup with various security flavors.  We do this when:
2591  *
2592  *   NFSv4.0: the PUTROOTFH operation returns NFS4ERR_WRONGSEC
2593  *   NFSv4.1: the server does not support the SECINFO_NO_NAME operation
2594  *
2595  * Returns zero on success, or a negative NFS4ERR value, or a
2596  * negative errno value.
2597  */
2598 static int nfs4_find_root_sec(struct nfs_server *server, struct nfs_fh *fhandle,
2599                               struct nfs_fsinfo *info)
2600 {
2601         /* Per 3530bis 15.33.5 */
2602         static const rpc_authflavor_t flav_array[] = {
2603                 RPC_AUTH_GSS_KRB5P,
2604                 RPC_AUTH_GSS_KRB5I,
2605                 RPC_AUTH_GSS_KRB5,
2606                 RPC_AUTH_UNIX,                  /* courtesy */
2607                 RPC_AUTH_NULL,
2608         };
2609         int status = -EPERM;
2610         size_t i;
2611
2612         for (i = 0; i < ARRAY_SIZE(flav_array); i++) {
2613                 status = nfs4_lookup_root_sec(server, fhandle, info, flav_array[i]);
2614                 if (status == -NFS4ERR_WRONGSEC || status == -EACCES)
2615                         continue;
2616                 break;
2617         }
2618
2619         /*
2620          * -EACCESS could mean that the user doesn't have correct permissions
2621          * to access the mount.  It could also mean that we tried to mount
2622          * with a gss auth flavor, but rpc.gssd isn't running.  Either way,
2623          * existing mount programs don't handle -EACCES very well so it should
2624          * be mapped to -EPERM instead.
2625          */
2626         if (status == -EACCES)
2627                 status = -EPERM;
2628         return status;
2629 }
2630
2631 static int nfs4_do_find_root_sec(struct nfs_server *server,
2632                 struct nfs_fh *fhandle, struct nfs_fsinfo *info)
2633 {
2634         int mv = server->nfs_client->cl_minorversion;
2635         return nfs_v4_minor_ops[mv]->find_root_sec(server, fhandle, info);
2636 }
2637
2638 /**
2639  * nfs4_proc_get_rootfh - get file handle for server's pseudoroot
2640  * @server: initialized nfs_server handle
2641  * @fhandle: we fill in the pseudo-fs root file handle
2642  * @info: we fill in an FSINFO struct
2643  *
2644  * Returns zero on success, or a negative errno.
2645  */
2646 int nfs4_proc_get_rootfh(struct nfs_server *server, struct nfs_fh *fhandle,
2647                          struct nfs_fsinfo *info)
2648 {
2649         int status;
2650
2651         status = nfs4_lookup_root(server, fhandle, info);
2652         if ((status == -NFS4ERR_WRONGSEC) &&
2653             !(server->flags & NFS_MOUNT_SECFLAVOUR))
2654                 status = nfs4_do_find_root_sec(server, fhandle, info);
2655
2656         if (status == 0)
2657                 status = nfs4_server_capabilities(server, fhandle);
2658         if (status == 0)
2659                 status = nfs4_do_fsinfo(server, fhandle, info);
2660
2661         return nfs4_map_errors(status);
2662 }
2663
2664 static int nfs4_proc_get_root(struct nfs_server *server, struct nfs_fh *mntfh,
2665                               struct nfs_fsinfo *info)
2666 {
2667         int error;
2668         struct nfs_fattr *fattr = info->fattr;
2669
2670         error = nfs4_server_capabilities(server, mntfh);
2671         if (error < 0) {
2672                 dprintk("nfs4_get_root: getcaps error = %d\n", -error);
2673                 return error;
2674         }
2675
2676         error = nfs4_proc_getattr(server, mntfh, fattr);
2677         if (error < 0) {
2678                 dprintk("nfs4_get_root: getattr error = %d\n", -error);
2679                 return error;
2680         }
2681
2682         if (fattr->valid & NFS_ATTR_FATTR_FSID &&
2683             !nfs_fsid_equal(&server->fsid, &fattr->fsid))
2684                 memcpy(&server->fsid, &fattr->fsid, sizeof(server->fsid));
2685
2686         return error;
2687 }
2688
2689 /*
2690  * Get locations and (maybe) other attributes of a referral.
2691  * Note that we'll actually follow the referral later when
2692  * we detect fsid mismatch in inode revalidation
2693  */
2694 static int nfs4_get_referral(struct rpc_clnt *client, struct inode *dir,
2695                              const struct qstr *name, struct nfs_fattr *fattr,
2696                              struct nfs_fh *fhandle)
2697 {
2698         int status = -ENOMEM;
2699         struct page *page = NULL;
2700         struct nfs4_fs_locations *locations = NULL;
2701
2702         page = alloc_page(GFP_KERNEL);
2703         if (page == NULL)
2704                 goto out;
2705         locations = kmalloc(sizeof(struct nfs4_fs_locations), GFP_KERNEL);
2706         if (locations == NULL)
2707                 goto out;
2708
2709         status = nfs4_proc_fs_locations(client, dir, name, locations, page);
2710         if (status != 0)
2711                 goto out;
2712         /* Make sure server returned a different fsid for the referral */
2713         if (nfs_fsid_equal(&NFS_SERVER(dir)->fsid, &locations->fattr.fsid)) {
2714                 dprintk("%s: server did not return a different fsid for"
2715                         " a referral at %s\n", __func__, name->name);
2716                 status = -EIO;
2717                 goto out;
2718         }
2719         /* Fixup attributes for the nfs_lookup() call to nfs_fhget() */
2720         nfs_fixup_referral_attributes(&locations->fattr);
2721
2722         /* replace the lookup nfs_fattr with the locations nfs_fattr */
2723         memcpy(fattr, &locations->fattr, sizeof(struct nfs_fattr));
2724         memset(fhandle, 0, sizeof(struct nfs_fh));
2725 out:
2726         if (page)
2727                 __free_page(page);
2728         kfree(locations);
2729         return status;
2730 }
2731
2732 static int _nfs4_proc_getattr(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fattr *fattr)
2733 {
2734         struct nfs4_getattr_arg args = {
2735                 .fh = fhandle,
2736                 .bitmask = server->attr_bitmask,
2737         };
2738         struct nfs4_getattr_res res = {
2739                 .fattr = fattr,
2740                 .server = server,
2741         };
2742         struct rpc_message msg = {
2743                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_GETATTR],
2744                 .rpc_argp = &args,
2745                 .rpc_resp = &res,
2746         };
2747         
2748         nfs_fattr_init(fattr);
2749         return nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
2750 }
2751
2752 static int nfs4_proc_getattr(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fattr *fattr)
2753 {
2754         struct nfs4_exception exception = { };
2755         int err;
2756         do {
2757                 err = nfs4_handle_exception(server,
2758                                 _nfs4_proc_getattr(server, fhandle, fattr),
2759                                 &exception);
2760         } while (exception.retry);
2761         return err;
2762 }
2763
2764 /* 
2765  * The file is not closed if it is opened due to the a request to change
2766  * the size of the file. The open call will not be needed once the
2767  * VFS layer lookup-intents are implemented.
2768  *
2769  * Close is called when the inode is destroyed.
2770  * If we haven't opened the file for O_WRONLY, we
2771  * need to in the size_change case to obtain a stateid.
2772  *
2773  * Got race?
2774  * Because OPEN is always done by name in nfsv4, it is
2775  * possible that we opened a different file by the same
2776  * name.  We can recognize this race condition, but we
2777  * can't do anything about it besides returning an error.
2778  *
2779  * This will be fixed with VFS changes (lookup-intent).
2780  */
2781 static int
2782 nfs4_proc_setattr(struct dentry *dentry, struct nfs_fattr *fattr,
2783                   struct iattr *sattr)
2784 {
2785         struct inode *inode = dentry->d_inode;
2786         struct rpc_cred *cred = NULL;
2787         struct nfs4_state *state = NULL;
2788         int status;
2789
2790         if (pnfs_ld_layoutret_on_setattr(inode))
2791                 pnfs_commit_and_return_layout(inode);
2792
2793         nfs_fattr_init(fattr);
2794         
2795         /* Deal with open(O_TRUNC) */
2796         if (sattr->ia_valid & ATTR_OPEN)
2797                 sattr->ia_valid &= ~(ATTR_MTIME|ATTR_CTIME|ATTR_OPEN);
2798
2799         /* Optimization: if the end result is no change, don't RPC */
2800         if ((sattr->ia_valid & ~(ATTR_FILE)) == 0)
2801                 return 0;
2802
2803         /* Search for an existing open(O_WRITE) file */
2804         if (sattr->ia_valid & ATTR_FILE) {
2805                 struct nfs_open_context *ctx;
2806
2807                 ctx = nfs_file_open_context(sattr->ia_file);
2808                 if (ctx) {
2809                         cred = ctx->cred;
2810                         state = ctx->state;
2811                 }
2812         }
2813
2814         status = nfs4_do_setattr(inode, cred, fattr, sattr, state);
2815         if (status == 0)
2816                 nfs_setattr_update_inode(inode, sattr);
2817         return status;
2818 }
2819
2820 static int _nfs4_proc_lookup(struct rpc_clnt *clnt, struct inode *dir,
2821                 const struct qstr *name, struct nfs_fh *fhandle,
2822                 struct nfs_fattr *fattr)
2823 {
2824         struct nfs_server *server = NFS_SERVER(dir);
2825         int                    status;
2826         struct nfs4_lookup_arg args = {
2827                 .bitmask = server->attr_bitmask,
2828                 .dir_fh = NFS_FH(dir),
2829                 .name = name,
2830         };
2831         struct nfs4_lookup_res res = {
2832                 .server = server,
2833                 .fattr = fattr,
2834                 .fh = fhandle,
2835         };
2836         struct rpc_message msg = {
2837                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LOOKUP],
2838                 .rpc_argp = &args,
2839                 .rpc_resp = &res,
2840         };
2841
2842         nfs_fattr_init(fattr);
2843
2844         dprintk("NFS call  lookup %s\n", name->name);
2845         status = nfs4_call_sync(clnt, server, &msg, &args.seq_args, &res.seq_res, 0);
2846         dprintk("NFS reply lookup: %d\n", status);
2847         return status;
2848 }
2849
2850 static void nfs_fixup_secinfo_attributes(struct nfs_fattr *fattr)
2851 {
2852         fattr->valid |= NFS_ATTR_FATTR_TYPE | NFS_ATTR_FATTR_MODE |
2853                 NFS_ATTR_FATTR_NLINK | NFS_ATTR_FATTR_MOUNTPOINT;
2854         fattr->mode = S_IFDIR | S_IRUGO | S_IXUGO;
2855         fattr->nlink = 2;
2856 }
2857
2858 static int nfs4_proc_lookup_common(struct rpc_clnt **clnt, struct inode *dir,
2859                                    struct qstr *name, struct nfs_fh *fhandle,
2860                                    struct nfs_fattr *fattr)
2861 {
2862         struct nfs4_exception exception = { };
2863         struct rpc_clnt *client = *clnt;
2864         int err;
2865         do {
2866                 err = _nfs4_proc_lookup(client, dir, name, fhandle, fattr);
2867                 switch (err) {
2868                 case -NFS4ERR_BADNAME:
2869                         err = -ENOENT;
2870                         goto out;
2871                 case -NFS4ERR_MOVED:
2872                         err = nfs4_get_referral(client, dir, name, fattr, fhandle);
2873                         goto out;
2874                 case -NFS4ERR_WRONGSEC:
2875                         err = -EPERM;
2876                         if (client != *clnt)
2877                                 goto out;
2878
2879                         client = nfs4_create_sec_client(client, dir, name);
2880                         if (IS_ERR(client))
2881                                 return PTR_ERR(client);
2882
2883                         exception.retry = 1;
2884                         break;
2885                 default:
2886                         err = nfs4_handle_exception(NFS_SERVER(dir), err, &exception);
2887                 }
2888         } while (exception.retry);
2889
2890 out:
2891         if (err == 0)
2892                 *clnt = client;
2893         else if (client != *clnt)
2894                 rpc_shutdown_client(client);
2895
2896         return err;
2897 }
2898
2899 static int nfs4_proc_lookup(struct inode *dir, struct qstr *name,
2900                             struct nfs_fh *fhandle, struct nfs_fattr *fattr)
2901 {
2902         int status;
2903         struct rpc_clnt *client = NFS_CLIENT(dir);
2904
2905         status = nfs4_proc_lookup_common(&client, dir, name, fhandle, fattr);
2906         if (client != NFS_CLIENT(dir)) {
2907                 rpc_shutdown_client(client);
2908                 nfs_fixup_secinfo_attributes(fattr);
2909         }
2910         return status;
2911 }
2912
2913 struct rpc_clnt *
2914 nfs4_proc_lookup_mountpoint(struct inode *dir, struct qstr *name,
2915                             struct nfs_fh *fhandle, struct nfs_fattr *fattr)
2916 {
2917         int status;
2918         struct rpc_clnt *client = rpc_clone_client(NFS_CLIENT(dir));
2919
2920         status = nfs4_proc_lookup_common(&client, dir, name, fhandle, fattr);
2921         if (status < 0) {
2922                 rpc_shutdown_client(client);
2923                 return ERR_PTR(status);
2924         }
2925         return client;
2926 }
2927
2928 static int _nfs4_proc_access(struct inode *inode, struct nfs_access_entry *entry)
2929 {
2930         struct nfs_server *server = NFS_SERVER(inode);
2931         struct nfs4_accessargs args = {
2932                 .fh = NFS_FH(inode),
2933                 .bitmask = server->cache_consistency_bitmask,
2934         };
2935         struct nfs4_accessres res = {
2936                 .server = server,
2937         };
2938         struct rpc_message msg = {
2939                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_ACCESS],
2940                 .rpc_argp = &args,
2941                 .rpc_resp = &res,
2942                 .rpc_cred = entry->cred,
2943         };
2944         int mode = entry->mask;
2945         int status;
2946
2947         /*
2948          * Determine which access bits we want to ask for...
2949          */
2950         if (mode & MAY_READ)
2951                 args.access |= NFS4_ACCESS_READ;
2952         if (S_ISDIR(inode->i_mode)) {
2953                 if (mode & MAY_WRITE)
2954                         args.access |= NFS4_ACCESS_MODIFY | NFS4_ACCESS_EXTEND | NFS4_ACCESS_DELETE;
2955                 if (mode & MAY_EXEC)
2956                         args.access |= NFS4_ACCESS_LOOKUP;
2957         } else {
2958                 if (mode & MAY_WRITE)
2959                         args.access |= NFS4_ACCESS_MODIFY | NFS4_ACCESS_EXTEND;
2960                 if (mode & MAY_EXEC)
2961                         args.access |= NFS4_ACCESS_EXECUTE;
2962         }
2963
2964         res.fattr = nfs_alloc_fattr();
2965         if (res.fattr == NULL)
2966                 return -ENOMEM;
2967
2968         status = nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
2969         if (!status) {
2970                 nfs_access_set_mask(entry, res.access);
2971                 nfs_refresh_inode(inode, res.fattr);
2972         }
2973         nfs_free_fattr(res.fattr);
2974         return status;
2975 }
2976
2977 static int nfs4_proc_access(struct inode *inode, struct nfs_access_entry *entry)
2978 {
2979         struct nfs4_exception exception = { };
2980         int err;
2981         do {
2982                 err = nfs4_handle_exception(NFS_SERVER(inode),
2983                                 _nfs4_proc_access(inode, entry),
2984                                 &exception);
2985         } while (exception.retry);
2986         return err;
2987 }
2988
2989 /*
2990  * TODO: For the time being, we don't try to get any attributes
2991  * along with any of the zero-copy operations READ, READDIR,
2992  * READLINK, WRITE.
2993  *
2994  * In the case of the first three, we want to put the GETATTR
2995  * after the read-type operation -- this is because it is hard
2996  * to predict the length of a GETATTR response in v4, and thus
2997  * align the READ data correctly.  This means that the GETATTR
2998  * may end up partially falling into the page cache, and we should
2999  * shift it into the 'tail' of the xdr_buf before processing.
3000  * To do this efficiently, we need to know the total length
3001  * of data received, which doesn't seem to be available outside
3002  * of the RPC layer.
3003  *
3004  * In the case of WRITE, we also want to put the GETATTR after
3005  * the operation -- in this case because we want to make sure
3006  * we get the post-operation mtime and size.
3007  *
3008  * Both of these changes to the XDR layer would in fact be quite
3009  * minor, but I decided to leave them for a subsequent patch.
3010  */
3011 static int _nfs4_proc_readlink(struct inode *inode, struct page *page,
3012                 unsigned int pgbase, unsigned int pglen)
3013 {
3014         struct nfs4_readlink args = {
3015                 .fh       = NFS_FH(inode),
3016                 .pgbase   = pgbase,
3017                 .pglen    = pglen,
3018                 .pages    = &page,
3019         };
3020         struct nfs4_readlink_res res;
3021         struct rpc_message msg = {
3022                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_READLINK],
3023                 .rpc_argp = &args,
3024                 .rpc_resp = &res,
3025         };
3026
3027         return nfs4_call_sync(NFS_SERVER(inode)->client, NFS_SERVER(inode), &msg, &args.seq_args, &res.seq_res, 0);
3028 }
3029
3030 static int nfs4_proc_readlink(struct inode *inode, struct page *page,
3031                 unsigned int pgbase, unsigned int pglen)
3032 {
3033         struct nfs4_exception exception = { };
3034         int err;
3035         do {
3036                 err = nfs4_handle_exception(NFS_SERVER(inode),
3037                                 _nfs4_proc_readlink(inode, page, pgbase, pglen),
3038                                 &exception);
3039         } while (exception.retry);
3040         return err;
3041 }
3042
3043 /*
3044  * This is just for mknod.  open(O_CREAT) will always do ->open_context().
3045  */
3046 static int
3047 nfs4_proc_create(struct inode *dir, struct dentry *dentry, struct iattr *sattr,
3048                  int flags)
3049 {
3050         struct nfs_open_context *ctx;
3051         struct nfs4_state *state;
3052         int status = 0;
3053
3054         ctx = alloc_nfs_open_context(dentry, FMODE_READ);
3055         if (IS_ERR(ctx))
3056                 return PTR_ERR(ctx);
3057
3058         sattr->ia_mode &= ~current_umask();
3059         state = nfs4_do_open(dir, dentry, ctx->mode,
3060                         flags, sattr, ctx->cred,
3061                         &ctx->mdsthreshold);
3062         d_drop(dentry);
3063         if (IS_ERR(state)) {
3064                 status = PTR_ERR(state);
3065                 goto out;
3066         }
3067         d_add(dentry, igrab(state->inode));
3068         nfs_set_verifier(dentry, nfs_save_change_attribute(dir));
3069         ctx->state = state;
3070 out:
3071         put_nfs_open_context(ctx);
3072         return status;
3073 }
3074
3075 static int _nfs4_proc_remove(struct inode *dir, struct qstr *name)
3076 {
3077         struct nfs_server *server = NFS_SERVER(dir);
3078         struct nfs_removeargs args = {
3079                 .fh = NFS_FH(dir),
3080                 .name = *name,
3081         };
3082         struct nfs_removeres res = {
3083                 .server = server,
3084         };
3085         struct rpc_message msg = {
3086                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_REMOVE],
3087                 .rpc_argp = &args,
3088                 .rpc_resp = &res,
3089         };
3090         int status;
3091
3092         status = nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 1);
3093         if (status == 0)
3094                 update_changeattr(dir, &res.cinfo);
3095         return status;
3096 }
3097
3098 static int nfs4_proc_remove(struct inode *dir, struct qstr *name)
3099 {
3100         struct nfs4_exception exception = { };
3101         int err;
3102         do {
3103                 err = nfs4_handle_exception(NFS_SERVER(dir),
3104                                 _nfs4_proc_remove(dir, name),
3105                                 &exception);
3106         } while (exception.retry);
3107         return err;
3108 }
3109
3110 static void nfs4_proc_unlink_setup(struct rpc_message *msg, struct inode *dir)
3111 {
3112         struct nfs_server *server = NFS_SERVER(dir);
3113         struct nfs_removeargs *args = msg->rpc_argp;
3114         struct nfs_removeres *res = msg->rpc_resp;
3115
3116         res->server = server;
3117         msg->rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_REMOVE];
3118         nfs41_init_sequence(&args->seq_args, &res->seq_res, 1);
3119 }
3120
3121 static void nfs4_proc_unlink_rpc_prepare(struct rpc_task *task, struct nfs_unlinkdata *data)
3122 {
3123         nfs4_setup_sequence(NFS_SERVER(data->dir),
3124                         &data->args.seq_args,
3125                         &data->res.seq_res,
3126                         task);
3127 }
3128
3129 static int nfs4_proc_unlink_done(struct rpc_task *task, struct inode *dir)
3130 {
3131         struct nfs_removeres *res = task->tk_msg.rpc_resp;
3132
3133         if (!nfs4_sequence_done(task, &res->seq_res))
3134                 return 0;
3135         if (nfs4_async_handle_error(task, res->server, NULL) == -EAGAIN)
3136                 return 0;
3137         update_changeattr(dir, &res->cinfo);
3138         return 1;
3139 }
3140
3141 static void nfs4_proc_rename_setup(struct rpc_message *msg, struct inode *dir)
3142 {
3143         struct nfs_server *server = NFS_SERVER(dir);
3144         struct nfs_renameargs *arg = msg->rpc_argp;
3145         struct nfs_renameres *res = msg->rpc_resp;
3146
3147         msg->rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_RENAME];
3148         res->server = server;
3149         nfs41_init_sequence(&arg->seq_args, &res->seq_res, 1);
3150 }
3151
3152 static void nfs4_proc_rename_rpc_prepare(struct rpc_task *task, struct nfs_renamedata *data)
3153 {
3154         nfs4_setup_sequence(NFS_SERVER(data->old_dir),
3155                         &data->args.seq_args,
3156                         &data->res.seq_res,
3157                         task);
3158 }
3159
3160 static int nfs4_proc_rename_done(struct rpc_task *task, struct inode *old_dir,
3161                                  struct inode *new_dir)
3162 {
3163         struct nfs_renameres *res = task->tk_msg.rpc_resp;
3164
3165         if (!nfs4_sequence_done(task, &res->seq_res))
3166                 return 0;
3167         if (nfs4_async_handle_error(task, res->server, NULL) == -EAGAIN)
3168                 return 0;
3169
3170         update_changeattr(old_dir, &res->old_cinfo);
3171         update_changeattr(new_dir, &res->new_cinfo);
3172         return 1;
3173 }
3174
3175 static int _nfs4_proc_rename(struct inode *old_dir, struct qstr *old_name,
3176                 struct inode *new_dir, struct qstr *new_name)
3177 {
3178         struct nfs_server *server = NFS_SERVER(old_dir);
3179         struct nfs_renameargs arg = {
3180                 .old_dir = NFS_FH(old_dir),
3181                 .new_dir = NFS_FH(new_dir),
3182                 .old_name = old_name,
3183                 .new_name = new_name,
3184         };
3185         struct nfs_renameres res = {
3186                 .server = server,
3187         };
3188         struct rpc_message msg = {
3189                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_RENAME],
3190                 .rpc_argp = &arg,
3191                 .rpc_resp = &res,
3192         };
3193         int status = -ENOMEM;
3194         
3195         status = nfs4_call_sync(server->client, server, &msg, &arg.seq_args, &res.seq_res, 1);
3196         if (!status) {
3197                 update_changeattr(old_dir, &res.old_cinfo);
3198                 update_changeattr(new_dir, &res.new_cinfo);
3199         }
3200         return status;
3201 }
3202
3203 static int nfs4_proc_rename(struct inode *old_dir, struct qstr *old_name,
3204                 struct inode *new_dir, struct qstr *new_name)
3205 {
3206         struct nfs4_exception exception = { };
3207         int err;
3208         do {
3209                 err = nfs4_handle_exception(NFS_SERVER(old_dir),
3210                                 _nfs4_proc_rename(old_dir, old_name,
3211                                         new_dir, new_name),
3212                                 &exception);
3213         } while (exception.retry);
3214         return err;
3215 }
3216
3217 static int _nfs4_proc_link(struct inode *inode, struct inode *dir, struct qstr *name)
3218 {
3219         struct nfs_server *server = NFS_SERVER(inode);
3220         struct nfs4_link_arg arg = {
3221                 .fh     = NFS_FH(inode),
3222                 .dir_fh = NFS_FH(dir),
3223                 .name   = name,
3224                 .bitmask = server->attr_bitmask,
3225         };
3226         struct nfs4_link_res res = {
3227                 .server = server,
3228         };
3229         struct rpc_message msg = {
3230                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LINK],
3231                 .rpc_argp = &arg,
3232                 .rpc_resp = &res,
3233         };
3234         int status = -ENOMEM;
3235
3236         res.fattr = nfs_alloc_fattr();
3237         if (res.fattr == NULL)
3238                 goto out;
3239
3240         status = nfs4_call_sync(server->client, server, &msg, &arg.seq_args, &res.seq_res, 1);
3241         if (!status) {
3242                 update_changeattr(dir, &res.cinfo);
3243                 nfs_post_op_update_inode(inode, res.fattr);
3244         }
3245 out:
3246         nfs_free_fattr(res.fattr);
3247         return status;
3248 }
3249
3250 static int nfs4_proc_link(struct inode *inode, struct inode *dir, struct qstr *name)
3251 {
3252         struct nfs4_exception exception = { };
3253         int err;
3254         do {
3255                 err = nfs4_handle_exception(NFS_SERVER(inode),
3256                                 _nfs4_proc_link(inode, dir, name),
3257                                 &exception);
3258         } while (exception.retry);
3259         return err;
3260 }
3261
3262 struct nfs4_createdata {
3263         struct rpc_message msg;
3264         struct nfs4_create_arg arg;
3265         struct nfs4_create_res res;
3266         struct nfs_fh fh;
3267         struct nfs_fattr fattr;
3268 };
3269
3270 static struct nfs4_createdata *nfs4_alloc_createdata(struct inode *dir,
3271                 struct qstr *name, struct iattr *sattr, u32 ftype)
3272 {
3273         struct nfs4_createdata *data;
3274
3275         data = kzalloc(sizeof(*data), GFP_KERNEL);
3276         if (data != NULL) {
3277                 struct nfs_server *server = NFS_SERVER(dir);
3278
3279                 data->msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_CREATE];
3280                 data->msg.rpc_argp = &data->arg;
3281                 data->msg.rpc_resp = &data->res;
3282                 data->arg.dir_fh = NFS_FH(dir);
3283                 data->arg.server = server;
3284                 data->arg.name = name;
3285                 data->arg.attrs = sattr;
3286                 data->arg.ftype = ftype;
3287                 data->arg.bitmask = server->attr_bitmask;
3288                 data->res.server = server;
3289                 data->res.fh = &data->fh;
3290                 data->res.fattr = &data->fattr;
3291                 nfs_fattr_init(data->res.fattr);
3292         }
3293         return data;
3294 }
3295
3296 static int nfs4_do_create(struct inode *dir, struct dentry *dentry, struct nfs4_createdata *data)
3297 {
3298         int status = nfs4_call_sync(NFS_SERVER(dir)->client, NFS_SERVER(dir), &data->msg,
3299                                     &data->arg.seq_args, &data->res.seq_res, 1);
3300         if (status == 0) {
3301                 update_changeattr(dir, &data->res.dir_cinfo);
3302                 status = nfs_instantiate(dentry, data->res.fh, data->res.fattr);
3303         }
3304         return status;
3305 }
3306
3307 static void nfs4_free_createdata(struct nfs4_createdata *data)
3308 {
3309         kfree(data);
3310 }
3311
3312 static int _nfs4_proc_symlink(struct inode *dir, struct dentry *dentry,
3313                 struct page *page, unsigned int len, struct iattr *sattr)
3314 {
3315         struct nfs4_createdata *data;
3316         int status = -ENAMETOOLONG;
3317
3318         if (len > NFS4_MAXPATHLEN)
3319                 goto out;
3320
3321         status = -ENOMEM;
3322         data = nfs4_alloc_createdata(dir, &dentry->d_name, sattr, NF4LNK);
3323         if (data == NULL)
3324                 goto out;
3325
3326         data->msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SYMLINK];
3327         data->arg.u.symlink.pages = &page;
3328         data->arg.u.symlink.len = len;
3329         
3330         status = nfs4_do_create(dir, dentry, data);
3331
3332         nfs4_free_createdata(data);
3333 out:
3334         return status;
3335 }
3336
3337 static int nfs4_proc_symlink(struct inode *dir, struct dentry *dentry,
3338                 struct page *page, unsigned int len, struct iattr *sattr)
3339 {
3340         struct nfs4_exception exception = { };
3341         int err;
3342         do {
3343                 err = nfs4_handle_exception(NFS_SERVER(dir),
3344                                 _nfs4_proc_symlink(dir, dentry, page,
3345                                                         len, sattr),
3346                                 &exception);
3347         } while (exception.retry);
3348         return err;
3349 }
3350
3351 static int _nfs4_proc_mkdir(struct inode *dir, struct dentry *dentry,
3352                 struct iattr *sattr)
3353 {
3354         struct nfs4_createdata *data;
3355         int status = -ENOMEM;
3356
3357         data = nfs4_alloc_createdata(dir, &dentry->d_name, sattr, NF4DIR);
3358         if (data == NULL)
3359                 goto out;
3360
3361         status = nfs4_do_create(dir, dentry, data);
3362
3363         nfs4_free_createdata(data);
3364 out:
3365         return status;
3366 }
3367
3368 static int nfs4_proc_mkdir(struct inode *dir, struct dentry *dentry,
3369                 struct iattr *sattr)
3370 {
3371         struct nfs4_exception exception = { };
3372         int err;
3373
3374         sattr->ia_mode &= ~current_umask();
3375         do {
3376                 err = nfs4_handle_exception(NFS_SERVER(dir),
3377                                 _nfs4_proc_mkdir(dir, dentry, sattr),
3378                                 &exception);
3379         } while (exception.retry);
3380         return err;
3381 }
3382
3383 static int _nfs4_proc_readdir(struct dentry *dentry, struct rpc_cred *cred,
3384                 u64 cookie, struct page **pages, unsigned int count, int plus)
3385 {
3386         struct inode            *dir = dentry->d_inode;
3387         struct nfs4_readdir_arg args = {
3388                 .fh = NFS_FH(dir),
3389                 .pages = pages,
3390                 .pgbase = 0,
3391                 .count = count,
3392                 .bitmask = NFS_SERVER(dentry->d_inode)->attr_bitmask,
3393                 .plus = plus,
3394         };
3395         struct nfs4_readdir_res res;
3396         struct rpc_message msg = {
3397                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_READDIR],
3398                 .rpc_argp = &args,
3399                 .rpc_resp = &res,
3400                 .rpc_cred = cred,
3401         };
3402         int                     status;
3403
3404         dprintk("%s: dentry = %s/%s, cookie = %Lu\n", __func__,
3405                         dentry->d_parent->d_name.name,
3406                         dentry->d_name.name,
3407                         (unsigned long long)cookie);
3408         nfs4_setup_readdir(cookie, NFS_I(dir)->cookieverf, dentry, &args);
3409         res.pgbase = args.pgbase;
3410         status = nfs4_call_sync(NFS_SERVER(dir)->client, NFS_SERVER(dir), &msg, &args.seq_args, &res.seq_res, 0);
3411         if (status >= 0) {
3412                 memcpy(NFS_I(dir)->cookieverf, res.verifier.data, NFS4_VERIFIER_SIZE);
3413                 status += args.pgbase;
3414         }
3415
3416         nfs_invalidate_atime(dir);
3417
3418         dprintk("%s: returns %d\n", __func__, status);
3419         return status;
3420 }
3421
3422 static int nfs4_proc_readdir(struct dentry *dentry, struct rpc_cred *cred,
3423                 u64 cookie, struct page **pages, unsigned int count, int plus)
3424 {
3425         struct nfs4_exception exception = { };
3426         int err;
3427         do {
3428                 err = nfs4_handle_exception(NFS_SERVER(dentry->d_inode),
3429                                 _nfs4_proc_readdir(dentry, cred, cookie,
3430                                         pages, count, plus),
3431                                 &exception);
3432         } while (exception.retry);
3433         return err;
3434 }
3435
3436 static int _nfs4_proc_mknod(struct inode *dir, struct dentry *dentry,
3437                 struct iattr *sattr, dev_t rdev)
3438 {
3439         struct nfs4_createdata *data;
3440         int mode = sattr->ia_mode;
3441         int status = -ENOMEM;
3442
3443         data = nfs4_alloc_createdata(dir, &dentry->d_name, sattr, NF4SOCK);
3444         if (data == NULL)
3445                 goto out;
3446
3447         if (S_ISFIFO(mode))
3448                 data->arg.ftype = NF4FIFO;
3449         else if (S_ISBLK(mode)) {
3450                 data->arg.ftype = NF4BLK;
3451                 data->arg.u.device.specdata1 = MAJOR(rdev);
3452                 data->arg.u.device.specdata2 = MINOR(rdev);
3453         }
3454         else if (S_ISCHR(mode)) {
3455                 data->arg.ftype = NF4CHR;
3456                 data->arg.u.device.specdata1 = MAJOR(rdev);
3457                 data->arg.u.device.specdata2 = MINOR(rdev);
3458         } else if (!S_ISSOCK(mode)) {
3459                 status = -EINVAL;
3460                 goto out_free;
3461         }
3462         
3463         status = nfs4_do_create(dir, dentry, data);
3464 out_free:
3465         nfs4_free_createdata(data);
3466 out:
3467         return status;
3468 }
3469
3470 static int nfs4_proc_mknod(struct inode *dir, struct dentry *dentry,
3471                 struct iattr *sattr, dev_t rdev)
3472 {
3473         struct nfs4_exception exception = { };
3474         int err;
3475
3476         sattr->ia_mode &= ~current_umask();
3477         do {
3478                 err = nfs4_handle_exception(NFS_SERVER(dir),
3479                                 _nfs4_proc_mknod(dir, dentry, sattr, rdev),
3480                                 &exception);
3481         } while (exception.retry);
3482         return err;
3483 }
3484
3485 static int _nfs4_proc_statfs(struct nfs_server *server, struct nfs_fh *fhandle,
3486                  struct nfs_fsstat *fsstat)
3487 {
3488         struct nfs4_statfs_arg args = {
3489                 .fh = fhandle,
3490                 .bitmask = server->attr_bitmask,
3491         };
3492         struct nfs4_statfs_res res = {
3493                 .fsstat = fsstat,
3494         };
3495         struct rpc_message msg = {
3496                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_STATFS],
3497                 .rpc_argp = &args,
3498                 .rpc_resp = &res,
3499         };
3500
3501         nfs_fattr_init(fsstat->fattr);
3502         return  nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
3503 }
3504
3505 static int nfs4_proc_statfs(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fsstat *fsstat)
3506 {
3507         struct nfs4_exception exception = { };
3508         int err;
3509         do {
3510                 err = nfs4_handle_exception(server,
3511                                 _nfs4_proc_statfs(server, fhandle, fsstat),
3512                                 &exception);
3513         } while (exception.retry);
3514         return err;
3515 }
3516
3517 static int _nfs4_do_fsinfo(struct nfs_server *server, struct nfs_fh *fhandle,
3518                 struct nfs_fsinfo *fsinfo)
3519 {
3520         struct nfs4_fsinfo_arg args = {
3521                 .fh = fhandle,
3522                 .bitmask = server->attr_bitmask,
3523         };
3524         struct nfs4_fsinfo_res res = {
3525                 .fsinfo = fsinfo,
3526         };
3527         struct rpc_message msg = {
3528                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_FSINFO],
3529                 .rpc_argp = &args,
3530                 .rpc_resp = &res,
3531         };
3532
3533         return nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
3534 }
3535
3536 static int nfs4_do_fsinfo(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fsinfo *fsinfo)
3537 {
3538         struct nfs4_exception exception = { };
3539         unsigned long now = jiffies;
3540         int err;
3541
3542         do {
3543                 err = _nfs4_do_fsinfo(server, fhandle, fsinfo);
3544                 if (err == 0) {
3545                         struct nfs_client *clp = server->nfs_client;
3546
3547                         spin_lock(&clp->cl_lock);
3548                         clp->cl_lease_time = fsinfo->lease_time * HZ;
3549                         clp->cl_last_renewal = now;
3550                         spin_unlock(&clp->cl_lock);
3551                         break;
3552                 }
3553                 err = nfs4_handle_exception(server, err, &exception);
3554         } while (exception.retry);
3555         return err;
3556 }
3557
3558 static int nfs4_proc_fsinfo(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fsinfo *fsinfo)
3559 {
3560         int error;
3561
3562         nfs_fattr_init(fsinfo->fattr);
3563         error = nfs4_do_fsinfo(server, fhandle, fsinfo);
3564         if (error == 0) {
3565                 /* block layout checks this! */
3566                 server->pnfs_blksize = fsinfo->blksize;
3567                 set_pnfs_layoutdriver(server, fhandle, fsinfo->layouttype);
3568         }
3569
3570         return error;
3571 }
3572
3573 static int _nfs4_proc_pathconf(struct nfs_server *server, struct nfs_fh *fhandle,
3574                 struct nfs_pathconf *pathconf)
3575 {
3576         struct nfs4_pathconf_arg args = {
3577                 .fh = fhandle,
3578                 .bitmask = server->attr_bitmask,
3579         };
3580         struct nfs4_pathconf_res res = {
3581                 .pathconf = pathconf,
3582         };
3583         struct rpc_message msg = {
3584                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_PATHCONF],
3585                 .rpc_argp = &args,
3586                 .rpc_resp = &res,
3587         };
3588
3589         /* None of the pathconf attributes are mandatory to implement */
3590         if ((args.bitmask[0] & nfs4_pathconf_bitmap[0]) == 0) {
3591                 memset(pathconf, 0, sizeof(*pathconf));
3592                 return 0;
3593         }
3594
3595         nfs_fattr_init(pathconf->fattr);
3596         return nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
3597 }
3598
3599 static int nfs4_proc_pathconf(struct nfs_server *server, struct nfs_fh *fhandle,
3600                 struct nfs_pathconf *pathconf)
3601 {
3602         struct nfs4_exception exception = { };
3603         int err;
3604
3605         do {
3606                 err = nfs4_handle_exception(server,
3607                                 _nfs4_proc_pathconf(server, fhandle, pathconf),
3608                                 &exception);
3609         } while (exception.retry);
3610         return err;
3611 }
3612
3613 int nfs4_set_rw_stateid(nfs4_stateid *stateid,
3614                 const struct nfs_open_context *ctx,
3615                 const struct nfs_lock_context *l_ctx,
3616                 fmode_t fmode)
3617 {
3618         const struct nfs_lockowner *lockowner = NULL;
3619
3620         if (l_ctx != NULL)
3621                 lockowner = &l_ctx->lockowner;
3622         return nfs4_select_rw_stateid(stateid, ctx->state, fmode, lockowner);
3623 }
3624 EXPORT_SYMBOL_GPL(nfs4_set_rw_stateid);
3625
3626 static bool nfs4_stateid_is_current(nfs4_stateid *stateid,
3627                 const struct nfs_open_context *ctx,
3628                 const struct nfs_lock_context *l_ctx,
3629                 fmode_t fmode)
3630 {
3631         nfs4_stateid current_stateid;
3632
3633         if (nfs4_set_rw_stateid(&current_stateid, ctx, l_ctx, fmode))
3634                 return false;
3635         return nfs4_stateid_match(stateid, &current_stateid);
3636 }
3637
3638 static bool nfs4_error_stateid_expired(int err)
3639 {
3640         switch (err) {
3641         case -NFS4ERR_DELEG_REVOKED:
3642         case -NFS4ERR_ADMIN_REVOKED:
3643         case -NFS4ERR_BAD_STATEID:
3644         case -NFS4ERR_STALE_STATEID:
3645         case -NFS4ERR_OLD_STATEID:
3646         case -NFS4ERR_OPENMODE:
3647         case -NFS4ERR_EXPIRED:
3648                 return true;
3649         }
3650         return false;
3651 }
3652
3653 void __nfs4_read_done_cb(struct nfs_read_data *data)
3654 {
3655         nfs_invalidate_atime(data->header->inode);
3656 }
3657
3658 static int nfs4_read_done_cb(struct rpc_task *task, struct nfs_read_data *data)
3659 {
3660         struct nfs_server *server = NFS_SERVER(data->header->inode);
3661
3662         if (nfs4_async_handle_error(task, server, data->args.context->state) == -EAGAIN) {
3663                 rpc_restart_call_prepare(task);
3664                 return -EAGAIN;
3665         }
3666
3667         __nfs4_read_done_cb(data);
3668         if (task->tk_status > 0)
3669                 renew_lease(server, data->timestamp);
3670         return 0;
3671 }
3672
3673 static bool nfs4_read_stateid_changed(struct rpc_task *task,
3674                 struct nfs_readargs *args)
3675 {
3676
3677         if (!nfs4_error_stateid_expired(task->tk_status) ||
3678                 nfs4_stateid_is_current(&args->stateid,
3679                                 args->context,
3680                                 args->lock_context,
3681                                 FMODE_READ))
3682                 return false;
3683         rpc_restart_call_prepare(task);
3684         return true;
3685 }
3686
3687 static int nfs4_read_done(struct rpc_task *task, struct nfs_read_data *data)
3688 {
3689
3690         dprintk("--> %s\n", __func__);
3691
3692         if (!nfs4_sequence_done(task, &data->res.seq_res))
3693                 return -EAGAIN;
3694         if (nfs4_read_stateid_changed(task, &data->args))
3695                 return -EAGAIN;
3696         return data->read_done_cb ? data->read_done_cb(task, data) :
3697                                     nfs4_read_done_cb(task, data);
3698 }
3699
3700 static void nfs4_proc_read_setup(struct nfs_read_data *data, struct rpc_message *msg)
3701 {
3702         data->timestamp   = jiffies;
3703         data->read_done_cb = nfs4_read_done_cb;
3704         msg->rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_READ];
3705         nfs41_init_sequence(&data->args.seq_args, &data->res.seq_res, 0);
3706 }
3707
3708 static void nfs4_proc_read_rpc_prepare(struct rpc_task *task, struct nfs_read_data *data)
3709 {
3710         if (nfs4_setup_sequence(NFS_SERVER(data->header->inode),
3711                         &data->args.seq_args,
3712                         &data->res.seq_res,
3713                         task))
3714                 return;
3715         nfs4_set_rw_stateid(&data->args.stateid, data->args.context,
3716                         data->args.lock_context, FMODE_READ);
3717 }
3718
3719 static int nfs4_write_done_cb(struct rpc_task *task, struct nfs_write_data *data)
3720 {
3721         struct inode *inode = data->header->inode;
3722         
3723         if (nfs4_async_handle_error(task, NFS_SERVER(inode), data->args.context->state) == -EAGAIN) {
3724                 rpc_restart_call_prepare(task);
3725                 return -EAGAIN;
3726         }
3727         if (task->tk_status >= 0) {
3728                 renew_lease(NFS_SERVER(inode), data->timestamp);
3729                 nfs_post_op_update_inode_force_wcc(inode, &data->fattr);
3730         }
3731         return 0;
3732 }
3733
3734 static bool nfs4_write_stateid_changed(struct rpc_task *task,
3735                 struct nfs_writeargs *args)
3736 {
3737
3738         if (!nfs4_error_stateid_expired(task->tk_status) ||
3739                 nfs4_stateid_is_current(&args->stateid,
3740                                 args->context,
3741                                 args->lock_context,
3742                                 FMODE_WRITE))
3743                 return false;
3744         rpc_restart_call_prepare(task);
3745         return true;
3746 }
3747
3748 static int nfs4_write_done(struct rpc_task *task, struct nfs_write_data *data)
3749 {
3750         if (!nfs4_sequence_done(task, &data->res.seq_res))
3751                 return -EAGAIN;
3752         if (nfs4_write_stateid_changed(task, &data->args))
3753                 return -EAGAIN;
3754         return data->write_done_cb ? data->write_done_cb(task, data) :
3755                 nfs4_write_done_cb(task, data);
3756 }
3757
3758 static
3759 bool nfs4_write_need_cache_consistency_data(const struct nfs_write_data *data)
3760 {
3761         const struct nfs_pgio_header *hdr = data->header;
3762
3763         /* Don't request attributes for pNFS or O_DIRECT writes */
3764         if (data->ds_clp != NULL || hdr->dreq != NULL)
3765                 return false;
3766         /* Otherwise, request attributes if and only if we don't hold
3767          * a delegation
3768          */
3769         return nfs4_have_delegation(hdr->inode, FMODE_READ) == 0;
3770 }
3771
3772 static void nfs4_proc_write_setup(struct nfs_write_data *data, struct rpc_message *msg)
3773 {
3774         struct nfs_server *server = NFS_SERVER(data->header->inode);
3775
3776         if (!nfs4_write_need_cache_consistency_data(data)) {
3777                 data->args.bitmask = NULL;
3778                 data->res.fattr = NULL;
3779         } else
3780                 data->args.bitmask = server->cache_consistency_bitmask;
3781
3782         if (!data->write_done_cb)
3783                 data->write_done_cb = nfs4_write_done_cb;
3784         data->res.server = server;
3785         data->timestamp   = jiffies;
3786
3787         msg->rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_WRITE];
3788         nfs41_init_sequence(&data->args.seq_args, &data->res.seq_res, 1);
3789 }
3790
3791 static void nfs4_proc_write_rpc_prepare(struct rpc_task *task, struct nfs_write_data *data)
3792 {
3793         if (nfs4_setup_sequence(NFS_SERVER(data->header->inode),
3794                         &data->args.seq_args,
3795                         &data->res.seq_res,
3796                         task))
3797                 return;
3798         nfs4_set_rw_stateid(&data->args.stateid, data->args.context,
3799                         data->args.lock_context, FMODE_WRITE);
3800 }
3801
3802 static void nfs4_proc_commit_rpc_prepare(struct rpc_task *task, struct nfs_commit_data *data)
3803 {
3804         nfs4_setup_sequence(NFS_SERVER(data->inode),
3805                         &data->args.seq_args,
3806                         &data->res.seq_res,
3807                         task);
3808 }
3809
3810 static int nfs4_commit_done_cb(struct rpc_task *task, struct nfs_commit_data *data)
3811 {
3812         struct inode *inode = data->inode;
3813
3814         if (nfs4_async_handle_error(task, NFS_SERVER(inode), NULL) == -EAGAIN) {
3815                 rpc_restart_call_prepare(task);
3816                 return -EAGAIN;
3817         }
3818         return 0;
3819 }
3820
3821 static int nfs4_commit_done(struct rpc_task *task, struct nfs_commit_data *data)
3822 {
3823         if (!nfs4_sequence_done(task, &data->res.seq_res))
3824                 return -EAGAIN;
3825         return data->commit_done_cb(task, data);
3826 }
3827
3828 static void nfs4_proc_commit_setup(struct nfs_commit_data *data, struct rpc_message *msg)
3829 {
3830         struct nfs_server *server = NFS_SERVER(data->inode);
3831
3832         if (data->commit_done_cb == NULL)
3833                 data->commit_done_cb = nfs4_commit_done_cb;
3834         data->res.server = server;
3835         msg->rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_COMMIT];
3836         nfs41_init_sequence(&data->args.seq_args, &data->res.seq_res, 1);
3837 }
3838
3839 struct nfs4_renewdata {
3840         struct nfs_client       *client;
3841         unsigned long           timestamp;
3842 };
3843
3844 /*
3845  * nfs4_proc_async_renew(): This is not one of the nfs_rpc_ops; it is a special
3846  * standalone procedure for queueing an asynchronous RENEW.
3847  */
3848 static void nfs4_renew_release(void *calldata)
3849 {
3850         struct nfs4_renewdata *data = calldata;
3851         struct nfs_client *clp = data->client;
3852
3853         if (atomic_read(&clp->cl_count) > 1)
3854                 nfs4_schedule_state_renewal(clp);
3855         nfs_put_client(clp);
3856         kfree(data);
3857 }
3858
3859 static void nfs4_renew_done(struct rpc_task *task, void *calldata)
3860 {
3861         struct nfs4_renewdata *data = calldata;
3862         struct nfs_client *clp = data->client;
3863         unsigned long timestamp = data->timestamp;
3864
3865         if (task->tk_status < 0) {
3866                 /* Unless we're shutting down, schedule state recovery! */
3867                 if (test_bit(NFS_CS_RENEWD, &clp->cl_res_state) == 0)
3868                         return;
3869                 if (task->tk_status != NFS4ERR_CB_PATH_DOWN) {
3870                         nfs4_schedule_lease_recovery(clp);
3871                         return;
3872                 }
3873                 nfs4_schedule_path_down_recovery(clp);
3874         }
3875         do_renew_lease(clp, timestamp);
3876 }
3877
3878 static const struct rpc_call_ops nfs4_renew_ops = {
3879         .rpc_call_done = nfs4_renew_done,
3880         .rpc_release = nfs4_renew_release,
3881 };
3882
3883 static int nfs4_proc_async_renew(struct nfs_client *clp, struct rpc_cred *cred, unsigned renew_flags)
3884 {
3885         struct rpc_message msg = {
3886                 .rpc_proc       = &nfs4_procedures[NFSPROC4_CLNT_RENEW],
3887                 .rpc_argp       = clp,
3888                 .rpc_cred       = cred,
3889         };
3890         struct nfs4_renewdata *data;
3891
3892         if (renew_flags == 0)
3893                 return 0;
3894         if (!atomic_inc_not_zero(&clp->cl_count))
3895                 return -EIO;
3896         data = kmalloc(sizeof(*data), GFP_NOFS);
3897         if (data == NULL)
3898                 return -ENOMEM;
3899         data->client = clp;
3900         data->timestamp = jiffies;
3901         return rpc_call_async(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT,
3902                         &nfs4_renew_ops, data);
3903 }
3904
3905 static int nfs4_proc_renew(struct nfs_client *clp, struct rpc_cred *cred)
3906 {
3907         struct rpc_message msg = {
3908                 .rpc_proc       = &nfs4_procedures[NFSPROC4_CLNT_RENEW],
3909                 .rpc_argp       = clp,
3910                 .rpc_cred       = cred,
3911         };
3912         unsigned long now = jiffies;
3913         int status;
3914
3915         status = rpc_call_sync(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
3916         if (status < 0)
3917                 return status;
3918         do_renew_lease(clp, now);
3919         return 0;
3920 }
3921
3922 static inline int nfs4_server_supports_acls(struct nfs_server *server)
3923 {
3924         return (server->caps & NFS_CAP_ACLS)
3925                 && (server->acl_bitmask & ACL4_SUPPORT_ALLOW_ACL)
3926                 && (server->acl_bitmask & ACL4_SUPPORT_DENY_ACL);
3927 }
3928
3929 /* Assuming that XATTR_SIZE_MAX is a multiple of PAGE_SIZE, and that
3930  * it's OK to put sizeof(void) * (XATTR_SIZE_MAX/PAGE_SIZE) bytes on
3931  * the stack.
3932  */
3933 #define NFS4ACL_MAXPAGES DIV_ROUND_UP(XATTR_SIZE_MAX, PAGE_SIZE)
3934
3935 static int buf_to_pages_noslab(const void *buf, size_t buflen,
3936                 struct page **pages, unsigned int *pgbase)
3937 {
3938         struct page *newpage, **spages;
3939         int rc = 0;
3940         size_t len;
3941         spages = pages;
3942
3943         do {
3944                 len = min_t(size_t, PAGE_SIZE, buflen);
3945                 newpage = alloc_page(GFP_KERNEL);
3946
3947                 if (newpage == NULL)
3948                         goto unwind;
3949                 memcpy(page_address(newpage), buf, len);
3950                 buf += len;
3951                 buflen -= len;
3952                 *pages++ = newpage;
3953                 rc++;
3954         } while (buflen != 0);
3955
3956         return rc;
3957
3958 unwind:
3959         for(; rc > 0; rc--)
3960                 __free_page(spages[rc-1]);
3961         return -ENOMEM;
3962 }
3963
3964 struct nfs4_cached_acl {
3965         int cached;
3966         size_t len;
3967         char data[0];
3968 };
3969
3970 static void nfs4_set_cached_acl(struct inode *inode, struct nfs4_cached_acl *acl)
3971 {
3972         struct nfs_inode *nfsi = NFS_I(inode);
3973
3974         spin_lock(&inode->i_lock);
3975         kfree(nfsi->nfs4_acl);
3976         nfsi->nfs4_acl = acl;
3977         spin_unlock(&inode->i_lock);
3978 }
3979
3980 static void nfs4_zap_acl_attr(struct inode *inode)
3981 {
3982         nfs4_set_cached_acl(inode, NULL);
3983 }
3984
3985 static inline ssize_t nfs4_read_cached_acl(struct inode *inode, char *buf, size_t buflen)
3986 {
3987         struct nfs_inode *nfsi = NFS_I(inode);
3988         struct nfs4_cached_acl *acl;
3989         int ret = -ENOENT;
3990
3991         spin_lock(&inode->i_lock);
3992         acl = nfsi->nfs4_acl;
3993         if (acl == NULL)
3994                 goto out;
3995         if (buf == NULL) /* user is just asking for length */
3996                 goto out_len;
3997         if (acl->cached == 0)
3998                 goto out;
3999         ret = -ERANGE; /* see getxattr(2) man page */
4000         if (acl->len > buflen)
4001                 goto out;
4002         memcpy(buf, acl->data, acl->len);
4003 out_len:
4004         ret = acl->len;
4005 out:
4006         spin_unlock(&inode->i_lock);
4007         return ret;
4008 }
4009
4010 static void nfs4_write_cached_acl(struct inode *inode, struct page **pages, size_t pgbase, size_t acl_len)
4011 {
4012         struct nfs4_cached_acl *acl;
4013         size_t buflen = sizeof(*acl) + acl_len;
4014
4015         if (buflen <= PAGE_SIZE) {
4016                 acl = kmalloc(buflen, GFP_KERNEL);
4017                 if (acl == NULL)
4018                         goto out;
4019                 acl->cached = 1;
4020                 _copy_from_pages(acl->data, pages, pgbase, acl_len);
4021         } else {
4022                 acl = kmalloc(sizeof(*acl), GFP_KERNEL);
4023                 if (acl == NULL)
4024                         goto out;
4025                 acl->cached = 0;
4026         }
4027         acl->len = acl_len;
4028 out:
4029         nfs4_set_cached_acl(inode, acl);
4030 }
4031
4032 /*
4033  * The getxattr API returns the required buffer length when called with a
4034  * NULL buf. The NFSv4 acl tool then calls getxattr again after allocating
4035  * the required buf.  On a NULL buf, we send a page of data to the server
4036  * guessing that the ACL request can be serviced by a page. If so, we cache
4037  * up to the page of ACL data, and the 2nd call to getxattr is serviced by
4038  * the cache. If not so, we throw away the page, and cache the required
4039  * length. The next getxattr call will then produce another round trip to
4040  * the server, this time with the input buf of the required size.
4041  */
4042 static ssize_t __nfs4_get_acl_uncached(struct inode *inode, void *buf, size_t buflen)
4043 {
4044         struct page *pages[NFS4ACL_MAXPAGES] = {NULL, };
4045         struct nfs_getaclargs args = {
4046                 .fh = NFS_FH(inode),
4047                 .acl_pages = pages,
4048                 .acl_len = buflen,
4049         };
4050         struct nfs_getaclres res = {
4051                 .acl_len = buflen,
4052         };
4053         struct rpc_message msg = {
4054                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_GETACL],
4055                 .rpc_argp = &args,
4056                 .rpc_resp = &res,
4057         };
4058         unsigned int npages = DIV_ROUND_UP(buflen, PAGE_SIZE);
4059         int ret = -ENOMEM, i;
4060
4061         /* As long as we're doing a round trip to the server anyway,
4062          * let's be prepared for a page of acl data. */
4063         if (npages == 0)
4064                 npages = 1;
4065         if (npages > ARRAY_SIZE(pages))
4066                 return -ERANGE;
4067
4068         for (i = 0; i < npages; i++) {
4069                 pages[i] = alloc_page(GFP_KERNEL);
4070                 if (!pages[i])
4071                         goto out_free;
4072         }
4073
4074         /* for decoding across pages */
4075         res.acl_scratch = alloc_page(GFP_KERNEL);
4076         if (!res.acl_scratch)
4077                 goto out_free;
4078
4079         args.acl_len = npages * PAGE_SIZE;
4080         args.acl_pgbase = 0;
4081
4082         dprintk("%s  buf %p buflen %zu npages %d args.acl_len %zu\n",
4083                 __func__, buf, buflen, npages, args.acl_len);
4084         ret = nfs4_call_sync(NFS_SERVER(inode)->client, NFS_SERVER(inode),
4085                              &msg, &args.seq_args, &res.seq_res, 0);
4086         if (ret)
4087                 goto out_free;
4088
4089         /* Handle the case where the passed-in buffer is too short */
4090         if (res.acl_flags & NFS4_ACL_TRUNC) {
4091                 /* Did the user only issue a request for the acl length? */
4092                 if (buf == NULL)
4093                         goto out_ok;
4094                 ret = -ERANGE;
4095                 goto out_free;
4096         }
4097         nfs4_write_cached_acl(inode, pages, res.acl_data_offset, res.acl_len);
4098         if (buf) {
4099                 if (res.acl_len > buflen) {
4100                         ret = -ERANGE;
4101                         goto out_free;
4102                 }
4103                 _copy_from_pages(buf, pages, res.acl_data_offset, res.acl_len);
4104         }
4105 out_ok:
4106         ret = res.acl_len;
4107 out_free:
4108         for (i = 0; i < npages; i++)
4109                 if (pages[i])
4110                         __free_page(pages[i]);
4111         if (res.acl_scratch)
4112                 __free_page(res.acl_scratch);
4113         return ret;
4114 }
4115
4116 static ssize_t nfs4_get_acl_uncached(struct inode *inode, void *buf, size_t buflen)
4117 {
4118         struct nfs4_exception exception = { };
4119         ssize_t ret;
4120         do {
4121                 ret = __nfs4_get_acl_uncached(inode, buf, buflen);
4122                 if (ret >= 0)
4123                         break;
4124                 ret = nfs4_handle_exception(NFS_SERVER(inode), ret, &exception);
4125         } while (exception.retry);
4126         return ret;
4127 }
4128
4129 static ssize_t nfs4_proc_get_acl(struct inode *inode, void *buf, size_t buflen)
4130 {
4131         struct nfs_server *server = NFS_SERVER(inode);
4132         int ret;
4133
4134         if (!nfs4_server_supports_acls(server))
4135                 return -EOPNOTSUPP;
4136         ret = nfs_revalidate_inode(server, inode);
4137         if (ret < 0)
4138                 return ret;
4139         if (NFS_I(inode)->cache_validity & NFS_INO_INVALID_ACL)
4140                 nfs_zap_acl_cache(inode);
4141         ret = nfs4_read_cached_acl(inode, buf, buflen);
4142         if (ret != -ENOENT)
4143                 /* -ENOENT is returned if there is no ACL or if there is an ACL
4144                  * but no cached acl data, just the acl length */
4145                 return ret;
4146         return nfs4_get_acl_uncached(inode, buf, buflen);
4147 }
4148
4149 static int __nfs4_proc_set_acl(struct inode *inode, const void *buf, size_t buflen)
4150 {
4151         struct nfs_server *server = NFS_SERVER(inode);
4152         struct page *pages[NFS4ACL_MAXPAGES];
4153         struct nfs_setaclargs arg = {
4154                 .fh             = NFS_FH(inode),
4155                 .acl_pages      = pages,
4156                 .acl_len        = buflen,
4157         };
4158         struct nfs_setaclres res;
4159         struct rpc_message msg = {
4160                 .rpc_proc       = &nfs4_procedures[NFSPROC4_CLNT_SETACL],
4161                 .rpc_argp       = &arg,
4162                 .rpc_resp       = &res,
4163         };
4164         unsigned int npages = DIV_ROUND_UP(buflen, PAGE_SIZE);
4165         int ret, i;
4166
4167         if (!nfs4_server_supports_acls(server))
4168                 return -EOPNOTSUPP;
4169         if (npages > ARRAY_SIZE(pages))
4170                 return -ERANGE;
4171         i = buf_to_pages_noslab(buf, buflen, arg.acl_pages, &arg.acl_pgbase);
4172         if (i < 0)
4173                 return i;
4174         nfs4_inode_return_delegation(inode);
4175         ret = nfs4_call_sync(server->client, server, &msg, &arg.seq_args, &res.seq_res, 1);
4176
4177         /*
4178          * Free each page after tx, so the only ref left is
4179          * held by the network stack
4180          */
4181         for (; i > 0; i--)
4182                 put_page(pages[i-1]);
4183
4184         /*
4185          * Acl update can result in inode attribute update.
4186          * so mark the attribute cache invalid.
4187          */
4188         spin_lock(&inode->i_lock);
4189         NFS_I(inode)->cache_validity |= NFS_INO_INVALID_ATTR;
4190         spin_unlock(&inode->i_lock);
4191         nfs_access_zap_cache(inode);
4192         nfs_zap_acl_cache(inode);
4193         return ret;
4194 }
4195
4196 static int nfs4_proc_set_acl(struct inode *inode, const void *buf, size_t buflen)
4197 {
4198         struct nfs4_exception exception = { };
4199         int err;
4200         do {
4201                 err = nfs4_handle_exception(NFS_SERVER(inode),
4202                                 __nfs4_proc_set_acl(inode, buf, buflen),
4203                                 &exception);
4204         } while (exception.retry);
4205         return err;
4206 }
4207
4208 static int
4209 nfs4_async_handle_error(struct rpc_task *task, const struct nfs_server *server, struct nfs4_state *state)
4210 {
4211         struct nfs_client *clp = server->nfs_client;
4212
4213         if (task->tk_status >= 0)
4214                 return 0;
4215         switch(task->tk_status) {
4216                 case -NFS4ERR_DELEG_REVOKED:
4217                 case -NFS4ERR_ADMIN_REVOKED:
4218                 case -NFS4ERR_BAD_STATEID:
4219                         if (state == NULL)
4220                                 break;
4221                         nfs_remove_bad_delegation(state->inode);
4222                 case -NFS4ERR_OPENMODE:
4223                         if (state == NULL)
4224                                 break;
4225                         if (nfs4_schedule_stateid_recovery(server, state) < 0)
4226                                 goto stateid_invalid;
4227                         goto wait_on_recovery;
4228                 case -NFS4ERR_EXPIRED:
4229                         if (state != NULL) {
4230                                 if (nfs4_schedule_stateid_recovery(server, state) < 0)
4231                                         goto stateid_invalid;
4232                         }
4233                 case -NFS4ERR_STALE_STATEID:
4234                 case -NFS4ERR_STALE_CLIENTID:
4235                         nfs4_schedule_lease_recovery(clp);
4236                         goto wait_on_recovery;
4237 #if defined(CONFIG_NFS_V4_1)
4238                 case -NFS4ERR_BADSESSION:
4239                 case -NFS4ERR_BADSLOT:
4240                 case -NFS4ERR_BAD_HIGH_SLOT:
4241                 case -NFS4ERR_DEADSESSION:
4242                 case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION:
4243                 case -NFS4ERR_SEQ_FALSE_RETRY:
4244                 case -NFS4ERR_SEQ_MISORDERED:
4245                         dprintk("%s ERROR %d, Reset session\n", __func__,
4246                                 task->tk_status);
4247                         nfs4_schedule_session_recovery(clp->cl_session, task->tk_status);
4248                         task->tk_status = 0;
4249                         return -EAGAIN;
4250 #endif /* CONFIG_NFS_V4_1 */
4251                 case -NFS4ERR_DELAY:
4252                         nfs_inc_server_stats(server, NFSIOS_DELAY);
4253                 case -NFS4ERR_GRACE:
4254                         rpc_delay(task, NFS4_POLL_RETRY_MAX);
4255                         task->tk_status = 0;
4256                         return -EAGAIN;
4257                 case -NFS4ERR_RETRY_UNCACHED_REP:
4258                 case -NFS4ERR_OLD_STATEID:
4259                         task->tk_status = 0;
4260                         return -EAGAIN;
4261         }
4262         task->tk_status = nfs4_map_errors(task->tk_status);
4263         return 0;
4264 stateid_invalid:
4265         task->tk_status = -EIO;
4266         return 0;
4267 wait_on_recovery:
4268         rpc_sleep_on(&clp->cl_rpcwaitq, task, NULL);
4269         if (test_bit(NFS4CLNT_MANAGER_RUNNING, &clp->cl_state) == 0)
4270                 rpc_wake_up_queued_task(&clp->cl_rpcwaitq, task);
4271         task->tk_status = 0;
4272         return -EAGAIN;
4273 }
4274
4275 static void nfs4_init_boot_verifier(const struct nfs_client *clp,
4276                                     nfs4_verifier *bootverf)
4277 {
4278         __be32 verf[2];
4279
4280         if (test_bit(NFS4CLNT_PURGE_STATE, &clp->cl_state)) {
4281                 /* An impossible timestamp guarantees this value
4282                  * will never match a generated boot time. */
4283                 verf[0] = 0;
4284                 verf[1] = (__be32)(NSEC_PER_SEC + 1);
4285         } else {
4286                 struct nfs_net *nn = net_generic(clp->cl_net, nfs_net_id);
4287                 verf[0] = (__be32)nn->boot_time.tv_sec;
4288                 verf[1] = (__be32)nn->boot_time.tv_nsec;
4289         }
4290         memcpy(bootverf->data, verf, sizeof(bootverf->data));
4291 }
4292
4293 static unsigned int
4294 nfs4_init_nonuniform_client_string(const struct nfs_client *clp,
4295                                    char *buf, size_t len)
4296 {
4297         unsigned int result;
4298
4299         rcu_read_lock();
4300         result = scnprintf(buf, len, "Linux NFSv4.0 %s/%s %s",
4301                                 clp->cl_ipaddr,
4302                                 rpc_peeraddr2str(clp->cl_rpcclient,
4303                                                         RPC_DISPLAY_ADDR),
4304                                 rpc_peeraddr2str(clp->cl_rpcclient,
4305                                                         RPC_DISPLAY_PROTO));
4306         rcu_read_unlock();
4307         return result;
4308 }
4309
4310 static unsigned int
4311 nfs4_init_uniform_client_string(const struct nfs_client *clp,
4312                                 char *buf, size_t len)
4313 {
4314         char *nodename = clp->cl_rpcclient->cl_nodename;
4315
4316         if (nfs4_client_id_uniquifier[0] != '\0')
4317                 nodename = nfs4_client_id_uniquifier;
4318         return scnprintf(buf, len, "Linux NFSv%u.%u %s",
4319                                 clp->rpc_ops->version, clp->cl_minorversion,
4320                                 nodename);
4321 }
4322
4323 /**
4324  * nfs4_proc_setclientid - Negotiate client ID
4325  * @clp: state data structure
4326  * @program: RPC program for NFSv4 callback service
4327  * @port: IP port number for NFS4 callback service
4328  * @cred: RPC credential to use for this call
4329  * @res: where to place the result
4330  *
4331  * Returns zero, a negative errno, or a negative NFS4ERR status code.
4332  */
4333 int nfs4_proc_setclientid(struct nfs_client *clp, u32 program,
4334                 unsigned short port, struct rpc_cred *cred,
4335                 struct nfs4_setclientid_res *res)
4336 {
4337         nfs4_verifier sc_verifier;
4338         struct nfs4_setclientid setclientid = {
4339                 .sc_verifier = &sc_verifier,
4340                 .sc_prog = program,
4341                 .sc_cb_ident = clp->cl_cb_ident,
4342         };
4343         struct rpc_message msg = {
4344                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SETCLIENTID],
4345                 .rpc_argp = &setclientid,
4346                 .rpc_resp = res,
4347                 .rpc_cred = cred,
4348         };
4349         int status;
4350
4351         /* nfs_client_id4 */
4352         nfs4_init_boot_verifier(clp, &sc_verifier);
4353         if (test_bit(NFS_CS_MIGRATION, &clp->cl_flags))
4354                 setclientid.sc_name_len =
4355                                 nfs4_init_uniform_client_string(clp,
4356                                                 setclientid.sc_name,
4357                                                 sizeof(setclientid.sc_name));
4358         else
4359                 setclientid.sc_name_len =
4360                                 nfs4_init_nonuniform_client_string(clp,
4361                                                 setclientid.sc_name,
4362                                                 sizeof(setclientid.sc_name));
4363         /* cb_client4 */
4364         rcu_read_lock();
4365         setclientid.sc_netid_len = scnprintf(setclientid.sc_netid,
4366                                 sizeof(setclientid.sc_netid),
4367                                 rpc_peeraddr2str(clp->cl_rpcclient,
4368                                                         RPC_DISPLAY_NETID));
4369         rcu_read_unlock();
4370         setclientid.sc_uaddr_len = scnprintf(setclientid.sc_uaddr,
4371                                 sizeof(setclientid.sc_uaddr), "%s.%u.%u",
4372                                 clp->cl_ipaddr, port >> 8, port & 255);
4373
4374         dprintk("NFS call  setclientid auth=%s, '%.*s'\n",
4375                 clp->cl_rpcclient->cl_auth->au_ops->au_name,
4376                 setclientid.sc_name_len, setclientid.sc_name);
4377         status = rpc_call_sync(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
4378         dprintk("NFS reply setclientid: %d\n", status);
4379         return status;
4380 }
4381
4382 /**
4383  * nfs4_proc_setclientid_confirm - Confirm client ID
4384  * @clp: state data structure
4385  * @res: result of a previous SETCLIENTID
4386  * @cred: RPC credential to use for this call
4387  *
4388  * Returns zero, a negative errno, or a negative NFS4ERR status code.
4389  */
4390 int nfs4_proc_setclientid_confirm(struct nfs_client *clp,
4391                 struct nfs4_setclientid_res *arg,
4392                 struct rpc_cred *cred)
4393 {
4394         struct rpc_message msg = {
4395                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SETCLIENTID_CONFIRM],
4396                 .rpc_argp = arg,
4397                 .rpc_cred = cred,
4398         };
4399         int status;
4400
4401         dprintk("NFS call  setclientid_confirm auth=%s, (client ID %llx)\n",
4402                 clp->cl_rpcclient->cl_auth->au_ops->au_name,
4403                 clp->cl_clientid);
4404         status = rpc_call_sync(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
4405         dprintk("NFS reply setclientid_confirm: %d\n", status);
4406         return status;
4407 }
4408
4409 struct nfs4_delegreturndata {
4410         struct nfs4_delegreturnargs args;
4411         struct nfs4_delegreturnres res;
4412         struct nfs_fh fh;
4413         nfs4_stateid stateid;
4414         unsigned long timestamp;
4415         struct nfs_fattr fattr;
4416         int rpc_status;
4417 };
4418
4419 static void nfs4_delegreturn_done(struct rpc_task *task, void *calldata)
4420 {
4421         struct nfs4_delegreturndata *data = calldata;
4422
4423         if (!nfs4_sequence_done(task, &data->res.seq_res))
4424                 return;
4425
4426         switch (task->tk_status) {
4427         case -NFS4ERR_STALE_STATEID:
4428         case -NFS4ERR_EXPIRED:
4429         case 0:
4430                 renew_lease(data->res.server, data->timestamp);
4431                 break;
4432         default:
4433                 if (nfs4_async_handle_error(task, data->res.server, NULL) ==
4434                                 -EAGAIN) {
4435                         rpc_restart_call_prepare(task);
4436                         return;
4437                 }
4438         }
4439         data->rpc_status = task->tk_status;
4440 }
4441
4442 static void nfs4_delegreturn_release(void *calldata)
4443 {
4444         kfree(calldata);
4445 }
4446
4447 #if defined(CONFIG_NFS_V4_1)
4448 static void nfs4_delegreturn_prepare(struct rpc_task *task, void *data)
4449 {
4450         struct nfs4_delegreturndata *d_data;
4451
4452         d_data = (struct nfs4_delegreturndata *)data;
4453
4454         nfs4_setup_sequence(d_data->res.server,
4455                         &d_data->args.seq_args,
4456                         &d_data->res.seq_res,
4457                         task);
4458 }
4459 #endif /* CONFIG_NFS_V4_1 */
4460
4461 static const struct rpc_call_ops nfs4_delegreturn_ops = {
4462 #if defined(CONFIG_NFS_V4_1)
4463         .rpc_call_prepare = nfs4_delegreturn_prepare,
4464 #endif /* CONFIG_NFS_V4_1 */
4465         .rpc_call_done = nfs4_delegreturn_done,
4466         .rpc_release = nfs4_delegreturn_release,
4467 };
4468
4469 static int _nfs4_proc_delegreturn(struct inode *inode, struct rpc_cred *cred, const nfs4_stateid *stateid, int issync)
4470 {
4471         struct nfs4_delegreturndata *data;
4472         struct nfs_server *server = NFS_SERVER(inode);
4473         struct rpc_task *task;
4474         struct rpc_message msg = {
4475                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_DELEGRETURN],
4476                 .rpc_cred = cred,
4477         };
4478         struct rpc_task_setup task_setup_data = {
4479                 .rpc_client = server->client,
4480                 .rpc_message = &msg,
4481                 .callback_ops = &nfs4_delegreturn_ops,
4482                 .flags = RPC_TASK_ASYNC,
4483         };
4484         int status = 0;
4485
4486         data = kzalloc(sizeof(*data), GFP_NOFS);
4487         if (data == NULL)
4488                 return -ENOMEM;
4489         nfs41_init_sequence(&data->args.seq_args, &data->res.seq_res, 1);
4490         data->args.fhandle = &data->fh;
4491         data->args.stateid = &data->stateid;
4492         data->args.bitmask = server->cache_consistency_bitmask;
4493         nfs_copy_fh(&data->fh, NFS_FH(inode));
4494         nfs4_stateid_copy(&data->stateid, stateid);
4495         data->res.fattr = &data->fattr;
4496         data->res.server = server;
4497         nfs_fattr_init(data->res.fattr);
4498         data->timestamp = jiffies;
4499         data->rpc_status = 0;
4500
4501         task_setup_data.callback_data = data;
4502         msg.rpc_argp = &data->args;
4503         msg.rpc_resp = &data->res;
4504         task = rpc_run_task(&task_setup_data);
4505         if (IS_ERR(task))
4506                 return PTR_ERR(task);
4507         if (!issync)
4508                 goto out;
4509         status = nfs4_wait_for_completion_rpc_task(task);
4510         if (status != 0)
4511                 goto out;
4512         status = data->rpc_status;
4513         if (status == 0)
4514                 nfs_post_op_update_inode_force_wcc(inode, &data->fattr);
4515         else
4516                 nfs_refresh_inode(inode, &data->fattr);
4517 out:
4518         rpc_put_task(task);
4519         return status;
4520 }
4521
4522 int nfs4_proc_delegreturn(struct inode *inode, struct rpc_cred *cred, const nfs4_stateid *stateid, int issync)
4523 {
4524         struct nfs_server *server = NFS_SERVER(inode);
4525         struct nfs4_exception exception = { };
4526         int err;
4527         do {
4528                 err = _nfs4_proc_delegreturn(inode, cred, stateid, issync);
4529                 switch (err) {
4530                         case -NFS4ERR_STALE_STATEID:
4531                         case -NFS4ERR_EXPIRED:
4532                         case 0:
4533                                 return 0;
4534                 }
4535                 err = nfs4_handle_exception(server, err, &exception);
4536         } while (exception.retry);
4537         return err;
4538 }
4539
4540 #define NFS4_LOCK_MINTIMEOUT (1 * HZ)
4541 #define NFS4_LOCK_MAXTIMEOUT (30 * HZ)
4542
4543 /* 
4544  * sleep, with exponential backoff, and retry the LOCK operation. 
4545  */
4546 static unsigned long
4547 nfs4_set_lock_task_retry(unsigned long timeout)
4548 {
4549         freezable_schedule_timeout_killable(timeout);
4550         timeout <<= 1;
4551         if (timeout > NFS4_LOCK_MAXTIMEOUT)
4552                 return NFS4_LOCK_MAXTIMEOUT;
4553         return timeout;
4554 }
4555
4556 static int _nfs4_proc_getlk(struct nfs4_state *state, int cmd, struct file_lock *request)
4557 {
4558         struct inode *inode = state->inode;
4559         struct nfs_server *server = NFS_SERVER(inode);
4560         struct nfs_client *clp = server->nfs_client;
4561         struct nfs_lockt_args arg = {
4562                 .fh = NFS_FH(inode),
4563                 .fl = request,
4564         };
4565         struct nfs_lockt_res res = {
4566                 .denied = request,
4567         };
4568         struct rpc_message msg = {
4569                 .rpc_proc       = &nfs4_procedures[NFSPROC4_CLNT_LOCKT],
4570                 .rpc_argp       = &arg,
4571                 .rpc_resp       = &res,
4572                 .rpc_cred       = state->owner->so_cred,
4573         };
4574         struct nfs4_lock_state *lsp;
4575         int status;
4576
4577         arg.lock_owner.clientid = clp->cl_clientid;
4578         status = nfs4_set_lock_state(state, request);
4579         if (status != 0)
4580                 goto out;
4581         lsp = request->fl_u.nfs4_fl.owner;
4582         arg.lock_owner.id = lsp->ls_seqid.owner_id;
4583         arg.lock_owner.s_dev = server->s_dev;
4584         status = nfs4_call_sync(server->client, server, &msg, &arg.seq_args, &res.seq_res, 1);
4585         switch (status) {
4586                 case 0:
4587                         request->fl_type = F_UNLCK;
4588                         break;
4589                 case -NFS4ERR_DENIED:
4590                         status = 0;
4591         }
4592         request->fl_ops->fl_release_private(request);
4593 out:
4594         return status;
4595 }
4596
4597 static int nfs4_proc_getlk(struct nfs4_state *state, int cmd, struct file_lock *request)
4598 {
4599         struct nfs4_exception exception = { };
4600         int err;
4601
4602         do {
4603                 err = nfs4_handle_exception(NFS_SERVER(state->inode),
4604                                 _nfs4_proc_getlk(state, cmd, request),
4605                                 &exception);
4606         } while (exception.retry);
4607         return err;
4608 }
4609
4610 static int do_vfs_lock(struct file *file, struct file_lock *fl)
4611 {
4612         int res = 0;
4613         switch (fl->fl_flags & (FL_POSIX|FL_FLOCK)) {
4614                 case FL_POSIX:
4615                         res = posix_lock_file_wait(file, fl);
4616                         break;
4617                 case FL_FLOCK:
4618                         res = flock_lock_file_wait(file, fl);
4619                         break;
4620                 default:
4621                         BUG();
4622         }
4623         return res;
4624 }
4625
4626 struct nfs4_unlockdata {
4627         struct nfs_locku_args arg;
4628         struct nfs_locku_res res;
4629         struct nfs4_lock_state *lsp;
4630         struct nfs_open_context *ctx;
4631         struct file_lock fl;
4632         const struct nfs_server *server;
4633         unsigned long timestamp;
4634 };
4635
4636 static struct nfs4_unlockdata *nfs4_alloc_unlockdata(struct file_lock *fl,
4637                 struct nfs_open_context *ctx,
4638                 struct nfs4_lock_state *lsp,
4639                 struct nfs_seqid *seqid)
4640 {
4641         struct nfs4_unlockdata *p;
4642         struct inode *inode = lsp->ls_state->inode;
4643
4644         p = kzalloc(sizeof(*p), GFP_NOFS);
4645         if (p == NULL)
4646                 return NULL;
4647         p->arg.fh = NFS_FH(inode);
4648         p->arg.fl = &p->fl;
4649         p->arg.seqid = seqid;
4650         p->res.seqid = seqid;
4651         p->arg.stateid = &lsp->ls_stateid;
4652         p->lsp = lsp;
4653         atomic_inc(&lsp->ls_count);
4654         /* Ensure we don't close file until we're done freeing locks! */
4655         p->ctx = get_nfs_open_context(ctx);
4656         memcpy(&p->fl, fl, sizeof(p->fl));
4657         p->server = NFS_SERVER(inode);
4658         return p;
4659 }
4660
4661 static void nfs4_locku_release_calldata(void *data)
4662 {
4663         struct nfs4_unlockdata *calldata = data;
4664         nfs_free_seqid(calldata->arg.seqid);
4665         nfs4_put_lock_state(calldata->lsp);
4666         put_nfs_open_context(calldata->ctx);
4667         kfree(calldata);
4668 }
4669
4670 static void nfs4_locku_done(struct rpc_task *task, void *data)
4671 {
4672         struct nfs4_unlockdata *calldata = data;
4673
4674         if (!nfs4_sequence_done(task, &calldata->res.seq_res))
4675                 return;
4676         switch (task->tk_status) {
4677                 case 0:
4678                         nfs4_stateid_copy(&calldata->lsp->ls_stateid,
4679                                         &calldata->res.stateid);
4680                         renew_lease(calldata->server, calldata->timestamp);
4681                         break;
4682                 case -NFS4ERR_BAD_STATEID:
4683                 case -NFS4ERR_OLD_STATEID:
4684                 case -NFS4ERR_STALE_STATEID:
4685                 case -NFS4ERR_EXPIRED:
4686                         break;
4687                 default:
4688                         if (nfs4_async_handle_error(task, calldata->server, NULL) == -EAGAIN)
4689                                 rpc_restart_call_prepare(task);
4690         }
4691         nfs_release_seqid(calldata->arg.seqid);
4692 }
4693
4694 static void nfs4_locku_prepare(struct rpc_task *task, void *data)
4695 {
4696         struct nfs4_unlockdata *calldata = data;
4697
4698         if (nfs_wait_on_sequence(calldata->arg.seqid, task) != 0)
4699                 goto out_wait;
4700         if (test_bit(NFS_LOCK_INITIALIZED, &calldata->lsp->ls_flags) == 0) {
4701                 /* Note: exit _without_ running nfs4_locku_done */
4702                 goto out_no_action;
4703         }
4704         calldata->timestamp = jiffies;
4705         if (nfs4_setup_sequence(calldata->server,
4706                                 &calldata->arg.seq_args,
4707                                 &calldata->res.seq_res,
4708                                 task) != 0)
4709                 nfs_release_seqid(calldata->arg.seqid);
4710         return;
4711 out_no_action:
4712         task->tk_action = NULL;
4713 out_wait:
4714         nfs4_sequence_done(task, &calldata->res.seq_res);
4715 }
4716
4717 static const struct rpc_call_ops nfs4_locku_ops = {
4718         .rpc_call_prepare = nfs4_locku_prepare,
4719         .rpc_call_done = nfs4_locku_done,
4720         .rpc_release = nfs4_locku_release_calldata,
4721 };
4722
4723 static struct rpc_task *nfs4_do_unlck(struct file_lock *fl,
4724                 struct nfs_open_context *ctx,
4725                 struct nfs4_lock_state *lsp,
4726                 struct nfs_seqid *seqid)
4727 {
4728         struct nfs4_unlockdata *data;
4729         struct rpc_message msg = {
4730                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LOCKU],
4731                 .rpc_cred = ctx->cred,
4732         };
4733         struct rpc_task_setup task_setup_data = {
4734                 .rpc_client = NFS_CLIENT(lsp->ls_state->inode),
4735                 .rpc_message = &msg,
4736                 .callback_ops = &nfs4_locku_ops,
4737                 .workqueue = nfsiod_workqueue,
4738                 .flags = RPC_TASK_ASYNC,
4739         };
4740
4741         /* Ensure this is an unlock - when canceling a lock, the
4742          * canceled lock is passed in, and it won't be an unlock.
4743          */
4744         fl->fl_type = F_UNLCK;
4745
4746         data = nfs4_alloc_unlockdata(fl, ctx, lsp, seqid);
4747         if (data == NULL) {
4748                 nfs_free_seqid(seqid);
4749                 return ERR_PTR(-ENOMEM);
4750         }
4751
4752         nfs41_init_sequence(&data->arg.seq_args, &data->res.seq_res, 1);
4753         msg.rpc_argp = &data->arg;
4754         msg.rpc_resp = &data->res;
4755         task_setup_data.callback_data = data;
4756         return rpc_run_task(&task_setup_data);
4757 }
4758
4759 static int nfs4_proc_unlck(struct nfs4_state *state, int cmd, struct file_lock *request)
4760 {
4761         struct inode *inode = state->inode;
4762         struct nfs4_state_owner *sp = state->owner;
4763         struct nfs_inode *nfsi = NFS_I(inode);
4764         struct nfs_seqid *seqid;
4765         struct nfs4_lock_state *lsp;
4766         struct rpc_task *task;
4767         int status = 0;
4768         unsigned char fl_flags = request->fl_flags;
4769
4770         status = nfs4_set_lock_state(state, request);
4771         /* Unlock _before_ we do the RPC call */
4772         request->fl_flags |= FL_EXISTS;
4773         /* Exclude nfs_delegation_claim_locks() */
4774         mutex_lock(&sp->so_delegreturn_mutex);
4775         /* Exclude nfs4_reclaim_open_stateid() - note nesting! */
4776         down_read(&nfsi->rwsem);
4777         if (do_vfs_lock(request->fl_file, request) == -ENOENT) {
4778                 up_read(&nfsi->rwsem);
4779                 mutex_unlock(&sp->so_delegreturn_mutex);
4780                 goto out;
4781         }
4782         up_read(&nfsi->rwsem);
4783         mutex_unlock(&sp->so_delegreturn_mutex);
4784         if (status != 0)
4785                 goto out;
4786         /* Is this a delegated lock? */
4787         lsp = request->fl_u.nfs4_fl.owner;
4788         if (test_bit(NFS_LOCK_INITIALIZED, &lsp->ls_flags) == 0)
4789                 goto out;
4790         seqid = nfs_alloc_seqid(&lsp->ls_seqid, GFP_KERNEL);
4791         status = -ENOMEM;
4792         if (seqid == NULL)
4793                 goto out;
4794         task = nfs4_do_unlck(request, nfs_file_open_context(request->fl_file), lsp, seqid);
4795         status = PTR_ERR(task);
4796         if (IS_ERR(task))
4797                 goto out;
4798         status = nfs4_wait_for_completion_rpc_task(task);
4799         rpc_put_task(task);
4800 out:
4801         request->fl_flags = fl_flags;
4802         return status;
4803 }
4804
4805 struct nfs4_lockdata {
4806         struct nfs_lock_args arg;
4807         struct nfs_lock_res res;
4808         struct nfs4_lock_state *lsp;
4809         struct nfs_open_context *ctx;
4810         struct file_lock fl;
4811         unsigned long timestamp;
4812         int rpc_status;
4813         int cancelled;
4814         struct nfs_server *server;
4815 };
4816
4817 static struct nfs4_lockdata *nfs4_alloc_lockdata(struct file_lock *fl,
4818                 struct nfs_open_context *ctx, struct nfs4_lock_state *lsp,
4819                 gfp_t gfp_mask)
4820 {
4821         struct nfs4_lockdata *p;
4822         struct inode *inode = lsp->ls_state->inode;
4823         struct nfs_server *server = NFS_SERVER(inode);
4824
4825         p = kzalloc(sizeof(*p), gfp_mask);
4826         if (p == NULL)
4827                 return NULL;
4828
4829         p->arg.fh = NFS_FH(inode);
4830         p->arg.fl = &p->fl;
4831         p->arg.open_seqid = nfs_alloc_seqid(&lsp->ls_state->owner->so_seqid, gfp_mask);
4832         if (p->arg.open_seqid == NULL)
4833                 goto out_free;
4834         p->arg.lock_seqid = nfs_alloc_seqid(&lsp->ls_seqid, gfp_mask);
4835         if (p->arg.lock_seqid == NULL)
4836                 goto out_free_seqid;
4837         p->arg.lock_stateid = &lsp->ls_stateid;
4838         p->arg.lock_owner.clientid = server->nfs_client->cl_clientid;
4839         p->arg.lock_owner.id = lsp->ls_seqid.owner_id;
4840         p->arg.lock_owner.s_dev = server->s_dev;
4841         p->res.lock_seqid = p->arg.lock_seqid;
4842         p->lsp = lsp;
4843         p->server = server;
4844         atomic_inc(&lsp->ls_count);
4845         p->ctx = get_nfs_open_context(ctx);
4846         memcpy(&p->fl, fl, sizeof(p->fl));
4847         return p;
4848 out_free_seqid:
4849         nfs_free_seqid(p->arg.open_seqid);
4850 out_free:
4851         kfree(p);
4852         return NULL;
4853 }
4854
4855 static void nfs4_lock_prepare(struct rpc_task *task, void *calldata)
4856 {
4857         struct nfs4_lockdata *data = calldata;
4858         struct nfs4_state *state = data->lsp->ls_state;
4859
4860         dprintk("%s: begin!\n", __func__);
4861         if (nfs_wait_on_sequence(data->arg.lock_seqid, task) != 0)
4862                 goto out_wait;
4863         /* Do we need to do an open_to_lock_owner? */
4864         if (!(data->arg.lock_seqid->sequence->flags & NFS_SEQID_CONFIRMED)) {
4865                 if (nfs_wait_on_sequence(data->arg.open_seqid, task) != 0) {
4866                         goto out_release_lock_seqid;
4867                 }
4868                 data->arg.open_stateid = &state->open_stateid;
4869                 data->arg.new_lock_owner = 1;
4870                 data->res.open_seqid = data->arg.open_seqid;
4871         } else
4872                 data->arg.new_lock_owner = 0;
4873         if (!nfs4_valid_open_stateid(state)) {
4874                 data->rpc_status = -EBADF;
4875                 task->tk_action = NULL;
4876                 goto out_release_open_seqid;
4877         }
4878         data->timestamp = jiffies;
4879         if (nfs4_setup_sequence(data->server,
4880                                 &data->arg.seq_args,
4881                                 &data->res.seq_res,
4882                                 task) == 0)
4883                 return;
4884 out_release_open_seqid:
4885         nfs_release_seqid(data->arg.open_seqid);
4886 out_release_lock_seqid:
4887         nfs_release_seqid(data->arg.lock_seqid);
4888 out_wait:
4889         nfs4_sequence_done(task, &data->res.seq_res);
4890         dprintk("%s: done!, ret = %d\n", __func__, data->rpc_status);
4891 }
4892
4893 static void nfs4_lock_done(struct rpc_task *task, void *calldata)
4894 {
4895         struct nfs4_lockdata *data = calldata;
4896
4897         dprintk("%s: begin!\n", __func__);
4898
4899         if (!nfs4_sequence_done(task, &data->res.seq_res))
4900                 return;
4901
4902         data->rpc_status = task->tk_status;
4903         if (data->arg.new_lock_owner != 0) {
4904                 if (data->rpc_status == 0)
4905                         nfs_confirm_seqid(&data->lsp->ls_seqid, 0);
4906                 else
4907                         goto out;
4908         }
4909         if (data->rpc_status == 0) {
4910                 nfs4_stateid_copy(&data->lsp->ls_stateid, &data->res.stateid);
4911                 set_bit(NFS_LOCK_INITIALIZED, &data->lsp->ls_flags);
4912                 renew_lease(NFS_SERVER(data->ctx->dentry->d_inode), data->timestamp);
4913         }
4914 out:
4915         dprintk("%s: done, ret = %d!\n", __func__, data->rpc_status);
4916 }
4917
4918 static void nfs4_lock_release(void *calldata)
4919 {
4920         struct nfs4_lockdata *data = calldata;
4921
4922         dprintk("%s: begin!\n", __func__);
4923         nfs_free_seqid(data->arg.open_seqid);
4924         if (data->cancelled != 0) {
4925                 struct rpc_task *task;
4926                 task = nfs4_do_unlck(&data->fl, data->ctx, data->lsp,
4927                                 data->arg.lock_seqid);
4928                 if (!IS_ERR(task))
4929                         rpc_put_task_async(task);
4930                 dprintk("%s: cancelling lock!\n", __func__);
4931         } else
4932                 nfs_free_seqid(data->arg.lock_seqid);
4933         nfs4_put_lock_state(data->lsp);
4934         put_nfs_open_context(data->ctx);
4935         kfree(data);
4936         dprintk("%s: done!\n", __func__);
4937 }
4938
4939 static const struct rpc_call_ops nfs4_lock_ops = {
4940         .rpc_call_prepare = nfs4_lock_prepare,
4941         .rpc_call_done = nfs4_lock_done,
4942         .rpc_release = nfs4_lock_release,
4943 };
4944
4945 static void nfs4_handle_setlk_error(struct nfs_server *server, struct nfs4_lock_state *lsp, int new_lock_owner, int error)
4946 {
4947         switch (error) {
4948         case -NFS4ERR_ADMIN_REVOKED:
4949         case -NFS4ERR_BAD_STATEID:
4950                 lsp->ls_seqid.flags &= ~NFS_SEQID_CONFIRMED;
4951                 if (new_lock_owner != 0 ||
4952                    test_bit(NFS_LOCK_INITIALIZED, &lsp->ls_flags) != 0)
4953                         nfs4_schedule_stateid_recovery(server, lsp->ls_state);
4954                 break;
4955         case -NFS4ERR_STALE_STATEID:
4956                 lsp->ls_seqid.flags &= ~NFS_SEQID_CONFIRMED;
4957         case -NFS4ERR_EXPIRED:
4958                 nfs4_schedule_lease_recovery(server->nfs_client);
4959         };
4960 }
4961
4962 static int _nfs4_do_setlk(struct nfs4_state *state, int cmd, struct file_lock *fl, int recovery_type)
4963 {
4964         struct nfs4_lockdata *data;
4965         struct rpc_task *task;
4966         struct rpc_message msg = {
4967                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LOCK],
4968                 .rpc_cred = state->owner->so_cred,
4969         };
4970         struct rpc_task_setup task_setup_data = {
4971                 .rpc_client = NFS_CLIENT(state->inode),
4972                 .rpc_message = &msg,
4973                 .callback_ops = &nfs4_lock_ops,
4974                 .workqueue = nfsiod_workqueue,
4975                 .flags = RPC_TASK_ASYNC,
4976         };
4977         int ret;
4978
4979         dprintk("%s: begin!\n", __func__);
4980         data = nfs4_alloc_lockdata(fl, nfs_file_open_context(fl->fl_file),
4981                         fl->fl_u.nfs4_fl.owner,
4982                         recovery_type == NFS_LOCK_NEW ? GFP_KERNEL : GFP_NOFS);
4983         if (data == NULL)
4984                 return -ENOMEM;
4985         if (IS_SETLKW(cmd))
4986                 data->arg.block = 1;
4987         nfs41_init_sequence(&data->arg.seq_args, &data->res.seq_res, 1);
4988         msg.rpc_argp = &data->arg;
4989         msg.rpc_resp = &data->res;
4990         task_setup_data.callback_data = data;
4991         if (recovery_type > NFS_LOCK_NEW) {
4992                 if (recovery_type == NFS_LOCK_RECLAIM)
4993                         data->arg.reclaim = NFS_LOCK_RECLAIM;
4994                 nfs4_set_sequence_privileged(&data->arg.seq_args);
4995         }
4996         task = rpc_run_task(&task_setup_data);
4997         if (IS_ERR(task))
4998                 return PTR_ERR(task);
4999         ret = nfs4_wait_for_completion_rpc_task(task);
5000         if (ret == 0) {
5001                 ret = data->rpc_status;
5002                 if (ret)
5003                         nfs4_handle_setlk_error(data->server, data->lsp,
5004                                         data->arg.new_lock_owner, ret);
5005         } else
5006                 data->cancelled = 1;
5007         rpc_put_task(task);
5008         dprintk("%s: done, ret = %d!\n", __func__, ret);
5009         return ret;
5010 }
5011
5012 static int nfs4_lock_reclaim(struct nfs4_state *state, struct file_lock *request)
5013 {
5014         struct nfs_server *server = NFS_SERVER(state->inode);
5015         struct nfs4_exception exception = {
5016                 .inode = state->inode,
5017         };
5018         int err;
5019
5020         do {
5021                 /* Cache the lock if possible... */
5022                 if (test_bit(NFS_DELEGATED_STATE, &state->flags) != 0)
5023                         return 0;
5024                 err = _nfs4_do_setlk(state, F_SETLK, request, NFS_LOCK_RECLAIM);
5025                 if (err != -NFS4ERR_DELAY)
5026                         break;
5027                 nfs4_handle_exception(server, err, &exception);
5028         } while (exception.retry);
5029         return err;
5030 }
5031
5032 static int nfs4_lock_expired(struct nfs4_state *state, struct file_lock *request)
5033 {
5034         struct nfs_server *server = NFS_SERVER(state->inode);
5035         struct nfs4_exception exception = {
5036                 .inode = state->inode,
5037         };
5038         int err;
5039
5040         err = nfs4_set_lock_state(state, request);
5041         if (err != 0)
5042                 return err;
5043         do {
5044                 if (test_bit(NFS_DELEGATED_STATE, &state->flags) != 0)
5045                         return 0;
5046                 err = _nfs4_do_setlk(state, F_SETLK, request, NFS_LOCK_EXPIRED);
5047                 switch (err) {
5048                 default:
5049                         goto out;
5050                 case -NFS4ERR_GRACE:
5051                 case -NFS4ERR_DELAY:
5052                         nfs4_handle_exception(server, err, &exception);
5053                         err = 0;
5054                 }
5055         } while (exception.retry);
5056 out:
5057         return err;
5058 }
5059
5060 #if defined(CONFIG_NFS_V4_1)
5061 /**
5062  * nfs41_check_expired_locks - possibly free a lock stateid
5063  *
5064  * @state: NFSv4 state for an inode
5065  *
5066  * Returns NFS_OK if recovery for this stateid is now finished.
5067  * Otherwise a negative NFS4ERR value is returned.
5068  */
5069 static int nfs41_check_expired_locks(struct nfs4_state *state)
5070 {
5071         int status, ret = -NFS4ERR_BAD_STATEID;
5072         struct nfs4_lock_state *lsp;
5073         struct nfs_server *server = NFS_SERVER(state->inode);
5074
5075         list_for_each_entry(lsp, &state->lock_states, ls_locks) {
5076                 if (test_bit(NFS_LOCK_INITIALIZED, &lsp->ls_flags)) {
5077                         struct rpc_cred *cred = lsp->ls_state->owner->so_cred;
5078
5079                         status = nfs41_test_stateid(server,
5080                                         &lsp->ls_stateid,
5081                                         cred);
5082                         if (status != NFS_OK) {
5083                                 /* Free the stateid unless the server
5084                                  * informs us the stateid is unrecognized. */
5085                                 if (status != -NFS4ERR_BAD_STATEID)
5086                                         nfs41_free_stateid(server,
5087                                                         &lsp->ls_stateid,
5088                                                         cred);
5089                                 clear_bit(NFS_LOCK_INITIALIZED, &lsp->ls_flags);
5090                                 ret = status;
5091                         }
5092                 }
5093         };
5094
5095         return ret;
5096 }
5097
5098 static int nfs41_lock_expired(struct nfs4_state *state, struct file_lock *request)
5099 {
5100         int status = NFS_OK;
5101
5102         if (test_bit(LK_STATE_IN_USE, &state->flags))
5103                 status = nfs41_check_expired_locks(state);
5104         if (status != NFS_OK)
5105                 status = nfs4_lock_expired(state, request);
5106         return status;
5107 }
5108 #endif
5109
5110 static int _nfs4_proc_setlk(struct nfs4_state *state, int cmd, struct file_lock *request)
5111 {
5112         struct nfs4_state_owner *sp = state->owner;
5113         struct nfs_inode *nfsi = NFS_I(state->inode);
5114         unsigned char fl_flags = request->fl_flags;
5115         unsigned int seq;
5116         int status = -ENOLCK;
5117
5118         if ((fl_flags & FL_POSIX) &&
5119                         !test_bit(NFS_STATE_POSIX_LOCKS, &state->flags))
5120                 goto out;
5121         /* Is this a delegated open? */
5122         status = nfs4_set_lock_state(state, request);
5123         if (status != 0)
5124                 goto out;
5125         request->fl_flags |= FL_ACCESS;
5126         status = do_vfs_lock(request->fl_file, request);
5127         if (status < 0)
5128                 goto out;
5129         down_read(&nfsi->rwsem);
5130         if (test_bit(NFS_DELEGATED_STATE, &state->flags)) {
5131                 /* Yes: cache locks! */
5132                 /* ...but avoid races with delegation recall... */
5133                 request->fl_flags = fl_flags & ~FL_SLEEP;
5134                 status = do_vfs_lock(request->fl_file, request);
5135                 goto out_unlock;
5136         }
5137         seq = raw_seqcount_begin(&sp->so_reclaim_seqcount);
5138         up_read(&nfsi->rwsem);
5139         status = _nfs4_do_setlk(state, cmd, request, NFS_LOCK_NEW);
5140         if (status != 0)
5141                 goto out;
5142         down_read(&nfsi->rwsem);
5143         if (read_seqcount_retry(&sp->so_reclaim_seqcount, seq)) {
5144                 status = -NFS4ERR_DELAY;
5145                 goto out_unlock;
5146         }
5147         /* Note: we always want to sleep here! */
5148         request->fl_flags = fl_flags | FL_SLEEP;
5149         if (do_vfs_lock(request->fl_file, request) < 0)
5150                 printk(KERN_WARNING "NFS: %s: VFS is out of sync with lock "
5151                         "manager!\n", __func__);
5152 out_unlock:
5153         up_read(&nfsi->rwsem);
5154 out:
5155         request->fl_flags = fl_flags;
5156         return status;
5157 }
5158
5159 static int nfs4_proc_setlk(struct nfs4_state *state, int cmd, struct file_lock *request)
5160 {
5161         struct nfs4_exception exception = {
5162                 .state = state,
5163                 .inode = state->inode,
5164         };
5165         int err;
5166
5167         do {
5168                 err = _nfs4_proc_setlk(state, cmd, request);
5169                 if (err == -NFS4ERR_DENIED)
5170                         err = -EAGAIN;
5171                 err = nfs4_handle_exception(NFS_SERVER(state->inode),
5172                                 err, &exception);
5173         } while (exception.retry);
5174         return err;
5175 }
5176
5177 static int
5178 nfs4_proc_lock(struct file *filp, int cmd, struct file_lock *request)
5179 {
5180         struct nfs_open_context *ctx;
5181         struct nfs4_state *state;
5182         unsigned long timeout = NFS4_LOCK_MINTIMEOUT;
5183         int status;
5184
5185         /* verify open state */
5186         ctx = nfs_file_open_context(filp);
5187         state = ctx->state;
5188
5189         if (request->fl_start < 0 || request->fl_end < 0)
5190                 return -EINVAL;
5191
5192         if (IS_GETLK(cmd)) {
5193                 if (state != NULL)
5194                         return nfs4_proc_getlk(state, F_GETLK, request);
5195                 return 0;
5196         }
5197
5198         if (!(IS_SETLK(cmd) || IS_SETLKW(cmd)))
5199                 return -EINVAL;
5200
5201         if (request->fl_type == F_UNLCK) {
5202                 if (state != NULL)
5203                         return nfs4_proc_unlck(state, cmd, request);
5204                 return 0;
5205         }
5206
5207         if (state == NULL)
5208                 return -ENOLCK;
5209         /*
5210          * Don't rely on the VFS having checked the file open mode,
5211          * since it won't do this for flock() locks.
5212          */
5213         switch (request->fl_type) {
5214         case F_RDLCK:
5215                 if (!(filp->f_mode & FMODE_READ))
5216                         return -EBADF;
5217                 break;
5218         case F_WRLCK:
5219                 if (!(filp->f_mode & FMODE_WRITE))
5220                         return -EBADF;
5221         }
5222
5223         do {
5224                 status = nfs4_proc_setlk(state, cmd, request);
5225                 if ((status != -EAGAIN) || IS_SETLK(cmd))
5226                         break;
5227                 timeout = nfs4_set_lock_task_retry(timeout);
5228                 status = -ERESTARTSYS;
5229                 if (signalled())
5230                         break;
5231         } while(status < 0);
5232         return status;
5233 }
5234
5235 int nfs4_lock_delegation_recall(struct file_lock *fl, struct nfs4_state *state, const nfs4_stateid *stateid)
5236 {
5237         struct nfs_server *server = NFS_SERVER(state->inode);
5238         int err;
5239
5240         err = nfs4_set_lock_state(state, fl);
5241         if (err != 0)
5242                 return err;
5243         err = _nfs4_do_setlk(state, F_SETLK, fl, NFS_LOCK_NEW);
5244         return nfs4_handle_delegation_recall_error(server, state, stateid, err);
5245 }
5246
5247 struct nfs_release_lockowner_data {
5248         struct nfs4_lock_state *lsp;
5249         struct nfs_server *server;
5250         struct nfs_release_lockowner_args args;
5251 };
5252
5253 static void nfs4_release_lockowner_release(void *calldata)
5254 {
5255         struct nfs_release_lockowner_data *data = calldata;
5256         nfs4_free_lock_state(data->server, data->lsp);
5257         kfree(calldata);
5258 }
5259
5260 static const struct rpc_call_ops nfs4_release_lockowner_ops = {
5261         .rpc_release = nfs4_release_lockowner_release,
5262 };
5263
5264 static int nfs4_release_lockowner(struct nfs_server *server, struct nfs4_lock_state *lsp)
5265 {
5266         struct nfs_release_lockowner_data *data;
5267         struct rpc_message msg = {
5268                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_RELEASE_LOCKOWNER],
5269         };
5270
5271         if (server->nfs_client->cl_mvops->minor_version != 0)
5272                 return -EINVAL;
5273         data = kmalloc(sizeof(*data), GFP_NOFS);
5274         if (!data)
5275                 return -ENOMEM;
5276         data->lsp = lsp;
5277         data->server = server;
5278         data->args.lock_owner.clientid = server->nfs_client->cl_clientid;
5279         data->args.lock_owner.id = lsp->ls_seqid.owner_id;
5280         data->args.lock_owner.s_dev = server->s_dev;
5281         msg.rpc_argp = &data->args;
5282         rpc_call_async(server->client, &msg, 0, &nfs4_release_lockowner_ops, data);
5283         return 0;
5284 }
5285
5286 #define XATTR_NAME_NFSV4_ACL "system.nfs4_acl"
5287
5288 static int nfs4_xattr_set_nfs4_acl(struct dentry *dentry, const char *key,
5289                                    const void *buf, size_t buflen,
5290                                    int flags, int type)
5291 {
5292         if (strcmp(key, "") != 0)
5293                 return -EINVAL;
5294
5295         return nfs4_proc_set_acl(dentry->d_inode, buf, buflen);
5296 }
5297
5298 static int nfs4_xattr_get_nfs4_acl(struct dentry *dentry, const char *key,
5299                                    void *buf, size_t buflen, int type)
5300 {
5301         if (strcmp(key, "") != 0)
5302                 return -EINVAL;
5303
5304         return nfs4_proc_get_acl(dentry->d_inode, buf, buflen);
5305 }
5306
5307 static size_t nfs4_xattr_list_nfs4_acl(struct dentry *dentry, char *list,
5308                                        size_t list_len, const char *name,
5309                                        size_t name_len, int type)
5310 {
5311         size_t len = sizeof(XATTR_NAME_NFSV4_ACL);
5312
5313         if (!nfs4_server_supports_acls(NFS_SERVER(dentry->d_inode)))
5314                 return 0;
5315
5316         if (list && len <= list_len)
5317                 memcpy(list, XATTR_NAME_NFSV4_ACL, len);
5318         return len;
5319 }
5320
5321 /*
5322  * nfs_fhget will use either the mounted_on_fileid or the fileid
5323  */
5324 static void nfs_fixup_referral_attributes(struct nfs_fattr *fattr)
5325 {
5326         if (!(((fattr->valid & NFS_ATTR_FATTR_MOUNTED_ON_FILEID) ||
5327                (fattr->valid & NFS_ATTR_FATTR_FILEID)) &&
5328               (fattr->valid & NFS_ATTR_FATTR_FSID) &&
5329               (fattr->valid & NFS_ATTR_FATTR_V4_LOCATIONS)))
5330                 return;
5331
5332         fattr->valid |= NFS_ATTR_FATTR_TYPE | NFS_ATTR_FATTR_MODE |
5333                 NFS_ATTR_FATTR_NLINK | NFS_ATTR_FATTR_V4_REFERRAL;
5334         fattr->mode = S_IFDIR | S_IRUGO | S_IXUGO;
5335         fattr->nlink = 2;
5336 }
5337
5338 static int _nfs4_proc_fs_locations(struct rpc_clnt *client, struct inode *dir,
5339                                    const struct qstr *name,
5340                                    struct nfs4_fs_locations *fs_locations,
5341                                    struct page *page)
5342 {
5343         struct nfs_server *server = NFS_SERVER(dir);
5344         u32 bitmask[2] = {
5345                 [0] = FATTR4_WORD0_FSID | FATTR4_WORD0_FS_LOCATIONS,
5346         };
5347         struct nfs4_fs_locations_arg args = {
5348                 .dir_fh = NFS_FH(dir),
5349                 .name = name,
5350                 .page = page,
5351                 .bitmask = bitmask,
5352         };
5353         struct nfs4_fs_locations_res res = {
5354                 .fs_locations = fs_locations,
5355         };
5356         struct rpc_message msg = {
5357                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_FS_LOCATIONS],
5358                 .rpc_argp = &args,
5359                 .rpc_resp = &res,
5360         };
5361         int status;
5362
5363         dprintk("%s: start\n", __func__);
5364
5365         /* Ask for the fileid of the absent filesystem if mounted_on_fileid
5366          * is not supported */
5367         if (NFS_SERVER(dir)->attr_bitmask[1] & FATTR4_WORD1_MOUNTED_ON_FILEID)
5368                 bitmask[1] |= FATTR4_WORD1_MOUNTED_ON_FILEID;
5369         else
5370                 bitmask[0] |= FATTR4_WORD0_FILEID;
5371
5372         nfs_fattr_init(&fs_locations->fattr);
5373         fs_locations->server = server;
5374         fs_locations->nlocations = 0;
5375         status = nfs4_call_sync(client, server, &msg, &args.seq_args, &res.seq_res, 0);
5376         dprintk("%s: returned status = %d\n", __func__, status);
5377         return status;
5378 }
5379
5380 int nfs4_proc_fs_locations(struct rpc_clnt *client, struct inode *dir,
5381                            const struct qstr *name,
5382                            struct nfs4_fs_locations *fs_locations,
5383                            struct page *page)
5384 {
5385         struct nfs4_exception exception = { };
5386         int err;
5387         do {
5388                 err = nfs4_handle_exception(NFS_SERVER(dir),
5389                                 _nfs4_proc_fs_locations(client, dir, name, fs_locations, page),
5390                                 &exception);
5391         } while (exception.retry);
5392         return err;
5393 }
5394
5395 static int _nfs4_proc_secinfo(struct inode *dir, const struct qstr *name, struct nfs4_secinfo_flavors *flavors)
5396 {
5397         int status;
5398         struct nfs4_secinfo_arg args = {
5399                 .dir_fh = NFS_FH(dir),
5400                 .name   = name,
5401         };
5402         struct nfs4_secinfo_res res = {
5403                 .flavors     = flavors,
5404         };
5405         struct rpc_message msg = {
5406                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SECINFO],
5407                 .rpc_argp = &args,
5408                 .rpc_resp = &res,
5409         };
5410
5411         dprintk("NFS call  secinfo %s\n", name->name);
5412         status = nfs4_call_sync(NFS_SERVER(dir)->client, NFS_SERVER(dir), &msg, &args.seq_args, &res.seq_res, 0);
5413         dprintk("NFS reply  secinfo: %d\n", status);
5414         return status;
5415 }
5416
5417 int nfs4_proc_secinfo(struct inode *dir, const struct qstr *name,
5418                       struct nfs4_secinfo_flavors *flavors)
5419 {
5420         struct nfs4_exception exception = { };
5421         int err;
5422         do {
5423                 err = nfs4_handle_exception(NFS_SERVER(dir),
5424                                 _nfs4_proc_secinfo(dir, name, flavors),
5425                                 &exception);
5426         } while (exception.retry);
5427         return err;
5428 }
5429
5430 #ifdef CONFIG_NFS_V4_1
5431 /*
5432  * Check the exchange flags returned by the server for invalid flags, having
5433  * both PNFS and NON_PNFS flags set, and not having one of NON_PNFS, PNFS, or
5434  * DS flags set.
5435  */
5436 static int nfs4_check_cl_exchange_flags(u32 flags)
5437 {
5438         if (flags & ~EXCHGID4_FLAG_MASK_R)
5439                 goto out_inval;
5440         if ((flags & EXCHGID4_FLAG_USE_PNFS_MDS) &&
5441             (flags & EXCHGID4_FLAG_USE_NON_PNFS))
5442                 goto out_inval;
5443         if (!(flags & (EXCHGID4_FLAG_MASK_PNFS)))
5444                 goto out_inval;
5445         return NFS_OK;
5446 out_inval:
5447         return -NFS4ERR_INVAL;
5448 }
5449
5450 static bool
5451 nfs41_same_server_scope(struct nfs41_server_scope *a,
5452                         struct nfs41_server_scope *b)
5453 {
5454         if (a->server_scope_sz == b->server_scope_sz &&
5455             memcmp(a->server_scope, b->server_scope, a->server_scope_sz) == 0)
5456                 return true;
5457
5458         return false;
5459 }
5460
5461 /*
5462  * nfs4_proc_bind_conn_to_session()
5463  *
5464  * The 4.1 client currently uses the same TCP connection for the
5465  * fore and backchannel.
5466  */
5467 int nfs4_proc_bind_conn_to_session(struct nfs_client *clp, struct rpc_cred *cred)
5468 {
5469         int status;
5470         struct nfs41_bind_conn_to_session_res res;
5471         struct rpc_message msg = {
5472                 .rpc_proc =
5473                         &nfs4_procedures[NFSPROC4_CLNT_BIND_CONN_TO_SESSION],
5474                 .rpc_argp = clp,
5475                 .rpc_resp = &res,
5476                 .rpc_cred = cred,
5477         };
5478
5479         dprintk("--> %s\n", __func__);
5480
5481         res.session = kzalloc(sizeof(struct nfs4_session), GFP_NOFS);
5482         if (unlikely(res.session == NULL)) {
5483                 status = -ENOMEM;
5484                 goto out;
5485         }
5486
5487         status = rpc_call_sync(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
5488         if (status == 0) {
5489                 if (memcmp(res.session->sess_id.data,
5490                     clp->cl_session->sess_id.data, NFS4_MAX_SESSIONID_LEN)) {
5491                         dprintk("NFS: %s: Session ID mismatch\n", __func__);
5492                         status = -EIO;
5493                         goto out_session;
5494                 }
5495                 if (res.dir != NFS4_CDFS4_BOTH) {
5496                         dprintk("NFS: %s: Unexpected direction from server\n",
5497                                 __func__);
5498                         status = -EIO;
5499                         goto out_session;
5500                 }
5501                 if (res.use_conn_in_rdma_mode) {
5502                         dprintk("NFS: %s: Server returned RDMA mode = true\n",
5503                                 __func__);
5504                         status = -EIO;
5505                         goto out_session;
5506                 }
5507         }
5508 out_session:
5509         kfree(res.session);
5510 out:
5511         dprintk("<-- %s status= %d\n", __func__, status);
5512         return status;
5513 }
5514
5515 /*
5516  * nfs4_proc_exchange_id()
5517  *
5518  * Returns zero, a negative errno, or a negative NFS4ERR status code.
5519  *
5520  * Since the clientid has expired, all compounds using sessions
5521  * associated with the stale clientid will be returning
5522  * NFS4ERR_BADSESSION in the sequence operation, and will therefore
5523  * be in some phase of session reset.
5524  */
5525 int nfs4_proc_exchange_id(struct nfs_client *clp, struct rpc_cred *cred)
5526 {
5527         nfs4_verifier verifier;
5528         struct nfs41_exchange_id_args args = {
5529                 .verifier = &verifier,
5530                 .client = clp,
5531                 .flags = EXCHGID4_FLAG_SUPP_MOVED_REFER,
5532         };
5533         struct nfs41_exchange_id_res res = {
5534                 0
5535         };
5536         int status;
5537         struct rpc_message msg = {
5538                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_EXCHANGE_ID],
5539                 .rpc_argp = &args,
5540                 .rpc_resp = &res,
5541                 .rpc_cred = cred,
5542         };
5543
5544         nfs4_init_boot_verifier(clp, &verifier);
5545         args.id_len = nfs4_init_uniform_client_string(clp, args.id,
5546                                                         sizeof(args.id));
5547         dprintk("NFS call  exchange_id auth=%s, '%.*s'\n",
5548                 clp->cl_rpcclient->cl_auth->au_ops->au_name,
5549                 args.id_len, args.id);
5550
5551         res.server_owner = kzalloc(sizeof(struct nfs41_server_owner),
5552                                         GFP_NOFS);
5553         if (unlikely(res.server_owner == NULL)) {
5554                 status = -ENOMEM;
5555                 goto out;
5556         }
5557
5558         res.server_scope = kzalloc(sizeof(struct nfs41_server_scope),
5559                                         GFP_NOFS);
5560         if (unlikely(res.server_scope == NULL)) {
5561                 status = -ENOMEM;
5562                 goto out_server_owner;
5563         }
5564
5565         res.impl_id = kzalloc(sizeof(struct nfs41_impl_id), GFP_NOFS);
5566         if (unlikely(res.impl_id == NULL)) {
5567                 status = -ENOMEM;
5568                 goto out_server_scope;
5569         }
5570
5571         status = rpc_call_sync(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
5572         if (status == 0)
5573                 status = nfs4_check_cl_exchange_flags(res.flags);
5574
5575         if (status == 0) {
5576                 clp->cl_clientid = res.clientid;
5577                 clp->cl_exchange_flags = (res.flags & ~EXCHGID4_FLAG_CONFIRMED_R);
5578                 if (!(res.flags & EXCHGID4_FLAG_CONFIRMED_R))
5579                         clp->cl_seqid = res.seqid;
5580
5581                 kfree(clp->cl_serverowner);
5582                 clp->cl_serverowner = res.server_owner;
5583                 res.server_owner = NULL;
5584
5585                 /* use the most recent implementation id */
5586                 kfree(clp->cl_implid);
5587                 clp->cl_implid = res.impl_id;
5588
5589                 if (clp->cl_serverscope != NULL &&
5590                     !nfs41_same_server_scope(clp->cl_serverscope,
5591                                              res.server_scope)) {
5592                         dprintk("%s: server_scope mismatch detected\n",
5593                                 __func__);
5594                         set_bit(NFS4CLNT_SERVER_SCOPE_MISMATCH, &clp->cl_state);
5595                         kfree(clp->cl_serverscope);
5596                         clp->cl_serverscope = NULL;
5597                 }
5598
5599                 if (clp->cl_serverscope == NULL) {
5600                         clp->cl_serverscope = res.server_scope;
5601                         goto out;
5602                 }
5603         } else
5604                 kfree(res.impl_id);
5605
5606 out_server_owner:
5607         kfree(res.server_owner);
5608 out_server_scope:
5609         kfree(res.server_scope);
5610 out:
5611         if (clp->cl_implid != NULL)
5612                 dprintk("NFS reply exchange_id: Server Implementation ID: "
5613                         "domain: %s, name: %s, date: %llu,%u\n",
5614                         clp->cl_implid->domain, clp->cl_implid->name,
5615                         clp->cl_implid->date.seconds,
5616                         clp->cl_implid->date.nseconds);
5617         dprintk("NFS reply exchange_id: %d\n", status);
5618         return status;
5619 }
5620
5621 static int _nfs4_proc_destroy_clientid(struct nfs_client *clp,
5622                 struct rpc_cred *cred)
5623 {
5624         struct rpc_message msg = {
5625                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_DESTROY_CLIENTID],
5626                 .rpc_argp = clp,
5627                 .rpc_cred = cred,
5628         };
5629         int status;
5630
5631         status = rpc_call_sync(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
5632         if (status)
5633                 dprintk("NFS: Got error %d from the server %s on "
5634                         "DESTROY_CLIENTID.", status, clp->cl_hostname);
5635         return status;
5636 }
5637
5638 static int nfs4_proc_destroy_clientid(struct nfs_client *clp,
5639                 struct rpc_cred *cred)
5640 {
5641         unsigned int loop;
5642         int ret;
5643
5644         for (loop = NFS4_MAX_LOOP_ON_RECOVER; loop != 0; loop--) {
5645                 ret = _nfs4_proc_destroy_clientid(clp, cred);
5646                 switch (ret) {
5647                 case -NFS4ERR_DELAY:
5648                 case -NFS4ERR_CLIENTID_BUSY:
5649                         ssleep(1);
5650                         break;
5651                 default:
5652                         return ret;
5653                 }
5654         }
5655         return 0;
5656 }
5657
5658 int nfs4_destroy_clientid(struct nfs_client *clp)
5659 {
5660         struct rpc_cred *cred;
5661         int ret = 0;
5662
5663         if (clp->cl_mvops->minor_version < 1)
5664                 goto out;
5665         if (clp->cl_exchange_flags == 0)
5666                 goto out;
5667         if (clp->cl_preserve_clid)
5668                 goto out;
5669         cred = nfs4_get_exchange_id_cred(clp);
5670         ret = nfs4_proc_destroy_clientid(clp, cred);
5671         if (cred)
5672                 put_rpccred(cred);
5673         switch (ret) {
5674         case 0:
5675         case -NFS4ERR_STALE_CLIENTID:
5676                 clp->cl_exchange_flags = 0;
5677         }
5678 out:
5679         return ret;
5680 }
5681
5682 struct nfs4_get_lease_time_data {
5683         struct nfs4_get_lease_time_args *args;
5684         struct nfs4_get_lease_time_res *res;
5685         struct nfs_client *clp;
5686 };
5687
5688 static void nfs4_get_lease_time_prepare(struct rpc_task *task,
5689                                         void *calldata)
5690 {
5691         struct nfs4_get_lease_time_data *data =
5692                         (struct nfs4_get_lease_time_data *)calldata;
5693
5694         dprintk("--> %s\n", __func__);
5695         /* just setup sequence, do not trigger session recovery
5696            since we're invoked within one */
5697         nfs41_setup_sequence(data->clp->cl_session,
5698                         &data->args->la_seq_args,
5699                         &data->res->lr_seq_res,
5700                         task);
5701         dprintk("<-- %s\n", __func__);
5702 }
5703
5704 /*
5705  * Called from nfs4_state_manager thread for session setup, so don't recover
5706  * from sequence operation or clientid errors.
5707  */
5708 static void nfs4_get_lease_time_done(struct rpc_task *task, void *calldata)
5709 {
5710         struct nfs4_get_lease_time_data *data =
5711                         (struct nfs4_get_lease_time_data *)calldata;
5712
5713         dprintk("--> %s\n", __func__);
5714         if (!nfs41_sequence_done(task, &data->res->lr_seq_res))
5715                 return;
5716         switch (task->tk_status) {
5717         case -NFS4ERR_DELAY:
5718         case -NFS4ERR_GRACE:
5719                 dprintk("%s Retry: tk_status %d\n", __func__, task->tk_status);
5720                 rpc_delay(task, NFS4_POLL_RETRY_MIN);
5721                 task->tk_status = 0;
5722                 /* fall through */
5723         case -NFS4ERR_RETRY_UNCACHED_REP:
5724                 rpc_restart_call_prepare(task);
5725                 return;
5726         }
5727         dprintk("<-- %s\n", __func__);
5728 }
5729
5730 static const struct rpc_call_ops nfs4_get_lease_time_ops = {
5731         .rpc_call_prepare = nfs4_get_lease_time_prepare,
5732         .rpc_call_done = nfs4_get_lease_time_done,
5733 };
5734
5735 int nfs4_proc_get_lease_time(struct nfs_client *clp, struct nfs_fsinfo *fsinfo)
5736 {
5737         struct rpc_task *task;
5738         struct nfs4_get_lease_time_args args;
5739         struct nfs4_get_lease_time_res res = {
5740                 .lr_fsinfo = fsinfo,
5741         };
5742         struct nfs4_get_lease_time_data data = {
5743                 .args = &args,
5744                 .res = &res,
5745                 .clp = clp,
5746         };
5747         struct rpc_message msg = {
5748                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_GET_LEASE_TIME],
5749                 .rpc_argp = &args,
5750                 .rpc_resp = &res,
5751         };
5752         struct rpc_task_setup task_setup = {
5753                 .rpc_client = clp->cl_rpcclient,
5754                 .rpc_message = &msg,
5755                 .callback_ops = &nfs4_get_lease_time_ops,
5756                 .callback_data = &data,
5757                 .flags = RPC_TASK_TIMEOUT,
5758         };
5759         int status;
5760
5761         nfs41_init_sequence(&args.la_seq_args, &res.lr_seq_res, 0);
5762         nfs4_set_sequence_privileged(&args.la_seq_args);
5763         dprintk("--> %s\n", __func__);
5764         task = rpc_run_task(&task_setup);
5765
5766         if (IS_ERR(task))
5767                 status = PTR_ERR(task);
5768         else {
5769                 status = task->tk_status;
5770                 rpc_put_task(task);
5771         }
5772         dprintk("<-- %s return %d\n", __func__, status);
5773
5774         return status;
5775 }
5776
5777 /*
5778  * Initialize the values to be used by the client in CREATE_SESSION
5779  * If nfs4_init_session set the fore channel request and response sizes,
5780  * use them.
5781  *
5782  * Set the back channel max_resp_sz_cached to zero to force the client to
5783  * always set csa_cachethis to FALSE because the current implementation
5784  * of the back channel DRC only supports caching the CB_SEQUENCE operation.
5785  */
5786 static void nfs4_init_channel_attrs(struct nfs41_create_session_args *args)
5787 {
5788         struct nfs4_session *session = args->client->cl_session;
5789         unsigned int mxrqst_sz = session->fc_target_max_rqst_sz,
5790                      mxresp_sz = session->fc_target_max_resp_sz;
5791
5792         if (mxrqst_sz == 0)
5793                 mxrqst_sz = NFS_MAX_FILE_IO_SIZE;
5794         if (mxresp_sz == 0)
5795                 mxresp_sz = NFS_MAX_FILE_IO_SIZE;
5796         /* Fore channel attributes */
5797         args->fc_attrs.max_rqst_sz = mxrqst_sz;
5798         args->fc_attrs.max_resp_sz = mxresp_sz;
5799         args->fc_attrs.max_ops = NFS4_MAX_OPS;
5800         args->fc_attrs.max_reqs = max_session_slots;
5801
5802         dprintk("%s: Fore Channel : max_rqst_sz=%u max_resp_sz=%u "
5803                 "max_ops=%u max_reqs=%u\n",
5804                 __func__,
5805                 args->fc_attrs.max_rqst_sz, args->fc_attrs.max_resp_sz,
5806                 args->fc_attrs.max_ops, args->fc_attrs.max_reqs);
5807
5808         /* Back channel attributes */
5809         args->bc_attrs.max_rqst_sz = PAGE_SIZE;
5810         args->bc_attrs.max_resp_sz = PAGE_SIZE;
5811         args->bc_attrs.max_resp_sz_cached = 0;
5812         args->bc_attrs.max_ops = NFS4_MAX_BACK_CHANNEL_OPS;
5813         args->bc_attrs.max_reqs = 1;
5814
5815         dprintk("%s: Back Channel : max_rqst_sz=%u max_resp_sz=%u "
5816                 "max_resp_sz_cached=%u max_ops=%u max_reqs=%u\n",
5817                 __func__,
5818                 args->bc_attrs.max_rqst_sz, args->bc_attrs.max_resp_sz,
5819                 args->bc_attrs.max_resp_sz_cached, args->bc_attrs.max_ops,
5820                 args->bc_attrs.max_reqs);
5821 }
5822
5823 static int nfs4_verify_fore_channel_attrs(struct nfs41_create_session_args *args, struct nfs4_session *session)
5824 {
5825         struct nfs4_channel_attrs *sent = &args->fc_attrs;
5826         struct nfs4_channel_attrs *rcvd = &session->fc_attrs;
5827
5828         if (rcvd->max_resp_sz > sent->max_resp_sz)
5829                 return -EINVAL;
5830         /*
5831          * Our requested max_ops is the minimum we need; we're not
5832          * prepared to break up compounds into smaller pieces than that.
5833          * So, no point even trying to continue if the server won't
5834          * cooperate:
5835          */
5836         if (rcvd->max_ops < sent->max_ops)
5837                 return -EINVAL;
5838         if (rcvd->max_reqs == 0)
5839                 return -EINVAL;
5840         if (rcvd->max_reqs > NFS4_MAX_SLOT_TABLE)
5841                 rcvd->max_reqs = NFS4_MAX_SLOT_TABLE;
5842         return 0;
5843 }
5844
5845 static int nfs4_verify_back_channel_attrs(struct nfs41_create_session_args *args, struct nfs4_session *session)
5846 {
5847         struct nfs4_channel_attrs *sent = &args->bc_attrs;
5848         struct nfs4_channel_attrs *rcvd = &session->bc_attrs;
5849
5850         if (rcvd->max_rqst_sz > sent->max_rqst_sz)
5851                 return -EINVAL;
5852         if (rcvd->max_resp_sz < sent->max_resp_sz)
5853                 return -EINVAL;
5854         if (rcvd->max_resp_sz_cached > sent->max_resp_sz_cached)
5855                 return -EINVAL;
5856         /* These would render the backchannel useless: */
5857         if (rcvd->max_ops != sent->max_ops)
5858                 return -EINVAL;
5859         if (rcvd->max_reqs != sent->max_reqs)
5860                 return -EINVAL;
5861         return 0;
5862 }
5863
5864 static int nfs4_verify_channel_attrs(struct nfs41_create_session_args *args,
5865                                      struct nfs4_session *session)
5866 {
5867         int ret;
5868
5869         ret = nfs4_verify_fore_channel_attrs(args, session);
5870         if (ret)
5871                 return ret;
5872         return nfs4_verify_back_channel_attrs(args, session);
5873 }
5874
5875 static int _nfs4_proc_create_session(struct nfs_client *clp,
5876                 struct rpc_cred *cred)
5877 {
5878         struct nfs4_session *session = clp->cl_session;
5879         struct nfs41_create_session_args args = {
5880                 .client = clp,
5881                 .cb_program = NFS4_CALLBACK,
5882         };
5883         struct nfs41_create_session_res res = {
5884                 .client = clp,
5885         };
5886         struct rpc_message msg = {
5887                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_CREATE_SESSION],
5888                 .rpc_argp = &args,
5889                 .rpc_resp = &res,
5890                 .rpc_cred = cred,
5891         };
5892         int status;
5893
5894         nfs4_init_channel_attrs(&args);
5895         args.flags = (SESSION4_PERSIST | SESSION4_BACK_CHAN);
5896
5897         status = rpc_call_sync(session->clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
5898
5899         if (!status) {
5900                 /* Verify the session's negotiated channel_attrs values */
5901                 status = nfs4_verify_channel_attrs(&args, session);
5902                 /* Increment the clientid slot sequence id */
5903                 clp->cl_seqid++;
5904         }
5905
5906         return status;
5907 }
5908
5909 /*
5910  * Issues a CREATE_SESSION operation to the server.
5911  * It is the responsibility of the caller to verify the session is
5912  * expired before calling this routine.
5913  */
5914 int nfs4_proc_create_session(struct nfs_client *clp, struct rpc_cred *cred)
5915 {
5916         int status;
5917         unsigned *ptr;
5918         struct nfs4_session *session = clp->cl_session;
5919
5920         dprintk("--> %s clp=%p session=%p\n", __func__, clp, session);
5921
5922         status = _nfs4_proc_create_session(clp, cred);
5923         if (status)
5924                 goto out;
5925
5926         /* Init or reset the session slot tables */
5927         status = nfs4_setup_session_slot_tables(session);
5928         dprintk("slot table setup returned %d\n", status);
5929         if (status)
5930                 goto out;
5931
5932         ptr = (unsigned *)&session->sess_id.data[0];
5933         dprintk("%s client>seqid %d sessionid %u:%u:%u:%u\n", __func__,
5934                 clp->cl_seqid, ptr[0], ptr[1], ptr[2], ptr[3]);
5935 out:
5936         dprintk("<-- %s\n", __func__);
5937         return status;
5938 }
5939
5940 /*
5941  * Issue the over-the-wire RPC DESTROY_SESSION.
5942  * The caller must serialize access to this routine.
5943  */
5944 int nfs4_proc_destroy_session(struct nfs4_session *session,
5945                 struct rpc_cred *cred)
5946 {
5947         struct rpc_message msg = {
5948                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_DESTROY_SESSION],
5949                 .rpc_argp = session,
5950                 .rpc_cred = cred,
5951         };
5952         int status = 0;
5953
5954         dprintk("--> nfs4_proc_destroy_session\n");
5955
5956         /* session is still being setup */
5957         if (session->clp->cl_cons_state != NFS_CS_READY)
5958                 return status;
5959
5960         status = rpc_call_sync(session->clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
5961
5962         if (status)
5963                 dprintk("NFS: Got error %d from the server on DESTROY_SESSION. "
5964                         "Session has been destroyed regardless...\n", status);
5965
5966         dprintk("<-- nfs4_proc_destroy_session\n");
5967         return status;
5968 }
5969
5970 /*
5971  * Renew the cl_session lease.
5972  */
5973 struct nfs4_sequence_data {
5974         struct nfs_client *clp;
5975         struct nfs4_sequence_args args;
5976         struct nfs4_sequence_res res;
5977 };
5978
5979 static void nfs41_sequence_release(void *data)
5980 {
5981         struct nfs4_sequence_data *calldata = data;
5982         struct nfs_client *clp = calldata->clp;
5983
5984         if (atomic_read(&clp->cl_count) > 1)
5985                 nfs4_schedule_state_renewal(clp);
5986         nfs_put_client(clp);
5987         kfree(calldata);
5988 }
5989
5990 static int nfs41_sequence_handle_errors(struct rpc_task *task, struct nfs_client *clp)
5991 {
5992         switch(task->tk_status) {
5993         case -NFS4ERR_DELAY:
5994                 rpc_delay(task, NFS4_POLL_RETRY_MAX);
5995                 return -EAGAIN;
5996         default:
5997                 nfs4_schedule_lease_recovery(clp);
5998         }
5999         return 0;
6000 }
6001
6002 static void nfs41_sequence_call_done(struct rpc_task *task, void *data)
6003 {
6004         struct nfs4_sequence_data *calldata = data;
6005         struct nfs_client *clp = calldata->clp;
6006
6007         if (!nfs41_sequence_done(task, task->tk_msg.rpc_resp))
6008                 return;
6009
6010         if (task->tk_status < 0) {
6011                 dprintk("%s ERROR %d\n", __func__, task->tk_status);
6012                 if (atomic_read(&clp->cl_count) == 1)
6013                         goto out;
6014
6015                 if (nfs41_sequence_handle_errors(task, clp) == -EAGAIN) {
6016                         rpc_restart_call_prepare(task);
6017                         return;
6018                 }
6019         }
6020         dprintk("%s rpc_cred %p\n", __func__, task->tk_msg.rpc_cred);
6021 out:
6022         dprintk("<-- %s\n", __func__);
6023 }
6024
6025 static void nfs41_sequence_prepare(struct rpc_task *task, void *data)
6026 {
6027         struct nfs4_sequence_data *calldata = data;
6028         struct nfs_client *clp = calldata->clp;
6029         struct nfs4_sequence_args *args;
6030         struct nfs4_sequence_res *res;
6031
6032         args = task->tk_msg.rpc_argp;
6033         res = task->tk_msg.rpc_resp;
6034
6035         nfs41_setup_sequence(clp->cl_session, args, res, task);
6036 }
6037
6038 static const struct rpc_call_ops nfs41_sequence_ops = {
6039         .rpc_call_done = nfs41_sequence_call_done,
6040         .rpc_call_prepare = nfs41_sequence_prepare,
6041         .rpc_release = nfs41_sequence_release,
6042 };
6043
6044 static struct rpc_task *_nfs41_proc_sequence(struct nfs_client *clp,
6045                 struct rpc_cred *cred,
6046                 bool is_privileged)
6047 {
6048         struct nfs4_sequence_data *calldata;
6049         struct rpc_message msg = {
6050                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SEQUENCE],
6051                 .rpc_cred = cred,
6052         };
6053         struct rpc_task_setup task_setup_data = {
6054                 .rpc_client = clp->cl_rpcclient,
6055                 .rpc_message = &msg,
6056                 .callback_ops = &nfs41_sequence_ops,
6057                 .flags = RPC_TASK_ASYNC | RPC_TASK_TIMEOUT,
6058         };
6059
6060         if (!atomic_inc_not_zero(&clp->cl_count))
6061                 return ERR_PTR(-EIO);
6062         calldata = kzalloc(sizeof(*calldata), GFP_NOFS);
6063         if (calldata == NULL) {
6064                 nfs_put_client(clp);
6065                 return ERR_PTR(-ENOMEM);
6066         }
6067         nfs41_init_sequence(&calldata->args, &calldata->res, 0);
6068         if (is_privileged)
6069                 nfs4_set_sequence_privileged(&calldata->args);
6070         msg.rpc_argp = &calldata->args;
6071         msg.rpc_resp = &calldata->res;
6072         calldata->clp = clp;
6073         task_setup_data.callback_data = calldata;
6074
6075         return rpc_run_task(&task_setup_data);
6076 }
6077
6078 static int nfs41_proc_async_sequence(struct nfs_client *clp, struct rpc_cred *cred, unsigned renew_flags)
6079 {
6080         struct rpc_task *task;
6081         int ret = 0;
6082
6083         if ((renew_flags & NFS4_RENEW_TIMEOUT) == 0)
6084                 return 0;
6085         task = _nfs41_proc_sequence(clp, cred, false);
6086         if (IS_ERR(task))
6087                 ret = PTR_ERR(task);
6088         else
6089                 rpc_put_task_async(task);
6090         dprintk("<-- %s status=%d\n", __func__, ret);
6091         return ret;
6092 }
6093
6094 static int nfs4_proc_sequence(struct nfs_client *clp, struct rpc_cred *cred)
6095 {
6096         struct rpc_task *task;
6097         int ret;
6098
6099         task = _nfs41_proc_sequence(clp, cred, true);
6100         if (IS_ERR(task)) {
6101                 ret = PTR_ERR(task);
6102                 goto out;
6103         }
6104         ret = rpc_wait_for_completion_task(task);
6105         if (!ret) {
6106                 struct nfs4_sequence_res *res = task->tk_msg.rpc_resp;
6107
6108                 if (task->tk_status == 0)
6109                         nfs41_handle_sequence_flag_errors(clp, res->sr_status_flags);
6110                 ret = task->tk_status;
6111         }
6112         rpc_put_task(task);
6113 out:
6114         dprintk("<-- %s status=%d\n", __func__, ret);
6115         return ret;
6116 }
6117
6118 struct nfs4_reclaim_complete_data {
6119         struct nfs_client *clp;
6120         struct nfs41_reclaim_complete_args arg;
6121         struct nfs41_reclaim_complete_res res;
6122 };
6123
6124 static void nfs4_reclaim_complete_prepare(struct rpc_task *task, void *data)
6125 {
6126         struct nfs4_reclaim_complete_data *calldata = data;
6127
6128         nfs41_setup_sequence(calldata->clp->cl_session,
6129                         &calldata->arg.seq_args,
6130                         &calldata->res.seq_res,
6131                         task);
6132 }
6133
6134 static int nfs41_reclaim_complete_handle_errors(struct rpc_task *task, struct nfs_client *clp)
6135 {
6136         switch(task->tk_status) {
6137         case 0:
6138         case -NFS4ERR_COMPLETE_ALREADY:
6139         case -NFS4ERR_WRONG_CRED: /* What to do here? */
6140                 break;
6141         case -NFS4ERR_DELAY:
6142                 rpc_delay(task, NFS4_POLL_RETRY_MAX);
6143                 /* fall through */
6144         case -NFS4ERR_RETRY_UNCACHED_REP:
6145                 return -EAGAIN;
6146         default:
6147                 nfs4_schedule_lease_recovery(clp);
6148         }
6149         return 0;
6150 }
6151
6152 static void nfs4_reclaim_complete_done(struct rpc_task *task, void *data)
6153 {
6154         struct nfs4_reclaim_complete_data *calldata = data;
6155         struct nfs_client *clp = calldata->clp;
6156         struct nfs4_sequence_res *res = &calldata->res.seq_res;
6157
6158         dprintk("--> %s\n", __func__);
6159         if (!nfs41_sequence_done(task, res))
6160                 return;
6161
6162         if (nfs41_reclaim_complete_handle_errors(task, clp) == -EAGAIN) {
6163                 rpc_restart_call_prepare(task);
6164                 return;
6165         }
6166         dprintk("<-- %s\n", __func__);
6167 }
6168
6169 static void nfs4_free_reclaim_complete_data(void *data)
6170 {
6171         struct nfs4_reclaim_complete_data *calldata = data;
6172
6173         kfree(calldata);
6174 }
6175
6176 static const struct rpc_call_ops nfs4_reclaim_complete_call_ops = {
6177         .rpc_call_prepare = nfs4_reclaim_complete_prepare,
6178         .rpc_call_done = nfs4_reclaim_complete_done,
6179         .rpc_release = nfs4_free_reclaim_complete_data,
6180 };
6181
6182 /*
6183  * Issue a global reclaim complete.
6184  */
6185 static int nfs41_proc_reclaim_complete(struct nfs_client *clp,
6186                 struct rpc_cred *cred)
6187 {
6188         struct nfs4_reclaim_complete_data *calldata;
6189         struct rpc_task *task;
6190         struct rpc_message msg = {
6191                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_RECLAIM_COMPLETE],
6192                 .rpc_cred = cred,
6193         };
6194         struct rpc_task_setup task_setup_data = {
6195                 .rpc_client = clp->cl_rpcclient,
6196                 .rpc_message = &msg,
6197                 .callback_ops = &nfs4_reclaim_complete_call_ops,
6198                 .flags = RPC_TASK_ASYNC,
6199         };
6200         int status = -ENOMEM;
6201
6202         dprintk("--> %s\n", __func__);
6203         calldata = kzalloc(sizeof(*calldata), GFP_NOFS);
6204         if (calldata == NULL)
6205                 goto out;
6206         calldata->clp = clp;
6207         calldata->arg.one_fs = 0;
6208
6209         nfs41_init_sequence(&calldata->arg.seq_args, &calldata->res.seq_res, 0);
6210         nfs4_set_sequence_privileged(&calldata->arg.seq_args);
6211         msg.rpc_argp = &calldata->arg;
6212         msg.rpc_resp = &calldata->res;
6213         task_setup_data.callback_data = calldata;
6214         task = rpc_run_task(&task_setup_data);
6215         if (IS_ERR(task)) {
6216                 status = PTR_ERR(task);
6217                 goto out;
6218         }
6219         status = nfs4_wait_for_completion_rpc_task(task);
6220         if (status == 0)
6221                 status = task->tk_status;
6222         rpc_put_task(task);
6223         return 0;
6224 out:
6225         dprintk("<-- %s status=%d\n", __func__, status);
6226         return status;
6227 }
6228
6229 static void
6230 nfs4_layoutget_prepare(struct rpc_task *task, void *calldata)
6231 {
6232         struct nfs4_layoutget *lgp = calldata;
6233         struct nfs_server *server = NFS_SERVER(lgp->args.inode);
6234         struct nfs4_session *session = nfs4_get_session(server);
6235
6236         dprintk("--> %s\n", __func__);
6237         /* Note the is a race here, where a CB_LAYOUTRECALL can come in
6238          * right now covering the LAYOUTGET we are about to send.
6239          * However, that is not so catastrophic, and there seems
6240          * to be no way to prevent it completely.
6241          */
6242         if (nfs41_setup_sequence(session, &lgp->args.seq_args,
6243                                 &lgp->res.seq_res, task))
6244                 return;
6245         if (pnfs_choose_layoutget_stateid(&lgp->args.stateid,
6246                                           NFS_I(lgp->args.inode)->layout,
6247                                           lgp->args.ctx->state)) {
6248                 rpc_exit(task, NFS4_OK);
6249         }
6250 }
6251
6252 static void nfs4_layoutget_done(struct rpc_task *task, void *calldata)
6253 {
6254         struct nfs4_layoutget *lgp = calldata;
6255         struct inode *inode = lgp->args.inode;
6256         struct nfs_server *server = NFS_SERVER(inode);
6257         struct pnfs_layout_hdr *lo;
6258         struct nfs4_state *state = NULL;
6259         unsigned long timeo, giveup;
6260
6261         dprintk("--> %s\n", __func__);
6262
6263         if (!nfs41_sequence_done(task, &lgp->res.seq_res))
6264                 goto out;
6265
6266         switch (task->tk_status) {
6267         case 0:
6268                 goto out;
6269         case -NFS4ERR_LAYOUTTRYLATER:
6270         case -NFS4ERR_RECALLCONFLICT:
6271                 timeo = rpc_get_timeout(task->tk_client);
6272                 giveup = lgp->args.timestamp + timeo;
6273                 if (time_after(giveup, jiffies))
6274                         task->tk_status = -NFS4ERR_DELAY;
6275                 break;
6276         case -NFS4ERR_EXPIRED:
6277         case -NFS4ERR_BAD_STATEID:
6278                 spin_lock(&inode->i_lock);
6279                 lo = NFS_I(inode)->layout;
6280                 if (!lo || list_empty(&lo->plh_segs)) {
6281                         spin_unlock(&inode->i_lock);
6282                         /* If the open stateid was bad, then recover it. */
6283                         state = lgp->args.ctx->state;
6284                 } else {
6285                         LIST_HEAD(head);
6286
6287                         pnfs_mark_matching_lsegs_invalid(lo, &head, NULL);
6288                         spin_unlock(&inode->i_lock);
6289                         /* Mark the bad layout state as invalid, then
6290                          * retry using the open stateid. */
6291                         pnfs_free_lseg_list(&head);
6292                 }
6293         }
6294         if (nfs4_async_handle_error(task, server, state) == -EAGAIN)
6295                 rpc_restart_call_prepare(task);
6296 out:
6297         dprintk("<-- %s\n", __func__);
6298 }
6299
6300 static size_t max_response_pages(struct nfs_server *server)
6301 {
6302         u32 max_resp_sz = server->nfs_client->cl_session->fc_attrs.max_resp_sz;
6303         return nfs_page_array_len(0, max_resp_sz);
6304 }
6305
6306 static void nfs4_free_pages(struct page **pages, size_t size)
6307 {
6308         int i;
6309
6310         if (!pages)
6311                 return;
6312
6313         for (i = 0; i < size; i++) {
6314                 if (!pages[i])
6315                         break;
6316                 __free_page(pages[i]);
6317         }
6318         kfree(pages);
6319 }
6320
6321 static struct page **nfs4_alloc_pages(size_t size, gfp_t gfp_flags)
6322 {
6323         struct page **pages;
6324         int i;
6325
6326         pages = kcalloc(size, sizeof(struct page *), gfp_flags);
6327         if (!pages) {
6328                 dprintk("%s: can't alloc array of %zu pages\n", __func__, size);
6329                 return NULL;
6330         }
6331
6332         for (i = 0; i < size; i++) {
6333                 pages[i] = alloc_page(gfp_flags);
6334                 if (!pages[i]) {
6335                         dprintk("%s: failed to allocate page\n", __func__);
6336                         nfs4_free_pages(pages, size);
6337                         return NULL;
6338                 }
6339         }
6340
6341         return pages;
6342 }
6343
6344 static void nfs4_layoutget_release(void *calldata)
6345 {
6346         struct nfs4_layoutget *lgp = calldata;
6347         struct inode *inode = lgp->args.inode;
6348         struct nfs_server *server = NFS_SERVER(inode);
6349         size_t max_pages = max_response_pages(server);
6350
6351         dprintk("--> %s\n", __func__);
6352         nfs4_free_pages(lgp->args.layout.pages, max_pages);
6353         pnfs_put_layout_hdr(NFS_I(inode)->layout);
6354         put_nfs_open_context(lgp->args.ctx);
6355         kfree(calldata);
6356         dprintk("<-- %s\n", __func__);
6357 }
6358
6359 static const struct rpc_call_ops nfs4_layoutget_call_ops = {
6360         .rpc_call_prepare = nfs4_layoutget_prepare,
6361         .rpc_call_done = nfs4_layoutget_done,
6362         .rpc_release = nfs4_layoutget_release,
6363 };
6364
6365 struct pnfs_layout_segment *
6366 nfs4_proc_layoutget(struct nfs4_layoutget *lgp, gfp_t gfp_flags)
6367 {
6368         struct inode *inode = lgp->args.inode;
6369         struct nfs_server *server = NFS_SERVER(inode);
6370         size_t max_pages = max_response_pages(server);
6371         struct rpc_task *task;
6372         struct rpc_message msg = {
6373                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LAYOUTGET],
6374                 .rpc_argp = &lgp->args,
6375                 .rpc_resp = &lgp->res,
6376                 .rpc_cred = lgp->cred,
6377         };
6378         struct rpc_task_setup task_setup_data = {
6379                 .rpc_client = server->client,
6380                 .rpc_message = &msg,
6381                 .callback_ops = &nfs4_layoutget_call_ops,
6382                 .callback_data = lgp,
6383                 .flags = RPC_TASK_ASYNC,
6384         };
6385         struct pnfs_layout_segment *lseg = NULL;
6386         int status = 0;
6387
6388         dprintk("--> %s\n", __func__);
6389
6390         lgp->args.layout.pages = nfs4_alloc_pages(max_pages, gfp_flags);
6391         if (!lgp->args.layout.pages) {
6392                 nfs4_layoutget_release(lgp);
6393                 return ERR_PTR(-ENOMEM);
6394         }
6395         lgp->args.layout.pglen = max_pages * PAGE_SIZE;
6396         lgp->args.timestamp = jiffies;
6397
6398         lgp->res.layoutp = &lgp->args.layout;
6399         lgp->res.seq_res.sr_slot = NULL;
6400         nfs41_init_sequence(&lgp->args.seq_args, &lgp->res.seq_res, 0);
6401
6402         /* nfs4_layoutget_release calls pnfs_put_layout_hdr */
6403         pnfs_get_layout_hdr(NFS_I(inode)->layout);
6404
6405         task = rpc_run_task(&task_setup_data);
6406         if (IS_ERR(task))
6407                 return ERR_CAST(task);
6408         status = nfs4_wait_for_completion_rpc_task(task);
6409         if (status == 0)
6410                 status = task->tk_status;
6411         /* if layoutp->len is 0, nfs4_layoutget_prepare called rpc_exit */
6412         if (status == 0 && lgp->res.layoutp->len)
6413                 lseg = pnfs_layout_process(lgp);
6414         rpc_put_task(task);
6415         dprintk("<-- %s status=%d\n", __func__, status);
6416         if (status)
6417                 return ERR_PTR(status);
6418         return lseg;
6419 }
6420
6421 static void
6422 nfs4_layoutreturn_prepare(struct rpc_task *task, void *calldata)
6423 {
6424         struct nfs4_layoutreturn *lrp = calldata;
6425
6426         dprintk("--> %s\n", __func__);
6427         nfs41_setup_sequence(lrp->clp->cl_session,
6428                         &lrp->args.seq_args,
6429                         &lrp->res.seq_res,
6430                         task);
6431 }
6432
6433 static void nfs4_layoutreturn_done(struct rpc_task *task, void *calldata)
6434 {
6435         struct nfs4_layoutreturn *lrp = calldata;
6436         struct nfs_server *server;
6437
6438         dprintk("--> %s\n", __func__);
6439
6440         if (!nfs41_sequence_done(task, &lrp->res.seq_res))
6441                 return;
6442
6443         server = NFS_SERVER(lrp->args.inode);
6444         if (nfs4_async_handle_error(task, server, NULL) == -EAGAIN) {
6445                 rpc_restart_call_prepare(task);
6446                 return;
6447         }
6448         dprintk("<-- %s\n", __func__);
6449 }
6450
6451 static void nfs4_layoutreturn_release(void *calldata)
6452 {
6453         struct nfs4_layoutreturn *lrp = calldata;
6454         struct pnfs_layout_hdr *lo = lrp->args.layout;
6455
6456         dprintk("--> %s\n", __func__);
6457         spin_lock(&lo->plh_inode->i_lock);
6458         if (lrp->res.lrs_present)
6459                 pnfs_set_layout_stateid(lo, &lrp->res.stateid, true);
6460         lo->plh_block_lgets--;
6461         spin_unlock(&lo->plh_inode->i_lock);
6462         pnfs_put_layout_hdr(lrp->args.layout);
6463         kfree(calldata);
6464         dprintk("<-- %s\n", __func__);
6465 }
6466
6467 static const struct rpc_call_ops nfs4_layoutreturn_call_ops = {
6468         .rpc_call_prepare = nfs4_layoutreturn_prepare,
6469         .rpc_call_done = nfs4_layoutreturn_done,
6470         .rpc_release = nfs4_layoutreturn_release,
6471 };
6472
6473 int nfs4_proc_layoutreturn(struct nfs4_layoutreturn *lrp)
6474 {
6475         struct rpc_task *task;
6476         struct rpc_message msg = {
6477                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LAYOUTRETURN],
6478                 .rpc_argp = &lrp->args,
6479                 .rpc_resp = &lrp->res,
6480                 .rpc_cred = lrp->cred,
6481         };
6482         struct rpc_task_setup task_setup_data = {
6483                 .rpc_client = lrp->clp->cl_rpcclient,
6484                 .rpc_message = &msg,
6485                 .callback_ops = &nfs4_layoutreturn_call_ops,
6486                 .callback_data = lrp,
6487         };
6488         int status;
6489
6490         dprintk("--> %s\n", __func__);
6491         nfs41_init_sequence(&lrp->args.seq_args, &lrp->res.seq_res, 1);
6492         task = rpc_run_task(&task_setup_data);
6493         if (IS_ERR(task))
6494                 return PTR_ERR(task);
6495         status = task->tk_status;
6496         dprintk("<-- %s status=%d\n", __func__, status);
6497         rpc_put_task(task);
6498         return status;
6499 }
6500
6501 /*
6502  * Retrieve the list of Data Server devices from the MDS.
6503  */
6504 static int _nfs4_getdevicelist(struct nfs_server *server,
6505                                     const struct nfs_fh *fh,
6506                                     struct pnfs_devicelist *devlist)
6507 {
6508         struct nfs4_getdevicelist_args args = {
6509                 .fh = fh,
6510                 .layoutclass = server->pnfs_curr_ld->id,
6511         };
6512         struct nfs4_getdevicelist_res res = {
6513                 .devlist = devlist,
6514         };
6515         struct rpc_message msg = {
6516                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_GETDEVICELIST],
6517                 .rpc_argp = &args,
6518                 .rpc_resp = &res,
6519         };
6520         int status;
6521
6522         dprintk("--> %s\n", __func__);
6523         status = nfs4_call_sync(server->client, server, &msg, &args.seq_args,
6524                                 &res.seq_res, 0);
6525         dprintk("<-- %s status=%d\n", __func__, status);
6526         return status;
6527 }
6528
6529 int nfs4_proc_getdevicelist(struct nfs_server *server,
6530                             const struct nfs_fh *fh,
6531                             struct pnfs_devicelist *devlist)
6532 {
6533         struct nfs4_exception exception = { };
6534         int err;
6535
6536         do {
6537                 err = nfs4_handle_exception(server,
6538                                 _nfs4_getdevicelist(server, fh, devlist),
6539                                 &exception);
6540         } while (exception.retry);
6541
6542         dprintk("%s: err=%d, num_devs=%u\n", __func__,
6543                 err, devlist->num_devs);
6544
6545         return err;
6546 }
6547 EXPORT_SYMBOL_GPL(nfs4_proc_getdevicelist);
6548
6549 static int
6550 _nfs4_proc_getdeviceinfo(struct nfs_server *server,
6551                 struct pnfs_device *pdev,
6552                 struct rpc_cred *cred)
6553 {
6554         struct nfs4_getdeviceinfo_args args = {
6555                 .pdev = pdev,
6556         };
6557         struct nfs4_getdeviceinfo_res res = {
6558                 .pdev = pdev,
6559         };
6560         struct rpc_message msg = {
6561                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_GETDEVICEINFO],
6562                 .rpc_argp = &args,
6563                 .rpc_resp = &res,
6564                 .rpc_cred = cred,
6565         };
6566         int status;
6567
6568         dprintk("--> %s\n", __func__);
6569         status = nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
6570         dprintk("<-- %s status=%d\n", __func__, status);
6571
6572         return status;
6573 }
6574
6575 int nfs4_proc_getdeviceinfo(struct nfs_server *server,
6576                 struct pnfs_device *pdev,
6577                 struct rpc_cred *cred)
6578 {
6579         struct nfs4_exception exception = { };
6580         int err;
6581
6582         do {
6583                 err = nfs4_handle_exception(server,
6584                                         _nfs4_proc_getdeviceinfo(server, pdev, cred),
6585                                         &exception);
6586         } while (exception.retry);
6587         return err;
6588 }
6589 EXPORT_SYMBOL_GPL(nfs4_proc_getdeviceinfo);
6590
6591 static void nfs4_layoutcommit_prepare(struct rpc_task *task, void *calldata)
6592 {
6593         struct nfs4_layoutcommit_data *data = calldata;
6594         struct nfs_server *server = NFS_SERVER(data->args.inode);
6595         struct nfs4_session *session = nfs4_get_session(server);
6596
6597         nfs41_setup_sequence(session,
6598                         &data->args.seq_args,
6599                         &data->res.seq_res,
6600                         task);
6601 }
6602
6603 static void
6604 nfs4_layoutcommit_done(struct rpc_task *task, void *calldata)
6605 {
6606         struct nfs4_layoutcommit_data *data = calldata;
6607         struct nfs_server *server = NFS_SERVER(data->args.inode);
6608
6609         if (!nfs41_sequence_done(task, &data->res.seq_res))
6610                 return;
6611
6612         switch (task->tk_status) { /* Just ignore these failures */
6613         case -NFS4ERR_DELEG_REVOKED: /* layout was recalled */
6614         case -NFS4ERR_BADIOMODE:     /* no IOMODE_RW layout for range */
6615         case -NFS4ERR_BADLAYOUT:     /* no layout */
6616         case -NFS4ERR_GRACE:        /* loca_recalim always false */
6617                 task->tk_status = 0;
6618                 break;
6619         case 0:
6620                 nfs_post_op_update_inode_force_wcc(data->args.inode,
6621                                                    data->res.fattr);
6622                 break;
6623         default:
6624                 if (nfs4_async_handle_error(task, server, NULL) == -EAGAIN) {
6625                         rpc_restart_call_prepare(task);
6626                         return;
6627                 }
6628         }
6629 }
6630
6631 static void nfs4_layoutcommit_release(void *calldata)
6632 {
6633         struct nfs4_layoutcommit_data *data = calldata;
6634
6635         pnfs_cleanup_layoutcommit(data);
6636         put_rpccred(data->cred);
6637         kfree(data);
6638 }
6639
6640 static const struct rpc_call_ops nfs4_layoutcommit_ops = {
6641         .rpc_call_prepare = nfs4_layoutcommit_prepare,
6642         .rpc_call_done = nfs4_layoutcommit_done,
6643         .rpc_release = nfs4_layoutcommit_release,
6644 };
6645
6646 int
6647 nfs4_proc_layoutcommit(struct nfs4_layoutcommit_data *data, bool sync)
6648 {
6649         struct rpc_message msg = {
6650                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LAYOUTCOMMIT],
6651                 .rpc_argp = &data->args,
6652                 .rpc_resp = &data->res,
6653                 .rpc_cred = data->cred,
6654         };
6655         struct rpc_task_setup task_setup_data = {
6656                 .task = &data->task,
6657                 .rpc_client = NFS_CLIENT(data->args.inode),
6658                 .rpc_message = &msg,
6659                 .callback_ops = &nfs4_layoutcommit_ops,
6660                 .callback_data = data,
6661                 .flags = RPC_TASK_ASYNC,
6662         };
6663         struct rpc_task *task;
6664         int status = 0;
6665
6666         dprintk("NFS: %4d initiating layoutcommit call. sync %d "
6667                 "lbw: %llu inode %lu\n",
6668                 data->task.tk_pid, sync,
6669                 data->args.lastbytewritten,
6670                 data->args.inode->i_ino);
6671
6672         nfs41_init_sequence(&data->args.seq_args, &data->res.seq_res, 1);
6673         task = rpc_run_task(&task_setup_data);
6674         if (IS_ERR(task))
6675                 return PTR_ERR(task);
6676         if (sync == false)
6677                 goto out;
6678         status = nfs4_wait_for_completion_rpc_task(task);
6679         if (status != 0)
6680                 goto out;
6681         status = task->tk_status;
6682 out:
6683         dprintk("%s: status %d\n", __func__, status);
6684         rpc_put_task(task);
6685         return status;
6686 }
6687
6688 static int
6689 _nfs41_proc_secinfo_no_name(struct nfs_server *server, struct nfs_fh *fhandle,
6690                     struct nfs_fsinfo *info, struct nfs4_secinfo_flavors *flavors)
6691 {
6692         struct nfs41_secinfo_no_name_args args = {
6693                 .style = SECINFO_STYLE_CURRENT_FH,
6694         };
6695         struct nfs4_secinfo_res res = {
6696                 .flavors = flavors,
6697         };
6698         struct rpc_message msg = {
6699                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SECINFO_NO_NAME],
6700                 .rpc_argp = &args,
6701                 .rpc_resp = &res,
6702         };
6703         return nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
6704 }
6705
6706 static int
6707 nfs41_proc_secinfo_no_name(struct nfs_server *server, struct nfs_fh *fhandle,
6708                            struct nfs_fsinfo *info, struct nfs4_secinfo_flavors *flavors)
6709 {
6710         struct nfs4_exception exception = { };
6711         int err;
6712         do {
6713                 err = _nfs41_proc_secinfo_no_name(server, fhandle, info, flavors);
6714                 switch (err) {
6715                 case 0:
6716                 case -NFS4ERR_WRONGSEC:
6717                 case -NFS4ERR_NOTSUPP:
6718                         goto out;
6719                 default:
6720                         err = nfs4_handle_exception(server, err, &exception);
6721                 }
6722         } while (exception.retry);
6723 out:
6724         return err;
6725 }
6726
6727 static int
6728 nfs41_find_root_sec(struct nfs_server *server, struct nfs_fh *fhandle,
6729                     struct nfs_fsinfo *info)
6730 {
6731         int err;
6732         struct page *page;
6733         rpc_authflavor_t flavor;
6734         struct nfs4_secinfo_flavors *flavors;
6735
6736         page = alloc_page(GFP_KERNEL);
6737         if (!page) {
6738                 err = -ENOMEM;
6739                 goto out;
6740         }
6741
6742         flavors = page_address(page);
6743         err = nfs41_proc_secinfo_no_name(server, fhandle, info, flavors);
6744
6745         /*
6746          * Fall back on "guess and check" method if
6747          * the server doesn't support SECINFO_NO_NAME
6748          */
6749         if (err == -NFS4ERR_WRONGSEC || err == -NFS4ERR_NOTSUPP) {
6750                 err = nfs4_find_root_sec(server, fhandle, info);
6751                 goto out_freepage;
6752         }
6753         if (err)
6754                 goto out_freepage;
6755
6756         flavor = nfs_find_best_sec(flavors);
6757         if (err == 0)
6758                 err = nfs4_lookup_root_sec(server, fhandle, info, flavor);
6759
6760 out_freepage:
6761         put_page(page);
6762         if (err == -EACCES)
6763                 return -EPERM;
6764 out:
6765         return err;
6766 }
6767
6768 static int _nfs41_test_stateid(struct nfs_server *server,
6769                 nfs4_stateid *stateid,
6770                 struct rpc_cred *cred)
6771 {
6772         int status;
6773         struct nfs41_test_stateid_args args = {
6774                 .stateid = stateid,
6775         };
6776         struct nfs41_test_stateid_res res;
6777         struct rpc_message msg = {
6778                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_TEST_STATEID],
6779                 .rpc_argp = &args,
6780                 .rpc_resp = &res,
6781                 .rpc_cred = cred,
6782         };
6783
6784         dprintk("NFS call  test_stateid %p\n", stateid);
6785         nfs41_init_sequence(&args.seq_args, &res.seq_res, 0);
6786         nfs4_set_sequence_privileged(&args.seq_args);
6787         status = nfs4_call_sync_sequence(server->client, server, &msg,
6788                         &args.seq_args, &res.seq_res);
6789         if (status != NFS_OK) {
6790                 dprintk("NFS reply test_stateid: failed, %d\n", status);
6791                 return status;
6792         }
6793         dprintk("NFS reply test_stateid: succeeded, %d\n", -res.status);
6794         return -res.status;
6795 }
6796
6797 /**
6798  * nfs41_test_stateid - perform a TEST_STATEID operation
6799  *
6800  * @server: server / transport on which to perform the operation
6801  * @stateid: state ID to test
6802  * @cred: credential
6803  *
6804  * Returns NFS_OK if the server recognizes that "stateid" is valid.
6805  * Otherwise a negative NFS4ERR value is returned if the operation
6806  * failed or the state ID is not currently valid.
6807  */
6808 static int nfs41_test_stateid(struct nfs_server *server,
6809                 nfs4_stateid *stateid,
6810                 struct rpc_cred *cred)
6811 {
6812         struct nfs4_exception exception = { };
6813         int err;
6814         do {
6815                 err = _nfs41_test_stateid(server, stateid, cred);
6816                 if (err != -NFS4ERR_DELAY)
6817                         break;
6818                 nfs4_handle_exception(server, err, &exception);
6819         } while (exception.retry);
6820         return err;
6821 }
6822
6823 struct nfs_free_stateid_data {
6824         struct nfs_server *server;
6825         struct nfs41_free_stateid_args args;
6826         struct nfs41_free_stateid_res res;
6827 };
6828
6829 static void nfs41_free_stateid_prepare(struct rpc_task *task, void *calldata)
6830 {
6831         struct nfs_free_stateid_data *data = calldata;
6832         nfs41_setup_sequence(nfs4_get_session(data->server),
6833                         &data->args.seq_args,
6834                         &data->res.seq_res,
6835                         task);
6836 }
6837
6838 static void nfs41_free_stateid_done(struct rpc_task *task, void *calldata)
6839 {
6840         struct nfs_free_stateid_data *data = calldata;
6841
6842         nfs41_sequence_done(task, &data->res.seq_res);
6843
6844         switch (task->tk_status) {
6845         case -NFS4ERR_DELAY:
6846                 if (nfs4_async_handle_error(task, data->server, NULL) == -EAGAIN)
6847                         rpc_restart_call_prepare(task);
6848         }
6849 }
6850
6851 static void nfs41_free_stateid_release(void *calldata)
6852 {
6853         kfree(calldata);
6854 }
6855
6856 const struct rpc_call_ops nfs41_free_stateid_ops = {
6857         .rpc_call_prepare = nfs41_free_stateid_prepare,
6858         .rpc_call_done = nfs41_free_stateid_done,
6859         .rpc_release = nfs41_free_stateid_release,
6860 };
6861
6862 static struct rpc_task *_nfs41_free_stateid(struct nfs_server *server,
6863                 nfs4_stateid *stateid,
6864                 struct rpc_cred *cred,
6865                 bool privileged)
6866 {
6867         struct rpc_message msg = {
6868                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_FREE_STATEID],
6869                 .rpc_cred = cred,
6870         };
6871         struct rpc_task_setup task_setup = {
6872                 .rpc_client = server->client,
6873                 .rpc_message = &msg,
6874                 .callback_ops = &nfs41_free_stateid_ops,
6875                 .flags = RPC_TASK_ASYNC,
6876         };
6877         struct nfs_free_stateid_data *data;
6878
6879         dprintk("NFS call  free_stateid %p\n", stateid);
6880         data = kmalloc(sizeof(*data), GFP_NOFS);
6881         if (!data)
6882                 return ERR_PTR(-ENOMEM);
6883         data->server = server;
6884         nfs4_stateid_copy(&data->args.stateid, stateid);
6885
6886         task_setup.callback_data = data;
6887
6888         msg.rpc_argp = &data->args;
6889         msg.rpc_resp = &data->res;
6890         nfs41_init_sequence(&data->args.seq_args, &data->res.seq_res, 0);
6891         if (privileged)
6892                 nfs4_set_sequence_privileged(&data->args.seq_args);
6893
6894         return rpc_run_task(&task_setup);
6895 }
6896
6897 /**
6898  * nfs41_free_stateid - perform a FREE_STATEID operation
6899  *
6900  * @server: server / transport on which to perform the operation
6901  * @stateid: state ID to release
6902  * @cred: credential
6903  *
6904  * Returns NFS_OK if the server freed "stateid".  Otherwise a
6905  * negative NFS4ERR value is returned.
6906  */
6907 static int nfs41_free_stateid(struct nfs_server *server,
6908                 nfs4_stateid *stateid,
6909                 struct rpc_cred *cred)
6910 {
6911         struct rpc_task *task;
6912         int ret;
6913
6914         task = _nfs41_free_stateid(server, stateid, cred, true);
6915         if (IS_ERR(task))
6916                 return PTR_ERR(task);
6917         ret = rpc_wait_for_completion_task(task);
6918         if (!ret)
6919                 ret = task->tk_status;
6920         rpc_put_task(task);
6921         return ret;
6922 }
6923
6924 static int nfs41_free_lock_state(struct nfs_server *server, struct nfs4_lock_state *lsp)
6925 {
6926         struct rpc_task *task;
6927         struct rpc_cred *cred = lsp->ls_state->owner->so_cred;
6928
6929         task = _nfs41_free_stateid(server, &lsp->ls_stateid, cred, false);
6930         nfs4_free_lock_state(server, lsp);
6931         if (IS_ERR(task))
6932                 return PTR_ERR(task);
6933         rpc_put_task(task);
6934         return 0;
6935 }
6936
6937 static bool nfs41_match_stateid(const nfs4_stateid *s1,
6938                 const nfs4_stateid *s2)
6939 {
6940         if (memcmp(s1->other, s2->other, sizeof(s1->other)) != 0)
6941                 return false;
6942
6943         if (s1->seqid == s2->seqid)
6944                 return true;
6945         if (s1->seqid == 0 || s2->seqid == 0)
6946                 return true;
6947
6948         return false;
6949 }
6950
6951 #endif /* CONFIG_NFS_V4_1 */
6952
6953 static bool nfs4_match_stateid(const nfs4_stateid *s1,
6954                 const nfs4_stateid *s2)
6955 {
6956         return nfs4_stateid_match(s1, s2);
6957 }
6958
6959
6960 static const struct nfs4_state_recovery_ops nfs40_reboot_recovery_ops = {
6961         .owner_flag_bit = NFS_OWNER_RECLAIM_REBOOT,
6962         .state_flag_bit = NFS_STATE_RECLAIM_REBOOT,
6963         .recover_open   = nfs4_open_reclaim,
6964         .recover_lock   = nfs4_lock_reclaim,
6965         .establish_clid = nfs4_init_clientid,
6966         .get_clid_cred  = nfs4_get_setclientid_cred,
6967         .detect_trunking = nfs40_discover_server_trunking,
6968 };
6969
6970 #if defined(CONFIG_NFS_V4_1)
6971 static const struct nfs4_state_recovery_ops nfs41_reboot_recovery_ops = {
6972         .owner_flag_bit = NFS_OWNER_RECLAIM_REBOOT,
6973         .state_flag_bit = NFS_STATE_RECLAIM_REBOOT,
6974         .recover_open   = nfs4_open_reclaim,
6975         .recover_lock   = nfs4_lock_reclaim,
6976         .establish_clid = nfs41_init_clientid,
6977         .get_clid_cred  = nfs4_get_exchange_id_cred,
6978         .reclaim_complete = nfs41_proc_reclaim_complete,
6979         .detect_trunking = nfs41_discover_server_trunking,
6980 };
6981 #endif /* CONFIG_NFS_V4_1 */
6982
6983 static const struct nfs4_state_recovery_ops nfs40_nograce_recovery_ops = {
6984         .owner_flag_bit = NFS_OWNER_RECLAIM_NOGRACE,
6985         .state_flag_bit = NFS_STATE_RECLAIM_NOGRACE,
6986         .recover_open   = nfs4_open_expired,
6987         .recover_lock   = nfs4_lock_expired,
6988         .establish_clid = nfs4_init_clientid,
6989         .get_clid_cred  = nfs4_get_setclientid_cred,
6990 };
6991
6992 #if defined(CONFIG_NFS_V4_1)
6993 static const struct nfs4_state_recovery_ops nfs41_nograce_recovery_ops = {
6994         .owner_flag_bit = NFS_OWNER_RECLAIM_NOGRACE,
6995         .state_flag_bit = NFS_STATE_RECLAIM_NOGRACE,
6996         .recover_open   = nfs41_open_expired,
6997         .recover_lock   = nfs41_lock_expired,
6998         .establish_clid = nfs41_init_clientid,
6999         .get_clid_cred  = nfs4_get_exchange_id_cred,
7000 };
7001 #endif /* CONFIG_NFS_V4_1 */
7002
7003 static const struct nfs4_state_maintenance_ops nfs40_state_renewal_ops = {
7004         .sched_state_renewal = nfs4_proc_async_renew,
7005         .get_state_renewal_cred_locked = nfs4_get_renew_cred_locked,
7006         .renew_lease = nfs4_proc_renew,
7007 };
7008
7009 #if defined(CONFIG_NFS_V4_1)
7010 static const struct nfs4_state_maintenance_ops nfs41_state_renewal_ops = {
7011         .sched_state_renewal = nfs41_proc_async_sequence,
7012         .get_state_renewal_cred_locked = nfs4_get_machine_cred_locked,
7013         .renew_lease = nfs4_proc_sequence,
7014 };
7015 #endif
7016
7017 static const struct nfs4_minor_version_ops nfs_v4_0_minor_ops = {
7018         .minor_version = 0,
7019         .init_caps = NFS_CAP_READDIRPLUS
7020                 | NFS_CAP_ATOMIC_OPEN
7021                 | NFS_CAP_CHANGE_ATTR
7022                 | NFS_CAP_POSIX_LOCK,
7023         .call_sync = _nfs4_call_sync,
7024         .match_stateid = nfs4_match_stateid,
7025         .find_root_sec = nfs4_find_root_sec,
7026         .free_lock_state = nfs4_release_lockowner,
7027         .reboot_recovery_ops = &nfs40_reboot_recovery_ops,
7028         .nograce_recovery_ops = &nfs40_nograce_recovery_ops,
7029         .state_renewal_ops = &nfs40_state_renewal_ops,
7030 };
7031
7032 #if defined(CONFIG_NFS_V4_1)
7033 static const struct nfs4_minor_version_ops nfs_v4_1_minor_ops = {
7034         .minor_version = 1,
7035         .init_caps = NFS_CAP_READDIRPLUS
7036                 | NFS_CAP_ATOMIC_OPEN
7037                 | NFS_CAP_CHANGE_ATTR
7038                 | NFS_CAP_POSIX_LOCK
7039                 | NFS_CAP_STATEID_NFSV41
7040                 | NFS_CAP_ATOMIC_OPEN_V1,
7041         .call_sync = nfs4_call_sync_sequence,
7042         .match_stateid = nfs41_match_stateid,
7043         .find_root_sec = nfs41_find_root_sec,
7044         .free_lock_state = nfs41_free_lock_state,
7045         .reboot_recovery_ops = &nfs41_reboot_recovery_ops,
7046         .nograce_recovery_ops = &nfs41_nograce_recovery_ops,
7047         .state_renewal_ops = &nfs41_state_renewal_ops,
7048 };
7049 #endif
7050
7051 const struct nfs4_minor_version_ops *nfs_v4_minor_ops[] = {
7052         [0] = &nfs_v4_0_minor_ops,
7053 #if defined(CONFIG_NFS_V4_1)
7054         [1] = &nfs_v4_1_minor_ops,
7055 #endif
7056 };
7057
7058 const struct inode_operations nfs4_dir_inode_operations = {
7059         .create         = nfs_create,
7060         .lookup         = nfs_lookup,
7061         .atomic_open    = nfs_atomic_open,
7062         .link           = nfs_link,
7063         .unlink         = nfs_unlink,
7064         .symlink        = nfs_symlink,
7065         .mkdir          = nfs_mkdir,
7066         .rmdir          = nfs_rmdir,
7067         .mknod          = nfs_mknod,
7068         .rename         = nfs_rename,
7069         .permission     = nfs_permission,
7070         .getattr        = nfs_getattr,
7071         .setattr        = nfs_setattr,
7072         .getxattr       = generic_getxattr,
7073         .setxattr       = generic_setxattr,
7074         .listxattr      = generic_listxattr,
7075         .removexattr    = generic_removexattr,
7076 };
7077
7078 static const struct inode_operations nfs4_file_inode_operations = {
7079         .permission     = nfs_permission,
7080         .getattr        = nfs_getattr,
7081         .setattr        = nfs_setattr,
7082         .getxattr       = generic_getxattr,
7083         .setxattr       = generic_setxattr,
7084         .listxattr      = generic_listxattr,
7085         .removexattr    = generic_removexattr,
7086 };
7087
7088 const struct nfs_rpc_ops nfs_v4_clientops = {
7089         .version        = 4,                    /* protocol version */
7090         .dentry_ops     = &nfs4_dentry_operations,
7091         .dir_inode_ops  = &nfs4_dir_inode_operations,
7092         .file_inode_ops = &nfs4_file_inode_operations,
7093         .file_ops       = &nfs4_file_operations,
7094         .getroot        = nfs4_proc_get_root,
7095         .submount       = nfs4_submount,
7096         .try_mount      = nfs4_try_mount,
7097         .getattr        = nfs4_proc_getattr,
7098         .setattr        = nfs4_proc_setattr,
7099         .lookup         = nfs4_proc_lookup,
7100         .access         = nfs4_proc_access,
7101         .readlink       = nfs4_proc_readlink,
7102         .create         = nfs4_proc_create,
7103         .remove         = nfs4_proc_remove,
7104         .unlink_setup   = nfs4_proc_unlink_setup,
7105         .unlink_rpc_prepare = nfs4_proc_unlink_rpc_prepare,
7106         .unlink_done    = nfs4_proc_unlink_done,
7107         .rename         = nfs4_proc_rename,
7108         .rename_setup   = nfs4_proc_rename_setup,
7109         .rename_rpc_prepare = nfs4_proc_rename_rpc_prepare,
7110         .rename_done    = nfs4_proc_rename_done,
7111         .link           = nfs4_proc_link,
7112         .symlink        = nfs4_proc_symlink,
7113         .mkdir          = nfs4_proc_mkdir,
7114         .rmdir          = nfs4_proc_remove,
7115         .readdir        = nfs4_proc_readdir,
7116         .mknod          = nfs4_proc_mknod,
7117         .statfs         = nfs4_proc_statfs,
7118         .fsinfo         = nfs4_proc_fsinfo,
7119         .pathconf       = nfs4_proc_pathconf,
7120         .set_capabilities = nfs4_server_capabilities,
7121         .decode_dirent  = nfs4_decode_dirent,
7122         .read_setup     = nfs4_proc_read_setup,
7123         .read_pageio_init = pnfs_pageio_init_read,
7124         .read_rpc_prepare = nfs4_proc_read_rpc_prepare,
7125         .read_done      = nfs4_read_done,
7126         .write_setup    = nfs4_proc_write_setup,
7127         .write_pageio_init = pnfs_pageio_init_write,
7128         .write_rpc_prepare = nfs4_proc_write_rpc_prepare,
7129         .write_done     = nfs4_write_done,
7130         .commit_setup   = nfs4_proc_commit_setup,
7131         .commit_rpc_prepare = nfs4_proc_commit_rpc_prepare,
7132         .commit_done    = nfs4_commit_done,
7133         .lock           = nfs4_proc_lock,
7134         .clear_acl_cache = nfs4_zap_acl_attr,
7135         .close_context  = nfs4_close_context,
7136         .open_context   = nfs4_atomic_open,
7137         .have_delegation = nfs4_have_delegation,
7138         .return_delegation = nfs4_inode_return_delegation,
7139         .alloc_client   = nfs4_alloc_client,
7140         .init_client    = nfs4_init_client,
7141         .free_client    = nfs4_free_client,
7142         .create_server  = nfs4_create_server,
7143         .clone_server   = nfs_clone_server,
7144 };
7145
7146 static const struct xattr_handler nfs4_xattr_nfs4_acl_handler = {
7147         .prefix = XATTR_NAME_NFSV4_ACL,
7148         .list   = nfs4_xattr_list_nfs4_acl,
7149         .get    = nfs4_xattr_get_nfs4_acl,
7150         .set    = nfs4_xattr_set_nfs4_acl,
7151 };
7152
7153 const struct xattr_handler *nfs4_xattr_handlers[] = {
7154         &nfs4_xattr_nfs4_acl_handler,
7155         NULL
7156 };
7157
7158 /*
7159  * Local variables:
7160  *  c-basic-offset: 8
7161  * End:
7162  */