NFSv4.1: Fix session initialisation races
[platform/adaptation/renesas_rcar/renesas_kernel.git] / fs / nfs / nfs4proc.c
1 /*
2  *  fs/nfs/nfs4proc.c
3  *
4  *  Client-side procedure declarations for NFSv4.
5  *
6  *  Copyright (c) 2002 The Regents of the University of Michigan.
7  *  All rights reserved.
8  *
9  *  Kendrick Smith <kmsmith@umich.edu>
10  *  Andy Adamson   <andros@umich.edu>
11  *
12  *  Redistribution and use in source and binary forms, with or without
13  *  modification, are permitted provided that the following conditions
14  *  are met:
15  *
16  *  1. Redistributions of source code must retain the above copyright
17  *     notice, this list of conditions and the following disclaimer.
18  *  2. Redistributions in binary form must reproduce the above copyright
19  *     notice, this list of conditions and the following disclaimer in the
20  *     documentation and/or other materials provided with the distribution.
21  *  3. Neither the name of the University nor the names of its
22  *     contributors may be used to endorse or promote products derived
23  *     from this software without specific prior written permission.
24  *
25  *  THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED
26  *  WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
27  *  MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
28  *  DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
29  *  FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
30  *  CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
31  *  SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
32  *  BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
33  *  LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
34  *  NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
35  *  SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
36  */
37
38 #include <linux/mm.h>
39 #include <linux/delay.h>
40 #include <linux/errno.h>
41 #include <linux/string.h>
42 #include <linux/ratelimit.h>
43 #include <linux/printk.h>
44 #include <linux/slab.h>
45 #include <linux/sunrpc/clnt.h>
46 #include <linux/sunrpc/gss_api.h>
47 #include <linux/nfs.h>
48 #include <linux/nfs4.h>
49 #include <linux/nfs_fs.h>
50 #include <linux/nfs_page.h>
51 #include <linux/nfs_mount.h>
52 #include <linux/namei.h>
53 #include <linux/mount.h>
54 #include <linux/module.h>
55 #include <linux/nfs_idmap.h>
56 #include <linux/sunrpc/bc_xprt.h>
57 #include <linux/xattr.h>
58 #include <linux/utsname.h>
59 #include <linux/freezer.h>
60
61 #include "nfs4_fs.h"
62 #include "delegation.h"
63 #include "internal.h"
64 #include "iostat.h"
65 #include "callback.h"
66 #include "pnfs.h"
67 #include "netns.h"
68
69 #define NFSDBG_FACILITY         NFSDBG_PROC
70
71 #define NFS4_POLL_RETRY_MIN     (HZ/10)
72 #define NFS4_POLL_RETRY_MAX     (15*HZ)
73
74 #define NFS4_MAX_LOOP_ON_RECOVER (10)
75
76 static unsigned short max_session_slots = NFS4_DEF_SLOT_TABLE_SIZE;
77
78 struct nfs4_opendata;
79 static int _nfs4_proc_open(struct nfs4_opendata *data);
80 static int _nfs4_recover_proc_open(struct nfs4_opendata *data);
81 static int nfs4_do_fsinfo(struct nfs_server *, struct nfs_fh *, struct nfs_fsinfo *);
82 static int nfs4_async_handle_error(struct rpc_task *, const struct nfs_server *, struct nfs4_state *);
83 static void nfs_fixup_referral_attributes(struct nfs_fattr *fattr);
84 static int nfs4_proc_getattr(struct nfs_server *, struct nfs_fh *, struct nfs_fattr *);
85 static int _nfs4_proc_getattr(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fattr *fattr);
86 static int nfs4_do_setattr(struct inode *inode, struct rpc_cred *cred,
87                             struct nfs_fattr *fattr, struct iattr *sattr,
88                             struct nfs4_state *state);
89 #ifdef CONFIG_NFS_V4_1
90 static int nfs41_test_stateid(struct nfs_server *, nfs4_stateid *);
91 static int nfs41_free_stateid(struct nfs_server *, nfs4_stateid *);
92 #endif
93 /* Prevent leaks of NFSv4 errors into userland */
94 static int nfs4_map_errors(int err)
95 {
96         if (err >= -1000)
97                 return err;
98         switch (err) {
99         case -NFS4ERR_RESOURCE:
100                 return -EREMOTEIO;
101         case -NFS4ERR_WRONGSEC:
102                 return -EPERM;
103         case -NFS4ERR_BADOWNER:
104         case -NFS4ERR_BADNAME:
105                 return -EINVAL;
106         default:
107                 dprintk("%s could not handle NFSv4 error %d\n",
108                                 __func__, -err);
109                 break;
110         }
111         return -EIO;
112 }
113
114 /*
115  * This is our standard bitmap for GETATTR requests.
116  */
117 const u32 nfs4_fattr_bitmap[2] = {
118         FATTR4_WORD0_TYPE
119         | FATTR4_WORD0_CHANGE
120         | FATTR4_WORD0_SIZE
121         | FATTR4_WORD0_FSID
122         | FATTR4_WORD0_FILEID,
123         FATTR4_WORD1_MODE
124         | FATTR4_WORD1_NUMLINKS
125         | FATTR4_WORD1_OWNER
126         | FATTR4_WORD1_OWNER_GROUP
127         | FATTR4_WORD1_RAWDEV
128         | FATTR4_WORD1_SPACE_USED
129         | FATTR4_WORD1_TIME_ACCESS
130         | FATTR4_WORD1_TIME_METADATA
131         | FATTR4_WORD1_TIME_MODIFY
132 };
133
134 const u32 nfs4_statfs_bitmap[2] = {
135         FATTR4_WORD0_FILES_AVAIL
136         | FATTR4_WORD0_FILES_FREE
137         | FATTR4_WORD0_FILES_TOTAL,
138         FATTR4_WORD1_SPACE_AVAIL
139         | FATTR4_WORD1_SPACE_FREE
140         | FATTR4_WORD1_SPACE_TOTAL
141 };
142
143 const u32 nfs4_pathconf_bitmap[2] = {
144         FATTR4_WORD0_MAXLINK
145         | FATTR4_WORD0_MAXNAME,
146         0
147 };
148
149 const u32 nfs4_fsinfo_bitmap[3] = { FATTR4_WORD0_MAXFILESIZE
150                         | FATTR4_WORD0_MAXREAD
151                         | FATTR4_WORD0_MAXWRITE
152                         | FATTR4_WORD0_LEASE_TIME,
153                         FATTR4_WORD1_TIME_DELTA
154                         | FATTR4_WORD1_FS_LAYOUT_TYPES,
155                         FATTR4_WORD2_LAYOUT_BLKSIZE
156 };
157
158 const u32 nfs4_fs_locations_bitmap[2] = {
159         FATTR4_WORD0_TYPE
160         | FATTR4_WORD0_CHANGE
161         | FATTR4_WORD0_SIZE
162         | FATTR4_WORD0_FSID
163         | FATTR4_WORD0_FILEID
164         | FATTR4_WORD0_FS_LOCATIONS,
165         FATTR4_WORD1_MODE
166         | FATTR4_WORD1_NUMLINKS
167         | FATTR4_WORD1_OWNER
168         | FATTR4_WORD1_OWNER_GROUP
169         | FATTR4_WORD1_RAWDEV
170         | FATTR4_WORD1_SPACE_USED
171         | FATTR4_WORD1_TIME_ACCESS
172         | FATTR4_WORD1_TIME_METADATA
173         | FATTR4_WORD1_TIME_MODIFY
174         | FATTR4_WORD1_MOUNTED_ON_FILEID
175 };
176
177 static void nfs4_setup_readdir(u64 cookie, __be32 *verifier, struct dentry *dentry,
178                 struct nfs4_readdir_arg *readdir)
179 {
180         __be32 *start, *p;
181
182         BUG_ON(readdir->count < 80);
183         if (cookie > 2) {
184                 readdir->cookie = cookie;
185                 memcpy(&readdir->verifier, verifier, sizeof(readdir->verifier));
186                 return;
187         }
188
189         readdir->cookie = 0;
190         memset(&readdir->verifier, 0, sizeof(readdir->verifier));
191         if (cookie == 2)
192                 return;
193         
194         /*
195          * NFSv4 servers do not return entries for '.' and '..'
196          * Therefore, we fake these entries here.  We let '.'
197          * have cookie 0 and '..' have cookie 1.  Note that
198          * when talking to the server, we always send cookie 0
199          * instead of 1 or 2.
200          */
201         start = p = kmap_atomic(*readdir->pages);
202         
203         if (cookie == 0) {
204                 *p++ = xdr_one;                                  /* next */
205                 *p++ = xdr_zero;                   /* cookie, first word */
206                 *p++ = xdr_one;                   /* cookie, second word */
207                 *p++ = xdr_one;                             /* entry len */
208                 memcpy(p, ".\0\0\0", 4);                        /* entry */
209                 p++;
210                 *p++ = xdr_one;                         /* bitmap length */
211                 *p++ = htonl(FATTR4_WORD0_FILEID);             /* bitmap */
212                 *p++ = htonl(8);              /* attribute buffer length */
213                 p = xdr_encode_hyper(p, NFS_FILEID(dentry->d_inode));
214         }
215         
216         *p++ = xdr_one;                                  /* next */
217         *p++ = xdr_zero;                   /* cookie, first word */
218         *p++ = xdr_two;                   /* cookie, second word */
219         *p++ = xdr_two;                             /* entry len */
220         memcpy(p, "..\0\0", 4);                         /* entry */
221         p++;
222         *p++ = xdr_one;                         /* bitmap length */
223         *p++ = htonl(FATTR4_WORD0_FILEID);             /* bitmap */
224         *p++ = htonl(8);              /* attribute buffer length */
225         p = xdr_encode_hyper(p, NFS_FILEID(dentry->d_parent->d_inode));
226
227         readdir->pgbase = (char *)p - (char *)start;
228         readdir->count -= readdir->pgbase;
229         kunmap_atomic(start);
230 }
231
232 static int nfs4_wait_clnt_recover(struct nfs_client *clp)
233 {
234         int res;
235
236         might_sleep();
237
238         res = wait_on_bit(&clp->cl_state, NFS4CLNT_MANAGER_RUNNING,
239                         nfs_wait_bit_killable, TASK_KILLABLE);
240         return res;
241 }
242
243 static int nfs4_delay(struct rpc_clnt *clnt, long *timeout)
244 {
245         int res = 0;
246
247         might_sleep();
248
249         if (*timeout <= 0)
250                 *timeout = NFS4_POLL_RETRY_MIN;
251         if (*timeout > NFS4_POLL_RETRY_MAX)
252                 *timeout = NFS4_POLL_RETRY_MAX;
253         freezable_schedule_timeout_killable(*timeout);
254         if (fatal_signal_pending(current))
255                 res = -ERESTARTSYS;
256         *timeout <<= 1;
257         return res;
258 }
259
260 /* This is the error handling routine for processes that are allowed
261  * to sleep.
262  */
263 static int nfs4_handle_exception(struct nfs_server *server, int errorcode, struct nfs4_exception *exception)
264 {
265         struct nfs_client *clp = server->nfs_client;
266         struct nfs4_state *state = exception->state;
267         struct inode *inode = exception->inode;
268         int ret = errorcode;
269
270         exception->retry = 0;
271         switch(errorcode) {
272                 case 0:
273                         return 0;
274                 case -NFS4ERR_OPENMODE:
275                         if (inode && nfs_have_delegation(inode, FMODE_READ)) {
276                                 nfs_inode_return_delegation(inode);
277                                 exception->retry = 1;
278                                 return 0;
279                         }
280                         if (state == NULL)
281                                 break;
282                         nfs4_schedule_stateid_recovery(server, state);
283                         goto wait_on_recovery;
284                 case -NFS4ERR_DELEG_REVOKED:
285                 case -NFS4ERR_ADMIN_REVOKED:
286                 case -NFS4ERR_BAD_STATEID:
287                         if (state == NULL)
288                                 break;
289                         nfs_remove_bad_delegation(state->inode);
290                         nfs4_schedule_stateid_recovery(server, state);
291                         goto wait_on_recovery;
292                 case -NFS4ERR_EXPIRED:
293                         if (state != NULL)
294                                 nfs4_schedule_stateid_recovery(server, state);
295                 case -NFS4ERR_STALE_STATEID:
296                 case -NFS4ERR_STALE_CLIENTID:
297                         nfs4_schedule_lease_recovery(clp);
298                         goto wait_on_recovery;
299 #if defined(CONFIG_NFS_V4_1)
300                 case -NFS4ERR_BADSESSION:
301                 case -NFS4ERR_BADSLOT:
302                 case -NFS4ERR_BAD_HIGH_SLOT:
303                 case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION:
304                 case -NFS4ERR_DEADSESSION:
305                 case -NFS4ERR_SEQ_FALSE_RETRY:
306                 case -NFS4ERR_SEQ_MISORDERED:
307                         dprintk("%s ERROR: %d Reset session\n", __func__,
308                                 errorcode);
309                         nfs4_schedule_session_recovery(clp->cl_session);
310                         exception->retry = 1;
311                         break;
312 #endif /* defined(CONFIG_NFS_V4_1) */
313                 case -NFS4ERR_FILE_OPEN:
314                         if (exception->timeout > HZ) {
315                                 /* We have retried a decent amount, time to
316                                  * fail
317                                  */
318                                 ret = -EBUSY;
319                                 break;
320                         }
321                 case -NFS4ERR_GRACE:
322                 case -NFS4ERR_DELAY:
323                 case -EKEYEXPIRED:
324                         ret = nfs4_delay(server->client, &exception->timeout);
325                         if (ret != 0)
326                                 break;
327                 case -NFS4ERR_RETRY_UNCACHED_REP:
328                 case -NFS4ERR_OLD_STATEID:
329                         exception->retry = 1;
330                         break;
331                 case -NFS4ERR_BADOWNER:
332                         /* The following works around a Linux server bug! */
333                 case -NFS4ERR_BADNAME:
334                         if (server->caps & NFS_CAP_UIDGID_NOMAP) {
335                                 server->caps &= ~NFS_CAP_UIDGID_NOMAP;
336                                 exception->retry = 1;
337                                 printk(KERN_WARNING "NFS: v4 server %s "
338                                                 "does not accept raw "
339                                                 "uid/gids. "
340                                                 "Reenabling the idmapper.\n",
341                                                 server->nfs_client->cl_hostname);
342                         }
343         }
344         /* We failed to handle the error */
345         return nfs4_map_errors(ret);
346 wait_on_recovery:
347         ret = nfs4_wait_clnt_recover(clp);
348         if (ret == 0)
349                 exception->retry = 1;
350         return ret;
351 }
352
353
354 static void do_renew_lease(struct nfs_client *clp, unsigned long timestamp)
355 {
356         spin_lock(&clp->cl_lock);
357         if (time_before(clp->cl_last_renewal,timestamp))
358                 clp->cl_last_renewal = timestamp;
359         spin_unlock(&clp->cl_lock);
360 }
361
362 static void renew_lease(const struct nfs_server *server, unsigned long timestamp)
363 {
364         do_renew_lease(server->nfs_client, timestamp);
365 }
366
367 #if defined(CONFIG_NFS_V4_1)
368
369 /*
370  * nfs4_free_slot - free a slot and efficiently update slot table.
371  *
372  * freeing a slot is trivially done by clearing its respective bit
373  * in the bitmap.
374  * If the freed slotid equals highest_used_slotid we want to update it
375  * so that the server would be able to size down the slot table if needed,
376  * otherwise we know that the highest_used_slotid is still in use.
377  * When updating highest_used_slotid there may be "holes" in the bitmap
378  * so we need to scan down from highest_used_slotid to 0 looking for the now
379  * highest slotid in use.
380  * If none found, highest_used_slotid is set to NFS4_NO_SLOT.
381  *
382  * Must be called while holding tbl->slot_tbl_lock
383  */
384 static void
385 nfs4_free_slot(struct nfs4_slot_table *tbl, u32 slotid)
386 {
387         BUG_ON(slotid >= NFS4_MAX_SLOT_TABLE);
388         /* clear used bit in bitmap */
389         __clear_bit(slotid, tbl->used_slots);
390
391         /* update highest_used_slotid when it is freed */
392         if (slotid == tbl->highest_used_slotid) {
393                 slotid = find_last_bit(tbl->used_slots, tbl->max_slots);
394                 if (slotid < tbl->max_slots)
395                         tbl->highest_used_slotid = slotid;
396                 else
397                         tbl->highest_used_slotid = NFS4_NO_SLOT;
398         }
399         dprintk("%s: slotid %u highest_used_slotid %d\n", __func__,
400                 slotid, tbl->highest_used_slotid);
401 }
402
403 bool nfs4_set_task_privileged(struct rpc_task *task, void *dummy)
404 {
405         rpc_task_set_priority(task, RPC_PRIORITY_PRIVILEGED);
406         return true;
407 }
408
409 /*
410  * Signal state manager thread if session fore channel is drained
411  */
412 static void nfs4_check_drain_fc_complete(struct nfs4_session *ses)
413 {
414         if (!test_bit(NFS4_SESSION_DRAINING, &ses->session_state)) {
415                 rpc_wake_up_first(&ses->fc_slot_table.slot_tbl_waitq,
416                                 nfs4_set_task_privileged, NULL);
417                 return;
418         }
419
420         if (ses->fc_slot_table.highest_used_slotid != NFS4_NO_SLOT)
421                 return;
422
423         dprintk("%s COMPLETE: Session Fore Channel Drained\n", __func__);
424         complete(&ses->fc_slot_table.complete);
425 }
426
427 /*
428  * Signal state manager thread if session back channel is drained
429  */
430 void nfs4_check_drain_bc_complete(struct nfs4_session *ses)
431 {
432         if (!test_bit(NFS4_SESSION_DRAINING, &ses->session_state) ||
433             ses->bc_slot_table.highest_used_slotid != NFS4_NO_SLOT)
434                 return;
435         dprintk("%s COMPLETE: Session Back Channel Drained\n", __func__);
436         complete(&ses->bc_slot_table.complete);
437 }
438
439 static void nfs41_sequence_free_slot(struct nfs4_sequence_res *res)
440 {
441         struct nfs4_slot_table *tbl;
442
443         tbl = &res->sr_session->fc_slot_table;
444         if (!res->sr_slot) {
445                 /* just wake up the next guy waiting since
446                  * we may have not consumed a slot after all */
447                 dprintk("%s: No slot\n", __func__);
448                 return;
449         }
450
451         spin_lock(&tbl->slot_tbl_lock);
452         nfs4_free_slot(tbl, res->sr_slot - tbl->slots);
453         nfs4_check_drain_fc_complete(res->sr_session);
454         spin_unlock(&tbl->slot_tbl_lock);
455         res->sr_slot = NULL;
456 }
457
458 static int nfs41_sequence_done(struct rpc_task *task, struct nfs4_sequence_res *res)
459 {
460         unsigned long timestamp;
461         struct nfs_client *clp;
462
463         /*
464          * sr_status remains 1 if an RPC level error occurred. The server
465          * may or may not have processed the sequence operation..
466          * Proceed as if the server received and processed the sequence
467          * operation.
468          */
469         if (res->sr_status == 1)
470                 res->sr_status = NFS_OK;
471
472         /* don't increment the sequence number if the task wasn't sent */
473         if (!RPC_WAS_SENT(task))
474                 goto out;
475
476         /* Check the SEQUENCE operation status */
477         switch (res->sr_status) {
478         case 0:
479                 /* Update the slot's sequence and clientid lease timer */
480                 ++res->sr_slot->seq_nr;
481                 timestamp = res->sr_renewal_time;
482                 clp = res->sr_session->clp;
483                 do_renew_lease(clp, timestamp);
484                 /* Check sequence flags */
485                 if (res->sr_status_flags != 0)
486                         nfs4_schedule_lease_recovery(clp);
487                 break;
488         case -NFS4ERR_DELAY:
489                 /* The server detected a resend of the RPC call and
490                  * returned NFS4ERR_DELAY as per Section 2.10.6.2
491                  * of RFC5661.
492                  */
493                 dprintk("%s: slot=%td seq=%d: Operation in progress\n",
494                         __func__,
495                         res->sr_slot - res->sr_session->fc_slot_table.slots,
496                         res->sr_slot->seq_nr);
497                 goto out_retry;
498         default:
499                 /* Just update the slot sequence no. */
500                 ++res->sr_slot->seq_nr;
501         }
502 out:
503         /* The session may be reset by one of the error handlers. */
504         dprintk("%s: Error %d free the slot \n", __func__, res->sr_status);
505         nfs41_sequence_free_slot(res);
506         return 1;
507 out_retry:
508         if (!rpc_restart_call(task))
509                 goto out;
510         rpc_delay(task, NFS4_POLL_RETRY_MAX);
511         return 0;
512 }
513
514 static int nfs4_sequence_done(struct rpc_task *task,
515                                struct nfs4_sequence_res *res)
516 {
517         if (res->sr_session == NULL)
518                 return 1;
519         return nfs41_sequence_done(task, res);
520 }
521
522 /*
523  * nfs4_find_slot - efficiently look for a free slot
524  *
525  * nfs4_find_slot looks for an unset bit in the used_slots bitmap.
526  * If found, we mark the slot as used, update the highest_used_slotid,
527  * and respectively set up the sequence operation args.
528  * The slot number is returned if found, or NFS4_NO_SLOT otherwise.
529  *
530  * Note: must be called with under the slot_tbl_lock.
531  */
532 static u32
533 nfs4_find_slot(struct nfs4_slot_table *tbl)
534 {
535         u32 slotid;
536         u32 ret_id = NFS4_NO_SLOT;
537
538         dprintk("--> %s used_slots=%04lx highest_used=%u max_slots=%u\n",
539                 __func__, tbl->used_slots[0], tbl->highest_used_slotid,
540                 tbl->max_slots);
541         slotid = find_first_zero_bit(tbl->used_slots, tbl->max_slots);
542         if (slotid >= tbl->max_slots)
543                 goto out;
544         __set_bit(slotid, tbl->used_slots);
545         if (slotid > tbl->highest_used_slotid ||
546                         tbl->highest_used_slotid == NFS4_NO_SLOT)
547                 tbl->highest_used_slotid = slotid;
548         ret_id = slotid;
549 out:
550         dprintk("<-- %s used_slots=%04lx highest_used=%d slotid=%d \n",
551                 __func__, tbl->used_slots[0], tbl->highest_used_slotid, ret_id);
552         return ret_id;
553 }
554
555 static void nfs41_init_sequence(struct nfs4_sequence_args *args,
556                 struct nfs4_sequence_res *res, int cache_reply)
557 {
558         args->sa_session = NULL;
559         args->sa_cache_this = 0;
560         if (cache_reply)
561                 args->sa_cache_this = 1;
562         res->sr_session = NULL;
563         res->sr_slot = NULL;
564 }
565
566 int nfs41_setup_sequence(struct nfs4_session *session,
567                                 struct nfs4_sequence_args *args,
568                                 struct nfs4_sequence_res *res,
569                                 struct rpc_task *task)
570 {
571         struct nfs4_slot *slot;
572         struct nfs4_slot_table *tbl;
573         u32 slotid;
574
575         dprintk("--> %s\n", __func__);
576         /* slot already allocated? */
577         if (res->sr_slot != NULL)
578                 return 0;
579
580         tbl = &session->fc_slot_table;
581
582         spin_lock(&tbl->slot_tbl_lock);
583         if (test_bit(NFS4_SESSION_DRAINING, &session->session_state) &&
584             !rpc_task_has_priority(task, RPC_PRIORITY_PRIVILEGED)) {
585                 /* The state manager will wait until the slot table is empty */
586                 rpc_sleep_on(&tbl->slot_tbl_waitq, task, NULL);
587                 spin_unlock(&tbl->slot_tbl_lock);
588                 dprintk("%s session is draining\n", __func__);
589                 return -EAGAIN;
590         }
591
592         if (!rpc_queue_empty(&tbl->slot_tbl_waitq) &&
593             !rpc_task_has_priority(task, RPC_PRIORITY_PRIVILEGED)) {
594                 rpc_sleep_on(&tbl->slot_tbl_waitq, task, NULL);
595                 spin_unlock(&tbl->slot_tbl_lock);
596                 dprintk("%s enforce FIFO order\n", __func__);
597                 return -EAGAIN;
598         }
599
600         slotid = nfs4_find_slot(tbl);
601         if (slotid == NFS4_NO_SLOT) {
602                 rpc_sleep_on(&tbl->slot_tbl_waitq, task, NULL);
603                 spin_unlock(&tbl->slot_tbl_lock);
604                 dprintk("<-- %s: no free slots\n", __func__);
605                 return -EAGAIN;
606         }
607         spin_unlock(&tbl->slot_tbl_lock);
608
609         rpc_task_set_priority(task, RPC_PRIORITY_NORMAL);
610         slot = tbl->slots + slotid;
611         args->sa_session = session;
612         args->sa_slotid = slotid;
613
614         dprintk("<-- %s slotid=%d seqid=%d\n", __func__, slotid, slot->seq_nr);
615
616         res->sr_session = session;
617         res->sr_slot = slot;
618         res->sr_renewal_time = jiffies;
619         res->sr_status_flags = 0;
620         /*
621          * sr_status is only set in decode_sequence, and so will remain
622          * set to 1 if an rpc level failure occurs.
623          */
624         res->sr_status = 1;
625         return 0;
626 }
627 EXPORT_SYMBOL_GPL(nfs41_setup_sequence);
628
629 int nfs4_setup_sequence(const struct nfs_server *server,
630                         struct nfs4_sequence_args *args,
631                         struct nfs4_sequence_res *res,
632                         struct rpc_task *task)
633 {
634         struct nfs4_session *session = nfs4_get_session(server);
635         int ret = 0;
636
637         if (session == NULL)
638                 goto out;
639
640         dprintk("--> %s clp %p session %p sr_slot %td\n",
641                 __func__, session->clp, session, res->sr_slot ?
642                         res->sr_slot - session->fc_slot_table.slots : -1);
643
644         ret = nfs41_setup_sequence(session, args, res, task);
645 out:
646         dprintk("<-- %s status=%d\n", __func__, ret);
647         return ret;
648 }
649
650 struct nfs41_call_sync_data {
651         const struct nfs_server *seq_server;
652         struct nfs4_sequence_args *seq_args;
653         struct nfs4_sequence_res *seq_res;
654 };
655
656 static void nfs41_call_sync_prepare(struct rpc_task *task, void *calldata)
657 {
658         struct nfs41_call_sync_data *data = calldata;
659
660         dprintk("--> %s data->seq_server %p\n", __func__, data->seq_server);
661
662         if (nfs4_setup_sequence(data->seq_server, data->seq_args,
663                                 data->seq_res, task))
664                 return;
665         rpc_call_start(task);
666 }
667
668 static void nfs41_call_priv_sync_prepare(struct rpc_task *task, void *calldata)
669 {
670         rpc_task_set_priority(task, RPC_PRIORITY_PRIVILEGED);
671         nfs41_call_sync_prepare(task, calldata);
672 }
673
674 static void nfs41_call_sync_done(struct rpc_task *task, void *calldata)
675 {
676         struct nfs41_call_sync_data *data = calldata;
677
678         nfs41_sequence_done(task, data->seq_res);
679 }
680
681 static const struct rpc_call_ops nfs41_call_sync_ops = {
682         .rpc_call_prepare = nfs41_call_sync_prepare,
683         .rpc_call_done = nfs41_call_sync_done,
684 };
685
686 static const struct rpc_call_ops nfs41_call_priv_sync_ops = {
687         .rpc_call_prepare = nfs41_call_priv_sync_prepare,
688         .rpc_call_done = nfs41_call_sync_done,
689 };
690
691 static int nfs4_call_sync_sequence(struct rpc_clnt *clnt,
692                                    struct nfs_server *server,
693                                    struct rpc_message *msg,
694                                    struct nfs4_sequence_args *args,
695                                    struct nfs4_sequence_res *res,
696                                    int privileged)
697 {
698         int ret;
699         struct rpc_task *task;
700         struct nfs41_call_sync_data data = {
701                 .seq_server = server,
702                 .seq_args = args,
703                 .seq_res = res,
704         };
705         struct rpc_task_setup task_setup = {
706                 .rpc_client = clnt,
707                 .rpc_message = msg,
708                 .callback_ops = &nfs41_call_sync_ops,
709                 .callback_data = &data
710         };
711
712         if (privileged)
713                 task_setup.callback_ops = &nfs41_call_priv_sync_ops;
714         task = rpc_run_task(&task_setup);
715         if (IS_ERR(task))
716                 ret = PTR_ERR(task);
717         else {
718                 ret = task->tk_status;
719                 rpc_put_task(task);
720         }
721         return ret;
722 }
723
724 int _nfs4_call_sync_session(struct rpc_clnt *clnt,
725                             struct nfs_server *server,
726                             struct rpc_message *msg,
727                             struct nfs4_sequence_args *args,
728                             struct nfs4_sequence_res *res,
729                             int cache_reply)
730 {
731         nfs41_init_sequence(args, res, cache_reply);
732         return nfs4_call_sync_sequence(clnt, server, msg, args, res, 0);
733 }
734
735 #else
736 static inline
737 void nfs41_init_sequence(struct nfs4_sequence_args *args,
738                 struct nfs4_sequence_res *res, int cache_reply)
739 {
740 }
741
742 static int nfs4_sequence_done(struct rpc_task *task,
743                                struct nfs4_sequence_res *res)
744 {
745         return 1;
746 }
747 #endif /* CONFIG_NFS_V4_1 */
748
749 int _nfs4_call_sync(struct rpc_clnt *clnt,
750                     struct nfs_server *server,
751                     struct rpc_message *msg,
752                     struct nfs4_sequence_args *args,
753                     struct nfs4_sequence_res *res,
754                     int cache_reply)
755 {
756         nfs41_init_sequence(args, res, cache_reply);
757         return rpc_call_sync(clnt, msg, 0);
758 }
759
760 static inline
761 int nfs4_call_sync(struct rpc_clnt *clnt,
762                    struct nfs_server *server,
763                    struct rpc_message *msg,
764                    struct nfs4_sequence_args *args,
765                    struct nfs4_sequence_res *res,
766                    int cache_reply)
767 {
768         return server->nfs_client->cl_mvops->call_sync(clnt, server, msg,
769                                                 args, res, cache_reply);
770 }
771
772 static void update_changeattr(struct inode *dir, struct nfs4_change_info *cinfo)
773 {
774         struct nfs_inode *nfsi = NFS_I(dir);
775
776         spin_lock(&dir->i_lock);
777         nfsi->cache_validity |= NFS_INO_INVALID_ATTR|NFS_INO_REVAL_PAGECACHE|NFS_INO_INVALID_DATA;
778         if (!cinfo->atomic || cinfo->before != dir->i_version)
779                 nfs_force_lookup_revalidate(dir);
780         dir->i_version = cinfo->after;
781         spin_unlock(&dir->i_lock);
782 }
783
784 struct nfs4_opendata {
785         struct kref kref;
786         struct nfs_openargs o_arg;
787         struct nfs_openres o_res;
788         struct nfs_open_confirmargs c_arg;
789         struct nfs_open_confirmres c_res;
790         struct nfs4_string owner_name;
791         struct nfs4_string group_name;
792         struct nfs_fattr f_attr;
793         struct dentry *dir;
794         struct dentry *dentry;
795         struct nfs4_state_owner *owner;
796         struct nfs4_state *state;
797         struct iattr attrs;
798         unsigned long timestamp;
799         unsigned int rpc_done : 1;
800         int rpc_status;
801         int cancelled;
802 };
803
804
805 static void nfs4_init_opendata_res(struct nfs4_opendata *p)
806 {
807         p->o_res.f_attr = &p->f_attr;
808         p->o_res.seqid = p->o_arg.seqid;
809         p->c_res.seqid = p->c_arg.seqid;
810         p->o_res.server = p->o_arg.server;
811         nfs_fattr_init(&p->f_attr);
812         nfs_fattr_init_names(&p->f_attr, &p->owner_name, &p->group_name);
813 }
814
815 static struct nfs4_opendata *nfs4_opendata_alloc(struct dentry *dentry,
816                 struct nfs4_state_owner *sp, fmode_t fmode, int flags,
817                 const struct iattr *attrs,
818                 gfp_t gfp_mask)
819 {
820         struct dentry *parent = dget_parent(dentry);
821         struct inode *dir = parent->d_inode;
822         struct nfs_server *server = NFS_SERVER(dir);
823         struct nfs4_opendata *p;
824
825         p = kzalloc(sizeof(*p), gfp_mask);
826         if (p == NULL)
827                 goto err;
828         p->o_arg.seqid = nfs_alloc_seqid(&sp->so_seqid, gfp_mask);
829         if (p->o_arg.seqid == NULL)
830                 goto err_free;
831         nfs_sb_active(dentry->d_sb);
832         p->dentry = dget(dentry);
833         p->dir = parent;
834         p->owner = sp;
835         atomic_inc(&sp->so_count);
836         p->o_arg.fh = NFS_FH(dir);
837         p->o_arg.open_flags = flags;
838         p->o_arg.fmode = fmode & (FMODE_READ|FMODE_WRITE);
839         p->o_arg.clientid = server->nfs_client->cl_clientid;
840         p->o_arg.id.create_time = ktime_to_ns(sp->so_seqid.create_time);
841         p->o_arg.id.uniquifier = sp->so_seqid.owner_id;
842         p->o_arg.name = &dentry->d_name;
843         p->o_arg.server = server;
844         p->o_arg.bitmask = server->attr_bitmask;
845         p->o_arg.claim = NFS4_OPEN_CLAIM_NULL;
846         if (attrs != NULL && attrs->ia_valid != 0) {
847                 __be32 verf[2];
848
849                 p->o_arg.u.attrs = &p->attrs;
850                 memcpy(&p->attrs, attrs, sizeof(p->attrs));
851
852                 verf[0] = jiffies;
853                 verf[1] = current->pid;
854                 memcpy(p->o_arg.u.verifier.data, verf,
855                                 sizeof(p->o_arg.u.verifier.data));
856         }
857         p->c_arg.fh = &p->o_res.fh;
858         p->c_arg.stateid = &p->o_res.stateid;
859         p->c_arg.seqid = p->o_arg.seqid;
860         nfs4_init_opendata_res(p);
861         kref_init(&p->kref);
862         return p;
863 err_free:
864         kfree(p);
865 err:
866         dput(parent);
867         return NULL;
868 }
869
870 static void nfs4_opendata_free(struct kref *kref)
871 {
872         struct nfs4_opendata *p = container_of(kref,
873                         struct nfs4_opendata, kref);
874         struct super_block *sb = p->dentry->d_sb;
875
876         nfs_free_seqid(p->o_arg.seqid);
877         if (p->state != NULL)
878                 nfs4_put_open_state(p->state);
879         nfs4_put_state_owner(p->owner);
880         dput(p->dir);
881         dput(p->dentry);
882         nfs_sb_deactive(sb);
883         nfs_fattr_free_names(&p->f_attr);
884         kfree(p);
885 }
886
887 static void nfs4_opendata_put(struct nfs4_opendata *p)
888 {
889         if (p != NULL)
890                 kref_put(&p->kref, nfs4_opendata_free);
891 }
892
893 static int nfs4_wait_for_completion_rpc_task(struct rpc_task *task)
894 {
895         int ret;
896
897         ret = rpc_wait_for_completion_task(task);
898         return ret;
899 }
900
901 static int can_open_cached(struct nfs4_state *state, fmode_t mode, int open_mode)
902 {
903         int ret = 0;
904
905         if (open_mode & (O_EXCL|O_TRUNC))
906                 goto out;
907         switch (mode & (FMODE_READ|FMODE_WRITE)) {
908                 case FMODE_READ:
909                         ret |= test_bit(NFS_O_RDONLY_STATE, &state->flags) != 0
910                                 && state->n_rdonly != 0;
911                         break;
912                 case FMODE_WRITE:
913                         ret |= test_bit(NFS_O_WRONLY_STATE, &state->flags) != 0
914                                 && state->n_wronly != 0;
915                         break;
916                 case FMODE_READ|FMODE_WRITE:
917                         ret |= test_bit(NFS_O_RDWR_STATE, &state->flags) != 0
918                                 && state->n_rdwr != 0;
919         }
920 out:
921         return ret;
922 }
923
924 static int can_open_delegated(struct nfs_delegation *delegation, fmode_t fmode)
925 {
926         if (delegation == NULL)
927                 return 0;
928         if ((delegation->type & fmode) != fmode)
929                 return 0;
930         if (test_bit(NFS_DELEGATION_NEED_RECLAIM, &delegation->flags))
931                 return 0;
932         nfs_mark_delegation_referenced(delegation);
933         return 1;
934 }
935
936 static void update_open_stateflags(struct nfs4_state *state, fmode_t fmode)
937 {
938         switch (fmode) {
939                 case FMODE_WRITE:
940                         state->n_wronly++;
941                         break;
942                 case FMODE_READ:
943                         state->n_rdonly++;
944                         break;
945                 case FMODE_READ|FMODE_WRITE:
946                         state->n_rdwr++;
947         }
948         nfs4_state_set_mode_locked(state, state->state | fmode);
949 }
950
951 static void nfs_set_open_stateid_locked(struct nfs4_state *state, nfs4_stateid *stateid, fmode_t fmode)
952 {
953         if (test_bit(NFS_DELEGATED_STATE, &state->flags) == 0)
954                 nfs4_stateid_copy(&state->stateid, stateid);
955         nfs4_stateid_copy(&state->open_stateid, stateid);
956         switch (fmode) {
957                 case FMODE_READ:
958                         set_bit(NFS_O_RDONLY_STATE, &state->flags);
959                         break;
960                 case FMODE_WRITE:
961                         set_bit(NFS_O_WRONLY_STATE, &state->flags);
962                         break;
963                 case FMODE_READ|FMODE_WRITE:
964                         set_bit(NFS_O_RDWR_STATE, &state->flags);
965         }
966 }
967
968 static void nfs_set_open_stateid(struct nfs4_state *state, nfs4_stateid *stateid, fmode_t fmode)
969 {
970         write_seqlock(&state->seqlock);
971         nfs_set_open_stateid_locked(state, stateid, fmode);
972         write_sequnlock(&state->seqlock);
973 }
974
975 static void __update_open_stateid(struct nfs4_state *state, nfs4_stateid *open_stateid, const nfs4_stateid *deleg_stateid, fmode_t fmode)
976 {
977         /*
978          * Protect the call to nfs4_state_set_mode_locked and
979          * serialise the stateid update
980          */
981         write_seqlock(&state->seqlock);
982         if (deleg_stateid != NULL) {
983                 nfs4_stateid_copy(&state->stateid, deleg_stateid);
984                 set_bit(NFS_DELEGATED_STATE, &state->flags);
985         }
986         if (open_stateid != NULL)
987                 nfs_set_open_stateid_locked(state, open_stateid, fmode);
988         write_sequnlock(&state->seqlock);
989         spin_lock(&state->owner->so_lock);
990         update_open_stateflags(state, fmode);
991         spin_unlock(&state->owner->so_lock);
992 }
993
994 static int update_open_stateid(struct nfs4_state *state, nfs4_stateid *open_stateid, nfs4_stateid *delegation, fmode_t fmode)
995 {
996         struct nfs_inode *nfsi = NFS_I(state->inode);
997         struct nfs_delegation *deleg_cur;
998         int ret = 0;
999
1000         fmode &= (FMODE_READ|FMODE_WRITE);
1001
1002         rcu_read_lock();
1003         deleg_cur = rcu_dereference(nfsi->delegation);
1004         if (deleg_cur == NULL)
1005                 goto no_delegation;
1006
1007         spin_lock(&deleg_cur->lock);
1008         if (nfsi->delegation != deleg_cur ||
1009             (deleg_cur->type & fmode) != fmode)
1010                 goto no_delegation_unlock;
1011
1012         if (delegation == NULL)
1013                 delegation = &deleg_cur->stateid;
1014         else if (!nfs4_stateid_match(&deleg_cur->stateid, delegation))
1015                 goto no_delegation_unlock;
1016
1017         nfs_mark_delegation_referenced(deleg_cur);
1018         __update_open_stateid(state, open_stateid, &deleg_cur->stateid, fmode);
1019         ret = 1;
1020 no_delegation_unlock:
1021         spin_unlock(&deleg_cur->lock);
1022 no_delegation:
1023         rcu_read_unlock();
1024
1025         if (!ret && open_stateid != NULL) {
1026                 __update_open_stateid(state, open_stateid, NULL, fmode);
1027                 ret = 1;
1028         }
1029
1030         return ret;
1031 }
1032
1033
1034 static void nfs4_return_incompatible_delegation(struct inode *inode, fmode_t fmode)
1035 {
1036         struct nfs_delegation *delegation;
1037
1038         rcu_read_lock();
1039         delegation = rcu_dereference(NFS_I(inode)->delegation);
1040         if (delegation == NULL || (delegation->type & fmode) == fmode) {
1041                 rcu_read_unlock();
1042                 return;
1043         }
1044         rcu_read_unlock();
1045         nfs_inode_return_delegation(inode);
1046 }
1047
1048 static struct nfs4_state *nfs4_try_open_cached(struct nfs4_opendata *opendata)
1049 {
1050         struct nfs4_state *state = opendata->state;
1051         struct nfs_inode *nfsi = NFS_I(state->inode);
1052         struct nfs_delegation *delegation;
1053         int open_mode = opendata->o_arg.open_flags & (O_EXCL|O_TRUNC);
1054         fmode_t fmode = opendata->o_arg.fmode;
1055         nfs4_stateid stateid;
1056         int ret = -EAGAIN;
1057
1058         for (;;) {
1059                 if (can_open_cached(state, fmode, open_mode)) {
1060                         spin_lock(&state->owner->so_lock);
1061                         if (can_open_cached(state, fmode, open_mode)) {
1062                                 update_open_stateflags(state, fmode);
1063                                 spin_unlock(&state->owner->so_lock);
1064                                 goto out_return_state;
1065                         }
1066                         spin_unlock(&state->owner->so_lock);
1067                 }
1068                 rcu_read_lock();
1069                 delegation = rcu_dereference(nfsi->delegation);
1070                 if (!can_open_delegated(delegation, fmode)) {
1071                         rcu_read_unlock();
1072                         break;
1073                 }
1074                 /* Save the delegation */
1075                 nfs4_stateid_copy(&stateid, &delegation->stateid);
1076                 rcu_read_unlock();
1077                 ret = nfs_may_open(state->inode, state->owner->so_cred, open_mode);
1078                 if (ret != 0)
1079                         goto out;
1080                 ret = -EAGAIN;
1081
1082                 /* Try to update the stateid using the delegation */
1083                 if (update_open_stateid(state, NULL, &stateid, fmode))
1084                         goto out_return_state;
1085         }
1086 out:
1087         return ERR_PTR(ret);
1088 out_return_state:
1089         atomic_inc(&state->count);
1090         return state;
1091 }
1092
1093 static struct nfs4_state *nfs4_opendata_to_nfs4_state(struct nfs4_opendata *data)
1094 {
1095         struct inode *inode;
1096         struct nfs4_state *state = NULL;
1097         struct nfs_delegation *delegation;
1098         int ret;
1099
1100         if (!data->rpc_done) {
1101                 state = nfs4_try_open_cached(data);
1102                 goto out;
1103         }
1104
1105         ret = -EAGAIN;
1106         if (!(data->f_attr.valid & NFS_ATTR_FATTR))
1107                 goto err;
1108         inode = nfs_fhget(data->dir->d_sb, &data->o_res.fh, &data->f_attr);
1109         ret = PTR_ERR(inode);
1110         if (IS_ERR(inode))
1111                 goto err;
1112         ret = -ENOMEM;
1113         state = nfs4_get_open_state(inode, data->owner);
1114         if (state == NULL)
1115                 goto err_put_inode;
1116         if (data->o_res.delegation_type != 0) {
1117                 struct nfs_client *clp = NFS_SERVER(inode)->nfs_client;
1118                 int delegation_flags = 0;
1119
1120                 rcu_read_lock();
1121                 delegation = rcu_dereference(NFS_I(inode)->delegation);
1122                 if (delegation)
1123                         delegation_flags = delegation->flags;
1124                 rcu_read_unlock();
1125                 if (data->o_arg.claim == NFS4_OPEN_CLAIM_DELEGATE_CUR) {
1126                         pr_err_ratelimited("NFS: Broken NFSv4 server %s is "
1127                                         "returning a delegation for "
1128                                         "OPEN(CLAIM_DELEGATE_CUR)\n",
1129                                         clp->cl_hostname);
1130                 } else if ((delegation_flags & 1UL<<NFS_DELEGATION_NEED_RECLAIM) == 0)
1131                         nfs_inode_set_delegation(state->inode,
1132                                         data->owner->so_cred,
1133                                         &data->o_res);
1134                 else
1135                         nfs_inode_reclaim_delegation(state->inode,
1136                                         data->owner->so_cred,
1137                                         &data->o_res);
1138         }
1139
1140         update_open_stateid(state, &data->o_res.stateid, NULL,
1141                         data->o_arg.fmode);
1142         iput(inode);
1143 out:
1144         return state;
1145 err_put_inode:
1146         iput(inode);
1147 err:
1148         return ERR_PTR(ret);
1149 }
1150
1151 static struct nfs_open_context *nfs4_state_find_open_context(struct nfs4_state *state)
1152 {
1153         struct nfs_inode *nfsi = NFS_I(state->inode);
1154         struct nfs_open_context *ctx;
1155
1156         spin_lock(&state->inode->i_lock);
1157         list_for_each_entry(ctx, &nfsi->open_files, list) {
1158                 if (ctx->state != state)
1159                         continue;
1160                 get_nfs_open_context(ctx);
1161                 spin_unlock(&state->inode->i_lock);
1162                 return ctx;
1163         }
1164         spin_unlock(&state->inode->i_lock);
1165         return ERR_PTR(-ENOENT);
1166 }
1167
1168 static struct nfs4_opendata *nfs4_open_recoverdata_alloc(struct nfs_open_context *ctx, struct nfs4_state *state)
1169 {
1170         struct nfs4_opendata *opendata;
1171
1172         opendata = nfs4_opendata_alloc(ctx->dentry, state->owner, 0, 0, NULL, GFP_NOFS);
1173         if (opendata == NULL)
1174                 return ERR_PTR(-ENOMEM);
1175         opendata->state = state;
1176         atomic_inc(&state->count);
1177         return opendata;
1178 }
1179
1180 static int nfs4_open_recover_helper(struct nfs4_opendata *opendata, fmode_t fmode, struct nfs4_state **res)
1181 {
1182         struct nfs4_state *newstate;
1183         int ret;
1184
1185         opendata->o_arg.open_flags = 0;
1186         opendata->o_arg.fmode = fmode;
1187         memset(&opendata->o_res, 0, sizeof(opendata->o_res));
1188         memset(&opendata->c_res, 0, sizeof(opendata->c_res));
1189         nfs4_init_opendata_res(opendata);
1190         ret = _nfs4_recover_proc_open(opendata);
1191         if (ret != 0)
1192                 return ret; 
1193         newstate = nfs4_opendata_to_nfs4_state(opendata);
1194         if (IS_ERR(newstate))
1195                 return PTR_ERR(newstate);
1196         nfs4_close_state(newstate, fmode);
1197         *res = newstate;
1198         return 0;
1199 }
1200
1201 static int nfs4_open_recover(struct nfs4_opendata *opendata, struct nfs4_state *state)
1202 {
1203         struct nfs4_state *newstate;
1204         int ret;
1205
1206         /* memory barrier prior to reading state->n_* */
1207         clear_bit(NFS_DELEGATED_STATE, &state->flags);
1208         smp_rmb();
1209         if (state->n_rdwr != 0) {
1210                 clear_bit(NFS_O_RDWR_STATE, &state->flags);
1211                 ret = nfs4_open_recover_helper(opendata, FMODE_READ|FMODE_WRITE, &newstate);
1212                 if (ret != 0)
1213                         return ret;
1214                 if (newstate != state)
1215                         return -ESTALE;
1216         }
1217         if (state->n_wronly != 0) {
1218                 clear_bit(NFS_O_WRONLY_STATE, &state->flags);
1219                 ret = nfs4_open_recover_helper(opendata, FMODE_WRITE, &newstate);
1220                 if (ret != 0)
1221                         return ret;
1222                 if (newstate != state)
1223                         return -ESTALE;
1224         }
1225         if (state->n_rdonly != 0) {
1226                 clear_bit(NFS_O_RDONLY_STATE, &state->flags);
1227                 ret = nfs4_open_recover_helper(opendata, FMODE_READ, &newstate);
1228                 if (ret != 0)
1229                         return ret;
1230                 if (newstate != state)
1231                         return -ESTALE;
1232         }
1233         /*
1234          * We may have performed cached opens for all three recoveries.
1235          * Check if we need to update the current stateid.
1236          */
1237         if (test_bit(NFS_DELEGATED_STATE, &state->flags) == 0 &&
1238             !nfs4_stateid_match(&state->stateid, &state->open_stateid)) {
1239                 write_seqlock(&state->seqlock);
1240                 if (test_bit(NFS_DELEGATED_STATE, &state->flags) == 0)
1241                         nfs4_stateid_copy(&state->stateid, &state->open_stateid);
1242                 write_sequnlock(&state->seqlock);
1243         }
1244         return 0;
1245 }
1246
1247 /*
1248  * OPEN_RECLAIM:
1249  *      reclaim state on the server after a reboot.
1250  */
1251 static int _nfs4_do_open_reclaim(struct nfs_open_context *ctx, struct nfs4_state *state)
1252 {
1253         struct nfs_delegation *delegation;
1254         struct nfs4_opendata *opendata;
1255         fmode_t delegation_type = 0;
1256         int status;
1257
1258         opendata = nfs4_open_recoverdata_alloc(ctx, state);
1259         if (IS_ERR(opendata))
1260                 return PTR_ERR(opendata);
1261         opendata->o_arg.claim = NFS4_OPEN_CLAIM_PREVIOUS;
1262         opendata->o_arg.fh = NFS_FH(state->inode);
1263         rcu_read_lock();
1264         delegation = rcu_dereference(NFS_I(state->inode)->delegation);
1265         if (delegation != NULL && test_bit(NFS_DELEGATION_NEED_RECLAIM, &delegation->flags) != 0)
1266                 delegation_type = delegation->type;
1267         rcu_read_unlock();
1268         opendata->o_arg.u.delegation_type = delegation_type;
1269         status = nfs4_open_recover(opendata, state);
1270         nfs4_opendata_put(opendata);
1271         return status;
1272 }
1273
1274 static int nfs4_do_open_reclaim(struct nfs_open_context *ctx, struct nfs4_state *state)
1275 {
1276         struct nfs_server *server = NFS_SERVER(state->inode);
1277         struct nfs4_exception exception = { };
1278         int err;
1279         do {
1280                 err = _nfs4_do_open_reclaim(ctx, state);
1281                 if (err != -NFS4ERR_DELAY)
1282                         break;
1283                 nfs4_handle_exception(server, err, &exception);
1284         } while (exception.retry);
1285         return err;
1286 }
1287
1288 static int nfs4_open_reclaim(struct nfs4_state_owner *sp, struct nfs4_state *state)
1289 {
1290         struct nfs_open_context *ctx;
1291         int ret;
1292
1293         ctx = nfs4_state_find_open_context(state);
1294         if (IS_ERR(ctx))
1295                 return PTR_ERR(ctx);
1296         ret = nfs4_do_open_reclaim(ctx, state);
1297         put_nfs_open_context(ctx);
1298         return ret;
1299 }
1300
1301 static int _nfs4_open_delegation_recall(struct nfs_open_context *ctx, struct nfs4_state *state, const nfs4_stateid *stateid)
1302 {
1303         struct nfs4_opendata *opendata;
1304         int ret;
1305
1306         opendata = nfs4_open_recoverdata_alloc(ctx, state);
1307         if (IS_ERR(opendata))
1308                 return PTR_ERR(opendata);
1309         opendata->o_arg.claim = NFS4_OPEN_CLAIM_DELEGATE_CUR;
1310         nfs4_stateid_copy(&opendata->o_arg.u.delegation, stateid);
1311         ret = nfs4_open_recover(opendata, state);
1312         nfs4_opendata_put(opendata);
1313         return ret;
1314 }
1315
1316 int nfs4_open_delegation_recall(struct nfs_open_context *ctx, struct nfs4_state *state, const nfs4_stateid *stateid)
1317 {
1318         struct nfs4_exception exception = { };
1319         struct nfs_server *server = NFS_SERVER(state->inode);
1320         int err;
1321         do {
1322                 err = _nfs4_open_delegation_recall(ctx, state, stateid);
1323                 switch (err) {
1324                         case 0:
1325                         case -ENOENT:
1326                         case -ESTALE:
1327                                 goto out;
1328                         case -NFS4ERR_BADSESSION:
1329                         case -NFS4ERR_BADSLOT:
1330                         case -NFS4ERR_BAD_HIGH_SLOT:
1331                         case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION:
1332                         case -NFS4ERR_DEADSESSION:
1333                                 nfs4_schedule_session_recovery(server->nfs_client->cl_session);
1334                                 goto out;
1335                         case -NFS4ERR_STALE_CLIENTID:
1336                         case -NFS4ERR_STALE_STATEID:
1337                         case -NFS4ERR_EXPIRED:
1338                                 /* Don't recall a delegation if it was lost */
1339                                 nfs4_schedule_lease_recovery(server->nfs_client);
1340                                 goto out;
1341                         case -ERESTARTSYS:
1342                                 /*
1343                                  * The show must go on: exit, but mark the
1344                                  * stateid as needing recovery.
1345                                  */
1346                         case -NFS4ERR_DELEG_REVOKED:
1347                         case -NFS4ERR_ADMIN_REVOKED:
1348                         case -NFS4ERR_BAD_STATEID:
1349                                 nfs_inode_find_state_and_recover(state->inode,
1350                                                 stateid);
1351                                 nfs4_schedule_stateid_recovery(server, state);
1352                         case -EKEYEXPIRED:
1353                                 /*
1354                                  * User RPCSEC_GSS context has expired.
1355                                  * We cannot recover this stateid now, so
1356                                  * skip it and allow recovery thread to
1357                                  * proceed.
1358                                  */
1359                         case -ENOMEM:
1360                                 err = 0;
1361                                 goto out;
1362                 }
1363                 err = nfs4_handle_exception(server, err, &exception);
1364         } while (exception.retry);
1365 out:
1366         return err;
1367 }
1368
1369 static void nfs4_open_confirm_done(struct rpc_task *task, void *calldata)
1370 {
1371         struct nfs4_opendata *data = calldata;
1372
1373         data->rpc_status = task->tk_status;
1374         if (data->rpc_status == 0) {
1375                 nfs4_stateid_copy(&data->o_res.stateid, &data->c_res.stateid);
1376                 nfs_confirm_seqid(&data->owner->so_seqid, 0);
1377                 renew_lease(data->o_res.server, data->timestamp);
1378                 data->rpc_done = 1;
1379         }
1380 }
1381
1382 static void nfs4_open_confirm_release(void *calldata)
1383 {
1384         struct nfs4_opendata *data = calldata;
1385         struct nfs4_state *state = NULL;
1386
1387         /* If this request hasn't been cancelled, do nothing */
1388         if (data->cancelled == 0)
1389                 goto out_free;
1390         /* In case of error, no cleanup! */
1391         if (!data->rpc_done)
1392                 goto out_free;
1393         state = nfs4_opendata_to_nfs4_state(data);
1394         if (!IS_ERR(state))
1395                 nfs4_close_state(state, data->o_arg.fmode);
1396 out_free:
1397         nfs4_opendata_put(data);
1398 }
1399
1400 static const struct rpc_call_ops nfs4_open_confirm_ops = {
1401         .rpc_call_done = nfs4_open_confirm_done,
1402         .rpc_release = nfs4_open_confirm_release,
1403 };
1404
1405 /*
1406  * Note: On error, nfs4_proc_open_confirm will free the struct nfs4_opendata
1407  */
1408 static int _nfs4_proc_open_confirm(struct nfs4_opendata *data)
1409 {
1410         struct nfs_server *server = NFS_SERVER(data->dir->d_inode);
1411         struct rpc_task *task;
1412         struct  rpc_message msg = {
1413                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_OPEN_CONFIRM],
1414                 .rpc_argp = &data->c_arg,
1415                 .rpc_resp = &data->c_res,
1416                 .rpc_cred = data->owner->so_cred,
1417         };
1418         struct rpc_task_setup task_setup_data = {
1419                 .rpc_client = server->client,
1420                 .rpc_message = &msg,
1421                 .callback_ops = &nfs4_open_confirm_ops,
1422                 .callback_data = data,
1423                 .workqueue = nfsiod_workqueue,
1424                 .flags = RPC_TASK_ASYNC,
1425         };
1426         int status;
1427
1428         kref_get(&data->kref);
1429         data->rpc_done = 0;
1430         data->rpc_status = 0;
1431         data->timestamp = jiffies;
1432         task = rpc_run_task(&task_setup_data);
1433         if (IS_ERR(task))
1434                 return PTR_ERR(task);
1435         status = nfs4_wait_for_completion_rpc_task(task);
1436         if (status != 0) {
1437                 data->cancelled = 1;
1438                 smp_wmb();
1439         } else
1440                 status = data->rpc_status;
1441         rpc_put_task(task);
1442         return status;
1443 }
1444
1445 static void nfs4_open_prepare(struct rpc_task *task, void *calldata)
1446 {
1447         struct nfs4_opendata *data = calldata;
1448         struct nfs4_state_owner *sp = data->owner;
1449
1450         if (nfs_wait_on_sequence(data->o_arg.seqid, task) != 0)
1451                 return;
1452         /*
1453          * Check if we still need to send an OPEN call, or if we can use
1454          * a delegation instead.
1455          */
1456         if (data->state != NULL) {
1457                 struct nfs_delegation *delegation;
1458
1459                 if (can_open_cached(data->state, data->o_arg.fmode, data->o_arg.open_flags))
1460                         goto out_no_action;
1461                 rcu_read_lock();
1462                 delegation = rcu_dereference(NFS_I(data->state->inode)->delegation);
1463                 if (data->o_arg.claim != NFS4_OPEN_CLAIM_DELEGATE_CUR &&
1464                     can_open_delegated(delegation, data->o_arg.fmode))
1465                         goto unlock_no_action;
1466                 rcu_read_unlock();
1467         }
1468         /* Update client id. */
1469         data->o_arg.clientid = sp->so_server->nfs_client->cl_clientid;
1470         if (data->o_arg.claim == NFS4_OPEN_CLAIM_PREVIOUS) {
1471                 task->tk_msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_OPEN_NOATTR];
1472                 nfs_copy_fh(&data->o_res.fh, data->o_arg.fh);
1473         }
1474         data->timestamp = jiffies;
1475         if (nfs4_setup_sequence(data->o_arg.server,
1476                                 &data->o_arg.seq_args,
1477                                 &data->o_res.seq_res, task))
1478                 return;
1479         rpc_call_start(task);
1480         return;
1481 unlock_no_action:
1482         rcu_read_unlock();
1483 out_no_action:
1484         task->tk_action = NULL;
1485
1486 }
1487
1488 static void nfs4_recover_open_prepare(struct rpc_task *task, void *calldata)
1489 {
1490         rpc_task_set_priority(task, RPC_PRIORITY_PRIVILEGED);
1491         nfs4_open_prepare(task, calldata);
1492 }
1493
1494 static void nfs4_open_done(struct rpc_task *task, void *calldata)
1495 {
1496         struct nfs4_opendata *data = calldata;
1497
1498         data->rpc_status = task->tk_status;
1499
1500         if (!nfs4_sequence_done(task, &data->o_res.seq_res))
1501                 return;
1502
1503         if (task->tk_status == 0) {
1504                 switch (data->o_res.f_attr->mode & S_IFMT) {
1505                         case S_IFREG:
1506                                 break;
1507                         case S_IFLNK:
1508                                 data->rpc_status = -ELOOP;
1509                                 break;
1510                         case S_IFDIR:
1511                                 data->rpc_status = -EISDIR;
1512                                 break;
1513                         default:
1514                                 data->rpc_status = -ENOTDIR;
1515                 }
1516                 renew_lease(data->o_res.server, data->timestamp);
1517                 if (!(data->o_res.rflags & NFS4_OPEN_RESULT_CONFIRM))
1518                         nfs_confirm_seqid(&data->owner->so_seqid, 0);
1519         }
1520         data->rpc_done = 1;
1521 }
1522
1523 static void nfs4_open_release(void *calldata)
1524 {
1525         struct nfs4_opendata *data = calldata;
1526         struct nfs4_state *state = NULL;
1527
1528         /* If this request hasn't been cancelled, do nothing */
1529         if (data->cancelled == 0)
1530                 goto out_free;
1531         /* In case of error, no cleanup! */
1532         if (data->rpc_status != 0 || !data->rpc_done)
1533                 goto out_free;
1534         /* In case we need an open_confirm, no cleanup! */
1535         if (data->o_res.rflags & NFS4_OPEN_RESULT_CONFIRM)
1536                 goto out_free;
1537         state = nfs4_opendata_to_nfs4_state(data);
1538         if (!IS_ERR(state))
1539                 nfs4_close_state(state, data->o_arg.fmode);
1540 out_free:
1541         nfs4_opendata_put(data);
1542 }
1543
1544 static const struct rpc_call_ops nfs4_open_ops = {
1545         .rpc_call_prepare = nfs4_open_prepare,
1546         .rpc_call_done = nfs4_open_done,
1547         .rpc_release = nfs4_open_release,
1548 };
1549
1550 static const struct rpc_call_ops nfs4_recover_open_ops = {
1551         .rpc_call_prepare = nfs4_recover_open_prepare,
1552         .rpc_call_done = nfs4_open_done,
1553         .rpc_release = nfs4_open_release,
1554 };
1555
1556 static int nfs4_run_open_task(struct nfs4_opendata *data, int isrecover)
1557 {
1558         struct inode *dir = data->dir->d_inode;
1559         struct nfs_server *server = NFS_SERVER(dir);
1560         struct nfs_openargs *o_arg = &data->o_arg;
1561         struct nfs_openres *o_res = &data->o_res;
1562         struct rpc_task *task;
1563         struct rpc_message msg = {
1564                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_OPEN],
1565                 .rpc_argp = o_arg,
1566                 .rpc_resp = o_res,
1567                 .rpc_cred = data->owner->so_cred,
1568         };
1569         struct rpc_task_setup task_setup_data = {
1570                 .rpc_client = server->client,
1571                 .rpc_message = &msg,
1572                 .callback_ops = &nfs4_open_ops,
1573                 .callback_data = data,
1574                 .workqueue = nfsiod_workqueue,
1575                 .flags = RPC_TASK_ASYNC,
1576         };
1577         int status;
1578
1579         nfs41_init_sequence(&o_arg->seq_args, &o_res->seq_res, 1);
1580         kref_get(&data->kref);
1581         data->rpc_done = 0;
1582         data->rpc_status = 0;
1583         data->cancelled = 0;
1584         if (isrecover)
1585                 task_setup_data.callback_ops = &nfs4_recover_open_ops;
1586         task = rpc_run_task(&task_setup_data);
1587         if (IS_ERR(task))
1588                 return PTR_ERR(task);
1589         status = nfs4_wait_for_completion_rpc_task(task);
1590         if (status != 0) {
1591                 data->cancelled = 1;
1592                 smp_wmb();
1593         } else
1594                 status = data->rpc_status;
1595         rpc_put_task(task);
1596
1597         return status;
1598 }
1599
1600 static int _nfs4_recover_proc_open(struct nfs4_opendata *data)
1601 {
1602         struct inode *dir = data->dir->d_inode;
1603         struct nfs_openres *o_res = &data->o_res;
1604         int status;
1605
1606         status = nfs4_run_open_task(data, 1);
1607         if (status != 0 || !data->rpc_done)
1608                 return status;
1609
1610         nfs_fattr_map_and_free_names(NFS_SERVER(dir), &data->f_attr);
1611
1612         if (o_res->rflags & NFS4_OPEN_RESULT_CONFIRM) {
1613                 status = _nfs4_proc_open_confirm(data);
1614                 if (status != 0)
1615                         return status;
1616         }
1617
1618         return status;
1619 }
1620
1621 /*
1622  * Note: On error, nfs4_proc_open will free the struct nfs4_opendata
1623  */
1624 static int _nfs4_proc_open(struct nfs4_opendata *data)
1625 {
1626         struct inode *dir = data->dir->d_inode;
1627         struct nfs_server *server = NFS_SERVER(dir);
1628         struct nfs_openargs *o_arg = &data->o_arg;
1629         struct nfs_openres *o_res = &data->o_res;
1630         int status;
1631
1632         status = nfs4_run_open_task(data, 0);
1633         if (!data->rpc_done)
1634                 return status;
1635         if (status != 0) {
1636                 if (status == -NFS4ERR_BADNAME &&
1637                                 !(o_arg->open_flags & O_CREAT))
1638                         return -ENOENT;
1639                 return status;
1640         }
1641
1642         nfs_fattr_map_and_free_names(server, &data->f_attr);
1643
1644         if (o_arg->open_flags & O_CREAT)
1645                 update_changeattr(dir, &o_res->cinfo);
1646         if ((o_res->rflags & NFS4_OPEN_RESULT_LOCKTYPE_POSIX) == 0)
1647                 server->caps &= ~NFS_CAP_POSIX_LOCK;
1648         if(o_res->rflags & NFS4_OPEN_RESULT_CONFIRM) {
1649                 status = _nfs4_proc_open_confirm(data);
1650                 if (status != 0)
1651                         return status;
1652         }
1653         if (!(o_res->f_attr->valid & NFS_ATTR_FATTR))
1654                 _nfs4_proc_getattr(server, &o_res->fh, o_res->f_attr);
1655         return 0;
1656 }
1657
1658 static int nfs4_client_recover_expired_lease(struct nfs_client *clp)
1659 {
1660         unsigned int loop;
1661         int ret;
1662
1663         for (loop = NFS4_MAX_LOOP_ON_RECOVER; loop != 0; loop--) {
1664                 ret = nfs4_wait_clnt_recover(clp);
1665                 if (ret != 0)
1666                         break;
1667                 if (!test_bit(NFS4CLNT_LEASE_EXPIRED, &clp->cl_state) &&
1668                     !test_bit(NFS4CLNT_CHECK_LEASE,&clp->cl_state))
1669                         break;
1670                 nfs4_schedule_state_manager(clp);
1671                 ret = -EIO;
1672         }
1673         return ret;
1674 }
1675
1676 static int nfs4_recover_expired_lease(struct nfs_server *server)
1677 {
1678         return nfs4_client_recover_expired_lease(server->nfs_client);
1679 }
1680
1681 /*
1682  * OPEN_EXPIRED:
1683  *      reclaim state on the server after a network partition.
1684  *      Assumes caller holds the appropriate lock
1685  */
1686 static int _nfs4_open_expired(struct nfs_open_context *ctx, struct nfs4_state *state)
1687 {
1688         struct nfs4_opendata *opendata;
1689         int ret;
1690
1691         opendata = nfs4_open_recoverdata_alloc(ctx, state);
1692         if (IS_ERR(opendata))
1693                 return PTR_ERR(opendata);
1694         ret = nfs4_open_recover(opendata, state);
1695         if (ret == -ESTALE)
1696                 d_drop(ctx->dentry);
1697         nfs4_opendata_put(opendata);
1698         return ret;
1699 }
1700
1701 static int nfs4_do_open_expired(struct nfs_open_context *ctx, struct nfs4_state *state)
1702 {
1703         struct nfs_server *server = NFS_SERVER(state->inode);
1704         struct nfs4_exception exception = { };
1705         int err;
1706
1707         do {
1708                 err = _nfs4_open_expired(ctx, state);
1709                 switch (err) {
1710                 default:
1711                         goto out;
1712                 case -NFS4ERR_GRACE:
1713                 case -NFS4ERR_DELAY:
1714                         nfs4_handle_exception(server, err, &exception);
1715                         err = 0;
1716                 }
1717         } while (exception.retry);
1718 out:
1719         return err;
1720 }
1721
1722 static int nfs4_open_expired(struct nfs4_state_owner *sp, struct nfs4_state *state)
1723 {
1724         struct nfs_open_context *ctx;
1725         int ret;
1726
1727         ctx = nfs4_state_find_open_context(state);
1728         if (IS_ERR(ctx))
1729                 return PTR_ERR(ctx);
1730         ret = nfs4_do_open_expired(ctx, state);
1731         put_nfs_open_context(ctx);
1732         return ret;
1733 }
1734
1735 #if defined(CONFIG_NFS_V4_1)
1736 static int nfs41_check_expired_stateid(struct nfs4_state *state, nfs4_stateid *stateid, unsigned int flags)
1737 {
1738         int status = NFS_OK;
1739         struct nfs_server *server = NFS_SERVER(state->inode);
1740
1741         if (state->flags & flags) {
1742                 status = nfs41_test_stateid(server, stateid);
1743                 if (status != NFS_OK) {
1744                         nfs41_free_stateid(server, stateid);
1745                         state->flags &= ~flags;
1746                 }
1747         }
1748         return status;
1749 }
1750
1751 static int nfs41_open_expired(struct nfs4_state_owner *sp, struct nfs4_state *state)
1752 {
1753         int deleg_status, open_status;
1754         int deleg_flags = 1 << NFS_DELEGATED_STATE;
1755         int open_flags = (1 << NFS_O_RDONLY_STATE) | (1 << NFS_O_WRONLY_STATE) | (1 << NFS_O_RDWR_STATE);
1756
1757         deleg_status = nfs41_check_expired_stateid(state, &state->stateid, deleg_flags);
1758         open_status = nfs41_check_expired_stateid(state,  &state->open_stateid, open_flags);
1759
1760         if ((deleg_status == NFS_OK) && (open_status == NFS_OK))
1761                 return NFS_OK;
1762         return nfs4_open_expired(sp, state);
1763 }
1764 #endif
1765
1766 /*
1767  * on an EXCLUSIVE create, the server should send back a bitmask with FATTR4-*
1768  * fields corresponding to attributes that were used to store the verifier.
1769  * Make sure we clobber those fields in the later setattr call
1770  */
1771 static inline void nfs4_exclusive_attrset(struct nfs4_opendata *opendata, struct iattr *sattr)
1772 {
1773         if ((opendata->o_res.attrset[1] & FATTR4_WORD1_TIME_ACCESS) &&
1774             !(sattr->ia_valid & ATTR_ATIME_SET))
1775                 sattr->ia_valid |= ATTR_ATIME;
1776
1777         if ((opendata->o_res.attrset[1] & FATTR4_WORD1_TIME_MODIFY) &&
1778             !(sattr->ia_valid & ATTR_MTIME_SET))
1779                 sattr->ia_valid |= ATTR_MTIME;
1780 }
1781
1782 /*
1783  * Returns a referenced nfs4_state
1784  */
1785 static int _nfs4_do_open(struct inode *dir, struct dentry *dentry, fmode_t fmode, int flags, struct iattr *sattr, struct rpc_cred *cred, struct nfs4_state **res)
1786 {
1787         struct nfs4_state_owner  *sp;
1788         struct nfs4_state     *state = NULL;
1789         struct nfs_server       *server = NFS_SERVER(dir);
1790         struct nfs4_opendata *opendata;
1791         int status;
1792
1793         /* Protect against reboot recovery conflicts */
1794         status = -ENOMEM;
1795         sp = nfs4_get_state_owner(server, cred, GFP_KERNEL);
1796         if (sp == NULL) {
1797                 dprintk("nfs4_do_open: nfs4_get_state_owner failed!\n");
1798                 goto out_err;
1799         }
1800         status = nfs4_recover_expired_lease(server);
1801         if (status != 0)
1802                 goto err_put_state_owner;
1803         if (dentry->d_inode != NULL)
1804                 nfs4_return_incompatible_delegation(dentry->d_inode, fmode);
1805         status = -ENOMEM;
1806         opendata = nfs4_opendata_alloc(dentry, sp, fmode, flags, sattr, GFP_KERNEL);
1807         if (opendata == NULL)
1808                 goto err_put_state_owner;
1809
1810         if (dentry->d_inode != NULL)
1811                 opendata->state = nfs4_get_open_state(dentry->d_inode, sp);
1812
1813         status = _nfs4_proc_open(opendata);
1814         if (status != 0)
1815                 goto err_opendata_put;
1816
1817         state = nfs4_opendata_to_nfs4_state(opendata);
1818         status = PTR_ERR(state);
1819         if (IS_ERR(state))
1820                 goto err_opendata_put;
1821         if (server->caps & NFS_CAP_POSIX_LOCK)
1822                 set_bit(NFS_STATE_POSIX_LOCKS, &state->flags);
1823
1824         if (opendata->o_arg.open_flags & O_EXCL) {
1825                 nfs4_exclusive_attrset(opendata, sattr);
1826
1827                 nfs_fattr_init(opendata->o_res.f_attr);
1828                 status = nfs4_do_setattr(state->inode, cred,
1829                                 opendata->o_res.f_attr, sattr,
1830                                 state);
1831                 if (status == 0)
1832                         nfs_setattr_update_inode(state->inode, sattr);
1833                 nfs_post_op_update_inode(state->inode, opendata->o_res.f_attr);
1834         }
1835         nfs4_opendata_put(opendata);
1836         nfs4_put_state_owner(sp);
1837         *res = state;
1838         return 0;
1839 err_opendata_put:
1840         nfs4_opendata_put(opendata);
1841 err_put_state_owner:
1842         nfs4_put_state_owner(sp);
1843 out_err:
1844         *res = NULL;
1845         return status;
1846 }
1847
1848
1849 static struct nfs4_state *nfs4_do_open(struct inode *dir, struct dentry *dentry, fmode_t fmode, int flags, struct iattr *sattr, struct rpc_cred *cred)
1850 {
1851         struct nfs4_exception exception = { };
1852         struct nfs4_state *res;
1853         int status;
1854
1855         do {
1856                 status = _nfs4_do_open(dir, dentry, fmode, flags, sattr, cred, &res);
1857                 if (status == 0)
1858                         break;
1859                 /* NOTE: BAD_SEQID means the server and client disagree about the
1860                  * book-keeping w.r.t. state-changing operations
1861                  * (OPEN/CLOSE/LOCK/LOCKU...)
1862                  * It is actually a sign of a bug on the client or on the server.
1863                  *
1864                  * If we receive a BAD_SEQID error in the particular case of
1865                  * doing an OPEN, we assume that nfs_increment_open_seqid() will
1866                  * have unhashed the old state_owner for us, and that we can
1867                  * therefore safely retry using a new one. We should still warn
1868                  * the user though...
1869                  */
1870                 if (status == -NFS4ERR_BAD_SEQID) {
1871                         pr_warn_ratelimited("NFS: v4 server %s "
1872                                         " returned a bad sequence-id error!\n",
1873                                         NFS_SERVER(dir)->nfs_client->cl_hostname);
1874                         exception.retry = 1;
1875                         continue;
1876                 }
1877                 /*
1878                  * BAD_STATEID on OPEN means that the server cancelled our
1879                  * state before it received the OPEN_CONFIRM.
1880                  * Recover by retrying the request as per the discussion
1881                  * on Page 181 of RFC3530.
1882                  */
1883                 if (status == -NFS4ERR_BAD_STATEID) {
1884                         exception.retry = 1;
1885                         continue;
1886                 }
1887                 if (status == -EAGAIN) {
1888                         /* We must have found a delegation */
1889                         exception.retry = 1;
1890                         continue;
1891                 }
1892                 res = ERR_PTR(nfs4_handle_exception(NFS_SERVER(dir),
1893                                         status, &exception));
1894         } while (exception.retry);
1895         return res;
1896 }
1897
1898 static int _nfs4_do_setattr(struct inode *inode, struct rpc_cred *cred,
1899                             struct nfs_fattr *fattr, struct iattr *sattr,
1900                             struct nfs4_state *state)
1901 {
1902         struct nfs_server *server = NFS_SERVER(inode);
1903         struct nfs_setattrargs  arg = {
1904                 .fh             = NFS_FH(inode),
1905                 .iap            = sattr,
1906                 .server         = server,
1907                 .bitmask = server->attr_bitmask,
1908         };
1909         struct nfs_setattrres  res = {
1910                 .fattr          = fattr,
1911                 .server         = server,
1912         };
1913         struct rpc_message msg = {
1914                 .rpc_proc       = &nfs4_procedures[NFSPROC4_CLNT_SETATTR],
1915                 .rpc_argp       = &arg,
1916                 .rpc_resp       = &res,
1917                 .rpc_cred       = cred,
1918         };
1919         unsigned long timestamp = jiffies;
1920         int status;
1921
1922         nfs_fattr_init(fattr);
1923
1924         if (state != NULL) {
1925                 nfs4_select_rw_stateid(&arg.stateid, state, FMODE_WRITE,
1926                                 current->files, current->tgid);
1927         } else if (nfs4_copy_delegation_stateid(&arg.stateid, inode,
1928                                 FMODE_WRITE)) {
1929                 /* Use that stateid */
1930         } else
1931                 nfs4_stateid_copy(&arg.stateid, &zero_stateid);
1932
1933         status = nfs4_call_sync(server->client, server, &msg, &arg.seq_args, &res.seq_res, 1);
1934         if (status == 0 && state != NULL)
1935                 renew_lease(server, timestamp);
1936         return status;
1937 }
1938
1939 static int nfs4_do_setattr(struct inode *inode, struct rpc_cred *cred,
1940                            struct nfs_fattr *fattr, struct iattr *sattr,
1941                            struct nfs4_state *state)
1942 {
1943         struct nfs_server *server = NFS_SERVER(inode);
1944         struct nfs4_exception exception = {
1945                 .state = state,
1946                 .inode = inode,
1947         };
1948         int err;
1949         do {
1950                 err = _nfs4_do_setattr(inode, cred, fattr, sattr, state);
1951                 switch (err) {
1952                 case -NFS4ERR_OPENMODE:
1953                         if (state && !(state->state & FMODE_WRITE)) {
1954                                 err = -EBADF;
1955                                 if (sattr->ia_valid & ATTR_OPEN)
1956                                         err = -EACCES;
1957                                 goto out;
1958                         }
1959                 }
1960                 err = nfs4_handle_exception(server, err, &exception);
1961         } while (exception.retry);
1962 out:
1963         return err;
1964 }
1965
1966 struct nfs4_closedata {
1967         struct inode *inode;
1968         struct nfs4_state *state;
1969         struct nfs_closeargs arg;
1970         struct nfs_closeres res;
1971         struct nfs_fattr fattr;
1972         unsigned long timestamp;
1973         bool roc;
1974         u32 roc_barrier;
1975 };
1976
1977 static void nfs4_free_closedata(void *data)
1978 {
1979         struct nfs4_closedata *calldata = data;
1980         struct nfs4_state_owner *sp = calldata->state->owner;
1981         struct super_block *sb = calldata->state->inode->i_sb;
1982
1983         if (calldata->roc)
1984                 pnfs_roc_release(calldata->state->inode);
1985         nfs4_put_open_state(calldata->state);
1986         nfs_free_seqid(calldata->arg.seqid);
1987         nfs4_put_state_owner(sp);
1988         nfs_sb_deactive(sb);
1989         kfree(calldata);
1990 }
1991
1992 static void nfs4_close_clear_stateid_flags(struct nfs4_state *state,
1993                 fmode_t fmode)
1994 {
1995         spin_lock(&state->owner->so_lock);
1996         if (!(fmode & FMODE_READ))
1997                 clear_bit(NFS_O_RDONLY_STATE, &state->flags);
1998         if (!(fmode & FMODE_WRITE))
1999                 clear_bit(NFS_O_WRONLY_STATE, &state->flags);
2000         clear_bit(NFS_O_RDWR_STATE, &state->flags);
2001         spin_unlock(&state->owner->so_lock);
2002 }
2003
2004 static void nfs4_close_done(struct rpc_task *task, void *data)
2005 {
2006         struct nfs4_closedata *calldata = data;
2007         struct nfs4_state *state = calldata->state;
2008         struct nfs_server *server = NFS_SERVER(calldata->inode);
2009
2010         dprintk("%s: begin!\n", __func__);
2011         if (!nfs4_sequence_done(task, &calldata->res.seq_res))
2012                 return;
2013         /* hmm. we are done with the inode, and in the process of freeing
2014          * the state_owner. we keep this around to process errors
2015          */
2016         switch (task->tk_status) {
2017                 case 0:
2018                         if (calldata->roc)
2019                                 pnfs_roc_set_barrier(state->inode,
2020                                                      calldata->roc_barrier);
2021                         nfs_set_open_stateid(state, &calldata->res.stateid, 0);
2022                         renew_lease(server, calldata->timestamp);
2023                         nfs4_close_clear_stateid_flags(state,
2024                                         calldata->arg.fmode);
2025                         break;
2026                 case -NFS4ERR_STALE_STATEID:
2027                 case -NFS4ERR_OLD_STATEID:
2028                 case -NFS4ERR_BAD_STATEID:
2029                 case -NFS4ERR_EXPIRED:
2030                         if (calldata->arg.fmode == 0)
2031                                 break;
2032                 default:
2033                         if (nfs4_async_handle_error(task, server, state) == -EAGAIN)
2034                                 rpc_restart_call_prepare(task);
2035         }
2036         nfs_release_seqid(calldata->arg.seqid);
2037         nfs_refresh_inode(calldata->inode, calldata->res.fattr);
2038         dprintk("%s: done, ret = %d!\n", __func__, task->tk_status);
2039 }
2040
2041 static void nfs4_close_prepare(struct rpc_task *task, void *data)
2042 {
2043         struct nfs4_closedata *calldata = data;
2044         struct nfs4_state *state = calldata->state;
2045         int call_close = 0;
2046
2047         dprintk("%s: begin!\n", __func__);
2048         if (nfs_wait_on_sequence(calldata->arg.seqid, task) != 0)
2049                 return;
2050
2051         task->tk_msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_OPEN_DOWNGRADE];
2052         calldata->arg.fmode = FMODE_READ|FMODE_WRITE;
2053         spin_lock(&state->owner->so_lock);
2054         /* Calculate the change in open mode */
2055         if (state->n_rdwr == 0) {
2056                 if (state->n_rdonly == 0) {
2057                         call_close |= test_bit(NFS_O_RDONLY_STATE, &state->flags);
2058                         call_close |= test_bit(NFS_O_RDWR_STATE, &state->flags);
2059                         calldata->arg.fmode &= ~FMODE_READ;
2060                 }
2061                 if (state->n_wronly == 0) {
2062                         call_close |= test_bit(NFS_O_WRONLY_STATE, &state->flags);
2063                         call_close |= test_bit(NFS_O_RDWR_STATE, &state->flags);
2064                         calldata->arg.fmode &= ~FMODE_WRITE;
2065                 }
2066         }
2067         spin_unlock(&state->owner->so_lock);
2068
2069         if (!call_close) {
2070                 /* Note: exit _without_ calling nfs4_close_done */
2071                 task->tk_action = NULL;
2072                 goto out;
2073         }
2074
2075         if (calldata->arg.fmode == 0) {
2076                 task->tk_msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_CLOSE];
2077                 if (calldata->roc &&
2078                     pnfs_roc_drain(calldata->inode, &calldata->roc_barrier)) {
2079                         rpc_sleep_on(&NFS_SERVER(calldata->inode)->roc_rpcwaitq,
2080                                      task, NULL);
2081                         goto out;
2082                 }
2083         }
2084
2085         nfs_fattr_init(calldata->res.fattr);
2086         calldata->timestamp = jiffies;
2087         if (nfs4_setup_sequence(NFS_SERVER(calldata->inode),
2088                                 &calldata->arg.seq_args,
2089                                 &calldata->res.seq_res,
2090                                 task))
2091                 goto out;
2092         rpc_call_start(task);
2093 out:
2094         dprintk("%s: done!\n", __func__);
2095 }
2096
2097 static const struct rpc_call_ops nfs4_close_ops = {
2098         .rpc_call_prepare = nfs4_close_prepare,
2099         .rpc_call_done = nfs4_close_done,
2100         .rpc_release = nfs4_free_closedata,
2101 };
2102
2103 /* 
2104  * It is possible for data to be read/written from a mem-mapped file 
2105  * after the sys_close call (which hits the vfs layer as a flush).
2106  * This means that we can't safely call nfsv4 close on a file until 
2107  * the inode is cleared. This in turn means that we are not good
2108  * NFSv4 citizens - we do not indicate to the server to update the file's 
2109  * share state even when we are done with one of the three share 
2110  * stateid's in the inode.
2111  *
2112  * NOTE: Caller must be holding the sp->so_owner semaphore!
2113  */
2114 int nfs4_do_close(struct nfs4_state *state, gfp_t gfp_mask, int wait, bool roc)
2115 {
2116         struct nfs_server *server = NFS_SERVER(state->inode);
2117         struct nfs4_closedata *calldata;
2118         struct nfs4_state_owner *sp = state->owner;
2119         struct rpc_task *task;
2120         struct rpc_message msg = {
2121                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_CLOSE],
2122                 .rpc_cred = state->owner->so_cred,
2123         };
2124         struct rpc_task_setup task_setup_data = {
2125                 .rpc_client = server->client,
2126                 .rpc_message = &msg,
2127                 .callback_ops = &nfs4_close_ops,
2128                 .workqueue = nfsiod_workqueue,
2129                 .flags = RPC_TASK_ASYNC,
2130         };
2131         int status = -ENOMEM;
2132
2133         calldata = kzalloc(sizeof(*calldata), gfp_mask);
2134         if (calldata == NULL)
2135                 goto out;
2136         nfs41_init_sequence(&calldata->arg.seq_args, &calldata->res.seq_res, 1);
2137         calldata->inode = state->inode;
2138         calldata->state = state;
2139         calldata->arg.fh = NFS_FH(state->inode);
2140         calldata->arg.stateid = &state->open_stateid;
2141         /* Serialization for the sequence id */
2142         calldata->arg.seqid = nfs_alloc_seqid(&state->owner->so_seqid, gfp_mask);
2143         if (calldata->arg.seqid == NULL)
2144                 goto out_free_calldata;
2145         calldata->arg.fmode = 0;
2146         calldata->arg.bitmask = server->cache_consistency_bitmask;
2147         calldata->res.fattr = &calldata->fattr;
2148         calldata->res.seqid = calldata->arg.seqid;
2149         calldata->res.server = server;
2150         calldata->roc = roc;
2151         nfs_sb_active(calldata->inode->i_sb);
2152
2153         msg.rpc_argp = &calldata->arg;
2154         msg.rpc_resp = &calldata->res;
2155         task_setup_data.callback_data = calldata;
2156         task = rpc_run_task(&task_setup_data);
2157         if (IS_ERR(task))
2158                 return PTR_ERR(task);
2159         status = 0;
2160         if (wait)
2161                 status = rpc_wait_for_completion_task(task);
2162         rpc_put_task(task);
2163         return status;
2164 out_free_calldata:
2165         kfree(calldata);
2166 out:
2167         if (roc)
2168                 pnfs_roc_release(state->inode);
2169         nfs4_put_open_state(state);
2170         nfs4_put_state_owner(sp);
2171         return status;
2172 }
2173
2174 static struct inode *
2175 nfs4_atomic_open(struct inode *dir, struct nfs_open_context *ctx, int open_flags, struct iattr *attr)
2176 {
2177         struct nfs4_state *state;
2178
2179         /* Protect against concurrent sillydeletes */
2180         state = nfs4_do_open(dir, ctx->dentry, ctx->mode, open_flags, attr, ctx->cred);
2181         if (IS_ERR(state))
2182                 return ERR_CAST(state);
2183         ctx->state = state;
2184         return igrab(state->inode);
2185 }
2186
2187 static void nfs4_close_context(struct nfs_open_context *ctx, int is_sync)
2188 {
2189         if (ctx->state == NULL)
2190                 return;
2191         if (is_sync)
2192                 nfs4_close_sync(ctx->state, ctx->mode);
2193         else
2194                 nfs4_close_state(ctx->state, ctx->mode);
2195 }
2196
2197 static int _nfs4_server_capabilities(struct nfs_server *server, struct nfs_fh *fhandle)
2198 {
2199         struct nfs4_server_caps_arg args = {
2200                 .fhandle = fhandle,
2201         };
2202         struct nfs4_server_caps_res res = {};
2203         struct rpc_message msg = {
2204                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SERVER_CAPS],
2205                 .rpc_argp = &args,
2206                 .rpc_resp = &res,
2207         };
2208         int status;
2209
2210         status = nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
2211         if (status == 0) {
2212                 memcpy(server->attr_bitmask, res.attr_bitmask, sizeof(server->attr_bitmask));
2213                 server->caps &= ~(NFS_CAP_ACLS|NFS_CAP_HARDLINKS|
2214                                 NFS_CAP_SYMLINKS|NFS_CAP_FILEID|
2215                                 NFS_CAP_MODE|NFS_CAP_NLINK|NFS_CAP_OWNER|
2216                                 NFS_CAP_OWNER_GROUP|NFS_CAP_ATIME|
2217                                 NFS_CAP_CTIME|NFS_CAP_MTIME);
2218                 if (res.attr_bitmask[0] & FATTR4_WORD0_ACL)
2219                         server->caps |= NFS_CAP_ACLS;
2220                 if (res.has_links != 0)
2221                         server->caps |= NFS_CAP_HARDLINKS;
2222                 if (res.has_symlinks != 0)
2223                         server->caps |= NFS_CAP_SYMLINKS;
2224                 if (res.attr_bitmask[0] & FATTR4_WORD0_FILEID)
2225                         server->caps |= NFS_CAP_FILEID;
2226                 if (res.attr_bitmask[1] & FATTR4_WORD1_MODE)
2227                         server->caps |= NFS_CAP_MODE;
2228                 if (res.attr_bitmask[1] & FATTR4_WORD1_NUMLINKS)
2229                         server->caps |= NFS_CAP_NLINK;
2230                 if (res.attr_bitmask[1] & FATTR4_WORD1_OWNER)
2231                         server->caps |= NFS_CAP_OWNER;
2232                 if (res.attr_bitmask[1] & FATTR4_WORD1_OWNER_GROUP)
2233                         server->caps |= NFS_CAP_OWNER_GROUP;
2234                 if (res.attr_bitmask[1] & FATTR4_WORD1_TIME_ACCESS)
2235                         server->caps |= NFS_CAP_ATIME;
2236                 if (res.attr_bitmask[1] & FATTR4_WORD1_TIME_METADATA)
2237                         server->caps |= NFS_CAP_CTIME;
2238                 if (res.attr_bitmask[1] & FATTR4_WORD1_TIME_MODIFY)
2239                         server->caps |= NFS_CAP_MTIME;
2240
2241                 memcpy(server->cache_consistency_bitmask, res.attr_bitmask, sizeof(server->cache_consistency_bitmask));
2242                 server->cache_consistency_bitmask[0] &= FATTR4_WORD0_CHANGE|FATTR4_WORD0_SIZE;
2243                 server->cache_consistency_bitmask[1] &= FATTR4_WORD1_TIME_METADATA|FATTR4_WORD1_TIME_MODIFY;
2244                 server->acl_bitmask = res.acl_bitmask;
2245                 server->fh_expire_type = res.fh_expire_type;
2246         }
2247
2248         return status;
2249 }
2250
2251 int nfs4_server_capabilities(struct nfs_server *server, struct nfs_fh *fhandle)
2252 {
2253         struct nfs4_exception exception = { };
2254         int err;
2255         do {
2256                 err = nfs4_handle_exception(server,
2257                                 _nfs4_server_capabilities(server, fhandle),
2258                                 &exception);
2259         } while (exception.retry);
2260         return err;
2261 }
2262
2263 static int _nfs4_lookup_root(struct nfs_server *server, struct nfs_fh *fhandle,
2264                 struct nfs_fsinfo *info)
2265 {
2266         struct nfs4_lookup_root_arg args = {
2267                 .bitmask = nfs4_fattr_bitmap,
2268         };
2269         struct nfs4_lookup_res res = {
2270                 .server = server,
2271                 .fattr = info->fattr,
2272                 .fh = fhandle,
2273         };
2274         struct rpc_message msg = {
2275                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LOOKUP_ROOT],
2276                 .rpc_argp = &args,
2277                 .rpc_resp = &res,
2278         };
2279
2280         nfs_fattr_init(info->fattr);
2281         return nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
2282 }
2283
2284 static int nfs4_lookup_root(struct nfs_server *server, struct nfs_fh *fhandle,
2285                 struct nfs_fsinfo *info)
2286 {
2287         struct nfs4_exception exception = { };
2288         int err;
2289         do {
2290                 err = _nfs4_lookup_root(server, fhandle, info);
2291                 switch (err) {
2292                 case 0:
2293                 case -NFS4ERR_WRONGSEC:
2294                         goto out;
2295                 default:
2296                         err = nfs4_handle_exception(server, err, &exception);
2297                 }
2298         } while (exception.retry);
2299 out:
2300         return err;
2301 }
2302
2303 static int nfs4_lookup_root_sec(struct nfs_server *server, struct nfs_fh *fhandle,
2304                                 struct nfs_fsinfo *info, rpc_authflavor_t flavor)
2305 {
2306         struct rpc_auth *auth;
2307         int ret;
2308
2309         auth = rpcauth_create(flavor, server->client);
2310         if (!auth) {
2311                 ret = -EIO;
2312                 goto out;
2313         }
2314         ret = nfs4_lookup_root(server, fhandle, info);
2315 out:
2316         return ret;
2317 }
2318
2319 static int nfs4_find_root_sec(struct nfs_server *server, struct nfs_fh *fhandle,
2320                               struct nfs_fsinfo *info)
2321 {
2322         int i, len, status = 0;
2323         rpc_authflavor_t flav_array[NFS_MAX_SECFLAVORS];
2324
2325         len = gss_mech_list_pseudoflavors(&flav_array[0]);
2326         flav_array[len] = RPC_AUTH_NULL;
2327         len += 1;
2328
2329         for (i = 0; i < len; i++) {
2330                 status = nfs4_lookup_root_sec(server, fhandle, info, flav_array[i]);
2331                 if (status == -NFS4ERR_WRONGSEC || status == -EACCES)
2332                         continue;
2333                 break;
2334         }
2335         /*
2336          * -EACCESS could mean that the user doesn't have correct permissions
2337          * to access the mount.  It could also mean that we tried to mount
2338          * with a gss auth flavor, but rpc.gssd isn't running.  Either way,
2339          * existing mount programs don't handle -EACCES very well so it should
2340          * be mapped to -EPERM instead.
2341          */
2342         if (status == -EACCES)
2343                 status = -EPERM;
2344         return status;
2345 }
2346
2347 /*
2348  * get the file handle for the "/" directory on the server
2349  */
2350 int nfs4_proc_get_rootfh(struct nfs_server *server, struct nfs_fh *fhandle,
2351                          struct nfs_fsinfo *info)
2352 {
2353         int minor_version = server->nfs_client->cl_minorversion;
2354         int status = nfs4_lookup_root(server, fhandle, info);
2355         if ((status == -NFS4ERR_WRONGSEC) && !(server->flags & NFS_MOUNT_SECFLAVOUR))
2356                 /*
2357                  * A status of -NFS4ERR_WRONGSEC will be mapped to -EPERM
2358                  * by nfs4_map_errors() as this function exits.
2359                  */
2360                 status = nfs_v4_minor_ops[minor_version]->find_root_sec(server, fhandle, info);
2361         if (status == 0)
2362                 status = nfs4_server_capabilities(server, fhandle);
2363         if (status == 0)
2364                 status = nfs4_do_fsinfo(server, fhandle, info);
2365         return nfs4_map_errors(status);
2366 }
2367
2368 static int nfs4_proc_get_root(struct nfs_server *server, struct nfs_fh *mntfh,
2369                               struct nfs_fsinfo *info)
2370 {
2371         int error;
2372         struct nfs_fattr *fattr = info->fattr;
2373
2374         error = nfs4_server_capabilities(server, mntfh);
2375         if (error < 0) {
2376                 dprintk("nfs4_get_root: getcaps error = %d\n", -error);
2377                 return error;
2378         }
2379
2380         error = nfs4_proc_getattr(server, mntfh, fattr);
2381         if (error < 0) {
2382                 dprintk("nfs4_get_root: getattr error = %d\n", -error);
2383                 return error;
2384         }
2385
2386         if (fattr->valid & NFS_ATTR_FATTR_FSID &&
2387             !nfs_fsid_equal(&server->fsid, &fattr->fsid))
2388                 memcpy(&server->fsid, &fattr->fsid, sizeof(server->fsid));
2389
2390         return error;
2391 }
2392
2393 /*
2394  * Get locations and (maybe) other attributes of a referral.
2395  * Note that we'll actually follow the referral later when
2396  * we detect fsid mismatch in inode revalidation
2397  */
2398 static int nfs4_get_referral(struct rpc_clnt *client, struct inode *dir,
2399                              const struct qstr *name, struct nfs_fattr *fattr,
2400                              struct nfs_fh *fhandle)
2401 {
2402         int status = -ENOMEM;
2403         struct page *page = NULL;
2404         struct nfs4_fs_locations *locations = NULL;
2405
2406         page = alloc_page(GFP_KERNEL);
2407         if (page == NULL)
2408                 goto out;
2409         locations = kmalloc(sizeof(struct nfs4_fs_locations), GFP_KERNEL);
2410         if (locations == NULL)
2411                 goto out;
2412
2413         status = nfs4_proc_fs_locations(client, dir, name, locations, page);
2414         if (status != 0)
2415                 goto out;
2416         /* Make sure server returned a different fsid for the referral */
2417         if (nfs_fsid_equal(&NFS_SERVER(dir)->fsid, &locations->fattr.fsid)) {
2418                 dprintk("%s: server did not return a different fsid for"
2419                         " a referral at %s\n", __func__, name->name);
2420                 status = -EIO;
2421                 goto out;
2422         }
2423         /* Fixup attributes for the nfs_lookup() call to nfs_fhget() */
2424         nfs_fixup_referral_attributes(&locations->fattr);
2425
2426         /* replace the lookup nfs_fattr with the locations nfs_fattr */
2427         memcpy(fattr, &locations->fattr, sizeof(struct nfs_fattr));
2428         memset(fhandle, 0, sizeof(struct nfs_fh));
2429 out:
2430         if (page)
2431                 __free_page(page);
2432         kfree(locations);
2433         return status;
2434 }
2435
2436 static int _nfs4_proc_getattr(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fattr *fattr)
2437 {
2438         struct nfs4_getattr_arg args = {
2439                 .fh = fhandle,
2440                 .bitmask = server->attr_bitmask,
2441         };
2442         struct nfs4_getattr_res res = {
2443                 .fattr = fattr,
2444                 .server = server,
2445         };
2446         struct rpc_message msg = {
2447                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_GETATTR],
2448                 .rpc_argp = &args,
2449                 .rpc_resp = &res,
2450         };
2451         
2452         nfs_fattr_init(fattr);
2453         return nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
2454 }
2455
2456 static int nfs4_proc_getattr(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fattr *fattr)
2457 {
2458         struct nfs4_exception exception = { };
2459         int err;
2460         do {
2461                 err = nfs4_handle_exception(server,
2462                                 _nfs4_proc_getattr(server, fhandle, fattr),
2463                                 &exception);
2464         } while (exception.retry);
2465         return err;
2466 }
2467
2468 /* 
2469  * The file is not closed if it is opened due to the a request to change
2470  * the size of the file. The open call will not be needed once the
2471  * VFS layer lookup-intents are implemented.
2472  *
2473  * Close is called when the inode is destroyed.
2474  * If we haven't opened the file for O_WRONLY, we
2475  * need to in the size_change case to obtain a stateid.
2476  *
2477  * Got race?
2478  * Because OPEN is always done by name in nfsv4, it is
2479  * possible that we opened a different file by the same
2480  * name.  We can recognize this race condition, but we
2481  * can't do anything about it besides returning an error.
2482  *
2483  * This will be fixed with VFS changes (lookup-intent).
2484  */
2485 static int
2486 nfs4_proc_setattr(struct dentry *dentry, struct nfs_fattr *fattr,
2487                   struct iattr *sattr)
2488 {
2489         struct inode *inode = dentry->d_inode;
2490         struct rpc_cred *cred = NULL;
2491         struct nfs4_state *state = NULL;
2492         int status;
2493
2494         if (pnfs_ld_layoutret_on_setattr(inode))
2495                 pnfs_return_layout(inode);
2496
2497         nfs_fattr_init(fattr);
2498         
2499         /* Search for an existing open(O_WRITE) file */
2500         if (sattr->ia_valid & ATTR_FILE) {
2501                 struct nfs_open_context *ctx;
2502
2503                 ctx = nfs_file_open_context(sattr->ia_file);
2504                 if (ctx) {
2505                         cred = ctx->cred;
2506                         state = ctx->state;
2507                 }
2508         }
2509
2510         /* Deal with open(O_TRUNC) */
2511         if (sattr->ia_valid & ATTR_OPEN)
2512                 sattr->ia_valid &= ~(ATTR_MTIME|ATTR_CTIME|ATTR_OPEN);
2513
2514         status = nfs4_do_setattr(inode, cred, fattr, sattr, state);
2515         if (status == 0)
2516                 nfs_setattr_update_inode(inode, sattr);
2517         return status;
2518 }
2519
2520 static int _nfs4_proc_lookup(struct rpc_clnt *clnt, struct inode *dir,
2521                 const struct qstr *name, struct nfs_fh *fhandle,
2522                 struct nfs_fattr *fattr)
2523 {
2524         struct nfs_server *server = NFS_SERVER(dir);
2525         int                    status;
2526         struct nfs4_lookup_arg args = {
2527                 .bitmask = server->attr_bitmask,
2528                 .dir_fh = NFS_FH(dir),
2529                 .name = name,
2530         };
2531         struct nfs4_lookup_res res = {
2532                 .server = server,
2533                 .fattr = fattr,
2534                 .fh = fhandle,
2535         };
2536         struct rpc_message msg = {
2537                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LOOKUP],
2538                 .rpc_argp = &args,
2539                 .rpc_resp = &res,
2540         };
2541
2542         nfs_fattr_init(fattr);
2543
2544         dprintk("NFS call  lookup %s\n", name->name);
2545         status = nfs4_call_sync(clnt, server, &msg, &args.seq_args, &res.seq_res, 0);
2546         dprintk("NFS reply lookup: %d\n", status);
2547         return status;
2548 }
2549
2550 static void nfs_fixup_secinfo_attributes(struct nfs_fattr *fattr)
2551 {
2552         fattr->valid |= NFS_ATTR_FATTR_TYPE | NFS_ATTR_FATTR_MODE |
2553                 NFS_ATTR_FATTR_NLINK | NFS_ATTR_FATTR_MOUNTPOINT;
2554         fattr->mode = S_IFDIR | S_IRUGO | S_IXUGO;
2555         fattr->nlink = 2;
2556 }
2557
2558 static int nfs4_proc_lookup_common(struct rpc_clnt **clnt, struct inode *dir,
2559                                    struct qstr *name, struct nfs_fh *fhandle,
2560                                    struct nfs_fattr *fattr)
2561 {
2562         struct nfs4_exception exception = { };
2563         struct rpc_clnt *client = *clnt;
2564         int err;
2565         do {
2566                 err = _nfs4_proc_lookup(client, dir, name, fhandle, fattr);
2567                 switch (err) {
2568                 case -NFS4ERR_BADNAME:
2569                         err = -ENOENT;
2570                         goto out;
2571                 case -NFS4ERR_MOVED:
2572                         err = nfs4_get_referral(client, dir, name, fattr, fhandle);
2573                         goto out;
2574                 case -NFS4ERR_WRONGSEC:
2575                         err = -EPERM;
2576                         if (client != *clnt)
2577                                 goto out;
2578
2579                         client = nfs4_create_sec_client(client, dir, name);
2580                         if (IS_ERR(client))
2581                                 return PTR_ERR(client);
2582
2583                         exception.retry = 1;
2584                         break;
2585                 default:
2586                         err = nfs4_handle_exception(NFS_SERVER(dir), err, &exception);
2587                 }
2588         } while (exception.retry);
2589
2590 out:
2591         if (err == 0)
2592                 *clnt = client;
2593         else if (client != *clnt)
2594                 rpc_shutdown_client(client);
2595
2596         return err;
2597 }
2598
2599 static int nfs4_proc_lookup(struct inode *dir, struct qstr *name,
2600                             struct nfs_fh *fhandle, struct nfs_fattr *fattr)
2601 {
2602         int status;
2603         struct rpc_clnt *client = NFS_CLIENT(dir);
2604
2605         status = nfs4_proc_lookup_common(&client, dir, name, fhandle, fattr);
2606         if (client != NFS_CLIENT(dir)) {
2607                 rpc_shutdown_client(client);
2608                 nfs_fixup_secinfo_attributes(fattr);
2609         }
2610         return status;
2611 }
2612
2613 struct rpc_clnt *
2614 nfs4_proc_lookup_mountpoint(struct inode *dir, struct qstr *name,
2615                             struct nfs_fh *fhandle, struct nfs_fattr *fattr)
2616 {
2617         int status;
2618         struct rpc_clnt *client = rpc_clone_client(NFS_CLIENT(dir));
2619
2620         status = nfs4_proc_lookup_common(&client, dir, name, fhandle, fattr);
2621         if (status < 0) {
2622                 rpc_shutdown_client(client);
2623                 return ERR_PTR(status);
2624         }
2625         return client;
2626 }
2627
2628 static int _nfs4_proc_access(struct inode *inode, struct nfs_access_entry *entry)
2629 {
2630         struct nfs_server *server = NFS_SERVER(inode);
2631         struct nfs4_accessargs args = {
2632                 .fh = NFS_FH(inode),
2633                 .bitmask = server->cache_consistency_bitmask,
2634         };
2635         struct nfs4_accessres res = {
2636                 .server = server,
2637         };
2638         struct rpc_message msg = {
2639                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_ACCESS],
2640                 .rpc_argp = &args,
2641                 .rpc_resp = &res,
2642                 .rpc_cred = entry->cred,
2643         };
2644         int mode = entry->mask;
2645         int status;
2646
2647         /*
2648          * Determine which access bits we want to ask for...
2649          */
2650         if (mode & MAY_READ)
2651                 args.access |= NFS4_ACCESS_READ;
2652         if (S_ISDIR(inode->i_mode)) {
2653                 if (mode & MAY_WRITE)
2654                         args.access |= NFS4_ACCESS_MODIFY | NFS4_ACCESS_EXTEND | NFS4_ACCESS_DELETE;
2655                 if (mode & MAY_EXEC)
2656                         args.access |= NFS4_ACCESS_LOOKUP;
2657         } else {
2658                 if (mode & MAY_WRITE)
2659                         args.access |= NFS4_ACCESS_MODIFY | NFS4_ACCESS_EXTEND;
2660                 if (mode & MAY_EXEC)
2661                         args.access |= NFS4_ACCESS_EXECUTE;
2662         }
2663
2664         res.fattr = nfs_alloc_fattr();
2665         if (res.fattr == NULL)
2666                 return -ENOMEM;
2667
2668         status = nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
2669         if (!status) {
2670                 entry->mask = 0;
2671                 if (res.access & NFS4_ACCESS_READ)
2672                         entry->mask |= MAY_READ;
2673                 if (res.access & (NFS4_ACCESS_MODIFY | NFS4_ACCESS_EXTEND | NFS4_ACCESS_DELETE))
2674                         entry->mask |= MAY_WRITE;
2675                 if (res.access & (NFS4_ACCESS_LOOKUP|NFS4_ACCESS_EXECUTE))
2676                         entry->mask |= MAY_EXEC;
2677                 nfs_refresh_inode(inode, res.fattr);
2678         }
2679         nfs_free_fattr(res.fattr);
2680         return status;
2681 }
2682
2683 static int nfs4_proc_access(struct inode *inode, struct nfs_access_entry *entry)
2684 {
2685         struct nfs4_exception exception = { };
2686         int err;
2687         do {
2688                 err = nfs4_handle_exception(NFS_SERVER(inode),
2689                                 _nfs4_proc_access(inode, entry),
2690                                 &exception);
2691         } while (exception.retry);
2692         return err;
2693 }
2694
2695 /*
2696  * TODO: For the time being, we don't try to get any attributes
2697  * along with any of the zero-copy operations READ, READDIR,
2698  * READLINK, WRITE.
2699  *
2700  * In the case of the first three, we want to put the GETATTR
2701  * after the read-type operation -- this is because it is hard
2702  * to predict the length of a GETATTR response in v4, and thus
2703  * align the READ data correctly.  This means that the GETATTR
2704  * may end up partially falling into the page cache, and we should
2705  * shift it into the 'tail' of the xdr_buf before processing.
2706  * To do this efficiently, we need to know the total length
2707  * of data received, which doesn't seem to be available outside
2708  * of the RPC layer.
2709  *
2710  * In the case of WRITE, we also want to put the GETATTR after
2711  * the operation -- in this case because we want to make sure
2712  * we get the post-operation mtime and size.  This means that
2713  * we can't use xdr_encode_pages() as written: we need a variant
2714  * of it which would leave room in the 'tail' iovec.
2715  *
2716  * Both of these changes to the XDR layer would in fact be quite
2717  * minor, but I decided to leave them for a subsequent patch.
2718  */
2719 static int _nfs4_proc_readlink(struct inode *inode, struct page *page,
2720                 unsigned int pgbase, unsigned int pglen)
2721 {
2722         struct nfs4_readlink args = {
2723                 .fh       = NFS_FH(inode),
2724                 .pgbase   = pgbase,
2725                 .pglen    = pglen,
2726                 .pages    = &page,
2727         };
2728         struct nfs4_readlink_res res;
2729         struct rpc_message msg = {
2730                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_READLINK],
2731                 .rpc_argp = &args,
2732                 .rpc_resp = &res,
2733         };
2734
2735         return nfs4_call_sync(NFS_SERVER(inode)->client, NFS_SERVER(inode), &msg, &args.seq_args, &res.seq_res, 0);
2736 }
2737
2738 static int nfs4_proc_readlink(struct inode *inode, struct page *page,
2739                 unsigned int pgbase, unsigned int pglen)
2740 {
2741         struct nfs4_exception exception = { };
2742         int err;
2743         do {
2744                 err = nfs4_handle_exception(NFS_SERVER(inode),
2745                                 _nfs4_proc_readlink(inode, page, pgbase, pglen),
2746                                 &exception);
2747         } while (exception.retry);
2748         return err;
2749 }
2750
2751 /*
2752  * Got race?
2753  * We will need to arrange for the VFS layer to provide an atomic open.
2754  * Until then, this create/open method is prone to inefficiency and race
2755  * conditions due to the lookup, create, and open VFS calls from sys_open()
2756  * placed on the wire.
2757  *
2758  * Given the above sorry state of affairs, I'm simply sending an OPEN.
2759  * The file will be opened again in the subsequent VFS open call
2760  * (nfs4_proc_file_open).
2761  *
2762  * The open for read will just hang around to be used by any process that
2763  * opens the file O_RDONLY. This will all be resolved with the VFS changes.
2764  */
2765
2766 static int
2767 nfs4_proc_create(struct inode *dir, struct dentry *dentry, struct iattr *sattr,
2768                  int flags, struct nfs_open_context *ctx)
2769 {
2770         struct dentry *de = dentry;
2771         struct nfs4_state *state;
2772         struct rpc_cred *cred = NULL;
2773         fmode_t fmode = 0;
2774         int status = 0;
2775
2776         if (ctx != NULL) {
2777                 cred = ctx->cred;
2778                 de = ctx->dentry;
2779                 fmode = ctx->mode;
2780         }
2781         sattr->ia_mode &= ~current_umask();
2782         state = nfs4_do_open(dir, de, fmode, flags, sattr, cred);
2783         d_drop(dentry);
2784         if (IS_ERR(state)) {
2785                 status = PTR_ERR(state);
2786                 goto out;
2787         }
2788         d_add(dentry, igrab(state->inode));
2789         nfs_set_verifier(dentry, nfs_save_change_attribute(dir));
2790         if (ctx != NULL)
2791                 ctx->state = state;
2792         else
2793                 nfs4_close_sync(state, fmode);
2794 out:
2795         return status;
2796 }
2797
2798 static int _nfs4_proc_remove(struct inode *dir, struct qstr *name)
2799 {
2800         struct nfs_server *server = NFS_SERVER(dir);
2801         struct nfs_removeargs args = {
2802                 .fh = NFS_FH(dir),
2803                 .name.len = name->len,
2804                 .name.name = name->name,
2805         };
2806         struct nfs_removeres res = {
2807                 .server = server,
2808         };
2809         struct rpc_message msg = {
2810                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_REMOVE],
2811                 .rpc_argp = &args,
2812                 .rpc_resp = &res,
2813         };
2814         int status;
2815
2816         status = nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 1);
2817         if (status == 0)
2818                 update_changeattr(dir, &res.cinfo);
2819         return status;
2820 }
2821
2822 static int nfs4_proc_remove(struct inode *dir, struct qstr *name)
2823 {
2824         struct nfs4_exception exception = { };
2825         int err;
2826         do {
2827                 err = nfs4_handle_exception(NFS_SERVER(dir),
2828                                 _nfs4_proc_remove(dir, name),
2829                                 &exception);
2830         } while (exception.retry);
2831         return err;
2832 }
2833
2834 static void nfs4_proc_unlink_setup(struct rpc_message *msg, struct inode *dir)
2835 {
2836         struct nfs_server *server = NFS_SERVER(dir);
2837         struct nfs_removeargs *args = msg->rpc_argp;
2838         struct nfs_removeres *res = msg->rpc_resp;
2839
2840         res->server = server;
2841         msg->rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_REMOVE];
2842         nfs41_init_sequence(&args->seq_args, &res->seq_res, 1);
2843 }
2844
2845 static void nfs4_proc_unlink_rpc_prepare(struct rpc_task *task, struct nfs_unlinkdata *data)
2846 {
2847         if (nfs4_setup_sequence(NFS_SERVER(data->dir),
2848                                 &data->args.seq_args,
2849                                 &data->res.seq_res,
2850                                 task))
2851                 return;
2852         rpc_call_start(task);
2853 }
2854
2855 static int nfs4_proc_unlink_done(struct rpc_task *task, struct inode *dir)
2856 {
2857         struct nfs_removeres *res = task->tk_msg.rpc_resp;
2858
2859         if (!nfs4_sequence_done(task, &res->seq_res))
2860                 return 0;
2861         if (nfs4_async_handle_error(task, res->server, NULL) == -EAGAIN)
2862                 return 0;
2863         update_changeattr(dir, &res->cinfo);
2864         return 1;
2865 }
2866
2867 static void nfs4_proc_rename_setup(struct rpc_message *msg, struct inode *dir)
2868 {
2869         struct nfs_server *server = NFS_SERVER(dir);
2870         struct nfs_renameargs *arg = msg->rpc_argp;
2871         struct nfs_renameres *res = msg->rpc_resp;
2872
2873         msg->rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_RENAME];
2874         res->server = server;
2875         nfs41_init_sequence(&arg->seq_args, &res->seq_res, 1);
2876 }
2877
2878 static void nfs4_proc_rename_rpc_prepare(struct rpc_task *task, struct nfs_renamedata *data)
2879 {
2880         if (nfs4_setup_sequence(NFS_SERVER(data->old_dir),
2881                                 &data->args.seq_args,
2882                                 &data->res.seq_res,
2883                                 task))
2884                 return;
2885         rpc_call_start(task);
2886 }
2887
2888 static int nfs4_proc_rename_done(struct rpc_task *task, struct inode *old_dir,
2889                                  struct inode *new_dir)
2890 {
2891         struct nfs_renameres *res = task->tk_msg.rpc_resp;
2892
2893         if (!nfs4_sequence_done(task, &res->seq_res))
2894                 return 0;
2895         if (nfs4_async_handle_error(task, res->server, NULL) == -EAGAIN)
2896                 return 0;
2897
2898         update_changeattr(old_dir, &res->old_cinfo);
2899         update_changeattr(new_dir, &res->new_cinfo);
2900         return 1;
2901 }
2902
2903 static int _nfs4_proc_rename(struct inode *old_dir, struct qstr *old_name,
2904                 struct inode *new_dir, struct qstr *new_name)
2905 {
2906         struct nfs_server *server = NFS_SERVER(old_dir);
2907         struct nfs_renameargs arg = {
2908                 .old_dir = NFS_FH(old_dir),
2909                 .new_dir = NFS_FH(new_dir),
2910                 .old_name = old_name,
2911                 .new_name = new_name,
2912         };
2913         struct nfs_renameres res = {
2914                 .server = server,
2915         };
2916         struct rpc_message msg = {
2917                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_RENAME],
2918                 .rpc_argp = &arg,
2919                 .rpc_resp = &res,
2920         };
2921         int status = -ENOMEM;
2922         
2923         status = nfs4_call_sync(server->client, server, &msg, &arg.seq_args, &res.seq_res, 1);
2924         if (!status) {
2925                 update_changeattr(old_dir, &res.old_cinfo);
2926                 update_changeattr(new_dir, &res.new_cinfo);
2927         }
2928         return status;
2929 }
2930
2931 static int nfs4_proc_rename(struct inode *old_dir, struct qstr *old_name,
2932                 struct inode *new_dir, struct qstr *new_name)
2933 {
2934         struct nfs4_exception exception = { };
2935         int err;
2936         do {
2937                 err = nfs4_handle_exception(NFS_SERVER(old_dir),
2938                                 _nfs4_proc_rename(old_dir, old_name,
2939                                         new_dir, new_name),
2940                                 &exception);
2941         } while (exception.retry);
2942         return err;
2943 }
2944
2945 static int _nfs4_proc_link(struct inode *inode, struct inode *dir, struct qstr *name)
2946 {
2947         struct nfs_server *server = NFS_SERVER(inode);
2948         struct nfs4_link_arg arg = {
2949                 .fh     = NFS_FH(inode),
2950                 .dir_fh = NFS_FH(dir),
2951                 .name   = name,
2952                 .bitmask = server->attr_bitmask,
2953         };
2954         struct nfs4_link_res res = {
2955                 .server = server,
2956         };
2957         struct rpc_message msg = {
2958                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LINK],
2959                 .rpc_argp = &arg,
2960                 .rpc_resp = &res,
2961         };
2962         int status = -ENOMEM;
2963
2964         res.fattr = nfs_alloc_fattr();
2965         if (res.fattr == NULL)
2966                 goto out;
2967
2968         status = nfs4_call_sync(server->client, server, &msg, &arg.seq_args, &res.seq_res, 1);
2969         if (!status) {
2970                 update_changeattr(dir, &res.cinfo);
2971                 nfs_post_op_update_inode(inode, res.fattr);
2972         }
2973 out:
2974         nfs_free_fattr(res.fattr);
2975         return status;
2976 }
2977
2978 static int nfs4_proc_link(struct inode *inode, struct inode *dir, struct qstr *name)
2979 {
2980         struct nfs4_exception exception = { };
2981         int err;
2982         do {
2983                 err = nfs4_handle_exception(NFS_SERVER(inode),
2984                                 _nfs4_proc_link(inode, dir, name),
2985                                 &exception);
2986         } while (exception.retry);
2987         return err;
2988 }
2989
2990 struct nfs4_createdata {
2991         struct rpc_message msg;
2992         struct nfs4_create_arg arg;
2993         struct nfs4_create_res res;
2994         struct nfs_fh fh;
2995         struct nfs_fattr fattr;
2996 };
2997
2998 static struct nfs4_createdata *nfs4_alloc_createdata(struct inode *dir,
2999                 struct qstr *name, struct iattr *sattr, u32 ftype)
3000 {
3001         struct nfs4_createdata *data;
3002
3003         data = kzalloc(sizeof(*data), GFP_KERNEL);
3004         if (data != NULL) {
3005                 struct nfs_server *server = NFS_SERVER(dir);
3006
3007                 data->msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_CREATE];
3008                 data->msg.rpc_argp = &data->arg;
3009                 data->msg.rpc_resp = &data->res;
3010                 data->arg.dir_fh = NFS_FH(dir);
3011                 data->arg.server = server;
3012                 data->arg.name = name;
3013                 data->arg.attrs = sattr;
3014                 data->arg.ftype = ftype;
3015                 data->arg.bitmask = server->attr_bitmask;
3016                 data->res.server = server;
3017                 data->res.fh = &data->fh;
3018                 data->res.fattr = &data->fattr;
3019                 nfs_fattr_init(data->res.fattr);
3020         }
3021         return data;
3022 }
3023
3024 static int nfs4_do_create(struct inode *dir, struct dentry *dentry, struct nfs4_createdata *data)
3025 {
3026         int status = nfs4_call_sync(NFS_SERVER(dir)->client, NFS_SERVER(dir), &data->msg,
3027                                     &data->arg.seq_args, &data->res.seq_res, 1);
3028         if (status == 0) {
3029                 update_changeattr(dir, &data->res.dir_cinfo);
3030                 status = nfs_instantiate(dentry, data->res.fh, data->res.fattr);
3031         }
3032         return status;
3033 }
3034
3035 static void nfs4_free_createdata(struct nfs4_createdata *data)
3036 {
3037         kfree(data);
3038 }
3039
3040 static int _nfs4_proc_symlink(struct inode *dir, struct dentry *dentry,
3041                 struct page *page, unsigned int len, struct iattr *sattr)
3042 {
3043         struct nfs4_createdata *data;
3044         int status = -ENAMETOOLONG;
3045
3046         if (len > NFS4_MAXPATHLEN)
3047                 goto out;
3048
3049         status = -ENOMEM;
3050         data = nfs4_alloc_createdata(dir, &dentry->d_name, sattr, NF4LNK);
3051         if (data == NULL)
3052                 goto out;
3053
3054         data->msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SYMLINK];
3055         data->arg.u.symlink.pages = &page;
3056         data->arg.u.symlink.len = len;
3057         
3058         status = nfs4_do_create(dir, dentry, data);
3059
3060         nfs4_free_createdata(data);
3061 out:
3062         return status;
3063 }
3064
3065 static int nfs4_proc_symlink(struct inode *dir, struct dentry *dentry,
3066                 struct page *page, unsigned int len, struct iattr *sattr)
3067 {
3068         struct nfs4_exception exception = { };
3069         int err;
3070         do {
3071                 err = nfs4_handle_exception(NFS_SERVER(dir),
3072                                 _nfs4_proc_symlink(dir, dentry, page,
3073                                                         len, sattr),
3074                                 &exception);
3075         } while (exception.retry);
3076         return err;
3077 }
3078
3079 static int _nfs4_proc_mkdir(struct inode *dir, struct dentry *dentry,
3080                 struct iattr *sattr)
3081 {
3082         struct nfs4_createdata *data;
3083         int status = -ENOMEM;
3084
3085         data = nfs4_alloc_createdata(dir, &dentry->d_name, sattr, NF4DIR);
3086         if (data == NULL)
3087                 goto out;
3088
3089         status = nfs4_do_create(dir, dentry, data);
3090
3091         nfs4_free_createdata(data);
3092 out:
3093         return status;
3094 }
3095
3096 static int nfs4_proc_mkdir(struct inode *dir, struct dentry *dentry,
3097                 struct iattr *sattr)
3098 {
3099         struct nfs4_exception exception = { };
3100         int err;
3101
3102         sattr->ia_mode &= ~current_umask();
3103         do {
3104                 err = nfs4_handle_exception(NFS_SERVER(dir),
3105                                 _nfs4_proc_mkdir(dir, dentry, sattr),
3106                                 &exception);
3107         } while (exception.retry);
3108         return err;
3109 }
3110
3111 static int _nfs4_proc_readdir(struct dentry *dentry, struct rpc_cred *cred,
3112                 u64 cookie, struct page **pages, unsigned int count, int plus)
3113 {
3114         struct inode            *dir = dentry->d_inode;
3115         struct nfs4_readdir_arg args = {
3116                 .fh = NFS_FH(dir),
3117                 .pages = pages,
3118                 .pgbase = 0,
3119                 .count = count,
3120                 .bitmask = NFS_SERVER(dentry->d_inode)->attr_bitmask,
3121                 .plus = plus,
3122         };
3123         struct nfs4_readdir_res res;
3124         struct rpc_message msg = {
3125                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_READDIR],
3126                 .rpc_argp = &args,
3127                 .rpc_resp = &res,
3128                 .rpc_cred = cred,
3129         };
3130         int                     status;
3131
3132         dprintk("%s: dentry = %s/%s, cookie = %Lu\n", __func__,
3133                         dentry->d_parent->d_name.name,
3134                         dentry->d_name.name,
3135                         (unsigned long long)cookie);
3136         nfs4_setup_readdir(cookie, NFS_COOKIEVERF(dir), dentry, &args);
3137         res.pgbase = args.pgbase;
3138         status = nfs4_call_sync(NFS_SERVER(dir)->client, NFS_SERVER(dir), &msg, &args.seq_args, &res.seq_res, 0);
3139         if (status >= 0) {
3140                 memcpy(NFS_COOKIEVERF(dir), res.verifier.data, NFS4_VERIFIER_SIZE);
3141                 status += args.pgbase;
3142         }
3143
3144         nfs_invalidate_atime(dir);
3145
3146         dprintk("%s: returns %d\n", __func__, status);
3147         return status;
3148 }
3149
3150 static int nfs4_proc_readdir(struct dentry *dentry, struct rpc_cred *cred,
3151                 u64 cookie, struct page **pages, unsigned int count, int plus)
3152 {
3153         struct nfs4_exception exception = { };
3154         int err;
3155         do {
3156                 err = nfs4_handle_exception(NFS_SERVER(dentry->d_inode),
3157                                 _nfs4_proc_readdir(dentry, cred, cookie,
3158                                         pages, count, plus),
3159                                 &exception);
3160         } while (exception.retry);
3161         return err;
3162 }
3163
3164 static int _nfs4_proc_mknod(struct inode *dir, struct dentry *dentry,
3165                 struct iattr *sattr, dev_t rdev)
3166 {
3167         struct nfs4_createdata *data;
3168         int mode = sattr->ia_mode;
3169         int status = -ENOMEM;
3170
3171         BUG_ON(!(sattr->ia_valid & ATTR_MODE));
3172         BUG_ON(!S_ISFIFO(mode) && !S_ISBLK(mode) && !S_ISCHR(mode) && !S_ISSOCK(mode));
3173
3174         data = nfs4_alloc_createdata(dir, &dentry->d_name, sattr, NF4SOCK);
3175         if (data == NULL)
3176                 goto out;
3177
3178         if (S_ISFIFO(mode))
3179                 data->arg.ftype = NF4FIFO;
3180         else if (S_ISBLK(mode)) {
3181                 data->arg.ftype = NF4BLK;
3182                 data->arg.u.device.specdata1 = MAJOR(rdev);
3183                 data->arg.u.device.specdata2 = MINOR(rdev);
3184         }
3185         else if (S_ISCHR(mode)) {
3186                 data->arg.ftype = NF4CHR;
3187                 data->arg.u.device.specdata1 = MAJOR(rdev);
3188                 data->arg.u.device.specdata2 = MINOR(rdev);
3189         }
3190         
3191         status = nfs4_do_create(dir, dentry, data);
3192
3193         nfs4_free_createdata(data);
3194 out:
3195         return status;
3196 }
3197
3198 static int nfs4_proc_mknod(struct inode *dir, struct dentry *dentry,
3199                 struct iattr *sattr, dev_t rdev)
3200 {
3201         struct nfs4_exception exception = { };
3202         int err;
3203
3204         sattr->ia_mode &= ~current_umask();
3205         do {
3206                 err = nfs4_handle_exception(NFS_SERVER(dir),
3207                                 _nfs4_proc_mknod(dir, dentry, sattr, rdev),
3208                                 &exception);
3209         } while (exception.retry);
3210         return err;
3211 }
3212
3213 static int _nfs4_proc_statfs(struct nfs_server *server, struct nfs_fh *fhandle,
3214                  struct nfs_fsstat *fsstat)
3215 {
3216         struct nfs4_statfs_arg args = {
3217                 .fh = fhandle,
3218                 .bitmask = server->attr_bitmask,
3219         };
3220         struct nfs4_statfs_res res = {
3221                 .fsstat = fsstat,
3222         };
3223         struct rpc_message msg = {
3224                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_STATFS],
3225                 .rpc_argp = &args,
3226                 .rpc_resp = &res,
3227         };
3228
3229         nfs_fattr_init(fsstat->fattr);
3230         return  nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
3231 }
3232
3233 static int nfs4_proc_statfs(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fsstat *fsstat)
3234 {
3235         struct nfs4_exception exception = { };
3236         int err;
3237         do {
3238                 err = nfs4_handle_exception(server,
3239                                 _nfs4_proc_statfs(server, fhandle, fsstat),
3240                                 &exception);
3241         } while (exception.retry);
3242         return err;
3243 }
3244
3245 static int _nfs4_do_fsinfo(struct nfs_server *server, struct nfs_fh *fhandle,
3246                 struct nfs_fsinfo *fsinfo)
3247 {
3248         struct nfs4_fsinfo_arg args = {
3249                 .fh = fhandle,
3250                 .bitmask = server->attr_bitmask,
3251         };
3252         struct nfs4_fsinfo_res res = {
3253                 .fsinfo = fsinfo,
3254         };
3255         struct rpc_message msg = {
3256                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_FSINFO],
3257                 .rpc_argp = &args,
3258                 .rpc_resp = &res,
3259         };
3260
3261         return nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
3262 }
3263
3264 static int nfs4_do_fsinfo(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fsinfo *fsinfo)
3265 {
3266         struct nfs4_exception exception = { };
3267         int err;
3268
3269         do {
3270                 err = nfs4_handle_exception(server,
3271                                 _nfs4_do_fsinfo(server, fhandle, fsinfo),
3272                                 &exception);
3273         } while (exception.retry);
3274         return err;
3275 }
3276
3277 static int nfs4_proc_fsinfo(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fsinfo *fsinfo)
3278 {
3279         nfs_fattr_init(fsinfo->fattr);
3280         return nfs4_do_fsinfo(server, fhandle, fsinfo);
3281 }
3282
3283 static int _nfs4_proc_pathconf(struct nfs_server *server, struct nfs_fh *fhandle,
3284                 struct nfs_pathconf *pathconf)
3285 {
3286         struct nfs4_pathconf_arg args = {
3287                 .fh = fhandle,
3288                 .bitmask = server->attr_bitmask,
3289         };
3290         struct nfs4_pathconf_res res = {
3291                 .pathconf = pathconf,
3292         };
3293         struct rpc_message msg = {
3294                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_PATHCONF],
3295                 .rpc_argp = &args,
3296                 .rpc_resp = &res,
3297         };
3298
3299         /* None of the pathconf attributes are mandatory to implement */
3300         if ((args.bitmask[0] & nfs4_pathconf_bitmap[0]) == 0) {
3301                 memset(pathconf, 0, sizeof(*pathconf));
3302                 return 0;
3303         }
3304
3305         nfs_fattr_init(pathconf->fattr);
3306         return nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
3307 }
3308
3309 static int nfs4_proc_pathconf(struct nfs_server *server, struct nfs_fh *fhandle,
3310                 struct nfs_pathconf *pathconf)
3311 {
3312         struct nfs4_exception exception = { };
3313         int err;
3314
3315         do {
3316                 err = nfs4_handle_exception(server,
3317                                 _nfs4_proc_pathconf(server, fhandle, pathconf),
3318                                 &exception);
3319         } while (exception.retry);
3320         return err;
3321 }
3322
3323 void __nfs4_read_done_cb(struct nfs_read_data *data)
3324 {
3325         nfs_invalidate_atime(data->header->inode);
3326 }
3327
3328 static int nfs4_read_done_cb(struct rpc_task *task, struct nfs_read_data *data)
3329 {
3330         struct nfs_server *server = NFS_SERVER(data->header->inode);
3331
3332         if (nfs4_async_handle_error(task, server, data->args.context->state) == -EAGAIN) {
3333                 rpc_restart_call_prepare(task);
3334                 return -EAGAIN;
3335         }
3336
3337         __nfs4_read_done_cb(data);
3338         if (task->tk_status > 0)
3339                 renew_lease(server, data->timestamp);
3340         return 0;
3341 }
3342
3343 static int nfs4_read_done(struct rpc_task *task, struct nfs_read_data *data)
3344 {
3345
3346         dprintk("--> %s\n", __func__);
3347
3348         if (!nfs4_sequence_done(task, &data->res.seq_res))
3349                 return -EAGAIN;
3350
3351         return data->read_done_cb ? data->read_done_cb(task, data) :
3352                                     nfs4_read_done_cb(task, data);
3353 }
3354
3355 static void nfs4_proc_read_setup(struct nfs_read_data *data, struct rpc_message *msg)
3356 {
3357         data->timestamp   = jiffies;
3358         data->read_done_cb = nfs4_read_done_cb;
3359         msg->rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_READ];
3360         nfs41_init_sequence(&data->args.seq_args, &data->res.seq_res, 0);
3361 }
3362
3363 static void nfs4_proc_read_rpc_prepare(struct rpc_task *task, struct nfs_read_data *data)
3364 {
3365         if (nfs4_setup_sequence(NFS_SERVER(data->header->inode),
3366                                 &data->args.seq_args,
3367                                 &data->res.seq_res,
3368                                 task))
3369                 return;
3370         rpc_call_start(task);
3371 }
3372
3373 static int nfs4_write_done_cb(struct rpc_task *task, struct nfs_write_data *data)
3374 {
3375         struct inode *inode = data->header->inode;
3376         
3377         if (nfs4_async_handle_error(task, NFS_SERVER(inode), data->args.context->state) == -EAGAIN) {
3378                 rpc_restart_call_prepare(task);
3379                 return -EAGAIN;
3380         }
3381         if (task->tk_status >= 0) {
3382                 renew_lease(NFS_SERVER(inode), data->timestamp);
3383                 nfs_post_op_update_inode_force_wcc(inode, &data->fattr);
3384         }
3385         return 0;
3386 }
3387
3388 static int nfs4_write_done(struct rpc_task *task, struct nfs_write_data *data)
3389 {
3390         if (!nfs4_sequence_done(task, &data->res.seq_res))
3391                 return -EAGAIN;
3392         return data->write_done_cb ? data->write_done_cb(task, data) :
3393                 nfs4_write_done_cb(task, data);
3394 }
3395
3396 static
3397 bool nfs4_write_need_cache_consistency_data(const struct nfs_write_data *data)
3398 {
3399         const struct nfs_pgio_header *hdr = data->header;
3400
3401         /* Don't request attributes for pNFS or O_DIRECT writes */
3402         if (data->ds_clp != NULL || hdr->dreq != NULL)
3403                 return false;
3404         /* Otherwise, request attributes if and only if we don't hold
3405          * a delegation
3406          */
3407         return nfs_have_delegation(hdr->inode, FMODE_READ) == 0;
3408 }
3409
3410 static void nfs4_proc_write_setup(struct nfs_write_data *data, struct rpc_message *msg)
3411 {
3412         struct nfs_server *server = NFS_SERVER(data->header->inode);
3413
3414         if (!nfs4_write_need_cache_consistency_data(data)) {
3415                 data->args.bitmask = NULL;
3416                 data->res.fattr = NULL;
3417         } else
3418                 data->args.bitmask = server->cache_consistency_bitmask;
3419
3420         if (!data->write_done_cb)
3421                 data->write_done_cb = nfs4_write_done_cb;
3422         data->res.server = server;
3423         data->timestamp   = jiffies;
3424
3425         msg->rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_WRITE];
3426         nfs41_init_sequence(&data->args.seq_args, &data->res.seq_res, 1);
3427 }
3428
3429 static void nfs4_proc_write_rpc_prepare(struct rpc_task *task, struct nfs_write_data *data)
3430 {
3431         if (nfs4_setup_sequence(NFS_SERVER(data->header->inode),
3432                                 &data->args.seq_args,
3433                                 &data->res.seq_res,
3434                                 task))
3435                 return;
3436         rpc_call_start(task);
3437 }
3438
3439 static void nfs4_proc_commit_rpc_prepare(struct rpc_task *task, struct nfs_commit_data *data)
3440 {
3441         if (nfs4_setup_sequence(NFS_SERVER(data->inode),
3442                                 &data->args.seq_args,
3443                                 &data->res.seq_res,
3444                                 task))
3445                 return;
3446         rpc_call_start(task);
3447 }
3448
3449 static int nfs4_commit_done_cb(struct rpc_task *task, struct nfs_commit_data *data)
3450 {
3451         struct inode *inode = data->inode;
3452
3453         if (nfs4_async_handle_error(task, NFS_SERVER(inode), NULL) == -EAGAIN) {
3454                 rpc_restart_call_prepare(task);
3455                 return -EAGAIN;
3456         }
3457         return 0;
3458 }
3459
3460 static int nfs4_commit_done(struct rpc_task *task, struct nfs_commit_data *data)
3461 {
3462         if (!nfs4_sequence_done(task, &data->res.seq_res))
3463                 return -EAGAIN;
3464         return data->commit_done_cb(task, data);
3465 }
3466
3467 static void nfs4_proc_commit_setup(struct nfs_commit_data *data, struct rpc_message *msg)
3468 {
3469         struct nfs_server *server = NFS_SERVER(data->inode);
3470
3471         if (data->commit_done_cb == NULL)
3472                 data->commit_done_cb = nfs4_commit_done_cb;
3473         data->res.server = server;
3474         msg->rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_COMMIT];
3475         nfs41_init_sequence(&data->args.seq_args, &data->res.seq_res, 1);
3476 }
3477
3478 struct nfs4_renewdata {
3479         struct nfs_client       *client;
3480         unsigned long           timestamp;
3481 };
3482
3483 /*
3484  * nfs4_proc_async_renew(): This is not one of the nfs_rpc_ops; it is a special
3485  * standalone procedure for queueing an asynchronous RENEW.
3486  */
3487 static void nfs4_renew_release(void *calldata)
3488 {
3489         struct nfs4_renewdata *data = calldata;
3490         struct nfs_client *clp = data->client;
3491
3492         if (atomic_read(&clp->cl_count) > 1)
3493                 nfs4_schedule_state_renewal(clp);
3494         nfs_put_client(clp);
3495         kfree(data);
3496 }
3497
3498 static void nfs4_renew_done(struct rpc_task *task, void *calldata)
3499 {
3500         struct nfs4_renewdata *data = calldata;
3501         struct nfs_client *clp = data->client;
3502         unsigned long timestamp = data->timestamp;
3503
3504         if (task->tk_status < 0) {
3505                 /* Unless we're shutting down, schedule state recovery! */
3506                 if (test_bit(NFS_CS_RENEWD, &clp->cl_res_state) == 0)
3507                         return;
3508                 if (task->tk_status != NFS4ERR_CB_PATH_DOWN) {
3509                         nfs4_schedule_lease_recovery(clp);
3510                         return;
3511                 }
3512                 nfs4_schedule_path_down_recovery(clp);
3513         }
3514         do_renew_lease(clp, timestamp);
3515 }
3516
3517 static const struct rpc_call_ops nfs4_renew_ops = {
3518         .rpc_call_done = nfs4_renew_done,
3519         .rpc_release = nfs4_renew_release,
3520 };
3521
3522 static int nfs4_proc_async_renew(struct nfs_client *clp, struct rpc_cred *cred, unsigned renew_flags)
3523 {
3524         struct rpc_message msg = {
3525                 .rpc_proc       = &nfs4_procedures[NFSPROC4_CLNT_RENEW],
3526                 .rpc_argp       = clp,
3527                 .rpc_cred       = cred,
3528         };
3529         struct nfs4_renewdata *data;
3530
3531         if (renew_flags == 0)
3532                 return 0;
3533         if (!atomic_inc_not_zero(&clp->cl_count))
3534                 return -EIO;
3535         data = kmalloc(sizeof(*data), GFP_NOFS);
3536         if (data == NULL)
3537                 return -ENOMEM;
3538         data->client = clp;
3539         data->timestamp = jiffies;
3540         return rpc_call_async(clp->cl_rpcclient, &msg, RPC_TASK_SOFT,
3541                         &nfs4_renew_ops, data);
3542 }
3543
3544 static int nfs4_proc_renew(struct nfs_client *clp, struct rpc_cred *cred)
3545 {
3546         struct rpc_message msg = {
3547                 .rpc_proc       = &nfs4_procedures[NFSPROC4_CLNT_RENEW],
3548                 .rpc_argp       = clp,
3549                 .rpc_cred       = cred,
3550         };
3551         unsigned long now = jiffies;
3552         int status;
3553
3554         status = rpc_call_sync(clp->cl_rpcclient, &msg, 0);
3555         if (status < 0)
3556                 return status;
3557         do_renew_lease(clp, now);
3558         return 0;
3559 }
3560
3561 static inline int nfs4_server_supports_acls(struct nfs_server *server)
3562 {
3563         return (server->caps & NFS_CAP_ACLS)
3564                 && (server->acl_bitmask & ACL4_SUPPORT_ALLOW_ACL)
3565                 && (server->acl_bitmask & ACL4_SUPPORT_DENY_ACL);
3566 }
3567
3568 /* Assuming that XATTR_SIZE_MAX is a multiple of PAGE_CACHE_SIZE, and that
3569  * it's OK to put sizeof(void) * (XATTR_SIZE_MAX/PAGE_CACHE_SIZE) bytes on
3570  * the stack.
3571  */
3572 #define NFS4ACL_MAXPAGES (XATTR_SIZE_MAX >> PAGE_CACHE_SHIFT)
3573
3574 static int buf_to_pages_noslab(const void *buf, size_t buflen,
3575                 struct page **pages, unsigned int *pgbase)
3576 {
3577         struct page *newpage, **spages;
3578         int rc = 0;
3579         size_t len;
3580         spages = pages;
3581
3582         do {
3583                 len = min_t(size_t, PAGE_CACHE_SIZE, buflen);
3584                 newpage = alloc_page(GFP_KERNEL);
3585
3586                 if (newpage == NULL)
3587                         goto unwind;
3588                 memcpy(page_address(newpage), buf, len);
3589                 buf += len;
3590                 buflen -= len;
3591                 *pages++ = newpage;
3592                 rc++;
3593         } while (buflen != 0);
3594
3595         return rc;
3596
3597 unwind:
3598         for(; rc > 0; rc--)
3599                 __free_page(spages[rc-1]);
3600         return -ENOMEM;
3601 }
3602
3603 struct nfs4_cached_acl {
3604         int cached;
3605         size_t len;
3606         char data[0];
3607 };
3608
3609 static void nfs4_set_cached_acl(struct inode *inode, struct nfs4_cached_acl *acl)
3610 {
3611         struct nfs_inode *nfsi = NFS_I(inode);
3612
3613         spin_lock(&inode->i_lock);
3614         kfree(nfsi->nfs4_acl);
3615         nfsi->nfs4_acl = acl;
3616         spin_unlock(&inode->i_lock);
3617 }
3618
3619 static void nfs4_zap_acl_attr(struct inode *inode)
3620 {
3621         nfs4_set_cached_acl(inode, NULL);
3622 }
3623
3624 static inline ssize_t nfs4_read_cached_acl(struct inode *inode, char *buf, size_t buflen)
3625 {
3626         struct nfs_inode *nfsi = NFS_I(inode);
3627         struct nfs4_cached_acl *acl;
3628         int ret = -ENOENT;
3629
3630         spin_lock(&inode->i_lock);
3631         acl = nfsi->nfs4_acl;
3632         if (acl == NULL)
3633                 goto out;
3634         if (buf == NULL) /* user is just asking for length */
3635                 goto out_len;
3636         if (acl->cached == 0)
3637                 goto out;
3638         ret = -ERANGE; /* see getxattr(2) man page */
3639         if (acl->len > buflen)
3640                 goto out;
3641         memcpy(buf, acl->data, acl->len);
3642 out_len:
3643         ret = acl->len;
3644 out:
3645         spin_unlock(&inode->i_lock);
3646         return ret;
3647 }
3648
3649 static void nfs4_write_cached_acl(struct inode *inode, struct page **pages, size_t pgbase, size_t acl_len)
3650 {
3651         struct nfs4_cached_acl *acl;
3652
3653         if (pages && acl_len <= PAGE_SIZE) {
3654                 acl = kmalloc(sizeof(*acl) + acl_len, GFP_KERNEL);
3655                 if (acl == NULL)
3656                         goto out;
3657                 acl->cached = 1;
3658                 _copy_from_pages(acl->data, pages, pgbase, acl_len);
3659         } else {
3660                 acl = kmalloc(sizeof(*acl), GFP_KERNEL);
3661                 if (acl == NULL)
3662                         goto out;
3663                 acl->cached = 0;
3664         }
3665         acl->len = acl_len;
3666 out:
3667         nfs4_set_cached_acl(inode, acl);
3668 }
3669
3670 /*
3671  * The getxattr API returns the required buffer length when called with a
3672  * NULL buf. The NFSv4 acl tool then calls getxattr again after allocating
3673  * the required buf.  On a NULL buf, we send a page of data to the server
3674  * guessing that the ACL request can be serviced by a page. If so, we cache
3675  * up to the page of ACL data, and the 2nd call to getxattr is serviced by
3676  * the cache. If not so, we throw away the page, and cache the required
3677  * length. The next getxattr call will then produce another round trip to
3678  * the server, this time with the input buf of the required size.
3679  */
3680 static ssize_t __nfs4_get_acl_uncached(struct inode *inode, void *buf, size_t buflen)
3681 {
3682         struct page *pages[NFS4ACL_MAXPAGES] = {NULL, };
3683         struct nfs_getaclargs args = {
3684                 .fh = NFS_FH(inode),
3685                 .acl_pages = pages,
3686                 .acl_len = buflen,
3687         };
3688         struct nfs_getaclres res = {
3689                 .acl_len = buflen,
3690         };
3691         struct rpc_message msg = {
3692                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_GETACL],
3693                 .rpc_argp = &args,
3694                 .rpc_resp = &res,
3695         };
3696         int ret = -ENOMEM, npages, i, acl_len = 0;
3697
3698         npages = (buflen + PAGE_SIZE - 1) >> PAGE_SHIFT;
3699         /* As long as we're doing a round trip to the server anyway,
3700          * let's be prepared for a page of acl data. */
3701         if (npages == 0)
3702                 npages = 1;
3703
3704         /* Add an extra page to handle the bitmap returned */
3705         npages++;
3706
3707         for (i = 0; i < npages; i++) {
3708                 pages[i] = alloc_page(GFP_KERNEL);
3709                 if (!pages[i])
3710                         goto out_free;
3711         }
3712
3713         /* for decoding across pages */
3714         res.acl_scratch = alloc_page(GFP_KERNEL);
3715         if (!res.acl_scratch)
3716                 goto out_free;
3717
3718         args.acl_len = npages * PAGE_SIZE;
3719         args.acl_pgbase = 0;
3720
3721         /* Let decode_getfacl know not to fail if the ACL data is larger than
3722          * the page we send as a guess */
3723         if (buf == NULL)
3724                 res.acl_flags |= NFS4_ACL_LEN_REQUEST;
3725
3726         dprintk("%s  buf %p buflen %zu npages %d args.acl_len %zu\n",
3727                 __func__, buf, buflen, npages, args.acl_len);
3728         ret = nfs4_call_sync(NFS_SERVER(inode)->client, NFS_SERVER(inode),
3729                              &msg, &args.seq_args, &res.seq_res, 0);
3730         if (ret)
3731                 goto out_free;
3732
3733         acl_len = res.acl_len - res.acl_data_offset;
3734         if (acl_len > args.acl_len)
3735                 nfs4_write_cached_acl(inode, NULL, 0, acl_len);
3736         else
3737                 nfs4_write_cached_acl(inode, pages, res.acl_data_offset,
3738                                       acl_len);
3739         if (buf) {
3740                 ret = -ERANGE;
3741                 if (acl_len > buflen)
3742                         goto out_free;
3743                 _copy_from_pages(buf, pages, res.acl_data_offset,
3744                                 acl_len);
3745         }
3746         ret = acl_len;
3747 out_free:
3748         for (i = 0; i < npages; i++)
3749                 if (pages[i])
3750                         __free_page(pages[i]);
3751         if (res.acl_scratch)
3752                 __free_page(res.acl_scratch);
3753         return ret;
3754 }
3755
3756 static ssize_t nfs4_get_acl_uncached(struct inode *inode, void *buf, size_t buflen)
3757 {
3758         struct nfs4_exception exception = { };
3759         ssize_t ret;
3760         do {
3761                 ret = __nfs4_get_acl_uncached(inode, buf, buflen);
3762                 if (ret >= 0)
3763                         break;
3764                 ret = nfs4_handle_exception(NFS_SERVER(inode), ret, &exception);
3765         } while (exception.retry);
3766         return ret;
3767 }
3768
3769 static ssize_t nfs4_proc_get_acl(struct inode *inode, void *buf, size_t buflen)
3770 {
3771         struct nfs_server *server = NFS_SERVER(inode);
3772         int ret;
3773
3774         if (!nfs4_server_supports_acls(server))
3775                 return -EOPNOTSUPP;
3776         ret = nfs_revalidate_inode(server, inode);
3777         if (ret < 0)
3778                 return ret;
3779         if (NFS_I(inode)->cache_validity & NFS_INO_INVALID_ACL)
3780                 nfs_zap_acl_cache(inode);
3781         ret = nfs4_read_cached_acl(inode, buf, buflen);
3782         if (ret != -ENOENT)
3783                 /* -ENOENT is returned if there is no ACL or if there is an ACL
3784                  * but no cached acl data, just the acl length */
3785                 return ret;
3786         return nfs4_get_acl_uncached(inode, buf, buflen);
3787 }
3788
3789 static int __nfs4_proc_set_acl(struct inode *inode, const void *buf, size_t buflen)
3790 {
3791         struct nfs_server *server = NFS_SERVER(inode);
3792         struct page *pages[NFS4ACL_MAXPAGES];
3793         struct nfs_setaclargs arg = {
3794                 .fh             = NFS_FH(inode),
3795                 .acl_pages      = pages,
3796                 .acl_len        = buflen,
3797         };
3798         struct nfs_setaclres res;
3799         struct rpc_message msg = {
3800                 .rpc_proc       = &nfs4_procedures[NFSPROC4_CLNT_SETACL],
3801                 .rpc_argp       = &arg,
3802                 .rpc_resp       = &res,
3803         };
3804         int ret, i;
3805
3806         if (!nfs4_server_supports_acls(server))
3807                 return -EOPNOTSUPP;
3808         i = buf_to_pages_noslab(buf, buflen, arg.acl_pages, &arg.acl_pgbase);
3809         if (i < 0)
3810                 return i;
3811         nfs_inode_return_delegation(inode);
3812         ret = nfs4_call_sync(server->client, server, &msg, &arg.seq_args, &res.seq_res, 1);
3813
3814         /*
3815          * Free each page after tx, so the only ref left is
3816          * held by the network stack
3817          */
3818         for (; i > 0; i--)
3819                 put_page(pages[i-1]);
3820
3821         /*
3822          * Acl update can result in inode attribute update.
3823          * so mark the attribute cache invalid.
3824          */
3825         spin_lock(&inode->i_lock);
3826         NFS_I(inode)->cache_validity |= NFS_INO_INVALID_ATTR;
3827         spin_unlock(&inode->i_lock);
3828         nfs_access_zap_cache(inode);
3829         nfs_zap_acl_cache(inode);
3830         return ret;
3831 }
3832
3833 static int nfs4_proc_set_acl(struct inode *inode, const void *buf, size_t buflen)
3834 {
3835         struct nfs4_exception exception = { };
3836         int err;
3837         do {
3838                 err = nfs4_handle_exception(NFS_SERVER(inode),
3839                                 __nfs4_proc_set_acl(inode, buf, buflen),
3840                                 &exception);
3841         } while (exception.retry);
3842         return err;
3843 }
3844
3845 static int
3846 nfs4_async_handle_error(struct rpc_task *task, const struct nfs_server *server, struct nfs4_state *state)
3847 {
3848         struct nfs_client *clp = server->nfs_client;
3849
3850         if (task->tk_status >= 0)
3851                 return 0;
3852         switch(task->tk_status) {
3853                 case -NFS4ERR_DELEG_REVOKED:
3854                 case -NFS4ERR_ADMIN_REVOKED:
3855                 case -NFS4ERR_BAD_STATEID:
3856                         if (state == NULL)
3857                                 break;
3858                         nfs_remove_bad_delegation(state->inode);
3859                 case -NFS4ERR_OPENMODE:
3860                         if (state == NULL)
3861                                 break;
3862                         nfs4_schedule_stateid_recovery(server, state);
3863                         goto wait_on_recovery;
3864                 case -NFS4ERR_EXPIRED:
3865                         if (state != NULL)
3866                                 nfs4_schedule_stateid_recovery(server, state);
3867                 case -NFS4ERR_STALE_STATEID:
3868                 case -NFS4ERR_STALE_CLIENTID:
3869                         nfs4_schedule_lease_recovery(clp);
3870                         goto wait_on_recovery;
3871 #if defined(CONFIG_NFS_V4_1)
3872                 case -NFS4ERR_BADSESSION:
3873                 case -NFS4ERR_BADSLOT:
3874                 case -NFS4ERR_BAD_HIGH_SLOT:
3875                 case -NFS4ERR_DEADSESSION:
3876                 case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION:
3877                 case -NFS4ERR_SEQ_FALSE_RETRY:
3878                 case -NFS4ERR_SEQ_MISORDERED:
3879                         dprintk("%s ERROR %d, Reset session\n", __func__,
3880                                 task->tk_status);
3881                         nfs4_schedule_session_recovery(clp->cl_session);
3882                         task->tk_status = 0;
3883                         return -EAGAIN;
3884 #endif /* CONFIG_NFS_V4_1 */
3885                 case -NFS4ERR_DELAY:
3886                         nfs_inc_server_stats(server, NFSIOS_DELAY);
3887                 case -NFS4ERR_GRACE:
3888                 case -EKEYEXPIRED:
3889                         rpc_delay(task, NFS4_POLL_RETRY_MAX);
3890                         task->tk_status = 0;
3891                         return -EAGAIN;
3892                 case -NFS4ERR_RETRY_UNCACHED_REP:
3893                 case -NFS4ERR_OLD_STATEID:
3894                         task->tk_status = 0;
3895                         return -EAGAIN;
3896         }
3897         task->tk_status = nfs4_map_errors(task->tk_status);
3898         return 0;
3899 wait_on_recovery:
3900         rpc_sleep_on(&clp->cl_rpcwaitq, task, NULL);
3901         if (test_bit(NFS4CLNT_MANAGER_RUNNING, &clp->cl_state) == 0)
3902                 rpc_wake_up_queued_task(&clp->cl_rpcwaitq, task);
3903         task->tk_status = 0;
3904         return -EAGAIN;
3905 }
3906
3907 static void nfs4_init_boot_verifier(const struct nfs_client *clp,
3908                                     nfs4_verifier *bootverf)
3909 {
3910         __be32 verf[2];
3911
3912         if (test_bit(NFS4CLNT_PURGE_STATE, &clp->cl_state)) {
3913                 /* An impossible timestamp guarantees this value
3914                  * will never match a generated boot time. */
3915                 verf[0] = 0;
3916                 verf[1] = (__be32)(NSEC_PER_SEC + 1);
3917         } else {
3918                 struct nfs_net *nn = net_generic(clp->cl_net, nfs_net_id);
3919                 verf[0] = (__be32)nn->boot_time.tv_sec;
3920                 verf[1] = (__be32)nn->boot_time.tv_nsec;
3921         }
3922         memcpy(bootverf->data, verf, sizeof(bootverf->data));
3923 }
3924
3925 int nfs4_proc_setclientid(struct nfs_client *clp, u32 program,
3926                 unsigned short port, struct rpc_cred *cred,
3927                 struct nfs4_setclientid_res *res)
3928 {
3929         nfs4_verifier sc_verifier;
3930         struct nfs4_setclientid setclientid = {
3931                 .sc_verifier = &sc_verifier,
3932                 .sc_prog = program,
3933                 .sc_cb_ident = clp->cl_cb_ident,
3934         };
3935         struct rpc_message msg = {
3936                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SETCLIENTID],
3937                 .rpc_argp = &setclientid,
3938                 .rpc_resp = res,
3939                 .rpc_cred = cred,
3940         };
3941         int loop = 0;
3942         int status;
3943
3944         nfs4_init_boot_verifier(clp, &sc_verifier);
3945
3946         for(;;) {
3947                 rcu_read_lock();
3948                 setclientid.sc_name_len = scnprintf(setclientid.sc_name,
3949                                 sizeof(setclientid.sc_name), "%s/%s %s %s %u",
3950                                 clp->cl_ipaddr,
3951                                 rpc_peeraddr2str(clp->cl_rpcclient,
3952                                                         RPC_DISPLAY_ADDR),
3953                                 rpc_peeraddr2str(clp->cl_rpcclient,
3954                                                         RPC_DISPLAY_PROTO),
3955                                 clp->cl_rpcclient->cl_auth->au_ops->au_name,
3956                                 clp->cl_id_uniquifier);
3957                 setclientid.sc_netid_len = scnprintf(setclientid.sc_netid,
3958                                 sizeof(setclientid.sc_netid),
3959                                 rpc_peeraddr2str(clp->cl_rpcclient,
3960                                                         RPC_DISPLAY_NETID));
3961                 setclientid.sc_uaddr_len = scnprintf(setclientid.sc_uaddr,
3962                                 sizeof(setclientid.sc_uaddr), "%s.%u.%u",
3963                                 clp->cl_ipaddr, port >> 8, port & 255);
3964                 rcu_read_unlock();
3965
3966                 status = rpc_call_sync(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
3967                 if (status != -NFS4ERR_CLID_INUSE)
3968                         break;
3969                 if (loop != 0) {
3970                         ++clp->cl_id_uniquifier;
3971                         break;
3972                 }
3973                 ++loop;
3974                 ssleep(clp->cl_lease_time / HZ + 1);
3975         }
3976         return status;
3977 }
3978
3979 int nfs4_proc_setclientid_confirm(struct nfs_client *clp,
3980                 struct nfs4_setclientid_res *arg,
3981                 struct rpc_cred *cred)
3982 {
3983         struct nfs_fsinfo fsinfo;
3984         struct rpc_message msg = {
3985                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SETCLIENTID_CONFIRM],
3986                 .rpc_argp = arg,
3987                 .rpc_resp = &fsinfo,
3988                 .rpc_cred = cred,
3989         };
3990         unsigned long now;
3991         int status;
3992
3993         now = jiffies;
3994         status = rpc_call_sync(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
3995         if (status == 0) {
3996                 spin_lock(&clp->cl_lock);
3997                 clp->cl_lease_time = fsinfo.lease_time * HZ;
3998                 clp->cl_last_renewal = now;
3999                 spin_unlock(&clp->cl_lock);
4000         }
4001         return status;
4002 }
4003
4004 struct nfs4_delegreturndata {
4005         struct nfs4_delegreturnargs args;
4006         struct nfs4_delegreturnres res;
4007         struct nfs_fh fh;
4008         nfs4_stateid stateid;
4009         unsigned long timestamp;
4010         struct nfs_fattr fattr;
4011         int rpc_status;
4012 };
4013
4014 static void nfs4_delegreturn_done(struct rpc_task *task, void *calldata)
4015 {
4016         struct nfs4_delegreturndata *data = calldata;
4017
4018         if (!nfs4_sequence_done(task, &data->res.seq_res))
4019                 return;
4020
4021         switch (task->tk_status) {
4022         case -NFS4ERR_STALE_STATEID:
4023         case -NFS4ERR_EXPIRED:
4024         case 0:
4025                 renew_lease(data->res.server, data->timestamp);
4026                 break;
4027         default:
4028                 if (nfs4_async_handle_error(task, data->res.server, NULL) ==
4029                                 -EAGAIN) {
4030                         rpc_restart_call_prepare(task);
4031                         return;
4032                 }
4033         }
4034         data->rpc_status = task->tk_status;
4035 }
4036
4037 static void nfs4_delegreturn_release(void *calldata)
4038 {
4039         kfree(calldata);
4040 }
4041
4042 #if defined(CONFIG_NFS_V4_1)
4043 static void nfs4_delegreturn_prepare(struct rpc_task *task, void *data)
4044 {
4045         struct nfs4_delegreturndata *d_data;
4046
4047         d_data = (struct nfs4_delegreturndata *)data;
4048
4049         if (nfs4_setup_sequence(d_data->res.server,
4050                                 &d_data->args.seq_args,
4051                                 &d_data->res.seq_res, task))
4052                 return;
4053         rpc_call_start(task);
4054 }
4055 #endif /* CONFIG_NFS_V4_1 */
4056
4057 static const struct rpc_call_ops nfs4_delegreturn_ops = {
4058 #if defined(CONFIG_NFS_V4_1)
4059         .rpc_call_prepare = nfs4_delegreturn_prepare,
4060 #endif /* CONFIG_NFS_V4_1 */
4061         .rpc_call_done = nfs4_delegreturn_done,
4062         .rpc_release = nfs4_delegreturn_release,
4063 };
4064
4065 static int _nfs4_proc_delegreturn(struct inode *inode, struct rpc_cred *cred, const nfs4_stateid *stateid, int issync)
4066 {
4067         struct nfs4_delegreturndata *data;
4068         struct nfs_server *server = NFS_SERVER(inode);
4069         struct rpc_task *task;
4070         struct rpc_message msg = {
4071                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_DELEGRETURN],
4072                 .rpc_cred = cred,
4073         };
4074         struct rpc_task_setup task_setup_data = {
4075                 .rpc_client = server->client,
4076                 .rpc_message = &msg,
4077                 .callback_ops = &nfs4_delegreturn_ops,
4078                 .flags = RPC_TASK_ASYNC,
4079         };
4080         int status = 0;
4081
4082         data = kzalloc(sizeof(*data), GFP_NOFS);
4083         if (data == NULL)
4084                 return -ENOMEM;
4085         nfs41_init_sequence(&data->args.seq_args, &data->res.seq_res, 1);
4086         data->args.fhandle = &data->fh;
4087         data->args.stateid = &data->stateid;
4088         data->args.bitmask = server->cache_consistency_bitmask;
4089         nfs_copy_fh(&data->fh, NFS_FH(inode));
4090         nfs4_stateid_copy(&data->stateid, stateid);
4091         data->res.fattr = &data->fattr;
4092         data->res.server = server;
4093         nfs_fattr_init(data->res.fattr);
4094         data->timestamp = jiffies;
4095         data->rpc_status = 0;
4096
4097         task_setup_data.callback_data = data;
4098         msg.rpc_argp = &data->args;
4099         msg.rpc_resp = &data->res;
4100         task = rpc_run_task(&task_setup_data);
4101         if (IS_ERR(task))
4102                 return PTR_ERR(task);
4103         if (!issync)
4104                 goto out;
4105         status = nfs4_wait_for_completion_rpc_task(task);
4106         if (status != 0)
4107                 goto out;
4108         status = data->rpc_status;
4109         if (status == 0)
4110                 nfs_post_op_update_inode_force_wcc(inode, &data->fattr);
4111         else
4112                 nfs_refresh_inode(inode, &data->fattr);
4113 out:
4114         rpc_put_task(task);
4115         return status;
4116 }
4117
4118 int nfs4_proc_delegreturn(struct inode *inode, struct rpc_cred *cred, const nfs4_stateid *stateid, int issync)
4119 {
4120         struct nfs_server *server = NFS_SERVER(inode);
4121         struct nfs4_exception exception = { };
4122         int err;
4123         do {
4124                 err = _nfs4_proc_delegreturn(inode, cred, stateid, issync);
4125                 switch (err) {
4126                         case -NFS4ERR_STALE_STATEID:
4127                         case -NFS4ERR_EXPIRED:
4128                         case 0:
4129                                 return 0;
4130                 }
4131                 err = nfs4_handle_exception(server, err, &exception);
4132         } while (exception.retry);
4133         return err;
4134 }
4135
4136 #define NFS4_LOCK_MINTIMEOUT (1 * HZ)
4137 #define NFS4_LOCK_MAXTIMEOUT (30 * HZ)
4138
4139 /* 
4140  * sleep, with exponential backoff, and retry the LOCK operation. 
4141  */
4142 static unsigned long
4143 nfs4_set_lock_task_retry(unsigned long timeout)
4144 {
4145         freezable_schedule_timeout_killable(timeout);
4146         timeout <<= 1;
4147         if (timeout > NFS4_LOCK_MAXTIMEOUT)
4148                 return NFS4_LOCK_MAXTIMEOUT;
4149         return timeout;
4150 }
4151
4152 static int _nfs4_proc_getlk(struct nfs4_state *state, int cmd, struct file_lock *request)
4153 {
4154         struct inode *inode = state->inode;
4155         struct nfs_server *server = NFS_SERVER(inode);
4156         struct nfs_client *clp = server->nfs_client;
4157         struct nfs_lockt_args arg = {
4158                 .fh = NFS_FH(inode),
4159                 .fl = request,
4160         };
4161         struct nfs_lockt_res res = {
4162                 .denied = request,
4163         };
4164         struct rpc_message msg = {
4165                 .rpc_proc       = &nfs4_procedures[NFSPROC4_CLNT_LOCKT],
4166                 .rpc_argp       = &arg,
4167                 .rpc_resp       = &res,
4168                 .rpc_cred       = state->owner->so_cred,
4169         };
4170         struct nfs4_lock_state *lsp;
4171         int status;
4172
4173         arg.lock_owner.clientid = clp->cl_clientid;
4174         status = nfs4_set_lock_state(state, request);
4175         if (status != 0)
4176                 goto out;
4177         lsp = request->fl_u.nfs4_fl.owner;
4178         arg.lock_owner.id = lsp->ls_seqid.owner_id;
4179         arg.lock_owner.s_dev = server->s_dev;
4180         status = nfs4_call_sync(server->client, server, &msg, &arg.seq_args, &res.seq_res, 1);
4181         switch (status) {
4182                 case 0:
4183                         request->fl_type = F_UNLCK;
4184                         break;
4185                 case -NFS4ERR_DENIED:
4186                         status = 0;
4187         }
4188         request->fl_ops->fl_release_private(request);
4189 out:
4190         return status;
4191 }
4192
4193 static int nfs4_proc_getlk(struct nfs4_state *state, int cmd, struct file_lock *request)
4194 {
4195         struct nfs4_exception exception = { };
4196         int err;
4197
4198         do {
4199                 err = nfs4_handle_exception(NFS_SERVER(state->inode),
4200                                 _nfs4_proc_getlk(state, cmd, request),
4201                                 &exception);
4202         } while (exception.retry);
4203         return err;
4204 }
4205
4206 static int do_vfs_lock(struct file *file, struct file_lock *fl)
4207 {
4208         int res = 0;
4209         switch (fl->fl_flags & (FL_POSIX|FL_FLOCK)) {
4210                 case FL_POSIX:
4211                         res = posix_lock_file_wait(file, fl);
4212                         break;
4213                 case FL_FLOCK:
4214                         res = flock_lock_file_wait(file, fl);
4215                         break;
4216                 default:
4217                         BUG();
4218         }
4219         return res;
4220 }
4221
4222 struct nfs4_unlockdata {
4223         struct nfs_locku_args arg;
4224         struct nfs_locku_res res;
4225         struct nfs4_lock_state *lsp;
4226         struct nfs_open_context *ctx;
4227         struct file_lock fl;
4228         const struct nfs_server *server;
4229         unsigned long timestamp;
4230 };
4231
4232 static struct nfs4_unlockdata *nfs4_alloc_unlockdata(struct file_lock *fl,
4233                 struct nfs_open_context *ctx,
4234                 struct nfs4_lock_state *lsp,
4235                 struct nfs_seqid *seqid)
4236 {
4237         struct nfs4_unlockdata *p;
4238         struct inode *inode = lsp->ls_state->inode;
4239
4240         p = kzalloc(sizeof(*p), GFP_NOFS);
4241         if (p == NULL)
4242                 return NULL;
4243         p->arg.fh = NFS_FH(inode);
4244         p->arg.fl = &p->fl;
4245         p->arg.seqid = seqid;
4246         p->res.seqid = seqid;
4247         p->arg.stateid = &lsp->ls_stateid;
4248         p->lsp = lsp;
4249         atomic_inc(&lsp->ls_count);
4250         /* Ensure we don't close file until we're done freeing locks! */
4251         p->ctx = get_nfs_open_context(ctx);
4252         memcpy(&p->fl, fl, sizeof(p->fl));
4253         p->server = NFS_SERVER(inode);
4254         return p;
4255 }
4256
4257 static void nfs4_locku_release_calldata(void *data)
4258 {
4259         struct nfs4_unlockdata *calldata = data;
4260         nfs_free_seqid(calldata->arg.seqid);
4261         nfs4_put_lock_state(calldata->lsp);
4262         put_nfs_open_context(calldata->ctx);
4263         kfree(calldata);
4264 }
4265
4266 static void nfs4_locku_done(struct rpc_task *task, void *data)
4267 {
4268         struct nfs4_unlockdata *calldata = data;
4269
4270         if (!nfs4_sequence_done(task, &calldata->res.seq_res))
4271                 return;
4272         switch (task->tk_status) {
4273                 case 0:
4274                         nfs4_stateid_copy(&calldata->lsp->ls_stateid,
4275                                         &calldata->res.stateid);
4276                         renew_lease(calldata->server, calldata->timestamp);
4277                         break;
4278                 case -NFS4ERR_BAD_STATEID:
4279                 case -NFS4ERR_OLD_STATEID:
4280                 case -NFS4ERR_STALE_STATEID:
4281                 case -NFS4ERR_EXPIRED:
4282                         break;
4283                 default:
4284                         if (nfs4_async_handle_error(task, calldata->server, NULL) == -EAGAIN)
4285                                 rpc_restart_call_prepare(task);
4286         }
4287 }
4288
4289 static void nfs4_locku_prepare(struct rpc_task *task, void *data)
4290 {
4291         struct nfs4_unlockdata *calldata = data;
4292
4293         if (nfs_wait_on_sequence(calldata->arg.seqid, task) != 0)
4294                 return;
4295         if ((calldata->lsp->ls_flags & NFS_LOCK_INITIALIZED) == 0) {
4296                 /* Note: exit _without_ running nfs4_locku_done */
4297                 task->tk_action = NULL;
4298                 return;
4299         }
4300         calldata->timestamp = jiffies;
4301         if (nfs4_setup_sequence(calldata->server,
4302                                 &calldata->arg.seq_args,
4303                                 &calldata->res.seq_res, task))
4304                 return;
4305         rpc_call_start(task);
4306 }
4307
4308 static const struct rpc_call_ops nfs4_locku_ops = {
4309         .rpc_call_prepare = nfs4_locku_prepare,
4310         .rpc_call_done = nfs4_locku_done,
4311         .rpc_release = nfs4_locku_release_calldata,
4312 };
4313
4314 static struct rpc_task *nfs4_do_unlck(struct file_lock *fl,
4315                 struct nfs_open_context *ctx,
4316                 struct nfs4_lock_state *lsp,
4317                 struct nfs_seqid *seqid)
4318 {
4319         struct nfs4_unlockdata *data;
4320         struct rpc_message msg = {
4321                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LOCKU],
4322                 .rpc_cred = ctx->cred,
4323         };
4324         struct rpc_task_setup task_setup_data = {
4325                 .rpc_client = NFS_CLIENT(lsp->ls_state->inode),
4326                 .rpc_message = &msg,
4327                 .callback_ops = &nfs4_locku_ops,
4328                 .workqueue = nfsiod_workqueue,
4329                 .flags = RPC_TASK_ASYNC,
4330         };
4331
4332         /* Ensure this is an unlock - when canceling a lock, the
4333          * canceled lock is passed in, and it won't be an unlock.
4334          */
4335         fl->fl_type = F_UNLCK;
4336
4337         data = nfs4_alloc_unlockdata(fl, ctx, lsp, seqid);
4338         if (data == NULL) {
4339                 nfs_free_seqid(seqid);
4340                 return ERR_PTR(-ENOMEM);
4341         }
4342
4343         nfs41_init_sequence(&data->arg.seq_args, &data->res.seq_res, 1);
4344         msg.rpc_argp = &data->arg;
4345         msg.rpc_resp = &data->res;
4346         task_setup_data.callback_data = data;
4347         return rpc_run_task(&task_setup_data);
4348 }
4349
4350 static int nfs4_proc_unlck(struct nfs4_state *state, int cmd, struct file_lock *request)
4351 {
4352         struct nfs_inode *nfsi = NFS_I(state->inode);
4353         struct nfs_seqid *seqid;
4354         struct nfs4_lock_state *lsp;
4355         struct rpc_task *task;
4356         int status = 0;
4357         unsigned char fl_flags = request->fl_flags;
4358
4359         status = nfs4_set_lock_state(state, request);
4360         /* Unlock _before_ we do the RPC call */
4361         request->fl_flags |= FL_EXISTS;
4362         down_read(&nfsi->rwsem);
4363         if (do_vfs_lock(request->fl_file, request) == -ENOENT) {
4364                 up_read(&nfsi->rwsem);
4365                 goto out;
4366         }
4367         up_read(&nfsi->rwsem);
4368         if (status != 0)
4369                 goto out;
4370         /* Is this a delegated lock? */
4371         if (test_bit(NFS_DELEGATED_STATE, &state->flags))
4372                 goto out;
4373         lsp = request->fl_u.nfs4_fl.owner;
4374         seqid = nfs_alloc_seqid(&lsp->ls_seqid, GFP_KERNEL);
4375         status = -ENOMEM;
4376         if (seqid == NULL)
4377                 goto out;
4378         task = nfs4_do_unlck(request, nfs_file_open_context(request->fl_file), lsp, seqid);
4379         status = PTR_ERR(task);
4380         if (IS_ERR(task))
4381                 goto out;
4382         status = nfs4_wait_for_completion_rpc_task(task);
4383         rpc_put_task(task);
4384 out:
4385         request->fl_flags = fl_flags;
4386         return status;
4387 }
4388
4389 struct nfs4_lockdata {
4390         struct nfs_lock_args arg;
4391         struct nfs_lock_res res;
4392         struct nfs4_lock_state *lsp;
4393         struct nfs_open_context *ctx;
4394         struct file_lock fl;
4395         unsigned long timestamp;
4396         int rpc_status;
4397         int cancelled;
4398         struct nfs_server *server;
4399 };
4400
4401 static struct nfs4_lockdata *nfs4_alloc_lockdata(struct file_lock *fl,
4402                 struct nfs_open_context *ctx, struct nfs4_lock_state *lsp,
4403                 gfp_t gfp_mask)
4404 {
4405         struct nfs4_lockdata *p;
4406         struct inode *inode = lsp->ls_state->inode;
4407         struct nfs_server *server = NFS_SERVER(inode);
4408
4409         p = kzalloc(sizeof(*p), gfp_mask);
4410         if (p == NULL)
4411                 return NULL;
4412
4413         p->arg.fh = NFS_FH(inode);
4414         p->arg.fl = &p->fl;
4415         p->arg.open_seqid = nfs_alloc_seqid(&lsp->ls_state->owner->so_seqid, gfp_mask);
4416         if (p->arg.open_seqid == NULL)
4417                 goto out_free;
4418         p->arg.lock_seqid = nfs_alloc_seqid(&lsp->ls_seqid, gfp_mask);
4419         if (p->arg.lock_seqid == NULL)
4420                 goto out_free_seqid;
4421         p->arg.lock_stateid = &lsp->ls_stateid;
4422         p->arg.lock_owner.clientid = server->nfs_client->cl_clientid;
4423         p->arg.lock_owner.id = lsp->ls_seqid.owner_id;
4424         p->arg.lock_owner.s_dev = server->s_dev;
4425         p->res.lock_seqid = p->arg.lock_seqid;
4426         p->lsp = lsp;
4427         p->server = server;
4428         atomic_inc(&lsp->ls_count);
4429         p->ctx = get_nfs_open_context(ctx);
4430         memcpy(&p->fl, fl, sizeof(p->fl));
4431         return p;
4432 out_free_seqid:
4433         nfs_free_seqid(p->arg.open_seqid);
4434 out_free:
4435         kfree(p);
4436         return NULL;
4437 }
4438
4439 static void nfs4_lock_prepare(struct rpc_task *task, void *calldata)
4440 {
4441         struct nfs4_lockdata *data = calldata;
4442         struct nfs4_state *state = data->lsp->ls_state;
4443
4444         dprintk("%s: begin!\n", __func__);
4445         if (nfs_wait_on_sequence(data->arg.lock_seqid, task) != 0)
4446                 return;
4447         /* Do we need to do an open_to_lock_owner? */
4448         if (!(data->arg.lock_seqid->sequence->flags & NFS_SEQID_CONFIRMED)) {
4449                 if (nfs_wait_on_sequence(data->arg.open_seqid, task) != 0)
4450                         return;
4451                 data->arg.open_stateid = &state->stateid;
4452                 data->arg.new_lock_owner = 1;
4453                 data->res.open_seqid = data->arg.open_seqid;
4454         } else
4455                 data->arg.new_lock_owner = 0;
4456         data->timestamp = jiffies;
4457         if (nfs4_setup_sequence(data->server,
4458                                 &data->arg.seq_args,
4459                                 &data->res.seq_res, task))
4460                 return;
4461         rpc_call_start(task);
4462         dprintk("%s: done!, ret = %d\n", __func__, data->rpc_status);
4463 }
4464
4465 static void nfs4_recover_lock_prepare(struct rpc_task *task, void *calldata)
4466 {
4467         rpc_task_set_priority(task, RPC_PRIORITY_PRIVILEGED);
4468         nfs4_lock_prepare(task, calldata);
4469 }
4470
4471 static void nfs4_lock_done(struct rpc_task *task, void *calldata)
4472 {
4473         struct nfs4_lockdata *data = calldata;
4474
4475         dprintk("%s: begin!\n", __func__);
4476
4477         if (!nfs4_sequence_done(task, &data->res.seq_res))
4478                 return;
4479
4480         data->rpc_status = task->tk_status;
4481         if (data->arg.new_lock_owner != 0) {
4482                 if (data->rpc_status == 0)
4483                         nfs_confirm_seqid(&data->lsp->ls_seqid, 0);
4484                 else
4485                         goto out;
4486         }
4487         if (data->rpc_status == 0) {
4488                 nfs4_stateid_copy(&data->lsp->ls_stateid, &data->res.stateid);
4489                 data->lsp->ls_flags |= NFS_LOCK_INITIALIZED;
4490                 renew_lease(NFS_SERVER(data->ctx->dentry->d_inode), data->timestamp);
4491         }
4492 out:
4493         dprintk("%s: done, ret = %d!\n", __func__, data->rpc_status);
4494 }
4495
4496 static void nfs4_lock_release(void *calldata)
4497 {
4498         struct nfs4_lockdata *data = calldata;
4499
4500         dprintk("%s: begin!\n", __func__);
4501         nfs_free_seqid(data->arg.open_seqid);
4502         if (data->cancelled != 0) {
4503                 struct rpc_task *task;
4504                 task = nfs4_do_unlck(&data->fl, data->ctx, data->lsp,
4505                                 data->arg.lock_seqid);
4506                 if (!IS_ERR(task))
4507                         rpc_put_task_async(task);
4508                 dprintk("%s: cancelling lock!\n", __func__);
4509         } else
4510                 nfs_free_seqid(data->arg.lock_seqid);
4511         nfs4_put_lock_state(data->lsp);
4512         put_nfs_open_context(data->ctx);
4513         kfree(data);
4514         dprintk("%s: done!\n", __func__);
4515 }
4516
4517 static const struct rpc_call_ops nfs4_lock_ops = {
4518         .rpc_call_prepare = nfs4_lock_prepare,
4519         .rpc_call_done = nfs4_lock_done,
4520         .rpc_release = nfs4_lock_release,
4521 };
4522
4523 static const struct rpc_call_ops nfs4_recover_lock_ops = {
4524         .rpc_call_prepare = nfs4_recover_lock_prepare,
4525         .rpc_call_done = nfs4_lock_done,
4526         .rpc_release = nfs4_lock_release,
4527 };
4528
4529 static void nfs4_handle_setlk_error(struct nfs_server *server, struct nfs4_lock_state *lsp, int new_lock_owner, int error)
4530 {
4531         switch (error) {
4532         case -NFS4ERR_ADMIN_REVOKED:
4533         case -NFS4ERR_BAD_STATEID:
4534                 lsp->ls_seqid.flags &= ~NFS_SEQID_CONFIRMED;
4535                 if (new_lock_owner != 0 ||
4536                    (lsp->ls_flags & NFS_LOCK_INITIALIZED) != 0)
4537                         nfs4_schedule_stateid_recovery(server, lsp->ls_state);
4538                 break;
4539         case -NFS4ERR_STALE_STATEID:
4540                 lsp->ls_seqid.flags &= ~NFS_SEQID_CONFIRMED;
4541         case -NFS4ERR_EXPIRED:
4542                 nfs4_schedule_lease_recovery(server->nfs_client);
4543         };
4544 }
4545
4546 static int _nfs4_do_setlk(struct nfs4_state *state, int cmd, struct file_lock *fl, int recovery_type)
4547 {
4548         struct nfs4_lockdata *data;
4549         struct rpc_task *task;
4550         struct rpc_message msg = {
4551                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LOCK],
4552                 .rpc_cred = state->owner->so_cred,
4553         };
4554         struct rpc_task_setup task_setup_data = {
4555                 .rpc_client = NFS_CLIENT(state->inode),
4556                 .rpc_message = &msg,
4557                 .callback_ops = &nfs4_lock_ops,
4558                 .workqueue = nfsiod_workqueue,
4559                 .flags = RPC_TASK_ASYNC,
4560         };
4561         int ret;
4562
4563         dprintk("%s: begin!\n", __func__);
4564         data = nfs4_alloc_lockdata(fl, nfs_file_open_context(fl->fl_file),
4565                         fl->fl_u.nfs4_fl.owner,
4566                         recovery_type == NFS_LOCK_NEW ? GFP_KERNEL : GFP_NOFS);
4567         if (data == NULL)
4568                 return -ENOMEM;
4569         if (IS_SETLKW(cmd))
4570                 data->arg.block = 1;
4571         if (recovery_type > NFS_LOCK_NEW) {
4572                 if (recovery_type == NFS_LOCK_RECLAIM)
4573                         data->arg.reclaim = NFS_LOCK_RECLAIM;
4574                 task_setup_data.callback_ops = &nfs4_recover_lock_ops;
4575         }
4576         nfs41_init_sequence(&data->arg.seq_args, &data->res.seq_res, 1);
4577         msg.rpc_argp = &data->arg;
4578         msg.rpc_resp = &data->res;
4579         task_setup_data.callback_data = data;
4580         task = rpc_run_task(&task_setup_data);
4581         if (IS_ERR(task))
4582                 return PTR_ERR(task);
4583         ret = nfs4_wait_for_completion_rpc_task(task);
4584         if (ret == 0) {
4585                 ret = data->rpc_status;
4586                 if (ret)
4587                         nfs4_handle_setlk_error(data->server, data->lsp,
4588                                         data->arg.new_lock_owner, ret);
4589         } else
4590                 data->cancelled = 1;
4591         rpc_put_task(task);
4592         dprintk("%s: done, ret = %d!\n", __func__, ret);
4593         return ret;
4594 }
4595
4596 static int nfs4_lock_reclaim(struct nfs4_state *state, struct file_lock *request)
4597 {
4598         struct nfs_server *server = NFS_SERVER(state->inode);
4599         struct nfs4_exception exception = {
4600                 .inode = state->inode,
4601         };
4602         int err;
4603
4604         do {
4605                 /* Cache the lock if possible... */
4606                 if (test_bit(NFS_DELEGATED_STATE, &state->flags) != 0)
4607                         return 0;
4608                 err = _nfs4_do_setlk(state, F_SETLK, request, NFS_LOCK_RECLAIM);
4609                 if (err != -NFS4ERR_DELAY)
4610                         break;
4611                 nfs4_handle_exception(server, err, &exception);
4612         } while (exception.retry);
4613         return err;
4614 }
4615
4616 static int nfs4_lock_expired(struct nfs4_state *state, struct file_lock *request)
4617 {
4618         struct nfs_server *server = NFS_SERVER(state->inode);
4619         struct nfs4_exception exception = {
4620                 .inode = state->inode,
4621         };
4622         int err;
4623
4624         err = nfs4_set_lock_state(state, request);
4625         if (err != 0)
4626                 return err;
4627         do {
4628                 if (test_bit(NFS_DELEGATED_STATE, &state->flags) != 0)
4629                         return 0;
4630                 err = _nfs4_do_setlk(state, F_SETLK, request, NFS_LOCK_EXPIRED);
4631                 switch (err) {
4632                 default:
4633                         goto out;
4634                 case -NFS4ERR_GRACE:
4635                 case -NFS4ERR_DELAY:
4636                         nfs4_handle_exception(server, err, &exception);
4637                         err = 0;
4638                 }
4639         } while (exception.retry);
4640 out:
4641         return err;
4642 }
4643
4644 #if defined(CONFIG_NFS_V4_1)
4645 static int nfs41_check_expired_locks(struct nfs4_state *state)
4646 {
4647         int status, ret = NFS_OK;
4648         struct nfs4_lock_state *lsp;
4649         struct nfs_server *server = NFS_SERVER(state->inode);
4650
4651         list_for_each_entry(lsp, &state->lock_states, ls_locks) {
4652                 if (lsp->ls_flags & NFS_LOCK_INITIALIZED) {
4653                         status = nfs41_test_stateid(server, &lsp->ls_stateid);
4654                         if (status != NFS_OK) {
4655                                 nfs41_free_stateid(server, &lsp->ls_stateid);
4656                                 lsp->ls_flags &= ~NFS_LOCK_INITIALIZED;
4657                                 ret = status;
4658                         }
4659                 }
4660         };
4661
4662         return ret;
4663 }
4664
4665 static int nfs41_lock_expired(struct nfs4_state *state, struct file_lock *request)
4666 {
4667         int status = NFS_OK;
4668
4669         if (test_bit(LK_STATE_IN_USE, &state->flags))
4670                 status = nfs41_check_expired_locks(state);
4671         if (status == NFS_OK)
4672                 return status;
4673         return nfs4_lock_expired(state, request);
4674 }
4675 #endif
4676
4677 static int _nfs4_proc_setlk(struct nfs4_state *state, int cmd, struct file_lock *request)
4678 {
4679         struct nfs_inode *nfsi = NFS_I(state->inode);
4680         unsigned char fl_flags = request->fl_flags;
4681         int status = -ENOLCK;
4682
4683         if ((fl_flags & FL_POSIX) &&
4684                         !test_bit(NFS_STATE_POSIX_LOCKS, &state->flags))
4685                 goto out;
4686         /* Is this a delegated open? */
4687         status = nfs4_set_lock_state(state, request);
4688         if (status != 0)
4689                 goto out;
4690         request->fl_flags |= FL_ACCESS;
4691         status = do_vfs_lock(request->fl_file, request);
4692         if (status < 0)
4693                 goto out;
4694         down_read(&nfsi->rwsem);
4695         if (test_bit(NFS_DELEGATED_STATE, &state->flags)) {
4696                 /* Yes: cache locks! */
4697                 /* ...but avoid races with delegation recall... */
4698                 request->fl_flags = fl_flags & ~FL_SLEEP;
4699                 status = do_vfs_lock(request->fl_file, request);
4700                 goto out_unlock;
4701         }
4702         status = _nfs4_do_setlk(state, cmd, request, NFS_LOCK_NEW);
4703         if (status != 0)
4704                 goto out_unlock;
4705         /* Note: we always want to sleep here! */
4706         request->fl_flags = fl_flags | FL_SLEEP;
4707         if (do_vfs_lock(request->fl_file, request) < 0)
4708                 printk(KERN_WARNING "NFS: %s: VFS is out of sync with lock "
4709                         "manager!\n", __func__);
4710 out_unlock:
4711         up_read(&nfsi->rwsem);
4712 out:
4713         request->fl_flags = fl_flags;
4714         return status;
4715 }
4716
4717 static int nfs4_proc_setlk(struct nfs4_state *state, int cmd, struct file_lock *request)
4718 {
4719         struct nfs4_exception exception = {
4720                 .state = state,
4721                 .inode = state->inode,
4722         };
4723         int err;
4724
4725         do {
4726                 err = _nfs4_proc_setlk(state, cmd, request);
4727                 if (err == -NFS4ERR_DENIED)
4728                         err = -EAGAIN;
4729                 err = nfs4_handle_exception(NFS_SERVER(state->inode),
4730                                 err, &exception);
4731         } while (exception.retry);
4732         return err;
4733 }
4734
4735 static int
4736 nfs4_proc_lock(struct file *filp, int cmd, struct file_lock *request)
4737 {
4738         struct nfs_open_context *ctx;
4739         struct nfs4_state *state;
4740         unsigned long timeout = NFS4_LOCK_MINTIMEOUT;
4741         int status;
4742
4743         /* verify open state */
4744         ctx = nfs_file_open_context(filp);
4745         state = ctx->state;
4746
4747         if (request->fl_start < 0 || request->fl_end < 0)
4748                 return -EINVAL;
4749
4750         if (IS_GETLK(cmd)) {
4751                 if (state != NULL)
4752                         return nfs4_proc_getlk(state, F_GETLK, request);
4753                 return 0;
4754         }
4755
4756         if (!(IS_SETLK(cmd) || IS_SETLKW(cmd)))
4757                 return -EINVAL;
4758
4759         if (request->fl_type == F_UNLCK) {
4760                 if (state != NULL)
4761                         return nfs4_proc_unlck(state, cmd, request);
4762                 return 0;
4763         }
4764
4765         if (state == NULL)
4766                 return -ENOLCK;
4767         /*
4768          * Don't rely on the VFS having checked the file open mode,
4769          * since it won't do this for flock() locks.
4770          */
4771         switch (request->fl_type & (F_RDLCK|F_WRLCK|F_UNLCK)) {
4772         case F_RDLCK:
4773                 if (!(filp->f_mode & FMODE_READ))
4774                         return -EBADF;
4775                 break;
4776         case F_WRLCK:
4777                 if (!(filp->f_mode & FMODE_WRITE))
4778                         return -EBADF;
4779         }
4780
4781         do {
4782                 status = nfs4_proc_setlk(state, cmd, request);
4783                 if ((status != -EAGAIN) || IS_SETLK(cmd))
4784                         break;
4785                 timeout = nfs4_set_lock_task_retry(timeout);
4786                 status = -ERESTARTSYS;
4787                 if (signalled())
4788                         break;
4789         } while(status < 0);
4790         return status;
4791 }
4792
4793 int nfs4_lock_delegation_recall(struct nfs4_state *state, struct file_lock *fl)
4794 {
4795         struct nfs_server *server = NFS_SERVER(state->inode);
4796         struct nfs4_exception exception = { };
4797         int err;
4798
4799         err = nfs4_set_lock_state(state, fl);
4800         if (err != 0)
4801                 goto out;
4802         do {
4803                 err = _nfs4_do_setlk(state, F_SETLK, fl, NFS_LOCK_NEW);
4804                 switch (err) {
4805                         default:
4806                                 printk(KERN_ERR "NFS: %s: unhandled error "
4807                                         "%d.\n", __func__, err);
4808                         case 0:
4809                         case -ESTALE:
4810                                 goto out;
4811                         case -NFS4ERR_EXPIRED:
4812                                 nfs4_schedule_stateid_recovery(server, state);
4813                         case -NFS4ERR_STALE_CLIENTID:
4814                         case -NFS4ERR_STALE_STATEID:
4815                                 nfs4_schedule_lease_recovery(server->nfs_client);
4816                                 goto out;
4817                         case -NFS4ERR_BADSESSION:
4818                         case -NFS4ERR_BADSLOT:
4819                         case -NFS4ERR_BAD_HIGH_SLOT:
4820                         case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION:
4821                         case -NFS4ERR_DEADSESSION:
4822                                 nfs4_schedule_session_recovery(server->nfs_client->cl_session);
4823                                 goto out;
4824                         case -ERESTARTSYS:
4825                                 /*
4826                                  * The show must go on: exit, but mark the
4827                                  * stateid as needing recovery.
4828                                  */
4829                         case -NFS4ERR_DELEG_REVOKED:
4830                         case -NFS4ERR_ADMIN_REVOKED:
4831                         case -NFS4ERR_BAD_STATEID:
4832                         case -NFS4ERR_OPENMODE:
4833                                 nfs4_schedule_stateid_recovery(server, state);
4834                                 err = 0;
4835                                 goto out;
4836                         case -EKEYEXPIRED:
4837                                 /*
4838                                  * User RPCSEC_GSS context has expired.
4839                                  * We cannot recover this stateid now, so
4840                                  * skip it and allow recovery thread to
4841                                  * proceed.
4842                                  */
4843                                 err = 0;
4844                                 goto out;
4845                         case -ENOMEM:
4846                         case -NFS4ERR_DENIED:
4847                                 /* kill_proc(fl->fl_pid, SIGLOST, 1); */
4848                                 err = 0;
4849                                 goto out;
4850                         case -NFS4ERR_DELAY:
4851                                 break;
4852                 }
4853                 err = nfs4_handle_exception(server, err, &exception);
4854         } while (exception.retry);
4855 out:
4856         return err;
4857 }
4858
4859 struct nfs_release_lockowner_data {
4860         struct nfs4_lock_state *lsp;
4861         struct nfs_server *server;
4862         struct nfs_release_lockowner_args args;
4863 };
4864
4865 static void nfs4_release_lockowner_release(void *calldata)
4866 {
4867         struct nfs_release_lockowner_data *data = calldata;
4868         nfs4_free_lock_state(data->server, data->lsp);
4869         kfree(calldata);
4870 }
4871
4872 static const struct rpc_call_ops nfs4_release_lockowner_ops = {
4873         .rpc_release = nfs4_release_lockowner_release,
4874 };
4875
4876 int nfs4_release_lockowner(struct nfs4_lock_state *lsp)
4877 {
4878         struct nfs_server *server = lsp->ls_state->owner->so_server;
4879         struct nfs_release_lockowner_data *data;
4880         struct rpc_message msg = {
4881                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_RELEASE_LOCKOWNER],
4882         };
4883
4884         if (server->nfs_client->cl_mvops->minor_version != 0)
4885                 return -EINVAL;
4886         data = kmalloc(sizeof(*data), GFP_NOFS);
4887         if (!data)
4888                 return -ENOMEM;
4889         data->lsp = lsp;
4890         data->server = server;
4891         data->args.lock_owner.clientid = server->nfs_client->cl_clientid;
4892         data->args.lock_owner.id = lsp->ls_seqid.owner_id;
4893         data->args.lock_owner.s_dev = server->s_dev;
4894         msg.rpc_argp = &data->args;
4895         rpc_call_async(server->client, &msg, 0, &nfs4_release_lockowner_ops, data);
4896         return 0;
4897 }
4898
4899 #define XATTR_NAME_NFSV4_ACL "system.nfs4_acl"
4900
4901 static int nfs4_xattr_set_nfs4_acl(struct dentry *dentry, const char *key,
4902                                    const void *buf, size_t buflen,
4903                                    int flags, int type)
4904 {
4905         if (strcmp(key, "") != 0)
4906                 return -EINVAL;
4907
4908         return nfs4_proc_set_acl(dentry->d_inode, buf, buflen);
4909 }
4910
4911 static int nfs4_xattr_get_nfs4_acl(struct dentry *dentry, const char *key,
4912                                    void *buf, size_t buflen, int type)
4913 {
4914         if (strcmp(key, "") != 0)
4915                 return -EINVAL;
4916
4917         return nfs4_proc_get_acl(dentry->d_inode, buf, buflen);
4918 }
4919
4920 static size_t nfs4_xattr_list_nfs4_acl(struct dentry *dentry, char *list,
4921                                        size_t list_len, const char *name,
4922                                        size_t name_len, int type)
4923 {
4924         size_t len = sizeof(XATTR_NAME_NFSV4_ACL);
4925
4926         if (!nfs4_server_supports_acls(NFS_SERVER(dentry->d_inode)))
4927                 return 0;
4928
4929         if (list && len <= list_len)
4930                 memcpy(list, XATTR_NAME_NFSV4_ACL, len);
4931         return len;
4932 }
4933
4934 /*
4935  * nfs_fhget will use either the mounted_on_fileid or the fileid
4936  */
4937 static void nfs_fixup_referral_attributes(struct nfs_fattr *fattr)
4938 {
4939         if (!(((fattr->valid & NFS_ATTR_FATTR_MOUNTED_ON_FILEID) ||
4940                (fattr->valid & NFS_ATTR_FATTR_FILEID)) &&
4941               (fattr->valid & NFS_ATTR_FATTR_FSID) &&
4942               (fattr->valid & NFS_ATTR_FATTR_V4_LOCATIONS)))
4943                 return;
4944
4945         fattr->valid |= NFS_ATTR_FATTR_TYPE | NFS_ATTR_FATTR_MODE |
4946                 NFS_ATTR_FATTR_NLINK | NFS_ATTR_FATTR_V4_REFERRAL;
4947         fattr->mode = S_IFDIR | S_IRUGO | S_IXUGO;
4948         fattr->nlink = 2;
4949 }
4950
4951 static int _nfs4_proc_fs_locations(struct rpc_clnt *client, struct inode *dir,
4952                                    const struct qstr *name,
4953                                    struct nfs4_fs_locations *fs_locations,
4954                                    struct page *page)
4955 {
4956         struct nfs_server *server = NFS_SERVER(dir);
4957         u32 bitmask[2] = {
4958                 [0] = FATTR4_WORD0_FSID | FATTR4_WORD0_FS_LOCATIONS,
4959         };
4960         struct nfs4_fs_locations_arg args = {
4961                 .dir_fh = NFS_FH(dir),
4962                 .name = name,
4963                 .page = page,
4964                 .bitmask = bitmask,
4965         };
4966         struct nfs4_fs_locations_res res = {
4967                 .fs_locations = fs_locations,
4968         };
4969         struct rpc_message msg = {
4970                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_FS_LOCATIONS],
4971                 .rpc_argp = &args,
4972                 .rpc_resp = &res,
4973         };
4974         int status;
4975
4976         dprintk("%s: start\n", __func__);
4977
4978         /* Ask for the fileid of the absent filesystem if mounted_on_fileid
4979          * is not supported */
4980         if (NFS_SERVER(dir)->attr_bitmask[1] & FATTR4_WORD1_MOUNTED_ON_FILEID)
4981                 bitmask[1] |= FATTR4_WORD1_MOUNTED_ON_FILEID;
4982         else
4983                 bitmask[0] |= FATTR4_WORD0_FILEID;
4984
4985         nfs_fattr_init(&fs_locations->fattr);
4986         fs_locations->server = server;
4987         fs_locations->nlocations = 0;
4988         status = nfs4_call_sync(client, server, &msg, &args.seq_args, &res.seq_res, 0);
4989         dprintk("%s: returned status = %d\n", __func__, status);
4990         return status;
4991 }
4992
4993 int nfs4_proc_fs_locations(struct rpc_clnt *client, struct inode *dir,
4994                            const struct qstr *name,
4995                            struct nfs4_fs_locations *fs_locations,
4996                            struct page *page)
4997 {
4998         struct nfs4_exception exception = { };
4999         int err;
5000         do {
5001                 err = nfs4_handle_exception(NFS_SERVER(dir),
5002                                 _nfs4_proc_fs_locations(client, dir, name, fs_locations, page),
5003                                 &exception);
5004         } while (exception.retry);
5005         return err;
5006 }
5007
5008 static int _nfs4_proc_secinfo(struct inode *dir, const struct qstr *name, struct nfs4_secinfo_flavors *flavors)
5009 {
5010         int status;
5011         struct nfs4_secinfo_arg args = {
5012                 .dir_fh = NFS_FH(dir),
5013                 .name   = name,
5014         };
5015         struct nfs4_secinfo_res res = {
5016                 .flavors     = flavors,
5017         };
5018         struct rpc_message msg = {
5019                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SECINFO],
5020                 .rpc_argp = &args,
5021                 .rpc_resp = &res,
5022         };
5023
5024         dprintk("NFS call  secinfo %s\n", name->name);
5025         status = nfs4_call_sync(NFS_SERVER(dir)->client, NFS_SERVER(dir), &msg, &args.seq_args, &res.seq_res, 0);
5026         dprintk("NFS reply  secinfo: %d\n", status);
5027         return status;
5028 }
5029
5030 int nfs4_proc_secinfo(struct inode *dir, const struct qstr *name,
5031                       struct nfs4_secinfo_flavors *flavors)
5032 {
5033         struct nfs4_exception exception = { };
5034         int err;
5035         do {
5036                 err = nfs4_handle_exception(NFS_SERVER(dir),
5037                                 _nfs4_proc_secinfo(dir, name, flavors),
5038                                 &exception);
5039         } while (exception.retry);
5040         return err;
5041 }
5042
5043 #ifdef CONFIG_NFS_V4_1
5044 /*
5045  * Check the exchange flags returned by the server for invalid flags, having
5046  * both PNFS and NON_PNFS flags set, and not having one of NON_PNFS, PNFS, or
5047  * DS flags set.
5048  */
5049 static int nfs4_check_cl_exchange_flags(u32 flags)
5050 {
5051         if (flags & ~EXCHGID4_FLAG_MASK_R)
5052                 goto out_inval;
5053         if ((flags & EXCHGID4_FLAG_USE_PNFS_MDS) &&
5054             (flags & EXCHGID4_FLAG_USE_NON_PNFS))
5055                 goto out_inval;
5056         if (!(flags & (EXCHGID4_FLAG_MASK_PNFS)))
5057                 goto out_inval;
5058         return NFS_OK;
5059 out_inval:
5060         return -NFS4ERR_INVAL;
5061 }
5062
5063 static bool
5064 nfs41_same_server_scope(struct nfs41_server_scope *a,
5065                         struct nfs41_server_scope *b)
5066 {
5067         if (a->server_scope_sz == b->server_scope_sz &&
5068             memcmp(a->server_scope, b->server_scope, a->server_scope_sz) == 0)
5069                 return true;
5070
5071         return false;
5072 }
5073
5074 /*
5075  * nfs4_proc_exchange_id()
5076  *
5077  * Since the clientid has expired, all compounds using sessions
5078  * associated with the stale clientid will be returning
5079  * NFS4ERR_BADSESSION in the sequence operation, and will therefore
5080  * be in some phase of session reset.
5081  */
5082 int nfs4_proc_exchange_id(struct nfs_client *clp, struct rpc_cred *cred)
5083 {
5084         nfs4_verifier verifier;
5085         struct nfs41_exchange_id_args args = {
5086                 .verifier = &verifier,
5087                 .client = clp,
5088                 .flags = EXCHGID4_FLAG_SUPP_MOVED_REFER,
5089         };
5090         struct nfs41_exchange_id_res res = {
5091                 .client = clp,
5092         };
5093         int status;
5094         struct rpc_message msg = {
5095                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_EXCHANGE_ID],
5096                 .rpc_argp = &args,
5097                 .rpc_resp = &res,
5098                 .rpc_cred = cred,
5099         };
5100
5101         dprintk("--> %s\n", __func__);
5102         BUG_ON(clp == NULL);
5103
5104         nfs4_init_boot_verifier(clp, &verifier);
5105
5106         args.id_len = scnprintf(args.id, sizeof(args.id),
5107                                 "%s/%s/%u",
5108                                 clp->cl_ipaddr,
5109                                 clp->cl_rpcclient->cl_nodename,
5110                                 clp->cl_rpcclient->cl_auth->au_flavor);
5111
5112         res.server_owner = kzalloc(sizeof(struct nfs41_server_owner),
5113                                         GFP_KERNEL);
5114         if (unlikely(res.server_owner == NULL)) {
5115                 status = -ENOMEM;
5116                 goto out;
5117         }
5118
5119         res.server_scope = kzalloc(sizeof(struct nfs41_server_scope),
5120                                         GFP_KERNEL);
5121         if (unlikely(res.server_scope == NULL)) {
5122                 status = -ENOMEM;
5123                 goto out_server_owner;
5124         }
5125
5126         res.impl_id = kzalloc(sizeof(struct nfs41_impl_id), GFP_KERNEL);
5127         if (unlikely(res.impl_id == NULL)) {
5128                 status = -ENOMEM;
5129                 goto out_server_scope;
5130         }
5131
5132         status = rpc_call_sync(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
5133         if (status == 0)
5134                 status = nfs4_check_cl_exchange_flags(clp->cl_exchange_flags);
5135
5136         if (status == 0) {
5137                 kfree(clp->cl_serverowner);
5138                 clp->cl_serverowner = res.server_owner;
5139                 res.server_owner = NULL;
5140         }
5141
5142         if (status == 0) {
5143                 /* use the most recent implementation id */
5144                 kfree(clp->cl_implid);
5145                 clp->cl_implid = res.impl_id;
5146         } else
5147                 kfree(res.impl_id);
5148
5149         if (status == 0) {
5150                 if (clp->cl_serverscope != NULL &&
5151                     !nfs41_same_server_scope(clp->cl_serverscope,
5152                                              res.server_scope)) {
5153                         dprintk("%s: server_scope mismatch detected\n",
5154                                 __func__);
5155                         set_bit(NFS4CLNT_SERVER_SCOPE_MISMATCH, &clp->cl_state);
5156                         kfree(clp->cl_serverscope);
5157                         clp->cl_serverscope = NULL;
5158                 }
5159
5160                 if (clp->cl_serverscope == NULL) {
5161                         clp->cl_serverscope = res.server_scope;
5162                         goto out;
5163                 }
5164         }
5165
5166 out_server_owner:
5167         kfree(res.server_owner);
5168 out_server_scope:
5169         kfree(res.server_scope);
5170 out:
5171         if (clp->cl_implid != NULL)
5172                 dprintk("%s: Server Implementation ID: "
5173                         "domain: %s, name: %s, date: %llu,%u\n",
5174                         __func__, clp->cl_implid->domain, clp->cl_implid->name,
5175                         clp->cl_implid->date.seconds,
5176                         clp->cl_implid->date.nseconds);
5177         dprintk("<-- %s status= %d\n", __func__, status);
5178         return status;
5179 }
5180
5181 struct nfs4_get_lease_time_data {
5182         struct nfs4_get_lease_time_args *args;
5183         struct nfs4_get_lease_time_res *res;
5184         struct nfs_client *clp;
5185 };
5186
5187 static void nfs4_get_lease_time_prepare(struct rpc_task *task,
5188                                         void *calldata)
5189 {
5190         int ret;
5191         struct nfs4_get_lease_time_data *data =
5192                         (struct nfs4_get_lease_time_data *)calldata;
5193
5194         dprintk("--> %s\n", __func__);
5195         rpc_task_set_priority(task, RPC_PRIORITY_PRIVILEGED);
5196         /* just setup sequence, do not trigger session recovery
5197            since we're invoked within one */
5198         ret = nfs41_setup_sequence(data->clp->cl_session,
5199                                    &data->args->la_seq_args,
5200                                    &data->res->lr_seq_res, task);
5201
5202         BUG_ON(ret == -EAGAIN);
5203         rpc_call_start(task);
5204         dprintk("<-- %s\n", __func__);
5205 }
5206
5207 /*
5208  * Called from nfs4_state_manager thread for session setup, so don't recover
5209  * from sequence operation or clientid errors.
5210  */
5211 static void nfs4_get_lease_time_done(struct rpc_task *task, void *calldata)
5212 {
5213         struct nfs4_get_lease_time_data *data =
5214                         (struct nfs4_get_lease_time_data *)calldata;
5215
5216         dprintk("--> %s\n", __func__);
5217         if (!nfs41_sequence_done(task, &data->res->lr_seq_res))
5218                 return;
5219         switch (task->tk_status) {
5220         case -NFS4ERR_DELAY:
5221         case -NFS4ERR_GRACE:
5222                 dprintk("%s Retry: tk_status %d\n", __func__, task->tk_status);
5223                 rpc_delay(task, NFS4_POLL_RETRY_MIN);
5224                 task->tk_status = 0;
5225                 /* fall through */
5226         case -NFS4ERR_RETRY_UNCACHED_REP:
5227                 rpc_restart_call_prepare(task);
5228                 return;
5229         }
5230         dprintk("<-- %s\n", __func__);
5231 }
5232
5233 static const struct rpc_call_ops nfs4_get_lease_time_ops = {
5234         .rpc_call_prepare = nfs4_get_lease_time_prepare,
5235         .rpc_call_done = nfs4_get_lease_time_done,
5236 };
5237
5238 int nfs4_proc_get_lease_time(struct nfs_client *clp, struct nfs_fsinfo *fsinfo)
5239 {
5240         struct rpc_task *task;
5241         struct nfs4_get_lease_time_args args;
5242         struct nfs4_get_lease_time_res res = {
5243                 .lr_fsinfo = fsinfo,
5244         };
5245         struct nfs4_get_lease_time_data data = {
5246                 .args = &args,
5247                 .res = &res,
5248                 .clp = clp,
5249         };
5250         struct rpc_message msg = {
5251                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_GET_LEASE_TIME],
5252                 .rpc_argp = &args,
5253                 .rpc_resp = &res,
5254         };
5255         struct rpc_task_setup task_setup = {
5256                 .rpc_client = clp->cl_rpcclient,
5257                 .rpc_message = &msg,
5258                 .callback_ops = &nfs4_get_lease_time_ops,
5259                 .callback_data = &data,
5260                 .flags = RPC_TASK_TIMEOUT,
5261         };
5262         int status;
5263
5264         nfs41_init_sequence(&args.la_seq_args, &res.lr_seq_res, 0);
5265         dprintk("--> %s\n", __func__);
5266         task = rpc_run_task(&task_setup);
5267
5268         if (IS_ERR(task))
5269                 status = PTR_ERR(task);
5270         else {
5271                 status = task->tk_status;
5272                 rpc_put_task(task);
5273         }
5274         dprintk("<-- %s return %d\n", __func__, status);
5275
5276         return status;
5277 }
5278
5279 static struct nfs4_slot *nfs4_alloc_slots(u32 max_slots, gfp_t gfp_flags)
5280 {
5281         return kcalloc(max_slots, sizeof(struct nfs4_slot), gfp_flags);
5282 }
5283
5284 static void nfs4_add_and_init_slots(struct nfs4_slot_table *tbl,
5285                 struct nfs4_slot *new,
5286                 u32 max_slots,
5287                 u32 ivalue)
5288 {
5289         struct nfs4_slot *old = NULL;
5290         u32 i;
5291
5292         spin_lock(&tbl->slot_tbl_lock);
5293         if (new) {
5294                 old = tbl->slots;
5295                 tbl->slots = new;
5296                 tbl->max_slots = max_slots;
5297         }
5298         tbl->highest_used_slotid = -1;  /* no slot is currently used */
5299         for (i = 0; i < tbl->max_slots; i++)
5300                 tbl->slots[i].seq_nr = ivalue;
5301         spin_unlock(&tbl->slot_tbl_lock);
5302         kfree(old);
5303 }
5304
5305 /*
5306  * (re)Initialise a slot table
5307  */
5308 static int nfs4_realloc_slot_table(struct nfs4_slot_table *tbl, u32 max_reqs,
5309                                  u32 ivalue)
5310 {
5311         struct nfs4_slot *new = NULL;
5312         int ret = -ENOMEM;
5313
5314         dprintk("--> %s: max_reqs=%u, tbl->max_slots %d\n", __func__,
5315                 max_reqs, tbl->max_slots);
5316
5317         /* Does the newly negotiated max_reqs match the existing slot table? */
5318         if (max_reqs != tbl->max_slots) {
5319                 new = nfs4_alloc_slots(max_reqs, GFP_NOFS);
5320                 if (!new)
5321                         goto out;
5322         }
5323         ret = 0;
5324
5325         nfs4_add_and_init_slots(tbl, new, max_reqs, ivalue);
5326         dprintk("%s: tbl=%p slots=%p max_slots=%d\n", __func__,
5327                 tbl, tbl->slots, tbl->max_slots);
5328 out:
5329         dprintk("<-- %s: return %d\n", __func__, ret);
5330         return ret;
5331 }
5332
5333 /* Destroy the slot table */
5334 static void nfs4_destroy_slot_tables(struct nfs4_session *session)
5335 {
5336         if (session->fc_slot_table.slots != NULL) {
5337                 kfree(session->fc_slot_table.slots);
5338                 session->fc_slot_table.slots = NULL;
5339         }
5340         if (session->bc_slot_table.slots != NULL) {
5341                 kfree(session->bc_slot_table.slots);
5342                 session->bc_slot_table.slots = NULL;
5343         }
5344         return;
5345 }
5346
5347 /*
5348  * Initialize or reset the forechannel and backchannel tables
5349  */
5350 static int nfs4_setup_session_slot_tables(struct nfs4_session *ses)
5351 {
5352         struct nfs4_slot_table *tbl;
5353         int status;
5354
5355         dprintk("--> %s\n", __func__);
5356         /* Fore channel */
5357         tbl = &ses->fc_slot_table;
5358         status = nfs4_realloc_slot_table(tbl, ses->fc_attrs.max_reqs, 1);
5359         if (status) /* -ENOMEM */
5360                 return status;
5361         /* Back channel */
5362         tbl = &ses->bc_slot_table;
5363         status = nfs4_realloc_slot_table(tbl, ses->bc_attrs.max_reqs, 0);
5364         if (status && tbl->slots == NULL)
5365                 /* Fore and back channel share a connection so get
5366                  * both slot tables or neither */
5367                 nfs4_destroy_slot_tables(ses);
5368         return status;
5369 }
5370
5371 struct nfs4_session *nfs4_alloc_session(struct nfs_client *clp)
5372 {
5373         struct nfs4_session *session;
5374         struct nfs4_slot_table *tbl;
5375
5376         session = kzalloc(sizeof(struct nfs4_session), GFP_NOFS);
5377         if (!session)
5378                 return NULL;
5379
5380         tbl = &session->fc_slot_table;
5381         tbl->highest_used_slotid = NFS4_NO_SLOT;
5382         spin_lock_init(&tbl->slot_tbl_lock);
5383         rpc_init_priority_wait_queue(&tbl->slot_tbl_waitq, "ForeChannel Slot table");
5384         init_completion(&tbl->complete);
5385
5386         tbl = &session->bc_slot_table;
5387         tbl->highest_used_slotid = NFS4_NO_SLOT;
5388         spin_lock_init(&tbl->slot_tbl_lock);
5389         rpc_init_wait_queue(&tbl->slot_tbl_waitq, "BackChannel Slot table");
5390         init_completion(&tbl->complete);
5391
5392         session->session_state = 1<<NFS4_SESSION_INITING;
5393
5394         session->clp = clp;
5395         return session;
5396 }
5397
5398 void nfs4_destroy_session(struct nfs4_session *session)
5399 {
5400         struct rpc_xprt *xprt;
5401
5402         nfs4_proc_destroy_session(session);
5403
5404         rcu_read_lock();
5405         xprt = rcu_dereference(session->clp->cl_rpcclient->cl_xprt);
5406         rcu_read_unlock();
5407         dprintk("%s Destroy backchannel for xprt %p\n",
5408                 __func__, xprt);
5409         xprt_destroy_backchannel(xprt, NFS41_BC_MIN_CALLBACKS);
5410         nfs4_destroy_slot_tables(session);
5411         kfree(session);
5412 }
5413
5414 /*
5415  * Initialize the values to be used by the client in CREATE_SESSION
5416  * If nfs4_init_session set the fore channel request and response sizes,
5417  * use them.
5418  *
5419  * Set the back channel max_resp_sz_cached to zero to force the client to
5420  * always set csa_cachethis to FALSE because the current implementation
5421  * of the back channel DRC only supports caching the CB_SEQUENCE operation.
5422  */
5423 static void nfs4_init_channel_attrs(struct nfs41_create_session_args *args)
5424 {
5425         struct nfs4_session *session = args->client->cl_session;
5426         unsigned int mxrqst_sz = session->fc_attrs.max_rqst_sz,
5427                      mxresp_sz = session->fc_attrs.max_resp_sz;
5428
5429         if (mxrqst_sz == 0)
5430                 mxrqst_sz = NFS_MAX_FILE_IO_SIZE;
5431         if (mxresp_sz == 0)
5432                 mxresp_sz = NFS_MAX_FILE_IO_SIZE;
5433         /* Fore channel attributes */
5434         args->fc_attrs.max_rqst_sz = mxrqst_sz;
5435         args->fc_attrs.max_resp_sz = mxresp_sz;
5436         args->fc_attrs.max_ops = NFS4_MAX_OPS;
5437         args->fc_attrs.max_reqs = max_session_slots;
5438
5439         dprintk("%s: Fore Channel : max_rqst_sz=%u max_resp_sz=%u "
5440                 "max_ops=%u max_reqs=%u\n",
5441                 __func__,
5442                 args->fc_attrs.max_rqst_sz, args->fc_attrs.max_resp_sz,
5443                 args->fc_attrs.max_ops, args->fc_attrs.max_reqs);
5444
5445         /* Back channel attributes */
5446         args->bc_attrs.max_rqst_sz = PAGE_SIZE;
5447         args->bc_attrs.max_resp_sz = PAGE_SIZE;
5448         args->bc_attrs.max_resp_sz_cached = 0;
5449         args->bc_attrs.max_ops = NFS4_MAX_BACK_CHANNEL_OPS;
5450         args->bc_attrs.max_reqs = 1;
5451
5452         dprintk("%s: Back Channel : max_rqst_sz=%u max_resp_sz=%u "
5453                 "max_resp_sz_cached=%u max_ops=%u max_reqs=%u\n",
5454                 __func__,
5455                 args->bc_attrs.max_rqst_sz, args->bc_attrs.max_resp_sz,
5456                 args->bc_attrs.max_resp_sz_cached, args->bc_attrs.max_ops,
5457                 args->bc_attrs.max_reqs);
5458 }
5459
5460 static int nfs4_verify_fore_channel_attrs(struct nfs41_create_session_args *args, struct nfs4_session *session)
5461 {
5462         struct nfs4_channel_attrs *sent = &args->fc_attrs;
5463         struct nfs4_channel_attrs *rcvd = &session->fc_attrs;
5464
5465         if (rcvd->max_resp_sz > sent->max_resp_sz)
5466                 return -EINVAL;
5467         /*
5468          * Our requested max_ops is the minimum we need; we're not
5469          * prepared to break up compounds into smaller pieces than that.
5470          * So, no point even trying to continue if the server won't
5471          * cooperate:
5472          */
5473         if (rcvd->max_ops < sent->max_ops)
5474                 return -EINVAL;
5475         if (rcvd->max_reqs == 0)
5476                 return -EINVAL;
5477         if (rcvd->max_reqs > NFS4_MAX_SLOT_TABLE)
5478                 rcvd->max_reqs = NFS4_MAX_SLOT_TABLE;
5479         return 0;
5480 }
5481
5482 static int nfs4_verify_back_channel_attrs(struct nfs41_create_session_args *args, struct nfs4_session *session)
5483 {
5484         struct nfs4_channel_attrs *sent = &args->bc_attrs;
5485         struct nfs4_channel_attrs *rcvd = &session->bc_attrs;
5486
5487         if (rcvd->max_rqst_sz > sent->max_rqst_sz)
5488                 return -EINVAL;
5489         if (rcvd->max_resp_sz < sent->max_resp_sz)
5490                 return -EINVAL;
5491         if (rcvd->max_resp_sz_cached > sent->max_resp_sz_cached)
5492                 return -EINVAL;
5493         /* These would render the backchannel useless: */
5494         if (rcvd->max_ops != sent->max_ops)
5495                 return -EINVAL;
5496         if (rcvd->max_reqs != sent->max_reqs)
5497                 return -EINVAL;
5498         return 0;
5499 }
5500
5501 static int nfs4_verify_channel_attrs(struct nfs41_create_session_args *args,
5502                                      struct nfs4_session *session)
5503 {
5504         int ret;
5505
5506         ret = nfs4_verify_fore_channel_attrs(args, session);
5507         if (ret)
5508                 return ret;
5509         return nfs4_verify_back_channel_attrs(args, session);
5510 }
5511
5512 static int _nfs4_proc_create_session(struct nfs_client *clp)
5513 {
5514         struct nfs4_session *session = clp->cl_session;
5515         struct nfs41_create_session_args args = {
5516                 .client = clp,
5517                 .cb_program = NFS4_CALLBACK,
5518         };
5519         struct nfs41_create_session_res res = {
5520                 .client = clp,
5521         };
5522         struct rpc_message msg = {
5523                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_CREATE_SESSION],
5524                 .rpc_argp = &args,
5525                 .rpc_resp = &res,
5526         };
5527         int status;
5528
5529         nfs4_init_channel_attrs(&args);
5530         args.flags = (SESSION4_PERSIST | SESSION4_BACK_CHAN);
5531
5532         status = rpc_call_sync(session->clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
5533
5534         if (!status)
5535                 /* Verify the session's negotiated channel_attrs values */
5536                 status = nfs4_verify_channel_attrs(&args, session);
5537         if (!status) {
5538                 /* Increment the clientid slot sequence id */
5539                 clp->cl_seqid++;
5540         }
5541
5542         return status;
5543 }
5544
5545 /*
5546  * Issues a CREATE_SESSION operation to the server.
5547  * It is the responsibility of the caller to verify the session is
5548  * expired before calling this routine.
5549  */
5550 int nfs4_proc_create_session(struct nfs_client *clp)
5551 {
5552         int status;
5553         unsigned *ptr;
5554         struct nfs4_session *session = clp->cl_session;
5555
5556         dprintk("--> %s clp=%p session=%p\n", __func__, clp, session);
5557
5558         status = _nfs4_proc_create_session(clp);
5559         if (status)
5560                 goto out;
5561
5562         /* Init or reset the session slot tables */
5563         status = nfs4_setup_session_slot_tables(session);
5564         dprintk("slot table setup returned %d\n", status);
5565         if (status)
5566                 goto out;
5567
5568         ptr = (unsigned *)&session->sess_id.data[0];
5569         dprintk("%s client>seqid %d sessionid %u:%u:%u:%u\n", __func__,
5570                 clp->cl_seqid, ptr[0], ptr[1], ptr[2], ptr[3]);
5571 out:
5572         dprintk("<-- %s\n", __func__);
5573         return status;
5574 }
5575
5576 /*
5577  * Issue the over-the-wire RPC DESTROY_SESSION.
5578  * The caller must serialize access to this routine.
5579  */
5580 int nfs4_proc_destroy_session(struct nfs4_session *session)
5581 {
5582         int status = 0;
5583         struct rpc_message msg;
5584
5585         dprintk("--> nfs4_proc_destroy_session\n");
5586
5587         /* session is still being setup */
5588         if (session->clp->cl_cons_state != NFS_CS_READY)
5589                 return status;
5590
5591         msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_DESTROY_SESSION];
5592         msg.rpc_argp = session;
5593         msg.rpc_resp = NULL;
5594         msg.rpc_cred = NULL;
5595         status = rpc_call_sync(session->clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
5596
5597         if (status)
5598                 printk(KERN_WARNING
5599                         "NFS: Got error %d from the server on DESTROY_SESSION. "
5600                         "Session has been destroyed regardless...\n", status);
5601
5602         dprintk("<-- nfs4_proc_destroy_session\n");
5603         return status;
5604 }
5605
5606 /*
5607  * With sessions, the client is not marked ready until after a
5608  * successful EXCHANGE_ID and CREATE_SESSION.
5609  *
5610  * Map errors cl_cons_state errors to EPROTONOSUPPORT to indicate
5611  * other versions of NFS can be tried.
5612  */
5613 static int nfs41_check_session_ready(struct nfs_client *clp)
5614 {
5615         int ret;
5616         
5617         if (clp->cl_cons_state == NFS_CS_SESSION_INITING) {
5618                 ret = nfs4_client_recover_expired_lease(clp);
5619                 if (ret)
5620                         return ret;
5621         }
5622         if (clp->cl_cons_state < NFS_CS_READY)
5623                 return -EPROTONOSUPPORT;
5624         return 0;
5625 }
5626
5627 int nfs4_init_session(struct nfs_server *server)
5628 {
5629         struct nfs_client *clp = server->nfs_client;
5630         struct nfs4_session *session;
5631         unsigned int rsize, wsize;
5632
5633         if (!nfs4_has_session(clp))
5634                 return 0;
5635
5636         session = clp->cl_session;
5637         spin_lock(&clp->cl_lock);
5638         if (test_and_clear_bit(NFS4_SESSION_INITING, &session->session_state)) {
5639
5640                 rsize = server->rsize;
5641                 if (rsize == 0)
5642                         rsize = NFS_MAX_FILE_IO_SIZE;
5643                 wsize = server->wsize;
5644                 if (wsize == 0)
5645                         wsize = NFS_MAX_FILE_IO_SIZE;
5646
5647                 session->fc_attrs.max_rqst_sz = wsize + nfs41_maxwrite_overhead;
5648                 session->fc_attrs.max_resp_sz = rsize + nfs41_maxread_overhead;
5649         }
5650         spin_unlock(&clp->cl_lock);
5651
5652         return nfs41_check_session_ready(clp);
5653 }
5654
5655 int nfs4_init_ds_session(struct nfs_client *clp, unsigned long lease_time)
5656 {
5657         struct nfs4_session *session = clp->cl_session;
5658         int ret;
5659
5660         spin_lock(&clp->cl_lock);
5661         if (test_and_clear_bit(NFS4_SESSION_INITING, &session->session_state)) {
5662                 /*
5663                  * Do not set NFS_CS_CHECK_LEASE_TIME instead set the
5664                  * DS lease to be equal to the MDS lease.
5665                  */
5666                 clp->cl_lease_time = lease_time;
5667                 clp->cl_last_renewal = jiffies;
5668         }
5669         spin_unlock(&clp->cl_lock);
5670
5671         ret = nfs41_check_session_ready(clp);
5672         if (ret)
5673                 return ret;
5674         /* Test for the DS role */
5675         if (!is_ds_client(clp))
5676                 return -ENODEV;
5677         return 0;
5678 }
5679 EXPORT_SYMBOL_GPL(nfs4_init_ds_session);
5680
5681
5682 /*
5683  * Renew the cl_session lease.
5684  */
5685 struct nfs4_sequence_data {
5686         struct nfs_client *clp;
5687         struct nfs4_sequence_args args;
5688         struct nfs4_sequence_res res;
5689 };
5690
5691 static void nfs41_sequence_release(void *data)
5692 {
5693         struct nfs4_sequence_data *calldata = data;
5694         struct nfs_client *clp = calldata->clp;
5695
5696         if (atomic_read(&clp->cl_count) > 1)
5697                 nfs4_schedule_state_renewal(clp);
5698         nfs_put_client(clp);
5699         kfree(calldata);
5700 }
5701
5702 static int nfs41_sequence_handle_errors(struct rpc_task *task, struct nfs_client *clp)
5703 {
5704         switch(task->tk_status) {
5705         case -NFS4ERR_DELAY:
5706                 rpc_delay(task, NFS4_POLL_RETRY_MAX);
5707                 return -EAGAIN;
5708         default:
5709                 nfs4_schedule_lease_recovery(clp);
5710         }
5711         return 0;
5712 }
5713
5714 static void nfs41_sequence_call_done(struct rpc_task *task, void *data)
5715 {
5716         struct nfs4_sequence_data *calldata = data;
5717         struct nfs_client *clp = calldata->clp;
5718
5719         if (!nfs41_sequence_done(task, task->tk_msg.rpc_resp))
5720                 return;
5721
5722         if (task->tk_status < 0) {
5723                 dprintk("%s ERROR %d\n", __func__, task->tk_status);
5724                 if (atomic_read(&clp->cl_count) == 1)
5725                         goto out;
5726
5727                 if (nfs41_sequence_handle_errors(task, clp) == -EAGAIN) {
5728                         rpc_restart_call_prepare(task);
5729                         return;
5730                 }
5731         }
5732         dprintk("%s rpc_cred %p\n", __func__, task->tk_msg.rpc_cred);
5733 out:
5734         dprintk("<-- %s\n", __func__);
5735 }
5736
5737 static void nfs41_sequence_prepare(struct rpc_task *task, void *data)
5738 {
5739         struct nfs4_sequence_data *calldata = data;
5740         struct nfs_client *clp = calldata->clp;
5741         struct nfs4_sequence_args *args;
5742         struct nfs4_sequence_res *res;
5743
5744         args = task->tk_msg.rpc_argp;
5745         res = task->tk_msg.rpc_resp;
5746
5747         if (nfs41_setup_sequence(clp->cl_session, args, res, task))
5748                 return;
5749         rpc_call_start(task);
5750 }
5751
5752 static const struct rpc_call_ops nfs41_sequence_ops = {
5753         .rpc_call_done = nfs41_sequence_call_done,
5754         .rpc_call_prepare = nfs41_sequence_prepare,
5755         .rpc_release = nfs41_sequence_release,
5756 };
5757
5758 static struct rpc_task *_nfs41_proc_sequence(struct nfs_client *clp, struct rpc_cred *cred)
5759 {
5760         struct nfs4_sequence_data *calldata;
5761         struct rpc_message msg = {
5762                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SEQUENCE],
5763                 .rpc_cred = cred,
5764         };
5765         struct rpc_task_setup task_setup_data = {
5766                 .rpc_client = clp->cl_rpcclient,
5767                 .rpc_message = &msg,
5768                 .callback_ops = &nfs41_sequence_ops,
5769                 .flags = RPC_TASK_ASYNC | RPC_TASK_SOFT,
5770         };
5771
5772         if (!atomic_inc_not_zero(&clp->cl_count))
5773                 return ERR_PTR(-EIO);
5774         calldata = kzalloc(sizeof(*calldata), GFP_NOFS);
5775         if (calldata == NULL) {
5776                 nfs_put_client(clp);
5777                 return ERR_PTR(-ENOMEM);
5778         }
5779         nfs41_init_sequence(&calldata->args, &calldata->res, 0);
5780         msg.rpc_argp = &calldata->args;
5781         msg.rpc_resp = &calldata->res;
5782         calldata->clp = clp;
5783         task_setup_data.callback_data = calldata;
5784
5785         return rpc_run_task(&task_setup_data);
5786 }
5787
5788 static int nfs41_proc_async_sequence(struct nfs_client *clp, struct rpc_cred *cred, unsigned renew_flags)
5789 {
5790         struct rpc_task *task;
5791         int ret = 0;
5792
5793         if ((renew_flags & NFS4_RENEW_TIMEOUT) == 0)
5794                 return 0;
5795         task = _nfs41_proc_sequence(clp, cred);
5796         if (IS_ERR(task))
5797                 ret = PTR_ERR(task);
5798         else
5799                 rpc_put_task_async(task);
5800         dprintk("<-- %s status=%d\n", __func__, ret);
5801         return ret;
5802 }
5803
5804 static int nfs4_proc_sequence(struct nfs_client *clp, struct rpc_cred *cred)
5805 {
5806         struct rpc_task *task;
5807         int ret;
5808
5809         task = _nfs41_proc_sequence(clp, cred);
5810         if (IS_ERR(task)) {
5811                 ret = PTR_ERR(task);
5812                 goto out;
5813         }
5814         ret = rpc_wait_for_completion_task(task);
5815         if (!ret) {
5816                 struct nfs4_sequence_res *res = task->tk_msg.rpc_resp;
5817
5818                 if (task->tk_status == 0)
5819                         nfs41_handle_sequence_flag_errors(clp, res->sr_status_flags);
5820                 ret = task->tk_status;
5821         }
5822         rpc_put_task(task);
5823 out:
5824         dprintk("<-- %s status=%d\n", __func__, ret);
5825         return ret;
5826 }
5827
5828 struct nfs4_reclaim_complete_data {
5829         struct nfs_client *clp;
5830         struct nfs41_reclaim_complete_args arg;
5831         struct nfs41_reclaim_complete_res res;
5832 };
5833
5834 static void nfs4_reclaim_complete_prepare(struct rpc_task *task, void *data)
5835 {
5836         struct nfs4_reclaim_complete_data *calldata = data;
5837
5838         rpc_task_set_priority(task, RPC_PRIORITY_PRIVILEGED);
5839         if (nfs41_setup_sequence(calldata->clp->cl_session,
5840                                 &calldata->arg.seq_args,
5841                                 &calldata->res.seq_res, task))
5842                 return;
5843
5844         rpc_call_start(task);
5845 }
5846
5847 static int nfs41_reclaim_complete_handle_errors(struct rpc_task *task, struct nfs_client *clp)
5848 {
5849         switch(task->tk_status) {
5850         case 0:
5851         case -NFS4ERR_COMPLETE_ALREADY:
5852         case -NFS4ERR_WRONG_CRED: /* What to do here? */
5853                 break;
5854         case -NFS4ERR_DELAY:
5855                 rpc_delay(task, NFS4_POLL_RETRY_MAX);
5856                 /* fall through */
5857         case -NFS4ERR_RETRY_UNCACHED_REP:
5858                 return -EAGAIN;
5859         default:
5860                 nfs4_schedule_lease_recovery(clp);
5861         }
5862         return 0;
5863 }
5864
5865 static void nfs4_reclaim_complete_done(struct rpc_task *task, void *data)
5866 {
5867         struct nfs4_reclaim_complete_data *calldata = data;
5868         struct nfs_client *clp = calldata->clp;
5869         struct nfs4_sequence_res *res = &calldata->res.seq_res;
5870
5871         dprintk("--> %s\n", __func__);
5872         if (!nfs41_sequence_done(task, res))
5873                 return;
5874
5875         if (nfs41_reclaim_complete_handle_errors(task, clp) == -EAGAIN) {
5876                 rpc_restart_call_prepare(task);
5877                 return;
5878         }
5879         dprintk("<-- %s\n", __func__);
5880 }
5881
5882 static void nfs4_free_reclaim_complete_data(void *data)
5883 {
5884         struct nfs4_reclaim_complete_data *calldata = data;
5885
5886         kfree(calldata);
5887 }
5888
5889 static const struct rpc_call_ops nfs4_reclaim_complete_call_ops = {
5890         .rpc_call_prepare = nfs4_reclaim_complete_prepare,
5891         .rpc_call_done = nfs4_reclaim_complete_done,
5892         .rpc_release = nfs4_free_reclaim_complete_data,
5893 };
5894
5895 /*
5896  * Issue a global reclaim complete.
5897  */
5898 static int nfs41_proc_reclaim_complete(struct nfs_client *clp)
5899 {
5900         struct nfs4_reclaim_complete_data *calldata;
5901         struct rpc_task *task;
5902         struct rpc_message msg = {
5903                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_RECLAIM_COMPLETE],
5904         };
5905         struct rpc_task_setup task_setup_data = {
5906                 .rpc_client = clp->cl_rpcclient,
5907                 .rpc_message = &msg,
5908                 .callback_ops = &nfs4_reclaim_complete_call_ops,
5909                 .flags = RPC_TASK_ASYNC,
5910         };
5911         int status = -ENOMEM;
5912
5913         dprintk("--> %s\n", __func__);
5914         calldata = kzalloc(sizeof(*calldata), GFP_NOFS);
5915         if (calldata == NULL)
5916                 goto out;
5917         calldata->clp = clp;
5918         calldata->arg.one_fs = 0;
5919
5920         nfs41_init_sequence(&calldata->arg.seq_args, &calldata->res.seq_res, 0);
5921         msg.rpc_argp = &calldata->arg;
5922         msg.rpc_resp = &calldata->res;
5923         task_setup_data.callback_data = calldata;
5924         task = rpc_run_task(&task_setup_data);
5925         if (IS_ERR(task)) {
5926                 status = PTR_ERR(task);
5927                 goto out;
5928         }
5929         status = nfs4_wait_for_completion_rpc_task(task);
5930         if (status == 0)
5931                 status = task->tk_status;
5932         rpc_put_task(task);
5933         return 0;
5934 out:
5935         dprintk("<-- %s status=%d\n", __func__, status);
5936         return status;
5937 }
5938
5939 static void
5940 nfs4_layoutget_prepare(struct rpc_task *task, void *calldata)
5941 {
5942         struct nfs4_layoutget *lgp = calldata;
5943         struct nfs_server *server = NFS_SERVER(lgp->args.inode);
5944
5945         dprintk("--> %s\n", __func__);
5946         /* Note the is a race here, where a CB_LAYOUTRECALL can come in
5947          * right now covering the LAYOUTGET we are about to send.
5948          * However, that is not so catastrophic, and there seems
5949          * to be no way to prevent it completely.
5950          */
5951         if (nfs4_setup_sequence(server, &lgp->args.seq_args,
5952                                 &lgp->res.seq_res, task))
5953                 return;
5954         if (pnfs_choose_layoutget_stateid(&lgp->args.stateid,
5955                                           NFS_I(lgp->args.inode)->layout,
5956                                           lgp->args.ctx->state)) {
5957                 rpc_exit(task, NFS4_OK);
5958                 return;
5959         }
5960         rpc_call_start(task);
5961 }
5962
5963 static void nfs4_layoutget_done(struct rpc_task *task, void *calldata)
5964 {
5965         struct nfs4_layoutget *lgp = calldata;
5966         struct nfs_server *server = NFS_SERVER(lgp->args.inode);
5967
5968         dprintk("--> %s\n", __func__);
5969
5970         if (!nfs4_sequence_done(task, &lgp->res.seq_res))
5971                 return;
5972
5973         switch (task->tk_status) {
5974         case 0:
5975                 break;
5976         case -NFS4ERR_LAYOUTTRYLATER:
5977         case -NFS4ERR_RECALLCONFLICT:
5978                 task->tk_status = -NFS4ERR_DELAY;
5979                 /* Fall through */
5980         default:
5981                 if (nfs4_async_handle_error(task, server, NULL) == -EAGAIN) {
5982                         rpc_restart_call_prepare(task);
5983                         return;
5984                 }
5985         }
5986         dprintk("<-- %s\n", __func__);
5987 }
5988
5989 static void nfs4_layoutget_release(void *calldata)
5990 {
5991         struct nfs4_layoutget *lgp = calldata;
5992
5993         dprintk("--> %s\n", __func__);
5994         put_nfs_open_context(lgp->args.ctx);
5995         kfree(calldata);
5996         dprintk("<-- %s\n", __func__);
5997 }
5998
5999 static const struct rpc_call_ops nfs4_layoutget_call_ops = {
6000         .rpc_call_prepare = nfs4_layoutget_prepare,
6001         .rpc_call_done = nfs4_layoutget_done,
6002         .rpc_release = nfs4_layoutget_release,
6003 };
6004
6005 int nfs4_proc_layoutget(struct nfs4_layoutget *lgp)
6006 {
6007         struct nfs_server *server = NFS_SERVER(lgp->args.inode);
6008         struct rpc_task *task;
6009         struct rpc_message msg = {
6010                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LAYOUTGET],
6011                 .rpc_argp = &lgp->args,
6012                 .rpc_resp = &lgp->res,
6013         };
6014         struct rpc_task_setup task_setup_data = {
6015                 .rpc_client = server->client,
6016                 .rpc_message = &msg,
6017                 .callback_ops = &nfs4_layoutget_call_ops,
6018                 .callback_data = lgp,
6019                 .flags = RPC_TASK_ASYNC,
6020         };
6021         int status = 0;
6022
6023         dprintk("--> %s\n", __func__);
6024
6025         lgp->res.layoutp = &lgp->args.layout;
6026         lgp->res.seq_res.sr_slot = NULL;
6027         nfs41_init_sequence(&lgp->args.seq_args, &lgp->res.seq_res, 0);
6028         task = rpc_run_task(&task_setup_data);
6029         if (IS_ERR(task))
6030                 return PTR_ERR(task);
6031         status = nfs4_wait_for_completion_rpc_task(task);
6032         if (status == 0)
6033                 status = task->tk_status;
6034         if (status == 0)
6035                 status = pnfs_layout_process(lgp);
6036         rpc_put_task(task);
6037         dprintk("<-- %s status=%d\n", __func__, status);
6038         return status;
6039 }
6040
6041 static void
6042 nfs4_layoutreturn_prepare(struct rpc_task *task, void *calldata)
6043 {
6044         struct nfs4_layoutreturn *lrp = calldata;
6045
6046         dprintk("--> %s\n", __func__);
6047         if (nfs41_setup_sequence(lrp->clp->cl_session, &lrp->args.seq_args,
6048                                 &lrp->res.seq_res, task))
6049                 return;
6050         rpc_call_start(task);
6051 }
6052
6053 static void nfs4_layoutreturn_done(struct rpc_task *task, void *calldata)
6054 {
6055         struct nfs4_layoutreturn *lrp = calldata;
6056         struct nfs_server *server;
6057         struct pnfs_layout_hdr *lo = lrp->args.layout;
6058
6059         dprintk("--> %s\n", __func__);
6060
6061         if (!nfs4_sequence_done(task, &lrp->res.seq_res))
6062                 return;
6063
6064         server = NFS_SERVER(lrp->args.inode);
6065         if (nfs4_async_handle_error(task, server, NULL) == -EAGAIN) {
6066                 rpc_restart_call_prepare(task);
6067                 return;
6068         }
6069         spin_lock(&lo->plh_inode->i_lock);
6070         if (task->tk_status == 0) {
6071                 if (lrp->res.lrs_present) {
6072                         pnfs_set_layout_stateid(lo, &lrp->res.stateid, true);
6073                 } else
6074                         BUG_ON(!list_empty(&lo->plh_segs));
6075         }
6076         lo->plh_block_lgets--;
6077         spin_unlock(&lo->plh_inode->i_lock);
6078         dprintk("<-- %s\n", __func__);
6079 }
6080
6081 static void nfs4_layoutreturn_release(void *calldata)
6082 {
6083         struct nfs4_layoutreturn *lrp = calldata;
6084
6085         dprintk("--> %s\n", __func__);
6086         put_layout_hdr(lrp->args.layout);
6087         kfree(calldata);
6088         dprintk("<-- %s\n", __func__);
6089 }
6090
6091 static const struct rpc_call_ops nfs4_layoutreturn_call_ops = {
6092         .rpc_call_prepare = nfs4_layoutreturn_prepare,
6093         .rpc_call_done = nfs4_layoutreturn_done,
6094         .rpc_release = nfs4_layoutreturn_release,
6095 };
6096
6097 int nfs4_proc_layoutreturn(struct nfs4_layoutreturn *lrp)
6098 {
6099         struct rpc_task *task;
6100         struct rpc_message msg = {
6101                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LAYOUTRETURN],
6102                 .rpc_argp = &lrp->args,
6103                 .rpc_resp = &lrp->res,
6104         };
6105         struct rpc_task_setup task_setup_data = {
6106                 .rpc_client = lrp->clp->cl_rpcclient,
6107                 .rpc_message = &msg,
6108                 .callback_ops = &nfs4_layoutreturn_call_ops,
6109                 .callback_data = lrp,
6110         };
6111         int status;
6112
6113         dprintk("--> %s\n", __func__);
6114         nfs41_init_sequence(&lrp->args.seq_args, &lrp->res.seq_res, 1);
6115         task = rpc_run_task(&task_setup_data);
6116         if (IS_ERR(task))
6117                 return PTR_ERR(task);
6118         status = task->tk_status;
6119         dprintk("<-- %s status=%d\n", __func__, status);
6120         rpc_put_task(task);
6121         return status;
6122 }
6123
6124 /*
6125  * Retrieve the list of Data Server devices from the MDS.
6126  */
6127 static int _nfs4_getdevicelist(struct nfs_server *server,
6128                                     const struct nfs_fh *fh,
6129                                     struct pnfs_devicelist *devlist)
6130 {
6131         struct nfs4_getdevicelist_args args = {
6132                 .fh = fh,
6133                 .layoutclass = server->pnfs_curr_ld->id,
6134         };
6135         struct nfs4_getdevicelist_res res = {
6136                 .devlist = devlist,
6137         };
6138         struct rpc_message msg = {
6139                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_GETDEVICELIST],
6140                 .rpc_argp = &args,
6141                 .rpc_resp = &res,
6142         };
6143         int status;
6144
6145         dprintk("--> %s\n", __func__);
6146         status = nfs4_call_sync(server->client, server, &msg, &args.seq_args,
6147                                 &res.seq_res, 0);
6148         dprintk("<-- %s status=%d\n", __func__, status);
6149         return status;
6150 }
6151
6152 int nfs4_proc_getdevicelist(struct nfs_server *server,
6153                             const struct nfs_fh *fh,
6154                             struct pnfs_devicelist *devlist)
6155 {
6156         struct nfs4_exception exception = { };
6157         int err;
6158
6159         do {
6160                 err = nfs4_handle_exception(server,
6161                                 _nfs4_getdevicelist(server, fh, devlist),
6162                                 &exception);
6163         } while (exception.retry);
6164
6165         dprintk("%s: err=%d, num_devs=%u\n", __func__,
6166                 err, devlist->num_devs);
6167
6168         return err;
6169 }
6170 EXPORT_SYMBOL_GPL(nfs4_proc_getdevicelist);
6171
6172 static int
6173 _nfs4_proc_getdeviceinfo(struct nfs_server *server, struct pnfs_device *pdev)
6174 {
6175         struct nfs4_getdeviceinfo_args args = {
6176                 .pdev = pdev,
6177         };
6178         struct nfs4_getdeviceinfo_res res = {
6179                 .pdev = pdev,
6180         };
6181         struct rpc_message msg = {
6182                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_GETDEVICEINFO],
6183                 .rpc_argp = &args,
6184                 .rpc_resp = &res,
6185         };
6186         int status;
6187
6188         dprintk("--> %s\n", __func__);
6189         status = nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
6190         dprintk("<-- %s status=%d\n", __func__, status);
6191
6192         return status;
6193 }
6194
6195 int nfs4_proc_getdeviceinfo(struct nfs_server *server, struct pnfs_device *pdev)
6196 {
6197         struct nfs4_exception exception = { };
6198         int err;
6199
6200         do {
6201                 err = nfs4_handle_exception(server,
6202                                         _nfs4_proc_getdeviceinfo(server, pdev),
6203                                         &exception);
6204         } while (exception.retry);
6205         return err;
6206 }
6207 EXPORT_SYMBOL_GPL(nfs4_proc_getdeviceinfo);
6208
6209 static void nfs4_layoutcommit_prepare(struct rpc_task *task, void *calldata)
6210 {
6211         struct nfs4_layoutcommit_data *data = calldata;
6212         struct nfs_server *server = NFS_SERVER(data->args.inode);
6213
6214         if (nfs4_setup_sequence(server, &data->args.seq_args,
6215                                 &data->res.seq_res, task))
6216                 return;
6217         rpc_call_start(task);
6218 }
6219
6220 static void
6221 nfs4_layoutcommit_done(struct rpc_task *task, void *calldata)
6222 {
6223         struct nfs4_layoutcommit_data *data = calldata;
6224         struct nfs_server *server = NFS_SERVER(data->args.inode);
6225
6226         if (!nfs4_sequence_done(task, &data->res.seq_res))
6227                 return;
6228
6229         switch (task->tk_status) { /* Just ignore these failures */
6230         case -NFS4ERR_DELEG_REVOKED: /* layout was recalled */
6231         case -NFS4ERR_BADIOMODE:     /* no IOMODE_RW layout for range */
6232         case -NFS4ERR_BADLAYOUT:     /* no layout */
6233         case -NFS4ERR_GRACE:        /* loca_recalim always false */
6234                 task->tk_status = 0;
6235                 break;
6236         case 0:
6237                 nfs_post_op_update_inode_force_wcc(data->args.inode,
6238                                                    data->res.fattr);
6239                 break;
6240         default:
6241                 if (nfs4_async_handle_error(task, server, NULL) == -EAGAIN) {
6242                         rpc_restart_call_prepare(task);
6243                         return;
6244                 }
6245         }
6246 }
6247
6248 static void nfs4_layoutcommit_release(void *calldata)
6249 {
6250         struct nfs4_layoutcommit_data *data = calldata;
6251         struct pnfs_layout_segment *lseg, *tmp;
6252         unsigned long *bitlock = &NFS_I(data->args.inode)->flags;
6253
6254         pnfs_cleanup_layoutcommit(data);
6255         /* Matched by references in pnfs_set_layoutcommit */
6256         list_for_each_entry_safe(lseg, tmp, &data->lseg_list, pls_lc_list) {
6257                 list_del_init(&lseg->pls_lc_list);
6258                 if (test_and_clear_bit(NFS_LSEG_LAYOUTCOMMIT,
6259                                        &lseg->pls_flags))
6260                         put_lseg(lseg);
6261         }
6262
6263         clear_bit_unlock(NFS_INO_LAYOUTCOMMITTING, bitlock);
6264         smp_mb__after_clear_bit();
6265         wake_up_bit(bitlock, NFS_INO_LAYOUTCOMMITTING);
6266
6267         put_rpccred(data->cred);
6268         kfree(data);
6269 }
6270
6271 static const struct rpc_call_ops nfs4_layoutcommit_ops = {
6272         .rpc_call_prepare = nfs4_layoutcommit_prepare,
6273         .rpc_call_done = nfs4_layoutcommit_done,
6274         .rpc_release = nfs4_layoutcommit_release,
6275 };
6276
6277 int
6278 nfs4_proc_layoutcommit(struct nfs4_layoutcommit_data *data, bool sync)
6279 {
6280         struct rpc_message msg = {
6281                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LAYOUTCOMMIT],
6282                 .rpc_argp = &data->args,
6283                 .rpc_resp = &data->res,
6284                 .rpc_cred = data->cred,
6285         };
6286         struct rpc_task_setup task_setup_data = {
6287                 .task = &data->task,
6288                 .rpc_client = NFS_CLIENT(data->args.inode),
6289                 .rpc_message = &msg,
6290                 .callback_ops = &nfs4_layoutcommit_ops,
6291                 .callback_data = data,
6292                 .flags = RPC_TASK_ASYNC,
6293         };
6294         struct rpc_task *task;
6295         int status = 0;
6296
6297         dprintk("NFS: %4d initiating layoutcommit call. sync %d "
6298                 "lbw: %llu inode %lu\n",
6299                 data->task.tk_pid, sync,
6300                 data->args.lastbytewritten,
6301                 data->args.inode->i_ino);
6302
6303         nfs41_init_sequence(&data->args.seq_args, &data->res.seq_res, 1);
6304         task = rpc_run_task(&task_setup_data);
6305         if (IS_ERR(task))
6306                 return PTR_ERR(task);
6307         if (sync == false)
6308                 goto out;
6309         status = nfs4_wait_for_completion_rpc_task(task);
6310         if (status != 0)
6311                 goto out;
6312         status = task->tk_status;
6313 out:
6314         dprintk("%s: status %d\n", __func__, status);
6315         rpc_put_task(task);
6316         return status;
6317 }
6318
6319 static int
6320 _nfs41_proc_secinfo_no_name(struct nfs_server *server, struct nfs_fh *fhandle,
6321                     struct nfs_fsinfo *info, struct nfs4_secinfo_flavors *flavors)
6322 {
6323         struct nfs41_secinfo_no_name_args args = {
6324                 .style = SECINFO_STYLE_CURRENT_FH,
6325         };
6326         struct nfs4_secinfo_res res = {
6327                 .flavors = flavors,
6328         };
6329         struct rpc_message msg = {
6330                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SECINFO_NO_NAME],
6331                 .rpc_argp = &args,
6332                 .rpc_resp = &res,
6333         };
6334         return nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
6335 }
6336
6337 static int
6338 nfs41_proc_secinfo_no_name(struct nfs_server *server, struct nfs_fh *fhandle,
6339                            struct nfs_fsinfo *info, struct nfs4_secinfo_flavors *flavors)
6340 {
6341         struct nfs4_exception exception = { };
6342         int err;
6343         do {
6344                 err = _nfs41_proc_secinfo_no_name(server, fhandle, info, flavors);
6345                 switch (err) {
6346                 case 0:
6347                 case -NFS4ERR_WRONGSEC:
6348                 case -NFS4ERR_NOTSUPP:
6349                         goto out;
6350                 default:
6351                         err = nfs4_handle_exception(server, err, &exception);
6352                 }
6353         } while (exception.retry);
6354 out:
6355         return err;
6356 }
6357
6358 static int
6359 nfs41_find_root_sec(struct nfs_server *server, struct nfs_fh *fhandle,
6360                     struct nfs_fsinfo *info)
6361 {
6362         int err;
6363         struct page *page;
6364         rpc_authflavor_t flavor;
6365         struct nfs4_secinfo_flavors *flavors;
6366
6367         page = alloc_page(GFP_KERNEL);
6368         if (!page) {
6369                 err = -ENOMEM;
6370                 goto out;
6371         }
6372
6373         flavors = page_address(page);
6374         err = nfs41_proc_secinfo_no_name(server, fhandle, info, flavors);
6375
6376         /*
6377          * Fall back on "guess and check" method if
6378          * the server doesn't support SECINFO_NO_NAME
6379          */
6380         if (err == -NFS4ERR_WRONGSEC || err == -NFS4ERR_NOTSUPP) {
6381                 err = nfs4_find_root_sec(server, fhandle, info);
6382                 goto out_freepage;
6383         }
6384         if (err)
6385                 goto out_freepage;
6386
6387         flavor = nfs_find_best_sec(flavors);
6388         if (err == 0)
6389                 err = nfs4_lookup_root_sec(server, fhandle, info, flavor);
6390
6391 out_freepage:
6392         put_page(page);
6393         if (err == -EACCES)
6394                 return -EPERM;
6395 out:
6396         return err;
6397 }
6398
6399 static int _nfs41_test_stateid(struct nfs_server *server, nfs4_stateid *stateid)
6400 {
6401         int status;
6402         struct nfs41_test_stateid_args args = {
6403                 .stateid = stateid,
6404         };
6405         struct nfs41_test_stateid_res res;
6406         struct rpc_message msg = {
6407                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_TEST_STATEID],
6408                 .rpc_argp = &args,
6409                 .rpc_resp = &res,
6410         };
6411
6412         nfs41_init_sequence(&args.seq_args, &res.seq_res, 0);
6413         status = nfs4_call_sync_sequence(server->client, server, &msg, &args.seq_args, &res.seq_res, 1);
6414
6415         if (status == NFS_OK)
6416                 return res.status;
6417         return status;
6418 }
6419
6420 static int nfs41_test_stateid(struct nfs_server *server, nfs4_stateid *stateid)
6421 {
6422         struct nfs4_exception exception = { };
6423         int err;
6424         do {
6425                 err = nfs4_handle_exception(server,
6426                                 _nfs41_test_stateid(server, stateid),
6427                                 &exception);
6428         } while (exception.retry);
6429         return err;
6430 }
6431
6432 static int _nfs4_free_stateid(struct nfs_server *server, nfs4_stateid *stateid)
6433 {
6434         struct nfs41_free_stateid_args args = {
6435                 .stateid = stateid,
6436         };
6437         struct nfs41_free_stateid_res res;
6438         struct rpc_message msg = {
6439                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_FREE_STATEID],
6440                 .rpc_argp = &args,
6441                 .rpc_resp = &res,
6442         };
6443
6444         nfs41_init_sequence(&args.seq_args, &res.seq_res, 0);
6445         return nfs4_call_sync_sequence(server->client, server, &msg, &args.seq_args, &res.seq_res, 1);
6446 }
6447
6448 static int nfs41_free_stateid(struct nfs_server *server, nfs4_stateid *stateid)
6449 {
6450         struct nfs4_exception exception = { };
6451         int err;
6452         do {
6453                 err = nfs4_handle_exception(server,
6454                                 _nfs4_free_stateid(server, stateid),
6455                                 &exception);
6456         } while (exception.retry);
6457         return err;
6458 }
6459
6460 static bool nfs41_match_stateid(const nfs4_stateid *s1,
6461                 const nfs4_stateid *s2)
6462 {
6463         if (memcmp(s1->other, s2->other, sizeof(s1->other)) != 0)
6464                 return false;
6465
6466         if (s1->seqid == s2->seqid)
6467                 return true;
6468         if (s1->seqid == 0 || s2->seqid == 0)
6469                 return true;
6470
6471         return false;
6472 }
6473
6474 #endif /* CONFIG_NFS_V4_1 */
6475
6476 static bool nfs4_match_stateid(const nfs4_stateid *s1,
6477                 const nfs4_stateid *s2)
6478 {
6479         return nfs4_stateid_match(s1, s2);
6480 }
6481
6482
6483 static const struct nfs4_state_recovery_ops nfs40_reboot_recovery_ops = {
6484         .owner_flag_bit = NFS_OWNER_RECLAIM_REBOOT,
6485         .state_flag_bit = NFS_STATE_RECLAIM_REBOOT,
6486         .recover_open   = nfs4_open_reclaim,
6487         .recover_lock   = nfs4_lock_reclaim,
6488         .establish_clid = nfs4_init_clientid,
6489         .get_clid_cred  = nfs4_get_setclientid_cred,
6490 };
6491
6492 #if defined(CONFIG_NFS_V4_1)
6493 static const struct nfs4_state_recovery_ops nfs41_reboot_recovery_ops = {
6494         .owner_flag_bit = NFS_OWNER_RECLAIM_REBOOT,
6495         .state_flag_bit = NFS_STATE_RECLAIM_REBOOT,
6496         .recover_open   = nfs4_open_reclaim,
6497         .recover_lock   = nfs4_lock_reclaim,
6498         .establish_clid = nfs41_init_clientid,
6499         .get_clid_cred  = nfs4_get_exchange_id_cred,
6500         .reclaim_complete = nfs41_proc_reclaim_complete,
6501 };
6502 #endif /* CONFIG_NFS_V4_1 */
6503
6504 static const struct nfs4_state_recovery_ops nfs40_nograce_recovery_ops = {
6505         .owner_flag_bit = NFS_OWNER_RECLAIM_NOGRACE,
6506         .state_flag_bit = NFS_STATE_RECLAIM_NOGRACE,
6507         .recover_open   = nfs4_open_expired,
6508         .recover_lock   = nfs4_lock_expired,
6509         .establish_clid = nfs4_init_clientid,
6510         .get_clid_cred  = nfs4_get_setclientid_cred,
6511 };
6512
6513 #if defined(CONFIG_NFS_V4_1)
6514 static const struct nfs4_state_recovery_ops nfs41_nograce_recovery_ops = {
6515         .owner_flag_bit = NFS_OWNER_RECLAIM_NOGRACE,
6516         .state_flag_bit = NFS_STATE_RECLAIM_NOGRACE,
6517         .recover_open   = nfs41_open_expired,
6518         .recover_lock   = nfs41_lock_expired,
6519         .establish_clid = nfs41_init_clientid,
6520         .get_clid_cred  = nfs4_get_exchange_id_cred,
6521 };
6522 #endif /* CONFIG_NFS_V4_1 */
6523
6524 static const struct nfs4_state_maintenance_ops nfs40_state_renewal_ops = {
6525         .sched_state_renewal = nfs4_proc_async_renew,
6526         .get_state_renewal_cred_locked = nfs4_get_renew_cred_locked,
6527         .renew_lease = nfs4_proc_renew,
6528 };
6529
6530 #if defined(CONFIG_NFS_V4_1)
6531 static const struct nfs4_state_maintenance_ops nfs41_state_renewal_ops = {
6532         .sched_state_renewal = nfs41_proc_async_sequence,
6533         .get_state_renewal_cred_locked = nfs4_get_machine_cred_locked,
6534         .renew_lease = nfs4_proc_sequence,
6535 };
6536 #endif
6537
6538 static const struct nfs4_minor_version_ops nfs_v4_0_minor_ops = {
6539         .minor_version = 0,
6540         .call_sync = _nfs4_call_sync,
6541         .match_stateid = nfs4_match_stateid,
6542         .find_root_sec = nfs4_find_root_sec,
6543         .reboot_recovery_ops = &nfs40_reboot_recovery_ops,
6544         .nograce_recovery_ops = &nfs40_nograce_recovery_ops,
6545         .state_renewal_ops = &nfs40_state_renewal_ops,
6546 };
6547
6548 #if defined(CONFIG_NFS_V4_1)
6549 static const struct nfs4_minor_version_ops nfs_v4_1_minor_ops = {
6550         .minor_version = 1,
6551         .call_sync = _nfs4_call_sync_session,
6552         .match_stateid = nfs41_match_stateid,
6553         .find_root_sec = nfs41_find_root_sec,
6554         .reboot_recovery_ops = &nfs41_reboot_recovery_ops,
6555         .nograce_recovery_ops = &nfs41_nograce_recovery_ops,
6556         .state_renewal_ops = &nfs41_state_renewal_ops,
6557 };
6558 #endif
6559
6560 const struct nfs4_minor_version_ops *nfs_v4_minor_ops[] = {
6561         [0] = &nfs_v4_0_minor_ops,
6562 #if defined(CONFIG_NFS_V4_1)
6563         [1] = &nfs_v4_1_minor_ops,
6564 #endif
6565 };
6566
6567 static const struct inode_operations nfs4_file_inode_operations = {
6568         .permission     = nfs_permission,
6569         .getattr        = nfs_getattr,
6570         .setattr        = nfs_setattr,
6571         .getxattr       = generic_getxattr,
6572         .setxattr       = generic_setxattr,
6573         .listxattr      = generic_listxattr,
6574         .removexattr    = generic_removexattr,
6575 };
6576
6577 const struct nfs_rpc_ops nfs_v4_clientops = {
6578         .version        = 4,                    /* protocol version */
6579         .dentry_ops     = &nfs4_dentry_operations,
6580         .dir_inode_ops  = &nfs4_dir_inode_operations,
6581         .file_inode_ops = &nfs4_file_inode_operations,
6582         .file_ops       = &nfs4_file_operations,
6583         .getroot        = nfs4_proc_get_root,
6584         .submount       = nfs4_submount,
6585         .getattr        = nfs4_proc_getattr,
6586         .setattr        = nfs4_proc_setattr,
6587         .lookup         = nfs4_proc_lookup,
6588         .access         = nfs4_proc_access,
6589         .readlink       = nfs4_proc_readlink,
6590         .create         = nfs4_proc_create,
6591         .remove         = nfs4_proc_remove,
6592         .unlink_setup   = nfs4_proc_unlink_setup,
6593         .unlink_rpc_prepare = nfs4_proc_unlink_rpc_prepare,
6594         .unlink_done    = nfs4_proc_unlink_done,
6595         .rename         = nfs4_proc_rename,
6596         .rename_setup   = nfs4_proc_rename_setup,
6597         .rename_rpc_prepare = nfs4_proc_rename_rpc_prepare,
6598         .rename_done    = nfs4_proc_rename_done,
6599         .link           = nfs4_proc_link,
6600         .symlink        = nfs4_proc_symlink,
6601         .mkdir          = nfs4_proc_mkdir,
6602         .rmdir          = nfs4_proc_remove,
6603         .readdir        = nfs4_proc_readdir,
6604         .mknod          = nfs4_proc_mknod,
6605         .statfs         = nfs4_proc_statfs,
6606         .fsinfo         = nfs4_proc_fsinfo,
6607         .pathconf       = nfs4_proc_pathconf,
6608         .set_capabilities = nfs4_server_capabilities,
6609         .decode_dirent  = nfs4_decode_dirent,
6610         .read_setup     = nfs4_proc_read_setup,
6611         .read_rpc_prepare = nfs4_proc_read_rpc_prepare,
6612         .read_done      = nfs4_read_done,
6613         .write_setup    = nfs4_proc_write_setup,
6614         .write_rpc_prepare = nfs4_proc_write_rpc_prepare,
6615         .write_done     = nfs4_write_done,
6616         .commit_setup   = nfs4_proc_commit_setup,
6617         .commit_rpc_prepare = nfs4_proc_commit_rpc_prepare,
6618         .commit_done    = nfs4_commit_done,
6619         .lock           = nfs4_proc_lock,
6620         .clear_acl_cache = nfs4_zap_acl_attr,
6621         .close_context  = nfs4_close_context,
6622         .open_context   = nfs4_atomic_open,
6623         .init_client    = nfs4_init_client,
6624 };
6625
6626 static const struct xattr_handler nfs4_xattr_nfs4_acl_handler = {
6627         .prefix = XATTR_NAME_NFSV4_ACL,
6628         .list   = nfs4_xattr_list_nfs4_acl,
6629         .get    = nfs4_xattr_get_nfs4_acl,
6630         .set    = nfs4_xattr_set_nfs4_acl,
6631 };
6632
6633 const struct xattr_handler *nfs4_xattr_handlers[] = {
6634         &nfs4_xattr_nfs4_acl_handler,
6635         NULL
6636 };
6637
6638 module_param(max_session_slots, ushort, 0644);
6639 MODULE_PARM_DESC(max_session_slots, "Maximum number of outstanding NFSv4.1 "
6640                 "requests the client will negotiate");
6641
6642 /*
6643  * Local variables:
6644  *  c-basic-offset: 8
6645  * End:
6646  */