NFSv4.1: Ensure we call FREE_STATEID if needed on close/delegreturn/locku
[cascardo/linux.git] / fs / nfs / nfs4proc.c
1 /*
2  *  fs/nfs/nfs4proc.c
3  *
4  *  Client-side procedure declarations for NFSv4.
5  *
6  *  Copyright (c) 2002 The Regents of the University of Michigan.
7  *  All rights reserved.
8  *
9  *  Kendrick Smith <kmsmith@umich.edu>
10  *  Andy Adamson   <andros@umich.edu>
11  *
12  *  Redistribution and use in source and binary forms, with or without
13  *  modification, are permitted provided that the following conditions
14  *  are met:
15  *
16  *  1. Redistributions of source code must retain the above copyright
17  *     notice, this list of conditions and the following disclaimer.
18  *  2. Redistributions in binary form must reproduce the above copyright
19  *     notice, this list of conditions and the following disclaimer in the
20  *     documentation and/or other materials provided with the distribution.
21  *  3. Neither the name of the University nor the names of its
22  *     contributors may be used to endorse or promote products derived
23  *     from this software without specific prior written permission.
24  *
25  *  THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED
26  *  WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
27  *  MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
28  *  DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
29  *  FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
30  *  CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
31  *  SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
32  *  BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
33  *  LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
34  *  NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
35  *  SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
36  */
37
38 #include <linux/mm.h>
39 #include <linux/delay.h>
40 #include <linux/errno.h>
41 #include <linux/file.h>
42 #include <linux/string.h>
43 #include <linux/ratelimit.h>
44 #include <linux/printk.h>
45 #include <linux/slab.h>
46 #include <linux/sunrpc/clnt.h>
47 #include <linux/nfs.h>
48 #include <linux/nfs4.h>
49 #include <linux/nfs_fs.h>
50 #include <linux/nfs_page.h>
51 #include <linux/nfs_mount.h>
52 #include <linux/namei.h>
53 #include <linux/mount.h>
54 #include <linux/module.h>
55 #include <linux/xattr.h>
56 #include <linux/utsname.h>
57 #include <linux/freezer.h>
58
59 #include "nfs4_fs.h"
60 #include "delegation.h"
61 #include "internal.h"
62 #include "iostat.h"
63 #include "callback.h"
64 #include "pnfs.h"
65 #include "netns.h"
66 #include "nfs4idmap.h"
67 #include "nfs4session.h"
68 #include "fscache.h"
69
70 #include "nfs4trace.h"
71
72 #define NFSDBG_FACILITY         NFSDBG_PROC
73
74 #define NFS4_POLL_RETRY_MIN     (HZ/10)
75 #define NFS4_POLL_RETRY_MAX     (15*HZ)
76
77 /* file attributes which can be mapped to nfs attributes */
78 #define NFS4_VALID_ATTRS (ATTR_MODE \
79         | ATTR_UID \
80         | ATTR_GID \
81         | ATTR_SIZE \
82         | ATTR_ATIME \
83         | ATTR_MTIME \
84         | ATTR_CTIME \
85         | ATTR_ATIME_SET \
86         | ATTR_MTIME_SET)
87
88 struct nfs4_opendata;
89 static int _nfs4_proc_open(struct nfs4_opendata *data);
90 static int _nfs4_recover_proc_open(struct nfs4_opendata *data);
91 static int nfs4_do_fsinfo(struct nfs_server *, struct nfs_fh *, struct nfs_fsinfo *);
92 static void nfs_fixup_referral_attributes(struct nfs_fattr *fattr);
93 static int nfs4_proc_getattr(struct nfs_server *, struct nfs_fh *, struct nfs_fattr *, struct nfs4_label *label);
94 static int _nfs4_proc_getattr(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fattr *fattr, struct nfs4_label *label);
95 static int nfs4_do_setattr(struct inode *inode, struct rpc_cred *cred,
96                             struct nfs_fattr *fattr, struct iattr *sattr,
97                             struct nfs4_state *state, struct nfs4_label *ilabel,
98                             struct nfs4_label *olabel);
99 #ifdef CONFIG_NFS_V4_1
100 static int nfs41_test_stateid(struct nfs_server *, nfs4_stateid *,
101                 struct rpc_cred *);
102 static int nfs41_free_stateid(struct nfs_server *, const nfs4_stateid *,
103                 struct rpc_cred *, bool);
104 #endif
105
106 #ifdef CONFIG_NFS_V4_SECURITY_LABEL
107 static inline struct nfs4_label *
108 nfs4_label_init_security(struct inode *dir, struct dentry *dentry,
109         struct iattr *sattr, struct nfs4_label *label)
110 {
111         int err;
112
113         if (label == NULL)
114                 return NULL;
115
116         if (nfs_server_capable(dir, NFS_CAP_SECURITY_LABEL) == 0)
117                 return NULL;
118
119         err = security_dentry_init_security(dentry, sattr->ia_mode,
120                                 &dentry->d_name, (void **)&label->label, &label->len);
121         if (err == 0)
122                 return label;
123
124         return NULL;
125 }
126 static inline void
127 nfs4_label_release_security(struct nfs4_label *label)
128 {
129         if (label)
130                 security_release_secctx(label->label, label->len);
131 }
132 static inline u32 *nfs4_bitmask(struct nfs_server *server, struct nfs4_label *label)
133 {
134         if (label)
135                 return server->attr_bitmask;
136
137         return server->attr_bitmask_nl;
138 }
139 #else
140 static inline struct nfs4_label *
141 nfs4_label_init_security(struct inode *dir, struct dentry *dentry,
142         struct iattr *sattr, struct nfs4_label *l)
143 { return NULL; }
144 static inline void
145 nfs4_label_release_security(struct nfs4_label *label)
146 { return; }
147 static inline u32 *
148 nfs4_bitmask(struct nfs_server *server, struct nfs4_label *label)
149 { return server->attr_bitmask; }
150 #endif
151
152 /* Prevent leaks of NFSv4 errors into userland */
153 static int nfs4_map_errors(int err)
154 {
155         if (err >= -1000)
156                 return err;
157         switch (err) {
158         case -NFS4ERR_RESOURCE:
159         case -NFS4ERR_LAYOUTTRYLATER:
160         case -NFS4ERR_RECALLCONFLICT:
161                 return -EREMOTEIO;
162         case -NFS4ERR_WRONGSEC:
163         case -NFS4ERR_WRONG_CRED:
164                 return -EPERM;
165         case -NFS4ERR_BADOWNER:
166         case -NFS4ERR_BADNAME:
167                 return -EINVAL;
168         case -NFS4ERR_SHARE_DENIED:
169                 return -EACCES;
170         case -NFS4ERR_MINOR_VERS_MISMATCH:
171                 return -EPROTONOSUPPORT;
172         case -NFS4ERR_FILE_OPEN:
173                 return -EBUSY;
174         default:
175                 dprintk("%s could not handle NFSv4 error %d\n",
176                                 __func__, -err);
177                 break;
178         }
179         return -EIO;
180 }
181
182 /*
183  * This is our standard bitmap for GETATTR requests.
184  */
185 const u32 nfs4_fattr_bitmap[3] = {
186         FATTR4_WORD0_TYPE
187         | FATTR4_WORD0_CHANGE
188         | FATTR4_WORD0_SIZE
189         | FATTR4_WORD0_FSID
190         | FATTR4_WORD0_FILEID,
191         FATTR4_WORD1_MODE
192         | FATTR4_WORD1_NUMLINKS
193         | FATTR4_WORD1_OWNER
194         | FATTR4_WORD1_OWNER_GROUP
195         | FATTR4_WORD1_RAWDEV
196         | FATTR4_WORD1_SPACE_USED
197         | FATTR4_WORD1_TIME_ACCESS
198         | FATTR4_WORD1_TIME_METADATA
199         | FATTR4_WORD1_TIME_MODIFY
200         | FATTR4_WORD1_MOUNTED_ON_FILEID,
201 #ifdef CONFIG_NFS_V4_SECURITY_LABEL
202         FATTR4_WORD2_SECURITY_LABEL
203 #endif
204 };
205
206 static const u32 nfs4_pnfs_open_bitmap[3] = {
207         FATTR4_WORD0_TYPE
208         | FATTR4_WORD0_CHANGE
209         | FATTR4_WORD0_SIZE
210         | FATTR4_WORD0_FSID
211         | FATTR4_WORD0_FILEID,
212         FATTR4_WORD1_MODE
213         | FATTR4_WORD1_NUMLINKS
214         | FATTR4_WORD1_OWNER
215         | FATTR4_WORD1_OWNER_GROUP
216         | FATTR4_WORD1_RAWDEV
217         | FATTR4_WORD1_SPACE_USED
218         | FATTR4_WORD1_TIME_ACCESS
219         | FATTR4_WORD1_TIME_METADATA
220         | FATTR4_WORD1_TIME_MODIFY,
221         FATTR4_WORD2_MDSTHRESHOLD
222 #ifdef CONFIG_NFS_V4_SECURITY_LABEL
223         | FATTR4_WORD2_SECURITY_LABEL
224 #endif
225 };
226
227 static const u32 nfs4_open_noattr_bitmap[3] = {
228         FATTR4_WORD0_TYPE
229         | FATTR4_WORD0_CHANGE
230         | FATTR4_WORD0_FILEID,
231 };
232
233 const u32 nfs4_statfs_bitmap[3] = {
234         FATTR4_WORD0_FILES_AVAIL
235         | FATTR4_WORD0_FILES_FREE
236         | FATTR4_WORD0_FILES_TOTAL,
237         FATTR4_WORD1_SPACE_AVAIL
238         | FATTR4_WORD1_SPACE_FREE
239         | FATTR4_WORD1_SPACE_TOTAL
240 };
241
242 const u32 nfs4_pathconf_bitmap[3] = {
243         FATTR4_WORD0_MAXLINK
244         | FATTR4_WORD0_MAXNAME,
245         0
246 };
247
248 const u32 nfs4_fsinfo_bitmap[3] = { FATTR4_WORD0_MAXFILESIZE
249                         | FATTR4_WORD0_MAXREAD
250                         | FATTR4_WORD0_MAXWRITE
251                         | FATTR4_WORD0_LEASE_TIME,
252                         FATTR4_WORD1_TIME_DELTA
253                         | FATTR4_WORD1_FS_LAYOUT_TYPES,
254                         FATTR4_WORD2_LAYOUT_BLKSIZE
255                         | FATTR4_WORD2_CLONE_BLKSIZE
256 };
257
258 const u32 nfs4_fs_locations_bitmap[3] = {
259         FATTR4_WORD0_TYPE
260         | FATTR4_WORD0_CHANGE
261         | FATTR4_WORD0_SIZE
262         | FATTR4_WORD0_FSID
263         | FATTR4_WORD0_FILEID
264         | FATTR4_WORD0_FS_LOCATIONS,
265         FATTR4_WORD1_MODE
266         | FATTR4_WORD1_NUMLINKS
267         | FATTR4_WORD1_OWNER
268         | FATTR4_WORD1_OWNER_GROUP
269         | FATTR4_WORD1_RAWDEV
270         | FATTR4_WORD1_SPACE_USED
271         | FATTR4_WORD1_TIME_ACCESS
272         | FATTR4_WORD1_TIME_METADATA
273         | FATTR4_WORD1_TIME_MODIFY
274         | FATTR4_WORD1_MOUNTED_ON_FILEID,
275 };
276
277 static void nfs4_setup_readdir(u64 cookie, __be32 *verifier, struct dentry *dentry,
278                 struct nfs4_readdir_arg *readdir)
279 {
280         __be32 *start, *p;
281
282         if (cookie > 2) {
283                 readdir->cookie = cookie;
284                 memcpy(&readdir->verifier, verifier, sizeof(readdir->verifier));
285                 return;
286         }
287
288         readdir->cookie = 0;
289         memset(&readdir->verifier, 0, sizeof(readdir->verifier));
290         if (cookie == 2)
291                 return;
292         
293         /*
294          * NFSv4 servers do not return entries for '.' and '..'
295          * Therefore, we fake these entries here.  We let '.'
296          * have cookie 0 and '..' have cookie 1.  Note that
297          * when talking to the server, we always send cookie 0
298          * instead of 1 or 2.
299          */
300         start = p = kmap_atomic(*readdir->pages);
301         
302         if (cookie == 0) {
303                 *p++ = xdr_one;                                  /* next */
304                 *p++ = xdr_zero;                   /* cookie, first word */
305                 *p++ = xdr_one;                   /* cookie, second word */
306                 *p++ = xdr_one;                             /* entry len */
307                 memcpy(p, ".\0\0\0", 4);                        /* entry */
308                 p++;
309                 *p++ = xdr_one;                         /* bitmap length */
310                 *p++ = htonl(FATTR4_WORD0_FILEID);             /* bitmap */
311                 *p++ = htonl(8);              /* attribute buffer length */
312                 p = xdr_encode_hyper(p, NFS_FILEID(d_inode(dentry)));
313         }
314         
315         *p++ = xdr_one;                                  /* next */
316         *p++ = xdr_zero;                   /* cookie, first word */
317         *p++ = xdr_two;                   /* cookie, second word */
318         *p++ = xdr_two;                             /* entry len */
319         memcpy(p, "..\0\0", 4);                         /* entry */
320         p++;
321         *p++ = xdr_one;                         /* bitmap length */
322         *p++ = htonl(FATTR4_WORD0_FILEID);             /* bitmap */
323         *p++ = htonl(8);              /* attribute buffer length */
324         p = xdr_encode_hyper(p, NFS_FILEID(d_inode(dentry->d_parent)));
325
326         readdir->pgbase = (char *)p - (char *)start;
327         readdir->count -= readdir->pgbase;
328         kunmap_atomic(start);
329 }
330
331 static void nfs4_test_and_free_stateid(struct nfs_server *server,
332                 nfs4_stateid *stateid,
333                 struct rpc_cred *cred)
334 {
335         const struct nfs4_minor_version_ops *ops = server->nfs_client->cl_mvops;
336
337         ops->test_and_free_expired(server, stateid, cred);
338 }
339
340 static void __nfs4_free_revoked_stateid(struct nfs_server *server,
341                 nfs4_stateid *stateid,
342                 struct rpc_cred *cred)
343 {
344         stateid->type = NFS4_REVOKED_STATEID_TYPE;
345         nfs4_test_and_free_stateid(server, stateid, cred);
346 }
347
348 static void nfs4_free_revoked_stateid(struct nfs_server *server,
349                 const nfs4_stateid *stateid,
350                 struct rpc_cred *cred)
351 {
352         nfs4_stateid tmp;
353
354         nfs4_stateid_copy(&tmp, stateid);
355         __nfs4_free_revoked_stateid(server, &tmp, cred);
356 }
357
358 static long nfs4_update_delay(long *timeout)
359 {
360         long ret;
361         if (!timeout)
362                 return NFS4_POLL_RETRY_MAX;
363         if (*timeout <= 0)
364                 *timeout = NFS4_POLL_RETRY_MIN;
365         if (*timeout > NFS4_POLL_RETRY_MAX)
366                 *timeout = NFS4_POLL_RETRY_MAX;
367         ret = *timeout;
368         *timeout <<= 1;
369         return ret;
370 }
371
372 static int nfs4_delay(struct rpc_clnt *clnt, long *timeout)
373 {
374         int res = 0;
375
376         might_sleep();
377
378         freezable_schedule_timeout_killable_unsafe(
379                 nfs4_update_delay(timeout));
380         if (fatal_signal_pending(current))
381                 res = -ERESTARTSYS;
382         return res;
383 }
384
385 /* This is the error handling routine for processes that are allowed
386  * to sleep.
387  */
388 static int nfs4_do_handle_exception(struct nfs_server *server,
389                 int errorcode, struct nfs4_exception *exception)
390 {
391         struct nfs_client *clp = server->nfs_client;
392         struct nfs4_state *state = exception->state;
393         const nfs4_stateid *stateid = exception->stateid;
394         struct inode *inode = exception->inode;
395         int ret = errorcode;
396
397         exception->delay = 0;
398         exception->recovering = 0;
399         exception->retry = 0;
400         switch(errorcode) {
401                 case 0:
402                         return 0;
403                 case -NFS4ERR_OPENMODE:
404                 case -NFS4ERR_DELEG_REVOKED:
405                 case -NFS4ERR_ADMIN_REVOKED:
406                 case -NFS4ERR_BAD_STATEID:
407                         if (inode) {
408                                 int err;
409
410                                 err = nfs_async_inode_return_delegation(inode,
411                                                 stateid);
412                                 if (err == 0)
413                                         goto wait_on_recovery;
414                                 if (stateid != NULL && stateid->type == NFS4_DELEGATION_STATEID_TYPE) {
415                                         exception->retry = 1;
416                                         break;
417                                 }
418                         }
419                         if (state == NULL)
420                                 break;
421                         ret = nfs4_schedule_stateid_recovery(server, state);
422                         if (ret < 0)
423                                 break;
424                         goto wait_on_recovery;
425                 case -NFS4ERR_EXPIRED:
426                         if (state != NULL) {
427                                 ret = nfs4_schedule_stateid_recovery(server, state);
428                                 if (ret < 0)
429                                         break;
430                         }
431                 case -NFS4ERR_STALE_STATEID:
432                 case -NFS4ERR_STALE_CLIENTID:
433                         nfs4_schedule_lease_recovery(clp);
434                         goto wait_on_recovery;
435                 case -NFS4ERR_MOVED:
436                         ret = nfs4_schedule_migration_recovery(server);
437                         if (ret < 0)
438                                 break;
439                         goto wait_on_recovery;
440                 case -NFS4ERR_LEASE_MOVED:
441                         nfs4_schedule_lease_moved_recovery(clp);
442                         goto wait_on_recovery;
443 #if defined(CONFIG_NFS_V4_1)
444                 case -NFS4ERR_BADSESSION:
445                 case -NFS4ERR_BADSLOT:
446                 case -NFS4ERR_BAD_HIGH_SLOT:
447                 case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION:
448                 case -NFS4ERR_DEADSESSION:
449                 case -NFS4ERR_SEQ_FALSE_RETRY:
450                 case -NFS4ERR_SEQ_MISORDERED:
451                         dprintk("%s ERROR: %d Reset session\n", __func__,
452                                 errorcode);
453                         nfs4_schedule_session_recovery(clp->cl_session, errorcode);
454                         goto wait_on_recovery;
455 #endif /* defined(CONFIG_NFS_V4_1) */
456                 case -NFS4ERR_FILE_OPEN:
457                         if (exception->timeout > HZ) {
458                                 /* We have retried a decent amount, time to
459                                  * fail
460                                  */
461                                 ret = -EBUSY;
462                                 break;
463                         }
464                 case -NFS4ERR_DELAY:
465                         nfs_inc_server_stats(server, NFSIOS_DELAY);
466                 case -NFS4ERR_GRACE:
467                 case -NFS4ERR_LAYOUTTRYLATER:
468                 case -NFS4ERR_RECALLCONFLICT:
469                         exception->delay = 1;
470                         return 0;
471
472                 case -NFS4ERR_RETRY_UNCACHED_REP:
473                 case -NFS4ERR_OLD_STATEID:
474                         exception->retry = 1;
475                         break;
476                 case -NFS4ERR_BADOWNER:
477                         /* The following works around a Linux server bug! */
478                 case -NFS4ERR_BADNAME:
479                         if (server->caps & NFS_CAP_UIDGID_NOMAP) {
480                                 server->caps &= ~NFS_CAP_UIDGID_NOMAP;
481                                 exception->retry = 1;
482                                 printk(KERN_WARNING "NFS: v4 server %s "
483                                                 "does not accept raw "
484                                                 "uid/gids. "
485                                                 "Reenabling the idmapper.\n",
486                                                 server->nfs_client->cl_hostname);
487                         }
488         }
489         /* We failed to handle the error */
490         return nfs4_map_errors(ret);
491 wait_on_recovery:
492         exception->recovering = 1;
493         return 0;
494 }
495
496 /* This is the error handling routine for processes that are allowed
497  * to sleep.
498  */
499 int nfs4_handle_exception(struct nfs_server *server, int errorcode, struct nfs4_exception *exception)
500 {
501         struct nfs_client *clp = server->nfs_client;
502         int ret;
503
504         ret = nfs4_do_handle_exception(server, errorcode, exception);
505         if (exception->delay) {
506                 ret = nfs4_delay(server->client, &exception->timeout);
507                 goto out_retry;
508         }
509         if (exception->recovering) {
510                 ret = nfs4_wait_clnt_recover(clp);
511                 if (test_bit(NFS_MIG_FAILED, &server->mig_status))
512                         return -EIO;
513                 goto out_retry;
514         }
515         return ret;
516 out_retry:
517         if (ret == 0)
518                 exception->retry = 1;
519         return ret;
520 }
521
522 static int
523 nfs4_async_handle_exception(struct rpc_task *task, struct nfs_server *server,
524                 int errorcode, struct nfs4_exception *exception)
525 {
526         struct nfs_client *clp = server->nfs_client;
527         int ret;
528
529         ret = nfs4_do_handle_exception(server, errorcode, exception);
530         if (exception->delay) {
531                 rpc_delay(task, nfs4_update_delay(&exception->timeout));
532                 goto out_retry;
533         }
534         if (exception->recovering) {
535                 rpc_sleep_on(&clp->cl_rpcwaitq, task, NULL);
536                 if (test_bit(NFS4CLNT_MANAGER_RUNNING, &clp->cl_state) == 0)
537                         rpc_wake_up_queued_task(&clp->cl_rpcwaitq, task);
538                 goto out_retry;
539         }
540         if (test_bit(NFS_MIG_FAILED, &server->mig_status))
541                 ret = -EIO;
542         return ret;
543 out_retry:
544         if (ret == 0)
545                 exception->retry = 1;
546         return ret;
547 }
548
549 static int
550 nfs4_async_handle_error(struct rpc_task *task, struct nfs_server *server,
551                         struct nfs4_state *state, long *timeout)
552 {
553         struct nfs4_exception exception = {
554                 .state = state,
555         };
556
557         if (task->tk_status >= 0)
558                 return 0;
559         if (timeout)
560                 exception.timeout = *timeout;
561         task->tk_status = nfs4_async_handle_exception(task, server,
562                         task->tk_status,
563                         &exception);
564         if (exception.delay && timeout)
565                 *timeout = exception.timeout;
566         if (exception.retry)
567                 return -EAGAIN;
568         return 0;
569 }
570
571 /*
572  * Return 'true' if 'clp' is using an rpc_client that is integrity protected
573  * or 'false' otherwise.
574  */
575 static bool _nfs4_is_integrity_protected(struct nfs_client *clp)
576 {
577         rpc_authflavor_t flavor = clp->cl_rpcclient->cl_auth->au_flavor;
578
579         if (flavor == RPC_AUTH_GSS_KRB5I ||
580             flavor == RPC_AUTH_GSS_KRB5P)
581                 return true;
582
583         return false;
584 }
585
586 static void do_renew_lease(struct nfs_client *clp, unsigned long timestamp)
587 {
588         spin_lock(&clp->cl_lock);
589         if (time_before(clp->cl_last_renewal,timestamp))
590                 clp->cl_last_renewal = timestamp;
591         spin_unlock(&clp->cl_lock);
592 }
593
594 static void renew_lease(const struct nfs_server *server, unsigned long timestamp)
595 {
596         struct nfs_client *clp = server->nfs_client;
597
598         if (!nfs4_has_session(clp))
599                 do_renew_lease(clp, timestamp);
600 }
601
602 struct nfs4_call_sync_data {
603         const struct nfs_server *seq_server;
604         struct nfs4_sequence_args *seq_args;
605         struct nfs4_sequence_res *seq_res;
606 };
607
608 void nfs4_init_sequence(struct nfs4_sequence_args *args,
609                         struct nfs4_sequence_res *res, int cache_reply)
610 {
611         args->sa_slot = NULL;
612         args->sa_cache_this = cache_reply;
613         args->sa_privileged = 0;
614
615         res->sr_slot = NULL;
616 }
617
618 static void nfs4_set_sequence_privileged(struct nfs4_sequence_args *args)
619 {
620         args->sa_privileged = 1;
621 }
622
623 int nfs40_setup_sequence(struct nfs4_slot_table *tbl,
624                          struct nfs4_sequence_args *args,
625                          struct nfs4_sequence_res *res,
626                          struct rpc_task *task)
627 {
628         struct nfs4_slot *slot;
629
630         /* slot already allocated? */
631         if (res->sr_slot != NULL)
632                 goto out_start;
633
634         spin_lock(&tbl->slot_tbl_lock);
635         if (nfs4_slot_tbl_draining(tbl) && !args->sa_privileged)
636                 goto out_sleep;
637
638         slot = nfs4_alloc_slot(tbl);
639         if (IS_ERR(slot)) {
640                 if (slot == ERR_PTR(-ENOMEM))
641                         task->tk_timeout = HZ >> 2;
642                 goto out_sleep;
643         }
644         spin_unlock(&tbl->slot_tbl_lock);
645
646         slot->privileged = args->sa_privileged ? 1 : 0;
647         args->sa_slot = slot;
648         res->sr_slot = slot;
649
650 out_start:
651         rpc_call_start(task);
652         return 0;
653
654 out_sleep:
655         if (args->sa_privileged)
656                 rpc_sleep_on_priority(&tbl->slot_tbl_waitq, task,
657                                 NULL, RPC_PRIORITY_PRIVILEGED);
658         else
659                 rpc_sleep_on(&tbl->slot_tbl_waitq, task, NULL);
660         spin_unlock(&tbl->slot_tbl_lock);
661         return -EAGAIN;
662 }
663 EXPORT_SYMBOL_GPL(nfs40_setup_sequence);
664
665 static void nfs40_sequence_free_slot(struct nfs4_sequence_res *res)
666 {
667         struct nfs4_slot *slot = res->sr_slot;
668         struct nfs4_slot_table *tbl;
669
670         tbl = slot->table;
671         spin_lock(&tbl->slot_tbl_lock);
672         if (!nfs41_wake_and_assign_slot(tbl, slot))
673                 nfs4_free_slot(tbl, slot);
674         spin_unlock(&tbl->slot_tbl_lock);
675
676         res->sr_slot = NULL;
677 }
678
679 static int nfs40_sequence_done(struct rpc_task *task,
680                                struct nfs4_sequence_res *res)
681 {
682         if (res->sr_slot != NULL)
683                 nfs40_sequence_free_slot(res);
684         return 1;
685 }
686
687 #if defined(CONFIG_NFS_V4_1)
688
689 static void nfs41_sequence_free_slot(struct nfs4_sequence_res *res)
690 {
691         struct nfs4_session *session;
692         struct nfs4_slot_table *tbl;
693         struct nfs4_slot *slot = res->sr_slot;
694         bool send_new_highest_used_slotid = false;
695
696         tbl = slot->table;
697         session = tbl->session;
698
699         /* Bump the slot sequence number */
700         if (slot->seq_done)
701                 slot->seq_nr++;
702         slot->seq_done = 0;
703
704         spin_lock(&tbl->slot_tbl_lock);
705         /* Be nice to the server: try to ensure that the last transmitted
706          * value for highest_user_slotid <= target_highest_slotid
707          */
708         if (tbl->highest_used_slotid > tbl->target_highest_slotid)
709                 send_new_highest_used_slotid = true;
710
711         if (nfs41_wake_and_assign_slot(tbl, slot)) {
712                 send_new_highest_used_slotid = false;
713                 goto out_unlock;
714         }
715         nfs4_free_slot(tbl, slot);
716
717         if (tbl->highest_used_slotid != NFS4_NO_SLOT)
718                 send_new_highest_used_slotid = false;
719 out_unlock:
720         spin_unlock(&tbl->slot_tbl_lock);
721         res->sr_slot = NULL;
722         if (send_new_highest_used_slotid)
723                 nfs41_notify_server(session->clp);
724         if (waitqueue_active(&tbl->slot_waitq))
725                 wake_up_all(&tbl->slot_waitq);
726 }
727
728 static int nfs41_sequence_process(struct rpc_task *task,
729                 struct nfs4_sequence_res *res)
730 {
731         struct nfs4_session *session;
732         struct nfs4_slot *slot = res->sr_slot;
733         struct nfs_client *clp;
734         bool interrupted = false;
735         int ret = 1;
736
737         if (slot == NULL)
738                 goto out_noaction;
739         /* don't increment the sequence number if the task wasn't sent */
740         if (!RPC_WAS_SENT(task))
741                 goto out;
742
743         session = slot->table->session;
744
745         if (slot->interrupted) {
746                 slot->interrupted = 0;
747                 interrupted = true;
748         }
749
750         trace_nfs4_sequence_done(session, res);
751         /* Check the SEQUENCE operation status */
752         switch (res->sr_status) {
753         case 0:
754                 /* Update the slot's sequence and clientid lease timer */
755                 slot->seq_done = 1;
756                 clp = session->clp;
757                 do_renew_lease(clp, res->sr_timestamp);
758                 /* Check sequence flags */
759                 nfs41_handle_sequence_flag_errors(clp, res->sr_status_flags,
760                                 !!slot->privileged);
761                 nfs41_update_target_slotid(slot->table, slot, res);
762                 break;
763         case 1:
764                 /*
765                  * sr_status remains 1 if an RPC level error occurred.
766                  * The server may or may not have processed the sequence
767                  * operation..
768                  * Mark the slot as having hosted an interrupted RPC call.
769                  */
770                 slot->interrupted = 1;
771                 goto out;
772         case -NFS4ERR_DELAY:
773                 /* The server detected a resend of the RPC call and
774                  * returned NFS4ERR_DELAY as per Section 2.10.6.2
775                  * of RFC5661.
776                  */
777                 dprintk("%s: slot=%u seq=%u: Operation in progress\n",
778                         __func__,
779                         slot->slot_nr,
780                         slot->seq_nr);
781                 goto out_retry;
782         case -NFS4ERR_BADSLOT:
783                 /*
784                  * The slot id we used was probably retired. Try again
785                  * using a different slot id.
786                  */
787                 goto retry_nowait;
788         case -NFS4ERR_SEQ_MISORDERED:
789                 /*
790                  * Was the last operation on this sequence interrupted?
791                  * If so, retry after bumping the sequence number.
792                  */
793                 if (interrupted) {
794                         ++slot->seq_nr;
795                         goto retry_nowait;
796                 }
797                 /*
798                  * Could this slot have been previously retired?
799                  * If so, then the server may be expecting seq_nr = 1!
800                  */
801                 if (slot->seq_nr != 1) {
802                         slot->seq_nr = 1;
803                         goto retry_nowait;
804                 }
805                 break;
806         case -NFS4ERR_SEQ_FALSE_RETRY:
807                 ++slot->seq_nr;
808                 goto retry_nowait;
809         default:
810                 /* Just update the slot sequence no. */
811                 slot->seq_done = 1;
812         }
813 out:
814         /* The session may be reset by one of the error handlers. */
815         dprintk("%s: Error %d free the slot \n", __func__, res->sr_status);
816 out_noaction:
817         return ret;
818 retry_nowait:
819         if (rpc_restart_call_prepare(task)) {
820                 nfs41_sequence_free_slot(res);
821                 task->tk_status = 0;
822                 ret = 0;
823         }
824         goto out;
825 out_retry:
826         if (!rpc_restart_call(task))
827                 goto out;
828         rpc_delay(task, NFS4_POLL_RETRY_MAX);
829         return 0;
830 }
831
832 int nfs41_sequence_done(struct rpc_task *task, struct nfs4_sequence_res *res)
833 {
834         if (!nfs41_sequence_process(task, res))
835                 return 0;
836         if (res->sr_slot != NULL)
837                 nfs41_sequence_free_slot(res);
838         return 1;
839
840 }
841 EXPORT_SYMBOL_GPL(nfs41_sequence_done);
842
843 static int nfs4_sequence_process(struct rpc_task *task, struct nfs4_sequence_res *res)
844 {
845         if (res->sr_slot == NULL)
846                 return 1;
847         if (res->sr_slot->table->session != NULL)
848                 return nfs41_sequence_process(task, res);
849         return nfs40_sequence_done(task, res);
850 }
851
852 static void nfs4_sequence_free_slot(struct nfs4_sequence_res *res)
853 {
854         if (res->sr_slot != NULL) {
855                 if (res->sr_slot->table->session != NULL)
856                         nfs41_sequence_free_slot(res);
857                 else
858                         nfs40_sequence_free_slot(res);
859         }
860 }
861
862 int nfs4_sequence_done(struct rpc_task *task, struct nfs4_sequence_res *res)
863 {
864         if (res->sr_slot == NULL)
865                 return 1;
866         if (!res->sr_slot->table->session)
867                 return nfs40_sequence_done(task, res);
868         return nfs41_sequence_done(task, res);
869 }
870 EXPORT_SYMBOL_GPL(nfs4_sequence_done);
871
872 int nfs41_setup_sequence(struct nfs4_session *session,
873                                 struct nfs4_sequence_args *args,
874                                 struct nfs4_sequence_res *res,
875                                 struct rpc_task *task)
876 {
877         struct nfs4_slot *slot;
878         struct nfs4_slot_table *tbl;
879
880         dprintk("--> %s\n", __func__);
881         /* slot already allocated? */
882         if (res->sr_slot != NULL)
883                 goto out_success;
884
885         tbl = &session->fc_slot_table;
886
887         task->tk_timeout = 0;
888
889         spin_lock(&tbl->slot_tbl_lock);
890         if (test_bit(NFS4_SLOT_TBL_DRAINING, &tbl->slot_tbl_state) &&
891             !args->sa_privileged) {
892                 /* The state manager will wait until the slot table is empty */
893                 dprintk("%s session is draining\n", __func__);
894                 goto out_sleep;
895         }
896
897         slot = nfs4_alloc_slot(tbl);
898         if (IS_ERR(slot)) {
899                 /* If out of memory, try again in 1/4 second */
900                 if (slot == ERR_PTR(-ENOMEM))
901                         task->tk_timeout = HZ >> 2;
902                 dprintk("<-- %s: no free slots\n", __func__);
903                 goto out_sleep;
904         }
905         spin_unlock(&tbl->slot_tbl_lock);
906
907         slot->privileged = args->sa_privileged ? 1 : 0;
908         args->sa_slot = slot;
909
910         dprintk("<-- %s slotid=%u seqid=%u\n", __func__,
911                         slot->slot_nr, slot->seq_nr);
912
913         res->sr_slot = slot;
914         res->sr_timestamp = jiffies;
915         res->sr_status_flags = 0;
916         /*
917          * sr_status is only set in decode_sequence, and so will remain
918          * set to 1 if an rpc level failure occurs.
919          */
920         res->sr_status = 1;
921         trace_nfs4_setup_sequence(session, args);
922 out_success:
923         rpc_call_start(task);
924         return 0;
925 out_sleep:
926         /* Privileged tasks are queued with top priority */
927         if (args->sa_privileged)
928                 rpc_sleep_on_priority(&tbl->slot_tbl_waitq, task,
929                                 NULL, RPC_PRIORITY_PRIVILEGED);
930         else
931                 rpc_sleep_on(&tbl->slot_tbl_waitq, task, NULL);
932         spin_unlock(&tbl->slot_tbl_lock);
933         return -EAGAIN;
934 }
935 EXPORT_SYMBOL_GPL(nfs41_setup_sequence);
936
937 static int nfs4_setup_sequence(const struct nfs_server *server,
938                                struct nfs4_sequence_args *args,
939                                struct nfs4_sequence_res *res,
940                                struct rpc_task *task)
941 {
942         struct nfs4_session *session = nfs4_get_session(server);
943         int ret = 0;
944
945         if (!session)
946                 return nfs40_setup_sequence(server->nfs_client->cl_slot_tbl,
947                                             args, res, task);
948
949         dprintk("--> %s clp %p session %p sr_slot %u\n",
950                 __func__, session->clp, session, res->sr_slot ?
951                         res->sr_slot->slot_nr : NFS4_NO_SLOT);
952
953         ret = nfs41_setup_sequence(session, args, res, task);
954
955         dprintk("<-- %s status=%d\n", __func__, ret);
956         return ret;
957 }
958
959 static void nfs41_call_sync_prepare(struct rpc_task *task, void *calldata)
960 {
961         struct nfs4_call_sync_data *data = calldata;
962         struct nfs4_session *session = nfs4_get_session(data->seq_server);
963
964         dprintk("--> %s data->seq_server %p\n", __func__, data->seq_server);
965
966         nfs41_setup_sequence(session, data->seq_args, data->seq_res, task);
967 }
968
969 static void nfs41_call_sync_done(struct rpc_task *task, void *calldata)
970 {
971         struct nfs4_call_sync_data *data = calldata;
972
973         nfs41_sequence_done(task, data->seq_res);
974 }
975
976 static const struct rpc_call_ops nfs41_call_sync_ops = {
977         .rpc_call_prepare = nfs41_call_sync_prepare,
978         .rpc_call_done = nfs41_call_sync_done,
979 };
980
981 #else   /* !CONFIG_NFS_V4_1 */
982
983 static int nfs4_setup_sequence(const struct nfs_server *server,
984                                struct nfs4_sequence_args *args,
985                                struct nfs4_sequence_res *res,
986                                struct rpc_task *task)
987 {
988         return nfs40_setup_sequence(server->nfs_client->cl_slot_tbl,
989                                     args, res, task);
990 }
991
992 static int nfs4_sequence_process(struct rpc_task *task, struct nfs4_sequence_res *res)
993 {
994         return nfs40_sequence_done(task, res);
995 }
996
997 static void nfs4_sequence_free_slot(struct nfs4_sequence_res *res)
998 {
999         if (res->sr_slot != NULL)
1000                 nfs40_sequence_free_slot(res);
1001 }
1002
1003 int nfs4_sequence_done(struct rpc_task *task,
1004                        struct nfs4_sequence_res *res)
1005 {
1006         return nfs40_sequence_done(task, res);
1007 }
1008 EXPORT_SYMBOL_GPL(nfs4_sequence_done);
1009
1010 #endif  /* !CONFIG_NFS_V4_1 */
1011
1012 static void nfs40_call_sync_prepare(struct rpc_task *task, void *calldata)
1013 {
1014         struct nfs4_call_sync_data *data = calldata;
1015         nfs4_setup_sequence(data->seq_server,
1016                                 data->seq_args, data->seq_res, task);
1017 }
1018
1019 static void nfs40_call_sync_done(struct rpc_task *task, void *calldata)
1020 {
1021         struct nfs4_call_sync_data *data = calldata;
1022         nfs4_sequence_done(task, data->seq_res);
1023 }
1024
1025 static const struct rpc_call_ops nfs40_call_sync_ops = {
1026         .rpc_call_prepare = nfs40_call_sync_prepare,
1027         .rpc_call_done = nfs40_call_sync_done,
1028 };
1029
1030 static int nfs4_call_sync_sequence(struct rpc_clnt *clnt,
1031                                    struct nfs_server *server,
1032                                    struct rpc_message *msg,
1033                                    struct nfs4_sequence_args *args,
1034                                    struct nfs4_sequence_res *res)
1035 {
1036         int ret;
1037         struct rpc_task *task;
1038         struct nfs_client *clp = server->nfs_client;
1039         struct nfs4_call_sync_data data = {
1040                 .seq_server = server,
1041                 .seq_args = args,
1042                 .seq_res = res,
1043         };
1044         struct rpc_task_setup task_setup = {
1045                 .rpc_client = clnt,
1046                 .rpc_message = msg,
1047                 .callback_ops = clp->cl_mvops->call_sync_ops,
1048                 .callback_data = &data
1049         };
1050
1051         task = rpc_run_task(&task_setup);
1052         if (IS_ERR(task))
1053                 ret = PTR_ERR(task);
1054         else {
1055                 ret = task->tk_status;
1056                 rpc_put_task(task);
1057         }
1058         return ret;
1059 }
1060
1061 int nfs4_call_sync(struct rpc_clnt *clnt,
1062                    struct nfs_server *server,
1063                    struct rpc_message *msg,
1064                    struct nfs4_sequence_args *args,
1065                    struct nfs4_sequence_res *res,
1066                    int cache_reply)
1067 {
1068         nfs4_init_sequence(args, res, cache_reply);
1069         return nfs4_call_sync_sequence(clnt, server, msg, args, res);
1070 }
1071
1072 static void update_changeattr(struct inode *dir, struct nfs4_change_info *cinfo)
1073 {
1074         struct nfs_inode *nfsi = NFS_I(dir);
1075
1076         spin_lock(&dir->i_lock);
1077         nfsi->cache_validity |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_DATA;
1078         if (!cinfo->atomic || cinfo->before != dir->i_version)
1079                 nfs_force_lookup_revalidate(dir);
1080         dir->i_version = cinfo->after;
1081         nfsi->attr_gencount = nfs_inc_attr_generation_counter();
1082         nfs_fscache_invalidate(dir);
1083         spin_unlock(&dir->i_lock);
1084 }
1085
1086 struct nfs4_opendata {
1087         struct kref kref;
1088         struct nfs_openargs o_arg;
1089         struct nfs_openres o_res;
1090         struct nfs_open_confirmargs c_arg;
1091         struct nfs_open_confirmres c_res;
1092         struct nfs4_string owner_name;
1093         struct nfs4_string group_name;
1094         struct nfs4_label *a_label;
1095         struct nfs_fattr f_attr;
1096         struct nfs4_label *f_label;
1097         struct dentry *dir;
1098         struct dentry *dentry;
1099         struct nfs4_state_owner *owner;
1100         struct nfs4_state *state;
1101         struct iattr attrs;
1102         unsigned long timestamp;
1103         unsigned int rpc_done : 1;
1104         unsigned int file_created : 1;
1105         unsigned int is_recover : 1;
1106         int rpc_status;
1107         int cancelled;
1108 };
1109
1110 static bool nfs4_clear_cap_atomic_open_v1(struct nfs_server *server,
1111                 int err, struct nfs4_exception *exception)
1112 {
1113         if (err != -EINVAL)
1114                 return false;
1115         if (!(server->caps & NFS_CAP_ATOMIC_OPEN_V1))
1116                 return false;
1117         server->caps &= ~NFS_CAP_ATOMIC_OPEN_V1;
1118         exception->retry = 1;
1119         return true;
1120 }
1121
1122 static u32
1123 nfs4_map_atomic_open_share(struct nfs_server *server,
1124                 fmode_t fmode, int openflags)
1125 {
1126         u32 res = 0;
1127
1128         switch (fmode & (FMODE_READ | FMODE_WRITE)) {
1129         case FMODE_READ:
1130                 res = NFS4_SHARE_ACCESS_READ;
1131                 break;
1132         case FMODE_WRITE:
1133                 res = NFS4_SHARE_ACCESS_WRITE;
1134                 break;
1135         case FMODE_READ|FMODE_WRITE:
1136                 res = NFS4_SHARE_ACCESS_BOTH;
1137         }
1138         if (!(server->caps & NFS_CAP_ATOMIC_OPEN_V1))
1139                 goto out;
1140         /* Want no delegation if we're using O_DIRECT */
1141         if (openflags & O_DIRECT)
1142                 res |= NFS4_SHARE_WANT_NO_DELEG;
1143 out:
1144         return res;
1145 }
1146
1147 static enum open_claim_type4
1148 nfs4_map_atomic_open_claim(struct nfs_server *server,
1149                 enum open_claim_type4 claim)
1150 {
1151         if (server->caps & NFS_CAP_ATOMIC_OPEN_V1)
1152                 return claim;
1153         switch (claim) {
1154         default:
1155                 return claim;
1156         case NFS4_OPEN_CLAIM_FH:
1157                 return NFS4_OPEN_CLAIM_NULL;
1158         case NFS4_OPEN_CLAIM_DELEG_CUR_FH:
1159                 return NFS4_OPEN_CLAIM_DELEGATE_CUR;
1160         case NFS4_OPEN_CLAIM_DELEG_PREV_FH:
1161                 return NFS4_OPEN_CLAIM_DELEGATE_PREV;
1162         }
1163 }
1164
1165 static void nfs4_init_opendata_res(struct nfs4_opendata *p)
1166 {
1167         p->o_res.f_attr = &p->f_attr;
1168         p->o_res.f_label = p->f_label;
1169         p->o_res.seqid = p->o_arg.seqid;
1170         p->c_res.seqid = p->c_arg.seqid;
1171         p->o_res.server = p->o_arg.server;
1172         p->o_res.access_request = p->o_arg.access;
1173         nfs_fattr_init(&p->f_attr);
1174         nfs_fattr_init_names(&p->f_attr, &p->owner_name, &p->group_name);
1175 }
1176
1177 static struct nfs4_opendata *nfs4_opendata_alloc(struct dentry *dentry,
1178                 struct nfs4_state_owner *sp, fmode_t fmode, int flags,
1179                 const struct iattr *attrs,
1180                 struct nfs4_label *label,
1181                 enum open_claim_type4 claim,
1182                 gfp_t gfp_mask)
1183 {
1184         struct dentry *parent = dget_parent(dentry);
1185         struct inode *dir = d_inode(parent);
1186         struct nfs_server *server = NFS_SERVER(dir);
1187         struct nfs_seqid *(*alloc_seqid)(struct nfs_seqid_counter *, gfp_t);
1188         struct nfs4_opendata *p;
1189
1190         p = kzalloc(sizeof(*p), gfp_mask);
1191         if (p == NULL)
1192                 goto err;
1193
1194         p->f_label = nfs4_label_alloc(server, gfp_mask);
1195         if (IS_ERR(p->f_label))
1196                 goto err_free_p;
1197
1198         p->a_label = nfs4_label_alloc(server, gfp_mask);
1199         if (IS_ERR(p->a_label))
1200                 goto err_free_f;
1201
1202         alloc_seqid = server->nfs_client->cl_mvops->alloc_seqid;
1203         p->o_arg.seqid = alloc_seqid(&sp->so_seqid, gfp_mask);
1204         if (IS_ERR(p->o_arg.seqid))
1205                 goto err_free_label;
1206         nfs_sb_active(dentry->d_sb);
1207         p->dentry = dget(dentry);
1208         p->dir = parent;
1209         p->owner = sp;
1210         atomic_inc(&sp->so_count);
1211         p->o_arg.open_flags = flags;
1212         p->o_arg.fmode = fmode & (FMODE_READ|FMODE_WRITE);
1213         p->o_arg.share_access = nfs4_map_atomic_open_share(server,
1214                         fmode, flags);
1215         /* don't put an ACCESS op in OPEN compound if O_EXCL, because ACCESS
1216          * will return permission denied for all bits until close */
1217         if (!(flags & O_EXCL)) {
1218                 /* ask server to check for all possible rights as results
1219                  * are cached */
1220                 p->o_arg.access = NFS4_ACCESS_READ | NFS4_ACCESS_MODIFY |
1221                                   NFS4_ACCESS_EXTEND | NFS4_ACCESS_EXECUTE;
1222         }
1223         p->o_arg.clientid = server->nfs_client->cl_clientid;
1224         p->o_arg.id.create_time = ktime_to_ns(sp->so_seqid.create_time);
1225         p->o_arg.id.uniquifier = sp->so_seqid.owner_id;
1226         p->o_arg.name = &dentry->d_name;
1227         p->o_arg.server = server;
1228         p->o_arg.bitmask = nfs4_bitmask(server, label);
1229         p->o_arg.open_bitmap = &nfs4_fattr_bitmap[0];
1230         p->o_arg.label = nfs4_label_copy(p->a_label, label);
1231         p->o_arg.claim = nfs4_map_atomic_open_claim(server, claim);
1232         switch (p->o_arg.claim) {
1233         case NFS4_OPEN_CLAIM_NULL:
1234         case NFS4_OPEN_CLAIM_DELEGATE_CUR:
1235         case NFS4_OPEN_CLAIM_DELEGATE_PREV:
1236                 p->o_arg.fh = NFS_FH(dir);
1237                 break;
1238         case NFS4_OPEN_CLAIM_PREVIOUS:
1239         case NFS4_OPEN_CLAIM_FH:
1240         case NFS4_OPEN_CLAIM_DELEG_CUR_FH:
1241         case NFS4_OPEN_CLAIM_DELEG_PREV_FH:
1242                 p->o_arg.fh = NFS_FH(d_inode(dentry));
1243         }
1244         if (attrs != NULL && attrs->ia_valid != 0) {
1245                 __u32 verf[2];
1246
1247                 p->o_arg.u.attrs = &p->attrs;
1248                 memcpy(&p->attrs, attrs, sizeof(p->attrs));
1249
1250                 verf[0] = jiffies;
1251                 verf[1] = current->pid;
1252                 memcpy(p->o_arg.u.verifier.data, verf,
1253                                 sizeof(p->o_arg.u.verifier.data));
1254         }
1255         p->c_arg.fh = &p->o_res.fh;
1256         p->c_arg.stateid = &p->o_res.stateid;
1257         p->c_arg.seqid = p->o_arg.seqid;
1258         nfs4_init_opendata_res(p);
1259         kref_init(&p->kref);
1260         return p;
1261
1262 err_free_label:
1263         nfs4_label_free(p->a_label);
1264 err_free_f:
1265         nfs4_label_free(p->f_label);
1266 err_free_p:
1267         kfree(p);
1268 err:
1269         dput(parent);
1270         return NULL;
1271 }
1272
1273 static void nfs4_opendata_free(struct kref *kref)
1274 {
1275         struct nfs4_opendata *p = container_of(kref,
1276                         struct nfs4_opendata, kref);
1277         struct super_block *sb = p->dentry->d_sb;
1278
1279         nfs_free_seqid(p->o_arg.seqid);
1280         nfs4_sequence_free_slot(&p->o_res.seq_res);
1281         if (p->state != NULL)
1282                 nfs4_put_open_state(p->state);
1283         nfs4_put_state_owner(p->owner);
1284
1285         nfs4_label_free(p->a_label);
1286         nfs4_label_free(p->f_label);
1287
1288         dput(p->dir);
1289         dput(p->dentry);
1290         nfs_sb_deactive(sb);
1291         nfs_fattr_free_names(&p->f_attr);
1292         kfree(p->f_attr.mdsthreshold);
1293         kfree(p);
1294 }
1295
1296 static void nfs4_opendata_put(struct nfs4_opendata *p)
1297 {
1298         if (p != NULL)
1299                 kref_put(&p->kref, nfs4_opendata_free);
1300 }
1301
1302 static int nfs4_wait_for_completion_rpc_task(struct rpc_task *task)
1303 {
1304         int ret;
1305
1306         ret = rpc_wait_for_completion_task(task);
1307         return ret;
1308 }
1309
1310 static bool nfs4_mode_match_open_stateid(struct nfs4_state *state,
1311                 fmode_t fmode)
1312 {
1313         switch(fmode & (FMODE_READ|FMODE_WRITE)) {
1314         case FMODE_READ|FMODE_WRITE:
1315                 return state->n_rdwr != 0;
1316         case FMODE_WRITE:
1317                 return state->n_wronly != 0;
1318         case FMODE_READ:
1319                 return state->n_rdonly != 0;
1320         }
1321         WARN_ON_ONCE(1);
1322         return false;
1323 }
1324
1325 static int can_open_cached(struct nfs4_state *state, fmode_t mode, int open_mode)
1326 {
1327         int ret = 0;
1328
1329         if (open_mode & (O_EXCL|O_TRUNC))
1330                 goto out;
1331         switch (mode & (FMODE_READ|FMODE_WRITE)) {
1332                 case FMODE_READ:
1333                         ret |= test_bit(NFS_O_RDONLY_STATE, &state->flags) != 0
1334                                 && state->n_rdonly != 0;
1335                         break;
1336                 case FMODE_WRITE:
1337                         ret |= test_bit(NFS_O_WRONLY_STATE, &state->flags) != 0
1338                                 && state->n_wronly != 0;
1339                         break;
1340                 case FMODE_READ|FMODE_WRITE:
1341                         ret |= test_bit(NFS_O_RDWR_STATE, &state->flags) != 0
1342                                 && state->n_rdwr != 0;
1343         }
1344 out:
1345         return ret;
1346 }
1347
1348 static int can_open_delegated(struct nfs_delegation *delegation, fmode_t fmode,
1349                 enum open_claim_type4 claim)
1350 {
1351         if (delegation == NULL)
1352                 return 0;
1353         if ((delegation->type & fmode) != fmode)
1354                 return 0;
1355         if (test_bit(NFS_DELEGATION_RETURNING, &delegation->flags))
1356                 return 0;
1357         switch (claim) {
1358         case NFS4_OPEN_CLAIM_NULL:
1359         case NFS4_OPEN_CLAIM_FH:
1360                 break;
1361         case NFS4_OPEN_CLAIM_PREVIOUS:
1362                 if (!test_bit(NFS_DELEGATION_NEED_RECLAIM, &delegation->flags))
1363                         break;
1364         default:
1365                 return 0;
1366         }
1367         nfs_mark_delegation_referenced(delegation);
1368         return 1;
1369 }
1370
1371 static void update_open_stateflags(struct nfs4_state *state, fmode_t fmode)
1372 {
1373         switch (fmode) {
1374                 case FMODE_WRITE:
1375                         state->n_wronly++;
1376                         break;
1377                 case FMODE_READ:
1378                         state->n_rdonly++;
1379                         break;
1380                 case FMODE_READ|FMODE_WRITE:
1381                         state->n_rdwr++;
1382         }
1383         nfs4_state_set_mode_locked(state, state->state | fmode);
1384 }
1385
1386 static void nfs_test_and_clear_all_open_stateid(struct nfs4_state *state)
1387 {
1388         struct nfs_client *clp = state->owner->so_server->nfs_client;
1389         bool need_recover = false;
1390
1391         if (test_and_clear_bit(NFS_O_RDONLY_STATE, &state->flags) && state->n_rdonly)
1392                 need_recover = true;
1393         if (test_and_clear_bit(NFS_O_WRONLY_STATE, &state->flags) && state->n_wronly)
1394                 need_recover = true;
1395         if (test_and_clear_bit(NFS_O_RDWR_STATE, &state->flags) && state->n_rdwr)
1396                 need_recover = true;
1397         if (need_recover)
1398                 nfs4_state_mark_reclaim_nograce(clp, state);
1399 }
1400
1401 static bool nfs_need_update_open_stateid(struct nfs4_state *state,
1402                 nfs4_stateid *stateid)
1403 {
1404         if (test_and_set_bit(NFS_OPEN_STATE, &state->flags) == 0)
1405                 return true;
1406         if (!nfs4_stateid_match_other(stateid, &state->open_stateid)) {
1407                 nfs_test_and_clear_all_open_stateid(state);
1408                 return true;
1409         }
1410         if (nfs4_stateid_is_newer(stateid, &state->open_stateid))
1411                 return true;
1412         return false;
1413 }
1414
1415 static void nfs_resync_open_stateid_locked(struct nfs4_state *state)
1416 {
1417         if (!(state->n_wronly || state->n_rdonly || state->n_rdwr))
1418                 return;
1419         if (state->n_wronly)
1420                 set_bit(NFS_O_WRONLY_STATE, &state->flags);
1421         if (state->n_rdonly)
1422                 set_bit(NFS_O_RDONLY_STATE, &state->flags);
1423         if (state->n_rdwr)
1424                 set_bit(NFS_O_RDWR_STATE, &state->flags);
1425         set_bit(NFS_OPEN_STATE, &state->flags);
1426 }
1427
1428 static void nfs_clear_open_stateid_locked(struct nfs4_state *state,
1429                 nfs4_stateid *arg_stateid,
1430                 nfs4_stateid *stateid, fmode_t fmode)
1431 {
1432         clear_bit(NFS_O_RDWR_STATE, &state->flags);
1433         switch (fmode & (FMODE_READ|FMODE_WRITE)) {
1434         case FMODE_WRITE:
1435                 clear_bit(NFS_O_RDONLY_STATE, &state->flags);
1436                 break;
1437         case FMODE_READ:
1438                 clear_bit(NFS_O_WRONLY_STATE, &state->flags);
1439                 break;
1440         case 0:
1441                 clear_bit(NFS_O_RDONLY_STATE, &state->flags);
1442                 clear_bit(NFS_O_WRONLY_STATE, &state->flags);
1443                 clear_bit(NFS_OPEN_STATE, &state->flags);
1444         }
1445         if (stateid == NULL)
1446                 return;
1447         /* Handle races with OPEN */
1448         if (!nfs4_stateid_match_other(arg_stateid, &state->open_stateid) ||
1449             (nfs4_stateid_match_other(stateid, &state->open_stateid) &&
1450             !nfs4_stateid_is_newer(stateid, &state->open_stateid))) {
1451                 nfs_resync_open_stateid_locked(state);
1452                 return;
1453         }
1454         if (test_bit(NFS_DELEGATED_STATE, &state->flags) == 0)
1455                 nfs4_stateid_copy(&state->stateid, stateid);
1456         nfs4_stateid_copy(&state->open_stateid, stateid);
1457 }
1458
1459 static void nfs_clear_open_stateid(struct nfs4_state *state,
1460         nfs4_stateid *arg_stateid,
1461         nfs4_stateid *stateid, fmode_t fmode)
1462 {
1463         write_seqlock(&state->seqlock);
1464         nfs_clear_open_stateid_locked(state, arg_stateid, stateid, fmode);
1465         write_sequnlock(&state->seqlock);
1466         if (test_bit(NFS_STATE_RECLAIM_NOGRACE, &state->flags))
1467                 nfs4_schedule_state_manager(state->owner->so_server->nfs_client);
1468 }
1469
1470 static void nfs_set_open_stateid_locked(struct nfs4_state *state, nfs4_stateid *stateid, fmode_t fmode)
1471 {
1472         switch (fmode) {
1473                 case FMODE_READ:
1474                         set_bit(NFS_O_RDONLY_STATE, &state->flags);
1475                         break;
1476                 case FMODE_WRITE:
1477                         set_bit(NFS_O_WRONLY_STATE, &state->flags);
1478                         break;
1479                 case FMODE_READ|FMODE_WRITE:
1480                         set_bit(NFS_O_RDWR_STATE, &state->flags);
1481         }
1482         if (!nfs_need_update_open_stateid(state, stateid))
1483                 return;
1484         if (test_bit(NFS_DELEGATED_STATE, &state->flags) == 0)
1485                 nfs4_stateid_copy(&state->stateid, stateid);
1486         nfs4_stateid_copy(&state->open_stateid, stateid);
1487 }
1488
1489 static void __update_open_stateid(struct nfs4_state *state, nfs4_stateid *open_stateid, const nfs4_stateid *deleg_stateid, fmode_t fmode)
1490 {
1491         /*
1492          * Protect the call to nfs4_state_set_mode_locked and
1493          * serialise the stateid update
1494          */
1495         spin_lock(&state->owner->so_lock);
1496         write_seqlock(&state->seqlock);
1497         if (deleg_stateid != NULL) {
1498                 nfs4_stateid_copy(&state->stateid, deleg_stateid);
1499                 set_bit(NFS_DELEGATED_STATE, &state->flags);
1500         }
1501         if (open_stateid != NULL)
1502                 nfs_set_open_stateid_locked(state, open_stateid, fmode);
1503         write_sequnlock(&state->seqlock);
1504         update_open_stateflags(state, fmode);
1505         spin_unlock(&state->owner->so_lock);
1506 }
1507
1508 static int update_open_stateid(struct nfs4_state *state, nfs4_stateid *open_stateid, nfs4_stateid *delegation, fmode_t fmode)
1509 {
1510         struct nfs_inode *nfsi = NFS_I(state->inode);
1511         struct nfs_delegation *deleg_cur;
1512         int ret = 0;
1513
1514         fmode &= (FMODE_READ|FMODE_WRITE);
1515
1516         rcu_read_lock();
1517         deleg_cur = rcu_dereference(nfsi->delegation);
1518         if (deleg_cur == NULL)
1519                 goto no_delegation;
1520
1521         spin_lock(&deleg_cur->lock);
1522         if (rcu_dereference(nfsi->delegation) != deleg_cur ||
1523            test_bit(NFS_DELEGATION_RETURNING, &deleg_cur->flags) ||
1524             (deleg_cur->type & fmode) != fmode)
1525                 goto no_delegation_unlock;
1526
1527         if (delegation == NULL)
1528                 delegation = &deleg_cur->stateid;
1529         else if (!nfs4_stateid_match(&deleg_cur->stateid, delegation))
1530                 goto no_delegation_unlock;
1531
1532         nfs_mark_delegation_referenced(deleg_cur);
1533         __update_open_stateid(state, open_stateid, &deleg_cur->stateid, fmode);
1534         ret = 1;
1535 no_delegation_unlock:
1536         spin_unlock(&deleg_cur->lock);
1537 no_delegation:
1538         rcu_read_unlock();
1539
1540         if (!ret && open_stateid != NULL) {
1541                 __update_open_stateid(state, open_stateid, NULL, fmode);
1542                 ret = 1;
1543         }
1544         if (test_bit(NFS_STATE_RECLAIM_NOGRACE, &state->flags))
1545                 nfs4_schedule_state_manager(state->owner->so_server->nfs_client);
1546
1547         return ret;
1548 }
1549
1550 static bool nfs4_update_lock_stateid(struct nfs4_lock_state *lsp,
1551                 const nfs4_stateid *stateid)
1552 {
1553         struct nfs4_state *state = lsp->ls_state;
1554         bool ret = false;
1555
1556         spin_lock(&state->state_lock);
1557         if (!nfs4_stateid_match_other(stateid, &lsp->ls_stateid))
1558                 goto out_noupdate;
1559         if (!nfs4_stateid_is_newer(stateid, &lsp->ls_stateid))
1560                 goto out_noupdate;
1561         nfs4_stateid_copy(&lsp->ls_stateid, stateid);
1562         ret = true;
1563 out_noupdate:
1564         spin_unlock(&state->state_lock);
1565         return ret;
1566 }
1567
1568 static void nfs4_return_incompatible_delegation(struct inode *inode, fmode_t fmode)
1569 {
1570         struct nfs_delegation *delegation;
1571
1572         rcu_read_lock();
1573         delegation = rcu_dereference(NFS_I(inode)->delegation);
1574         if (delegation == NULL || (delegation->type & fmode) == fmode) {
1575                 rcu_read_unlock();
1576                 return;
1577         }
1578         rcu_read_unlock();
1579         nfs4_inode_return_delegation(inode);
1580 }
1581
1582 static struct nfs4_state *nfs4_try_open_cached(struct nfs4_opendata *opendata)
1583 {
1584         struct nfs4_state *state = opendata->state;
1585         struct nfs_inode *nfsi = NFS_I(state->inode);
1586         struct nfs_delegation *delegation;
1587         int open_mode = opendata->o_arg.open_flags;
1588         fmode_t fmode = opendata->o_arg.fmode;
1589         enum open_claim_type4 claim = opendata->o_arg.claim;
1590         nfs4_stateid stateid;
1591         int ret = -EAGAIN;
1592
1593         for (;;) {
1594                 spin_lock(&state->owner->so_lock);
1595                 if (can_open_cached(state, fmode, open_mode)) {
1596                         update_open_stateflags(state, fmode);
1597                         spin_unlock(&state->owner->so_lock);
1598                         goto out_return_state;
1599                 }
1600                 spin_unlock(&state->owner->so_lock);
1601                 rcu_read_lock();
1602                 delegation = rcu_dereference(nfsi->delegation);
1603                 if (!can_open_delegated(delegation, fmode, claim)) {
1604                         rcu_read_unlock();
1605                         break;
1606                 }
1607                 /* Save the delegation */
1608                 nfs4_stateid_copy(&stateid, &delegation->stateid);
1609                 rcu_read_unlock();
1610                 nfs_release_seqid(opendata->o_arg.seqid);
1611                 if (!opendata->is_recover) {
1612                         ret = nfs_may_open(state->inode, state->owner->so_cred, open_mode);
1613                         if (ret != 0)
1614                                 goto out;
1615                 }
1616                 ret = -EAGAIN;
1617
1618                 /* Try to update the stateid using the delegation */
1619                 if (update_open_stateid(state, NULL, &stateid, fmode))
1620                         goto out_return_state;
1621         }
1622 out:
1623         return ERR_PTR(ret);
1624 out_return_state:
1625         atomic_inc(&state->count);
1626         return state;
1627 }
1628
1629 static void
1630 nfs4_opendata_check_deleg(struct nfs4_opendata *data, struct nfs4_state *state)
1631 {
1632         struct nfs_client *clp = NFS_SERVER(state->inode)->nfs_client;
1633         struct nfs_delegation *delegation;
1634         int delegation_flags = 0;
1635
1636         rcu_read_lock();
1637         delegation = rcu_dereference(NFS_I(state->inode)->delegation);
1638         if (delegation)
1639                 delegation_flags = delegation->flags;
1640         rcu_read_unlock();
1641         switch (data->o_arg.claim) {
1642         default:
1643                 break;
1644         case NFS4_OPEN_CLAIM_DELEGATE_CUR:
1645         case NFS4_OPEN_CLAIM_DELEG_CUR_FH:
1646                 pr_err_ratelimited("NFS: Broken NFSv4 server %s is "
1647                                    "returning a delegation for "
1648                                    "OPEN(CLAIM_DELEGATE_CUR)\n",
1649                                    clp->cl_hostname);
1650                 return;
1651         }
1652         if ((delegation_flags & 1UL<<NFS_DELEGATION_NEED_RECLAIM) == 0)
1653                 nfs_inode_set_delegation(state->inode,
1654                                          data->owner->so_cred,
1655                                          &data->o_res);
1656         else
1657                 nfs_inode_reclaim_delegation(state->inode,
1658                                              data->owner->so_cred,
1659                                              &data->o_res);
1660 }
1661
1662 /*
1663  * Check the inode attributes against the CLAIM_PREVIOUS returned attributes
1664  * and update the nfs4_state.
1665  */
1666 static struct nfs4_state *
1667 _nfs4_opendata_reclaim_to_nfs4_state(struct nfs4_opendata *data)
1668 {
1669         struct inode *inode = data->state->inode;
1670         struct nfs4_state *state = data->state;
1671         int ret;
1672
1673         if (!data->rpc_done) {
1674                 if (data->rpc_status) {
1675                         ret = data->rpc_status;
1676                         goto err;
1677                 }
1678                 /* cached opens have already been processed */
1679                 goto update;
1680         }
1681
1682         ret = nfs_refresh_inode(inode, &data->f_attr);
1683         if (ret)
1684                 goto err;
1685
1686         if (data->o_res.delegation_type != 0)
1687                 nfs4_opendata_check_deleg(data, state);
1688 update:
1689         update_open_stateid(state, &data->o_res.stateid, NULL,
1690                             data->o_arg.fmode);
1691         atomic_inc(&state->count);
1692
1693         return state;
1694 err:
1695         return ERR_PTR(ret);
1696
1697 }
1698
1699 static struct nfs4_state *
1700 _nfs4_opendata_to_nfs4_state(struct nfs4_opendata *data)
1701 {
1702         struct inode *inode;
1703         struct nfs4_state *state = NULL;
1704         int ret;
1705
1706         if (!data->rpc_done) {
1707                 state = nfs4_try_open_cached(data);
1708                 trace_nfs4_cached_open(data->state);
1709                 goto out;
1710         }
1711
1712         ret = -EAGAIN;
1713         if (!(data->f_attr.valid & NFS_ATTR_FATTR))
1714                 goto err;
1715         inode = nfs_fhget(data->dir->d_sb, &data->o_res.fh, &data->f_attr, data->f_label);
1716         ret = PTR_ERR(inode);
1717         if (IS_ERR(inode))
1718                 goto err;
1719         ret = -ENOMEM;
1720         state = nfs4_get_open_state(inode, data->owner);
1721         if (state == NULL)
1722                 goto err_put_inode;
1723         if (data->o_res.delegation_type != 0)
1724                 nfs4_opendata_check_deleg(data, state);
1725         update_open_stateid(state, &data->o_res.stateid, NULL,
1726                         data->o_arg.fmode);
1727         iput(inode);
1728 out:
1729         nfs_release_seqid(data->o_arg.seqid);
1730         return state;
1731 err_put_inode:
1732         iput(inode);
1733 err:
1734         return ERR_PTR(ret);
1735 }
1736
1737 static struct nfs4_state *
1738 nfs4_opendata_to_nfs4_state(struct nfs4_opendata *data)
1739 {
1740         struct nfs4_state *ret;
1741
1742         if (data->o_arg.claim == NFS4_OPEN_CLAIM_PREVIOUS)
1743                 ret =_nfs4_opendata_reclaim_to_nfs4_state(data);
1744         else
1745                 ret = _nfs4_opendata_to_nfs4_state(data);
1746         nfs4_sequence_free_slot(&data->o_res.seq_res);
1747         return ret;
1748 }
1749
1750 static struct nfs_open_context *nfs4_state_find_open_context(struct nfs4_state *state)
1751 {
1752         struct nfs_inode *nfsi = NFS_I(state->inode);
1753         struct nfs_open_context *ctx;
1754
1755         spin_lock(&state->inode->i_lock);
1756         list_for_each_entry(ctx, &nfsi->open_files, list) {
1757                 if (ctx->state != state)
1758                         continue;
1759                 get_nfs_open_context(ctx);
1760                 spin_unlock(&state->inode->i_lock);
1761                 return ctx;
1762         }
1763         spin_unlock(&state->inode->i_lock);
1764         return ERR_PTR(-ENOENT);
1765 }
1766
1767 static struct nfs4_opendata *nfs4_open_recoverdata_alloc(struct nfs_open_context *ctx,
1768                 struct nfs4_state *state, enum open_claim_type4 claim)
1769 {
1770         struct nfs4_opendata *opendata;
1771
1772         opendata = nfs4_opendata_alloc(ctx->dentry, state->owner, 0, 0,
1773                         NULL, NULL, claim, GFP_NOFS);
1774         if (opendata == NULL)
1775                 return ERR_PTR(-ENOMEM);
1776         opendata->state = state;
1777         atomic_inc(&state->count);
1778         return opendata;
1779 }
1780
1781 static int nfs4_open_recover_helper(struct nfs4_opendata *opendata,
1782                 fmode_t fmode)
1783 {
1784         struct nfs4_state *newstate;
1785         int ret;
1786
1787         if (!nfs4_mode_match_open_stateid(opendata->state, fmode))
1788                 return 0;
1789         opendata->o_arg.open_flags = 0;
1790         opendata->o_arg.fmode = fmode;
1791         opendata->o_arg.share_access = nfs4_map_atomic_open_share(
1792                         NFS_SB(opendata->dentry->d_sb),
1793                         fmode, 0);
1794         memset(&opendata->o_res, 0, sizeof(opendata->o_res));
1795         memset(&opendata->c_res, 0, sizeof(opendata->c_res));
1796         nfs4_init_opendata_res(opendata);
1797         ret = _nfs4_recover_proc_open(opendata);
1798         if (ret != 0)
1799                 return ret; 
1800         newstate = nfs4_opendata_to_nfs4_state(opendata);
1801         if (IS_ERR(newstate))
1802                 return PTR_ERR(newstate);
1803         if (newstate != opendata->state)
1804                 ret = -ESTALE;
1805         nfs4_close_state(newstate, fmode);
1806         return ret;
1807 }
1808
1809 static int nfs4_open_recover(struct nfs4_opendata *opendata, struct nfs4_state *state)
1810 {
1811         int ret;
1812
1813         /* Don't trigger recovery in nfs_test_and_clear_all_open_stateid */
1814         clear_bit(NFS_O_RDWR_STATE, &state->flags);
1815         clear_bit(NFS_O_WRONLY_STATE, &state->flags);
1816         clear_bit(NFS_O_RDONLY_STATE, &state->flags);
1817         /* memory barrier prior to reading state->n_* */
1818         clear_bit(NFS_DELEGATED_STATE, &state->flags);
1819         clear_bit(NFS_OPEN_STATE, &state->flags);
1820         smp_rmb();
1821         ret = nfs4_open_recover_helper(opendata, FMODE_READ|FMODE_WRITE);
1822         if (ret != 0)
1823                 return ret;
1824         ret = nfs4_open_recover_helper(opendata, FMODE_WRITE);
1825         if (ret != 0)
1826                 return ret;
1827         ret = nfs4_open_recover_helper(opendata, FMODE_READ);
1828         if (ret != 0)
1829                 return ret;
1830         /*
1831          * We may have performed cached opens for all three recoveries.
1832          * Check if we need to update the current stateid.
1833          */
1834         if (test_bit(NFS_DELEGATED_STATE, &state->flags) == 0 &&
1835             !nfs4_stateid_match(&state->stateid, &state->open_stateid)) {
1836                 write_seqlock(&state->seqlock);
1837                 if (test_bit(NFS_DELEGATED_STATE, &state->flags) == 0)
1838                         nfs4_stateid_copy(&state->stateid, &state->open_stateid);
1839                 write_sequnlock(&state->seqlock);
1840         }
1841         return 0;
1842 }
1843
1844 /*
1845  * OPEN_RECLAIM:
1846  *      reclaim state on the server after a reboot.
1847  */
1848 static int _nfs4_do_open_reclaim(struct nfs_open_context *ctx, struct nfs4_state *state)
1849 {
1850         struct nfs_delegation *delegation;
1851         struct nfs4_opendata *opendata;
1852         fmode_t delegation_type = 0;
1853         int status;
1854
1855         opendata = nfs4_open_recoverdata_alloc(ctx, state,
1856                         NFS4_OPEN_CLAIM_PREVIOUS);
1857         if (IS_ERR(opendata))
1858                 return PTR_ERR(opendata);
1859         rcu_read_lock();
1860         delegation = rcu_dereference(NFS_I(state->inode)->delegation);
1861         if (delegation != NULL && test_bit(NFS_DELEGATION_NEED_RECLAIM, &delegation->flags) != 0)
1862                 delegation_type = delegation->type;
1863         rcu_read_unlock();
1864         opendata->o_arg.u.delegation_type = delegation_type;
1865         status = nfs4_open_recover(opendata, state);
1866         nfs4_opendata_put(opendata);
1867         return status;
1868 }
1869
1870 static int nfs4_do_open_reclaim(struct nfs_open_context *ctx, struct nfs4_state *state)
1871 {
1872         struct nfs_server *server = NFS_SERVER(state->inode);
1873         struct nfs4_exception exception = { };
1874         int err;
1875         do {
1876                 err = _nfs4_do_open_reclaim(ctx, state);
1877                 trace_nfs4_open_reclaim(ctx, 0, err);
1878                 if (nfs4_clear_cap_atomic_open_v1(server, err, &exception))
1879                         continue;
1880                 if (err != -NFS4ERR_DELAY)
1881                         break;
1882                 nfs4_handle_exception(server, err, &exception);
1883         } while (exception.retry);
1884         return err;
1885 }
1886
1887 static int nfs4_open_reclaim(struct nfs4_state_owner *sp, struct nfs4_state *state)
1888 {
1889         struct nfs_open_context *ctx;
1890         int ret;
1891
1892         ctx = nfs4_state_find_open_context(state);
1893         if (IS_ERR(ctx))
1894                 return -EAGAIN;
1895         ret = nfs4_do_open_reclaim(ctx, state);
1896         put_nfs_open_context(ctx);
1897         return ret;
1898 }
1899
1900 static int nfs4_handle_delegation_recall_error(struct nfs_server *server, struct nfs4_state *state, const nfs4_stateid *stateid, int err)
1901 {
1902         switch (err) {
1903                 default:
1904                         printk(KERN_ERR "NFS: %s: unhandled error "
1905                                         "%d.\n", __func__, err);
1906                 case 0:
1907                 case -ENOENT:
1908                 case -EAGAIN:
1909                 case -ESTALE:
1910                         break;
1911                 case -NFS4ERR_BADSESSION:
1912                 case -NFS4ERR_BADSLOT:
1913                 case -NFS4ERR_BAD_HIGH_SLOT:
1914                 case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION:
1915                 case -NFS4ERR_DEADSESSION:
1916                         set_bit(NFS_DELEGATED_STATE, &state->flags);
1917                         nfs4_schedule_session_recovery(server->nfs_client->cl_session, err);
1918                         return -EAGAIN;
1919                 case -NFS4ERR_STALE_CLIENTID:
1920                 case -NFS4ERR_STALE_STATEID:
1921                         set_bit(NFS_DELEGATED_STATE, &state->flags);
1922                 case -NFS4ERR_EXPIRED:
1923                         /* Don't recall a delegation if it was lost */
1924                         nfs4_schedule_lease_recovery(server->nfs_client);
1925                         return -EAGAIN;
1926                 case -NFS4ERR_MOVED:
1927                         nfs4_schedule_migration_recovery(server);
1928                         return -EAGAIN;
1929                 case -NFS4ERR_LEASE_MOVED:
1930                         nfs4_schedule_lease_moved_recovery(server->nfs_client);
1931                         return -EAGAIN;
1932                 case -NFS4ERR_DELEG_REVOKED:
1933                 case -NFS4ERR_ADMIN_REVOKED:
1934                 case -NFS4ERR_BAD_STATEID:
1935                 case -NFS4ERR_OPENMODE:
1936                         nfs_inode_find_state_and_recover(state->inode,
1937                                         stateid);
1938                         nfs4_schedule_stateid_recovery(server, state);
1939                         return -EAGAIN;
1940                 case -NFS4ERR_DELAY:
1941                 case -NFS4ERR_GRACE:
1942                         set_bit(NFS_DELEGATED_STATE, &state->flags);
1943                         ssleep(1);
1944                         return -EAGAIN;
1945                 case -ENOMEM:
1946                 case -NFS4ERR_DENIED:
1947                         /* kill_proc(fl->fl_pid, SIGLOST, 1); */
1948                         return 0;
1949         }
1950         return err;
1951 }
1952
1953 int nfs4_open_delegation_recall(struct nfs_open_context *ctx,
1954                 struct nfs4_state *state, const nfs4_stateid *stateid,
1955                 fmode_t type)
1956 {
1957         struct nfs_server *server = NFS_SERVER(state->inode);
1958         struct nfs4_opendata *opendata;
1959         int err = 0;
1960
1961         opendata = nfs4_open_recoverdata_alloc(ctx, state,
1962                         NFS4_OPEN_CLAIM_DELEG_CUR_FH);
1963         if (IS_ERR(opendata))
1964                 return PTR_ERR(opendata);
1965         nfs4_stateid_copy(&opendata->o_arg.u.delegation, stateid);
1966         write_seqlock(&state->seqlock);
1967         nfs4_stateid_copy(&state->stateid, &state->open_stateid);
1968         write_sequnlock(&state->seqlock);
1969         clear_bit(NFS_DELEGATED_STATE, &state->flags);
1970         switch (type & (FMODE_READ|FMODE_WRITE)) {
1971         case FMODE_READ|FMODE_WRITE:
1972         case FMODE_WRITE:
1973                 err = nfs4_open_recover_helper(opendata, FMODE_READ|FMODE_WRITE);
1974                 if (err)
1975                         break;
1976                 err = nfs4_open_recover_helper(opendata, FMODE_WRITE);
1977                 if (err)
1978                         break;
1979         case FMODE_READ:
1980                 err = nfs4_open_recover_helper(opendata, FMODE_READ);
1981         }
1982         nfs4_opendata_put(opendata);
1983         return nfs4_handle_delegation_recall_error(server, state, stateid, err);
1984 }
1985
1986 static void nfs4_open_confirm_prepare(struct rpc_task *task, void *calldata)
1987 {
1988         struct nfs4_opendata *data = calldata;
1989
1990         nfs40_setup_sequence(data->o_arg.server->nfs_client->cl_slot_tbl,
1991                              &data->c_arg.seq_args, &data->c_res.seq_res, task);
1992 }
1993
1994 static void nfs4_open_confirm_done(struct rpc_task *task, void *calldata)
1995 {
1996         struct nfs4_opendata *data = calldata;
1997
1998         nfs40_sequence_done(task, &data->c_res.seq_res);
1999
2000         data->rpc_status = task->tk_status;
2001         if (data->rpc_status == 0) {
2002                 nfs4_stateid_copy(&data->o_res.stateid, &data->c_res.stateid);
2003                 nfs_confirm_seqid(&data->owner->so_seqid, 0);
2004                 renew_lease(data->o_res.server, data->timestamp);
2005                 data->rpc_done = 1;
2006         }
2007 }
2008
2009 static void nfs4_open_confirm_release(void *calldata)
2010 {
2011         struct nfs4_opendata *data = calldata;
2012         struct nfs4_state *state = NULL;
2013
2014         /* If this request hasn't been cancelled, do nothing */
2015         if (data->cancelled == 0)
2016                 goto out_free;
2017         /* In case of error, no cleanup! */
2018         if (!data->rpc_done)
2019                 goto out_free;
2020         state = nfs4_opendata_to_nfs4_state(data);
2021         if (!IS_ERR(state))
2022                 nfs4_close_state(state, data->o_arg.fmode);
2023 out_free:
2024         nfs4_opendata_put(data);
2025 }
2026
2027 static const struct rpc_call_ops nfs4_open_confirm_ops = {
2028         .rpc_call_prepare = nfs4_open_confirm_prepare,
2029         .rpc_call_done = nfs4_open_confirm_done,
2030         .rpc_release = nfs4_open_confirm_release,
2031 };
2032
2033 /*
2034  * Note: On error, nfs4_proc_open_confirm will free the struct nfs4_opendata
2035  */
2036 static int _nfs4_proc_open_confirm(struct nfs4_opendata *data)
2037 {
2038         struct nfs_server *server = NFS_SERVER(d_inode(data->dir));
2039         struct rpc_task *task;
2040         struct  rpc_message msg = {
2041                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_OPEN_CONFIRM],
2042                 .rpc_argp = &data->c_arg,
2043                 .rpc_resp = &data->c_res,
2044                 .rpc_cred = data->owner->so_cred,
2045         };
2046         struct rpc_task_setup task_setup_data = {
2047                 .rpc_client = server->client,
2048                 .rpc_message = &msg,
2049                 .callback_ops = &nfs4_open_confirm_ops,
2050                 .callback_data = data,
2051                 .workqueue = nfsiod_workqueue,
2052                 .flags = RPC_TASK_ASYNC,
2053         };
2054         int status;
2055
2056         nfs4_init_sequence(&data->c_arg.seq_args, &data->c_res.seq_res, 1);
2057         kref_get(&data->kref);
2058         data->rpc_done = 0;
2059         data->rpc_status = 0;
2060         data->timestamp = jiffies;
2061         if (data->is_recover)
2062                 nfs4_set_sequence_privileged(&data->c_arg.seq_args);
2063         task = rpc_run_task(&task_setup_data);
2064         if (IS_ERR(task))
2065                 return PTR_ERR(task);
2066         status = nfs4_wait_for_completion_rpc_task(task);
2067         if (status != 0) {
2068                 data->cancelled = 1;
2069                 smp_wmb();
2070         } else
2071                 status = data->rpc_status;
2072         rpc_put_task(task);
2073         return status;
2074 }
2075
2076 static void nfs4_open_prepare(struct rpc_task *task, void *calldata)
2077 {
2078         struct nfs4_opendata *data = calldata;
2079         struct nfs4_state_owner *sp = data->owner;
2080         struct nfs_client *clp = sp->so_server->nfs_client;
2081         enum open_claim_type4 claim = data->o_arg.claim;
2082
2083         if (nfs_wait_on_sequence(data->o_arg.seqid, task) != 0)
2084                 goto out_wait;
2085         /*
2086          * Check if we still need to send an OPEN call, or if we can use
2087          * a delegation instead.
2088          */
2089         if (data->state != NULL) {
2090                 struct nfs_delegation *delegation;
2091
2092                 if (can_open_cached(data->state, data->o_arg.fmode, data->o_arg.open_flags))
2093                         goto out_no_action;
2094                 rcu_read_lock();
2095                 delegation = rcu_dereference(NFS_I(data->state->inode)->delegation);
2096                 if (can_open_delegated(delegation, data->o_arg.fmode, claim))
2097                         goto unlock_no_action;
2098                 rcu_read_unlock();
2099         }
2100         /* Update client id. */
2101         data->o_arg.clientid = clp->cl_clientid;
2102         switch (claim) {
2103         default:
2104                 break;
2105         case NFS4_OPEN_CLAIM_PREVIOUS:
2106         case NFS4_OPEN_CLAIM_DELEG_CUR_FH:
2107         case NFS4_OPEN_CLAIM_DELEG_PREV_FH:
2108                 data->o_arg.open_bitmap = &nfs4_open_noattr_bitmap[0];
2109         case NFS4_OPEN_CLAIM_FH:
2110                 task->tk_msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_OPEN_NOATTR];
2111                 nfs_copy_fh(&data->o_res.fh, data->o_arg.fh);
2112         }
2113         data->timestamp = jiffies;
2114         if (nfs4_setup_sequence(data->o_arg.server,
2115                                 &data->o_arg.seq_args,
2116                                 &data->o_res.seq_res,
2117                                 task) != 0)
2118                 nfs_release_seqid(data->o_arg.seqid);
2119
2120         /* Set the create mode (note dependency on the session type) */
2121         data->o_arg.createmode = NFS4_CREATE_UNCHECKED;
2122         if (data->o_arg.open_flags & O_EXCL) {
2123                 data->o_arg.createmode = NFS4_CREATE_EXCLUSIVE;
2124                 if (nfs4_has_persistent_session(clp))
2125                         data->o_arg.createmode = NFS4_CREATE_GUARDED;
2126                 else if (clp->cl_mvops->minor_version > 0)
2127                         data->o_arg.createmode = NFS4_CREATE_EXCLUSIVE4_1;
2128         }
2129         return;
2130 unlock_no_action:
2131         trace_nfs4_cached_open(data->state);
2132         rcu_read_unlock();
2133 out_no_action:
2134         task->tk_action = NULL;
2135 out_wait:
2136         nfs4_sequence_done(task, &data->o_res.seq_res);
2137 }
2138
2139 static void nfs4_open_done(struct rpc_task *task, void *calldata)
2140 {
2141         struct nfs4_opendata *data = calldata;
2142
2143         data->rpc_status = task->tk_status;
2144
2145         if (!nfs4_sequence_process(task, &data->o_res.seq_res))
2146                 return;
2147
2148         if (task->tk_status == 0) {
2149                 if (data->o_res.f_attr->valid & NFS_ATTR_FATTR_TYPE) {
2150                         switch (data->o_res.f_attr->mode & S_IFMT) {
2151                         case S_IFREG:
2152                                 break;
2153                         case S_IFLNK:
2154                                 data->rpc_status = -ELOOP;
2155                                 break;
2156                         case S_IFDIR:
2157                                 data->rpc_status = -EISDIR;
2158                                 break;
2159                         default:
2160                                 data->rpc_status = -ENOTDIR;
2161                         }
2162                 }
2163                 renew_lease(data->o_res.server, data->timestamp);
2164                 if (!(data->o_res.rflags & NFS4_OPEN_RESULT_CONFIRM))
2165                         nfs_confirm_seqid(&data->owner->so_seqid, 0);
2166         }
2167         data->rpc_done = 1;
2168 }
2169
2170 static void nfs4_open_release(void *calldata)
2171 {
2172         struct nfs4_opendata *data = calldata;
2173         struct nfs4_state *state = NULL;
2174
2175         /* If this request hasn't been cancelled, do nothing */
2176         if (data->cancelled == 0)
2177                 goto out_free;
2178         /* In case of error, no cleanup! */
2179         if (data->rpc_status != 0 || !data->rpc_done)
2180                 goto out_free;
2181         /* In case we need an open_confirm, no cleanup! */
2182         if (data->o_res.rflags & NFS4_OPEN_RESULT_CONFIRM)
2183                 goto out_free;
2184         state = nfs4_opendata_to_nfs4_state(data);
2185         if (!IS_ERR(state))
2186                 nfs4_close_state(state, data->o_arg.fmode);
2187 out_free:
2188         nfs4_opendata_put(data);
2189 }
2190
2191 static const struct rpc_call_ops nfs4_open_ops = {
2192         .rpc_call_prepare = nfs4_open_prepare,
2193         .rpc_call_done = nfs4_open_done,
2194         .rpc_release = nfs4_open_release,
2195 };
2196
2197 static int nfs4_run_open_task(struct nfs4_opendata *data, int isrecover)
2198 {
2199         struct inode *dir = d_inode(data->dir);
2200         struct nfs_server *server = NFS_SERVER(dir);
2201         struct nfs_openargs *o_arg = &data->o_arg;
2202         struct nfs_openres *o_res = &data->o_res;
2203         struct rpc_task *task;
2204         struct rpc_message msg = {
2205                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_OPEN],
2206                 .rpc_argp = o_arg,
2207                 .rpc_resp = o_res,
2208                 .rpc_cred = data->owner->so_cred,
2209         };
2210         struct rpc_task_setup task_setup_data = {
2211                 .rpc_client = server->client,
2212                 .rpc_message = &msg,
2213                 .callback_ops = &nfs4_open_ops,
2214                 .callback_data = data,
2215                 .workqueue = nfsiod_workqueue,
2216                 .flags = RPC_TASK_ASYNC,
2217         };
2218         int status;
2219
2220         nfs4_init_sequence(&o_arg->seq_args, &o_res->seq_res, 1);
2221         kref_get(&data->kref);
2222         data->rpc_done = 0;
2223         data->rpc_status = 0;
2224         data->cancelled = 0;
2225         data->is_recover = 0;
2226         if (isrecover) {
2227                 nfs4_set_sequence_privileged(&o_arg->seq_args);
2228                 data->is_recover = 1;
2229         }
2230         task = rpc_run_task(&task_setup_data);
2231         if (IS_ERR(task))
2232                 return PTR_ERR(task);
2233         status = nfs4_wait_for_completion_rpc_task(task);
2234         if (status != 0) {
2235                 data->cancelled = 1;
2236                 smp_wmb();
2237         } else
2238                 status = data->rpc_status;
2239         rpc_put_task(task);
2240
2241         return status;
2242 }
2243
2244 static int _nfs4_recover_proc_open(struct nfs4_opendata *data)
2245 {
2246         struct inode *dir = d_inode(data->dir);
2247         struct nfs_openres *o_res = &data->o_res;
2248         int status;
2249
2250         status = nfs4_run_open_task(data, 1);
2251         if (status != 0 || !data->rpc_done)
2252                 return status;
2253
2254         nfs_fattr_map_and_free_names(NFS_SERVER(dir), &data->f_attr);
2255
2256         if (o_res->rflags & NFS4_OPEN_RESULT_CONFIRM) {
2257                 status = _nfs4_proc_open_confirm(data);
2258                 if (status != 0)
2259                         return status;
2260         }
2261
2262         return status;
2263 }
2264
2265 /*
2266  * Additional permission checks in order to distinguish between an
2267  * open for read, and an open for execute. This works around the
2268  * fact that NFSv4 OPEN treats read and execute permissions as being
2269  * the same.
2270  * Note that in the non-execute case, we want to turn off permission
2271  * checking if we just created a new file (POSIX open() semantics).
2272  */
2273 static int nfs4_opendata_access(struct rpc_cred *cred,
2274                                 struct nfs4_opendata *opendata,
2275                                 struct nfs4_state *state, fmode_t fmode,
2276                                 int openflags)
2277 {
2278         struct nfs_access_entry cache;
2279         u32 mask;
2280
2281         /* access call failed or for some reason the server doesn't
2282          * support any access modes -- defer access call until later */
2283         if (opendata->o_res.access_supported == 0)
2284                 return 0;
2285
2286         mask = 0;
2287         /*
2288          * Use openflags to check for exec, because fmode won't
2289          * always have FMODE_EXEC set when file open for exec.
2290          */
2291         if (openflags & __FMODE_EXEC) {
2292                 /* ONLY check for exec rights */
2293                 mask = MAY_EXEC;
2294         } else if ((fmode & FMODE_READ) && !opendata->file_created)
2295                 mask = MAY_READ;
2296
2297         cache.cred = cred;
2298         cache.jiffies = jiffies;
2299         nfs_access_set_mask(&cache, opendata->o_res.access_result);
2300         nfs_access_add_cache(state->inode, &cache);
2301
2302         if ((mask & ~cache.mask & (MAY_READ | MAY_EXEC)) == 0)
2303                 return 0;
2304
2305         /* even though OPEN succeeded, access is denied. Close the file */
2306         nfs4_close_state(state, fmode);
2307         return -EACCES;
2308 }
2309
2310 /*
2311  * Note: On error, nfs4_proc_open will free the struct nfs4_opendata
2312  */
2313 static int _nfs4_proc_open(struct nfs4_opendata *data)
2314 {
2315         struct inode *dir = d_inode(data->dir);
2316         struct nfs_server *server = NFS_SERVER(dir);
2317         struct nfs_openargs *o_arg = &data->o_arg;
2318         struct nfs_openres *o_res = &data->o_res;
2319         int status;
2320
2321         status = nfs4_run_open_task(data, 0);
2322         if (!data->rpc_done)
2323                 return status;
2324         if (status != 0) {
2325                 if (status == -NFS4ERR_BADNAME &&
2326                                 !(o_arg->open_flags & O_CREAT))
2327                         return -ENOENT;
2328                 return status;
2329         }
2330
2331         nfs_fattr_map_and_free_names(server, &data->f_attr);
2332
2333         if (o_arg->open_flags & O_CREAT) {
2334                 update_changeattr(dir, &o_res->cinfo);
2335                 if (o_arg->open_flags & O_EXCL)
2336                         data->file_created = 1;
2337                 else if (o_res->cinfo.before != o_res->cinfo.after)
2338                         data->file_created = 1;
2339         }
2340         if ((o_res->rflags & NFS4_OPEN_RESULT_LOCKTYPE_POSIX) == 0)
2341                 server->caps &= ~NFS_CAP_POSIX_LOCK;
2342         if(o_res->rflags & NFS4_OPEN_RESULT_CONFIRM) {
2343                 status = _nfs4_proc_open_confirm(data);
2344                 if (status != 0)
2345                         return status;
2346         }
2347         if (!(o_res->f_attr->valid & NFS_ATTR_FATTR))
2348                 nfs4_proc_getattr(server, &o_res->fh, o_res->f_attr, o_res->f_label);
2349         return 0;
2350 }
2351
2352 static int nfs4_recover_expired_lease(struct nfs_server *server)
2353 {
2354         return nfs4_client_recover_expired_lease(server->nfs_client);
2355 }
2356
2357 /*
2358  * OPEN_EXPIRED:
2359  *      reclaim state on the server after a network partition.
2360  *      Assumes caller holds the appropriate lock
2361  */
2362 static int _nfs4_open_expired(struct nfs_open_context *ctx, struct nfs4_state *state)
2363 {
2364         struct nfs4_opendata *opendata;
2365         int ret;
2366
2367         opendata = nfs4_open_recoverdata_alloc(ctx, state,
2368                         NFS4_OPEN_CLAIM_FH);
2369         if (IS_ERR(opendata))
2370                 return PTR_ERR(opendata);
2371         ret = nfs4_open_recover(opendata, state);
2372         if (ret == -ESTALE)
2373                 d_drop(ctx->dentry);
2374         nfs4_opendata_put(opendata);
2375         return ret;
2376 }
2377
2378 static int nfs4_do_open_expired(struct nfs_open_context *ctx, struct nfs4_state *state)
2379 {
2380         struct nfs_server *server = NFS_SERVER(state->inode);
2381         struct nfs4_exception exception = { };
2382         int err;
2383
2384         do {
2385                 err = _nfs4_open_expired(ctx, state);
2386                 trace_nfs4_open_expired(ctx, 0, err);
2387                 if (nfs4_clear_cap_atomic_open_v1(server, err, &exception))
2388                         continue;
2389                 switch (err) {
2390                 default:
2391                         goto out;
2392                 case -NFS4ERR_GRACE:
2393                 case -NFS4ERR_DELAY:
2394                         nfs4_handle_exception(server, err, &exception);
2395                         err = 0;
2396                 }
2397         } while (exception.retry);
2398 out:
2399         return err;
2400 }
2401
2402 static int nfs4_open_expired(struct nfs4_state_owner *sp, struct nfs4_state *state)
2403 {
2404         struct nfs_open_context *ctx;
2405         int ret;
2406
2407         ctx = nfs4_state_find_open_context(state);
2408         if (IS_ERR(ctx))
2409                 return -EAGAIN;
2410         ret = nfs4_do_open_expired(ctx, state);
2411         put_nfs_open_context(ctx);
2412         return ret;
2413 }
2414
2415 static void nfs_finish_clear_delegation_stateid(struct nfs4_state *state,
2416                 const nfs4_stateid *stateid)
2417 {
2418         nfs_remove_bad_delegation(state->inode, stateid);
2419         write_seqlock(&state->seqlock);
2420         nfs4_stateid_copy(&state->stateid, &state->open_stateid);
2421         write_sequnlock(&state->seqlock);
2422         clear_bit(NFS_DELEGATED_STATE, &state->flags);
2423 }
2424
2425 static void nfs40_clear_delegation_stateid(struct nfs4_state *state)
2426 {
2427         if (rcu_access_pointer(NFS_I(state->inode)->delegation) != NULL)
2428                 nfs_finish_clear_delegation_stateid(state, NULL);
2429 }
2430
2431 static int nfs40_open_expired(struct nfs4_state_owner *sp, struct nfs4_state *state)
2432 {
2433         /* NFSv4.0 doesn't allow for delegation recovery on open expire */
2434         nfs40_clear_delegation_stateid(state);
2435         return nfs4_open_expired(sp, state);
2436 }
2437
2438 static int nfs40_test_and_free_expired_stateid(struct nfs_server *server,
2439                 nfs4_stateid *stateid,
2440                 struct rpc_cred *cred)
2441 {
2442         return -NFS4ERR_BAD_STATEID;
2443 }
2444
2445 #if defined(CONFIG_NFS_V4_1)
2446 static int nfs41_test_and_free_expired_stateid(struct nfs_server *server,
2447                 nfs4_stateid *stateid,
2448                 struct rpc_cred *cred)
2449 {
2450         int status;
2451
2452         switch (stateid->type) {
2453         default:
2454                 break;
2455         case NFS4_INVALID_STATEID_TYPE:
2456         case NFS4_SPECIAL_STATEID_TYPE:
2457                 return -NFS4ERR_BAD_STATEID;
2458         case NFS4_REVOKED_STATEID_TYPE:
2459                 goto out_free;
2460         }
2461
2462         status = nfs41_test_stateid(server, stateid, cred);
2463         switch (status) {
2464         case -NFS4ERR_EXPIRED:
2465         case -NFS4ERR_ADMIN_REVOKED:
2466         case -NFS4ERR_DELEG_REVOKED:
2467                 break;
2468         default:
2469                 return status;
2470         }
2471 out_free:
2472         /* Ack the revoked state to the server */
2473         nfs41_free_stateid(server, stateid, cred, true);
2474         return -NFS4ERR_EXPIRED;
2475 }
2476
2477 static void nfs41_check_delegation_stateid(struct nfs4_state *state)
2478 {
2479         struct nfs_server *server = NFS_SERVER(state->inode);
2480         nfs4_stateid stateid;
2481         struct nfs_delegation *delegation;
2482         struct rpc_cred *cred;
2483         int status;
2484
2485         /* Get the delegation credential for use by test/free_stateid */
2486         rcu_read_lock();
2487         delegation = rcu_dereference(NFS_I(state->inode)->delegation);
2488         if (delegation == NULL) {
2489                 rcu_read_unlock();
2490                 return;
2491         }
2492
2493         nfs4_stateid_copy(&stateid, &delegation->stateid);
2494         if (test_bit(NFS_DELEGATION_REVOKED, &delegation->flags)) {
2495                 rcu_read_unlock();
2496                 nfs_finish_clear_delegation_stateid(state, &stateid);
2497                 return;
2498         }
2499
2500         if (!test_and_clear_bit(NFS_DELEGATION_TEST_EXPIRED, &delegation->flags)) {
2501                 rcu_read_unlock();
2502                 return;
2503         }
2504
2505         cred = get_rpccred(delegation->cred);
2506         rcu_read_unlock();
2507         status = nfs41_test_and_free_expired_stateid(server, &stateid, cred);
2508         trace_nfs4_test_delegation_stateid(state, NULL, status);
2509         if (status == -NFS4ERR_EXPIRED || status == -NFS4ERR_BAD_STATEID)
2510                 nfs_finish_clear_delegation_stateid(state, &stateid);
2511
2512         put_rpccred(cred);
2513 }
2514
2515 /**
2516  * nfs41_check_expired_locks - possibly free a lock stateid
2517  *
2518  * @state: NFSv4 state for an inode
2519  *
2520  * Returns NFS_OK if recovery for this stateid is now finished.
2521  * Otherwise a negative NFS4ERR value is returned.
2522  */
2523 static int nfs41_check_expired_locks(struct nfs4_state *state)
2524 {
2525         int status, ret = NFS_OK;
2526         struct nfs4_lock_state *lsp;
2527         struct nfs_server *server = NFS_SERVER(state->inode);
2528
2529         if (!test_bit(LK_STATE_IN_USE, &state->flags))
2530                 goto out;
2531         list_for_each_entry(lsp, &state->lock_states, ls_locks) {
2532                 if (test_bit(NFS_LOCK_INITIALIZED, &lsp->ls_flags)) {
2533                         struct rpc_cred *cred = lsp->ls_state->owner->so_cred;
2534
2535                         status = nfs41_test_and_free_expired_stateid(server,
2536                                         &lsp->ls_stateid,
2537                                         cred);
2538                         trace_nfs4_test_lock_stateid(state, lsp, status);
2539                         if (status == -NFS4ERR_EXPIRED ||
2540                             status == -NFS4ERR_BAD_STATEID) {
2541                                 clear_bit(NFS_LOCK_INITIALIZED, &lsp->ls_flags);
2542                                 if (!recover_lost_locks)
2543                                         set_bit(NFS_LOCK_LOST, &lsp->ls_flags);
2544                         } else if (status != NFS_OK) {
2545                                 ret = status;
2546                                 break;
2547                         }
2548                 }
2549         };
2550 out:
2551         return ret;
2552 }
2553
2554 /**
2555  * nfs41_check_open_stateid - possibly free an open stateid
2556  *
2557  * @state: NFSv4 state for an inode
2558  *
2559  * Returns NFS_OK if recovery for this stateid is now finished.
2560  * Otherwise a negative NFS4ERR value is returned.
2561  */
2562 static int nfs41_check_open_stateid(struct nfs4_state *state)
2563 {
2564         struct nfs_server *server = NFS_SERVER(state->inode);
2565         nfs4_stateid *stateid = &state->open_stateid;
2566         struct rpc_cred *cred = state->owner->so_cred;
2567         int status;
2568
2569         /* If a state reset has been done, test_stateid is unneeded */
2570         if ((test_bit(NFS_O_RDONLY_STATE, &state->flags) == 0) &&
2571             (test_bit(NFS_O_WRONLY_STATE, &state->flags) == 0) &&
2572             (test_bit(NFS_O_RDWR_STATE, &state->flags) == 0))
2573                 return -NFS4ERR_BAD_STATEID;
2574
2575         status = nfs41_test_and_free_expired_stateid(server, stateid, cred);
2576         trace_nfs4_test_open_stateid(state, NULL, status);
2577         if (status == -NFS4ERR_EXPIRED || status == -NFS4ERR_BAD_STATEID) {
2578                 clear_bit(NFS_O_RDONLY_STATE, &state->flags);
2579                 clear_bit(NFS_O_WRONLY_STATE, &state->flags);
2580                 clear_bit(NFS_O_RDWR_STATE, &state->flags);
2581                 clear_bit(NFS_OPEN_STATE, &state->flags);
2582         }
2583         return status;
2584 }
2585
2586 static int nfs41_open_expired(struct nfs4_state_owner *sp, struct nfs4_state *state)
2587 {
2588         int status;
2589
2590         nfs41_check_delegation_stateid(state);
2591         status = nfs41_check_expired_locks(state);
2592         if (status != NFS_OK)
2593                 return status;
2594         status = nfs41_check_open_stateid(state);
2595         if (status != NFS_OK)
2596                 status = nfs4_open_expired(sp, state);
2597         return status;
2598 }
2599 #endif
2600
2601 /*
2602  * on an EXCLUSIVE create, the server should send back a bitmask with FATTR4-*
2603  * fields corresponding to attributes that were used to store the verifier.
2604  * Make sure we clobber those fields in the later setattr call
2605  */
2606 static inline void nfs4_exclusive_attrset(struct nfs4_opendata *opendata,
2607                                 struct iattr *sattr, struct nfs4_label **label)
2608 {
2609         const u32 *attrset = opendata->o_res.attrset;
2610
2611         if ((attrset[1] & FATTR4_WORD1_TIME_ACCESS) &&
2612             !(sattr->ia_valid & ATTR_ATIME_SET))
2613                 sattr->ia_valid |= ATTR_ATIME;
2614
2615         if ((attrset[1] & FATTR4_WORD1_TIME_MODIFY) &&
2616             !(sattr->ia_valid & ATTR_MTIME_SET))
2617                 sattr->ia_valid |= ATTR_MTIME;
2618
2619         /* Except MODE, it seems harmless of setting twice. */
2620         if ((attrset[1] & FATTR4_WORD1_MODE))
2621                 sattr->ia_valid &= ~ATTR_MODE;
2622
2623         if (attrset[2] & FATTR4_WORD2_SECURITY_LABEL)
2624                 *label = NULL;
2625 }
2626
2627 static int _nfs4_open_and_get_state(struct nfs4_opendata *opendata,
2628                 fmode_t fmode,
2629                 int flags,
2630                 struct nfs_open_context *ctx)
2631 {
2632         struct nfs4_state_owner *sp = opendata->owner;
2633         struct nfs_server *server = sp->so_server;
2634         struct dentry *dentry;
2635         struct nfs4_state *state;
2636         unsigned int seq;
2637         int ret;
2638
2639         seq = raw_seqcount_begin(&sp->so_reclaim_seqcount);
2640
2641         ret = _nfs4_proc_open(opendata);
2642         if (ret != 0)
2643                 goto out;
2644
2645         state = nfs4_opendata_to_nfs4_state(opendata);
2646         ret = PTR_ERR(state);
2647         if (IS_ERR(state))
2648                 goto out;
2649         if (server->caps & NFS_CAP_POSIX_LOCK)
2650                 set_bit(NFS_STATE_POSIX_LOCKS, &state->flags);
2651         if (opendata->o_res.rflags & NFS4_OPEN_RESULT_MAY_NOTIFY_LOCK)
2652                 set_bit(NFS_STATE_MAY_NOTIFY_LOCK, &state->flags);
2653
2654         dentry = opendata->dentry;
2655         if (d_really_is_negative(dentry)) {
2656                 struct dentry *alias;
2657                 d_drop(dentry);
2658                 alias = d_exact_alias(dentry, state->inode);
2659                 if (!alias)
2660                         alias = d_splice_alias(igrab(state->inode), dentry);
2661                 /* d_splice_alias() can't fail here - it's a non-directory */
2662                 if (alias) {
2663                         dput(ctx->dentry);
2664                         ctx->dentry = dentry = alias;
2665                 }
2666                 nfs_set_verifier(dentry,
2667                                 nfs_save_change_attribute(d_inode(opendata->dir)));
2668         }
2669
2670         ret = nfs4_opendata_access(sp->so_cred, opendata, state, fmode, flags);
2671         if (ret != 0)
2672                 goto out;
2673
2674         ctx->state = state;
2675         if (d_inode(dentry) == state->inode) {
2676                 nfs_inode_attach_open_context(ctx);
2677                 if (read_seqcount_retry(&sp->so_reclaim_seqcount, seq))
2678                         nfs4_schedule_stateid_recovery(server, state);
2679         }
2680 out:
2681         return ret;
2682 }
2683
2684 /*
2685  * Returns a referenced nfs4_state
2686  */
2687 static int _nfs4_do_open(struct inode *dir,
2688                         struct nfs_open_context *ctx,
2689                         int flags,
2690                         struct iattr *sattr,
2691                         struct nfs4_label *label,
2692                         int *opened)
2693 {
2694         struct nfs4_state_owner  *sp;
2695         struct nfs4_state     *state = NULL;
2696         struct nfs_server       *server = NFS_SERVER(dir);
2697         struct nfs4_opendata *opendata;
2698         struct dentry *dentry = ctx->dentry;
2699         struct rpc_cred *cred = ctx->cred;
2700         struct nfs4_threshold **ctx_th = &ctx->mdsthreshold;
2701         fmode_t fmode = ctx->mode & (FMODE_READ|FMODE_WRITE|FMODE_EXEC);
2702         enum open_claim_type4 claim = NFS4_OPEN_CLAIM_NULL;
2703         struct nfs4_label *olabel = NULL;
2704         int status;
2705
2706         /* Protect against reboot recovery conflicts */
2707         status = -ENOMEM;
2708         sp = nfs4_get_state_owner(server, cred, GFP_KERNEL);
2709         if (sp == NULL) {
2710                 dprintk("nfs4_do_open: nfs4_get_state_owner failed!\n");
2711                 goto out_err;
2712         }
2713         status = nfs4_recover_expired_lease(server);
2714         if (status != 0)
2715                 goto err_put_state_owner;
2716         if (d_really_is_positive(dentry))
2717                 nfs4_return_incompatible_delegation(d_inode(dentry), fmode);
2718         status = -ENOMEM;
2719         if (d_really_is_positive(dentry))
2720                 claim = NFS4_OPEN_CLAIM_FH;
2721         opendata = nfs4_opendata_alloc(dentry, sp, fmode, flags, sattr,
2722                         label, claim, GFP_KERNEL);
2723         if (opendata == NULL)
2724                 goto err_put_state_owner;
2725
2726         if (label) {
2727                 olabel = nfs4_label_alloc(server, GFP_KERNEL);
2728                 if (IS_ERR(olabel)) {
2729                         status = PTR_ERR(olabel);
2730                         goto err_opendata_put;
2731                 }
2732         }
2733
2734         if (server->attr_bitmask[2] & FATTR4_WORD2_MDSTHRESHOLD) {
2735                 if (!opendata->f_attr.mdsthreshold) {
2736                         opendata->f_attr.mdsthreshold = pnfs_mdsthreshold_alloc();
2737                         if (!opendata->f_attr.mdsthreshold)
2738                                 goto err_free_label;
2739                 }
2740                 opendata->o_arg.open_bitmap = &nfs4_pnfs_open_bitmap[0];
2741         }
2742         if (d_really_is_positive(dentry))
2743                 opendata->state = nfs4_get_open_state(d_inode(dentry), sp);
2744
2745         status = _nfs4_open_and_get_state(opendata, fmode, flags, ctx);
2746         if (status != 0)
2747                 goto err_free_label;
2748         state = ctx->state;
2749
2750         if ((opendata->o_arg.open_flags & (O_CREAT|O_EXCL)) == (O_CREAT|O_EXCL) &&
2751             (opendata->o_arg.createmode != NFS4_CREATE_GUARDED)) {
2752                 nfs4_exclusive_attrset(opendata, sattr, &label);
2753                 /*
2754                  * send create attributes which was not set by open
2755                  * with an extra setattr.
2756                  */
2757                 if (sattr->ia_valid & NFS4_VALID_ATTRS) {
2758                         nfs_fattr_init(opendata->o_res.f_attr);
2759                         status = nfs4_do_setattr(state->inode, cred,
2760                                         opendata->o_res.f_attr, sattr,
2761                                         state, label, olabel);
2762                         if (status == 0) {
2763                                 nfs_setattr_update_inode(state->inode, sattr,
2764                                                 opendata->o_res.f_attr);
2765                                 nfs_setsecurity(state->inode, opendata->o_res.f_attr, olabel);
2766                         }
2767                 }
2768         }
2769         if (opened && opendata->file_created)
2770                 *opened |= FILE_CREATED;
2771
2772         if (pnfs_use_threshold(ctx_th, opendata->f_attr.mdsthreshold, server)) {
2773                 *ctx_th = opendata->f_attr.mdsthreshold;
2774                 opendata->f_attr.mdsthreshold = NULL;
2775         }
2776
2777         nfs4_label_free(olabel);
2778
2779         nfs4_opendata_put(opendata);
2780         nfs4_put_state_owner(sp);
2781         return 0;
2782 err_free_label:
2783         nfs4_label_free(olabel);
2784 err_opendata_put:
2785         nfs4_opendata_put(opendata);
2786 err_put_state_owner:
2787         nfs4_put_state_owner(sp);
2788 out_err:
2789         return status;
2790 }
2791
2792
2793 static struct nfs4_state *nfs4_do_open(struct inode *dir,
2794                                         struct nfs_open_context *ctx,
2795                                         int flags,
2796                                         struct iattr *sattr,
2797                                         struct nfs4_label *label,
2798                                         int *opened)
2799 {
2800         struct nfs_server *server = NFS_SERVER(dir);
2801         struct nfs4_exception exception = { };
2802         struct nfs4_state *res;
2803         int status;
2804
2805         do {
2806                 status = _nfs4_do_open(dir, ctx, flags, sattr, label, opened);
2807                 res = ctx->state;
2808                 trace_nfs4_open_file(ctx, flags, status);
2809                 if (status == 0)
2810                         break;
2811                 /* NOTE: BAD_SEQID means the server and client disagree about the
2812                  * book-keeping w.r.t. state-changing operations
2813                  * (OPEN/CLOSE/LOCK/LOCKU...)
2814                  * It is actually a sign of a bug on the client or on the server.
2815                  *
2816                  * If we receive a BAD_SEQID error in the particular case of
2817                  * doing an OPEN, we assume that nfs_increment_open_seqid() will
2818                  * have unhashed the old state_owner for us, and that we can
2819                  * therefore safely retry using a new one. We should still warn
2820                  * the user though...
2821                  */
2822                 if (status == -NFS4ERR_BAD_SEQID) {
2823                         pr_warn_ratelimited("NFS: v4 server %s "
2824                                         " returned a bad sequence-id error!\n",
2825                                         NFS_SERVER(dir)->nfs_client->cl_hostname);
2826                         exception.retry = 1;
2827                         continue;
2828                 }
2829                 /*
2830                  * BAD_STATEID on OPEN means that the server cancelled our
2831                  * state before it received the OPEN_CONFIRM.
2832                  * Recover by retrying the request as per the discussion
2833                  * on Page 181 of RFC3530.
2834                  */
2835                 if (status == -NFS4ERR_BAD_STATEID) {
2836                         exception.retry = 1;
2837                         continue;
2838                 }
2839                 if (status == -EAGAIN) {
2840                         /* We must have found a delegation */
2841                         exception.retry = 1;
2842                         continue;
2843                 }
2844                 if (nfs4_clear_cap_atomic_open_v1(server, status, &exception))
2845                         continue;
2846                 res = ERR_PTR(nfs4_handle_exception(server,
2847                                         status, &exception));
2848         } while (exception.retry);
2849         return res;
2850 }
2851
2852 static int _nfs4_do_setattr(struct inode *inode,
2853                             struct nfs_setattrargs *arg,
2854                             struct nfs_setattrres *res,
2855                             struct rpc_cred *cred,
2856                             struct nfs4_state *state)
2857 {
2858         struct nfs_server *server = NFS_SERVER(inode);
2859         struct rpc_message msg = {
2860                 .rpc_proc       = &nfs4_procedures[NFSPROC4_CLNT_SETATTR],
2861                 .rpc_argp       = arg,
2862                 .rpc_resp       = res,
2863                 .rpc_cred       = cred,
2864         };
2865         struct rpc_cred *delegation_cred = NULL;
2866         unsigned long timestamp = jiffies;
2867         fmode_t fmode;
2868         bool truncate;
2869         int status;
2870
2871         nfs_fattr_init(res->fattr);
2872
2873         /* Servers should only apply open mode checks for file size changes */
2874         truncate = (arg->iap->ia_valid & ATTR_SIZE) ? true : false;
2875         fmode = truncate ? FMODE_WRITE : FMODE_READ;
2876
2877         if (nfs4_copy_delegation_stateid(inode, fmode, &arg->stateid, &delegation_cred)) {
2878                 /* Use that stateid */
2879         } else if (truncate && state != NULL) {
2880                 struct nfs_lockowner lockowner = {
2881                         .l_owner = current->files,
2882                         .l_pid = current->tgid,
2883                 };
2884                 if (!nfs4_valid_open_stateid(state))
2885                         return -EBADF;
2886                 if (nfs4_select_rw_stateid(state, FMODE_WRITE, &lockowner,
2887                                 &arg->stateid, &delegation_cred) == -EIO)
2888                         return -EBADF;
2889         } else
2890                 nfs4_stateid_copy(&arg->stateid, &zero_stateid);
2891         if (delegation_cred)
2892                 msg.rpc_cred = delegation_cred;
2893
2894         status = nfs4_call_sync(server->client, server, &msg, &arg->seq_args, &res->seq_res, 1);
2895
2896         put_rpccred(delegation_cred);
2897         if (status == 0 && state != NULL)
2898                 renew_lease(server, timestamp);
2899         trace_nfs4_setattr(inode, &arg->stateid, status);
2900         return status;
2901 }
2902
2903 static int nfs4_do_setattr(struct inode *inode, struct rpc_cred *cred,
2904                            struct nfs_fattr *fattr, struct iattr *sattr,
2905                            struct nfs4_state *state, struct nfs4_label *ilabel,
2906                            struct nfs4_label *olabel)
2907 {
2908         struct nfs_server *server = NFS_SERVER(inode);
2909         struct nfs_setattrargs  arg = {
2910                 .fh             = NFS_FH(inode),
2911                 .iap            = sattr,
2912                 .server         = server,
2913                 .bitmask = server->attr_bitmask,
2914                 .label          = ilabel,
2915         };
2916         struct nfs_setattrres  res = {
2917                 .fattr          = fattr,
2918                 .label          = olabel,
2919                 .server         = server,
2920         };
2921         struct nfs4_exception exception = {
2922                 .state = state,
2923                 .inode = inode,
2924                 .stateid = &arg.stateid,
2925         };
2926         int err;
2927
2928         arg.bitmask = nfs4_bitmask(server, ilabel);
2929         if (ilabel)
2930                 arg.bitmask = nfs4_bitmask(server, olabel);
2931
2932         do {
2933                 err = _nfs4_do_setattr(inode, &arg, &res, cred, state);
2934                 switch (err) {
2935                 case -NFS4ERR_OPENMODE:
2936                         if (!(sattr->ia_valid & ATTR_SIZE)) {
2937                                 pr_warn_once("NFSv4: server %s is incorrectly "
2938                                                 "applying open mode checks to "
2939                                                 "a SETATTR that is not "
2940                                                 "changing file size.\n",
2941                                                 server->nfs_client->cl_hostname);
2942                         }
2943                         if (state && !(state->state & FMODE_WRITE)) {
2944                                 err = -EBADF;
2945                                 if (sattr->ia_valid & ATTR_OPEN)
2946                                         err = -EACCES;
2947                                 goto out;
2948                         }
2949                 }
2950                 err = nfs4_handle_exception(server, err, &exception);
2951         } while (exception.retry);
2952 out:
2953         return err;
2954 }
2955
2956 static bool
2957 nfs4_wait_on_layoutreturn(struct inode *inode, struct rpc_task *task)
2958 {
2959         if (inode == NULL || !nfs_have_layout(inode))
2960                 return false;
2961
2962         return pnfs_wait_on_layoutreturn(inode, task);
2963 }
2964
2965 struct nfs4_closedata {
2966         struct inode *inode;
2967         struct nfs4_state *state;
2968         struct nfs_closeargs arg;
2969         struct nfs_closeres res;
2970         struct nfs_fattr fattr;
2971         unsigned long timestamp;
2972         bool roc;
2973         u32 roc_barrier;
2974 };
2975
2976 static void nfs4_free_closedata(void *data)
2977 {
2978         struct nfs4_closedata *calldata = data;
2979         struct nfs4_state_owner *sp = calldata->state->owner;
2980         struct super_block *sb = calldata->state->inode->i_sb;
2981
2982         if (calldata->roc)
2983                 pnfs_roc_release(calldata->state->inode);
2984         nfs4_put_open_state(calldata->state);
2985         nfs_free_seqid(calldata->arg.seqid);
2986         nfs4_put_state_owner(sp);
2987         nfs_sb_deactive(sb);
2988         kfree(calldata);
2989 }
2990
2991 static void nfs4_close_done(struct rpc_task *task, void *data)
2992 {
2993         struct nfs4_closedata *calldata = data;
2994         struct nfs4_state *state = calldata->state;
2995         struct nfs_server *server = NFS_SERVER(calldata->inode);
2996         nfs4_stateid *res_stateid = NULL;
2997
2998         dprintk("%s: begin!\n", __func__);
2999         if (!nfs4_sequence_done(task, &calldata->res.seq_res))
3000                 return;
3001         trace_nfs4_close(state, &calldata->arg, &calldata->res, task->tk_status);
3002         /* hmm. we are done with the inode, and in the process of freeing
3003          * the state_owner. we keep this around to process errors
3004          */
3005         switch (task->tk_status) {
3006                 case 0:
3007                         res_stateid = &calldata->res.stateid;
3008                         if (calldata->roc)
3009                                 pnfs_roc_set_barrier(state->inode,
3010                                                      calldata->roc_barrier);
3011                         renew_lease(server, calldata->timestamp);
3012                         break;
3013                 case -NFS4ERR_ADMIN_REVOKED:
3014                 case -NFS4ERR_STALE_STATEID:
3015                 case -NFS4ERR_EXPIRED:
3016                         nfs4_free_revoked_stateid(server,
3017                                         &calldata->arg.stateid,
3018                                         task->tk_msg.rpc_cred);
3019                 case -NFS4ERR_OLD_STATEID:
3020                 case -NFS4ERR_BAD_STATEID:
3021                         if (!nfs4_stateid_match(&calldata->arg.stateid,
3022                                                 &state->open_stateid)) {
3023                                 rpc_restart_call_prepare(task);
3024                                 goto out_release;
3025                         }
3026                         if (calldata->arg.fmode == 0)
3027                                 break;
3028                 default:
3029                         if (nfs4_async_handle_error(task, server, state, NULL) == -EAGAIN) {
3030                                 rpc_restart_call_prepare(task);
3031                                 goto out_release;
3032                         }
3033         }
3034         nfs_clear_open_stateid(state, &calldata->arg.stateid,
3035                         res_stateid, calldata->arg.fmode);
3036 out_release:
3037         nfs_release_seqid(calldata->arg.seqid);
3038         nfs_refresh_inode(calldata->inode, calldata->res.fattr);
3039         dprintk("%s: done, ret = %d!\n", __func__, task->tk_status);
3040 }
3041
3042 static void nfs4_close_prepare(struct rpc_task *task, void *data)
3043 {
3044         struct nfs4_closedata *calldata = data;
3045         struct nfs4_state *state = calldata->state;
3046         struct inode *inode = calldata->inode;
3047         bool is_rdonly, is_wronly, is_rdwr;
3048         int call_close = 0;
3049
3050         dprintk("%s: begin!\n", __func__);
3051         if (nfs_wait_on_sequence(calldata->arg.seqid, task) != 0)
3052                 goto out_wait;
3053
3054         task->tk_msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_OPEN_DOWNGRADE];
3055         spin_lock(&state->owner->so_lock);
3056         is_rdwr = test_bit(NFS_O_RDWR_STATE, &state->flags);
3057         is_rdonly = test_bit(NFS_O_RDONLY_STATE, &state->flags);
3058         is_wronly = test_bit(NFS_O_WRONLY_STATE, &state->flags);
3059         nfs4_stateid_copy(&calldata->arg.stateid, &state->open_stateid);
3060         /* Calculate the change in open mode */
3061         calldata->arg.fmode = 0;
3062         if (state->n_rdwr == 0) {
3063                 if (state->n_rdonly == 0)
3064                         call_close |= is_rdonly;
3065                 else if (is_rdonly)
3066                         calldata->arg.fmode |= FMODE_READ;
3067                 if (state->n_wronly == 0)
3068                         call_close |= is_wronly;
3069                 else if (is_wronly)
3070                         calldata->arg.fmode |= FMODE_WRITE;
3071                 if (calldata->arg.fmode != (FMODE_READ|FMODE_WRITE))
3072                         call_close |= is_rdwr;
3073         } else if (is_rdwr)
3074                 calldata->arg.fmode |= FMODE_READ|FMODE_WRITE;
3075
3076         if (!nfs4_valid_open_stateid(state))
3077                 call_close = 0;
3078         spin_unlock(&state->owner->so_lock);
3079
3080         if (!call_close) {
3081                 /* Note: exit _without_ calling nfs4_close_done */
3082                 goto out_no_action;
3083         }
3084
3085         if (nfs4_wait_on_layoutreturn(inode, task)) {
3086                 nfs_release_seqid(calldata->arg.seqid);
3087                 goto out_wait;
3088         }
3089
3090         if (calldata->arg.fmode == 0)
3091                 task->tk_msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_CLOSE];
3092         if (calldata->roc)
3093                 pnfs_roc_get_barrier(inode, &calldata->roc_barrier);
3094
3095         calldata->arg.share_access =
3096                 nfs4_map_atomic_open_share(NFS_SERVER(inode),
3097                                 calldata->arg.fmode, 0);
3098
3099         nfs_fattr_init(calldata->res.fattr);
3100         calldata->timestamp = jiffies;
3101         if (nfs4_setup_sequence(NFS_SERVER(inode),
3102                                 &calldata->arg.seq_args,
3103                                 &calldata->res.seq_res,
3104                                 task) != 0)
3105                 nfs_release_seqid(calldata->arg.seqid);
3106         dprintk("%s: done!\n", __func__);
3107         return;
3108 out_no_action:
3109         task->tk_action = NULL;
3110 out_wait:
3111         nfs4_sequence_done(task, &calldata->res.seq_res);
3112 }
3113
3114 static const struct rpc_call_ops nfs4_close_ops = {
3115         .rpc_call_prepare = nfs4_close_prepare,
3116         .rpc_call_done = nfs4_close_done,
3117         .rpc_release = nfs4_free_closedata,
3118 };
3119
3120 static bool nfs4_roc(struct inode *inode)
3121 {
3122         if (!nfs_have_layout(inode))
3123                 return false;
3124         return pnfs_roc(inode);
3125 }
3126
3127 /* 
3128  * It is possible for data to be read/written from a mem-mapped file 
3129  * after the sys_close call (which hits the vfs layer as a flush).
3130  * This means that we can't safely call nfsv4 close on a file until 
3131  * the inode is cleared. This in turn means that we are not good
3132  * NFSv4 citizens - we do not indicate to the server to update the file's 
3133  * share state even when we are done with one of the three share 
3134  * stateid's in the inode.
3135  *
3136  * NOTE: Caller must be holding the sp->so_owner semaphore!
3137  */
3138 int nfs4_do_close(struct nfs4_state *state, gfp_t gfp_mask, int wait)
3139 {
3140         struct nfs_server *server = NFS_SERVER(state->inode);
3141         struct nfs_seqid *(*alloc_seqid)(struct nfs_seqid_counter *, gfp_t);
3142         struct nfs4_closedata *calldata;
3143         struct nfs4_state_owner *sp = state->owner;
3144         struct rpc_task *task;
3145         struct rpc_message msg = {
3146                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_CLOSE],
3147                 .rpc_cred = state->owner->so_cred,
3148         };
3149         struct rpc_task_setup task_setup_data = {
3150                 .rpc_client = server->client,
3151                 .rpc_message = &msg,
3152                 .callback_ops = &nfs4_close_ops,
3153                 .workqueue = nfsiod_workqueue,
3154                 .flags = RPC_TASK_ASYNC,
3155         };
3156         int status = -ENOMEM;
3157
3158         nfs4_state_protect(server->nfs_client, NFS_SP4_MACH_CRED_CLEANUP,
3159                 &task_setup_data.rpc_client, &msg);
3160
3161         calldata = kzalloc(sizeof(*calldata), gfp_mask);
3162         if (calldata == NULL)
3163                 goto out;
3164         nfs4_init_sequence(&calldata->arg.seq_args, &calldata->res.seq_res, 1);
3165         calldata->inode = state->inode;
3166         calldata->state = state;
3167         calldata->arg.fh = NFS_FH(state->inode);
3168         /* Serialization for the sequence id */
3169         alloc_seqid = server->nfs_client->cl_mvops->alloc_seqid;
3170         calldata->arg.seqid = alloc_seqid(&state->owner->so_seqid, gfp_mask);
3171         if (IS_ERR(calldata->arg.seqid))
3172                 goto out_free_calldata;
3173         calldata->arg.fmode = 0;
3174         calldata->arg.bitmask = server->cache_consistency_bitmask;
3175         calldata->res.fattr = &calldata->fattr;
3176         calldata->res.seqid = calldata->arg.seqid;
3177         calldata->res.server = server;
3178         calldata->roc = nfs4_roc(state->inode);
3179         nfs_sb_active(calldata->inode->i_sb);
3180
3181         msg.rpc_argp = &calldata->arg;
3182         msg.rpc_resp = &calldata->res;
3183         task_setup_data.callback_data = calldata;
3184         task = rpc_run_task(&task_setup_data);
3185         if (IS_ERR(task))
3186                 return PTR_ERR(task);
3187         status = 0;
3188         if (wait)
3189                 status = rpc_wait_for_completion_task(task);
3190         rpc_put_task(task);
3191         return status;
3192 out_free_calldata:
3193         kfree(calldata);
3194 out:
3195         nfs4_put_open_state(state);
3196         nfs4_put_state_owner(sp);
3197         return status;
3198 }
3199
3200 static struct inode *
3201 nfs4_atomic_open(struct inode *dir, struct nfs_open_context *ctx,
3202                 int open_flags, struct iattr *attr, int *opened)
3203 {
3204         struct nfs4_state *state;
3205         struct nfs4_label l = {0, 0, 0, NULL}, *label = NULL;
3206
3207         label = nfs4_label_init_security(dir, ctx->dentry, attr, &l);
3208
3209         /* Protect against concurrent sillydeletes */
3210         state = nfs4_do_open(dir, ctx, open_flags, attr, label, opened);
3211
3212         nfs4_label_release_security(label);
3213
3214         if (IS_ERR(state))
3215                 return ERR_CAST(state);
3216         return state->inode;
3217 }
3218
3219 static void nfs4_close_context(struct nfs_open_context *ctx, int is_sync)
3220 {
3221         if (ctx->state == NULL)
3222                 return;
3223         if (is_sync)
3224                 nfs4_close_sync(ctx->state, ctx->mode);
3225         else
3226                 nfs4_close_state(ctx->state, ctx->mode);
3227 }
3228
3229 #define FATTR4_WORD1_NFS40_MASK (2*FATTR4_WORD1_MOUNTED_ON_FILEID - 1UL)
3230 #define FATTR4_WORD2_NFS41_MASK (2*FATTR4_WORD2_SUPPATTR_EXCLCREAT - 1UL)
3231 #define FATTR4_WORD2_NFS42_MASK (2*FATTR4_WORD2_SECURITY_LABEL - 1UL)
3232
3233 static int _nfs4_server_capabilities(struct nfs_server *server, struct nfs_fh *fhandle)
3234 {
3235         u32 bitmask[3] = {}, minorversion = server->nfs_client->cl_minorversion;
3236         struct nfs4_server_caps_arg args = {
3237                 .fhandle = fhandle,
3238                 .bitmask = bitmask,
3239         };
3240         struct nfs4_server_caps_res res = {};
3241         struct rpc_message msg = {
3242                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SERVER_CAPS],
3243                 .rpc_argp = &args,
3244                 .rpc_resp = &res,
3245         };
3246         int status;
3247
3248         bitmask[0] = FATTR4_WORD0_SUPPORTED_ATTRS |
3249                      FATTR4_WORD0_FH_EXPIRE_TYPE |
3250                      FATTR4_WORD0_LINK_SUPPORT |
3251                      FATTR4_WORD0_SYMLINK_SUPPORT |
3252                      FATTR4_WORD0_ACLSUPPORT;
3253         if (minorversion)
3254                 bitmask[2] = FATTR4_WORD2_SUPPATTR_EXCLCREAT;
3255
3256         status = nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
3257         if (status == 0) {
3258                 /* Sanity check the server answers */
3259                 switch (minorversion) {
3260                 case 0:
3261                         res.attr_bitmask[1] &= FATTR4_WORD1_NFS40_MASK;
3262                         res.attr_bitmask[2] = 0;
3263                         break;
3264                 case 1:
3265                         res.attr_bitmask[2] &= FATTR4_WORD2_NFS41_MASK;
3266                         break;
3267                 case 2:
3268                         res.attr_bitmask[2] &= FATTR4_WORD2_NFS42_MASK;
3269                 }
3270                 memcpy(server->attr_bitmask, res.attr_bitmask, sizeof(server->attr_bitmask));
3271                 server->caps &= ~(NFS_CAP_ACLS|NFS_CAP_HARDLINKS|
3272                                 NFS_CAP_SYMLINKS|NFS_CAP_FILEID|
3273                                 NFS_CAP_MODE|NFS_CAP_NLINK|NFS_CAP_OWNER|
3274                                 NFS_CAP_OWNER_GROUP|NFS_CAP_ATIME|
3275                                 NFS_CAP_CTIME|NFS_CAP_MTIME|
3276                                 NFS_CAP_SECURITY_LABEL);
3277                 if (res.attr_bitmask[0] & FATTR4_WORD0_ACL &&
3278                                 res.acl_bitmask & ACL4_SUPPORT_ALLOW_ACL)
3279                         server->caps |= NFS_CAP_ACLS;
3280                 if (res.has_links != 0)
3281                         server->caps |= NFS_CAP_HARDLINKS;
3282                 if (res.has_symlinks != 0)
3283                         server->caps |= NFS_CAP_SYMLINKS;
3284                 if (res.attr_bitmask[0] & FATTR4_WORD0_FILEID)
3285                         server->caps |= NFS_CAP_FILEID;
3286                 if (res.attr_bitmask[1] & FATTR4_WORD1_MODE)
3287                         server->caps |= NFS_CAP_MODE;
3288                 if (res.attr_bitmask[1] & FATTR4_WORD1_NUMLINKS)
3289                         server->caps |= NFS_CAP_NLINK;
3290                 if (res.attr_bitmask[1] & FATTR4_WORD1_OWNER)
3291                         server->caps |= NFS_CAP_OWNER;
3292                 if (res.attr_bitmask[1] & FATTR4_WORD1_OWNER_GROUP)
3293                         server->caps |= NFS_CAP_OWNER_GROUP;
3294                 if (res.attr_bitmask[1] & FATTR4_WORD1_TIME_ACCESS)
3295                         server->caps |= NFS_CAP_ATIME;
3296                 if (res.attr_bitmask[1] & FATTR4_WORD1_TIME_METADATA)
3297                         server->caps |= NFS_CAP_CTIME;
3298                 if (res.attr_bitmask[1] & FATTR4_WORD1_TIME_MODIFY)
3299                         server->caps |= NFS_CAP_MTIME;
3300 #ifdef CONFIG_NFS_V4_SECURITY_LABEL
3301                 if (res.attr_bitmask[2] & FATTR4_WORD2_SECURITY_LABEL)
3302                         server->caps |= NFS_CAP_SECURITY_LABEL;
3303 #endif
3304                 memcpy(server->attr_bitmask_nl, res.attr_bitmask,
3305                                 sizeof(server->attr_bitmask));
3306                 server->attr_bitmask_nl[2] &= ~FATTR4_WORD2_SECURITY_LABEL;
3307
3308                 memcpy(server->cache_consistency_bitmask, res.attr_bitmask, sizeof(server->cache_consistency_bitmask));
3309                 server->cache_consistency_bitmask[0] &= FATTR4_WORD0_CHANGE|FATTR4_WORD0_SIZE;
3310                 server->cache_consistency_bitmask[1] &= FATTR4_WORD1_TIME_METADATA|FATTR4_WORD1_TIME_MODIFY;
3311                 server->cache_consistency_bitmask[2] = 0;
3312                 memcpy(server->exclcreat_bitmask, res.exclcreat_bitmask,
3313                         sizeof(server->exclcreat_bitmask));
3314                 server->acl_bitmask = res.acl_bitmask;
3315                 server->fh_expire_type = res.fh_expire_type;
3316         }
3317
3318         return status;
3319 }
3320
3321 int nfs4_server_capabilities(struct nfs_server *server, struct nfs_fh *fhandle)
3322 {
3323         struct nfs4_exception exception = { };
3324         int err;
3325         do {
3326                 err = nfs4_handle_exception(server,
3327                                 _nfs4_server_capabilities(server, fhandle),
3328                                 &exception);
3329         } while (exception.retry);
3330         return err;
3331 }
3332
3333 static int _nfs4_lookup_root(struct nfs_server *server, struct nfs_fh *fhandle,
3334                 struct nfs_fsinfo *info)
3335 {
3336         u32 bitmask[3];
3337         struct nfs4_lookup_root_arg args = {
3338                 .bitmask = bitmask,
3339         };
3340         struct nfs4_lookup_res res = {
3341                 .server = server,
3342                 .fattr = info->fattr,
3343                 .fh = fhandle,
3344         };
3345         struct rpc_message msg = {
3346                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LOOKUP_ROOT],
3347                 .rpc_argp = &args,
3348                 .rpc_resp = &res,
3349         };
3350
3351         bitmask[0] = nfs4_fattr_bitmap[0];
3352         bitmask[1] = nfs4_fattr_bitmap[1];
3353         /*
3354          * Process the label in the upcoming getfattr
3355          */
3356         bitmask[2] = nfs4_fattr_bitmap[2] & ~FATTR4_WORD2_SECURITY_LABEL;
3357
3358         nfs_fattr_init(info->fattr);
3359         return nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
3360 }
3361
3362 static int nfs4_lookup_root(struct nfs_server *server, struct nfs_fh *fhandle,
3363                 struct nfs_fsinfo *info)
3364 {
3365         struct nfs4_exception exception = { };
3366         int err;
3367         do {
3368                 err = _nfs4_lookup_root(server, fhandle, info);
3369                 trace_nfs4_lookup_root(server, fhandle, info->fattr, err);
3370                 switch (err) {
3371                 case 0:
3372                 case -NFS4ERR_WRONGSEC:
3373                         goto out;
3374                 default:
3375                         err = nfs4_handle_exception(server, err, &exception);
3376                 }
3377         } while (exception.retry);
3378 out:
3379         return err;
3380 }
3381
3382 static int nfs4_lookup_root_sec(struct nfs_server *server, struct nfs_fh *fhandle,
3383                                 struct nfs_fsinfo *info, rpc_authflavor_t flavor)
3384 {
3385         struct rpc_auth_create_args auth_args = {
3386                 .pseudoflavor = flavor,
3387         };
3388         struct rpc_auth *auth;
3389         int ret;
3390
3391         auth = rpcauth_create(&auth_args, server->client);
3392         if (IS_ERR(auth)) {
3393                 ret = -EACCES;
3394                 goto out;
3395         }
3396         ret = nfs4_lookup_root(server, fhandle, info);
3397 out:
3398         return ret;
3399 }
3400
3401 /*
3402  * Retry pseudoroot lookup with various security flavors.  We do this when:
3403  *
3404  *   NFSv4.0: the PUTROOTFH operation returns NFS4ERR_WRONGSEC
3405  *   NFSv4.1: the server does not support the SECINFO_NO_NAME operation
3406  *
3407  * Returns zero on success, or a negative NFS4ERR value, or a
3408  * negative errno value.
3409  */
3410 static int nfs4_find_root_sec(struct nfs_server *server, struct nfs_fh *fhandle,
3411                               struct nfs_fsinfo *info)
3412 {
3413         /* Per 3530bis 15.33.5 */
3414         static const rpc_authflavor_t flav_array[] = {
3415                 RPC_AUTH_GSS_KRB5P,
3416                 RPC_AUTH_GSS_KRB5I,
3417                 RPC_AUTH_GSS_KRB5,
3418                 RPC_AUTH_UNIX,                  /* courtesy */
3419                 RPC_AUTH_NULL,
3420         };
3421         int status = -EPERM;
3422         size_t i;
3423
3424         if (server->auth_info.flavor_len > 0) {
3425                 /* try each flavor specified by user */
3426                 for (i = 0; i < server->auth_info.flavor_len; i++) {
3427                         status = nfs4_lookup_root_sec(server, fhandle, info,
3428                                                 server->auth_info.flavors[i]);
3429                         if (status == -NFS4ERR_WRONGSEC || status == -EACCES)
3430                                 continue;
3431                         break;
3432                 }
3433         } else {
3434                 /* no flavors specified by user, try default list */
3435                 for (i = 0; i < ARRAY_SIZE(flav_array); i++) {
3436                         status = nfs4_lookup_root_sec(server, fhandle, info,
3437                                                       flav_array[i]);
3438                         if (status == -NFS4ERR_WRONGSEC || status == -EACCES)
3439                                 continue;
3440                         break;
3441                 }
3442         }
3443
3444         /*
3445          * -EACCESS could mean that the user doesn't have correct permissions
3446          * to access the mount.  It could also mean that we tried to mount
3447          * with a gss auth flavor, but rpc.gssd isn't running.  Either way,
3448          * existing mount programs don't handle -EACCES very well so it should
3449          * be mapped to -EPERM instead.
3450          */
3451         if (status == -EACCES)
3452                 status = -EPERM;
3453         return status;
3454 }
3455
3456 /**
3457  * nfs4_proc_get_rootfh - get file handle for server's pseudoroot
3458  * @server: initialized nfs_server handle
3459  * @fhandle: we fill in the pseudo-fs root file handle
3460  * @info: we fill in an FSINFO struct
3461  * @auth_probe: probe the auth flavours
3462  *
3463  * Returns zero on success, or a negative errno.
3464  */
3465 int nfs4_proc_get_rootfh(struct nfs_server *server, struct nfs_fh *fhandle,
3466                          struct nfs_fsinfo *info,
3467                          bool auth_probe)
3468 {
3469         int status = 0;
3470
3471         if (!auth_probe)
3472                 status = nfs4_lookup_root(server, fhandle, info);
3473
3474         if (auth_probe || status == NFS4ERR_WRONGSEC)
3475                 status = server->nfs_client->cl_mvops->find_root_sec(server,
3476                                 fhandle, info);
3477
3478         if (status == 0)
3479                 status = nfs4_server_capabilities(server, fhandle);
3480         if (status == 0)
3481                 status = nfs4_do_fsinfo(server, fhandle, info);
3482
3483         return nfs4_map_errors(status);
3484 }
3485
3486 static int nfs4_proc_get_root(struct nfs_server *server, struct nfs_fh *mntfh,
3487                               struct nfs_fsinfo *info)
3488 {
3489         int error;
3490         struct nfs_fattr *fattr = info->fattr;
3491         struct nfs4_label *label = NULL;
3492
3493         error = nfs4_server_capabilities(server, mntfh);
3494         if (error < 0) {
3495                 dprintk("nfs4_get_root: getcaps error = %d\n", -error);
3496                 return error;
3497         }
3498
3499         label = nfs4_label_alloc(server, GFP_KERNEL);
3500         if (IS_ERR(label))
3501                 return PTR_ERR(label);
3502
3503         error = nfs4_proc_getattr(server, mntfh, fattr, label);
3504         if (error < 0) {
3505                 dprintk("nfs4_get_root: getattr error = %d\n", -error);
3506                 goto err_free_label;
3507         }
3508
3509         if (fattr->valid & NFS_ATTR_FATTR_FSID &&
3510             !nfs_fsid_equal(&server->fsid, &fattr->fsid))
3511                 memcpy(&server->fsid, &fattr->fsid, sizeof(server->fsid));
3512
3513 err_free_label:
3514         nfs4_label_free(label);
3515
3516         return error;
3517 }
3518
3519 /*
3520  * Get locations and (maybe) other attributes of a referral.
3521  * Note that we'll actually follow the referral later when
3522  * we detect fsid mismatch in inode revalidation
3523  */
3524 static int nfs4_get_referral(struct rpc_clnt *client, struct inode *dir,
3525                              const struct qstr *name, struct nfs_fattr *fattr,
3526                              struct nfs_fh *fhandle)
3527 {
3528         int status = -ENOMEM;
3529         struct page *page = NULL;
3530         struct nfs4_fs_locations *locations = NULL;
3531
3532         page = alloc_page(GFP_KERNEL);
3533         if (page == NULL)
3534                 goto out;
3535         locations = kmalloc(sizeof(struct nfs4_fs_locations), GFP_KERNEL);
3536         if (locations == NULL)
3537                 goto out;
3538
3539         status = nfs4_proc_fs_locations(client, dir, name, locations, page);
3540         if (status != 0)
3541                 goto out;
3542
3543         /*
3544          * If the fsid didn't change, this is a migration event, not a
3545          * referral.  Cause us to drop into the exception handler, which
3546          * will kick off migration recovery.
3547          */
3548         if (nfs_fsid_equal(&NFS_SERVER(dir)->fsid, &locations->fattr.fsid)) {
3549                 dprintk("%s: server did not return a different fsid for"
3550                         " a referral at %s\n", __func__, name->name);
3551                 status = -NFS4ERR_MOVED;
3552                 goto out;
3553         }
3554         /* Fixup attributes for the nfs_lookup() call to nfs_fhget() */
3555         nfs_fixup_referral_attributes(&locations->fattr);
3556
3557         /* replace the lookup nfs_fattr with the locations nfs_fattr */
3558         memcpy(fattr, &locations->fattr, sizeof(struct nfs_fattr));
3559         memset(fhandle, 0, sizeof(struct nfs_fh));
3560 out:
3561         if (page)
3562                 __free_page(page);
3563         kfree(locations);
3564         return status;
3565 }
3566
3567 static int _nfs4_proc_getattr(struct nfs_server *server, struct nfs_fh *fhandle,
3568                                 struct nfs_fattr *fattr, struct nfs4_label *label)
3569 {
3570         struct nfs4_getattr_arg args = {
3571                 .fh = fhandle,
3572                 .bitmask = server->attr_bitmask,
3573         };
3574         struct nfs4_getattr_res res = {
3575                 .fattr = fattr,
3576                 .label = label,
3577                 .server = server,
3578         };
3579         struct rpc_message msg = {
3580                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_GETATTR],
3581                 .rpc_argp = &args,
3582                 .rpc_resp = &res,
3583         };
3584
3585         args.bitmask = nfs4_bitmask(server, label);
3586
3587         nfs_fattr_init(fattr);
3588         return nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
3589 }
3590
3591 static int nfs4_proc_getattr(struct nfs_server *server, struct nfs_fh *fhandle,
3592                                 struct nfs_fattr *fattr, struct nfs4_label *label)
3593 {
3594         struct nfs4_exception exception = { };
3595         int err;
3596         do {
3597                 err = _nfs4_proc_getattr(server, fhandle, fattr, label);
3598                 trace_nfs4_getattr(server, fhandle, fattr, err);
3599                 err = nfs4_handle_exception(server, err,
3600                                 &exception);
3601         } while (exception.retry);
3602         return err;
3603 }
3604
3605 /* 
3606  * The file is not closed if it is opened due to the a request to change
3607  * the size of the file. The open call will not be needed once the
3608  * VFS layer lookup-intents are implemented.
3609  *
3610  * Close is called when the inode is destroyed.
3611  * If we haven't opened the file for O_WRONLY, we
3612  * need to in the size_change case to obtain a stateid.
3613  *
3614  * Got race?
3615  * Because OPEN is always done by name in nfsv4, it is
3616  * possible that we opened a different file by the same
3617  * name.  We can recognize this race condition, but we
3618  * can't do anything about it besides returning an error.
3619  *
3620  * This will be fixed with VFS changes (lookup-intent).
3621  */
3622 static int
3623 nfs4_proc_setattr(struct dentry *dentry, struct nfs_fattr *fattr,
3624                   struct iattr *sattr)
3625 {
3626         struct inode *inode = d_inode(dentry);
3627         struct rpc_cred *cred = NULL;
3628         struct nfs4_state *state = NULL;
3629         struct nfs4_label *label = NULL;
3630         int status;
3631
3632         if (pnfs_ld_layoutret_on_setattr(inode) &&
3633             sattr->ia_valid & ATTR_SIZE &&
3634             sattr->ia_size < i_size_read(inode))
3635                 pnfs_commit_and_return_layout(inode);
3636
3637         nfs_fattr_init(fattr);
3638         
3639         /* Deal with open(O_TRUNC) */
3640         if (sattr->ia_valid & ATTR_OPEN)
3641                 sattr->ia_valid &= ~(ATTR_MTIME|ATTR_CTIME);
3642
3643         /* Optimization: if the end result is no change, don't RPC */
3644         if ((sattr->ia_valid & ~(ATTR_FILE|ATTR_OPEN)) == 0)
3645                 return 0;
3646
3647         /* Search for an existing open(O_WRITE) file */
3648         if (sattr->ia_valid & ATTR_FILE) {
3649                 struct nfs_open_context *ctx;
3650
3651                 ctx = nfs_file_open_context(sattr->ia_file);
3652                 if (ctx) {
3653                         cred = ctx->cred;
3654                         state = ctx->state;
3655                 }
3656         }
3657
3658         label = nfs4_label_alloc(NFS_SERVER(inode), GFP_KERNEL);
3659         if (IS_ERR(label))
3660                 return PTR_ERR(label);
3661
3662         status = nfs4_do_setattr(inode, cred, fattr, sattr, state, NULL, label);
3663         if (status == 0) {
3664                 nfs_setattr_update_inode(inode, sattr, fattr);
3665                 nfs_setsecurity(inode, fattr, label);
3666         }
3667         nfs4_label_free(label);
3668         return status;
3669 }
3670
3671 static int _nfs4_proc_lookup(struct rpc_clnt *clnt, struct inode *dir,
3672                 const struct qstr *name, struct nfs_fh *fhandle,
3673                 struct nfs_fattr *fattr, struct nfs4_label *label)
3674 {
3675         struct nfs_server *server = NFS_SERVER(dir);
3676         int                    status;
3677         struct nfs4_lookup_arg args = {
3678                 .bitmask = server->attr_bitmask,
3679                 .dir_fh = NFS_FH(dir),
3680                 .name = name,
3681         };
3682         struct nfs4_lookup_res res = {
3683                 .server = server,
3684                 .fattr = fattr,
3685                 .label = label,
3686                 .fh = fhandle,
3687         };
3688         struct rpc_message msg = {
3689                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LOOKUP],
3690                 .rpc_argp = &args,
3691                 .rpc_resp = &res,
3692         };
3693
3694         args.bitmask = nfs4_bitmask(server, label);
3695
3696         nfs_fattr_init(fattr);
3697
3698         dprintk("NFS call  lookup %s\n", name->name);
3699         status = nfs4_call_sync(clnt, server, &msg, &args.seq_args, &res.seq_res, 0);
3700         dprintk("NFS reply lookup: %d\n", status);
3701         return status;
3702 }
3703
3704 static void nfs_fixup_secinfo_attributes(struct nfs_fattr *fattr)
3705 {
3706         fattr->valid |= NFS_ATTR_FATTR_TYPE | NFS_ATTR_FATTR_MODE |
3707                 NFS_ATTR_FATTR_NLINK | NFS_ATTR_FATTR_MOUNTPOINT;
3708         fattr->mode = S_IFDIR | S_IRUGO | S_IXUGO;
3709         fattr->nlink = 2;
3710 }
3711
3712 static int nfs4_proc_lookup_common(struct rpc_clnt **clnt, struct inode *dir,
3713                                    const struct qstr *name, struct nfs_fh *fhandle,
3714                                    struct nfs_fattr *fattr, struct nfs4_label *label)
3715 {
3716         struct nfs4_exception exception = { };
3717         struct rpc_clnt *client = *clnt;
3718         int err;
3719         do {
3720                 err = _nfs4_proc_lookup(client, dir, name, fhandle, fattr, label);
3721                 trace_nfs4_lookup(dir, name, err);
3722                 switch (err) {
3723                 case -NFS4ERR_BADNAME:
3724                         err = -ENOENT;
3725                         goto out;
3726                 case -NFS4ERR_MOVED:
3727                         err = nfs4_get_referral(client, dir, name, fattr, fhandle);
3728                         if (err == -NFS4ERR_MOVED)
3729                                 err = nfs4_handle_exception(NFS_SERVER(dir), err, &exception);
3730                         goto out;
3731                 case -NFS4ERR_WRONGSEC:
3732                         err = -EPERM;
3733                         if (client != *clnt)
3734                                 goto out;
3735                         client = nfs4_negotiate_security(client, dir, name);
3736                         if (IS_ERR(client))
3737                                 return PTR_ERR(client);
3738
3739                         exception.retry = 1;
3740                         break;
3741                 default:
3742                         err = nfs4_handle_exception(NFS_SERVER(dir), err, &exception);
3743                 }
3744         } while (exception.retry);
3745
3746 out:
3747         if (err == 0)
3748                 *clnt = client;
3749         else if (client != *clnt)
3750                 rpc_shutdown_client(client);
3751
3752         return err;
3753 }
3754
3755 static int nfs4_proc_lookup(struct inode *dir, const struct qstr *name,
3756                             struct nfs_fh *fhandle, struct nfs_fattr *fattr,
3757                             struct nfs4_label *label)
3758 {
3759         int status;
3760         struct rpc_clnt *client = NFS_CLIENT(dir);
3761
3762         status = nfs4_proc_lookup_common(&client, dir, name, fhandle, fattr, label);
3763         if (client != NFS_CLIENT(dir)) {
3764                 rpc_shutdown_client(client);
3765                 nfs_fixup_secinfo_attributes(fattr);
3766         }
3767         return status;
3768 }
3769
3770 struct rpc_clnt *
3771 nfs4_proc_lookup_mountpoint(struct inode *dir, const struct qstr *name,
3772                             struct nfs_fh *fhandle, struct nfs_fattr *fattr)
3773 {
3774         struct rpc_clnt *client = NFS_CLIENT(dir);
3775         int status;
3776
3777         status = nfs4_proc_lookup_common(&client, dir, name, fhandle, fattr, NULL);
3778         if (status < 0)
3779                 return ERR_PTR(status);
3780         return (client == NFS_CLIENT(dir)) ? rpc_clone_client(client) : client;
3781 }
3782
3783 static int _nfs4_proc_access(struct inode *inode, struct nfs_access_entry *entry)
3784 {
3785         struct nfs_server *server = NFS_SERVER(inode);
3786         struct nfs4_accessargs args = {
3787                 .fh = NFS_FH(inode),
3788                 .bitmask = server->cache_consistency_bitmask,
3789         };
3790         struct nfs4_accessres res = {
3791                 .server = server,
3792         };
3793         struct rpc_message msg = {
3794                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_ACCESS],
3795                 .rpc_argp = &args,
3796                 .rpc_resp = &res,
3797                 .rpc_cred = entry->cred,
3798         };
3799         int mode = entry->mask;
3800         int status = 0;
3801
3802         /*
3803          * Determine which access bits we want to ask for...
3804          */
3805         if (mode & MAY_READ)
3806                 args.access |= NFS4_ACCESS_READ;
3807         if (S_ISDIR(inode->i_mode)) {
3808                 if (mode & MAY_WRITE)
3809                         args.access |= NFS4_ACCESS_MODIFY | NFS4_ACCESS_EXTEND | NFS4_ACCESS_DELETE;
3810                 if (mode & MAY_EXEC)
3811                         args.access |= NFS4_ACCESS_LOOKUP;
3812         } else {
3813                 if (mode & MAY_WRITE)
3814                         args.access |= NFS4_ACCESS_MODIFY | NFS4_ACCESS_EXTEND;
3815                 if (mode & MAY_EXEC)
3816                         args.access |= NFS4_ACCESS_EXECUTE;
3817         }
3818
3819         res.fattr = nfs_alloc_fattr();
3820         if (res.fattr == NULL)
3821                 return -ENOMEM;
3822
3823         status = nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
3824         if (!status) {
3825                 nfs_access_set_mask(entry, res.access);
3826                 nfs_refresh_inode(inode, res.fattr);
3827         }
3828         nfs_free_fattr(res.fattr);
3829         return status;
3830 }
3831
3832 static int nfs4_proc_access(struct inode *inode, struct nfs_access_entry *entry)
3833 {
3834         struct nfs4_exception exception = { };
3835         int err;
3836         do {
3837                 err = _nfs4_proc_access(inode, entry);
3838                 trace_nfs4_access(inode, err);
3839                 err = nfs4_handle_exception(NFS_SERVER(inode), err,
3840                                 &exception);
3841         } while (exception.retry);
3842         return err;
3843 }
3844
3845 /*
3846  * TODO: For the time being, we don't try to get any attributes
3847  * along with any of the zero-copy operations READ, READDIR,
3848  * READLINK, WRITE.
3849  *
3850  * In the case of the first three, we want to put the GETATTR
3851  * after the read-type operation -- this is because it is hard
3852  * to predict the length of a GETATTR response in v4, and thus
3853  * align the READ data correctly.  This means that the GETATTR
3854  * may end up partially falling into the page cache, and we should
3855  * shift it into the 'tail' of the xdr_buf before processing.
3856  * To do this efficiently, we need to know the total length
3857  * of data received, which doesn't seem to be available outside
3858  * of the RPC layer.
3859  *
3860  * In the case of WRITE, we also want to put the GETATTR after
3861  * the operation -- in this case because we want to make sure
3862  * we get the post-operation mtime and size.
3863  *
3864  * Both of these changes to the XDR layer would in fact be quite
3865  * minor, but I decided to leave them for a subsequent patch.
3866  */
3867 static int _nfs4_proc_readlink(struct inode *inode, struct page *page,
3868                 unsigned int pgbase, unsigned int pglen)
3869 {
3870         struct nfs4_readlink args = {
3871                 .fh       = NFS_FH(inode),
3872                 .pgbase   = pgbase,
3873                 .pglen    = pglen,
3874                 .pages    = &page,
3875         };
3876         struct nfs4_readlink_res res;
3877         struct rpc_message msg = {
3878                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_READLINK],
3879                 .rpc_argp = &args,
3880                 .rpc_resp = &res,
3881         };
3882
3883         return nfs4_call_sync(NFS_SERVER(inode)->client, NFS_SERVER(inode), &msg, &args.seq_args, &res.seq_res, 0);
3884 }
3885
3886 static int nfs4_proc_readlink(struct inode *inode, struct page *page,
3887                 unsigned int pgbase, unsigned int pglen)
3888 {
3889         struct nfs4_exception exception = { };
3890         int err;
3891         do {
3892                 err = _nfs4_proc_readlink(inode, page, pgbase, pglen);
3893                 trace_nfs4_readlink(inode, err);
3894                 err = nfs4_handle_exception(NFS_SERVER(inode), err,
3895                                 &exception);
3896         } while (exception.retry);
3897         return err;
3898 }
3899
3900 /*
3901  * This is just for mknod.  open(O_CREAT) will always do ->open_context().
3902  */
3903 static int
3904 nfs4_proc_create(struct inode *dir, struct dentry *dentry, struct iattr *sattr,
3905                  int flags)
3906 {
3907         struct nfs4_label l, *ilabel = NULL;
3908         struct nfs_open_context *ctx;
3909         struct nfs4_state *state;
3910         int status = 0;
3911
3912         ctx = alloc_nfs_open_context(dentry, FMODE_READ);
3913         if (IS_ERR(ctx))
3914                 return PTR_ERR(ctx);
3915
3916         ilabel = nfs4_label_init_security(dir, dentry, sattr, &l);
3917
3918         sattr->ia_mode &= ~current_umask();
3919         state = nfs4_do_open(dir, ctx, flags, sattr, ilabel, NULL);
3920         if (IS_ERR(state)) {
3921                 status = PTR_ERR(state);
3922                 goto out;
3923         }
3924 out:
3925         nfs4_label_release_security(ilabel);
3926         put_nfs_open_context(ctx);
3927         return status;
3928 }
3929
3930 static int _nfs4_proc_remove(struct inode *dir, const struct qstr *name)
3931 {
3932         struct nfs_server *server = NFS_SERVER(dir);
3933         struct nfs_removeargs args = {
3934                 .fh = NFS_FH(dir),
3935                 .name = *name,
3936         };
3937         struct nfs_removeres res = {
3938                 .server = server,
3939         };
3940         struct rpc_message msg = {
3941                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_REMOVE],
3942                 .rpc_argp = &args,
3943                 .rpc_resp = &res,
3944         };
3945         int status;
3946
3947         status = nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 1);
3948         if (status == 0)
3949                 update_changeattr(dir, &res.cinfo);
3950         return status;
3951 }
3952
3953 static int nfs4_proc_remove(struct inode *dir, const struct qstr *name)
3954 {
3955         struct nfs4_exception exception = { };
3956         int err;
3957         do {
3958                 err = _nfs4_proc_remove(dir, name);
3959                 trace_nfs4_remove(dir, name, err);
3960                 err = nfs4_handle_exception(NFS_SERVER(dir), err,
3961                                 &exception);
3962         } while (exception.retry);
3963         return err;
3964 }
3965
3966 static void nfs4_proc_unlink_setup(struct rpc_message *msg, struct inode *dir)
3967 {
3968         struct nfs_server *server = NFS_SERVER(dir);
3969         struct nfs_removeargs *args = msg->rpc_argp;
3970         struct nfs_removeres *res = msg->rpc_resp;
3971
3972         res->server = server;
3973         msg->rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_REMOVE];
3974         nfs4_init_sequence(&args->seq_args, &res->seq_res, 1);
3975
3976         nfs_fattr_init(res->dir_attr);
3977 }
3978
3979 static void nfs4_proc_unlink_rpc_prepare(struct rpc_task *task, struct nfs_unlinkdata *data)
3980 {
3981         nfs4_setup_sequence(NFS_SB(data->dentry->d_sb),
3982                         &data->args.seq_args,
3983                         &data->res.seq_res,
3984                         task);
3985 }
3986
3987 static int nfs4_proc_unlink_done(struct rpc_task *task, struct inode *dir)
3988 {
3989         struct nfs_unlinkdata *data = task->tk_calldata;
3990         struct nfs_removeres *res = &data->res;
3991
3992         if (!nfs4_sequence_done(task, &res->seq_res))
3993                 return 0;
3994         if (nfs4_async_handle_error(task, res->server, NULL,
3995                                     &data->timeout) == -EAGAIN)
3996                 return 0;
3997         update_changeattr(dir, &res->cinfo);
3998         return 1;
3999 }
4000
4001 static void nfs4_proc_rename_setup(struct rpc_message *msg, struct inode *dir)
4002 {
4003         struct nfs_server *server = NFS_SERVER(dir);
4004         struct nfs_renameargs *arg = msg->rpc_argp;
4005         struct nfs_renameres *res = msg->rpc_resp;
4006
4007         msg->rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_RENAME];
4008         res->server = server;
4009         nfs4_init_sequence(&arg->seq_args, &res->seq_res, 1);
4010 }
4011
4012 static void nfs4_proc_rename_rpc_prepare(struct rpc_task *task, struct nfs_renamedata *data)
4013 {
4014         nfs4_setup_sequence(NFS_SERVER(data->old_dir),
4015                         &data->args.seq_args,
4016                         &data->res.seq_res,
4017                         task);
4018 }
4019
4020 static int nfs4_proc_rename_done(struct rpc_task *task, struct inode *old_dir,
4021                                  struct inode *new_dir)
4022 {
4023         struct nfs_renamedata *data = task->tk_calldata;
4024         struct nfs_renameres *res = &data->res;
4025
4026         if (!nfs4_sequence_done(task, &res->seq_res))
4027                 return 0;
4028         if (nfs4_async_handle_error(task, res->server, NULL, &data->timeout) == -EAGAIN)
4029                 return 0;
4030
4031         update_changeattr(old_dir, &res->old_cinfo);
4032         update_changeattr(new_dir, &res->new_cinfo);
4033         return 1;
4034 }
4035
4036 static int _nfs4_proc_link(struct inode *inode, struct inode *dir, const struct qstr *name)
4037 {
4038         struct nfs_server *server = NFS_SERVER(inode);
4039         struct nfs4_link_arg arg = {
4040                 .fh     = NFS_FH(inode),
4041                 .dir_fh = NFS_FH(dir),
4042                 .name   = name,
4043                 .bitmask = server->attr_bitmask,
4044         };
4045         struct nfs4_link_res res = {
4046                 .server = server,
4047                 .label = NULL,
4048         };
4049         struct rpc_message msg = {
4050                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LINK],
4051                 .rpc_argp = &arg,
4052                 .rpc_resp = &res,
4053         };
4054         int status = -ENOMEM;
4055
4056         res.fattr = nfs_alloc_fattr();
4057         if (res.fattr == NULL)
4058                 goto out;
4059
4060         res.label = nfs4_label_alloc(server, GFP_KERNEL);
4061         if (IS_ERR(res.label)) {
4062                 status = PTR_ERR(res.label);
4063                 goto out;
4064         }
4065         arg.bitmask = nfs4_bitmask(server, res.label);
4066
4067         status = nfs4_call_sync(server->client, server, &msg, &arg.seq_args, &res.seq_res, 1);
4068         if (!status) {
4069                 update_changeattr(dir, &res.cinfo);
4070                 status = nfs_post_op_update_inode(inode, res.fattr);
4071                 if (!status)
4072                         nfs_setsecurity(inode, res.fattr, res.label);
4073         }
4074
4075
4076         nfs4_label_free(res.label);
4077
4078 out:
4079         nfs_free_fattr(res.fattr);
4080         return status;
4081 }
4082
4083 static int nfs4_proc_link(struct inode *inode, struct inode *dir, const struct qstr *name)
4084 {
4085         struct nfs4_exception exception = { };
4086         int err;
4087         do {
4088                 err = nfs4_handle_exception(NFS_SERVER(inode),
4089                                 _nfs4_proc_link(inode, dir, name),
4090                                 &exception);
4091         } while (exception.retry);
4092         return err;
4093 }
4094
4095 struct nfs4_createdata {
4096         struct rpc_message msg;
4097         struct nfs4_create_arg arg;
4098         struct nfs4_create_res res;
4099         struct nfs_fh fh;
4100         struct nfs_fattr fattr;
4101         struct nfs4_label *label;
4102 };
4103
4104 static struct nfs4_createdata *nfs4_alloc_createdata(struct inode *dir,
4105                 const struct qstr *name, struct iattr *sattr, u32 ftype)
4106 {
4107         struct nfs4_createdata *data;
4108
4109         data = kzalloc(sizeof(*data), GFP_KERNEL);
4110         if (data != NULL) {
4111                 struct nfs_server *server = NFS_SERVER(dir);
4112
4113                 data->label = nfs4_label_alloc(server, GFP_KERNEL);
4114                 if (IS_ERR(data->label))
4115                         goto out_free;
4116
4117                 data->msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_CREATE];
4118                 data->msg.rpc_argp = &data->arg;
4119                 data->msg.rpc_resp = &data->res;
4120                 data->arg.dir_fh = NFS_FH(dir);
4121                 data->arg.server = server;
4122                 data->arg.name = name;
4123                 data->arg.attrs = sattr;
4124                 data->arg.ftype = ftype;
4125                 data->arg.bitmask = nfs4_bitmask(server, data->label);
4126                 data->res.server = server;
4127                 data->res.fh = &data->fh;
4128                 data->res.fattr = &data->fattr;
4129                 data->res.label = data->label;
4130                 nfs_fattr_init(data->res.fattr);
4131         }
4132         return data;
4133 out_free:
4134         kfree(data);
4135         return NULL;
4136 }
4137
4138 static int nfs4_do_create(struct inode *dir, struct dentry *dentry, struct nfs4_createdata *data)
4139 {
4140         int status = nfs4_call_sync(NFS_SERVER(dir)->client, NFS_SERVER(dir), &data->msg,
4141                                     &data->arg.seq_args, &data->res.seq_res, 1);
4142         if (status == 0) {
4143                 update_changeattr(dir, &data->res.dir_cinfo);
4144                 status = nfs_instantiate(dentry, data->res.fh, data->res.fattr, data->res.label);
4145         }
4146         return status;
4147 }
4148
4149 static void nfs4_free_createdata(struct nfs4_createdata *data)
4150 {
4151         nfs4_label_free(data->label);
4152         kfree(data);
4153 }
4154
4155 static int _nfs4_proc_symlink(struct inode *dir, struct dentry *dentry,
4156                 struct page *page, unsigned int len, struct iattr *sattr,
4157                 struct nfs4_label *label)
4158 {
4159         struct nfs4_createdata *data;
4160         int status = -ENAMETOOLONG;
4161
4162         if (len > NFS4_MAXPATHLEN)
4163                 goto out;
4164
4165         status = -ENOMEM;
4166         data = nfs4_alloc_createdata(dir, &dentry->d_name, sattr, NF4LNK);
4167         if (data == NULL)
4168                 goto out;
4169
4170         data->msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SYMLINK];
4171         data->arg.u.symlink.pages = &page;
4172         data->arg.u.symlink.len = len;
4173         data->arg.label = label;
4174         
4175         status = nfs4_do_create(dir, dentry, data);
4176
4177         nfs4_free_createdata(data);
4178 out:
4179         return status;
4180 }
4181
4182 static int nfs4_proc_symlink(struct inode *dir, struct dentry *dentry,
4183                 struct page *page, unsigned int len, struct iattr *sattr)
4184 {
4185         struct nfs4_exception exception = { };
4186         struct nfs4_label l, *label = NULL;
4187         int err;
4188
4189         label = nfs4_label_init_security(dir, dentry, sattr, &l);
4190
4191         do {
4192                 err = _nfs4_proc_symlink(dir, dentry, page, len, sattr, label);
4193                 trace_nfs4_symlink(dir, &dentry->d_name, err);
4194                 err = nfs4_handle_exception(NFS_SERVER(dir), err,
4195                                 &exception);
4196         } while (exception.retry);
4197
4198         nfs4_label_release_security(label);
4199         return err;
4200 }
4201
4202 static int _nfs4_proc_mkdir(struct inode *dir, struct dentry *dentry,
4203                 struct iattr *sattr, struct nfs4_label *label)
4204 {
4205         struct nfs4_createdata *data;
4206         int status = -ENOMEM;
4207
4208         data = nfs4_alloc_createdata(dir, &dentry->d_name, sattr, NF4DIR);
4209         if (data == NULL)
4210                 goto out;
4211
4212         data->arg.label = label;
4213         status = nfs4_do_create(dir, dentry, data);
4214
4215         nfs4_free_createdata(data);
4216 out:
4217         return status;
4218 }
4219
4220 static int nfs4_proc_mkdir(struct inode *dir, struct dentry *dentry,
4221                 struct iattr *sattr)
4222 {
4223         struct nfs4_exception exception = { };
4224         struct nfs4_label l, *label = NULL;
4225         int err;
4226
4227         label = nfs4_label_init_security(dir, dentry, sattr, &l);
4228
4229         sattr->ia_mode &= ~current_umask();
4230         do {
4231                 err = _nfs4_proc_mkdir(dir, dentry, sattr, label);
4232                 trace_nfs4_mkdir(dir, &dentry->d_name, err);
4233                 err = nfs4_handle_exception(NFS_SERVER(dir), err,
4234                                 &exception);
4235         } while (exception.retry);
4236         nfs4_label_release_security(label);
4237
4238         return err;
4239 }
4240
4241 static int _nfs4_proc_readdir(struct dentry *dentry, struct rpc_cred *cred,
4242                 u64 cookie, struct page **pages, unsigned int count, int plus)
4243 {
4244         struct inode            *dir = d_inode(dentry);
4245         struct nfs4_readdir_arg args = {
4246                 .fh = NFS_FH(dir),
4247                 .pages = pages,
4248                 .pgbase = 0,
4249                 .count = count,
4250                 .bitmask = NFS_SERVER(d_inode(dentry))->attr_bitmask,
4251                 .plus = plus,
4252         };
4253         struct nfs4_readdir_res res;
4254         struct rpc_message msg = {
4255                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_READDIR],
4256                 .rpc_argp = &args,
4257                 .rpc_resp = &res,
4258                 .rpc_cred = cred,
4259         };
4260         int                     status;
4261
4262         dprintk("%s: dentry = %pd2, cookie = %Lu\n", __func__,
4263                         dentry,
4264                         (unsigned long long)cookie);
4265         nfs4_setup_readdir(cookie, NFS_I(dir)->cookieverf, dentry, &args);
4266         res.pgbase = args.pgbase;
4267         status = nfs4_call_sync(NFS_SERVER(dir)->client, NFS_SERVER(dir), &msg, &args.seq_args, &res.seq_res, 0);
4268         if (status >= 0) {
4269                 memcpy(NFS_I(dir)->cookieverf, res.verifier.data, NFS4_VERIFIER_SIZE);
4270                 status += args.pgbase;
4271         }
4272
4273         nfs_invalidate_atime(dir);
4274
4275         dprintk("%s: returns %d\n", __func__, status);
4276         return status;
4277 }
4278
4279 static int nfs4_proc_readdir(struct dentry *dentry, struct rpc_cred *cred,
4280                 u64 cookie, struct page **pages, unsigned int count, int plus)
4281 {
4282         struct nfs4_exception exception = { };
4283         int err;
4284         do {
4285                 err = _nfs4_proc_readdir(dentry, cred, cookie,
4286                                 pages, count, plus);
4287                 trace_nfs4_readdir(d_inode(dentry), err);
4288                 err = nfs4_handle_exception(NFS_SERVER(d_inode(dentry)), err,
4289                                 &exception);
4290         } while (exception.retry);
4291         return err;
4292 }
4293
4294 static int _nfs4_proc_mknod(struct inode *dir, struct dentry *dentry,
4295                 struct iattr *sattr, struct nfs4_label *label, dev_t rdev)
4296 {
4297         struct nfs4_createdata *data;
4298         int mode = sattr->ia_mode;
4299         int status = -ENOMEM;
4300
4301         data = nfs4_alloc_createdata(dir, &dentry->d_name, sattr, NF4SOCK);
4302         if (data == NULL)
4303                 goto out;
4304
4305         if (S_ISFIFO(mode))
4306                 data->arg.ftype = NF4FIFO;
4307         else if (S_ISBLK(mode)) {
4308                 data->arg.ftype = NF4BLK;
4309                 data->arg.u.device.specdata1 = MAJOR(rdev);
4310                 data->arg.u.device.specdata2 = MINOR(rdev);
4311         }
4312         else if (S_ISCHR(mode)) {
4313                 data->arg.ftype = NF4CHR;
4314                 data->arg.u.device.specdata1 = MAJOR(rdev);
4315                 data->arg.u.device.specdata2 = MINOR(rdev);
4316         } else if (!S_ISSOCK(mode)) {
4317                 status = -EINVAL;
4318                 goto out_free;
4319         }
4320
4321         data->arg.label = label;
4322         status = nfs4_do_create(dir, dentry, data);
4323 out_free:
4324         nfs4_free_createdata(data);
4325 out:
4326         return status;
4327 }
4328
4329 static int nfs4_proc_mknod(struct inode *dir, struct dentry *dentry,
4330                 struct iattr *sattr, dev_t rdev)
4331 {
4332         struct nfs4_exception exception = { };
4333         struct nfs4_label l, *label = NULL;
4334         int err;
4335
4336         label = nfs4_label_init_security(dir, dentry, sattr, &l);
4337
4338         sattr->ia_mode &= ~current_umask();
4339         do {
4340                 err = _nfs4_proc_mknod(dir, dentry, sattr, label, rdev);
4341                 trace_nfs4_mknod(dir, &dentry->d_name, err);
4342                 err = nfs4_handle_exception(NFS_SERVER(dir), err,
4343                                 &exception);
4344         } while (exception.retry);
4345
4346         nfs4_label_release_security(label);
4347
4348         return err;
4349 }
4350
4351 static int _nfs4_proc_statfs(struct nfs_server *server, struct nfs_fh *fhandle,
4352                  struct nfs_fsstat *fsstat)
4353 {
4354         struct nfs4_statfs_arg args = {
4355                 .fh = fhandle,
4356                 .bitmask = server->attr_bitmask,
4357         };
4358         struct nfs4_statfs_res res = {
4359                 .fsstat = fsstat,
4360         };
4361         struct rpc_message msg = {
4362                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_STATFS],
4363                 .rpc_argp = &args,
4364                 .rpc_resp = &res,
4365         };
4366
4367         nfs_fattr_init(fsstat->fattr);
4368         return  nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
4369 }
4370
4371 static int nfs4_proc_statfs(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fsstat *fsstat)
4372 {
4373         struct nfs4_exception exception = { };
4374         int err;
4375         do {
4376                 err = nfs4_handle_exception(server,
4377                                 _nfs4_proc_statfs(server, fhandle, fsstat),
4378                                 &exception);
4379         } while (exception.retry);
4380         return err;
4381 }
4382
4383 static int _nfs4_do_fsinfo(struct nfs_server *server, struct nfs_fh *fhandle,
4384                 struct nfs_fsinfo *fsinfo)
4385 {
4386         struct nfs4_fsinfo_arg args = {
4387                 .fh = fhandle,
4388                 .bitmask = server->attr_bitmask,
4389         };
4390         struct nfs4_fsinfo_res res = {
4391                 .fsinfo = fsinfo,
4392         };
4393         struct rpc_message msg = {
4394                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_FSINFO],
4395                 .rpc_argp = &args,
4396                 .rpc_resp = &res,
4397         };
4398
4399         return nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
4400 }
4401
4402 static int nfs4_do_fsinfo(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fsinfo *fsinfo)
4403 {
4404         struct nfs4_exception exception = { };
4405         unsigned long now = jiffies;
4406         int err;
4407
4408         do {
4409                 err = _nfs4_do_fsinfo(server, fhandle, fsinfo);
4410                 trace_nfs4_fsinfo(server, fhandle, fsinfo->fattr, err);
4411                 if (err == 0) {
4412                         nfs4_set_lease_period(server->nfs_client,
4413                                         fsinfo->lease_time * HZ,
4414                                         now);
4415                         break;
4416                 }
4417                 err = nfs4_handle_exception(server, err, &exception);
4418         } while (exception.retry);
4419         return err;
4420 }
4421
4422 static int nfs4_proc_fsinfo(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fsinfo *fsinfo)
4423 {
4424         int error;
4425
4426         nfs_fattr_init(fsinfo->fattr);
4427         error = nfs4_do_fsinfo(server, fhandle, fsinfo);
4428         if (error == 0) {
4429                 /* block layout checks this! */
4430                 server->pnfs_blksize = fsinfo->blksize;
4431                 set_pnfs_layoutdriver(server, fhandle, fsinfo);
4432         }
4433
4434         return error;
4435 }
4436
4437 static int _nfs4_proc_pathconf(struct nfs_server *server, struct nfs_fh *fhandle,
4438                 struct nfs_pathconf *pathconf)
4439 {
4440         struct nfs4_pathconf_arg args = {
4441                 .fh = fhandle,
4442                 .bitmask = server->attr_bitmask,
4443         };
4444         struct nfs4_pathconf_res res = {
4445                 .pathconf = pathconf,
4446         };
4447         struct rpc_message msg = {
4448                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_PATHCONF],
4449                 .rpc_argp = &args,
4450                 .rpc_resp = &res,
4451         };
4452
4453         /* None of the pathconf attributes are mandatory to implement */
4454         if ((args.bitmask[0] & nfs4_pathconf_bitmap[0]) == 0) {
4455                 memset(pathconf, 0, sizeof(*pathconf));
4456                 return 0;
4457         }
4458
4459         nfs_fattr_init(pathconf->fattr);
4460         return nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
4461 }
4462
4463 static int nfs4_proc_pathconf(struct nfs_server *server, struct nfs_fh *fhandle,
4464                 struct nfs_pathconf *pathconf)
4465 {
4466         struct nfs4_exception exception = { };
4467         int err;
4468
4469         do {
4470                 err = nfs4_handle_exception(server,
4471                                 _nfs4_proc_pathconf(server, fhandle, pathconf),
4472                                 &exception);
4473         } while (exception.retry);
4474         return err;
4475 }
4476
4477 int nfs4_set_rw_stateid(nfs4_stateid *stateid,
4478                 const struct nfs_open_context *ctx,
4479                 const struct nfs_lock_context *l_ctx,
4480                 fmode_t fmode)
4481 {
4482         const struct nfs_lockowner *lockowner = NULL;
4483
4484         if (l_ctx != NULL)
4485                 lockowner = &l_ctx->lockowner;
4486         return nfs4_select_rw_stateid(ctx->state, fmode, lockowner, stateid, NULL);
4487 }
4488 EXPORT_SYMBOL_GPL(nfs4_set_rw_stateid);
4489
4490 static bool nfs4_stateid_is_current(nfs4_stateid *stateid,
4491                 const struct nfs_open_context *ctx,
4492                 const struct nfs_lock_context *l_ctx,
4493                 fmode_t fmode)
4494 {
4495         nfs4_stateid current_stateid;
4496
4497         /* If the current stateid represents a lost lock, then exit */
4498         if (nfs4_set_rw_stateid(&current_stateid, ctx, l_ctx, fmode) == -EIO)
4499                 return true;
4500         return nfs4_stateid_match(stateid, &current_stateid);
4501 }
4502
4503 static bool nfs4_error_stateid_expired(int err)
4504 {
4505         switch (err) {
4506         case -NFS4ERR_DELEG_REVOKED:
4507         case -NFS4ERR_ADMIN_REVOKED:
4508         case -NFS4ERR_BAD_STATEID:
4509         case -NFS4ERR_STALE_STATEID:
4510         case -NFS4ERR_OLD_STATEID:
4511         case -NFS4ERR_OPENMODE:
4512         case -NFS4ERR_EXPIRED:
4513                 return true;
4514         }
4515         return false;
4516 }
4517
4518 void __nfs4_read_done_cb(struct nfs_pgio_header *hdr)
4519 {
4520         nfs_invalidate_atime(hdr->inode);
4521 }
4522
4523 static int nfs4_read_done_cb(struct rpc_task *task, struct nfs_pgio_header *hdr)
4524 {
4525         struct nfs_server *server = NFS_SERVER(hdr->inode);
4526
4527         trace_nfs4_read(hdr, task->tk_status);
4528         if (nfs4_async_handle_error(task, server,
4529                                     hdr->args.context->state,
4530                                     NULL) == -EAGAIN) {
4531                 rpc_restart_call_prepare(task);
4532                 return -EAGAIN;
4533         }
4534
4535         __nfs4_read_done_cb(hdr);
4536         if (task->tk_status > 0)
4537                 renew_lease(server, hdr->timestamp);
4538         return 0;
4539 }
4540
4541 static bool nfs4_read_stateid_changed(struct rpc_task *task,
4542                 struct nfs_pgio_args *args)
4543 {
4544
4545         if (!nfs4_error_stateid_expired(task->tk_status) ||
4546                 nfs4_stateid_is_current(&args->stateid,
4547                                 args->context,
4548                                 args->lock_context,
4549                                 FMODE_READ))
4550                 return false;
4551         rpc_restart_call_prepare(task);
4552         return true;
4553 }
4554
4555 static int nfs4_read_done(struct rpc_task *task, struct nfs_pgio_header *hdr)
4556 {
4557
4558         dprintk("--> %s\n", __func__);
4559
4560         if (!nfs4_sequence_done(task, &hdr->res.seq_res))
4561                 return -EAGAIN;
4562         if (nfs4_read_stateid_changed(task, &hdr->args))
4563                 return -EAGAIN;
4564         return hdr->pgio_done_cb ? hdr->pgio_done_cb(task, hdr) :
4565                                     nfs4_read_done_cb(task, hdr);
4566 }
4567
4568 static void nfs4_proc_read_setup(struct nfs_pgio_header *hdr,
4569                                  struct rpc_message *msg)
4570 {
4571         hdr->timestamp   = jiffies;
4572         if (!hdr->pgio_done_cb)
4573                 hdr->pgio_done_cb = nfs4_read_done_cb;
4574         msg->rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_READ];
4575         nfs4_init_sequence(&hdr->args.seq_args, &hdr->res.seq_res, 0);
4576 }
4577
4578 static int nfs4_proc_pgio_rpc_prepare(struct rpc_task *task,
4579                                       struct nfs_pgio_header *hdr)
4580 {
4581         if (nfs4_setup_sequence(NFS_SERVER(hdr->inode),
4582                         &hdr->args.seq_args,
4583                         &hdr->res.seq_res,
4584                         task))
4585                 return 0;
4586         if (nfs4_set_rw_stateid(&hdr->args.stateid, hdr->args.context,
4587                                 hdr->args.lock_context,
4588                                 hdr->rw_ops->rw_mode) == -EIO)
4589                 return -EIO;
4590         if (unlikely(test_bit(NFS_CONTEXT_BAD, &hdr->args.context->flags)))
4591                 return -EIO;
4592         return 0;
4593 }
4594
4595 static int nfs4_write_done_cb(struct rpc_task *task,
4596                               struct nfs_pgio_header *hdr)
4597 {
4598         struct inode *inode = hdr->inode;
4599
4600         trace_nfs4_write(hdr, task->tk_status);
4601         if (nfs4_async_handle_error(task, NFS_SERVER(inode),
4602                                     hdr->args.context->state,
4603                                     NULL) == -EAGAIN) {
4604                 rpc_restart_call_prepare(task);
4605                 return -EAGAIN;
4606         }
4607         if (task->tk_status >= 0) {
4608                 renew_lease(NFS_SERVER(inode), hdr->timestamp);
4609                 nfs_writeback_update_inode(hdr);
4610         }
4611         return 0;
4612 }
4613
4614 static bool nfs4_write_stateid_changed(struct rpc_task *task,
4615                 struct nfs_pgio_args *args)
4616 {
4617
4618         if (!nfs4_error_stateid_expired(task->tk_status) ||
4619                 nfs4_stateid_is_current(&args->stateid,
4620                                 args->context,
4621                                 args->lock_context,
4622                                 FMODE_WRITE))
4623                 return false;
4624         rpc_restart_call_prepare(task);
4625         return true;
4626 }
4627
4628 static int nfs4_write_done(struct rpc_task *task, struct nfs_pgio_header *hdr)
4629 {
4630         if (!nfs4_sequence_done(task, &hdr->res.seq_res))
4631                 return -EAGAIN;
4632         if (nfs4_write_stateid_changed(task, &hdr->args))
4633                 return -EAGAIN;
4634         return hdr->pgio_done_cb ? hdr->pgio_done_cb(task, hdr) :
4635                 nfs4_write_done_cb(task, hdr);
4636 }
4637
4638 static
4639 bool nfs4_write_need_cache_consistency_data(struct nfs_pgio_header *hdr)
4640 {
4641         /* Don't request attributes for pNFS or O_DIRECT writes */
4642         if (hdr->ds_clp != NULL || hdr->dreq != NULL)
4643                 return false;
4644         /* Otherwise, request attributes if and only if we don't hold
4645          * a delegation
4646          */
4647         return nfs4_have_delegation(hdr->inode, FMODE_READ) == 0;
4648 }
4649
4650 static void nfs4_proc_write_setup(struct nfs_pgio_header *hdr,
4651                                   struct rpc_message *msg)
4652 {
4653         struct nfs_server *server = NFS_SERVER(hdr->inode);
4654
4655         if (!nfs4_write_need_cache_consistency_data(hdr)) {
4656                 hdr->args.bitmask = NULL;
4657                 hdr->res.fattr = NULL;
4658         } else
4659                 hdr->args.bitmask = server->cache_consistency_bitmask;
4660
4661         if (!hdr->pgio_done_cb)
4662                 hdr->pgio_done_cb = nfs4_write_done_cb;
4663         hdr->res.server = server;
4664         hdr->timestamp   = jiffies;
4665
4666         msg->rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_WRITE];
4667         nfs4_init_sequence(&hdr->args.seq_args, &hdr->res.seq_res, 1);
4668 }
4669
4670 static void nfs4_proc_commit_rpc_prepare(struct rpc_task *task, struct nfs_commit_data *data)
4671 {
4672         nfs4_setup_sequence(NFS_SERVER(data->inode),
4673                         &data->args.seq_args,
4674                         &data->res.seq_res,
4675                         task);
4676 }
4677
4678 static int nfs4_commit_done_cb(struct rpc_task *task, struct nfs_commit_data *data)
4679 {
4680         struct inode *inode = data->inode;
4681
4682         trace_nfs4_commit(data, task->tk_status);
4683         if (nfs4_async_handle_error(task, NFS_SERVER(inode),
4684                                     NULL, NULL) == -EAGAIN) {
4685                 rpc_restart_call_prepare(task);
4686                 return -EAGAIN;
4687         }
4688         return 0;
4689 }
4690
4691 static int nfs4_commit_done(struct rpc_task *task, struct nfs_commit_data *data)
4692 {
4693         if (!nfs4_sequence_done(task, &data->res.seq_res))
4694                 return -EAGAIN;
4695         return data->commit_done_cb(task, data);
4696 }
4697
4698 static void nfs4_proc_commit_setup(struct nfs_commit_data *data, struct rpc_message *msg)
4699 {
4700         struct nfs_server *server = NFS_SERVER(data->inode);
4701
4702         if (data->commit_done_cb == NULL)
4703                 data->commit_done_cb = nfs4_commit_done_cb;
4704         data->res.server = server;
4705         msg->rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_COMMIT];
4706         nfs4_init_sequence(&data->args.seq_args, &data->res.seq_res, 1);
4707 }
4708
4709 struct nfs4_renewdata {
4710         struct nfs_client       *client;
4711         unsigned long           timestamp;
4712 };
4713
4714 /*
4715  * nfs4_proc_async_renew(): This is not one of the nfs_rpc_ops; it is a special
4716  * standalone procedure for queueing an asynchronous RENEW.
4717  */
4718 static void nfs4_renew_release(void *calldata)
4719 {
4720         struct nfs4_renewdata *data = calldata;
4721         struct nfs_client *clp = data->client;
4722
4723         if (atomic_read(&clp->cl_count) > 1)
4724                 nfs4_schedule_state_renewal(clp);
4725         nfs_put_client(clp);
4726         kfree(data);
4727 }
4728
4729 static void nfs4_renew_done(struct rpc_task *task, void *calldata)
4730 {
4731         struct nfs4_renewdata *data = calldata;
4732         struct nfs_client *clp = data->client;
4733         unsigned long timestamp = data->timestamp;
4734
4735         trace_nfs4_renew_async(clp, task->tk_status);
4736         switch (task->tk_status) {
4737         case 0:
4738                 break;
4739         case -NFS4ERR_LEASE_MOVED:
4740                 nfs4_schedule_lease_moved_recovery(clp);
4741                 break;
4742         default:
4743                 /* Unless we're shutting down, schedule state recovery! */
4744                 if (test_bit(NFS_CS_RENEWD, &clp->cl_res_state) == 0)
4745                         return;
4746                 if (task->tk_status != NFS4ERR_CB_PATH_DOWN) {
4747                         nfs4_schedule_lease_recovery(clp);
4748                         return;
4749                 }
4750                 nfs4_schedule_path_down_recovery(clp);
4751         }
4752         do_renew_lease(clp, timestamp);
4753 }
4754
4755 static const struct rpc_call_ops nfs4_renew_ops = {
4756         .rpc_call_done = nfs4_renew_done,
4757         .rpc_release = nfs4_renew_release,
4758 };
4759
4760 static int nfs4_proc_async_renew(struct nfs_client *clp, struct rpc_cred *cred, unsigned renew_flags)
4761 {
4762         struct rpc_message msg = {
4763                 .rpc_proc       = &nfs4_procedures[NFSPROC4_CLNT_RENEW],
4764                 .rpc_argp       = clp,
4765                 .rpc_cred       = cred,
4766         };
4767         struct nfs4_renewdata *data;
4768
4769         if (renew_flags == 0)
4770                 return 0;
4771         if (!atomic_inc_not_zero(&clp->cl_count))
4772                 return -EIO;
4773         data = kmalloc(sizeof(*data), GFP_NOFS);
4774         if (data == NULL)
4775                 return -ENOMEM;
4776         data->client = clp;
4777         data->timestamp = jiffies;
4778         return rpc_call_async(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT,
4779                         &nfs4_renew_ops, data);
4780 }
4781
4782 static int nfs4_proc_renew(struct nfs_client *clp, struct rpc_cred *cred)
4783 {
4784         struct rpc_message msg = {
4785                 .rpc_proc       = &nfs4_procedures[NFSPROC4_CLNT_RENEW],
4786                 .rpc_argp       = clp,
4787                 .rpc_cred       = cred,
4788         };
4789         unsigned long now = jiffies;
4790         int status;
4791
4792         status = rpc_call_sync(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
4793         if (status < 0)
4794                 return status;
4795         do_renew_lease(clp, now);
4796         return 0;
4797 }
4798
4799 static inline int nfs4_server_supports_acls(struct nfs_server *server)
4800 {
4801         return server->caps & NFS_CAP_ACLS;
4802 }
4803
4804 /* Assuming that XATTR_SIZE_MAX is a multiple of PAGE_SIZE, and that
4805  * it's OK to put sizeof(void) * (XATTR_SIZE_MAX/PAGE_SIZE) bytes on
4806  * the stack.
4807  */
4808 #define NFS4ACL_MAXPAGES DIV_ROUND_UP(XATTR_SIZE_MAX, PAGE_SIZE)
4809
4810 static int buf_to_pages_noslab(const void *buf, size_t buflen,
4811                 struct page **pages)
4812 {
4813         struct page *newpage, **spages;
4814         int rc = 0;
4815         size_t len;
4816         spages = pages;
4817
4818         do {
4819                 len = min_t(size_t, PAGE_SIZE, buflen);
4820                 newpage = alloc_page(GFP_KERNEL);
4821
4822                 if (newpage == NULL)
4823                         goto unwind;
4824                 memcpy(page_address(newpage), buf, len);
4825                 buf += len;
4826                 buflen -= len;
4827                 *pages++ = newpage;
4828                 rc++;
4829         } while (buflen != 0);
4830
4831         return rc;
4832
4833 unwind:
4834         for(; rc > 0; rc--)
4835                 __free_page(spages[rc-1]);
4836         return -ENOMEM;
4837 }
4838
4839 struct nfs4_cached_acl {
4840         int cached;
4841         size_t len;
4842         char data[0];
4843 };
4844
4845 static void nfs4_set_cached_acl(struct inode *inode, struct nfs4_cached_acl *acl)
4846 {
4847         struct nfs_inode *nfsi = NFS_I(inode);
4848
4849         spin_lock(&inode->i_lock);
4850         kfree(nfsi->nfs4_acl);
4851         nfsi->nfs4_acl = acl;
4852         spin_unlock(&inode->i_lock);
4853 }
4854
4855 static void nfs4_zap_acl_attr(struct inode *inode)
4856 {
4857         nfs4_set_cached_acl(inode, NULL);
4858 }
4859
4860 static inline ssize_t nfs4_read_cached_acl(struct inode *inode, char *buf, size_t buflen)
4861 {
4862         struct nfs_inode *nfsi = NFS_I(inode);
4863         struct nfs4_cached_acl *acl;
4864         int ret = -ENOENT;
4865
4866         spin_lock(&inode->i_lock);
4867         acl = nfsi->nfs4_acl;
4868         if (acl == NULL)
4869                 goto out;
4870         if (buf == NULL) /* user is just asking for length */
4871                 goto out_len;
4872         if (acl->cached == 0)
4873                 goto out;
4874         ret = -ERANGE; /* see getxattr(2) man page */
4875         if (acl->len > buflen)
4876                 goto out;
4877         memcpy(buf, acl->data, acl->len);
4878 out_len:
4879         ret = acl->len;
4880 out:
4881         spin_unlock(&inode->i_lock);
4882         return ret;
4883 }
4884
4885 static void nfs4_write_cached_acl(struct inode *inode, struct page **pages, size_t pgbase, size_t acl_len)
4886 {
4887         struct nfs4_cached_acl *acl;
4888         size_t buflen = sizeof(*acl) + acl_len;
4889
4890         if (buflen <= PAGE_SIZE) {
4891                 acl = kmalloc(buflen, GFP_KERNEL);
4892                 if (acl == NULL)
4893                         goto out;
4894                 acl->cached = 1;
4895                 _copy_from_pages(acl->data, pages, pgbase, acl_len);
4896         } else {
4897                 acl = kmalloc(sizeof(*acl), GFP_KERNEL);
4898                 if (acl == NULL)
4899                         goto out;
4900                 acl->cached = 0;
4901         }
4902         acl->len = acl_len;
4903 out:
4904         nfs4_set_cached_acl(inode, acl);
4905 }
4906
4907 /*
4908  * The getxattr API returns the required buffer length when called with a
4909  * NULL buf. The NFSv4 acl tool then calls getxattr again after allocating
4910  * the required buf.  On a NULL buf, we send a page of data to the server
4911  * guessing that the ACL request can be serviced by a page. If so, we cache
4912  * up to the page of ACL data, and the 2nd call to getxattr is serviced by
4913  * the cache. If not so, we throw away the page, and cache the required
4914  * length. The next getxattr call will then produce another round trip to
4915  * the server, this time with the input buf of the required size.
4916  */
4917 static ssize_t __nfs4_get_acl_uncached(struct inode *inode, void *buf, size_t buflen)
4918 {
4919         struct page *pages[NFS4ACL_MAXPAGES] = {NULL, };
4920         struct nfs_getaclargs args = {
4921                 .fh = NFS_FH(inode),
4922                 .acl_pages = pages,
4923                 .acl_len = buflen,
4924         };
4925         struct nfs_getaclres res = {
4926                 .acl_len = buflen,
4927         };
4928         struct rpc_message msg = {
4929                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_GETACL],
4930                 .rpc_argp = &args,
4931                 .rpc_resp = &res,
4932         };
4933         unsigned int npages = DIV_ROUND_UP(buflen, PAGE_SIZE);
4934         int ret = -ENOMEM, i;
4935
4936         /* As long as we're doing a round trip to the server anyway,
4937          * let's be prepared for a page of acl data. */
4938         if (npages == 0)
4939                 npages = 1;
4940         if (npages > ARRAY_SIZE(pages))
4941                 return -ERANGE;
4942
4943         for (i = 0; i < npages; i++) {
4944                 pages[i] = alloc_page(GFP_KERNEL);
4945                 if (!pages[i])
4946                         goto out_free;
4947         }
4948
4949         /* for decoding across pages */
4950         res.acl_scratch = alloc_page(GFP_KERNEL);
4951         if (!res.acl_scratch)
4952                 goto out_free;
4953
4954         args.acl_len = npages * PAGE_SIZE;
4955
4956         dprintk("%s  buf %p buflen %zu npages %d args.acl_len %zu\n",
4957                 __func__, buf, buflen, npages, args.acl_len);
4958         ret = nfs4_call_sync(NFS_SERVER(inode)->client, NFS_SERVER(inode),
4959                              &msg, &args.seq_args, &res.seq_res, 0);
4960         if (ret)
4961                 goto out_free;
4962
4963         /* Handle the case where the passed-in buffer is too short */
4964         if (res.acl_flags & NFS4_ACL_TRUNC) {
4965                 /* Did the user only issue a request for the acl length? */
4966                 if (buf == NULL)
4967                         goto out_ok;
4968                 ret = -ERANGE;
4969                 goto out_free;
4970         }
4971         nfs4_write_cached_acl(inode, pages, res.acl_data_offset, res.acl_len);
4972         if (buf) {
4973                 if (res.acl_len > buflen) {
4974                         ret = -ERANGE;
4975                         goto out_free;
4976                 }
4977                 _copy_from_pages(buf, pages, res.acl_data_offset, res.acl_len);
4978         }
4979 out_ok:
4980         ret = res.acl_len;
4981 out_free:
4982         for (i = 0; i < npages; i++)
4983                 if (pages[i])
4984                         __free_page(pages[i]);
4985         if (res.acl_scratch)
4986                 __free_page(res.acl_scratch);
4987         return ret;
4988 }
4989
4990 static ssize_t nfs4_get_acl_uncached(struct inode *inode, void *buf, size_t buflen)
4991 {
4992         struct nfs4_exception exception = { };
4993         ssize_t ret;
4994         do {
4995                 ret = __nfs4_get_acl_uncached(inode, buf, buflen);
4996                 trace_nfs4_get_acl(inode, ret);
4997                 if (ret >= 0)
4998                         break;
4999                 ret = nfs4_handle_exception(NFS_SERVER(inode), ret, &exception);
5000         } while (exception.retry);
5001         return ret;
5002 }
5003
5004 static ssize_t nfs4_proc_get_acl(struct inode *inode, void *buf, size_t buflen)
5005 {
5006         struct nfs_server *server = NFS_SERVER(inode);
5007         int ret;
5008
5009         if (!nfs4_server_supports_acls(server))
5010                 return -EOPNOTSUPP;
5011         ret = nfs_revalidate_inode(server, inode);
5012         if (ret < 0)
5013                 return ret;
5014         if (NFS_I(inode)->cache_validity & NFS_INO_INVALID_ACL)
5015                 nfs_zap_acl_cache(inode);
5016         ret = nfs4_read_cached_acl(inode, buf, buflen);
5017         if (ret != -ENOENT)
5018                 /* -ENOENT is returned if there is no ACL or if there is an ACL
5019                  * but no cached acl data, just the acl length */
5020                 return ret;
5021         return nfs4_get_acl_uncached(inode, buf, buflen);
5022 }
5023
5024 static int __nfs4_proc_set_acl(struct inode *inode, const void *buf, size_t buflen)
5025 {
5026         struct nfs_server *server = NFS_SERVER(inode);
5027         struct page *pages[NFS4ACL_MAXPAGES];
5028         struct nfs_setaclargs arg = {
5029                 .fh             = NFS_FH(inode),
5030                 .acl_pages      = pages,
5031                 .acl_len        = buflen,
5032         };
5033         struct nfs_setaclres res;
5034         struct rpc_message msg = {
5035                 .rpc_proc       = &nfs4_procedures[NFSPROC4_CLNT_SETACL],
5036                 .rpc_argp       = &arg,
5037                 .rpc_resp       = &res,
5038         };
5039         unsigned int npages = DIV_ROUND_UP(buflen, PAGE_SIZE);
5040         int ret, i;
5041
5042         if (!nfs4_server_supports_acls(server))
5043                 return -EOPNOTSUPP;
5044         if (npages > ARRAY_SIZE(pages))
5045                 return -ERANGE;
5046         i = buf_to_pages_noslab(buf, buflen, arg.acl_pages);
5047         if (i < 0)
5048                 return i;
5049         nfs4_inode_return_delegation(inode);
5050         ret = nfs4_call_sync(server->client, server, &msg, &arg.seq_args, &res.seq_res, 1);
5051
5052         /*
5053          * Free each page after tx, so the only ref left is
5054          * held by the network stack
5055          */
5056         for (; i > 0; i--)
5057                 put_page(pages[i-1]);
5058
5059         /*
5060          * Acl update can result in inode attribute update.
5061          * so mark the attribute cache invalid.
5062          */
5063         spin_lock(&inode->i_lock);
5064         NFS_I(inode)->cache_validity |= NFS_INO_INVALID_ATTR;
5065         spin_unlock(&inode->i_lock);
5066         nfs_access_zap_cache(inode);
5067         nfs_zap_acl_cache(inode);
5068         return ret;
5069 }
5070
5071 static int nfs4_proc_set_acl(struct inode *inode, const void *buf, size_t buflen)
5072 {
5073         struct nfs4_exception exception = { };
5074         int err;
5075         do {
5076                 err = __nfs4_proc_set_acl(inode, buf, buflen);
5077                 trace_nfs4_set_acl(inode, err);
5078                 err = nfs4_handle_exception(NFS_SERVER(inode), err,
5079                                 &exception);
5080         } while (exception.retry);
5081         return err;
5082 }
5083
5084 #ifdef CONFIG_NFS_V4_SECURITY_LABEL
5085 static int _nfs4_get_security_label(struct inode *inode, void *buf,
5086                                         size_t buflen)
5087 {
5088         struct nfs_server *server = NFS_SERVER(inode);
5089         struct nfs_fattr fattr;
5090         struct nfs4_label label = {0, 0, buflen, buf};
5091
5092         u32 bitmask[3] = { 0, 0, FATTR4_WORD2_SECURITY_LABEL };
5093         struct nfs4_getattr_arg arg = {
5094                 .fh             = NFS_FH(inode),
5095                 .bitmask        = bitmask,
5096         };
5097         struct nfs4_getattr_res res = {
5098                 .fattr          = &fattr,
5099                 .label          = &label,
5100                 .server         = server,
5101         };
5102         struct rpc_message msg = {
5103                 .rpc_proc       = &nfs4_procedures[NFSPROC4_CLNT_GETATTR],
5104                 .rpc_argp       = &arg,
5105                 .rpc_resp       = &res,
5106         };
5107         int ret;
5108
5109         nfs_fattr_init(&fattr);
5110
5111         ret = nfs4_call_sync(server->client, server, &msg, &arg.seq_args, &res.seq_res, 0);
5112         if (ret)
5113                 return ret;
5114         if (!(fattr.valid & NFS_ATTR_FATTR_V4_SECURITY_LABEL))
5115                 return -ENOENT;
5116         if (buflen < label.len)
5117                 return -ERANGE;
5118         return 0;
5119 }
5120
5121 static int nfs4_get_security_label(struct inode *inode, void *buf,
5122                                         size_t buflen)
5123 {
5124         struct nfs4_exception exception = { };
5125         int err;
5126
5127         if (!nfs_server_capable(inode, NFS_CAP_SECURITY_LABEL))
5128                 return -EOPNOTSUPP;
5129
5130         do {
5131                 err = _nfs4_get_security_label(inode, buf, buflen);
5132                 trace_nfs4_get_security_label(inode, err);
5133                 err = nfs4_handle_exception(NFS_SERVER(inode), err,
5134                                 &exception);
5135         } while (exception.retry);
5136         return err;
5137 }
5138
5139 static int _nfs4_do_set_security_label(struct inode *inode,
5140                 struct nfs4_label *ilabel,
5141                 struct nfs_fattr *fattr,
5142                 struct nfs4_label *olabel)
5143 {
5144
5145         struct iattr sattr = {0};
5146         struct nfs_server *server = NFS_SERVER(inode);
5147         const u32 bitmask[3] = { 0, 0, FATTR4_WORD2_SECURITY_LABEL };
5148         struct nfs_setattrargs arg = {
5149                 .fh             = NFS_FH(inode),
5150                 .iap            = &sattr,
5151                 .server         = server,
5152                 .bitmask        = bitmask,
5153                 .label          = ilabel,
5154         };
5155         struct nfs_setattrres res = {
5156                 .fattr          = fattr,
5157                 .label          = olabel,
5158                 .server         = server,
5159         };
5160         struct rpc_message msg = {
5161                 .rpc_proc       = &nfs4_procedures[NFSPROC4_CLNT_SETATTR],
5162                 .rpc_argp       = &arg,
5163                 .rpc_resp       = &res,
5164         };
5165         int status;
5166
5167         nfs4_stateid_copy(&arg.stateid, &zero_stateid);
5168
5169         status = nfs4_call_sync(server->client, server, &msg, &arg.seq_args, &res.seq_res, 1);
5170         if (status)
5171                 dprintk("%s failed: %d\n", __func__, status);
5172
5173         return status;
5174 }
5175
5176 static int nfs4_do_set_security_label(struct inode *inode,
5177                 struct nfs4_label *ilabel,
5178                 struct nfs_fattr *fattr,
5179                 struct nfs4_label *olabel)
5180 {
5181         struct nfs4_exception exception = { };
5182         int err;
5183
5184         do {
5185                 err = _nfs4_do_set_security_label(inode, ilabel,
5186                                 fattr, olabel);
5187                 trace_nfs4_set_security_label(inode, err);
5188                 err = nfs4_handle_exception(NFS_SERVER(inode), err,
5189                                 &exception);
5190         } while (exception.retry);
5191         return err;
5192 }
5193
5194 static int
5195 nfs4_set_security_label(struct inode *inode, const void *buf, size_t buflen)
5196 {
5197         struct nfs4_label ilabel, *olabel = NULL;
5198         struct nfs_fattr fattr;
5199         struct rpc_cred *cred;
5200         int status;
5201
5202         if (!nfs_server_capable(inode, NFS_CAP_SECURITY_LABEL))
5203                 return -EOPNOTSUPP;
5204
5205         nfs_fattr_init(&fattr);
5206
5207         ilabel.pi = 0;
5208         ilabel.lfs = 0;
5209         ilabel.label = (char *)buf;
5210         ilabel.len = buflen;
5211
5212         cred = rpc_lookup_cred();
5213         if (IS_ERR(cred))
5214                 return PTR_ERR(cred);
5215
5216         olabel = nfs4_label_alloc(NFS_SERVER(inode), GFP_KERNEL);
5217         if (IS_ERR(olabel)) {
5218                 status = -PTR_ERR(olabel);
5219                 goto out;
5220         }
5221
5222         status = nfs4_do_set_security_label(inode, &ilabel, &fattr, olabel);
5223         if (status == 0)
5224                 nfs_setsecurity(inode, &fattr, olabel);
5225
5226         nfs4_label_free(olabel);
5227 out:
5228         put_rpccred(cred);
5229         return status;
5230 }
5231 #endif  /* CONFIG_NFS_V4_SECURITY_LABEL */
5232
5233
5234 static void nfs4_init_boot_verifier(const struct nfs_client *clp,
5235                                     nfs4_verifier *bootverf)
5236 {
5237         __be32 verf[2];
5238
5239         if (test_bit(NFS4CLNT_PURGE_STATE, &clp->cl_state)) {
5240                 /* An impossible timestamp guarantees this value
5241                  * will never match a generated boot time. */
5242                 verf[0] = 0;
5243                 verf[1] = cpu_to_be32(NSEC_PER_SEC + 1);
5244         } else {
5245                 struct nfs_net *nn = net_generic(clp->cl_net, nfs_net_id);
5246                 verf[0] = cpu_to_be32(nn->boot_time.tv_sec);
5247                 verf[1] = cpu_to_be32(nn->boot_time.tv_nsec);
5248         }
5249         memcpy(bootverf->data, verf, sizeof(bootverf->data));
5250 }
5251
5252 static int
5253 nfs4_init_nonuniform_client_string(struct nfs_client *clp)
5254 {
5255         size_t len;
5256         char *str;
5257
5258         if (clp->cl_owner_id != NULL)
5259                 return 0;
5260
5261         rcu_read_lock();
5262         len = 14 + strlen(clp->cl_ipaddr) + 1 +
5263                 strlen(rpc_peeraddr2str(clp->cl_rpcclient, RPC_DISPLAY_ADDR)) +
5264                 1 +
5265                 strlen(rpc_peeraddr2str(clp->cl_rpcclient, RPC_DISPLAY_PROTO)) +
5266                 1;
5267         rcu_read_unlock();
5268
5269         if (len > NFS4_OPAQUE_LIMIT + 1)
5270                 return -EINVAL;
5271
5272         /*
5273          * Since this string is allocated at mount time, and held until the
5274          * nfs_client is destroyed, we can use GFP_KERNEL here w/o worrying
5275          * about a memory-reclaim deadlock.
5276          */
5277         str = kmalloc(len, GFP_KERNEL);
5278         if (!str)
5279                 return -ENOMEM;
5280
5281         rcu_read_lock();
5282         scnprintf(str, len, "Linux NFSv4.0 %s/%s %s",
5283                         clp->cl_ipaddr,
5284                         rpc_peeraddr2str(clp->cl_rpcclient, RPC_DISPLAY_ADDR),
5285                         rpc_peeraddr2str(clp->cl_rpcclient, RPC_DISPLAY_PROTO));
5286         rcu_read_unlock();
5287
5288         clp->cl_owner_id = str;
5289         return 0;
5290 }
5291
5292 static int
5293 nfs4_init_uniquifier_client_string(struct nfs_client *clp)
5294 {
5295         size_t len;
5296         char *str;
5297
5298         len = 10 + 10 + 1 + 10 + 1 +
5299                 strlen(nfs4_client_id_uniquifier) + 1 +
5300                 strlen(clp->cl_rpcclient->cl_nodename) + 1;
5301
5302         if (len > NFS4_OPAQUE_LIMIT + 1)
5303                 return -EINVAL;
5304
5305         /*
5306          * Since this string is allocated at mount time, and held until the
5307          * nfs_client is destroyed, we can use GFP_KERNEL here w/o worrying
5308          * about a memory-reclaim deadlock.
5309          */
5310         str = kmalloc(len, GFP_KERNEL);
5311         if (!str)
5312                 return -ENOMEM;
5313
5314         scnprintf(str, len, "Linux NFSv%u.%u %s/%s",
5315                         clp->rpc_ops->version, clp->cl_minorversion,
5316                         nfs4_client_id_uniquifier,
5317                         clp->cl_rpcclient->cl_nodename);
5318         clp->cl_owner_id = str;
5319         return 0;
5320 }
5321
5322 static int
5323 nfs4_init_uniform_client_string(struct nfs_client *clp)
5324 {
5325         size_t len;
5326         char *str;
5327
5328         if (clp->cl_owner_id != NULL)
5329                 return 0;
5330
5331         if (nfs4_client_id_uniquifier[0] != '\0')
5332                 return nfs4_init_uniquifier_client_string(clp);
5333
5334         len = 10 + 10 + 1 + 10 + 1 +
5335                 strlen(clp->cl_rpcclient->cl_nodename) + 1;
5336
5337         if (len > NFS4_OPAQUE_LIMIT + 1)
5338                 return -EINVAL;
5339
5340         /*
5341          * Since this string is allocated at mount time, and held until the
5342          * nfs_client is destroyed, we can use GFP_KERNEL here w/o worrying
5343          * about a memory-reclaim deadlock.
5344          */
5345         str = kmalloc(len, GFP_KERNEL);
5346         if (!str)
5347                 return -ENOMEM;
5348
5349         scnprintf(str, len, "Linux NFSv%u.%u %s",
5350                         clp->rpc_ops->version, clp->cl_minorversion,
5351                         clp->cl_rpcclient->cl_nodename);
5352         clp->cl_owner_id = str;
5353         return 0;
5354 }
5355
5356 /*
5357  * nfs4_callback_up_net() starts only "tcp" and "tcp6" callback
5358  * services.  Advertise one based on the address family of the
5359  * clientaddr.
5360  */
5361 static unsigned int
5362 nfs4_init_callback_netid(const struct nfs_client *clp, char *buf, size_t len)
5363 {
5364         if (strchr(clp->cl_ipaddr, ':') != NULL)
5365                 return scnprintf(buf, len, "tcp6");
5366         else
5367                 return scnprintf(buf, len, "tcp");
5368 }
5369
5370 static void nfs4_setclientid_done(struct rpc_task *task, void *calldata)
5371 {
5372         struct nfs4_setclientid *sc = calldata;
5373
5374         if (task->tk_status == 0)
5375                 sc->sc_cred = get_rpccred(task->tk_rqstp->rq_cred);
5376 }
5377
5378 static const struct rpc_call_ops nfs4_setclientid_ops = {
5379         .rpc_call_done = nfs4_setclientid_done,
5380 };
5381
5382 /**
5383  * nfs4_proc_setclientid - Negotiate client ID
5384  * @clp: state data structure
5385  * @program: RPC program for NFSv4 callback service
5386  * @port: IP port number for NFS4 callback service
5387  * @cred: RPC credential to use for this call
5388  * @res: where to place the result
5389  *
5390  * Returns zero, a negative errno, or a negative NFS4ERR status code.
5391  */
5392 int nfs4_proc_setclientid(struct nfs_client *clp, u32 program,
5393                 unsigned short port, struct rpc_cred *cred,
5394                 struct nfs4_setclientid_res *res)
5395 {
5396         nfs4_verifier sc_verifier;
5397         struct nfs4_setclientid setclientid = {
5398                 .sc_verifier = &sc_verifier,
5399                 .sc_prog = program,
5400                 .sc_clnt = clp,
5401         };
5402         struct rpc_message msg = {
5403                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SETCLIENTID],
5404                 .rpc_argp = &setclientid,
5405                 .rpc_resp = res,
5406                 .rpc_cred = cred,
5407         };
5408         struct rpc_task *task;
5409         struct rpc_task_setup task_setup_data = {
5410                 .rpc_client = clp->cl_rpcclient,
5411                 .rpc_message = &msg,
5412                 .callback_ops = &nfs4_setclientid_ops,
5413                 .callback_data = &setclientid,
5414                 .flags = RPC_TASK_TIMEOUT,
5415         };
5416         int status;
5417
5418         /* nfs_client_id4 */
5419         nfs4_init_boot_verifier(clp, &sc_verifier);
5420
5421         if (test_bit(NFS_CS_MIGRATION, &clp->cl_flags))
5422                 status = nfs4_init_uniform_client_string(clp);
5423         else
5424                 status = nfs4_init_nonuniform_client_string(clp);
5425
5426         if (status)
5427                 goto out;
5428
5429         /* cb_client4 */
5430         setclientid.sc_netid_len =
5431                                 nfs4_init_callback_netid(clp,
5432                                                 setclientid.sc_netid,
5433                                                 sizeof(setclientid.sc_netid));
5434         setclientid.sc_uaddr_len = scnprintf(setclientid.sc_uaddr,
5435                                 sizeof(setclientid.sc_uaddr), "%s.%u.%u",
5436                                 clp->cl_ipaddr, port >> 8, port & 255);
5437
5438         dprintk("NFS call  setclientid auth=%s, '%s'\n",
5439                 clp->cl_rpcclient->cl_auth->au_ops->au_name,
5440                 clp->cl_owner_id);
5441         task = rpc_run_task(&task_setup_data);
5442         if (IS_ERR(task)) {
5443                 status = PTR_ERR(task);
5444                 goto out;
5445         }
5446         status = task->tk_status;
5447         if (setclientid.sc_cred) {
5448                 clp->cl_acceptor = rpcauth_stringify_acceptor(setclientid.sc_cred);
5449                 put_rpccred(setclientid.sc_cred);
5450         }
5451         rpc_put_task(task);
5452 out:
5453         trace_nfs4_setclientid(clp, status);
5454         dprintk("NFS reply setclientid: %d\n", status);
5455         return status;
5456 }
5457
5458 /**
5459  * nfs4_proc_setclientid_confirm - Confirm client ID
5460  * @clp: state data structure
5461  * @res: result of a previous SETCLIENTID
5462  * @cred: RPC credential to use for this call
5463  *
5464  * Returns zero, a negative errno, or a negative NFS4ERR status code.
5465  */
5466 int nfs4_proc_setclientid_confirm(struct nfs_client *clp,
5467                 struct nfs4_setclientid_res *arg,
5468                 struct rpc_cred *cred)
5469 {
5470         struct rpc_message msg = {
5471                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SETCLIENTID_CONFIRM],
5472                 .rpc_argp = arg,
5473                 .rpc_cred = cred,
5474         };
5475         int status;
5476
5477         dprintk("NFS call  setclientid_confirm auth=%s, (client ID %llx)\n",
5478                 clp->cl_rpcclient->cl_auth->au_ops->au_name,
5479                 clp->cl_clientid);
5480         status = rpc_call_sync(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
5481         trace_nfs4_setclientid_confirm(clp, status);
5482         dprintk("NFS reply setclientid_confirm: %d\n", status);
5483         return status;
5484 }
5485
5486 struct nfs4_delegreturndata {
5487         struct nfs4_delegreturnargs args;
5488         struct nfs4_delegreturnres res;
5489         struct nfs_fh fh;
5490         nfs4_stateid stateid;
5491         unsigned long timestamp;
5492         struct nfs_fattr fattr;
5493         int rpc_status;
5494         struct inode *inode;
5495         bool roc;
5496         u32 roc_barrier;
5497 };
5498
5499 static void nfs4_delegreturn_done(struct rpc_task *task, void *calldata)
5500 {
5501         struct nfs4_delegreturndata *data = calldata;
5502
5503         if (!nfs4_sequence_done(task, &data->res.seq_res))
5504                 return;
5505
5506         trace_nfs4_delegreturn_exit(&data->args, &data->res, task->tk_status);
5507         switch (task->tk_status) {
5508         case 0:
5509                 renew_lease(data->res.server, data->timestamp);
5510         case -NFS4ERR_ADMIN_REVOKED:
5511         case -NFS4ERR_DELEG_REVOKED:
5512         case -NFS4ERR_EXPIRED:
5513                 nfs4_free_revoked_stateid(data->res.server,
5514                                 data->args.stateid,
5515                                 task->tk_msg.rpc_cred);
5516         case -NFS4ERR_BAD_STATEID:
5517         case -NFS4ERR_OLD_STATEID:
5518         case -NFS4ERR_STALE_STATEID:
5519                 task->tk_status = 0;
5520                 if (data->roc)
5521                         pnfs_roc_set_barrier(data->inode, data->roc_barrier);
5522                 break;
5523         default:
5524                 if (nfs4_async_handle_error(task, data->res.server,
5525                                             NULL, NULL) == -EAGAIN) {
5526                         rpc_restart_call_prepare(task);
5527                         return;
5528                 }
5529         }
5530         data->rpc_status = task->tk_status;
5531 }
5532
5533 static void nfs4_delegreturn_release(void *calldata)
5534 {
5535         struct nfs4_delegreturndata *data = calldata;
5536         struct inode *inode = data->inode;
5537
5538         if (inode) {
5539                 if (data->roc)
5540                         pnfs_roc_release(inode);
5541                 nfs_iput_and_deactive(inode);
5542         }
5543         kfree(calldata);
5544 }
5545
5546 static void nfs4_delegreturn_prepare(struct rpc_task *task, void *data)
5547 {
5548         struct nfs4_delegreturndata *d_data;
5549
5550         d_data = (struct nfs4_delegreturndata *)data;
5551
5552         if (nfs4_wait_on_layoutreturn(d_data->inode, task))
5553                 return;
5554
5555         if (d_data->roc)
5556                 pnfs_roc_get_barrier(d_data->inode, &d_data->roc_barrier);
5557
5558         nfs4_setup_sequence(d_data->res.server,
5559                         &d_data->args.seq_args,
5560                         &d_data->res.seq_res,
5561                         task);
5562 }
5563
5564 static const struct rpc_call_ops nfs4_delegreturn_ops = {
5565         .rpc_call_prepare = nfs4_delegreturn_prepare,
5566         .rpc_call_done = nfs4_delegreturn_done,
5567         .rpc_release = nfs4_delegreturn_release,
5568 };
5569
5570 static int _nfs4_proc_delegreturn(struct inode *inode, struct rpc_cred *cred, const nfs4_stateid *stateid, int issync)
5571 {
5572         struct nfs4_delegreturndata *data;
5573         struct nfs_server *server = NFS_SERVER(inode);
5574         struct rpc_task *task;
5575         struct rpc_message msg = {
5576                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_DELEGRETURN],
5577                 .rpc_cred = cred,
5578         };
5579         struct rpc_task_setup task_setup_data = {
5580                 .rpc_client = server->client,
5581                 .rpc_message = &msg,
5582                 .callback_ops = &nfs4_delegreturn_ops,
5583                 .flags = RPC_TASK_ASYNC,
5584         };
5585         int status = 0;
5586
5587         data = kzalloc(sizeof(*data), GFP_NOFS);
5588         if (data == NULL)
5589                 return -ENOMEM;
5590         nfs4_init_sequence(&data->args.seq_args, &data->res.seq_res, 1);
5591
5592         nfs4_state_protect(server->nfs_client,
5593                         NFS_SP4_MACH_CRED_CLEANUP,
5594                         &task_setup_data.rpc_client, &msg);
5595
5596         data->args.fhandle = &data->fh;
5597         data->args.stateid = &data->stateid;
5598         data->args.bitmask = server->cache_consistency_bitmask;
5599         nfs_copy_fh(&data->fh, NFS_FH(inode));
5600         nfs4_stateid_copy(&data->stateid, stateid);
5601         data->res.fattr = &data->fattr;
5602         data->res.server = server;
5603         nfs_fattr_init(data->res.fattr);
5604         data->timestamp = jiffies;
5605         data->rpc_status = 0;
5606         data->inode = nfs_igrab_and_active(inode);
5607         if (data->inode)
5608                 data->roc = nfs4_roc(inode);
5609
5610         task_setup_data.callback_data = data;
5611         msg.rpc_argp = &data->args;
5612         msg.rpc_resp = &data->res;
5613         task = rpc_run_task(&task_setup_data);
5614         if (IS_ERR(task))
5615                 return PTR_ERR(task);
5616         if (!issync)
5617                 goto out;
5618         status = nfs4_wait_for_completion_rpc_task(task);
5619         if (status != 0)
5620                 goto out;
5621         status = data->rpc_status;
5622         if (status == 0)
5623                 nfs_post_op_update_inode_force_wcc(inode, &data->fattr);
5624         else
5625                 nfs_refresh_inode(inode, &data->fattr);
5626 out:
5627         rpc_put_task(task);
5628         return status;
5629 }
5630
5631 int nfs4_proc_delegreturn(struct inode *inode, struct rpc_cred *cred, const nfs4_stateid *stateid, int issync)
5632 {
5633         struct nfs_server *server = NFS_SERVER(inode);
5634         struct nfs4_exception exception = { };
5635         int err;
5636         do {
5637                 err = _nfs4_proc_delegreturn(inode, cred, stateid, issync);
5638                 trace_nfs4_delegreturn(inode, stateid, err);
5639                 switch (err) {
5640                         case -NFS4ERR_STALE_STATEID:
5641                         case -NFS4ERR_EXPIRED:
5642                         case 0:
5643                                 return 0;
5644                 }
5645                 err = nfs4_handle_exception(server, err, &exception);
5646         } while (exception.retry);
5647         return err;
5648 }
5649
5650 static int _nfs4_proc_getlk(struct nfs4_state *state, int cmd, struct file_lock *request)
5651 {
5652         struct inode *inode = state->inode;
5653         struct nfs_server *server = NFS_SERVER(inode);
5654         struct nfs_client *clp = server->nfs_client;
5655         struct nfs_lockt_args arg = {
5656                 .fh = NFS_FH(inode),
5657                 .fl = request,
5658         };
5659         struct nfs_lockt_res res = {
5660                 .denied = request,
5661         };
5662         struct rpc_message msg = {
5663                 .rpc_proc       = &nfs4_procedures[NFSPROC4_CLNT_LOCKT],
5664                 .rpc_argp       = &arg,
5665                 .rpc_resp       = &res,
5666                 .rpc_cred       = state->owner->so_cred,
5667         };
5668         struct nfs4_lock_state *lsp;
5669         int status;
5670
5671         arg.lock_owner.clientid = clp->cl_clientid;
5672         status = nfs4_set_lock_state(state, request);
5673         if (status != 0)
5674                 goto out;
5675         lsp = request->fl_u.nfs4_fl.owner;
5676         arg.lock_owner.id = lsp->ls_seqid.owner_id;
5677         arg.lock_owner.s_dev = server->s_dev;
5678         status = nfs4_call_sync(server->client, server, &msg, &arg.seq_args, &res.seq_res, 1);
5679         switch (status) {
5680                 case 0:
5681                         request->fl_type = F_UNLCK;
5682                         break;
5683                 case -NFS4ERR_DENIED:
5684                         status = 0;
5685         }
5686         request->fl_ops->fl_release_private(request);
5687         request->fl_ops = NULL;
5688 out:
5689         return status;
5690 }
5691
5692 static int nfs4_proc_getlk(struct nfs4_state *state, int cmd, struct file_lock *request)
5693 {
5694         struct nfs4_exception exception = { };
5695         int err;
5696
5697         do {
5698                 err = _nfs4_proc_getlk(state, cmd, request);
5699                 trace_nfs4_get_lock(request, state, cmd, err);
5700                 err = nfs4_handle_exception(NFS_SERVER(state->inode), err,
5701                                 &exception);
5702         } while (exception.retry);
5703         return err;
5704 }
5705
5706 struct nfs4_unlockdata {
5707         struct nfs_locku_args arg;
5708         struct nfs_locku_res res;
5709         struct nfs4_lock_state *lsp;
5710         struct nfs_open_context *ctx;
5711         struct file_lock fl;
5712         struct nfs_server *server;
5713         unsigned long timestamp;
5714 };
5715
5716 static struct nfs4_unlockdata *nfs4_alloc_unlockdata(struct file_lock *fl,
5717                 struct nfs_open_context *ctx,
5718                 struct nfs4_lock_state *lsp,
5719                 struct nfs_seqid *seqid)
5720 {
5721         struct nfs4_unlockdata *p;
5722         struct inode *inode = lsp->ls_state->inode;
5723
5724         p = kzalloc(sizeof(*p), GFP_NOFS);
5725         if (p == NULL)
5726                 return NULL;
5727         p->arg.fh = NFS_FH(inode);
5728         p->arg.fl = &p->fl;
5729         p->arg.seqid = seqid;
5730         p->res.seqid = seqid;
5731         p->lsp = lsp;
5732         atomic_inc(&lsp->ls_count);
5733         /* Ensure we don't close file until we're done freeing locks! */
5734         p->ctx = get_nfs_open_context(ctx);
5735         memcpy(&p->fl, fl, sizeof(p->fl));
5736         p->server = NFS_SERVER(inode);
5737         return p;
5738 }
5739
5740 static void nfs4_locku_release_calldata(void *data)
5741 {
5742         struct nfs4_unlockdata *calldata = data;
5743         nfs_free_seqid(calldata->arg.seqid);
5744         nfs4_put_lock_state(calldata->lsp);
5745         put_nfs_open_context(calldata->ctx);
5746         kfree(calldata);
5747 }
5748
5749 static void nfs4_locku_done(struct rpc_task *task, void *data)
5750 {
5751         struct nfs4_unlockdata *calldata = data;
5752
5753         if (!nfs4_sequence_done(task, &calldata->res.seq_res))
5754                 return;
5755         switch (task->tk_status) {
5756                 case 0:
5757                         renew_lease(calldata->server, calldata->timestamp);
5758                         locks_lock_inode_wait(calldata->lsp->ls_state->inode, &calldata->fl);
5759                         if (nfs4_update_lock_stateid(calldata->lsp,
5760                                         &calldata->res.stateid))
5761                                 break;
5762                 case -NFS4ERR_ADMIN_REVOKED:
5763                 case -NFS4ERR_EXPIRED:
5764                         nfs4_free_revoked_stateid(calldata->server,
5765                                         &calldata->arg.stateid,
5766                                         task->tk_msg.rpc_cred);
5767                 case -NFS4ERR_BAD_STATEID:
5768                 case -NFS4ERR_OLD_STATEID:
5769                 case -NFS4ERR_STALE_STATEID:
5770                         if (!nfs4_stateid_match(&calldata->arg.stateid,
5771                                                 &calldata->lsp->ls_stateid))
5772                                 rpc_restart_call_prepare(task);
5773                         break;
5774                 default:
5775                         if (nfs4_async_handle_error(task, calldata->server,
5776                                                     NULL, NULL) == -EAGAIN)
5777                                 rpc_restart_call_prepare(task);
5778         }
5779         nfs_release_seqid(calldata->arg.seqid);
5780 }
5781
5782 static void nfs4_locku_prepare(struct rpc_task *task, void *data)
5783 {
5784         struct nfs4_unlockdata *calldata = data;
5785
5786         if (nfs_wait_on_sequence(calldata->arg.seqid, task) != 0)
5787                 goto out_wait;
5788         nfs4_stateid_copy(&calldata->arg.stateid, &calldata->lsp->ls_stateid);
5789         if (test_bit(NFS_LOCK_INITIALIZED, &calldata->lsp->ls_flags) == 0) {
5790                 /* Note: exit _without_ running nfs4_locku_done */
5791                 goto out_no_action;
5792         }
5793         calldata->timestamp = jiffies;
5794         if (nfs4_setup_sequence(calldata->server,
5795                                 &calldata->arg.seq_args,
5796                                 &calldata->res.seq_res,
5797                                 task) != 0)
5798                 nfs_release_seqid(calldata->arg.seqid);
5799         return;
5800 out_no_action:
5801         task->tk_action = NULL;
5802 out_wait:
5803         nfs4_sequence_done(task, &calldata->res.seq_res);
5804 }
5805
5806 static const struct rpc_call_ops nfs4_locku_ops = {
5807         .rpc_call_prepare = nfs4_locku_prepare,
5808         .rpc_call_done = nfs4_locku_done,
5809         .rpc_release = nfs4_locku_release_calldata,
5810 };
5811
5812 static struct rpc_task *nfs4_do_unlck(struct file_lock *fl,
5813                 struct nfs_open_context *ctx,
5814                 struct nfs4_lock_state *lsp,
5815                 struct nfs_seqid *seqid)
5816 {
5817         struct nfs4_unlockdata *data;
5818         struct rpc_message msg = {
5819                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LOCKU],
5820                 .rpc_cred = ctx->cred,
5821         };
5822         struct rpc_task_setup task_setup_data = {
5823                 .rpc_client = NFS_CLIENT(lsp->ls_state->inode),
5824                 .rpc_message = &msg,
5825                 .callback_ops = &nfs4_locku_ops,
5826                 .workqueue = nfsiod_workqueue,
5827                 .flags = RPC_TASK_ASYNC,
5828         };
5829
5830         nfs4_state_protect(NFS_SERVER(lsp->ls_state->inode)->nfs_client,
5831                 NFS_SP4_MACH_CRED_CLEANUP, &task_setup_data.rpc_client, &msg);
5832
5833         /* Ensure this is an unlock - when canceling a lock, the
5834          * canceled lock is passed in, and it won't be an unlock.
5835          */
5836         fl->fl_type = F_UNLCK;
5837
5838         data = nfs4_alloc_unlockdata(fl, ctx, lsp, seqid);
5839         if (data == NULL) {
5840                 nfs_free_seqid(seqid);
5841                 return ERR_PTR(-ENOMEM);
5842         }
5843
5844         nfs4_init_sequence(&data->arg.seq_args, &data->res.seq_res, 1);
5845         msg.rpc_argp = &data->arg;
5846         msg.rpc_resp = &data->res;
5847         task_setup_data.callback_data = data;
5848         return rpc_run_task(&task_setup_data);
5849 }
5850
5851 static int nfs4_proc_unlck(struct nfs4_state *state, int cmd, struct file_lock *request)
5852 {
5853         struct inode *inode = state->inode;
5854         struct nfs4_state_owner *sp = state->owner;
5855         struct nfs_inode *nfsi = NFS_I(inode);
5856         struct nfs_seqid *seqid;
5857         struct nfs4_lock_state *lsp;
5858         struct rpc_task *task;
5859         struct nfs_seqid *(*alloc_seqid)(struct nfs_seqid_counter *, gfp_t);
5860         int status = 0;
5861         unsigned char fl_flags = request->fl_flags;
5862
5863         status = nfs4_set_lock_state(state, request);
5864         /* Unlock _before_ we do the RPC call */
5865         request->fl_flags |= FL_EXISTS;
5866         /* Exclude nfs_delegation_claim_locks() */
5867         mutex_lock(&sp->so_delegreturn_mutex);
5868         /* Exclude nfs4_reclaim_open_stateid() - note nesting! */
5869         down_read(&nfsi->rwsem);
5870         if (locks_lock_inode_wait(inode, request) == -ENOENT) {
5871                 up_read(&nfsi->rwsem);
5872                 mutex_unlock(&sp->so_delegreturn_mutex);
5873                 goto out;
5874         }
5875         up_read(&nfsi->rwsem);
5876         mutex_unlock(&sp->so_delegreturn_mutex);
5877         if (status != 0)
5878                 goto out;
5879         /* Is this a delegated lock? */
5880         lsp = request->fl_u.nfs4_fl.owner;
5881         if (test_bit(NFS_LOCK_INITIALIZED, &lsp->ls_flags) == 0)
5882                 goto out;
5883         alloc_seqid = NFS_SERVER(inode)->nfs_client->cl_mvops->alloc_seqid;
5884         seqid = alloc_seqid(&lsp->ls_seqid, GFP_KERNEL);
5885         status = -ENOMEM;
5886         if (IS_ERR(seqid))
5887                 goto out;
5888         task = nfs4_do_unlck(request, nfs_file_open_context(request->fl_file), lsp, seqid);
5889         status = PTR_ERR(task);
5890         if (IS_ERR(task))
5891                 goto out;
5892         status = nfs4_wait_for_completion_rpc_task(task);
5893         rpc_put_task(task);
5894 out:
5895         request->fl_flags = fl_flags;
5896         trace_nfs4_unlock(request, state, F_SETLK, status);
5897         return status;
5898 }
5899
5900 struct nfs4_lockdata {
5901         struct nfs_lock_args arg;
5902         struct nfs_lock_res res;
5903         struct nfs4_lock_state *lsp;
5904         struct nfs_open_context *ctx;
5905         struct file_lock fl;
5906         unsigned long timestamp;
5907         int rpc_status;
5908         int cancelled;
5909         struct nfs_server *server;
5910 };
5911
5912 static struct nfs4_lockdata *nfs4_alloc_lockdata(struct file_lock *fl,
5913                 struct nfs_open_context *ctx, struct nfs4_lock_state *lsp,
5914                 gfp_t gfp_mask)
5915 {
5916         struct nfs4_lockdata *p;
5917         struct inode *inode = lsp->ls_state->inode;
5918         struct nfs_server *server = NFS_SERVER(inode);
5919         struct nfs_seqid *(*alloc_seqid)(struct nfs_seqid_counter *, gfp_t);
5920
5921         p = kzalloc(sizeof(*p), gfp_mask);
5922         if (p == NULL)
5923                 return NULL;
5924
5925         p->arg.fh = NFS_FH(inode);
5926         p->arg.fl = &p->fl;
5927         p->arg.open_seqid = nfs_alloc_seqid(&lsp->ls_state->owner->so_seqid, gfp_mask);
5928         if (IS_ERR(p->arg.open_seqid))
5929                 goto out_free;
5930         alloc_seqid = server->nfs_client->cl_mvops->alloc_seqid;
5931         p->arg.lock_seqid = alloc_seqid(&lsp->ls_seqid, gfp_mask);
5932         if (IS_ERR(p->arg.lock_seqid))
5933                 goto out_free_seqid;
5934         p->arg.lock_owner.clientid = server->nfs_client->cl_clientid;
5935         p->arg.lock_owner.id = lsp->ls_seqid.owner_id;
5936         p->arg.lock_owner.s_dev = server->s_dev;
5937         p->res.lock_seqid = p->arg.lock_seqid;
5938         p->lsp = lsp;
5939         p->server = server;
5940         atomic_inc(&lsp->ls_count);
5941         p->ctx = get_nfs_open_context(ctx);
5942         get_file(fl->fl_file);
5943         memcpy(&p->fl, fl, sizeof(p->fl));
5944         return p;
5945 out_free_seqid:
5946         nfs_free_seqid(p->arg.open_seqid);
5947 out_free:
5948         kfree(p);
5949         return NULL;
5950 }
5951
5952 static void nfs4_lock_prepare(struct rpc_task *task, void *calldata)
5953 {
5954         struct nfs4_lockdata *data = calldata;
5955         struct nfs4_state *state = data->lsp->ls_state;
5956
5957         dprintk("%s: begin!\n", __func__);
5958         if (nfs_wait_on_sequence(data->arg.lock_seqid, task) != 0)
5959                 goto out_wait;
5960         /* Do we need to do an open_to_lock_owner? */
5961         if (!test_bit(NFS_LOCK_INITIALIZED, &data->lsp->ls_flags)) {
5962                 if (nfs_wait_on_sequence(data->arg.open_seqid, task) != 0) {
5963                         goto out_release_lock_seqid;
5964                 }
5965                 nfs4_stateid_copy(&data->arg.open_stateid,
5966                                 &state->open_stateid);
5967                 data->arg.new_lock_owner = 1;
5968                 data->res.open_seqid = data->arg.open_seqid;
5969         } else {
5970                 data->arg.new_lock_owner = 0;
5971                 nfs4_stateid_copy(&data->arg.lock_stateid,
5972                                 &data->lsp->ls_stateid);
5973         }
5974         if (!nfs4_valid_open_stateid(state)) {
5975                 data->rpc_status = -EBADF;
5976                 task->tk_action = NULL;
5977                 goto out_release_open_seqid;
5978         }
5979         data->timestamp = jiffies;
5980         if (nfs4_setup_sequence(data->server,
5981                                 &data->arg.seq_args,
5982                                 &data->res.seq_res,
5983                                 task) == 0)
5984                 return;
5985 out_release_open_seqid:
5986         nfs_release_seqid(data->arg.open_seqid);
5987 out_release_lock_seqid:
5988         nfs_release_seqid(data->arg.lock_seqid);
5989 out_wait:
5990         nfs4_sequence_done(task, &data->res.seq_res);
5991         dprintk("%s: done!, ret = %d\n", __func__, data->rpc_status);
5992 }
5993
5994 static void nfs4_lock_done(struct rpc_task *task, void *calldata)
5995 {
5996         struct nfs4_lockdata *data = calldata;
5997         struct nfs4_lock_state *lsp = data->lsp;
5998
5999         dprintk("%s: begin!\n", __func__);
6000
6001         if (!nfs4_sequence_done(task, &data->res.seq_res))
6002                 return;
6003
6004         data->rpc_status = task->tk_status;
6005         switch (task->tk_status) {
6006         case 0:
6007                 renew_lease(NFS_SERVER(d_inode(data->ctx->dentry)),
6008                                 data->timestamp);
6009                 if (data->arg.new_lock) {
6010                         data->fl.fl_flags &= ~(FL_SLEEP | FL_ACCESS);
6011                         if (locks_lock_inode_wait(lsp->ls_state->inode, &data->fl) < 0) {
6012                                 rpc_restart_call_prepare(task);
6013                                 break;
6014                         }
6015                 }
6016                 if (data->arg.new_lock_owner != 0) {
6017                         nfs_confirm_seqid(&lsp->ls_seqid, 0);
6018                         nfs4_stateid_copy(&lsp->ls_stateid, &data->res.stateid);
6019                         set_bit(NFS_LOCK_INITIALIZED, &lsp->ls_flags);
6020                 } else if (!nfs4_update_lock_stateid(lsp, &data->res.stateid))
6021                         rpc_restart_call_prepare(task);
6022                 break;
6023         case -NFS4ERR_BAD_STATEID:
6024         case -NFS4ERR_OLD_STATEID:
6025         case -NFS4ERR_STALE_STATEID:
6026         case -NFS4ERR_EXPIRED:
6027                 if (data->arg.new_lock_owner != 0) {
6028                         if (!nfs4_stateid_match(&data->arg.open_stateid,
6029                                                 &lsp->ls_state->open_stateid))
6030                                 rpc_restart_call_prepare(task);
6031                 } else if (!nfs4_stateid_match(&data->arg.lock_stateid,
6032                                                 &lsp->ls_stateid))
6033                                 rpc_restart_call_prepare(task);
6034         }
6035         dprintk("%s: done, ret = %d!\n", __func__, data->rpc_status);
6036 }
6037
6038 static void nfs4_lock_release(void *calldata)
6039 {
6040         struct nfs4_lockdata *data = calldata;
6041
6042         dprintk("%s: begin!\n", __func__);
6043         nfs_free_seqid(data->arg.open_seqid);
6044         if (data->cancelled != 0) {
6045                 struct rpc_task *task;
6046                 task = nfs4_do_unlck(&data->fl, data->ctx, data->lsp,
6047                                 data->arg.lock_seqid);
6048                 if (!IS_ERR(task))
6049                         rpc_put_task_async(task);
6050                 dprintk("%s: cancelling lock!\n", __func__);
6051         } else
6052                 nfs_free_seqid(data->arg.lock_seqid);
6053         nfs4_put_lock_state(data->lsp);
6054         put_nfs_open_context(data->ctx);
6055         fput(data->fl.fl_file);
6056         kfree(data);
6057         dprintk("%s: done!\n", __func__);
6058 }
6059
6060 static const struct rpc_call_ops nfs4_lock_ops = {
6061         .rpc_call_prepare = nfs4_lock_prepare,
6062         .rpc_call_done = nfs4_lock_done,
6063         .rpc_release = nfs4_lock_release,
6064 };
6065
6066 static void nfs4_handle_setlk_error(struct nfs_server *server, struct nfs4_lock_state *lsp, int new_lock_owner, int error)
6067 {
6068         switch (error) {
6069         case -NFS4ERR_ADMIN_REVOKED:
6070         case -NFS4ERR_BAD_STATEID:
6071                 lsp->ls_seqid.flags &= ~NFS_SEQID_CONFIRMED;
6072                 if (new_lock_owner != 0 ||
6073                    test_bit(NFS_LOCK_INITIALIZED, &lsp->ls_flags) != 0)
6074                         nfs4_schedule_stateid_recovery(server, lsp->ls_state);
6075                 break;
6076         case -NFS4ERR_STALE_STATEID:
6077                 lsp->ls_seqid.flags &= ~NFS_SEQID_CONFIRMED;
6078         case -NFS4ERR_EXPIRED:
6079                 nfs4_schedule_lease_recovery(server->nfs_client);
6080         };
6081 }
6082
6083 static int _nfs4_do_setlk(struct nfs4_state *state, int cmd, struct file_lock *fl, int recovery_type)
6084 {
6085         struct nfs4_lockdata *data;
6086         struct rpc_task *task;
6087         struct rpc_message msg = {
6088                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LOCK],
6089                 .rpc_cred = state->owner->so_cred,
6090         };
6091         struct rpc_task_setup task_setup_data = {
6092                 .rpc_client = NFS_CLIENT(state->inode),
6093                 .rpc_message = &msg,
6094                 .callback_ops = &nfs4_lock_ops,
6095                 .workqueue = nfsiod_workqueue,
6096                 .flags = RPC_TASK_ASYNC,
6097         };
6098         int ret;
6099
6100         dprintk("%s: begin!\n", __func__);
6101         data = nfs4_alloc_lockdata(fl, nfs_file_open_context(fl->fl_file),
6102                         fl->fl_u.nfs4_fl.owner,
6103                         recovery_type == NFS_LOCK_NEW ? GFP_KERNEL : GFP_NOFS);
6104         if (data == NULL)
6105                 return -ENOMEM;
6106         if (IS_SETLKW(cmd))
6107                 data->arg.block = 1;
6108         nfs4_init_sequence(&data->arg.seq_args, &data->res.seq_res, 1);
6109         msg.rpc_argp = &data->arg;
6110         msg.rpc_resp = &data->res;
6111         task_setup_data.callback_data = data;
6112         if (recovery_type > NFS_LOCK_NEW) {
6113                 if (recovery_type == NFS_LOCK_RECLAIM)
6114                         data->arg.reclaim = NFS_LOCK_RECLAIM;
6115                 nfs4_set_sequence_privileged(&data->arg.seq_args);
6116         } else
6117                 data->arg.new_lock = 1;
6118         task = rpc_run_task(&task_setup_data);
6119         if (IS_ERR(task))
6120                 return PTR_ERR(task);
6121         ret = nfs4_wait_for_completion_rpc_task(task);
6122         if (ret == 0) {
6123                 ret = data->rpc_status;
6124                 if (ret)
6125                         nfs4_handle_setlk_error(data->server, data->lsp,
6126                                         data->arg.new_lock_owner, ret);
6127         } else
6128                 data->cancelled = 1;
6129         rpc_put_task(task);
6130         dprintk("%s: done, ret = %d!\n", __func__, ret);
6131         trace_nfs4_set_lock(fl, state, &data->res.stateid, cmd, ret);
6132         return ret;
6133 }
6134
6135 static int nfs4_lock_reclaim(struct nfs4_state *state, struct file_lock *request)
6136 {
6137         struct nfs_server *server = NFS_SERVER(state->inode);
6138         struct nfs4_exception exception = {
6139                 .inode = state->inode,
6140         };
6141         int err;
6142
6143         do {
6144                 /* Cache the lock if possible... */
6145                 if (test_bit(NFS_DELEGATED_STATE, &state->flags) != 0)
6146                         return 0;
6147                 err = _nfs4_do_setlk(state, F_SETLK, request, NFS_LOCK_RECLAIM);
6148                 if (err != -NFS4ERR_DELAY)
6149                         break;
6150                 nfs4_handle_exception(server, err, &exception);
6151         } while (exception.retry);
6152         return err;
6153 }
6154
6155 static int nfs4_lock_expired(struct nfs4_state *state, struct file_lock *request)
6156 {
6157         struct nfs_server *server = NFS_SERVER(state->inode);
6158         struct nfs4_exception exception = {
6159                 .inode = state->inode,
6160         };
6161         int err;
6162
6163         err = nfs4_set_lock_state(state, request);
6164         if (err != 0)
6165                 return err;
6166         if (!recover_lost_locks) {
6167                 set_bit(NFS_LOCK_LOST, &request->fl_u.nfs4_fl.owner->ls_flags);
6168                 return 0;
6169         }
6170         do {
6171                 if (test_bit(NFS_DELEGATED_STATE, &state->flags) != 0)
6172                         return 0;
6173                 err = _nfs4_do_setlk(state, F_SETLK, request, NFS_LOCK_EXPIRED);
6174                 switch (err) {
6175                 default:
6176                         goto out;
6177                 case -NFS4ERR_GRACE:
6178                 case -NFS4ERR_DELAY:
6179                         nfs4_handle_exception(server, err, &exception);
6180                         err = 0;
6181                 }
6182         } while (exception.retry);
6183 out:
6184         return err;
6185 }
6186
6187 #if defined(CONFIG_NFS_V4_1)
6188 static int nfs41_lock_expired(struct nfs4_state *state, struct file_lock *request)
6189 {
6190         struct nfs4_lock_state *lsp;
6191         int status;
6192
6193         status = nfs4_set_lock_state(state, request);
6194         if (status != 0)
6195                 return status;
6196         lsp = request->fl_u.nfs4_fl.owner;
6197         if (test_bit(NFS_LOCK_INITIALIZED, &lsp->ls_flags) ||
6198             test_bit(NFS_LOCK_LOST, &lsp->ls_flags))
6199                 return 0;
6200         status = nfs4_lock_expired(state, request);
6201         return status;
6202 }
6203 #endif
6204
6205 static int _nfs4_proc_setlk(struct nfs4_state *state, int cmd, struct file_lock *request)
6206 {
6207         struct nfs_inode *nfsi = NFS_I(state->inode);
6208         struct nfs4_state_owner *sp = state->owner;
6209         unsigned char fl_flags = request->fl_flags;
6210         int status;
6211
6212         request->fl_flags |= FL_ACCESS;
6213         status = locks_lock_inode_wait(state->inode, request);
6214         if (status < 0)
6215                 goto out;
6216         mutex_lock(&sp->so_delegreturn_mutex);
6217         down_read(&nfsi->rwsem);
6218         if (test_bit(NFS_DELEGATED_STATE, &state->flags)) {
6219                 /* Yes: cache locks! */
6220                 /* ...but avoid races with delegation recall... */
6221                 request->fl_flags = fl_flags & ~FL_SLEEP;
6222                 status = locks_lock_inode_wait(state->inode, request);
6223                 up_read(&nfsi->rwsem);
6224                 mutex_unlock(&sp->so_delegreturn_mutex);
6225                 goto out;
6226         }
6227         up_read(&nfsi->rwsem);
6228         mutex_unlock(&sp->so_delegreturn_mutex);
6229         status = _nfs4_do_setlk(state, cmd, request, NFS_LOCK_NEW);
6230 out:
6231         request->fl_flags = fl_flags;
6232         return status;
6233 }
6234
6235 static int nfs4_proc_setlk(struct nfs4_state *state, int cmd, struct file_lock *request)
6236 {
6237         struct nfs4_exception exception = {
6238                 .state = state,
6239                 .inode = state->inode,
6240         };
6241         int err;
6242
6243         do {
6244                 err = _nfs4_proc_setlk(state, cmd, request);
6245                 if (err == -NFS4ERR_DENIED)
6246                         err = -EAGAIN;
6247                 err = nfs4_handle_exception(NFS_SERVER(state->inode),
6248                                 err, &exception);
6249         } while (exception.retry);
6250         return err;
6251 }
6252
6253 #define NFS4_LOCK_MINTIMEOUT (1 * HZ)
6254 #define NFS4_LOCK_MAXTIMEOUT (30 * HZ)
6255
6256 static int
6257 nfs4_retry_setlk_simple(struct nfs4_state *state, int cmd,
6258                         struct file_lock *request)
6259 {
6260         int             status = -ERESTARTSYS;
6261         unsigned long   timeout = NFS4_LOCK_MINTIMEOUT;
6262
6263         while(!signalled()) {
6264                 status = nfs4_proc_setlk(state, cmd, request);
6265                 if ((status != -EAGAIN) || IS_SETLK(cmd))
6266                         break;
6267                 freezable_schedule_timeout_interruptible(timeout);
6268                 timeout *= 2;
6269                 timeout = min_t(unsigned long, NFS4_LOCK_MAXTIMEOUT, timeout);
6270                 status = -ERESTARTSYS;
6271         }
6272         return status;
6273 }
6274
6275 #ifdef CONFIG_NFS_V4_1
6276 struct nfs4_lock_waiter {
6277         struct task_struct      *task;
6278         struct inode            *inode;
6279         struct nfs_lowner       *owner;
6280         bool                    notified;
6281 };
6282
6283 static int
6284 nfs4_wake_lock_waiter(wait_queue_t *wait, unsigned int mode, int flags, void *key)
6285 {
6286         int ret;
6287         struct cb_notify_lock_args *cbnl = key;
6288         struct nfs4_lock_waiter *waiter = wait->private;
6289         struct nfs_lowner       *lowner = &cbnl->cbnl_owner,
6290                                 *wowner = waiter->owner;
6291
6292         /* Only wake if the callback was for the same owner */
6293         if (lowner->clientid != wowner->clientid ||
6294             lowner->id != wowner->id             ||
6295             lowner->s_dev != wowner->s_dev)
6296                 return 0;
6297
6298         /* Make sure it's for the right inode */
6299         if (nfs_compare_fh(NFS_FH(waiter->inode), &cbnl->cbnl_fh))
6300                 return 0;
6301
6302         waiter->notified = true;
6303
6304         /* override "private" so we can use default_wake_function */
6305         wait->private = waiter->task;
6306         ret = autoremove_wake_function(wait, mode, flags, key);
6307         wait->private = waiter;
6308         return ret;
6309 }
6310
6311 static int
6312 nfs4_retry_setlk(struct nfs4_state *state, int cmd, struct file_lock *request)
6313 {
6314         int status = -ERESTARTSYS;
6315         unsigned long flags;
6316         struct nfs4_lock_state *lsp = request->fl_u.nfs4_fl.owner;
6317         struct nfs_server *server = NFS_SERVER(state->inode);
6318         struct nfs_client *clp = server->nfs_client;
6319         wait_queue_head_t *q = &clp->cl_lock_waitq;
6320         struct nfs_lowner owner = { .clientid = clp->cl_clientid,
6321                                     .id = lsp->ls_seqid.owner_id,
6322                                     .s_dev = server->s_dev };
6323         struct nfs4_lock_waiter waiter = { .task  = current,
6324                                            .inode = state->inode,
6325                                            .owner = &owner,
6326                                            .notified = false };
6327         wait_queue_t wait;
6328
6329         /* Don't bother with waitqueue if we don't expect a callback */
6330         if (!test_bit(NFS_STATE_MAY_NOTIFY_LOCK, &state->flags))
6331                 return nfs4_retry_setlk_simple(state, cmd, request);
6332
6333         init_wait(&wait);
6334         wait.private = &waiter;
6335         wait.func = nfs4_wake_lock_waiter;
6336         add_wait_queue(q, &wait);
6337
6338         while(!signalled()) {
6339                 status = nfs4_proc_setlk(state, cmd, request);
6340                 if ((status != -EAGAIN) || IS_SETLK(cmd))
6341                         break;
6342
6343                 status = -ERESTARTSYS;
6344                 spin_lock_irqsave(&q->lock, flags);
6345                 if (waiter.notified) {
6346                         spin_unlock_irqrestore(&q->lock, flags);
6347                         continue;
6348                 }
6349                 set_current_state(TASK_INTERRUPTIBLE);
6350                 spin_unlock_irqrestore(&q->lock, flags);
6351
6352                 freezable_schedule_timeout_interruptible(NFS4_LOCK_MAXTIMEOUT);
6353         }
6354
6355         finish_wait(q, &wait);
6356         return status;
6357 }
6358 #else /* !CONFIG_NFS_V4_1 */
6359 static inline int
6360 nfs4_retry_setlk(struct nfs4_state *state, int cmd, struct file_lock *request)
6361 {
6362         return nfs4_retry_setlk_simple(state, cmd, request);
6363 }
6364 #endif
6365
6366 static int
6367 nfs4_proc_lock(struct file *filp, int cmd, struct file_lock *request)
6368 {
6369         struct nfs_open_context *ctx;
6370         struct nfs4_state *state;
6371         int status;
6372
6373         /* verify open state */
6374         ctx = nfs_file_open_context(filp);
6375         state = ctx->state;
6376
6377         if (request->fl_start < 0 || request->fl_end < 0)
6378                 return -EINVAL;
6379
6380         if (IS_GETLK(cmd)) {
6381                 if (state != NULL)
6382                         return nfs4_proc_getlk(state, F_GETLK, request);
6383                 return 0;
6384         }
6385
6386         if (!(IS_SETLK(cmd) || IS_SETLKW(cmd)))
6387                 return -EINVAL;
6388
6389         if (request->fl_type == F_UNLCK) {
6390                 if (state != NULL)
6391                         return nfs4_proc_unlck(state, cmd, request);
6392                 return 0;
6393         }
6394
6395         if (state == NULL)
6396                 return -ENOLCK;
6397
6398         if ((request->fl_flags & FL_POSIX) &&
6399             !test_bit(NFS_STATE_POSIX_LOCKS, &state->flags))
6400                 return -ENOLCK;
6401
6402         /*
6403          * Don't rely on the VFS having checked the file open mode,
6404          * since it won't do this for flock() locks.
6405          */
6406         switch (request->fl_type) {
6407         case F_RDLCK:
6408                 if (!(filp->f_mode & FMODE_READ))
6409                         return -EBADF;
6410                 break;
6411         case F_WRLCK:
6412                 if (!(filp->f_mode & FMODE_WRITE))
6413                         return -EBADF;
6414         }
6415
6416         status = nfs4_set_lock_state(state, request);
6417         if (status != 0)
6418                 return status;
6419
6420         return nfs4_retry_setlk(state, cmd, request);
6421 }
6422
6423 int nfs4_lock_delegation_recall(struct file_lock *fl, struct nfs4_state *state, const nfs4_stateid *stateid)
6424 {
6425         struct nfs_server *server = NFS_SERVER(state->inode);
6426         int err;
6427
6428         err = nfs4_set_lock_state(state, fl);
6429         if (err != 0)
6430                 return err;
6431         err = _nfs4_do_setlk(state, F_SETLK, fl, NFS_LOCK_NEW);
6432         return nfs4_handle_delegation_recall_error(server, state, stateid, err);
6433 }
6434
6435 struct nfs_release_lockowner_data {
6436         struct nfs4_lock_state *lsp;
6437         struct nfs_server *server;
6438         struct nfs_release_lockowner_args args;
6439         struct nfs_release_lockowner_res res;
6440         unsigned long timestamp;
6441 };
6442
6443 static void nfs4_release_lockowner_prepare(struct rpc_task *task, void *calldata)
6444 {
6445         struct nfs_release_lockowner_data *data = calldata;
6446         struct nfs_server *server = data->server;
6447         nfs40_setup_sequence(server->nfs_client->cl_slot_tbl,
6448                              &data->args.seq_args, &data->res.seq_res, task);
6449         data->args.lock_owner.clientid = server->nfs_client->cl_clientid;
6450         data->timestamp = jiffies;
6451 }
6452
6453 static void nfs4_release_lockowner_done(struct rpc_task *task, void *calldata)
6454 {
6455         struct nfs_release_lockowner_data *data = calldata;
6456         struct nfs_server *server = data->server;
6457
6458         nfs40_sequence_done(task, &data->res.seq_res);
6459
6460         switch (task->tk_status) {
6461         case 0:
6462                 renew_lease(server, data->timestamp);
6463                 break;
6464         case -NFS4ERR_STALE_CLIENTID:
6465         case -NFS4ERR_EXPIRED:
6466                 nfs4_schedule_lease_recovery(server->nfs_client);
6467                 break;
6468         case -NFS4ERR_LEASE_MOVED:
6469         case -NFS4ERR_DELAY:
6470                 if (nfs4_async_handle_error(task, server,
6471                                             NULL, NULL) == -EAGAIN)
6472                         rpc_restart_call_prepare(task);
6473         }
6474 }
6475
6476 static void nfs4_release_lockowner_release(void *calldata)
6477 {
6478         struct nfs_release_lockowner_data *data = calldata;
6479         nfs4_free_lock_state(data->server, data->lsp);
6480         kfree(calldata);
6481 }
6482
6483 static const struct rpc_call_ops nfs4_release_lockowner_ops = {
6484         .rpc_call_prepare = nfs4_release_lockowner_prepare,
6485         .rpc_call_done = nfs4_release_lockowner_done,
6486         .rpc_release = nfs4_release_lockowner_release,
6487 };
6488
6489 static void
6490 nfs4_release_lockowner(struct nfs_server *server, struct nfs4_lock_state *lsp)
6491 {
6492         struct nfs_release_lockowner_data *data;
6493         struct rpc_message msg = {
6494                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_RELEASE_LOCKOWNER],
6495         };
6496
6497         if (server->nfs_client->cl_mvops->minor_version != 0)
6498                 return;
6499
6500         data = kmalloc(sizeof(*data), GFP_NOFS);
6501         if (!data)
6502                 return;
6503         data->lsp = lsp;
6504         data->server = server;
6505         data->args.lock_owner.clientid = server->nfs_client->cl_clientid;
6506         data->args.lock_owner.id = lsp->ls_seqid.owner_id;
6507         data->args.lock_owner.s_dev = server->s_dev;
6508
6509         msg.rpc_argp = &data->args;
6510         msg.rpc_resp = &data->res;
6511         nfs4_init_sequence(&data->args.seq_args, &data->res.seq_res, 0);
6512         rpc_call_async(server->client, &msg, 0, &nfs4_release_lockowner_ops, data);
6513 }
6514
6515 #define XATTR_NAME_NFSV4_ACL "system.nfs4_acl"
6516
6517 static int nfs4_xattr_set_nfs4_acl(const struct xattr_handler *handler,
6518                                    struct dentry *unused, struct inode *inode,
6519                                    const char *key, const void *buf,
6520                                    size_t buflen, int flags)
6521 {
6522         return nfs4_proc_set_acl(inode, buf, buflen);
6523 }
6524
6525 static int nfs4_xattr_get_nfs4_acl(const struct xattr_handler *handler,
6526                                    struct dentry *unused, struct inode *inode,
6527                                    const char *key, void *buf, size_t buflen)
6528 {
6529         return nfs4_proc_get_acl(inode, buf, buflen);
6530 }
6531
6532 static bool nfs4_xattr_list_nfs4_acl(struct dentry *dentry)
6533 {
6534         return nfs4_server_supports_acls(NFS_SERVER(d_inode(dentry)));
6535 }
6536
6537 #ifdef CONFIG_NFS_V4_SECURITY_LABEL
6538
6539 static int nfs4_xattr_set_nfs4_label(const struct xattr_handler *handler,
6540                                      struct dentry *unused, struct inode *inode,
6541                                      const char *key, const void *buf,
6542                                      size_t buflen, int flags)
6543 {
6544         if (security_ismaclabel(key))
6545                 return nfs4_set_security_label(inode, buf, buflen);
6546
6547         return -EOPNOTSUPP;
6548 }
6549
6550 static int nfs4_xattr_get_nfs4_label(const struct xattr_handler *handler,
6551                                      struct dentry *unused, struct inode *inode,
6552                                      const char *key, void *buf, size_t buflen)
6553 {
6554         if (security_ismaclabel(key))
6555                 return nfs4_get_security_label(inode, buf, buflen);
6556         return -EOPNOTSUPP;
6557 }
6558
6559 static ssize_t
6560 nfs4_listxattr_nfs4_label(struct inode *inode, char *list, size_t list_len)
6561 {
6562         int len = 0;
6563
6564         if (nfs_server_capable(inode, NFS_CAP_SECURITY_LABEL)) {
6565                 len = security_inode_listsecurity(inode, list, list_len);
6566                 if (list_len && len > list_len)
6567                         return -ERANGE;
6568         }
6569         return len;
6570 }
6571
6572 static const struct xattr_handler nfs4_xattr_nfs4_label_handler = {
6573         .prefix = XATTR_SECURITY_PREFIX,
6574         .get    = nfs4_xattr_get_nfs4_label,
6575         .set    = nfs4_xattr_set_nfs4_label,
6576 };
6577
6578 #else
6579
6580 static ssize_t
6581 nfs4_listxattr_nfs4_label(struct inode *inode, char *list, size_t list_len)
6582 {
6583         return 0;
6584 }
6585
6586 #endif
6587
6588 /*
6589  * nfs_fhget will use either the mounted_on_fileid or the fileid
6590  */
6591 static void nfs_fixup_referral_attributes(struct nfs_fattr *fattr)
6592 {
6593         if (!(((fattr->valid & NFS_ATTR_FATTR_MOUNTED_ON_FILEID) ||
6594                (fattr->valid & NFS_ATTR_FATTR_FILEID)) &&
6595               (fattr->valid & NFS_ATTR_FATTR_FSID) &&
6596               (fattr->valid & NFS_ATTR_FATTR_V4_LOCATIONS)))
6597                 return;
6598
6599         fattr->valid |= NFS_ATTR_FATTR_TYPE | NFS_ATTR_FATTR_MODE |
6600                 NFS_ATTR_FATTR_NLINK | NFS_ATTR_FATTR_V4_REFERRAL;
6601         fattr->mode = S_IFDIR | S_IRUGO | S_IXUGO;
6602         fattr->nlink = 2;
6603 }
6604
6605 static int _nfs4_proc_fs_locations(struct rpc_clnt *client, struct inode *dir,
6606                                    const struct qstr *name,
6607                                    struct nfs4_fs_locations *fs_locations,
6608                                    struct page *page)
6609 {
6610         struct nfs_server *server = NFS_SERVER(dir);
6611         u32 bitmask[3] = {
6612                 [0] = FATTR4_WORD0_FSID | FATTR4_WORD0_FS_LOCATIONS,
6613         };
6614         struct nfs4_fs_locations_arg args = {
6615                 .dir_fh = NFS_FH(dir),
6616                 .name = name,
6617                 .page = page,
6618                 .bitmask = bitmask,
6619         };
6620         struct nfs4_fs_locations_res res = {
6621                 .fs_locations = fs_locations,
6622         };
6623         struct rpc_message msg = {
6624                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_FS_LOCATIONS],
6625                 .rpc_argp = &args,
6626                 .rpc_resp = &res,
6627         };
6628         int status;
6629
6630         dprintk("%s: start\n", __func__);
6631
6632         /* Ask for the fileid of the absent filesystem if mounted_on_fileid
6633          * is not supported */
6634         if (NFS_SERVER(dir)->attr_bitmask[1] & FATTR4_WORD1_MOUNTED_ON_FILEID)
6635                 bitmask[1] |= FATTR4_WORD1_MOUNTED_ON_FILEID;
6636         else
6637                 bitmask[0] |= FATTR4_WORD0_FILEID;
6638
6639         nfs_fattr_init(&fs_locations->fattr);
6640         fs_locations->server = server;
6641         fs_locations->nlocations = 0;
6642         status = nfs4_call_sync(client, server, &msg, &args.seq_args, &res.seq_res, 0);
6643         dprintk("%s: returned status = %d\n", __func__, status);
6644         return status;
6645 }
6646
6647 int nfs4_proc_fs_locations(struct rpc_clnt *client, struct inode *dir,
6648                            const struct qstr *name,
6649                            struct nfs4_fs_locations *fs_locations,
6650                            struct page *page)
6651 {
6652         struct nfs4_exception exception = { };
6653         int err;
6654         do {
6655                 err = _nfs4_proc_fs_locations(client, dir, name,
6656                                 fs_locations, page);
6657                 trace_nfs4_get_fs_locations(dir, name, err);
6658                 err = nfs4_handle_exception(NFS_SERVER(dir), err,
6659                                 &exception);
6660         } while (exception.retry);
6661         return err;
6662 }
6663
6664 /*
6665  * This operation also signals the server that this client is
6666  * performing migration recovery.  The server can stop returning
6667  * NFS4ERR_LEASE_MOVED to this client.  A RENEW operation is
6668  * appended to this compound to identify the client ID which is
6669  * performing recovery.
6670  */
6671 static int _nfs40_proc_get_locations(struct inode *inode,
6672                                      struct nfs4_fs_locations *locations,
6673                                      struct page *page, struct rpc_cred *cred)
6674 {
6675         struct nfs_server *server = NFS_SERVER(inode);
6676         struct rpc_clnt *clnt = server->client;
6677         u32 bitmask[2] = {
6678                 [0] = FATTR4_WORD0_FSID | FATTR4_WORD0_FS_LOCATIONS,
6679         };
6680         struct nfs4_fs_locations_arg args = {
6681                 .clientid       = server->nfs_client->cl_clientid,
6682                 .fh             = NFS_FH(inode),
6683                 .page           = page,
6684                 .bitmask        = bitmask,
6685                 .migration      = 1,            /* skip LOOKUP */
6686                 .renew          = 1,            /* append RENEW */
6687         };
6688         struct nfs4_fs_locations_res res = {
6689                 .fs_locations   = locations,
6690                 .migration      = 1,
6691                 .renew          = 1,
6692         };
6693         struct rpc_message msg = {
6694                 .rpc_proc       = &nfs4_procedures[NFSPROC4_CLNT_FS_LOCATIONS],
6695                 .rpc_argp       = &args,
6696                 .rpc_resp       = &res,
6697                 .rpc_cred       = cred,
6698         };
6699         unsigned long now = jiffies;
6700         int status;
6701
6702         nfs_fattr_init(&locations->fattr);
6703         locations->server = server;
6704         locations->nlocations = 0;
6705
6706         nfs4_init_sequence(&args.seq_args, &res.seq_res, 0);
6707         nfs4_set_sequence_privileged(&args.seq_args);
6708         status = nfs4_call_sync_sequence(clnt, server, &msg,
6709                                         &args.seq_args, &res.seq_res);
6710         if (status)
6711                 return status;
6712
6713         renew_lease(server, now);
6714         return 0;
6715 }
6716
6717 #ifdef CONFIG_NFS_V4_1
6718
6719 /*
6720  * This operation also signals the server that this client is
6721  * performing migration recovery.  The server can stop asserting
6722  * SEQ4_STATUS_LEASE_MOVED for this client.  The client ID
6723  * performing this operation is identified in the SEQUENCE
6724  * operation in this compound.
6725  *
6726  * When the client supports GETATTR(fs_locations_info), it can
6727  * be plumbed in here.
6728  */
6729 static int _nfs41_proc_get_locations(struct inode *inode,
6730                                      struct nfs4_fs_locations *locations,
6731                                      struct page *page, struct rpc_cred *cred)
6732 {
6733         struct nfs_server *server = NFS_SERVER(inode);
6734         struct rpc_clnt *clnt = server->client;
6735         u32 bitmask[2] = {
6736                 [0] = FATTR4_WORD0_FSID | FATTR4_WORD0_FS_LOCATIONS,
6737         };
6738         struct nfs4_fs_locations_arg args = {
6739                 .fh             = NFS_FH(inode),
6740                 .page           = page,
6741                 .bitmask        = bitmask,
6742                 .migration      = 1,            /* skip LOOKUP */
6743         };
6744         struct nfs4_fs_locations_res res = {
6745                 .fs_locations   = locations,
6746                 .migration      = 1,
6747         };
6748         struct rpc_message msg = {
6749                 .rpc_proc       = &nfs4_procedures[NFSPROC4_CLNT_FS_LOCATIONS],
6750                 .rpc_argp       = &args,
6751                 .rpc_resp       = &res,
6752                 .rpc_cred       = cred,
6753         };
6754         int status;
6755
6756         nfs_fattr_init(&locations->fattr);
6757         locations->server = server;
6758         locations->nlocations = 0;
6759
6760         nfs4_init_sequence(&args.seq_args, &res.seq_res, 0);
6761         nfs4_set_sequence_privileged(&args.seq_args);
6762         status = nfs4_call_sync_sequence(clnt, server, &msg,
6763                                         &args.seq_args, &res.seq_res);
6764         if (status == NFS4_OK &&
6765             res.seq_res.sr_status_flags & SEQ4_STATUS_LEASE_MOVED)
6766                 status = -NFS4ERR_LEASE_MOVED;
6767         return status;
6768 }
6769
6770 #endif  /* CONFIG_NFS_V4_1 */
6771
6772 /**
6773  * nfs4_proc_get_locations - discover locations for a migrated FSID
6774  * @inode: inode on FSID that is migrating
6775  * @locations: result of query
6776  * @page: buffer
6777  * @cred: credential to use for this operation
6778  *
6779  * Returns NFS4_OK on success, a negative NFS4ERR status code if the
6780  * operation failed, or a negative errno if a local error occurred.
6781  *
6782  * On success, "locations" is filled in, but if the server has
6783  * no locations information, NFS_ATTR_FATTR_V4_LOCATIONS is not
6784  * asserted.
6785  *
6786  * -NFS4ERR_LEASE_MOVED is returned if the server still has leases
6787  * from this client that require migration recovery.
6788  */
6789 int nfs4_proc_get_locations(struct inode *inode,
6790                             struct nfs4_fs_locations *locations,
6791                             struct page *page, struct rpc_cred *cred)
6792 {
6793         struct nfs_server *server = NFS_SERVER(inode);
6794         struct nfs_client *clp = server->nfs_client;
6795         const struct nfs4_mig_recovery_ops *ops =
6796                                         clp->cl_mvops->mig_recovery_ops;
6797         struct nfs4_exception exception = { };
6798         int status;
6799
6800         dprintk("%s: FSID %llx:%llx on \"%s\"\n", __func__,
6801                 (unsigned long long)server->fsid.major,
6802                 (unsigned long long)server->fsid.minor,
6803                 clp->cl_hostname);
6804         nfs_display_fhandle(NFS_FH(inode), __func__);
6805
6806         do {
6807                 status = ops->get_locations(inode, locations, page, cred);
6808                 if (status != -NFS4ERR_DELAY)
6809                         break;
6810                 nfs4_handle_exception(server, status, &exception);
6811         } while (exception.retry);
6812         return status;
6813 }
6814
6815 /*
6816  * This operation also signals the server that this client is
6817  * performing "lease moved" recovery.  The server can stop
6818  * returning NFS4ERR_LEASE_MOVED to this client.  A RENEW operation
6819  * is appended to this compound to identify the client ID which is
6820  * performing recovery.
6821  */
6822 static int _nfs40_proc_fsid_present(struct inode *inode, struct rpc_cred *cred)
6823 {
6824         struct nfs_server *server = NFS_SERVER(inode);
6825         struct nfs_client *clp = NFS_SERVER(inode)->nfs_client;
6826         struct rpc_clnt *clnt = server->client;
6827         struct nfs4_fsid_present_arg args = {
6828                 .fh             = NFS_FH(inode),
6829                 .clientid       = clp->cl_clientid,
6830                 .renew          = 1,            /* append RENEW */
6831         };
6832         struct nfs4_fsid_present_res res = {
6833                 .renew          = 1,
6834         };
6835         struct rpc_message msg = {
6836                 .rpc_proc       = &nfs4_procedures[NFSPROC4_CLNT_FSID_PRESENT],
6837                 .rpc_argp       = &args,
6838                 .rpc_resp       = &res,
6839                 .rpc_cred       = cred,
6840         };
6841         unsigned long now = jiffies;
6842         int status;
6843
6844         res.fh = nfs_alloc_fhandle();
6845         if (res.fh == NULL)
6846                 return -ENOMEM;
6847
6848         nfs4_init_sequence(&args.seq_args, &res.seq_res, 0);
6849         nfs4_set_sequence_privileged(&args.seq_args);
6850         status = nfs4_call_sync_sequence(clnt, server, &msg,
6851                                                 &args.seq_args, &res.seq_res);
6852         nfs_free_fhandle(res.fh);
6853         if (status)
6854                 return status;
6855
6856         do_renew_lease(clp, now);
6857         return 0;
6858 }
6859
6860 #ifdef CONFIG_NFS_V4_1
6861
6862 /*
6863  * This operation also signals the server that this client is
6864  * performing "lease moved" recovery.  The server can stop asserting
6865  * SEQ4_STATUS_LEASE_MOVED for this client.  The client ID performing
6866  * this operation is identified in the SEQUENCE operation in this
6867  * compound.
6868  */
6869 static int _nfs41_proc_fsid_present(struct inode *inode, struct rpc_cred *cred)
6870 {
6871         struct nfs_server *server = NFS_SERVER(inode);
6872         struct rpc_clnt *clnt = server->client;
6873         struct nfs4_fsid_present_arg args = {
6874                 .fh             = NFS_FH(inode),
6875         };
6876         struct nfs4_fsid_present_res res = {
6877         };
6878         struct rpc_message msg = {
6879                 .rpc_proc       = &nfs4_procedures[NFSPROC4_CLNT_FSID_PRESENT],
6880                 .rpc_argp       = &args,
6881                 .rpc_resp       = &res,
6882                 .rpc_cred       = cred,
6883         };
6884         int status;
6885
6886         res.fh = nfs_alloc_fhandle();
6887         if (res.fh == NULL)
6888                 return -ENOMEM;
6889
6890         nfs4_init_sequence(&args.seq_args, &res.seq_res, 0);
6891         nfs4_set_sequence_privileged(&args.seq_args);
6892         status = nfs4_call_sync_sequence(clnt, server, &msg,
6893                                                 &args.seq_args, &res.seq_res);
6894         nfs_free_fhandle(res.fh);
6895         if (status == NFS4_OK &&
6896             res.seq_res.sr_status_flags & SEQ4_STATUS_LEASE_MOVED)
6897                 status = -NFS4ERR_LEASE_MOVED;
6898         return status;
6899 }
6900
6901 #endif  /* CONFIG_NFS_V4_1 */
6902
6903 /**
6904  * nfs4_proc_fsid_present - Is this FSID present or absent on server?
6905  * @inode: inode on FSID to check
6906  * @cred: credential to use for this operation
6907  *
6908  * Server indicates whether the FSID is present, moved, or not
6909  * recognized.  This operation is necessary to clear a LEASE_MOVED
6910  * condition for this client ID.
6911  *
6912  * Returns NFS4_OK if the FSID is present on this server,
6913  * -NFS4ERR_MOVED if the FSID is no longer present, a negative
6914  *  NFS4ERR code if some error occurred on the server, or a
6915  *  negative errno if a local failure occurred.
6916  */
6917 int nfs4_proc_fsid_present(struct inode *inode, struct rpc_cred *cred)
6918 {
6919         struct nfs_server *server = NFS_SERVER(inode);
6920         struct nfs_client *clp = server->nfs_client;
6921         const struct nfs4_mig_recovery_ops *ops =
6922                                         clp->cl_mvops->mig_recovery_ops;
6923         struct nfs4_exception exception = { };
6924         int status;
6925
6926         dprintk("%s: FSID %llx:%llx on \"%s\"\n", __func__,
6927                 (unsigned long long)server->fsid.major,
6928                 (unsigned long long)server->fsid.minor,
6929                 clp->cl_hostname);
6930         nfs_display_fhandle(NFS_FH(inode), __func__);
6931
6932         do {
6933                 status = ops->fsid_present(inode, cred);
6934                 if (status != -NFS4ERR_DELAY)
6935                         break;
6936                 nfs4_handle_exception(server, status, &exception);
6937         } while (exception.retry);
6938         return status;
6939 }
6940
6941 /**
6942  * If 'use_integrity' is true and the state managment nfs_client
6943  * cl_rpcclient is using krb5i/p, use the integrity protected cl_rpcclient
6944  * and the machine credential as per RFC3530bis and RFC5661 Security
6945  * Considerations sections. Otherwise, just use the user cred with the
6946  * filesystem's rpc_client.
6947  */
6948 static int _nfs4_proc_secinfo(struct inode *dir, const struct qstr *name, struct nfs4_secinfo_flavors *flavors, bool use_integrity)
6949 {
6950         int status;
6951         struct nfs4_secinfo_arg args = {
6952                 .dir_fh = NFS_FH(dir),
6953                 .name   = name,
6954         };
6955         struct nfs4_secinfo_res res = {
6956                 .flavors     = flavors,
6957         };
6958         struct rpc_message msg = {
6959                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SECINFO],
6960                 .rpc_argp = &args,
6961                 .rpc_resp = &res,
6962         };
6963         struct rpc_clnt *clnt = NFS_SERVER(dir)->client;
6964         struct rpc_cred *cred = NULL;
6965
6966         if (use_integrity) {
6967                 clnt = NFS_SERVER(dir)->nfs_client->cl_rpcclient;
6968                 cred = nfs4_get_clid_cred(NFS_SERVER(dir)->nfs_client);
6969                 msg.rpc_cred = cred;
6970         }
6971
6972         dprintk("NFS call  secinfo %s\n", name->name);
6973
6974         nfs4_state_protect(NFS_SERVER(dir)->nfs_client,
6975                 NFS_SP4_MACH_CRED_SECINFO, &clnt, &msg);
6976
6977         status = nfs4_call_sync(clnt, NFS_SERVER(dir), &msg, &args.seq_args,
6978                                 &res.seq_res, 0);
6979         dprintk("NFS reply  secinfo: %d\n", status);
6980
6981         if (cred)
6982                 put_rpccred(cred);
6983
6984         return status;
6985 }
6986
6987 int nfs4_proc_secinfo(struct inode *dir, const struct qstr *name,
6988                       struct nfs4_secinfo_flavors *flavors)
6989 {
6990         struct nfs4_exception exception = { };
6991         int err;
6992         do {
6993                 err = -NFS4ERR_WRONGSEC;
6994
6995                 /* try to use integrity protection with machine cred */
6996                 if (_nfs4_is_integrity_protected(NFS_SERVER(dir)->nfs_client))
6997                         err = _nfs4_proc_secinfo(dir, name, flavors, true);
6998
6999                 /*
7000                  * if unable to use integrity protection, or SECINFO with
7001                  * integrity protection returns NFS4ERR_WRONGSEC (which is
7002                  * disallowed by spec, but exists in deployed servers) use
7003                  * the current filesystem's rpc_client and the user cred.
7004                  */
7005                 if (err == -NFS4ERR_WRONGSEC)
7006                         err = _nfs4_proc_secinfo(dir, name, flavors, false);
7007
7008                 trace_nfs4_secinfo(dir, name, err);
7009                 err = nfs4_handle_exception(NFS_SERVER(dir), err,
7010                                 &exception);
7011         } while (exception.retry);
7012         return err;
7013 }
7014
7015 #ifdef CONFIG_NFS_V4_1
7016 /*
7017  * Check the exchange flags returned by the server for invalid flags, having
7018  * both PNFS and NON_PNFS flags set, and not having one of NON_PNFS, PNFS, or
7019  * DS flags set.
7020  */
7021 static int nfs4_check_cl_exchange_flags(u32 flags)
7022 {
7023         if (flags & ~EXCHGID4_FLAG_MASK_R)
7024                 goto out_inval;
7025         if ((flags & EXCHGID4_FLAG_USE_PNFS_MDS) &&
7026             (flags & EXCHGID4_FLAG_USE_NON_PNFS))
7027                 goto out_inval;
7028         if (!(flags & (EXCHGID4_FLAG_MASK_PNFS)))
7029                 goto out_inval;
7030         return NFS_OK;
7031 out_inval:
7032         return -NFS4ERR_INVAL;
7033 }
7034
7035 static bool
7036 nfs41_same_server_scope(struct nfs41_server_scope *a,
7037                         struct nfs41_server_scope *b)
7038 {
7039         if (a->server_scope_sz == b->server_scope_sz &&
7040             memcmp(a->server_scope, b->server_scope, a->server_scope_sz) == 0)
7041                 return true;
7042
7043         return false;
7044 }
7045
7046 static void
7047 nfs4_bind_one_conn_to_session_done(struct rpc_task *task, void *calldata)
7048 {
7049 }
7050
7051 static const struct rpc_call_ops nfs4_bind_one_conn_to_session_ops = {
7052         .rpc_call_done =  &nfs4_bind_one_conn_to_session_done,
7053 };
7054
7055 /*
7056  * nfs4_proc_bind_one_conn_to_session()
7057  *
7058  * The 4.1 client currently uses the same TCP connection for the
7059  * fore and backchannel.
7060  */
7061 static
7062 int nfs4_proc_bind_one_conn_to_session(struct rpc_clnt *clnt,
7063                 struct rpc_xprt *xprt,
7064                 struct nfs_client *clp,
7065                 struct rpc_cred *cred)
7066 {
7067         int status;
7068         struct nfs41_bind_conn_to_session_args args = {
7069                 .client = clp,
7070                 .dir = NFS4_CDFC4_FORE_OR_BOTH,
7071         };
7072         struct nfs41_bind_conn_to_session_res res;
7073         struct rpc_message msg = {
7074                 .rpc_proc =
7075                         &nfs4_procedures[NFSPROC4_CLNT_BIND_CONN_TO_SESSION],
7076                 .rpc_argp = &args,
7077                 .rpc_resp = &res,
7078                 .rpc_cred = cred,
7079         };
7080         struct rpc_task_setup task_setup_data = {
7081                 .rpc_client = clnt,
7082                 .rpc_xprt = xprt,
7083                 .callback_ops = &nfs4_bind_one_conn_to_session_ops,
7084                 .rpc_message = &msg,
7085                 .flags = RPC_TASK_TIMEOUT,
7086         };
7087         struct rpc_task *task;
7088
7089         dprintk("--> %s\n", __func__);
7090
7091         nfs4_copy_sessionid(&args.sessionid, &clp->cl_session->sess_id);
7092         if (!(clp->cl_session->flags & SESSION4_BACK_CHAN))
7093                 args.dir = NFS4_CDFC4_FORE;
7094
7095         /* Do not set the backchannel flag unless this is clnt->cl_xprt */
7096         if (xprt != rcu_access_pointer(clnt->cl_xprt))
7097                 args.dir = NFS4_CDFC4_FORE;
7098
7099         task = rpc_run_task(&task_setup_data);
7100         if (!IS_ERR(task)) {
7101                 status = task->tk_status;
7102                 rpc_put_task(task);
7103         } else
7104                 status = PTR_ERR(task);
7105         trace_nfs4_bind_conn_to_session(clp, status);
7106         if (status == 0) {
7107                 if (memcmp(res.sessionid.data,
7108                     clp->cl_session->sess_id.data, NFS4_MAX_SESSIONID_LEN)) {
7109                         dprintk("NFS: %s: Session ID mismatch\n", __func__);
7110                         status = -EIO;
7111                         goto out;
7112                 }
7113                 if ((res.dir & args.dir) != res.dir || res.dir == 0) {
7114                         dprintk("NFS: %s: Unexpected direction from server\n",
7115                                 __func__);
7116                         status = -EIO;
7117                         goto out;
7118                 }
7119                 if (res.use_conn_in_rdma_mode != args.use_conn_in_rdma_mode) {
7120                         dprintk("NFS: %s: Server returned RDMA mode = true\n",
7121                                 __func__);
7122                         status = -EIO;
7123                         goto out;
7124                 }
7125         }
7126 out:
7127         dprintk("<-- %s status= %d\n", __func__, status);
7128         return status;
7129 }
7130
7131 struct rpc_bind_conn_calldata {
7132         struct nfs_client *clp;
7133         struct rpc_cred *cred;
7134 };
7135
7136 static int
7137 nfs4_proc_bind_conn_to_session_callback(struct rpc_clnt *clnt,
7138                 struct rpc_xprt *xprt,
7139                 void *calldata)
7140 {
7141         struct rpc_bind_conn_calldata *p = calldata;
7142
7143         return nfs4_proc_bind_one_conn_to_session(clnt, xprt, p->clp, p->cred);
7144 }
7145
7146 int nfs4_proc_bind_conn_to_session(struct nfs_client *clp, struct rpc_cred *cred)
7147 {
7148         struct rpc_bind_conn_calldata data = {
7149                 .clp = clp,
7150                 .cred = cred,
7151         };
7152         return rpc_clnt_iterate_for_each_xprt(clp->cl_rpcclient,
7153                         nfs4_proc_bind_conn_to_session_callback, &data);
7154 }
7155
7156 /*
7157  * Minimum set of SP4_MACH_CRED operations from RFC 5661 in the enforce map
7158  * and operations we'd like to see to enable certain features in the allow map
7159  */
7160 static const struct nfs41_state_protection nfs4_sp4_mach_cred_request = {
7161         .how = SP4_MACH_CRED,
7162         .enforce.u.words = {
7163                 [1] = 1 << (OP_BIND_CONN_TO_SESSION - 32) |
7164                       1 << (OP_EXCHANGE_ID - 32) |
7165                       1 << (OP_CREATE_SESSION - 32) |
7166                       1 << (OP_DESTROY_SESSION - 32) |
7167                       1 << (OP_DESTROY_CLIENTID - 32)
7168         },
7169         .allow.u.words = {
7170                 [0] = 1 << (OP_CLOSE) |
7171                       1 << (OP_OPEN_DOWNGRADE) |
7172                       1 << (OP_LOCKU) |
7173                       1 << (OP_DELEGRETURN) |
7174                       1 << (OP_COMMIT),
7175                 [1] = 1 << (OP_SECINFO - 32) |
7176                       1 << (OP_SECINFO_NO_NAME - 32) |
7177                       1 << (OP_LAYOUTRETURN - 32) |
7178                       1 << (OP_TEST_STATEID - 32) |
7179                       1 << (OP_FREE_STATEID - 32) |
7180                       1 << (OP_WRITE - 32)
7181         }
7182 };
7183
7184 /*
7185  * Select the state protection mode for client `clp' given the server results
7186  * from exchange_id in `sp'.
7187  *
7188  * Returns 0 on success, negative errno otherwise.
7189  */
7190 static int nfs4_sp4_select_mode(struct nfs_client *clp,
7191                                  struct nfs41_state_protection *sp)
7192 {
7193         static const u32 supported_enforce[NFS4_OP_MAP_NUM_WORDS] = {
7194                 [1] = 1 << (OP_BIND_CONN_TO_SESSION - 32) |
7195                       1 << (OP_EXCHANGE_ID - 32) |
7196                       1 << (OP_CREATE_SESSION - 32) |
7197                       1 << (OP_DESTROY_SESSION - 32) |
7198                       1 << (OP_DESTROY_CLIENTID - 32)
7199         };
7200         unsigned int i;
7201
7202         if (sp->how == SP4_MACH_CRED) {
7203                 /* Print state protect result */
7204                 dfprintk(MOUNT, "Server SP4_MACH_CRED support:\n");
7205                 for (i = 0; i <= LAST_NFS4_OP; i++) {
7206                         if (test_bit(i, sp->enforce.u.longs))
7207                                 dfprintk(MOUNT, "  enforce op %d\n", i);
7208                         if (test_bit(i, sp->allow.u.longs))
7209                                 dfprintk(MOUNT, "  allow op %d\n", i);
7210                 }
7211
7212                 /* make sure nothing is on enforce list that isn't supported */
7213                 for (i = 0; i < NFS4_OP_MAP_NUM_WORDS; i++) {
7214                         if (sp->enforce.u.words[i] & ~supported_enforce[i]) {
7215                                 dfprintk(MOUNT, "sp4_mach_cred: disabled\n");
7216                                 return -EINVAL;
7217                         }
7218                 }
7219
7220                 /*
7221                  * Minimal mode - state operations are allowed to use machine
7222                  * credential.  Note this already happens by default, so the
7223                  * client doesn't have to do anything more than the negotiation.
7224                  *
7225                  * NOTE: we don't care if EXCHANGE_ID is in the list -
7226                  *       we're already using the machine cred for exchange_id
7227                  *       and will never use a different cred.
7228                  */
7229                 if (test_bit(OP_BIND_CONN_TO_SESSION, sp->enforce.u.longs) &&
7230                     test_bit(OP_CREATE_SESSION, sp->enforce.u.longs) &&
7231                     test_bit(OP_DESTROY_SESSION, sp->enforce.u.longs) &&
7232                     test_bit(OP_DESTROY_CLIENTID, sp->enforce.u.longs)) {
7233                         dfprintk(MOUNT, "sp4_mach_cred:\n");
7234                         dfprintk(MOUNT, "  minimal mode enabled\n");
7235                         set_bit(NFS_SP4_MACH_CRED_MINIMAL, &clp->cl_sp4_flags);
7236                 } else {
7237                         dfprintk(MOUNT, "sp4_mach_cred: disabled\n");
7238                         return -EINVAL;
7239                 }
7240
7241                 if (test_bit(OP_CLOSE, sp->allow.u.longs) &&
7242                     test_bit(OP_OPEN_DOWNGRADE, sp->allow.u.longs) &&
7243                     test_bit(OP_DELEGRETURN, sp->allow.u.longs) &&
7244                     test_bit(OP_LOCKU, sp->allow.u.longs)) {
7245                         dfprintk(MOUNT, "  cleanup mode enabled\n");
7246                         set_bit(NFS_SP4_MACH_CRED_CLEANUP, &clp->cl_sp4_flags);
7247                 }
7248
7249                 if (test_bit(OP_LAYOUTRETURN, sp->allow.u.longs)) {
7250                         dfprintk(MOUNT, "  pnfs cleanup mode enabled\n");
7251                         set_bit(NFS_SP4_MACH_CRED_PNFS_CLEANUP,
7252                                 &clp->cl_sp4_flags);
7253                 }
7254
7255                 if (test_bit(OP_SECINFO, sp->allow.u.longs) &&
7256                     test_bit(OP_SECINFO_NO_NAME, sp->allow.u.longs)) {
7257                         dfprintk(MOUNT, "  secinfo mode enabled\n");
7258                         set_bit(NFS_SP4_MACH_CRED_SECINFO, &clp->cl_sp4_flags);
7259                 }
7260
7261                 if (test_bit(OP_TEST_STATEID, sp->allow.u.longs) &&
7262                     test_bit(OP_FREE_STATEID, sp->allow.u.longs)) {
7263                         dfprintk(MOUNT, "  stateid mode enabled\n");
7264                         set_bit(NFS_SP4_MACH_CRED_STATEID, &clp->cl_sp4_flags);
7265                 }
7266
7267                 if (test_bit(OP_WRITE, sp->allow.u.longs)) {
7268                         dfprintk(MOUNT, "  write mode enabled\n");
7269                         set_bit(NFS_SP4_MACH_CRED_WRITE, &clp->cl_sp4_flags);
7270                 }
7271
7272                 if (test_bit(OP_COMMIT, sp->allow.u.longs)) {
7273                         dfprintk(MOUNT, "  commit mode enabled\n");
7274                         set_bit(NFS_SP4_MACH_CRED_COMMIT, &clp->cl_sp4_flags);
7275                 }
7276         }
7277
7278         return 0;
7279 }
7280
7281 struct nfs41_exchange_id_data {
7282         struct nfs41_exchange_id_res res;
7283         struct nfs41_exchange_id_args args;
7284         struct rpc_xprt *xprt;
7285         int rpc_status;
7286 };
7287
7288 static void nfs4_exchange_id_done(struct rpc_task *task, void *data)
7289 {
7290         struct nfs41_exchange_id_data *cdata =
7291                                         (struct nfs41_exchange_id_data *)data;
7292         struct nfs_client *clp = cdata->args.client;
7293         int status = task->tk_status;
7294
7295         trace_nfs4_exchange_id(clp, status);
7296
7297         if (status == 0)
7298                 status = nfs4_check_cl_exchange_flags(cdata->res.flags);
7299
7300         if (cdata->xprt && status == 0) {
7301                 status = nfs4_detect_session_trunking(clp, &cdata->res,
7302                                                       cdata->xprt);
7303                 goto out;
7304         }
7305
7306         if (status  == 0)
7307                 status = nfs4_sp4_select_mode(clp, &cdata->res.state_protect);
7308
7309         if (status == 0) {
7310                 clp->cl_clientid = cdata->res.clientid;
7311                 clp->cl_exchange_flags = cdata->res.flags;
7312                 /* Client ID is not confirmed */
7313                 if (!(cdata->res.flags & EXCHGID4_FLAG_CONFIRMED_R)) {
7314                         clear_bit(NFS4_SESSION_ESTABLISHED,
7315                         &clp->cl_session->session_state);
7316                         clp->cl_seqid = cdata->res.seqid;
7317                 }
7318
7319                 kfree(clp->cl_serverowner);
7320                 clp->cl_serverowner = cdata->res.server_owner;
7321                 cdata->res.server_owner = NULL;
7322
7323                 /* use the most recent implementation id */
7324                 kfree(clp->cl_implid);
7325                 clp->cl_implid = cdata->res.impl_id;
7326                 cdata->res.impl_id = NULL;
7327
7328                 if (clp->cl_serverscope != NULL &&
7329                     !nfs41_same_server_scope(clp->cl_serverscope,
7330                                         cdata->res.server_scope)) {
7331                         dprintk("%s: server_scope mismatch detected\n",
7332                                 __func__);
7333                         set_bit(NFS4CLNT_SERVER_SCOPE_MISMATCH, &clp->cl_state);
7334                         kfree(clp->cl_serverscope);
7335                         clp->cl_serverscope = NULL;
7336                 }
7337
7338                 if (clp->cl_serverscope == NULL) {
7339                         clp->cl_serverscope = cdata->res.server_scope;
7340                         cdata->res.server_scope = NULL;
7341                 }
7342                 /* Save the EXCHANGE_ID verifier session trunk tests */
7343                 memcpy(clp->cl_confirm.data, cdata->args.verifier->data,
7344                        sizeof(clp->cl_confirm.data));
7345         }
7346 out:
7347         cdata->rpc_status = status;
7348         return;
7349 }
7350
7351 static void nfs4_exchange_id_release(void *data)
7352 {
7353         struct nfs41_exchange_id_data *cdata =
7354                                         (struct nfs41_exchange_id_data *)data;
7355
7356         nfs_put_client(cdata->args.client);
7357         if (cdata->xprt) {
7358                 xprt_put(cdata->xprt);
7359                 rpc_clnt_xprt_switch_put(cdata->args.client->cl_rpcclient);
7360         }
7361         kfree(cdata->res.impl_id);
7362         kfree(cdata->res.server_scope);
7363         kfree(cdata->res.server_owner);
7364         kfree(cdata);
7365 }
7366
7367 static const struct rpc_call_ops nfs4_exchange_id_call_ops = {
7368         .rpc_call_done = nfs4_exchange_id_done,
7369         .rpc_release = nfs4_exchange_id_release,
7370 };
7371
7372 /*
7373  * _nfs4_proc_exchange_id()
7374  *
7375  * Wrapper for EXCHANGE_ID operation.
7376  */
7377 static int _nfs4_proc_exchange_id(struct nfs_client *clp, struct rpc_cred *cred,
7378                         u32 sp4_how, struct rpc_xprt *xprt)
7379 {
7380         nfs4_verifier verifier;
7381         struct rpc_message msg = {
7382                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_EXCHANGE_ID],
7383                 .rpc_cred = cred,
7384         };
7385         struct rpc_task_setup task_setup_data = {
7386                 .rpc_client = clp->cl_rpcclient,
7387                 .callback_ops = &nfs4_exchange_id_call_ops,
7388                 .rpc_message = &msg,
7389                 .flags = RPC_TASK_ASYNC | RPC_TASK_TIMEOUT,
7390         };
7391         struct nfs41_exchange_id_data *calldata;
7392         struct rpc_task *task;
7393         int status = -EIO;
7394
7395         if (!atomic_inc_not_zero(&clp->cl_count))
7396                 goto out;
7397
7398         status = -ENOMEM;
7399         calldata = kzalloc(sizeof(*calldata), GFP_NOFS);
7400         if (!calldata)
7401                 goto out;
7402
7403         if (!xprt)
7404                 nfs4_init_boot_verifier(clp, &verifier);
7405
7406         status = nfs4_init_uniform_client_string(clp);
7407         if (status)
7408                 goto out_calldata;
7409
7410         dprintk("NFS call  exchange_id auth=%s, '%s'\n",
7411                 clp->cl_rpcclient->cl_auth->au_ops->au_name,
7412                 clp->cl_owner_id);
7413
7414         calldata->res.server_owner = kzalloc(sizeof(struct nfs41_server_owner),
7415                                                 GFP_NOFS);
7416         status = -ENOMEM;
7417         if (unlikely(calldata->res.server_owner == NULL))
7418                 goto out_calldata;
7419
7420         calldata->res.server_scope = kzalloc(sizeof(struct nfs41_server_scope),
7421                                         GFP_NOFS);
7422         if (unlikely(calldata->res.server_scope == NULL))
7423                 goto out_server_owner;
7424
7425         calldata->res.impl_id = kzalloc(sizeof(struct nfs41_impl_id), GFP_NOFS);
7426         if (unlikely(calldata->res.impl_id == NULL))
7427                 goto out_server_scope;
7428
7429         switch (sp4_how) {
7430         case SP4_NONE:
7431                 calldata->args.state_protect.how = SP4_NONE;
7432                 break;
7433
7434         case SP4_MACH_CRED:
7435                 calldata->args.state_protect = nfs4_sp4_mach_cred_request;
7436                 break;
7437
7438         default:
7439                 /* unsupported! */
7440                 WARN_ON_ONCE(1);
7441                 status = -EINVAL;
7442                 goto out_impl_id;
7443         }
7444         if (xprt) {
7445                 calldata->xprt = xprt;
7446                 task_setup_data.rpc_xprt = xprt;
7447                 task_setup_data.flags =
7448                                 RPC_TASK_SOFT|RPC_TASK_SOFTCONN|RPC_TASK_ASYNC;
7449                 calldata->args.verifier = &clp->cl_confirm;
7450         } else {
7451                 calldata->args.verifier = &verifier;
7452         }
7453         calldata->args.client = clp;
7454 #ifdef CONFIG_NFS_V4_1_MIGRATION
7455         calldata->args.flags = EXCHGID4_FLAG_SUPP_MOVED_REFER |
7456         EXCHGID4_FLAG_BIND_PRINC_STATEID |
7457         EXCHGID4_FLAG_SUPP_MOVED_MIGR,
7458 #else
7459         calldata->args.flags = EXCHGID4_FLAG_SUPP_MOVED_REFER |
7460         EXCHGID4_FLAG_BIND_PRINC_STATEID,
7461 #endif
7462         msg.rpc_argp = &calldata->args;
7463         msg.rpc_resp = &calldata->res;
7464         task_setup_data.callback_data = calldata;
7465
7466         task = rpc_run_task(&task_setup_data);
7467         if (IS_ERR(task)) {
7468         status = PTR_ERR(task);
7469                 goto out_impl_id;
7470         }
7471
7472         if (!xprt) {
7473                 status = rpc_wait_for_completion_task(task);
7474                 if (!status)
7475                         status = calldata->rpc_status;
7476         } else  /* session trunking test */
7477                 status = calldata->rpc_status;
7478
7479         rpc_put_task(task);
7480 out:
7481         if (clp->cl_implid != NULL)
7482                 dprintk("NFS reply exchange_id: Server Implementation ID: "
7483                         "domain: %s, name: %s, date: %llu,%u\n",
7484                         clp->cl_implid->domain, clp->cl_implid->name,
7485                         clp->cl_implid->date.seconds,
7486                         clp->cl_implid->date.nseconds);
7487         dprintk("NFS reply exchange_id: %d\n", status);
7488         return status;
7489
7490 out_impl_id:
7491         kfree(calldata->res.impl_id);
7492 out_server_scope:
7493         kfree(calldata->res.server_scope);
7494 out_server_owner:
7495         kfree(calldata->res.server_owner);
7496 out_calldata:
7497         kfree(calldata);
7498         goto out;
7499 }
7500
7501 /*
7502  * nfs4_proc_exchange_id()
7503  *
7504  * Returns zero, a negative errno, or a negative NFS4ERR status code.
7505  *
7506  * Since the clientid has expired, all compounds using sessions
7507  * associated with the stale clientid will be returning
7508  * NFS4ERR_BADSESSION in the sequence operation, and will therefore
7509  * be in some phase of session reset.
7510  *
7511  * Will attempt to negotiate SP4_MACH_CRED if krb5i / krb5p auth is used.
7512  */
7513 int nfs4_proc_exchange_id(struct nfs_client *clp, struct rpc_cred *cred)
7514 {
7515         rpc_authflavor_t authflavor = clp->cl_rpcclient->cl_auth->au_flavor;
7516         int status;
7517
7518         /* try SP4_MACH_CRED if krb5i/p */
7519         if (authflavor == RPC_AUTH_GSS_KRB5I ||
7520             authflavor == RPC_AUTH_GSS_KRB5P) {
7521                 status = _nfs4_proc_exchange_id(clp, cred, SP4_MACH_CRED, NULL);
7522                 if (!status)
7523                         return 0;
7524         }
7525
7526         /* try SP4_NONE */
7527         return _nfs4_proc_exchange_id(clp, cred, SP4_NONE, NULL);
7528 }
7529
7530 /**
7531  * nfs4_test_session_trunk
7532  *
7533  * This is an add_xprt_test() test function called from
7534  * rpc_clnt_setup_test_and_add_xprt.
7535  *
7536  * The rpc_xprt_switch is referrenced by rpc_clnt_setup_test_and_add_xprt
7537  * and is dereferrenced in nfs4_exchange_id_release
7538  *
7539  * Upon success, add the new transport to the rpc_clnt
7540  *
7541  * @clnt: struct rpc_clnt to get new transport
7542  * @xprt: the rpc_xprt to test
7543  * @data: call data for _nfs4_proc_exchange_id.
7544  */
7545 int nfs4_test_session_trunk(struct rpc_clnt *clnt, struct rpc_xprt *xprt,
7546                             void *data)
7547 {
7548         struct nfs4_add_xprt_data *adata = (struct nfs4_add_xprt_data *)data;
7549         u32 sp4_how;
7550
7551         dprintk("--> %s try %s\n", __func__,
7552                 xprt->address_strings[RPC_DISPLAY_ADDR]);
7553
7554         sp4_how = (adata->clp->cl_sp4_flags == 0 ? SP4_NONE : SP4_MACH_CRED);
7555
7556         /* Test connection for session trunking. Async exchange_id call */
7557         return  _nfs4_proc_exchange_id(adata->clp, adata->cred, sp4_how, xprt);
7558 }
7559 EXPORT_SYMBOL_GPL(nfs4_test_session_trunk);
7560
7561 static int _nfs4_proc_destroy_clientid(struct nfs_client *clp,
7562                 struct rpc_cred *cred)
7563 {
7564         struct rpc_message msg = {
7565                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_DESTROY_CLIENTID],
7566                 .rpc_argp = clp,
7567                 .rpc_cred = cred,
7568         };
7569         int status;
7570
7571         status = rpc_call_sync(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
7572         trace_nfs4_destroy_clientid(clp, status);
7573         if (status)
7574                 dprintk("NFS: Got error %d from the server %s on "
7575                         "DESTROY_CLIENTID.", status, clp->cl_hostname);
7576         return status;
7577 }
7578
7579 static int nfs4_proc_destroy_clientid(struct nfs_client *clp,
7580                 struct rpc_cred *cred)
7581 {
7582         unsigned int loop;
7583         int ret;
7584
7585         for (loop = NFS4_MAX_LOOP_ON_RECOVER; loop != 0; loop--) {
7586                 ret = _nfs4_proc_destroy_clientid(clp, cred);
7587                 switch (ret) {
7588                 case -NFS4ERR_DELAY:
7589                 case -NFS4ERR_CLIENTID_BUSY:
7590                         ssleep(1);
7591                         break;
7592                 default:
7593                         return ret;
7594                 }
7595         }
7596         return 0;
7597 }
7598
7599 int nfs4_destroy_clientid(struct nfs_client *clp)
7600 {
7601         struct rpc_cred *cred;
7602         int ret = 0;
7603
7604         if (clp->cl_mvops->minor_version < 1)
7605                 goto out;
7606         if (clp->cl_exchange_flags == 0)
7607                 goto out;
7608         if (clp->cl_preserve_clid)
7609                 goto out;
7610         cred = nfs4_get_clid_cred(clp);
7611         ret = nfs4_proc_destroy_clientid(clp, cred);
7612         if (cred)
7613                 put_rpccred(cred);
7614         switch (ret) {
7615         case 0:
7616         case -NFS4ERR_STALE_CLIENTID:
7617                 clp->cl_exchange_flags = 0;
7618         }
7619 out:
7620         return ret;
7621 }
7622
7623 struct nfs4_get_lease_time_data {
7624         struct nfs4_get_lease_time_args *args;
7625         struct nfs4_get_lease_time_res *res;
7626         struct nfs_client *clp;
7627 };
7628
7629 static void nfs4_get_lease_time_prepare(struct rpc_task *task,
7630                                         void *calldata)
7631 {
7632         struct nfs4_get_lease_time_data *data =
7633                         (struct nfs4_get_lease_time_data *)calldata;
7634
7635         dprintk("--> %s\n", __func__);
7636         /* just setup sequence, do not trigger session recovery
7637            since we're invoked within one */
7638         nfs41_setup_sequence(data->clp->cl_session,
7639                         &data->args->la_seq_args,
7640                         &data->res->lr_seq_res,
7641                         task);
7642         dprintk("<-- %s\n", __func__);
7643 }
7644
7645 /*
7646  * Called from nfs4_state_manager thread for session setup, so don't recover
7647  * from sequence operation or clientid errors.
7648  */
7649 static void nfs4_get_lease_time_done(struct rpc_task *task, void *calldata)
7650 {
7651         struct nfs4_get_lease_time_data *data =
7652                         (struct nfs4_get_lease_time_data *)calldata;
7653
7654         dprintk("--> %s\n", __func__);
7655         if (!nfs41_sequence_done(task, &data->res->lr_seq_res))
7656                 return;
7657         switch (task->tk_status) {
7658         case -NFS4ERR_DELAY:
7659         case -NFS4ERR_GRACE:
7660                 dprintk("%s Retry: tk_status %d\n", __func__, task->tk_status);
7661                 rpc_delay(task, NFS4_POLL_RETRY_MIN);
7662                 task->tk_status = 0;
7663                 /* fall through */
7664         case -NFS4ERR_RETRY_UNCACHED_REP:
7665                 rpc_restart_call_prepare(task);
7666                 return;
7667         }
7668         dprintk("<-- %s\n", __func__);
7669 }
7670
7671 static const struct rpc_call_ops nfs4_get_lease_time_ops = {
7672         .rpc_call_prepare = nfs4_get_lease_time_prepare,
7673         .rpc_call_done = nfs4_get_lease_time_done,
7674 };
7675
7676 int nfs4_proc_get_lease_time(struct nfs_client *clp, struct nfs_fsinfo *fsinfo)
7677 {
7678         struct rpc_task *task;
7679         struct nfs4_get_lease_time_args args;
7680         struct nfs4_get_lease_time_res res = {
7681                 .lr_fsinfo = fsinfo,
7682         };
7683         struct nfs4_get_lease_time_data data = {
7684                 .args = &args,
7685                 .res = &res,
7686                 .clp = clp,
7687         };
7688         struct rpc_message msg = {
7689                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_GET_LEASE_TIME],
7690                 .rpc_argp = &args,
7691                 .rpc_resp = &res,
7692         };
7693         struct rpc_task_setup task_setup = {
7694                 .rpc_client = clp->cl_rpcclient,
7695                 .rpc_message = &msg,
7696                 .callback_ops = &nfs4_get_lease_time_ops,
7697                 .callback_data = &data,
7698                 .flags = RPC_TASK_TIMEOUT,
7699         };
7700         int status;
7701
7702         nfs4_init_sequence(&args.la_seq_args, &res.lr_seq_res, 0);
7703         nfs4_set_sequence_privileged(&args.la_seq_args);
7704         dprintk("--> %s\n", __func__);
7705         task = rpc_run_task(&task_setup);
7706
7707         if (IS_ERR(task))
7708                 status = PTR_ERR(task);
7709         else {
7710                 status = task->tk_status;
7711                 rpc_put_task(task);
7712         }
7713         dprintk("<-- %s return %d\n", __func__, status);
7714
7715         return status;
7716 }
7717
7718 /*
7719  * Initialize the values to be used by the client in CREATE_SESSION
7720  * If nfs4_init_session set the fore channel request and response sizes,
7721  * use them.
7722  *
7723  * Set the back channel max_resp_sz_cached to zero to force the client to
7724  * always set csa_cachethis to FALSE because the current implementation
7725  * of the back channel DRC only supports caching the CB_SEQUENCE operation.
7726  */
7727 static void nfs4_init_channel_attrs(struct nfs41_create_session_args *args,
7728                                     struct rpc_clnt *clnt)
7729 {
7730         unsigned int max_rqst_sz, max_resp_sz;
7731         unsigned int max_bc_payload = rpc_max_bc_payload(clnt);
7732
7733         max_rqst_sz = NFS_MAX_FILE_IO_SIZE + nfs41_maxwrite_overhead;
7734         max_resp_sz = NFS_MAX_FILE_IO_SIZE + nfs41_maxread_overhead;
7735
7736         /* Fore channel attributes */
7737         args->fc_attrs.max_rqst_sz = max_rqst_sz;
7738         args->fc_attrs.max_resp_sz = max_resp_sz;
7739         args->fc_attrs.max_ops = NFS4_MAX_OPS;
7740         args->fc_attrs.max_reqs = max_session_slots;
7741
7742         dprintk("%s: Fore Channel : max_rqst_sz=%u max_resp_sz=%u "
7743                 "max_ops=%u max_reqs=%u\n",
7744                 __func__,
7745                 args->fc_attrs.max_rqst_sz, args->fc_attrs.max_resp_sz,
7746                 args->fc_attrs.max_ops, args->fc_attrs.max_reqs);
7747
7748         /* Back channel attributes */
7749         args->bc_attrs.max_rqst_sz = max_bc_payload;
7750         args->bc_attrs.max_resp_sz = max_bc_payload;
7751         args->bc_attrs.max_resp_sz_cached = 0;
7752         args->bc_attrs.max_ops = NFS4_MAX_BACK_CHANNEL_OPS;
7753         args->bc_attrs.max_reqs = min_t(unsigned short, max_session_cb_slots, 1);
7754
7755         dprintk("%s: Back Channel : max_rqst_sz=%u max_resp_sz=%u "
7756                 "max_resp_sz_cached=%u max_ops=%u max_reqs=%u\n",
7757                 __func__,
7758                 args->bc_attrs.max_rqst_sz, args->bc_attrs.max_resp_sz,
7759                 args->bc_attrs.max_resp_sz_cached, args->bc_attrs.max_ops,
7760                 args->bc_attrs.max_reqs);
7761 }
7762
7763 static int nfs4_verify_fore_channel_attrs(struct nfs41_create_session_args *args,
7764                 struct nfs41_create_session_res *res)
7765 {
7766         struct nfs4_channel_attrs *sent = &args->fc_attrs;
7767         struct nfs4_channel_attrs *rcvd = &res->fc_attrs;
7768
7769         if (rcvd->max_resp_sz > sent->max_resp_sz)
7770                 return -EINVAL;
7771         /*
7772          * Our requested max_ops is the minimum we need; we're not
7773          * prepared to break up compounds into smaller pieces than that.
7774          * So, no point even trying to continue if the server won't
7775          * cooperate:
7776          */
7777         if (rcvd->max_ops < sent->max_ops)
7778                 return -EINVAL;
7779         if (rcvd->max_reqs == 0)
7780                 return -EINVAL;
7781         if (rcvd->max_reqs > NFS4_MAX_SLOT_TABLE)
7782                 rcvd->max_reqs = NFS4_MAX_SLOT_TABLE;
7783         return 0;
7784 }
7785
7786 static int nfs4_verify_back_channel_attrs(struct nfs41_create_session_args *args,
7787                 struct nfs41_create_session_res *res)
7788 {
7789         struct nfs4_channel_attrs *sent = &args->bc_attrs;
7790         struct nfs4_channel_attrs *rcvd = &res->bc_attrs;
7791
7792         if (!(res->flags & SESSION4_BACK_CHAN))
7793                 goto out;
7794         if (rcvd->max_rqst_sz > sent->max_rqst_sz)
7795                 return -EINVAL;
7796         if (rcvd->max_resp_sz < sent->max_resp_sz)
7797                 return -EINVAL;
7798         if (rcvd->max_resp_sz_cached > sent->max_resp_sz_cached)
7799                 return -EINVAL;
7800         if (rcvd->max_ops > sent->max_ops)
7801                 return -EINVAL;
7802         if (rcvd->max_reqs > sent->max_reqs)
7803                 return -EINVAL;
7804 out:
7805         return 0;
7806 }
7807
7808 static int nfs4_verify_channel_attrs(struct nfs41_create_session_args *args,
7809                                      struct nfs41_create_session_res *res)
7810 {
7811         int ret;
7812
7813         ret = nfs4_verify_fore_channel_attrs(args, res);
7814         if (ret)
7815                 return ret;
7816         return nfs4_verify_back_channel_attrs(args, res);
7817 }
7818
7819 static void nfs4_update_session(struct nfs4_session *session,
7820                 struct nfs41_create_session_res *res)
7821 {
7822         nfs4_copy_sessionid(&session->sess_id, &res->sessionid);
7823         /* Mark client id and session as being confirmed */
7824         session->clp->cl_exchange_flags |= EXCHGID4_FLAG_CONFIRMED_R;
7825         set_bit(NFS4_SESSION_ESTABLISHED, &session->session_state);
7826         session->flags = res->flags;
7827         memcpy(&session->fc_attrs, &res->fc_attrs, sizeof(session->fc_attrs));
7828         if (res->flags & SESSION4_BACK_CHAN)
7829                 memcpy(&session->bc_attrs, &res->bc_attrs,
7830                                 sizeof(session->bc_attrs));
7831 }
7832
7833 static int _nfs4_proc_create_session(struct nfs_client *clp,
7834                 struct rpc_cred *cred)
7835 {
7836         struct nfs4_session *session = clp->cl_session;
7837         struct nfs41_create_session_args args = {
7838                 .client = clp,
7839                 .clientid = clp->cl_clientid,
7840                 .seqid = clp->cl_seqid,
7841                 .cb_program = NFS4_CALLBACK,
7842         };
7843         struct nfs41_create_session_res res;
7844
7845         struct rpc_message msg = {
7846                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_CREATE_SESSION],
7847                 .rpc_argp = &args,
7848                 .rpc_resp = &res,
7849                 .rpc_cred = cred,
7850         };
7851         int status;
7852
7853         nfs4_init_channel_attrs(&args, clp->cl_rpcclient);
7854         args.flags = (SESSION4_PERSIST | SESSION4_BACK_CHAN);
7855
7856         status = rpc_call_sync(session->clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
7857         trace_nfs4_create_session(clp, status);
7858
7859         switch (status) {
7860         case -NFS4ERR_STALE_CLIENTID:
7861         case -NFS4ERR_DELAY:
7862         case -ETIMEDOUT:
7863         case -EACCES:
7864         case -EAGAIN:
7865                 goto out;
7866         };
7867
7868         clp->cl_seqid++;
7869         if (!status) {
7870                 /* Verify the session's negotiated channel_attrs values */
7871                 status = nfs4_verify_channel_attrs(&args, &res);
7872                 /* Increment the clientid slot sequence id */
7873                 if (status)
7874                         goto out;
7875                 nfs4_update_session(session, &res);
7876         }
7877 out:
7878         return status;
7879 }
7880
7881 /*
7882  * Issues a CREATE_SESSION operation to the server.
7883  * It is the responsibility of the caller to verify the session is
7884  * expired before calling this routine.
7885  */
7886 int nfs4_proc_create_session(struct nfs_client *clp, struct rpc_cred *cred)
7887 {
7888         int status;
7889         unsigned *ptr;
7890         struct nfs4_session *session = clp->cl_session;
7891
7892         dprintk("--> %s clp=%p session=%p\n", __func__, clp, session);
7893
7894         status = _nfs4_proc_create_session(clp, cred);
7895         if (status)
7896                 goto out;
7897
7898         /* Init or reset the session slot tables */
7899         status = nfs4_setup_session_slot_tables(session);
7900         dprintk("slot table setup returned %d\n", status);
7901         if (status)
7902                 goto out;
7903
7904         ptr = (unsigned *)&session->sess_id.data[0];
7905         dprintk("%s client>seqid %d sessionid %u:%u:%u:%u\n", __func__,
7906                 clp->cl_seqid, ptr[0], ptr[1], ptr[2], ptr[3]);
7907 out:
7908         dprintk("<-- %s\n", __func__);
7909         return status;
7910 }
7911
7912 /*
7913  * Issue the over-the-wire RPC DESTROY_SESSION.
7914  * The caller must serialize access to this routine.
7915  */
7916 int nfs4_proc_destroy_session(struct nfs4_session *session,
7917                 struct rpc_cred *cred)
7918 {
7919         struct rpc_message msg = {
7920                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_DESTROY_SESSION],
7921                 .rpc_argp = session,
7922                 .rpc_cred = cred,
7923         };
7924         int status = 0;
7925
7926         dprintk("--> nfs4_proc_destroy_session\n");
7927
7928         /* session is still being setup */
7929         if (!test_and_clear_bit(NFS4_SESSION_ESTABLISHED, &session->session_state))
7930                 return 0;
7931
7932         status = rpc_call_sync(session->clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
7933         trace_nfs4_destroy_session(session->clp, status);
7934
7935         if (status)
7936                 dprintk("NFS: Got error %d from the server on DESTROY_SESSION. "
7937                         "Session has been destroyed regardless...\n", status);
7938
7939         dprintk("<-- nfs4_proc_destroy_session\n");
7940         return status;
7941 }
7942
7943 /*
7944  * Renew the cl_session lease.
7945  */
7946 struct nfs4_sequence_data {
7947         struct nfs_client *clp;
7948         struct nfs4_sequence_args args;
7949         struct nfs4_sequence_res res;
7950 };
7951
7952 static void nfs41_sequence_release(void *data)
7953 {
7954         struct nfs4_sequence_data *calldata = data;
7955         struct nfs_client *clp = calldata->clp;
7956
7957         if (atomic_read(&clp->cl_count) > 1)
7958                 nfs4_schedule_state_renewal(clp);
7959         nfs_put_client(clp);
7960         kfree(calldata);
7961 }
7962
7963 static int nfs41_sequence_handle_errors(struct rpc_task *task, struct nfs_client *clp)
7964 {
7965         switch(task->tk_status) {
7966         case -NFS4ERR_DELAY:
7967                 rpc_delay(task, NFS4_POLL_RETRY_MAX);
7968                 return -EAGAIN;
7969         default:
7970                 nfs4_schedule_lease_recovery(clp);
7971         }
7972         return 0;
7973 }
7974
7975 static void nfs41_sequence_call_done(struct rpc_task *task, void *data)
7976 {
7977         struct nfs4_sequence_data *calldata = data;
7978         struct nfs_client *clp = calldata->clp;
7979
7980         if (!nfs41_sequence_done(task, task->tk_msg.rpc_resp))
7981                 return;
7982
7983         trace_nfs4_sequence(clp, task->tk_status);
7984         if (task->tk_status < 0) {
7985                 dprintk("%s ERROR %d\n", __func__, task->tk_status);
7986                 if (atomic_read(&clp->cl_count) == 1)
7987                         goto out;
7988
7989                 if (nfs41_sequence_handle_errors(task, clp) == -EAGAIN) {
7990                         rpc_restart_call_prepare(task);
7991                         return;
7992                 }
7993         }
7994         dprintk("%s rpc_cred %p\n", __func__, task->tk_msg.rpc_cred);
7995 out:
7996         dprintk("<-- %s\n", __func__);
7997 }
7998
7999 static void nfs41_sequence_prepare(struct rpc_task *task, void *data)
8000 {
8001         struct nfs4_sequence_data *calldata = data;
8002         struct nfs_client *clp = calldata->clp;
8003         struct nfs4_sequence_args *args;
8004         struct nfs4_sequence_res *res;
8005
8006         args = task->tk_msg.rpc_argp;
8007         res = task->tk_msg.rpc_resp;
8008
8009         nfs41_setup_sequence(clp->cl_session, args, res, task);
8010 }
8011
8012 static const struct rpc_call_ops nfs41_sequence_ops = {
8013         .rpc_call_done = nfs41_sequence_call_done,
8014         .rpc_call_prepare = nfs41_sequence_prepare,
8015         .rpc_release = nfs41_sequence_release,
8016 };
8017
8018 static struct rpc_task *_nfs41_proc_sequence(struct nfs_client *clp,
8019                 struct rpc_cred *cred,
8020                 bool is_privileged)
8021 {
8022         struct nfs4_sequence_data *calldata;
8023         struct rpc_message msg = {
8024                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SEQUENCE],
8025                 .rpc_cred = cred,
8026         };
8027         struct rpc_task_setup task_setup_data = {
8028                 .rpc_client = clp->cl_rpcclient,
8029                 .rpc_message = &msg,
8030                 .callback_ops = &nfs41_sequence_ops,
8031                 .flags = RPC_TASK_ASYNC | RPC_TASK_TIMEOUT,
8032         };
8033
8034         if (!atomic_inc_not_zero(&clp->cl_count))
8035                 return ERR_PTR(-EIO);
8036         calldata = kzalloc(sizeof(*calldata), GFP_NOFS);
8037         if (calldata == NULL) {
8038                 nfs_put_client(clp);
8039                 return ERR_PTR(-ENOMEM);
8040         }
8041         nfs4_init_sequence(&calldata->args, &calldata->res, 0);
8042         if (is_privileged)
8043                 nfs4_set_sequence_privileged(&calldata->args);
8044         msg.rpc_argp = &calldata->args;
8045         msg.rpc_resp = &calldata->res;
8046         calldata->clp = clp;
8047         task_setup_data.callback_data = calldata;
8048
8049         return rpc_run_task(&task_setup_data);
8050 }
8051
8052 static int nfs41_proc_async_sequence(struct nfs_client *clp, struct rpc_cred *cred, unsigned renew_flags)
8053 {
8054         struct rpc_task *task;
8055         int ret = 0;
8056
8057         if ((renew_flags & NFS4_RENEW_TIMEOUT) == 0)
8058                 return -EAGAIN;
8059         task = _nfs41_proc_sequence(clp, cred, false);
8060         if (IS_ERR(task))
8061                 ret = PTR_ERR(task);
8062         else
8063                 rpc_put_task_async(task);
8064         dprintk("<-- %s status=%d\n", __func__, ret);
8065         return ret;
8066 }
8067
8068 static int nfs4_proc_sequence(struct nfs_client *clp, struct rpc_cred *cred)
8069 {
8070         struct rpc_task *task;
8071         int ret;
8072
8073         task = _nfs41_proc_sequence(clp, cred, true);
8074         if (IS_ERR(task)) {
8075                 ret = PTR_ERR(task);
8076                 goto out;
8077         }
8078         ret = rpc_wait_for_completion_task(task);
8079         if (!ret)
8080                 ret = task->tk_status;
8081         rpc_put_task(task);
8082 out:
8083         dprintk("<-- %s status=%d\n", __func__, ret);
8084         return ret;
8085 }
8086
8087 struct nfs4_reclaim_complete_data {
8088         struct nfs_client *clp;
8089         struct nfs41_reclaim_complete_args arg;
8090         struct nfs41_reclaim_complete_res res;
8091 };
8092
8093 static void nfs4_reclaim_complete_prepare(struct rpc_task *task, void *data)
8094 {
8095         struct nfs4_reclaim_complete_data *calldata = data;
8096
8097         nfs41_setup_sequence(calldata->clp->cl_session,
8098                         &calldata->arg.seq_args,
8099                         &calldata->res.seq_res,
8100                         task);
8101 }
8102
8103 static int nfs41_reclaim_complete_handle_errors(struct rpc_task *task, struct nfs_client *clp)
8104 {
8105         switch(task->tk_status) {
8106         case 0:
8107         case -NFS4ERR_COMPLETE_ALREADY:
8108         case -NFS4ERR_WRONG_CRED: /* What to do here? */
8109                 break;
8110         case -NFS4ERR_DELAY:
8111                 rpc_delay(task, NFS4_POLL_RETRY_MAX);
8112                 /* fall through */
8113         case -NFS4ERR_RETRY_UNCACHED_REP:
8114                 return -EAGAIN;
8115         default:
8116                 nfs4_schedule_lease_recovery(clp);
8117         }
8118         return 0;
8119 }
8120
8121 static void nfs4_reclaim_complete_done(struct rpc_task *task, void *data)
8122 {
8123         struct nfs4_reclaim_complete_data *calldata = data;
8124         struct nfs_client *clp = calldata->clp;
8125         struct nfs4_sequence_res *res = &calldata->res.seq_res;
8126
8127         dprintk("--> %s\n", __func__);
8128         if (!nfs41_sequence_done(task, res))
8129                 return;
8130
8131         trace_nfs4_reclaim_complete(clp, task->tk_status);
8132         if (nfs41_reclaim_complete_handle_errors(task, clp) == -EAGAIN) {
8133                 rpc_restart_call_prepare(task);
8134                 return;
8135         }
8136         dprintk("<-- %s\n", __func__);
8137 }
8138
8139 static void nfs4_free_reclaim_complete_data(void *data)
8140 {
8141         struct nfs4_reclaim_complete_data *calldata = data;
8142
8143         kfree(calldata);
8144 }
8145
8146 static const struct rpc_call_ops nfs4_reclaim_complete_call_ops = {
8147         .rpc_call_prepare = nfs4_reclaim_complete_prepare,
8148         .rpc_call_done = nfs4_reclaim_complete_done,
8149         .rpc_release = nfs4_free_reclaim_complete_data,
8150 };
8151
8152 /*
8153  * Issue a global reclaim complete.
8154  */
8155 static int nfs41_proc_reclaim_complete(struct nfs_client *clp,
8156                 struct rpc_cred *cred)
8157 {
8158         struct nfs4_reclaim_complete_data *calldata;
8159         struct rpc_task *task;
8160         struct rpc_message msg = {
8161                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_RECLAIM_COMPLETE],
8162                 .rpc_cred = cred,
8163         };
8164         struct rpc_task_setup task_setup_data = {
8165                 .rpc_client = clp->cl_rpcclient,
8166                 .rpc_message = &msg,
8167                 .callback_ops = &nfs4_reclaim_complete_call_ops,
8168                 .flags = RPC_TASK_ASYNC,
8169         };
8170         int status = -ENOMEM;
8171
8172         dprintk("--> %s\n", __func__);
8173         calldata = kzalloc(sizeof(*calldata), GFP_NOFS);
8174         if (calldata == NULL)
8175                 goto out;
8176         calldata->clp = clp;
8177         calldata->arg.one_fs = 0;
8178
8179         nfs4_init_sequence(&calldata->arg.seq_args, &calldata->res.seq_res, 0);
8180         nfs4_set_sequence_privileged(&calldata->arg.seq_args);
8181         msg.rpc_argp = &calldata->arg;
8182         msg.rpc_resp = &calldata->res;
8183         task_setup_data.callback_data = calldata;
8184         task = rpc_run_task(&task_setup_data);
8185         if (IS_ERR(task)) {
8186                 status = PTR_ERR(task);
8187                 goto out;
8188         }
8189         status = nfs4_wait_for_completion_rpc_task(task);
8190         if (status == 0)
8191                 status = task->tk_status;
8192         rpc_put_task(task);
8193         return 0;
8194 out:
8195         dprintk("<-- %s status=%d\n", __func__, status);
8196         return status;
8197 }
8198
8199 static void
8200 nfs4_layoutget_prepare(struct rpc_task *task, void *calldata)
8201 {
8202         struct nfs4_layoutget *lgp = calldata;
8203         struct nfs_server *server = NFS_SERVER(lgp->args.inode);
8204         struct nfs4_session *session = nfs4_get_session(server);
8205
8206         dprintk("--> %s\n", __func__);
8207         nfs41_setup_sequence(session, &lgp->args.seq_args,
8208                                 &lgp->res.seq_res, task);
8209         dprintk("<-- %s\n", __func__);
8210 }
8211
8212 static void nfs4_layoutget_done(struct rpc_task *task, void *calldata)
8213 {
8214         struct nfs4_layoutget *lgp = calldata;
8215
8216         dprintk("--> %s\n", __func__);
8217         nfs41_sequence_process(task, &lgp->res.seq_res);
8218         dprintk("<-- %s\n", __func__);
8219 }
8220
8221 static int
8222 nfs4_layoutget_handle_exception(struct rpc_task *task,
8223                 struct nfs4_layoutget *lgp, struct nfs4_exception *exception)
8224 {
8225         struct inode *inode = lgp->args.inode;
8226         struct nfs_server *server = NFS_SERVER(inode);
8227         struct pnfs_layout_hdr *lo;
8228         int nfs4err = task->tk_status;
8229         int err, status = 0;
8230         LIST_HEAD(head);
8231
8232         dprintk("--> %s tk_status => %d\n", __func__, -task->tk_status);
8233
8234         switch (nfs4err) {
8235         case 0:
8236                 goto out;
8237
8238         /*
8239          * NFS4ERR_LAYOUTUNAVAILABLE means we are not supposed to use pnfs
8240          * on the file. set tk_status to -ENODATA to tell upper layer to
8241          * retry go inband.
8242          */
8243         case -NFS4ERR_LAYOUTUNAVAILABLE:
8244                 status = -ENODATA;
8245                 goto out;
8246         /*
8247          * NFS4ERR_BADLAYOUT means the MDS cannot return a layout of
8248          * length lgp->args.minlength != 0 (see RFC5661 section 18.43.3).
8249          */
8250         case -NFS4ERR_BADLAYOUT:
8251                 status = -EOVERFLOW;
8252                 goto out;
8253         /*
8254          * NFS4ERR_LAYOUTTRYLATER is a conflict with another client
8255          * (or clients) writing to the same RAID stripe except when
8256          * the minlength argument is 0 (see RFC5661 section 18.43.3).
8257          *
8258          * Treat it like we would RECALLCONFLICT -- we retry for a little
8259          * while, and then eventually give up.
8260          */
8261         case -NFS4ERR_LAYOUTTRYLATER:
8262                 if (lgp->args.minlength == 0) {
8263                         status = -EOVERFLOW;
8264                         goto out;
8265                 }
8266                 status = -EBUSY;
8267                 break;
8268         case -NFS4ERR_RECALLCONFLICT:
8269                 status = -ERECALLCONFLICT;
8270                 break;
8271         case -NFS4ERR_EXPIRED:
8272         case -NFS4ERR_BAD_STATEID:
8273                 exception->timeout = 0;
8274                 spin_lock(&inode->i_lock);
8275                 lo = NFS_I(inode)->layout;
8276                 /* If the open stateid was bad, then recover it. */
8277                 if (!lo || test_bit(NFS_LAYOUT_INVALID_STID, &lo->plh_flags) ||
8278                     nfs4_stateid_match_other(&lgp->args.stateid,
8279                                         &lgp->args.ctx->state->stateid)) {
8280                         spin_unlock(&inode->i_lock);
8281                         exception->state = lgp->args.ctx->state;
8282                         break;
8283                 }
8284
8285                 /*
8286                  * Mark the bad layout state as invalid, then retry
8287                  */
8288                 pnfs_mark_layout_stateid_invalid(lo, &head);
8289                 spin_unlock(&inode->i_lock);
8290                 pnfs_free_lseg_list(&head);
8291                 status = -EAGAIN;
8292                 goto out;
8293         }
8294
8295         err = nfs4_handle_exception(server, nfs4err, exception);
8296         if (!status) {
8297                 if (exception->retry)
8298                         status = -EAGAIN;
8299                 else
8300                         status = err;
8301         }
8302 out:
8303         dprintk("<-- %s\n", __func__);
8304         return status;
8305 }
8306
8307 static size_t max_response_pages(struct nfs_server *server)
8308 {
8309         u32 max_resp_sz = server->nfs_client->cl_session->fc_attrs.max_resp_sz;
8310         return nfs_page_array_len(0, max_resp_sz);
8311 }
8312
8313 static void nfs4_free_pages(struct page **pages, size_t size)
8314 {
8315         int i;
8316
8317         if (!pages)
8318                 return;
8319
8320         for (i = 0; i < size; i++) {
8321                 if (!pages[i])
8322                         break;
8323                 __free_page(pages[i]);
8324         }
8325         kfree(pages);
8326 }
8327
8328 static struct page **nfs4_alloc_pages(size_t size, gfp_t gfp_flags)
8329 {
8330         struct page **pages;
8331         int i;
8332
8333         pages = kcalloc(size, sizeof(struct page *), gfp_flags);
8334         if (!pages) {
8335                 dprintk("%s: can't alloc array of %zu pages\n", __func__, size);
8336                 return NULL;
8337         }
8338
8339         for (i = 0; i < size; i++) {
8340                 pages[i] = alloc_page(gfp_flags);
8341                 if (!pages[i]) {
8342                         dprintk("%s: failed to allocate page\n", __func__);
8343                         nfs4_free_pages(pages, size);
8344                         return NULL;
8345                 }
8346         }
8347
8348         return pages;
8349 }
8350
8351 static void nfs4_layoutget_release(void *calldata)
8352 {
8353         struct nfs4_layoutget *lgp = calldata;
8354         struct inode *inode = lgp->args.inode;
8355         struct nfs_server *server = NFS_SERVER(inode);
8356         size_t max_pages = max_response_pages(server);
8357
8358         dprintk("--> %s\n", __func__);
8359         nfs4_free_pages(lgp->args.layout.pages, max_pages);
8360         pnfs_put_layout_hdr(NFS_I(inode)->layout);
8361         put_nfs_open_context(lgp->args.ctx);
8362         kfree(calldata);
8363         dprintk("<-- %s\n", __func__);
8364 }
8365
8366 static const struct rpc_call_ops nfs4_layoutget_call_ops = {
8367         .rpc_call_prepare = nfs4_layoutget_prepare,
8368         .rpc_call_done = nfs4_layoutget_done,
8369         .rpc_release = nfs4_layoutget_release,
8370 };
8371
8372 struct pnfs_layout_segment *
8373 nfs4_proc_layoutget(struct nfs4_layoutget *lgp, long *timeout, gfp_t gfp_flags)
8374 {
8375         struct inode *inode = lgp->args.inode;
8376         struct nfs_server *server = NFS_SERVER(inode);
8377         size_t max_pages = max_response_pages(server);
8378         struct rpc_task *task;
8379         struct rpc_message msg = {
8380                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LAYOUTGET],
8381                 .rpc_argp = &lgp->args,
8382                 .rpc_resp = &lgp->res,
8383                 .rpc_cred = lgp->cred,
8384         };
8385         struct rpc_task_setup task_setup_data = {
8386                 .rpc_client = server->client,
8387                 .rpc_message = &msg,
8388                 .callback_ops = &nfs4_layoutget_call_ops,
8389                 .callback_data = lgp,
8390                 .flags = RPC_TASK_ASYNC,
8391         };
8392         struct pnfs_layout_segment *lseg = NULL;
8393         struct nfs4_exception exception = {
8394                 .inode = inode,
8395                 .timeout = *timeout,
8396         };
8397         int status = 0;
8398
8399         dprintk("--> %s\n", __func__);
8400
8401         /* nfs4_layoutget_release calls pnfs_put_layout_hdr */
8402         pnfs_get_layout_hdr(NFS_I(inode)->layout);
8403
8404         lgp->args.layout.pages = nfs4_alloc_pages(max_pages, gfp_flags);
8405         if (!lgp->args.layout.pages) {
8406                 nfs4_layoutget_release(lgp);
8407                 return ERR_PTR(-ENOMEM);
8408         }
8409         lgp->args.layout.pglen = max_pages * PAGE_SIZE;
8410
8411         lgp->res.layoutp = &lgp->args.layout;
8412         lgp->res.seq_res.sr_slot = NULL;
8413         nfs4_init_sequence(&lgp->args.seq_args, &lgp->res.seq_res, 0);
8414
8415         task = rpc_run_task(&task_setup_data);
8416         if (IS_ERR(task))
8417                 return ERR_CAST(task);
8418         status = nfs4_wait_for_completion_rpc_task(task);
8419         if (status == 0) {
8420                 status = nfs4_layoutget_handle_exception(task, lgp, &exception);
8421                 *timeout = exception.timeout;
8422         }
8423
8424         trace_nfs4_layoutget(lgp->args.ctx,
8425                         &lgp->args.range,
8426                         &lgp->res.range,
8427                         &lgp->res.stateid,
8428                         status);
8429
8430         /* if layoutp->len is 0, nfs4_layoutget_prepare called rpc_exit */
8431         if (status == 0 && lgp->res.layoutp->len)
8432                 lseg = pnfs_layout_process(lgp);
8433         nfs4_sequence_free_slot(&lgp->res.seq_res);
8434         rpc_put_task(task);
8435         dprintk("<-- %s status=%d\n", __func__, status);
8436         if (status)
8437                 return ERR_PTR(status);
8438         return lseg;
8439 }
8440
8441 static void
8442 nfs4_layoutreturn_prepare(struct rpc_task *task, void *calldata)
8443 {
8444         struct nfs4_layoutreturn *lrp = calldata;
8445
8446         dprintk("--> %s\n", __func__);
8447         nfs41_setup_sequence(lrp->clp->cl_session,
8448                         &lrp->args.seq_args,
8449                         &lrp->res.seq_res,
8450                         task);
8451 }
8452
8453 static void nfs4_layoutreturn_done(struct rpc_task *task, void *calldata)
8454 {
8455         struct nfs4_layoutreturn *lrp = calldata;
8456         struct nfs_server *server;
8457
8458         dprintk("--> %s\n", __func__);
8459
8460         if (!nfs41_sequence_process(task, &lrp->res.seq_res))
8461                 return;
8462
8463         server = NFS_SERVER(lrp->args.inode);
8464         switch (task->tk_status) {
8465         default:
8466                 task->tk_status = 0;
8467         case 0:
8468                 break;
8469         case -NFS4ERR_DELAY:
8470                 if (nfs4_async_handle_error(task, server, NULL, NULL) != -EAGAIN)
8471                         break;
8472                 nfs4_sequence_free_slot(&lrp->res.seq_res);
8473                 rpc_restart_call_prepare(task);
8474                 return;
8475         }
8476         dprintk("<-- %s\n", __func__);
8477 }
8478
8479 static void nfs4_layoutreturn_release(void *calldata)
8480 {
8481         struct nfs4_layoutreturn *lrp = calldata;
8482         struct pnfs_layout_hdr *lo = lrp->args.layout;
8483         LIST_HEAD(freeme);
8484
8485         dprintk("--> %s\n", __func__);
8486         spin_lock(&lo->plh_inode->i_lock);
8487         if (lrp->res.lrs_present) {
8488                 pnfs_mark_matching_lsegs_invalid(lo, &freeme,
8489                                 &lrp->args.range,
8490                                 be32_to_cpu(lrp->args.stateid.seqid));
8491                 pnfs_set_layout_stateid(lo, &lrp->res.stateid, true);
8492         } else
8493                 pnfs_mark_layout_stateid_invalid(lo, &freeme);
8494         pnfs_clear_layoutreturn_waitbit(lo);
8495         spin_unlock(&lo->plh_inode->i_lock);
8496         nfs4_sequence_free_slot(&lrp->res.seq_res);
8497         pnfs_free_lseg_list(&freeme);
8498         pnfs_put_layout_hdr(lrp->args.layout);
8499         nfs_iput_and_deactive(lrp->inode);
8500         kfree(calldata);
8501         dprintk("<-- %s\n", __func__);
8502 }
8503
8504 static const struct rpc_call_ops nfs4_layoutreturn_call_ops = {
8505         .rpc_call_prepare = nfs4_layoutreturn_prepare,
8506         .rpc_call_done = nfs4_layoutreturn_done,
8507         .rpc_release = nfs4_layoutreturn_release,
8508 };
8509
8510 int nfs4_proc_layoutreturn(struct nfs4_layoutreturn *lrp, bool sync)
8511 {
8512         struct rpc_task *task;
8513         struct rpc_message msg = {
8514                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LAYOUTRETURN],
8515                 .rpc_argp = &lrp->args,
8516                 .rpc_resp = &lrp->res,
8517                 .rpc_cred = lrp->cred,
8518         };
8519         struct rpc_task_setup task_setup_data = {
8520                 .rpc_client = NFS_SERVER(lrp->args.inode)->client,
8521                 .rpc_message = &msg,
8522                 .callback_ops = &nfs4_layoutreturn_call_ops,
8523                 .callback_data = lrp,
8524         };
8525         int status = 0;
8526
8527         nfs4_state_protect(NFS_SERVER(lrp->args.inode)->nfs_client,
8528                         NFS_SP4_MACH_CRED_PNFS_CLEANUP,
8529                         &task_setup_data.rpc_client, &msg);
8530
8531         dprintk("--> %s\n", __func__);
8532         if (!sync) {
8533                 lrp->inode = nfs_igrab_and_active(lrp->args.inode);
8534                 if (!lrp->inode) {
8535                         nfs4_layoutreturn_release(lrp);
8536                         return -EAGAIN;
8537                 }
8538                 task_setup_data.flags |= RPC_TASK_ASYNC;
8539         }
8540         nfs4_init_sequence(&lrp->args.seq_args, &lrp->res.seq_res, 1);
8541         task = rpc_run_task(&task_setup_data);
8542         if (IS_ERR(task))
8543                 return PTR_ERR(task);
8544         if (sync)
8545                 status = task->tk_status;
8546         trace_nfs4_layoutreturn(lrp->args.inode, &lrp->args.stateid, status);
8547         dprintk("<-- %s status=%d\n", __func__, status);
8548         rpc_put_task(task);
8549         return status;
8550 }
8551
8552 static int
8553 _nfs4_proc_getdeviceinfo(struct nfs_server *server,
8554                 struct pnfs_device *pdev,
8555                 struct rpc_cred *cred)
8556 {
8557         struct nfs4_getdeviceinfo_args args = {
8558                 .pdev = pdev,
8559                 .notify_types = NOTIFY_DEVICEID4_CHANGE |
8560                         NOTIFY_DEVICEID4_DELETE,
8561         };
8562         struct nfs4_getdeviceinfo_res res = {
8563                 .pdev = pdev,
8564         };
8565         struct rpc_message msg = {
8566                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_GETDEVICEINFO],
8567                 .rpc_argp = &args,
8568                 .rpc_resp = &res,
8569                 .rpc_cred = cred,
8570         };
8571         int status;
8572
8573         dprintk("--> %s\n", __func__);
8574         status = nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
8575         if (res.notification & ~args.notify_types)
8576                 dprintk("%s: unsupported notification\n", __func__);
8577         if (res.notification != args.notify_types)
8578                 pdev->nocache = 1;
8579
8580         dprintk("<-- %s status=%d\n", __func__, status);
8581
8582         return status;
8583 }
8584
8585 int nfs4_proc_getdeviceinfo(struct nfs_server *server,
8586                 struct pnfs_device *pdev,
8587                 struct rpc_cred *cred)
8588 {
8589         struct nfs4_exception exception = { };
8590         int err;
8591
8592         do {
8593                 err = nfs4_handle_exception(server,
8594                                         _nfs4_proc_getdeviceinfo(server, pdev, cred),
8595                                         &exception);
8596         } while (exception.retry);
8597         return err;
8598 }
8599 EXPORT_SYMBOL_GPL(nfs4_proc_getdeviceinfo);
8600
8601 static void nfs4_layoutcommit_prepare(struct rpc_task *task, void *calldata)
8602 {
8603         struct nfs4_layoutcommit_data *data = calldata;
8604         struct nfs_server *server = NFS_SERVER(data->args.inode);
8605         struct nfs4_session *session = nfs4_get_session(server);
8606
8607         nfs41_setup_sequence(session,
8608                         &data->args.seq_args,
8609                         &data->res.seq_res,
8610                         task);
8611 }
8612
8613 static void
8614 nfs4_layoutcommit_done(struct rpc_task *task, void *calldata)
8615 {
8616         struct nfs4_layoutcommit_data *data = calldata;
8617         struct nfs_server *server = NFS_SERVER(data->args.inode);
8618
8619         if (!nfs41_sequence_done(task, &data->res.seq_res))
8620                 return;
8621
8622         switch (task->tk_status) { /* Just ignore these failures */
8623         case -NFS4ERR_DELEG_REVOKED: /* layout was recalled */
8624         case -NFS4ERR_BADIOMODE:     /* no IOMODE_RW layout for range */
8625         case -NFS4ERR_BADLAYOUT:     /* no layout */
8626         case -NFS4ERR_GRACE:        /* loca_recalim always false */
8627                 task->tk_status = 0;
8628         case 0:
8629                 break;
8630         default:
8631                 if (nfs4_async_handle_error(task, server, NULL, NULL) == -EAGAIN) {
8632                         rpc_restart_call_prepare(task);
8633                         return;
8634                 }
8635         }
8636 }
8637
8638 static void nfs4_layoutcommit_release(void *calldata)
8639 {
8640         struct nfs4_layoutcommit_data *data = calldata;
8641
8642         pnfs_cleanup_layoutcommit(data);
8643         nfs_post_op_update_inode_force_wcc(data->args.inode,
8644                                            data->res.fattr);
8645         put_rpccred(data->cred);
8646         nfs_iput_and_deactive(data->inode);
8647         kfree(data);
8648 }
8649
8650 static const struct rpc_call_ops nfs4_layoutcommit_ops = {
8651         .rpc_call_prepare = nfs4_layoutcommit_prepare,
8652         .rpc_call_done = nfs4_layoutcommit_done,
8653         .rpc_release = nfs4_layoutcommit_release,
8654 };
8655
8656 int
8657 nfs4_proc_layoutcommit(struct nfs4_layoutcommit_data *data, bool sync)
8658 {
8659         struct rpc_message msg = {
8660                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LAYOUTCOMMIT],
8661                 .rpc_argp = &data->args,
8662                 .rpc_resp = &data->res,
8663                 .rpc_cred = data->cred,
8664         };
8665         struct rpc_task_setup task_setup_data = {
8666                 .task = &data->task,
8667                 .rpc_client = NFS_CLIENT(data->args.inode),
8668                 .rpc_message = &msg,
8669                 .callback_ops = &nfs4_layoutcommit_ops,
8670                 .callback_data = data,
8671         };
8672         struct rpc_task *task;
8673         int status = 0;
8674
8675         dprintk("NFS: initiating layoutcommit call. sync %d "
8676                 "lbw: %llu inode %lu\n", sync,
8677                 data->args.lastbytewritten,
8678                 data->args.inode->i_ino);
8679
8680         if (!sync) {
8681                 data->inode = nfs_igrab_and_active(data->args.inode);
8682                 if (data->inode == NULL) {
8683                         nfs4_layoutcommit_release(data);
8684                         return -EAGAIN;
8685                 }
8686                 task_setup_data.flags = RPC_TASK_ASYNC;
8687         }
8688         nfs4_init_sequence(&data->args.seq_args, &data->res.seq_res, 1);
8689         task = rpc_run_task(&task_setup_data);
8690         if (IS_ERR(task))
8691                 return PTR_ERR(task);
8692         if (sync)
8693                 status = task->tk_status;
8694         trace_nfs4_layoutcommit(data->args.inode, &data->args.stateid, status);
8695         dprintk("%s: status %d\n", __func__, status);
8696         rpc_put_task(task);
8697         return status;
8698 }
8699
8700 /**
8701  * Use the state managment nfs_client cl_rpcclient, which uses krb5i (if
8702  * possible) as per RFC3530bis and RFC5661 Security Considerations sections
8703  */
8704 static int
8705 _nfs41_proc_secinfo_no_name(struct nfs_server *server, struct nfs_fh *fhandle,
8706                     struct nfs_fsinfo *info,
8707                     struct nfs4_secinfo_flavors *flavors, bool use_integrity)
8708 {
8709         struct nfs41_secinfo_no_name_args args = {
8710                 .style = SECINFO_STYLE_CURRENT_FH,
8711         };
8712         struct nfs4_secinfo_res res = {
8713                 .flavors = flavors,
8714         };
8715         struct rpc_message msg = {
8716                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SECINFO_NO_NAME],
8717                 .rpc_argp = &args,
8718                 .rpc_resp = &res,
8719         };
8720         struct rpc_clnt *clnt = server->client;
8721         struct rpc_cred *cred = NULL;
8722         int status;
8723
8724         if (use_integrity) {
8725                 clnt = server->nfs_client->cl_rpcclient;
8726                 cred = nfs4_get_clid_cred(server->nfs_client);
8727                 msg.rpc_cred = cred;
8728         }
8729
8730         dprintk("--> %s\n", __func__);
8731         status = nfs4_call_sync(clnt, server, &msg, &args.seq_args,
8732                                 &res.seq_res, 0);
8733         dprintk("<-- %s status=%d\n", __func__, status);
8734
8735         if (cred)
8736                 put_rpccred(cred);
8737
8738         return status;
8739 }
8740
8741 static int
8742 nfs41_proc_secinfo_no_name(struct nfs_server *server, struct nfs_fh *fhandle,
8743                            struct nfs_fsinfo *info, struct nfs4_secinfo_flavors *flavors)
8744 {
8745         struct nfs4_exception exception = { };
8746         int err;
8747         do {
8748                 /* first try using integrity protection */
8749                 err = -NFS4ERR_WRONGSEC;
8750
8751                 /* try to use integrity protection with machine cred */
8752                 if (_nfs4_is_integrity_protected(server->nfs_client))
8753                         err = _nfs41_proc_secinfo_no_name(server, fhandle, info,
8754                                                           flavors, true);
8755
8756                 /*
8757                  * if unable to use integrity protection, or SECINFO with
8758                  * integrity protection returns NFS4ERR_WRONGSEC (which is
8759                  * disallowed by spec, but exists in deployed servers) use
8760                  * the current filesystem's rpc_client and the user cred.
8761                  */
8762                 if (err == -NFS4ERR_WRONGSEC)
8763                         err = _nfs41_proc_secinfo_no_name(server, fhandle, info,
8764                                                           flavors, false);
8765
8766                 switch (err) {
8767                 case 0:
8768                 case -NFS4ERR_WRONGSEC:
8769                 case -ENOTSUPP:
8770                         goto out;
8771                 default:
8772                         err = nfs4_handle_exception(server, err, &exception);
8773                 }
8774         } while (exception.retry);
8775 out:
8776         return err;
8777 }
8778
8779 static int
8780 nfs41_find_root_sec(struct nfs_server *server, struct nfs_fh *fhandle,
8781                     struct nfs_fsinfo *info)
8782 {
8783         int err;
8784         struct page *page;
8785         rpc_authflavor_t flavor = RPC_AUTH_MAXFLAVOR;
8786         struct nfs4_secinfo_flavors *flavors;
8787         struct nfs4_secinfo4 *secinfo;
8788         int i;
8789
8790         page = alloc_page(GFP_KERNEL);
8791         if (!page) {
8792                 err = -ENOMEM;
8793                 goto out;
8794         }
8795
8796         flavors = page_address(page);
8797         err = nfs41_proc_secinfo_no_name(server, fhandle, info, flavors);
8798
8799         /*
8800          * Fall back on "guess and check" method if
8801          * the server doesn't support SECINFO_NO_NAME
8802          */
8803         if (err == -NFS4ERR_WRONGSEC || err == -ENOTSUPP) {
8804                 err = nfs4_find_root_sec(server, fhandle, info);
8805                 goto out_freepage;
8806         }
8807         if (err)
8808                 goto out_freepage;
8809
8810         for (i = 0; i < flavors->num_flavors; i++) {
8811                 secinfo = &flavors->flavors[i];
8812
8813                 switch (secinfo->flavor) {
8814                 case RPC_AUTH_NULL:
8815                 case RPC_AUTH_UNIX:
8816                 case RPC_AUTH_GSS:
8817                         flavor = rpcauth_get_pseudoflavor(secinfo->flavor,
8818                                         &secinfo->flavor_info);
8819                         break;
8820                 default:
8821                         flavor = RPC_AUTH_MAXFLAVOR;
8822                         break;
8823                 }
8824
8825                 if (!nfs_auth_info_match(&server->auth_info, flavor))
8826                         flavor = RPC_AUTH_MAXFLAVOR;
8827
8828                 if (flavor != RPC_AUTH_MAXFLAVOR) {
8829                         err = nfs4_lookup_root_sec(server, fhandle,
8830                                                    info, flavor);
8831                         if (!err)
8832                                 break;
8833                 }
8834         }
8835
8836         if (flavor == RPC_AUTH_MAXFLAVOR)
8837                 err = -EPERM;
8838
8839 out_freepage:
8840         put_page(page);
8841         if (err == -EACCES)
8842                 return -EPERM;
8843 out:
8844         return err;
8845 }
8846
8847 static int _nfs41_test_stateid(struct nfs_server *server,
8848                 nfs4_stateid *stateid,
8849                 struct rpc_cred *cred)
8850 {
8851         int status;
8852         struct nfs41_test_stateid_args args = {
8853                 .stateid = stateid,
8854         };
8855         struct nfs41_test_stateid_res res;
8856         struct rpc_message msg = {
8857                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_TEST_STATEID],
8858                 .rpc_argp = &args,
8859                 .rpc_resp = &res,
8860                 .rpc_cred = cred,
8861         };
8862         struct rpc_clnt *rpc_client = server->client;
8863
8864         nfs4_state_protect(server->nfs_client, NFS_SP4_MACH_CRED_STATEID,
8865                 &rpc_client, &msg);
8866
8867         dprintk("NFS call  test_stateid %p\n", stateid);
8868         nfs4_init_sequence(&args.seq_args, &res.seq_res, 0);
8869         nfs4_set_sequence_privileged(&args.seq_args);
8870         status = nfs4_call_sync_sequence(rpc_client, server, &msg,
8871                         &args.seq_args, &res.seq_res);
8872         if (status != NFS_OK) {
8873                 dprintk("NFS reply test_stateid: failed, %d\n", status);
8874                 return status;
8875         }
8876         dprintk("NFS reply test_stateid: succeeded, %d\n", -res.status);
8877         return -res.status;
8878 }
8879
8880 static void nfs4_handle_delay_or_session_error(struct nfs_server *server,
8881                 int err, struct nfs4_exception *exception)
8882 {
8883         exception->retry = 0;
8884         switch(err) {
8885         case -NFS4ERR_DELAY:
8886                 nfs4_handle_exception(server, err, exception);
8887                 break;
8888         case -NFS4ERR_BADSESSION:
8889         case -NFS4ERR_BADSLOT:
8890         case -NFS4ERR_BAD_HIGH_SLOT:
8891         case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION:
8892         case -NFS4ERR_DEADSESSION:
8893                 nfs4_do_handle_exception(server, err, exception);
8894         }
8895 }
8896
8897 /**
8898  * nfs41_test_stateid - perform a TEST_STATEID operation
8899  *
8900  * @server: server / transport on which to perform the operation
8901  * @stateid: state ID to test
8902  * @cred: credential
8903  *
8904  * Returns NFS_OK if the server recognizes that "stateid" is valid.
8905  * Otherwise a negative NFS4ERR value is returned if the operation
8906  * failed or the state ID is not currently valid.
8907  */
8908 static int nfs41_test_stateid(struct nfs_server *server,
8909                 nfs4_stateid *stateid,
8910                 struct rpc_cred *cred)
8911 {
8912         struct nfs4_exception exception = { };
8913         int err;
8914         do {
8915                 err = _nfs41_test_stateid(server, stateid, cred);
8916                 nfs4_handle_delay_or_session_error(server, err, &exception);
8917         } while (exception.retry);
8918         return err;
8919 }
8920
8921 struct nfs_free_stateid_data {
8922         struct nfs_server *server;
8923         struct nfs41_free_stateid_args args;
8924         struct nfs41_free_stateid_res res;
8925 };
8926
8927 static void nfs41_free_stateid_prepare(struct rpc_task *task, void *calldata)
8928 {
8929         struct nfs_free_stateid_data *data = calldata;
8930         nfs41_setup_sequence(nfs4_get_session(data->server),
8931                         &data->args.seq_args,
8932                         &data->res.seq_res,
8933                         task);
8934 }
8935
8936 static void nfs41_free_stateid_done(struct rpc_task *task, void *calldata)
8937 {
8938         struct nfs_free_stateid_data *data = calldata;
8939
8940         nfs41_sequence_done(task, &data->res.seq_res);
8941
8942         switch (task->tk_status) {
8943         case -NFS4ERR_DELAY:
8944                 if (nfs4_async_handle_error(task, data->server, NULL, NULL) == -EAGAIN)
8945                         rpc_restart_call_prepare(task);
8946         }
8947 }
8948
8949 static void nfs41_free_stateid_release(void *calldata)
8950 {
8951         kfree(calldata);
8952 }
8953
8954 static const struct rpc_call_ops nfs41_free_stateid_ops = {
8955         .rpc_call_prepare = nfs41_free_stateid_prepare,
8956         .rpc_call_done = nfs41_free_stateid_done,
8957         .rpc_release = nfs41_free_stateid_release,
8958 };
8959
8960 static struct rpc_task *_nfs41_free_stateid(struct nfs_server *server,
8961                 const nfs4_stateid *stateid,
8962                 struct rpc_cred *cred,
8963                 bool privileged)
8964 {
8965         struct rpc_message msg = {
8966                 .rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_FREE_STATEID],
8967                 .rpc_cred = cred,
8968         };
8969         struct rpc_task_setup task_setup = {
8970                 .rpc_client = server->client,
8971                 .rpc_message = &msg,
8972                 .callback_ops = &nfs41_free_stateid_ops,
8973                 .flags = RPC_TASK_ASYNC,
8974         };
8975         struct nfs_free_stateid_data *data;
8976
8977         nfs4_state_protect(server->nfs_client, NFS_SP4_MACH_CRED_STATEID,
8978                 &task_setup.rpc_client, &msg);
8979
8980         dprintk("NFS call  free_stateid %p\n", stateid);
8981         data = kmalloc(sizeof(*data), GFP_NOFS);
8982         if (!data)
8983                 return ERR_PTR(-ENOMEM);
8984         data->server = server;
8985         nfs4_stateid_copy(&data->args.stateid, stateid);
8986
8987         task_setup.callback_data = data;
8988
8989         msg.rpc_argp = &data->args;
8990         msg.rpc_resp = &data->res;
8991         nfs4_init_sequence(&data->args.seq_args, &data->res.seq_res, 0);
8992         if (privileged)
8993                 nfs4_set_sequence_privileged(&data->args.seq_args);
8994
8995         return rpc_run_task(&task_setup);
8996 }
8997
8998 /**
8999  * nfs41_free_stateid - perform a FREE_STATEID operation
9000  *
9001  * @server: server / transport on which to perform the operation
9002  * @stateid: state ID to release
9003  * @cred: credential
9004  * @is_recovery: set to true if this call needs to be privileged
9005  *
9006  * Note: this function is always asynchronous.
9007  */
9008 static int nfs41_free_stateid(struct nfs_server *server,
9009                 const nfs4_stateid *stateid,
9010                 struct rpc_cred *cred,
9011                 bool is_recovery)
9012 {
9013         struct rpc_task *task;
9014
9015         task = _nfs41_free_stateid(server, stateid, cred, is_recovery);
9016         if (IS_ERR(task))
9017                 return PTR_ERR(task);
9018         rpc_put_task(task);
9019         return 0;
9020 }
9021
9022 static void
9023 nfs41_free_lock_state(struct nfs_server *server, struct nfs4_lock_state *lsp)
9024 {
9025         struct rpc_cred *cred = lsp->ls_state->owner->so_cred;
9026
9027         nfs41_free_stateid(server, &lsp->ls_stateid, cred, false);
9028         nfs4_free_lock_state(server, lsp);
9029 }
9030
9031 static bool nfs41_match_stateid(const nfs4_stateid *s1,
9032                 const nfs4_stateid *s2)
9033 {
9034         if (s1->type != s2->type)
9035                 return false;
9036
9037         if (memcmp(s1->other, s2->other, sizeof(s1->other)) != 0)
9038                 return false;
9039
9040         if (s1->seqid == s2->seqid)
9041                 return true;
9042         if (s1->seqid == 0 || s2->seqid == 0)
9043                 return true;
9044
9045         return false;
9046 }
9047
9048 #endif /* CONFIG_NFS_V4_1 */
9049
9050 static bool nfs4_match_stateid(const nfs4_stateid *s1,
9051                 const nfs4_stateid *s2)
9052 {
9053         return nfs4_stateid_match(s1, s2);
9054 }
9055
9056
9057 static const struct nfs4_state_recovery_ops nfs40_reboot_recovery_ops = {
9058         .owner_flag_bit = NFS_OWNER_RECLAIM_REBOOT,
9059         .state_flag_bit = NFS_STATE_RECLAIM_REBOOT,
9060         .recover_open   = nfs4_open_reclaim,
9061         .recover_lock   = nfs4_lock_reclaim,
9062         .establish_clid = nfs4_init_clientid,
9063         .detect_trunking = nfs40_discover_server_trunking,
9064 };
9065
9066 #if defined(CONFIG_NFS_V4_1)
9067 static const struct nfs4_state_recovery_ops nfs41_reboot_recovery_ops = {
9068         .owner_flag_bit = NFS_OWNER_RECLAIM_REBOOT,
9069         .state_flag_bit = NFS_STATE_RECLAIM_REBOOT,
9070         .recover_open   = nfs4_open_reclaim,
9071         .recover_lock   = nfs4_lock_reclaim,
9072         .establish_clid = nfs41_init_clientid,
9073         .reclaim_complete = nfs41_proc_reclaim_complete,
9074         .detect_trunking = nfs41_discover_server_trunking,
9075 };
9076 #endif /* CONFIG_NFS_V4_1 */
9077
9078 static const struct nfs4_state_recovery_ops nfs40_nograce_recovery_ops = {
9079         .owner_flag_bit = NFS_OWNER_RECLAIM_NOGRACE,
9080         .state_flag_bit = NFS_STATE_RECLAIM_NOGRACE,
9081         .recover_open   = nfs40_open_expired,
9082         .recover_lock   = nfs4_lock_expired,
9083         .establish_clid = nfs4_init_clientid,
9084 };
9085
9086 #if defined(CONFIG_NFS_V4_1)
9087 static const struct nfs4_state_recovery_ops nfs41_nograce_recovery_ops = {
9088         .owner_flag_bit = NFS_OWNER_RECLAIM_NOGRACE,
9089         .state_flag_bit = NFS_STATE_RECLAIM_NOGRACE,
9090         .recover_open   = nfs41_open_expired,
9091         .recover_lock   = nfs41_lock_expired,
9092         .establish_clid = nfs41_init_clientid,
9093 };
9094 #endif /* CONFIG_NFS_V4_1 */
9095
9096 static const struct nfs4_state_maintenance_ops nfs40_state_renewal_ops = {
9097         .sched_state_renewal = nfs4_proc_async_renew,
9098         .get_state_renewal_cred_locked = nfs4_get_renew_cred_locked,
9099         .renew_lease = nfs4_proc_renew,
9100 };
9101
9102 #if defined(CONFIG_NFS_V4_1)
9103 static const struct nfs4_state_maintenance_ops nfs41_state_renewal_ops = {
9104         .sched_state_renewal = nfs41_proc_async_sequence,
9105         .get_state_renewal_cred_locked = nfs4_get_machine_cred_locked,
9106         .renew_lease = nfs4_proc_sequence,
9107 };
9108 #endif
9109
9110 static const struct nfs4_mig_recovery_ops nfs40_mig_recovery_ops = {
9111         .get_locations = _nfs40_proc_get_locations,
9112         .fsid_present = _nfs40_proc_fsid_present,
9113 };
9114
9115 #if defined(CONFIG_NFS_V4_1)
9116 static const struct nfs4_mig_recovery_ops nfs41_mig_recovery_ops = {
9117         .get_locations = _nfs41_proc_get_locations,
9118         .fsid_present = _nfs41_proc_fsid_present,
9119 };
9120 #endif  /* CONFIG_NFS_V4_1 */
9121
9122 static const struct nfs4_minor_version_ops nfs_v4_0_minor_ops = {
9123         .minor_version = 0,
9124         .init_caps = NFS_CAP_READDIRPLUS
9125                 | NFS_CAP_ATOMIC_OPEN
9126                 | NFS_CAP_POSIX_LOCK,
9127         .init_client = nfs40_init_client,
9128         .shutdown_client = nfs40_shutdown_client,
9129         .match_stateid = nfs4_match_stateid,
9130         .find_root_sec = nfs4_find_root_sec,
9131         .free_lock_state = nfs4_release_lockowner,
9132         .test_and_free_expired = nfs40_test_and_free_expired_stateid,
9133         .alloc_seqid = nfs_alloc_seqid,
9134         .call_sync_ops = &nfs40_call_sync_ops,
9135         .reboot_recovery_ops = &nfs40_reboot_recovery_ops,
9136         .nograce_recovery_ops = &nfs40_nograce_recovery_ops,
9137         .state_renewal_ops = &nfs40_state_renewal_ops,
9138         .mig_recovery_ops = &nfs40_mig_recovery_ops,
9139 };
9140
9141 #if defined(CONFIG_NFS_V4_1)
9142 static struct nfs_seqid *
9143 nfs_alloc_no_seqid(struct nfs_seqid_counter *arg1, gfp_t arg2)
9144 {
9145         return NULL;
9146 }
9147
9148 static const struct nfs4_minor_version_ops nfs_v4_1_minor_ops = {
9149         .minor_version = 1,
9150         .init_caps = NFS_CAP_READDIRPLUS
9151                 | NFS_CAP_ATOMIC_OPEN
9152                 | NFS_CAP_POSIX_LOCK
9153                 | NFS_CAP_STATEID_NFSV41
9154                 | NFS_CAP_ATOMIC_OPEN_V1,
9155         .init_client = nfs41_init_client,
9156         .shutdown_client = nfs41_shutdown_client,
9157         .match_stateid = nfs41_match_stateid,
9158         .find_root_sec = nfs41_find_root_sec,
9159         .free_lock_state = nfs41_free_lock_state,
9160         .test_and_free_expired = nfs41_test_and_free_expired_stateid,
9161         .alloc_seqid = nfs_alloc_no_seqid,
9162         .session_trunk = nfs4_test_session_trunk,
9163         .call_sync_ops = &nfs41_call_sync_ops,
9164         .reboot_recovery_ops = &nfs41_reboot_recovery_ops,
9165         .nograce_recovery_ops = &nfs41_nograce_recovery_ops,
9166         .state_renewal_ops = &nfs41_state_renewal_ops,
9167         .mig_recovery_ops = &nfs41_mig_recovery_ops,
9168 };
9169 #endif
9170
9171 #if defined(CONFIG_NFS_V4_2)
9172 static const struct nfs4_minor_version_ops nfs_v4_2_minor_ops = {
9173         .minor_version = 2,
9174         .init_caps = NFS_CAP_READDIRPLUS
9175                 | NFS_CAP_ATOMIC_OPEN
9176                 | NFS_CAP_POSIX_LOCK
9177                 | NFS_CAP_STATEID_NFSV41
9178                 | NFS_CAP_ATOMIC_OPEN_V1
9179                 | NFS_CAP_ALLOCATE
9180                 | NFS_CAP_COPY
9181                 | NFS_CAP_DEALLOCATE
9182                 | NFS_CAP_SEEK
9183                 | NFS_CAP_LAYOUTSTATS
9184                 | NFS_CAP_CLONE,
9185         .init_client = nfs41_init_client,
9186         .shutdown_client = nfs41_shutdown_client,
9187         .match_stateid = nfs41_match_stateid,
9188         .find_root_sec = nfs41_find_root_sec,
9189         .free_lock_state = nfs41_free_lock_state,
9190         .call_sync_ops = &nfs41_call_sync_ops,
9191         .test_and_free_expired = nfs41_test_and_free_expired_stateid,
9192         .alloc_seqid = nfs_alloc_no_seqid,
9193         .session_trunk = nfs4_test_session_trunk,
9194         .reboot_recovery_ops = &nfs41_reboot_recovery_ops,
9195         .nograce_recovery_ops = &nfs41_nograce_recovery_ops,
9196         .state_renewal_ops = &nfs41_state_renewal_ops,
9197         .mig_recovery_ops = &nfs41_mig_recovery_ops,
9198 };
9199 #endif
9200
9201 const struct nfs4_minor_version_ops *nfs_v4_minor_ops[] = {
9202         [0] = &nfs_v4_0_minor_ops,
9203 #if defined(CONFIG_NFS_V4_1)
9204         [1] = &nfs_v4_1_minor_ops,
9205 #endif
9206 #if defined(CONFIG_NFS_V4_2)
9207         [2] = &nfs_v4_2_minor_ops,
9208 #endif
9209 };
9210
9211 static ssize_t nfs4_listxattr(struct dentry *dentry, char *list, size_t size)
9212 {
9213         ssize_t error, error2;
9214
9215         error = generic_listxattr(dentry, list, size);
9216         if (error < 0)
9217                 return error;
9218         if (list) {
9219                 list += error;
9220                 size -= error;
9221         }
9222
9223         error2 = nfs4_listxattr_nfs4_label(d_inode(dentry), list, size);
9224         if (error2 < 0)
9225                 return error2;
9226         return error + error2;
9227 }
9228
9229 static const struct inode_operations nfs4_dir_inode_operations = {
9230         .create         = nfs_create,
9231         .lookup         = nfs_lookup,
9232         .atomic_open    = nfs_atomic_open,
9233         .link           = nfs_link,
9234         .unlink         = nfs_unlink,
9235         .symlink        = nfs_symlink,
9236         .mkdir          = nfs_mkdir,
9237         .rmdir          = nfs_rmdir,
9238         .mknod          = nfs_mknod,
9239         .rename         = nfs_rename,
9240         .permission     = nfs_permission,
9241         .getattr        = nfs_getattr,
9242         .setattr        = nfs_setattr,
9243         .getxattr       = generic_getxattr,
9244         .setxattr       = generic_setxattr,
9245         .listxattr      = nfs4_listxattr,
9246         .removexattr    = generic_removexattr,
9247 };
9248
9249 static const struct inode_operations nfs4_file_inode_operations = {
9250         .permission     = nfs_permission,
9251         .getattr        = nfs_getattr,
9252         .setattr        = nfs_setattr,
9253         .getxattr       = generic_getxattr,
9254         .setxattr       = generic_setxattr,
9255         .listxattr      = nfs4_listxattr,
9256         .removexattr    = generic_removexattr,
9257 };
9258
9259 const struct nfs_rpc_ops nfs_v4_clientops = {
9260         .version        = 4,                    /* protocol version */
9261         .dentry_ops     = &nfs4_dentry_operations,
9262         .dir_inode_ops  = &nfs4_dir_inode_operations,
9263         .file_inode_ops = &nfs4_file_inode_operations,
9264         .file_ops       = &nfs4_file_operations,
9265         .getroot        = nfs4_proc_get_root,
9266         .submount       = nfs4_submount,
9267         .try_mount      = nfs4_try_mount,
9268         .getattr        = nfs4_proc_getattr,
9269         .setattr        = nfs4_proc_setattr,
9270         .lookup         = nfs4_proc_lookup,
9271         .access         = nfs4_proc_access,
9272         .readlink       = nfs4_proc_readlink,
9273         .create         = nfs4_proc_create,
9274         .remove         = nfs4_proc_remove,
9275         .unlink_setup   = nfs4_proc_unlink_setup,
9276         .unlink_rpc_prepare = nfs4_proc_unlink_rpc_prepare,
9277         .unlink_done    = nfs4_proc_unlink_done,
9278         .rename_setup   = nfs4_proc_rename_setup,
9279         .rename_rpc_prepare = nfs4_proc_rename_rpc_prepare,
9280         .rename_done    = nfs4_proc_rename_done,
9281         .link           = nfs4_proc_link,
9282         .symlink        = nfs4_proc_symlink,
9283         .mkdir          = nfs4_proc_mkdir,
9284         .rmdir          = nfs4_proc_remove,
9285         .readdir        = nfs4_proc_readdir,
9286         .mknod          = nfs4_proc_mknod,
9287         .statfs         = nfs4_proc_statfs,
9288         .fsinfo         = nfs4_proc_fsinfo,
9289         .pathconf       = nfs4_proc_pathconf,
9290         .set_capabilities = nfs4_server_capabilities,
9291         .decode_dirent  = nfs4_decode_dirent,
9292         .pgio_rpc_prepare = nfs4_proc_pgio_rpc_prepare,
9293         .read_setup     = nfs4_proc_read_setup,
9294         .read_done      = nfs4_read_done,
9295         .write_setup    = nfs4_proc_write_setup,
9296         .write_done     = nfs4_write_done,
9297         .commit_setup   = nfs4_proc_commit_setup,
9298         .commit_rpc_prepare = nfs4_proc_commit_rpc_prepare,
9299         .commit_done    = nfs4_commit_done,
9300         .lock           = nfs4_proc_lock,
9301         .clear_acl_cache = nfs4_zap_acl_attr,
9302         .close_context  = nfs4_close_context,
9303         .open_context   = nfs4_atomic_open,
9304         .have_delegation = nfs4_have_delegation,
9305         .return_delegation = nfs4_inode_return_delegation,
9306         .alloc_client   = nfs4_alloc_client,
9307         .init_client    = nfs4_init_client,
9308         .free_client    = nfs4_free_client,
9309         .create_server  = nfs4_create_server,
9310         .clone_server   = nfs_clone_server,
9311 };
9312
9313 static const struct xattr_handler nfs4_xattr_nfs4_acl_handler = {
9314         .name   = XATTR_NAME_NFSV4_ACL,
9315         .list   = nfs4_xattr_list_nfs4_acl,
9316         .get    = nfs4_xattr_get_nfs4_acl,
9317         .set    = nfs4_xattr_set_nfs4_acl,
9318 };
9319
9320 const struct xattr_handler *nfs4_xattr_handlers[] = {
9321         &nfs4_xattr_nfs4_acl_handler,
9322 #ifdef CONFIG_NFS_V4_SECURITY_LABEL
9323         &nfs4_xattr_nfs4_label_handler,
9324 #endif
9325         NULL
9326 };
9327
9328 /*
9329  * Local variables:
9330  *  c-basic-offset: 8
9331  * End:
9332  */