2 * Server-side procedures for NFSv4.
4 * Copyright (c) 2002 The Regents of the University of Michigan.
7 * Kendrick Smith <kmsmith@umich.edu>
8 * Andy Adamson <andros@umich.edu>
10 * Redistribution and use in source and binary forms, with or without
11 * modification, are permitted provided that the following conditions
14 * 1. Redistributions of source code must retain the above copyright
15 * notice, this list of conditions and the following disclaimer.
16 * 2. Redistributions in binary form must reproduce the above copyright
17 * notice, this list of conditions and the following disclaimer in the
18 * documentation and/or other materials provided with the distribution.
19 * 3. Neither the name of the University nor the names of its
20 * contributors may be used to endorse or promote products derived
21 * from this software without specific prior written permission.
23 * THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED
24 * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
25 * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
26 * DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
27 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
28 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
29 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
30 * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
31 * LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
32 * NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
33 * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
35 #include <linux/file.h>
36 #include <linux/slab.h>
42 #include "current_stateid.h"
46 #ifdef CONFIG_NFSD_V4_SECURITY_LABEL
47 #include <linux/security.h>
/*
 * Set the security label carried in @label on the inode behind @resfh.
 *
 * security_inode_setsecctx() is called on resfh->fh_dentry with the inode's
 * i_mutex held around the call.  The visible code also clears
 * FATTR4_WORD2_SECURITY_LABEL in bmval[2]; the test guarding that statement
 * is not visible in this excerpt (presumably it runs only when the call
 * failed -- confirm against the full source).
 */
50 nfsd4_security_inode_setsecctx(struct svc_fh *resfh, struct xdr_netobj *label, u32 *bmval)
52 struct inode *inode = resfh->fh_dentry->d_inode;
55 mutex_lock(&inode->i_mutex);
56 status = security_inode_setsecctx(resfh->fh_dentry,
57 label->data, label->len);
58 mutex_unlock(&inode->i_mutex);
62 * XXX: We should really fail the whole open, but we may
63 * already have created a new file, so it may be too
64 * late. For now this seems the least of evils:
66 bmval[2] &= ~FATTR4_WORD2_SECURITY_LABEL;
72 nfsd4_security_inode_setsecctx(struct svc_fh *resfh, struct xdr_netobj *label, u32 *bmval)
76 #define NFSDDBG_FACILITY NFSDDBG_PROC
/*
 * Three-word attribute bitmap built from NFSD_WRITEABLE_ATTRS_WORD0..2.
 * nfsd4_check_open_attributes() passes it to check_attr_support() as the
 * "writable" mask for UNCHECKED and GUARDED creates.
 */
78 static u32 nfsd_attrmask[] = {
79 NFSD_WRITEABLE_ATTRS_WORD0,
80 NFSD_WRITEABLE_ATTRS_WORD1,
81 NFSD_WRITEABLE_ATTRS_WORD2
/*
 * Three-word attribute bitmap built from NFSD_SUPPATTR_EXCLCREAT_WORD0..2.
 * nfsd4_check_open_attributes() passes it to check_attr_support() as the
 * "writable" mask for NFS4_CREATE_EXCLUSIVE4_1 creates.
 */
84 static u32 nfsd41_ex_attrmask[] = {
85 NFSD_SUPPATTR_EXCLCREAT_WORD0,
86 NFSD_SUPPATTR_EXCLCREAT_WORD1,
87 NFSD_SUPPATTR_EXCLCREAT_WORD2
/*
 * Validate the attribute bitmap @bmval against what this server supports.
 *
 * Returns nfserr_attrnotsupp when any bit falls outside
 * nfsd_suppattrs0/1/2(cstate->minorversion), or when FATTR4_WORD0_ACL is
 * requested and the inode of the current filehandle is not IS_POSIXACL().
 * The bitmap is then compared word by word against the @writable mask; the
 * statement executed on a mismatch and the final return are not visible in
 * this excerpt.
 *
 * NOTE(review): _nfsd4_verify() passes NULL for @writable, so the writable
 * comparison is presumably guarded by a NULL check on a line not shown here
 * -- confirm.
 */
91 check_attr_support(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
92 u32 *bmval, u32 *writable)
94 struct dentry *dentry = cstate->current_fh.fh_dentry;
97 * Check about attributes are supported by the NFSv4 server or not.
98 * According to spec, unsupported attributes return ERR_ATTRNOTSUPP.
100 if ((bmval[0] & ~nfsd_suppattrs0(cstate->minorversion)) ||
101 (bmval[1] & ~nfsd_suppattrs1(cstate->minorversion)) ||
102 (bmval[2] & ~nfsd_suppattrs2(cstate->minorversion)))
103 return nfserr_attrnotsupp;
106 * Check FATTR4_WORD0_ACL can be supported
107 * in current environment or not.
109 if (bmval[0] & FATTR4_WORD0_ACL) {
110 if (!IS_POSIXACL(dentry->d_inode))
111 return nfserr_attrnotsupp;
115 * According to spec, read-only attributes return ERR_INVAL.
118 if ((bmval[0] & ~writable[0]) || (bmval[1] & ~writable[1]) ||
119 (bmval[2] & ~writable[2]))
/*
 * For an OPEN that creates a file (op_create == NFS4_OPEN_CREATE), check the
 * requested attribute bitmap open->op_bmval with check_attr_support():
 * UNCHECKED and GUARDED creates are checked against nfsd_attrmask,
 * EXCLUSIVE4_1 creates against nfsd41_ex_attrmask.  status starts out as
 * nfs_ok and is not assigned in any other case visible here.
 */
127 nfsd4_check_open_attributes(struct svc_rqst *rqstp,
128 struct nfsd4_compound_state *cstate, struct nfsd4_open *open)
130 __be32 status = nfs_ok;
132 if (open->op_create == NFS4_OPEN_CREATE) {
133 if (open->op_createmode == NFS4_CREATE_UNCHECKED
134 || open->op_createmode == NFS4_CREATE_GUARDED)
135 status = check_attr_support(rqstp, cstate,
136 open->op_bmval, nfsd_attrmask);
137 else if (open->op_createmode == NFS4_CREATE_EXCLUSIVE4_1)
138 status = check_attr_support(rqstp, cstate,
139 open->op_bmval, nfsd41_ex_attrmask);
/*
 * True when @open is a create (op_create == NFS4_OPEN_CREATE) whose create
 * mode is UNCHECKED, GUARDED or EXCLUSIVE4_1.
 */
146 is_create_with_attrs(struct nfsd4_open *open)
148 return open->op_create == NFS4_OPEN_CREATE
149 && (open->op_createmode == NFS4_CREATE_UNCHECKED
150 || open->op_createmode == NFS4_CREATE_GUARDED
151 || open->op_createmode == NFS4_CREATE_EXCLUSIVE4_1);
155 * if error occurs when setting the acl, just clear the acl bit
156 * in the returned attr bitmap.
/*
 * Calls nfsd4_set_nfs4_acl() on @fhp with @acl.  The one visible consequence
 * is that FATTR4_WORD0_ACL is cleared from bmval[0]; the status test guarding
 * that statement is not visible in this excerpt (the surrounding comments
 * describe it as the error case).
 */
159 do_set_nfs4_acl(struct svc_rqst *rqstp, struct svc_fh *fhp,
160 struct nfs4_acl *acl, u32 *bmval)
164 status = nfsd4_set_nfs4_acl(rqstp, fhp, acl);
167 * We should probably fail the whole open at this point,
168 * but we've already created the file, so it's too late;
169 * So this seems the least of evils:
171 bmval[0] &= ~FATTR4_WORD0_ACL;
/*
 * Visible effect: takes an extra reference on src->fh_dentry (dget) and on
 * src->fh_export (exp_get).  Callers in this file use it to make @dst refer
 * to the same object as @src (SAVEFH, RESTOREFH, OPEN, CREATE); the
 * statements that release and overwrite @dst are not visible in this
 * excerpt -- TODO confirm against the full source.
 */
175 fh_dup2(struct svc_fh *dst, struct svc_fh *src)
178 dget(src->fh_dentry);
180 exp_get(src->fh_export);
/*
 * Translate the share bits of @open into NFSD_MAY_* access bits, OR them into
 * the caller-supplied @accmode, and check the result with fh_verify() on
 * @current_fh, requiring a regular file (S_IFREG).
 *
 *  - NFSD_MAY_READ_IF_EXEC is added (no guarding condition is visible).
 *  - NFS4_SHARE_ACCESS_READ adds NFSD_MAY_READ.
 *  - NFS4_SHARE_ACCESS_WRITE adds NFSD_MAY_WRITE | NFSD_MAY_TRUNC.
 *  - NFS4_SHARE_DENY_READ adds NFSD_MAY_WRITE.
 *
 * A truncating open without NFS4_SHARE_ACCESS_WRITE is tested first; the
 * statement run in that case is not visible in this excerpt.
 */
185 do_open_permission(struct svc_rqst *rqstp, struct svc_fh *current_fh, struct nfsd4_open *open, int accmode)
189 if (open->op_truncate &&
190 !(open->op_share_access & NFS4_SHARE_ACCESS_WRITE))
193 accmode |= NFSD_MAY_READ_IF_EXEC;
195 if (open->op_share_access & NFS4_SHARE_ACCESS_READ)
196 accmode |= NFSD_MAY_READ;
197 if (open->op_share_access & NFS4_SHARE_ACCESS_WRITE)
198 accmode |= (NFSD_MAY_WRITE | NFSD_MAY_TRUNC);
199 if (open->op_share_deny & NFS4_SHARE_DENY_READ)
200 accmode |= NFSD_MAY_WRITE;
202 status = fh_verify(rqstp, current_fh, S_IFREG, accmode);
/*
 * Classify the object behind @fh by its inode mode (i_mode).  The individual
 * mode tests are not visible in this excerpt; the visible tail returns
 * nfserr_symlink as the catch-all error, for the reason given in the comment
 * below.
 */
207 static __be32 nfsd_check_obj_isreg(struct svc_fh *fh)
209 umode_t mode = fh->fh_dentry->d_inode->i_mode;
216 * Using err_symlink as our catch-all case may look odd; but
217 * there's no other obvious error for this case in 4.0, and we
218 * happen to know that it will cause the linux v4 client to do
219 * the right thing on attempts to open something other than a
222 return nfserr_symlink;
/*
 * Store a filehandle in the open owner's replay slot
 * (oo_owner.so_replay.rp_openfh) with fh_copy_shallow().
 * nfsd4_has_session() is tested first; the statement it guards is not
 * visible in this excerpt (presumably an early return -- confirm).  The
 * source argument of the copy is also cut off here.
 */
225 static void nfsd4_set_open_owner_reply_cache(struct nfsd4_compound_state *cstate, struct nfsd4_open *open, struct svc_fh *resfh)
227 if (nfsd4_has_session(cstate))
229 fh_copy_shallow(&open->op_openowner->oo_owner.so_replay.rp_openfh,
234 do_open_lookup(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate, struct nfsd4_open *open, struct svc_fh **resfh)
236 struct svc_fh *current_fh = &cstate->current_fh;
240 *resfh = kmalloc(sizeof(struct svc_fh), GFP_KERNEL);
242 return nfserr_jukebox;
243 fh_init(*resfh, NFS4_FHSIZE);
244 open->op_truncate = 0;
246 if (open->op_create) {
247 /* FIXME: check session persistence and pnfs flags.
248 * The nfsv4.1 spec requires the following semantics:
250 * Persistent | pNFS | Server REQUIRED | Client Allowed
251 * Reply Cache | server | |
252 * -------------+--------+-----------------+--------------------
253 * no | no | EXCLUSIVE4_1 | EXCLUSIVE4_1
255 * | | and EXCLUSIVE4 | or EXCLUSIVE4
257 * no | yes | EXCLUSIVE4_1 | EXCLUSIVE4_1
258 * yes | no | GUARDED4 | GUARDED4
259 * yes | yes | GUARDED4 | GUARDED4
263 * Note: create modes (UNCHECKED,GUARDED...) are the same
264 * in NFSv4 as in v3 except EXCLUSIVE4_1.
266 status = do_nfsd_create(rqstp, current_fh, open->op_fname.data,
267 open->op_fname.len, &open->op_iattr,
268 *resfh, open->op_createmode,
269 (u32 *)open->op_verf.data,
270 &open->op_truncate, &open->op_created);
272 if (!status && open->op_label.len)
273 nfsd4_security_inode_setsecctx(*resfh, &open->op_label, open->op_bmval);
276 * Following rfc 3530 14.2.16, use the returned bitmask
277 * to indicate which attributes we used to store the
280 if (open->op_createmode == NFS4_CREATE_EXCLUSIVE && status == 0)
281 open->op_bmval[1] = (FATTR4_WORD1_TIME_ACCESS |
282 FATTR4_WORD1_TIME_MODIFY);
285 * Note this may exit with the parent still locked.
286 * We will hold the lock until nfsd4_open's final
287 * lookup, to prevent renames or unlinks until we've had
288 * a chance to acquire a delegation if appropriate.
290 status = nfsd_lookup(rqstp, current_fh,
291 open->op_fname.data, open->op_fname.len, *resfh);
294 status = nfsd_check_obj_isreg(*resfh);
298 if (is_create_with_attrs(open) && open->op_acl != NULL)
299 do_set_nfs4_acl(rqstp, *resfh, open->op_acl, open->op_bmval);
301 nfsd4_set_open_owner_reply_cache(cstate, open, *resfh);
302 accmode = NFSD_MAY_NOP;
303 if (open->op_created ||
304 open->op_claim_type == NFS4_OPEN_CLAIM_DELEGATE_CUR)
305 accmode |= NFSD_MAY_OWNER_OVERRIDE;
306 status = do_open_permission(rqstp, *resfh, open, accmode);
307 set_change_info(&open->op_cinfo, current_fh);
/*
 * OPEN of the file that is already the current filehandle.
 *
 * Zeroes open->op_cinfo, records current_fh in the open owner replay cache,
 * sets op_truncate when the supplied attributes request size 0 (ATTR_SIZE
 * set and ia_size == 0), and then checks access with do_open_permission().
 * For NFS4_OPEN_CLAIM_DELEG_CUR_FH the access mode passed down is
 * NFSD_MAY_OWNER_OVERRIDE; the value used for other claim types is set on a
 * line not visible in this excerpt.
 */
313 do_open_fhandle(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate, struct nfsd4_open *open)
315 struct svc_fh *current_fh = &cstate->current_fh;
319 /* We don't know the target directory, and therefore can not
320 * set the change info
323 memset(&open->op_cinfo, 0, sizeof(struct nfsd4_change_info));
325 nfsd4_set_open_owner_reply_cache(cstate, open, current_fh);
327 open->op_truncate = (open->op_iattr.ia_valid & ATTR_SIZE) &&
328 (open->op_iattr.ia_size == 0);
330 * In the delegation case, the client is telling us about an
331 * open that it *already* performed locally, some time ago. We
332 * should let it succeed now if possible.
334 * In the case of a CLAIM_FH open, on the other hand, the client
335 * may be counting on us to enforce permissions (the Linux 4.1
336 * client uses this for normal opens, for example).
338 if (open->op_claim_type == NFS4_OPEN_CLAIM_DELEG_CUR_FH)
339 accmode = NFSD_MAY_OWNER_OVERRIDE;
341 status = do_open_permission(rqstp, current_fh, open, accmode);
/*
 * Fill @clid from the client id embedded in the session id of @session:
 * se_sessionid.data is viewed as a struct nfsd4_sessionid and its
 * clientid.cl_boot and clientid.cl_id fields are copied.
 */
347 copy_clientid(clientid_t *clid, struct nfsd4_session *session)
349 struct nfsd4_sessionid *sid =
350 (struct nfsd4_sessionid *)session->se_sessionid.data;
352 clid->cl_boot = sid->clientid.cl_boot;
353 clid->cl_id = sid->clientid.cl_id;
/*
 * OPEN operation.  Steps visible in this excerpt, in order:
 *
 *  1. op_create combined with a claim type other than NFS4_OPEN_CLAIM_NULL
 *     is tested (the status returned is on a line not shown).
 *  2. With a session: a client that has not set
 *     NFSD4_CLIENT_RECLAIM_COMPLETE and issues a non-CLAIM_PREVIOUS open is
 *     tested for (status not shown), and the client id is taken from the
 *     session via copy_clientid().
 *  3. nfsd4_process_open1() checks the seqid and sets the open owner.  On
 *     nfserr_replay_me the current filehandle is dropped, reloaded with
 *     fh_copy_shallow() (source argument not shown; rp points at the owner's
 *     replay slot) and re-verified.
 *  4. A decode error stashed in op_xdr_error becomes the status.
 *  5. Attribute bitmap check, then the grace-period checks
 *     (nfserr_grace / nfserr_no_grace).
 *  6. Dispatch on op_claim_type to do_open_lookup() or do_open_fhandle();
 *     the DELEG_PREV claim types give nfserr_notsupp, anything else
 *     nfserr_inval.
 *  7. nfsd4_process_open2() performs the actual open; a result filehandle
 *     different from current_fh is installed with fh_dup2().
 *  8. Cleanup: nfsd4_cleanup_open_state(), replay owner setup for
 *     non-session clients, and nfsd4_bump_seqid().
 *
 * The goto/return statements and labels connecting these steps are not
 * visible in this excerpt.
 */
357 nfsd4_open(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
358 struct nfsd4_open *open)
361 struct svc_fh *resfh = NULL;
362 struct nfsd4_compoundres *resp;
363 struct net *net = SVC_NET(rqstp);
364 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
366 dprintk("NFSD: nfsd4_open filename %.*s op_openowner %p\n",
367 (int)open->op_fname.len, open->op_fname.data,
370 /* This check required by spec. */
371 if (open->op_create && open->op_claim_type != NFS4_OPEN_CLAIM_NULL)
374 open->op_created = 0;
377 * Before RECLAIM_COMPLETE done, server should deny new lock
379 if (nfsd4_has_session(cstate) &&
380 !test_bit(NFSD4_CLIENT_RECLAIM_COMPLETE,
381 &cstate->session->se_client->cl_flags) &&
382 open->op_claim_type != NFS4_OPEN_CLAIM_PREVIOUS)
385 if (nfsd4_has_session(cstate))
386 copy_clientid(&open->op_clientid, cstate->session);
390 /* check seqid for replay. set nfs4_owner */
391 resp = rqstp->rq_resp;
392 status = nfsd4_process_open1(&resp->cstate, open, nn);
393 if (status == nfserr_replay_me) {
394 struct nfs4_replay *rp = &open->op_openowner->oo_owner.so_replay;
395 fh_put(&cstate->current_fh);
396 fh_copy_shallow(&cstate->current_fh.fh_handle,
398 status = fh_verify(rqstp, &cstate->current_fh, 0, NFSD_MAY_NOP);
400 dprintk("nfsd4_open: replay failed"
401 " restoring previous filehandle\n");
403 status = nfserr_replay_me;
407 if (open->op_xdr_error) {
408 status = open->op_xdr_error;
412 status = nfsd4_check_open_attributes(rqstp, cstate, open);
416 /* Openowner is now set, so sequence id will get bumped. Now we need
417 * these checks before we do any creates: */
418 status = nfserr_grace;
419 if (locks_in_grace(net) && open->op_claim_type != NFS4_OPEN_CLAIM_PREVIOUS)
421 status = nfserr_no_grace;
422 if (!locks_in_grace(net) && open->op_claim_type == NFS4_OPEN_CLAIM_PREVIOUS)
425 switch (open->op_claim_type) {
426 case NFS4_OPEN_CLAIM_DELEGATE_CUR:
427 case NFS4_OPEN_CLAIM_NULL:
428 status = do_open_lookup(rqstp, cstate, open, &resfh);
432 case NFS4_OPEN_CLAIM_PREVIOUS:
433 status = nfs4_check_open_reclaim(&open->op_clientid,
434 cstate->minorversion,
438 open->op_openowner->oo_flags |= NFS4_OO_CONFIRMED;
/* NOTE(review): the embedded line numbers 438 and 439 are consecutive, so no break separates these cases: CLAIM_PREVIOUS continues into the CLAIM_FH handling below. */
439 case NFS4_OPEN_CLAIM_FH:
440 case NFS4_OPEN_CLAIM_DELEG_CUR_FH:
441 status = do_open_fhandle(rqstp, cstate, open);
444 resfh = &cstate->current_fh;
446 case NFS4_OPEN_CLAIM_DELEG_PREV_FH:
447 case NFS4_OPEN_CLAIM_DELEGATE_PREV:
448 dprintk("NFSD: unsupported OPEN claim type %d\n",
449 open->op_claim_type);
450 status = nfserr_notsupp;
453 dprintk("NFSD: Invalid OPEN claim type %d\n",
454 open->op_claim_type);
455 status = nfserr_inval;
459 * nfsd4_process_open2() does the actual opening of the file. If
460 * successful, it (1) truncates the file if open->op_truncate was
461 * set, (2) sets open->op_stateid, (3) sets open->op_delegation.
463 status = nfsd4_process_open2(rqstp, resfh, open);
464 WARN_ON(status && open->op_created);
466 if (resfh && resfh != &cstate->current_fh) {
467 fh_dup2(&cstate->current_fh, resfh);
471 nfsd4_cleanup_open_state(open, status);
472 if (open->op_openowner && !nfsd4_has_session(cstate))
473 cstate->replay_owner = &open->op_openowner->oo_owner;
474 nfsd4_bump_seqid(cstate, status);
475 if (!cstate->replay_owner)
481 * OPEN is the only seqid-mutating operation whose decoding can fail
482 * with a seqid-mutating error (specifically, decoding of user names in
483 * the attributes). Therefore we have to do some processing to look up
484 * the stateowner so that we can bump the seqid.
/*
 * OPEN wrapper called from nfsd4_proc_compound() for OP_OPEN.
 * The visible checks look at seqid_mutating_err(ntohl(op->status)) and at
 * nfsd4_has_session(cstate); what is returned in those cases is not visible
 * in this excerpt.  Otherwise the status already present in op->status is
 * stashed in open->op_xdr_error and nfsd4_open() is run.
 */
486 static __be32 nfsd4_open_omfg(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate, struct nfsd4_op *op)
488 struct nfsd4_open *open = (struct nfsd4_open *)&op->u;
490 if (!seqid_mutating_err(ntohl(op->status)))
492 if (nfsd4_has_session(cstate))
494 open->op_xdr_error = op->status;
495 return nfsd4_open(rqstp, cstate, open);
499 * filehandle-manipulating ops.
/*
 * GETFH: return nfserr_nofilehandle when there is no current filehandle
 * (fh_dentry is NULL); otherwise point *getfh at cstate->current_fh.
 */
502 nfsd4_getfh(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
503 struct svc_fh **getfh)
505 if (!cstate->current_fh.fh_dentry)
506 return nfserr_nofilehandle;
508 *getfh = &cstate->current_fh;
/*
 * PUTFH: drop the current filehandle, load the handle supplied in @putfh
 * (size pf_fhlen, bytes pf_fhval) into cstate->current_fh.fh_handle, and
 * validate it with fh_verify() using NFSD_MAY_BYPASS_GSS.  The length
 * argument of the memcpy() is on a line not visible in this excerpt.
 */
513 nfsd4_putfh(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
514 struct nfsd4_putfh *putfh)
516 fh_put(&cstate->current_fh);
517 cstate->current_fh.fh_handle.fh_size = putfh->pf_fhlen;
518 memcpy(&cstate->current_fh.fh_handle.fh_base, putfh->pf_fhval,
520 return fh_verify(rqstp, &cstate->current_fh, 0, NFSD_MAY_BYPASS_GSS);
/*
 * PUTROOTFH: drop the current filehandle and fill it again through
 * exp_pseudoroot().  The use of the returned status is not visible in this
 * excerpt.
 */
524 nfsd4_putrootfh(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
529 fh_put(&cstate->current_fh);
530 status = exp_pseudoroot(rqstp, &cstate->current_fh);
/*
 * RESTOREFH: fail with nfserr_restorefh when nothing was saved
 * (save_fh.fh_dentry is NULL); otherwise fh_dup2() the saved filehandle into
 * current_fh.  When SAVED_STATE_ID_FLAG is set, the saved stateid is copied
 * into current_stateid and CURRENT_STATE_ID_FLAG is set.
 */
535 nfsd4_restorefh(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
538 if (!cstate->save_fh.fh_dentry)
539 return nfserr_restorefh;
541 fh_dup2(&cstate->current_fh, &cstate->save_fh);
542 if (HAS_STATE_ID(cstate, SAVED_STATE_ID_FLAG)) {
543 memcpy(&cstate->current_stateid, &cstate->save_stateid, sizeof(stateid_t));
544 SET_STATE_ID(cstate, CURRENT_STATE_ID_FLAG);
/*
 * SAVEFH: fail with nfserr_nofilehandle when there is no current filehandle;
 * otherwise fh_dup2() current_fh into save_fh.  When CURRENT_STATE_ID_FLAG
 * is set, the current stateid is copied into save_stateid and
 * SAVED_STATE_ID_FLAG is set.
 */
550 nfsd4_savefh(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
553 if (!cstate->current_fh.fh_dentry)
554 return nfserr_nofilehandle;
556 fh_dup2(&cstate->save_fh, &cstate->current_fh);
557 if (HAS_STATE_ID(cstate, CURRENT_STATE_ID_FLAG)) {
558 memcpy(&cstate->save_stateid, &cstate->current_stateid, sizeof(stateid_t));
559 SET_STATE_ID(cstate, SAVED_STATE_ID_FLAG);
/*
 * ACCESS: the request mask is tested for bits outside NFS3_ACCESS_FULL (the
 * status returned for that case is on a line not visible in this excerpt).
 * Otherwise ac_resp_access is seeded with the requested bits and
 * nfsd_access() is called on the current filehandle with pointers to
 * ac_resp_access and ac_supported.
 */
568 nfsd4_access(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
569 struct nfsd4_access *access)
571 if (access->ac_req_access & ~NFS3_ACCESS_FULL)
574 access->ac_resp_access = access->ac_req_access;
575 return nfsd_access(rqstp, &cstate->current_fh, &access->ac_resp_access,
576 &access->ac_supported);
/*
 * Build a verifier from the nfsd boot time of @net: the tv_sec and tv_usec
 * fields of nn->nfssvc_boot are stored as two __be32 words without byte
 * swapping and then copied into verifier->data.
 */
579 static void gen_boot_verifier(nfs4_verifier *verifier, struct net *net)
582 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
585 * This is opaque to client, so no need to byte-swap. Use
586 * __force to keep sparse happy
588 verf[0] = (__force __be32)nn->nfssvc_boot.tv_sec;
589 verf[1] = (__force __be32)nn->nfssvc_boot.tv_usec;
590 memcpy(verifier->data, verf, sizeof(verifier->data));
/*
 * COMMIT: fill co_verf with the boot verifier, then call nfsd_commit() on
 * the current filehandle starting at co_offset.  The remaining arguments of
 * that call are cut off in this excerpt.
 */
594 nfsd4_commit(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
595 struct nfsd4_commit *commit)
597 gen_boot_verifier(&commit->co_verf, SVC_NET(rqstp));
598 return nfsd_commit(rqstp, &cstate->current_fh, commit->co_offset,
/*
 * CREATE operation.  Visible flow:
 *
 *  - fh_verify() the current filehandle as a directory (S_IFDIR), then
 *    check_attr_support() on cr_bmval.
 *  - Switch on cr_type (the case labels are not visible in this excerpt):
 *    nfsd_symlink() in one case, and nfsd_create() with S_IFBLK, S_IFCHR,
 *    S_IFSOCK, S_IFIFO or S_IFDIR in the others; nfserr_badtype is also
 *    assigned in one branch (presumably the default -- confirm).
 *  - For the block and character device cases the device number is built
 *    with MKDEV(cr_specdata1, cr_specdata2) and tested to round-trip
 *    through MAJOR()/MINOR() (status on mismatch not shown).
 *  - ATTR_SIZE is cleared from cr_iattr before creating a directory.
 *  - Afterwards an optional security label and ACL are applied to the new
 *    object, the parent is unlocked, change info is recorded in cr_cinfo,
 *    and the new object becomes the current filehandle via fh_dup2().
 */
603 nfsd4_create(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
604 struct nfsd4_create *create)
610 fh_init(&resfh, NFS4_FHSIZE);
612 status = fh_verify(rqstp, &cstate->current_fh, S_IFDIR,
617 status = check_attr_support(rqstp, cstate, create->cr_bmval,
622 switch (create->cr_type) {
624 status = nfsd_symlink(rqstp, &cstate->current_fh,
625 create->cr_name, create->cr_namelen,
627 &resfh, &create->cr_iattr);
631 rdev = MKDEV(create->cr_specdata1, create->cr_specdata2);
632 if (MAJOR(rdev) != create->cr_specdata1 ||
633 MINOR(rdev) != create->cr_specdata2)
635 status = nfsd_create(rqstp, &cstate->current_fh,
636 create->cr_name, create->cr_namelen,
637 &create->cr_iattr, S_IFBLK, rdev, &resfh);
641 rdev = MKDEV(create->cr_specdata1, create->cr_specdata2);
642 if (MAJOR(rdev) != create->cr_specdata1 ||
643 MINOR(rdev) != create->cr_specdata2)
645 status = nfsd_create(rqstp, &cstate->current_fh,
646 create->cr_name, create->cr_namelen,
647 &create->cr_iattr,S_IFCHR, rdev, &resfh);
651 status = nfsd_create(rqstp, &cstate->current_fh,
652 create->cr_name, create->cr_namelen,
653 &create->cr_iattr, S_IFSOCK, 0, &resfh);
657 status = nfsd_create(rqstp, &cstate->current_fh,
658 create->cr_name, create->cr_namelen,
659 &create->cr_iattr, S_IFIFO, 0, &resfh);
663 create->cr_iattr.ia_valid &= ~ATTR_SIZE;
664 status = nfsd_create(rqstp, &cstate->current_fh,
665 create->cr_name, create->cr_namelen,
666 &create->cr_iattr, S_IFDIR, 0, &resfh);
670 status = nfserr_badtype;
676 if (create->cr_label.len)
677 nfsd4_security_inode_setsecctx(&resfh, &create->cr_label, create->cr_bmval);
679 if (create->cr_acl != NULL)
680 do_set_nfs4_acl(rqstp, &resfh, create->cr_acl,
683 fh_unlock(&cstate->current_fh);
684 set_change_info(&create->cr_cinfo, &cstate->current_fh);
685 fh_dup2(&cstate->current_fh, &resfh);
/*
 * GETATTR: verify the current filehandle, test for write-only attribute
 * bits in word 1 (status for that case not visible in this excerpt), mask
 * the requested bitmap down to the attributes supported for this minor
 * version, and record the current filehandle in ga_fhp.
 */
692 nfsd4_getattr(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
693 struct nfsd4_getattr *getattr)
697 status = fh_verify(rqstp, &cstate->current_fh, 0, NFSD_MAY_NOP);
701 if (getattr->ga_bmval[1] & NFSD_WRITEONLY_ATTRS_WORD1)
704 getattr->ga_bmval[0] &= nfsd_suppattrs0(cstate->minorversion);
705 getattr->ga_bmval[1] &= nfsd_suppattrs1(cstate->minorversion);
706 getattr->ga_bmval[2] &= nfsd_suppattrs2(cstate->minorversion);
708 getattr->ga_fhp = &cstate->current_fh;
/*
 * LINK: status is preset to nfserr_nofilehandle before save_fh.fh_dentry is
 * tested, so a missing saved filehandle is reported that way.  nfsd_link()
 * is called with current_fh, the name li_name/li_namelen and save_fh, and
 * li_cinfo is filled from current_fh via set_change_info() (the condition
 * on that call, if any, is not visible in this excerpt).
 */
713 nfsd4_link(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
714 struct nfsd4_link *link)
716 __be32 status = nfserr_nofilehandle;
718 if (!cstate->save_fh.fh_dentry)
720 status = nfsd_link(rqstp, &cstate->current_fh,
721 link->li_name, link->li_namelen, &cstate->save_fh);
723 set_change_info(&link->li_cinfo, &cstate->current_fh);
/*
 * Look up ".." of @fh with nfsd_lookup(), passing @fh as both the directory
 * and the result handle.  The pseudo-root is fetched first with
 * exp_pseudoroot() and its dentry compared with fh->fh_dentry; what happens
 * when they match is not visible in this excerpt.
 */
727 static __be32 nfsd4_do_lookupp(struct svc_rqst *rqstp, struct svc_fh *fh)
729 struct svc_fh tmp_fh;
732 fh_init(&tmp_fh, NFS4_FHSIZE);
733 ret = exp_pseudoroot(rqstp, &tmp_fh);
736 if (tmp_fh.fh_dentry == fh->fh_dentry) {
741 return nfsd_lookup(rqstp, fh, "..", 2, fh);
/* LOOKUPP: thin wrapper that runs nfsd4_do_lookupp() on the current filehandle. */
745 nfsd4_lookupp(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
748 return nfsd4_do_lookupp(rqstp, &cstate->current_fh);
/*
 * LOOKUP: look up lo_name (length lo_len) with nfsd_lookup(); current_fh is
 * passed as both the directory argument and the result argument.
 */
752 nfsd4_lookup(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
753 struct nfsd4_lookup *lookup)
755 return nfsd_lookup(rqstp, &cstate->current_fh,
756 lookup->lo_name, lookup->lo_len,
757 &cstate->current_fh);
/*
 * READ: prepare @read; no data is transferred in the visible code.
 *  - rd_filp starts as NULL; offsets >= OFFSET_MAX are tested (status not
 *    visible in this excerpt).
 *  - rq_splice_ok is cleared unless this is the last op of the compound,
 *    for the ordering reason given in the comment below.
 *  - The stateid is checked with nfs4_preprocess_stateid_op(RD_STATE),
 *    which is also handed &read->rd_filp.
 *  - rd_rqstp and rd_fhp are recorded.
 */
761 nfsd4_read(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
762 struct nfsd4_read *read)
766 /* no need to check permission - this will be done in nfsd_read() */
768 read->rd_filp = NULL;
769 if (read->rd_offset >= OFFSET_MAX)
773 * If we do a zero copy read, then a client will see read data
774 * that reflects the state of the file *after* performing the
775 * following compound.
777 * To ensure proper ordering, we therefore turn off zero copy if
778 * the client wants us to do more in this compound:
780 if (!nfsd4_last_compound_op(rqstp))
781 rqstp->rq_splice_ok = false;
784 if ((status = nfs4_preprocess_stateid_op(SVC_NET(rqstp),
785 cstate, &read->rd_stateid,
786 RD_STATE, &read->rd_filp))) {
787 dprintk("NFSD: nfsd4_read: couldn't process stateid!\n");
792 read->rd_rqstp = rqstp;
793 read->rd_fhp = &cstate->current_fh;
/*
 * READDIR: validate the request and record where to read from; the
 * directory itself is not read in the visible code.
 *  - Write-only attribute bits in word 1 are tested (status not visible in
 *    this excerpt) and the bitmap is masked to the supported attributes.
 *  - Cookies 1 and 2, and cookie 0 combined with a non-zero verifier, are
 *    rejected with nfserr_bad_cookie.
 *  - rd_rqstp and rd_fhp are recorded.
 */
798 nfsd4_readdir(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
799 struct nfsd4_readdir *readdir)
801 u64 cookie = readdir->rd_cookie;
802 static const nfs4_verifier zeroverf;
804 /* no need to check permission - this will be done in nfsd_readdir() */
806 if (readdir->rd_bmval[1] & NFSD_WRITEONLY_ATTRS_WORD1)
809 readdir->rd_bmval[0] &= nfsd_suppattrs0(cstate->minorversion);
810 readdir->rd_bmval[1] &= nfsd_suppattrs1(cstate->minorversion);
811 readdir->rd_bmval[2] &= nfsd_suppattrs2(cstate->minorversion);
813 if ((cookie == 1) || (cookie == 2) ||
814 (cookie == 0 && memcmp(readdir->rd_verf.data, zeroverf.data, NFS4_VERIFIER_SIZE)))
815 return nfserr_bad_cookie;
817 readdir->rd_rqstp = rqstp;
818 readdir->rd_fhp = &cstate->current_fh;
/*
 * READLINK: only records the request and the current filehandle in
 * @readlink (rl_rqstp, rl_fhp); no link is read in the visible code.
 */
823 nfsd4_readlink(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
824 struct nfsd4_readlink *readlink)
826 readlink->rl_rqstp = rqstp;
827 readlink->rl_fhp = &cstate->current_fh;
/*
 * REMOVE: locks_in_grace() is tested first (the status returned during the
 * grace period is on a line not visible in this excerpt).  rm_name is then
 * unlinked from the current filehandle with nfsd_unlink(), the filehandle
 * is unlocked and change info is recorded in rm_cinfo (any condition on
 * those last two steps is not visible here).
 */
832 nfsd4_remove(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
833 struct nfsd4_remove *remove)
837 if (locks_in_grace(SVC_NET(rqstp)))
839 status = nfsd_unlink(rqstp, &cstate->current_fh, 0,
840 remove->rm_name, remove->rm_namelen);
842 fh_unlock(&cstate->current_fh);
843 set_change_info(&remove->rm_cinfo, &cstate->current_fh);
/*
 * RENAME: rename rn_sname, looked up relative to the saved filehandle, to
 * rn_tname relative to the current filehandle.
 *
 * status is preset to nfserr_nofilehandle before save_fh.fh_dentry is
 * tested.  During the grace period a second test applies to exports without
 * NFSEXP_NOSUBTREECHECK (the status returned is on a line not visible in
 * this excerpt).
 *
 * nfsd_rename() is given save_fh as the source directory and current_fh as
 * the target directory, so the source change info (rn_sinfo) is taken from
 * save_fh and the target change info (rn_tinfo) from current_fh.  The
 * previous code had these two filehandles swapped.
 */
849 nfsd4_rename(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
850 struct nfsd4_rename *rename)
852 __be32 status = nfserr_nofilehandle;
854 if (!cstate->save_fh.fh_dentry)
856 if (locks_in_grace(SVC_NET(rqstp)) &&
857 !(cstate->save_fh.fh_export->ex_flags & NFSEXP_NOSUBTREECHECK))
859 status = nfsd_rename(rqstp, &cstate->save_fh, rename->rn_sname,
860 rename->rn_snamelen, &cstate->current_fh,
861 rename->rn_tname, rename->rn_tnamelen);
864 set_change_info(&rename->rn_sinfo, &cstate->save_fh);
865 set_change_info(&rename->rn_tinfo, &cstate->current_fh);
/*
 * SECINFO: verify that the current filehandle is a directory with
 * NFSD_MAY_EXEC access, look up si_name with nfsd_lookup_dentry(), test for
 * a negative dentry (d_inode == NULL; the handling is not visible in this
 * excerpt), and store the resulting export in si_exp.  When
 * cstate->minorversion is non-zero the current filehandle is released
 * afterwards.
 */
870 nfsd4_secinfo(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
871 struct nfsd4_secinfo *secinfo)
874 struct svc_export *exp;
875 struct dentry *dentry;
878 fh_init(&resfh, NFS4_FHSIZE);
879 err = fh_verify(rqstp, &cstate->current_fh, S_IFDIR, NFSD_MAY_EXEC);
882 err = nfsd_lookup_dentry(rqstp, &cstate->current_fh,
883 secinfo->si_name, secinfo->si_namelen,
887 if (dentry->d_inode == NULL) {
891 secinfo->si_exp = exp;
893 if (cstate->minorversion)
894 /* See rfc 5661 section 2.6.3.1.1.8 */
895 fh_put(&cstate->current_fh);
/*
 * SECINFO_NO_NAME: for NFS4_SECINFO_STYLE4_PARENT the current filehandle is
 * first moved to its parent with nfsd4_do_lookupp(); the handling of other
 * styles is not visible in this excerpt.  A reference to the export of the
 * current filehandle is then stored in sin_exp and the current filehandle
 * is released.
 */
900 nfsd4_secinfo_no_name(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
901 struct nfsd4_secinfo_no_name *sin)
905 switch (sin->sin_style) {
906 case NFS4_SECINFO_STYLE4_CURRENT_FH:
908 case NFS4_SECINFO_STYLE4_PARENT:
909 err = nfsd4_do_lookupp(rqstp, &cstate->current_fh);
917 sin->sin_exp = exp_get(cstate->current_fh.fh_export);
918 fh_put(&cstate->current_fh);
/*
 * SETATTR.  Visible flow:
 *  - When the size is being changed (ATTR_SIZE) the stateid is checked with
 *    nfs4_preprocess_stateid_op() for WR_STATE.
 *  - fh_want_write() is called on the current filehandle; its error is
 *    returned via nfserrno().
 *  - check_attr_support() validates sa_bmval.
 *  - An ACL (sa_acl) and a security label (sa_label) are applied when
 *    present, then nfsd_setattr() applies sa_iattr.
 *  - fh_drop_write() is called on the current filehandle.
 * The error checks and jumps between these steps are not visible in this
 * excerpt.
 */
923 nfsd4_setattr(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
924 struct nfsd4_setattr *setattr)
926 __be32 status = nfs_ok;
929 if (setattr->sa_iattr.ia_valid & ATTR_SIZE) {
930 status = nfs4_preprocess_stateid_op(SVC_NET(rqstp), cstate,
931 &setattr->sa_stateid, WR_STATE, NULL);
933 dprintk("NFSD: nfsd4_setattr: couldn't process stateid!\n");
937 err = fh_want_write(&cstate->current_fh);
939 return nfserrno(err);
942 status = check_attr_support(rqstp, cstate, setattr->sa_bmval,
947 if (setattr->sa_acl != NULL)
948 status = nfsd4_set_nfs4_acl(rqstp, &cstate->current_fh,
952 if (setattr->sa_label.len)
953 status = nfsd4_set_nfs4_label(rqstp, &cstate->current_fh,
957 status = nfsd_setattr(rqstp, &cstate->current_fh, &setattr->sa_iattr,
960 fh_drop_write(&cstate->current_fh);
/*
 * Describe the WRITE payload as a kvec array.  vec[0] covers the head
 * buffer (at most wr_buflen bytes of wr_head); each further vec[i] covers
 * page wr_pagelist[i - 1], at most PAGE_SIZE bytes, with the remaining
 * length counted down in buflen.  The loop construct and the return value
 * are not visible in this excerpt (nfsd4_write() stores the result as
 * nvecs).
 */
964 static int fill_in_write_vector(struct kvec *vec, struct nfsd4_write *write)
967 int buflen = write->wr_buflen;
969 vec[0].iov_base = write->wr_head.iov_base;
970 vec[0].iov_len = min_t(int, buflen, write->wr_head.iov_len);
971 buflen -= vec[0].iov_len;
974 vec[i].iov_base = page_address(write->wr_pagelist[i - 1]);
975 vec[i].iov_len = min_t(int, PAGE_SIZE, buflen);
976 buflen -= vec[i].iov_len;
/*
 * WRITE.  Visible flow:
 *  - Offsets >= OFFSET_MAX are tested (status not visible in this excerpt).
 *  - The stateid is checked with nfs4_preprocess_stateid_op(WR_STATE),
 *    which is also handed &filp.
 *  - wr_how_written starts as the requested wr_stable_how and wr_verifier
 *    is filled from the boot verifier.
 *  - The payload is described in rqstp->rq_vec by fill_in_write_vector();
 *    a vector count above the array size only triggers WARN_ON_ONCE here.
 *  - nfsd_write() does the write; cnt goes in as wr_buflen and the value it
 *    holds afterwards is stored in wr_bytes_written.
 */
983 nfsd4_write(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
984 struct nfsd4_write *write)
986 stateid_t *stateid = &write->wr_stateid;
987 struct file *filp = NULL;
988 __be32 status = nfs_ok;
992 /* no need to check permission - this will be done in nfsd_write() */
994 if (write->wr_offset >= OFFSET_MAX)
997 status = nfs4_preprocess_stateid_op(SVC_NET(rqstp),
998 cstate, stateid, WR_STATE, &filp);
1000 dprintk("NFSD: nfsd4_write: couldn't process stateid!\n");
1004 cnt = write->wr_buflen;
1005 write->wr_how_written = write->wr_stable_how;
1006 gen_boot_verifier(&write->wr_verifier, SVC_NET(rqstp));
1008 nvecs = fill_in_write_vector(rqstp->rq_vec, write);
1009 WARN_ON_ONCE(nvecs > ARRAY_SIZE(rqstp->rq_vec));
1011 status = nfsd_write(rqstp, &cstate->current_fh, filp,
1012 write->wr_offset, rqstp->rq_vec, nvecs,
1013 &cnt, &write->wr_how_written);
1017 write->wr_bytes_written = cnt;
1022 /* This routine never returns NFS_OK! If there are no other errors, it
1023 * will return NFSERR_SAME or NFSERR_NOT_SAME depending on whether the
1024 * attributes matched. VERIFY is implemented by mapping NFSERR_SAME
1025 * to NFS_OK after the call; NVERIFY by mapping NFSERR_NOT_SAME to NFS_OK.
/*
 * Shared body of VERIFY and NVERIFY.
 *
 * Verifies the current filehandle and validates ve_bmval with
 * check_attr_support() (NULL writable mask).  FATTR4_WORD0_RDATTR_ERROR,
 * write-only attributes in word 1, and an attribute length that is not a
 * multiple of 4 are rejected with nfserr_inval.  The current attributes are
 * then encoded into a temporary buffer of count = 4 + ve_attrlen / 4 32-bit
 * words with nfsd4_encode_fattr_to_buf(); allocation failure yields
 * nfserr_jukebox.
 *
 * nfserr_resource from the encoder is mapped to nfserr_not_same.  After
 * skipping the encoded bitmap, the result is nfserr_same only when the
 * encoded attribute length equals ve_attrlen and the bytes match
 * ve_attrval; otherwise it stays nfserr_not_same.
 */
1028 _nfsd4_verify(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
1029 struct nfsd4_verify *verify)
1035 status = fh_verify(rqstp, &cstate->current_fh, 0, NFSD_MAY_NOP);
1039 status = check_attr_support(rqstp, cstate, verify->ve_bmval, NULL);
1043 if ((verify->ve_bmval[0] & FATTR4_WORD0_RDATTR_ERROR)
1044 || (verify->ve_bmval[1] & NFSD_WRITEONLY_ATTRS_WORD1))
1045 return nfserr_inval;
1046 if (verify->ve_attrlen & 3)
1047 return nfserr_inval;
1050 * bitmap_len(1) + bitmap(2) + attr_len(1) = 4
1052 count = 4 + (verify->ve_attrlen >> 2);
1053 buf = kmalloc(count << 2, GFP_KERNEL);
1055 return nfserr_jukebox;
1058 status = nfsd4_encode_fattr_to_buf(&p, count, &cstate->current_fh,
1059 cstate->current_fh.fh_export,
1060 cstate->current_fh.fh_dentry,
1064 * If nfsd4_encode_fattr() ran out of space, assume that's because
1065 * the attributes are longer (hence different) than those given:
1067 if (status == nfserr_resource)
1068 status = nfserr_not_same;
1073 p = buf + 1 + ntohl(buf[0]);
1074 status = nfserr_not_same;
1075 if (ntohl(*p++) != verify->ve_attrlen)
1077 if (!memcmp(p, verify->ve_attrval, verify->ve_attrlen))
1078 status = nfserr_same;
/*
 * NVERIFY: returns nfs_ok when _nfsd4_verify() reports nfserr_not_same;
 * every other status is passed through unchanged.
 */
1086 nfsd4_nverify(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
1087 struct nfsd4_verify *verify)
1091 status = _nfsd4_verify(rqstp, cstate, verify);
1092 return status == nfserr_not_same ? nfs_ok : status;
/*
 * VERIFY: returns nfs_ok when _nfsd4_verify() reports nfserr_same; every
 * other status is passed through unchanged.
 */
1096 nfsd4_verify(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
1097 struct nfsd4_verify *verify)
1101 status = _nfsd4_verify(rqstp, cstate, verify);
1102 return status == nfserr_same ? nfs_ok : status;
1109 nfsd4_proc_null(struct svc_rqst *rqstp, void *argp, void *resp)
/*
 * Bump the per-operation counter nfsdstats.nfs4_opcount[opnum].  Values of
 * @opnum outside FIRST_NFS4_OP..LAST_NFS4_OP are ignored.
 */
1114 static inline void nfsd4_increment_op_stats(u32 opnum)
1116 if (opnum >= FIRST_NFS4_OP && opnum <= LAST_NFS4_OP)
1117 nfsdstats.nfs4_opcount[opnum]++;
/*
 * Function pointer types used by struct nfsd4_operation: the op handler
 * (nfsd4op_func, returns __be32; its last parameter is cut off in this
 * excerpt), the reply size estimator (nfsd4op_rsize, returns u32), and the
 * current-stateid setter and getter hooks.
 */
1120 typedef __be32(*nfsd4op_func)(struct svc_rqst *, struct nfsd4_compound_state *,
1122 typedef u32(*nfsd4op_rsize)(struct svc_rqst *, struct nfsd4_op *op);
1123 typedef void(*stateid_setter)(struct nfsd4_compound_state *, void *);
1124 typedef void(*stateid_getter)(struct nfsd4_compound_state *, void *);
/*
 * Per-operation flag bits; code in this file tests them against the
 * op_flags member of the nfsd4_ops[] descriptors.
 */
1126 enum nfsd4_op_flags {
1127 ALLOWED_WITHOUT_FH = 1 << 0, /* No current filehandle required */
1128 ALLOWED_ON_ABSENT_FS = 1 << 1, /* ops processed on absent fs */
1129 ALLOWED_AS_FIRST_OP = 1 << 2, /* ops required first in compound */
1130 /* For rfc 5661 section 2.6.3.1.1: */
1131 OP_HANDLES_WRONGSEC = 1 << 3,
1132 OP_IS_PUTFH_LIKE = 1 << 4,
1134 * These are the ops whose result size we estimate before
1135 * encoding, to avoid performing an op then not being able to
1136 * respond or cache a response. This includes writes and setattrs
1137 * as well as the operations usually called "nonidempotent":
1139 OP_MODIFIES_SOMETHING = 1 << 5,
1141 * Cache compounds containing these ops in the xid-based drc:
1142 * We use the DRC for compounds containing non-idempotent
1143 * operations, *except* those that are 4.1-specific (since
1144 * sessions provide their own EOS), and except for stateful
1145 * operations other than setclientid and setclientid_confirm
1146 * (since sequence numbers provide EOS for open, lock, etc in
1149 OP_CACHEME = 1 << 6,
1151 * These are ops which clear current state id.
1153 OP_CLEAR_STATEID = 1 << 7,
/*
 * Descriptor for one NFSv4 operation: the handler (op_func), the reply size
 * estimator (op_rsize_bop) and the hooks that get and set the current
 * stateid.  Members declared between op_func and op_rsize_bop are not
 * visible in this excerpt.
 */
1156 struct nfsd4_operation {
1157 nfsd4op_func op_func;
1160 /* Try to get response size before operation */
1161 nfsd4op_rsize op_rsize_bop;
1162 stateid_getter op_get_currentstateid;
1163 stateid_setter op_set_currentstateid;
1166 static struct nfsd4_operation nfsd4_ops[];
1168 static const char *nfsd4_op_name(unsigned opnum);
1171 * Enforce NFSv4.1 COMPOUND ordering rules:
1173 * Also note, enforced elsewhere:
1174 * - SEQUENCE other than as first op results in
1175 * NFS4ERR_SEQUENCE_POS. (Enforced in nfsd4_sequence().)
1176 * - BIND_CONN_TO_SESSION must be the only op in its compound.
1177 * (Enforced in nfsd4_bind_conn_to_session().)
1178 * - DESTROY_SESSION must be the final operation in a compound, if
1179 * sessionid's in SEQUENCE and DESTROY_SESSION are the same.
1180 * (Enforced in nfsd4_destroy_session().)
/*
 * Checks the first operation of a compound (args->ops[0]).  Minor version 0
 * and an empty compound are tested for first, as is a first op whose status
 * is already nfserr_op_illegal; the values returned in those cases are not
 * visible in this excerpt.  A first op lacking ALLOWED_AS_FIRST_OP yields
 * nfserr_op_not_in_session.  OP_SEQUENCE is tested next (result not
 * visible), and after that a compound with more than one op yields
 * nfserr_not_only_op.
 */
1182 static __be32 nfs41_check_op_ordering(struct nfsd4_compoundargs *args)
1184 struct nfsd4_op *op = &args->ops[0];
1186 /* These ordering requirements don't apply to NFSv4.0: */
1187 if (args->minorversion == 0)
1189 /* This is weird, but OK, not our problem: */
1190 if (args->opcnt == 0)
1192 if (op->status == nfserr_op_illegal)
1194 if (!(nfsd4_ops[op->opnum].op_flags & ALLOWED_AS_FIRST_OP))
1195 return nfserr_op_not_in_session;
1196 if (op->opnum == OP_SEQUENCE)
1198 if (args->opcnt != 1)
1199 return nfserr_not_only_op;
/*
 * Return the nfsd4_ops[] descriptor for @op, indexed by op->opnum.  No range
 * check on opnum is made here.
 */
1203 static inline struct nfsd4_operation *OPDESC(struct nfsd4_op *op)
1205 return &nfsd4_ops[op->opnum];
/*
 * Reports whether the descriptor of @op has OP_CACHEME set.  OP_ILLEGAL is
 * tested first; the value returned in that case is not visible in this
 * excerpt.
 */
1208 bool nfsd4_cache_this_op(struct nfsd4_op *op)
1210 if (op->opnum == OP_ILLEGAL)
1212 return OPDESC(op)->op_flags & OP_CACHEME;
1215 static bool need_wrongsec_check(struct svc_rqst *rqstp)
1217 struct nfsd4_compoundres *resp = rqstp->rq_resp;
1218 struct nfsd4_compoundargs *argp = rqstp->rq_argp;
1219 struct nfsd4_op *this = &argp->ops[resp->opcnt - 1];
1220 struct nfsd4_op *next = &argp->ops[resp->opcnt];
1221 struct nfsd4_operation *thisd;
1222 struct nfsd4_operation *nextd;
1224 thisd = OPDESC(this);
1226 * Most ops check wrongsec on their own; only the putfh-like ops
1227 * have special rules.
1229 if (!(thisd->op_flags & OP_IS_PUTFH_LIKE))
1232 * rfc 5661 2.6.3.1.1.6: don't bother erroring out a
1233 * put-filehandle operation if we're not going to use the
1236 if (argp->opcnt == resp->opcnt)
1239 nextd = OPDESC(next);
1241 * Rest of 2.6.3.1.1: certain operations will return WRONGSEC
1242 * errors themselves as necessary; others should check for them
1245 return !(nextd->op_flags & OP_HANDLES_WRONGSEC);
/*
 * Point the reply xdr_stream of @resp at the head kvec of rqstp->rq_res:
 *  - xdr->p starts right after the bytes already in the head,
 *  - xdr->end is PAGE_SIZE past the start of the head, less rq_auth_slack,
 *  - buf->len is set to the current head length,
 *  - the scratch length is zeroed and page_ptr set to one before buf->pages,
 *  - buf->buflen is PAGE_SIZE times (1 + the number of pages from
 *    buf->pages to rq_page_end), less rq_auth_slack.
 * Statements on the lines missing from this excerpt are not described.
 */
1248 static void svcxdr_init_encode(struct svc_rqst *rqstp,
1249 struct nfsd4_compoundres *resp)
1251 struct xdr_stream *xdr = &resp->xdr;
1252 struct xdr_buf *buf = &rqstp->rq_res;
1253 struct kvec *head = buf->head;
1257 xdr->p = head->iov_base + head->iov_len;
1258 xdr->end = head->iov_base + PAGE_SIZE - rqstp->rq_auth_slack;
1259 /* Tail and page_len should be zero at this point: */
1260 buf->len = buf->head[0].iov_len;
1261 xdr->scratch.iov_len = 0;
1262 xdr->page_ptr = buf->pages - 1;
1263 buf->buflen = PAGE_SIZE * (1 + rqstp->rq_page_end - buf->pages)
1264 - rqstp->rq_auth_slack;
/*
 * nfsd4_proc_compound - run the operations of one NFSv4 COMPOUND request
 * and encode each result into @resp.
 *
 * @rqstp: the RPC request being served
 * @args:  decoded compound arguments (tag, minorversion, ops[], opcnt)
 * @resp:  compound result; it also carries the per-compound state (cstate)
 *
 * Steps visible in this listing:
 *  - set up the reply encoder and reserve 8 + taglen bytes for the
 *    taglen, tag and opcnt fields;
 *  - initialise the current and saved filehandles;
 *  - switch rq_usedeferral off while the compound runs and back on at
 *    the end;
 *  - check the minor version, then the operation ordering
 *    (nfs41_check_op_ordering);
 *  - for each op: filehandle checks, a reply-space check for
 *    OP_MODIFIES_SOMETHING ops, the current-stateid hooks around op_func,
 *    the wrongsec check, and finally encoding of the op's result;
 *  - store the final status in cstate->status.
 *
 * NOTE(review): this listing omits some short lines (braces, gotos,
 * labels, the declaration of status), so the exact branch structure
 * between the steps below must be confirmed against the complete file.
 */
1271 nfsd4_proc_compound(struct svc_rqst *rqstp,
1272 struct nfsd4_compoundargs *args,
1273 struct nfsd4_compoundres *resp)
1275 struct nfsd4_op *op;
1276 struct nfsd4_operation *opdesc;
1277 struct nfsd4_compound_state *cstate = &resp->cstate;
1278 struct svc_fh *current_fh = &cstate->current_fh;
1279 struct svc_fh *save_fh = &cstate->save_fh;
1282 svcxdr_init_encode(rqstp, resp);
/* Remember where the tag will be written in the reply. */
1283 resp->tagp = resp->xdr.p;
1284 /* reserve space for: taglen, tag, and opcnt */
1285 xdr_reserve_space(&resp->xdr, 8 + args->taglen);
1286 resp->taglen = args->taglen;
1287 resp->tag = args->tag;
1288 resp->rqstp = rqstp;
1289 cstate->minorversion = args->minorversion;
1290 fh_init(current_fh, NFS4_FHSIZE);
1291 fh_init(save_fh, NFS4_FHSIZE);
1293 * Don't use the deferral mechanism for NFSv4; compounds make it
1294 * too hard to avoid non-idempotency problems.
1296 rqstp->rq_usedeferral = false;
1299 * According to RFC3010, this takes precedence over all other errors.
1301 status = nfserr_minor_vers_mismatch;
1302 if (nfsd_minorversion(args->minorversion, NFSD_TEST) <= 0)
1305 status = nfs41_check_op_ordering(args);
1308 op->status = status;
/* Stop at the first failing op or when every op has been processed. */
1312 while (!status && resp->opcnt < args->opcnt) {
/* resp->opcnt is advanced here, so from now on it already counts this op. */
1313 op = &args->ops[resp->opcnt++];
1315 dprintk("nfsv4 compound op #%d/%d: %d (%s)\n",
1316 resp->opcnt, args->opcnt, op->opnum,
1317 nfsd4_op_name(op->opnum));
1319 * The XDR decode routines may have pre-set op->status;
1320 * for example, if there is a miscellaneous XDR error
1321 * it will be set to nfserr_bad_xdr.
1324 if (op->opnum == OP_OPEN)
1325 op->status = nfsd4_open_omfg(rqstp, cstate, op);
1329 opdesc = OPDESC(op);
/*
 * Filehandle preconditions: without a current filehandle only ops flagged
 * ALLOWED_WITHOUT_FH may proceed; on a migrated export only ops flagged
 * ALLOWED_ON_ABSENT_FS may proceed.
 */
1331 if (!current_fh->fh_dentry) {
1332 if (!(opdesc->op_flags & ALLOWED_WITHOUT_FH)) {
1333 op->status = nfserr_nofilehandle;
1336 } else if (current_fh->fh_export->ex_fslocs.migrated &&
1337 !(opdesc->op_flags & ALLOWED_ON_ABSENT_FS)) {
1338 op->status = nfserr_moved;
1342 fh_clear_wcc(current_fh);
1344 /* If op is non-idempotent */
1345 if (opdesc->op_flags & OP_MODIFIES_SOMETHING) {
1347 * Don't execute this op if we couldn't encode a
/*
 * op_rsize_bop is called without a NULL check, so every nfsd4_ops[] entry
 * flagged OP_MODIFIES_SOMETHING has to provide an estimator.
 */
1350 u32 plen = opdesc->op_rsize_bop(rqstp, op);
1352 * Plus if there's another operation, make sure
1353 * we'll have space to at least encode an error:
1355 if (resp->opcnt < args->opcnt)
1356 plen += COMPOUND_ERR_SLACK_SPACE;
1357 op->status = nfsd4_check_resp_size(resp, plen);
/* Optional hooks run around the handler to load and store the current stateid. */
1363 if (opdesc->op_get_currentstateid)
1364 opdesc->op_get_currentstateid(cstate, &op->u);
1365 op->status = opdesc->op_func(rqstp, cstate, &op->u);
1368 if (opdesc->op_set_currentstateid)
1369 opdesc->op_set_currentstateid(cstate, &op->u);
1371 if (opdesc->op_flags & OP_CLEAR_STATEID)
1372 clear_current_stateid(cstate);
1374 if (need_wrongsec_check(rqstp))
1375 op->status = check_nfsd_access(current_fh->fh_export, rqstp);
1379 /* Only from SEQUENCE */
1380 if (cstate->status == nfserr_replay_cache) {
1381 dprintk("%s NFS4.1 replay from cache\n", __func__);
1382 status = op->status;
/*
 * nfserr_replay_me: encode the reply saved in the replay owner and adopt
 * its recorded status; the other visible path encodes the op's own result.
 */
1385 if (op->status == nfserr_replay_me) {
1386 op->replay = &cstate->replay_owner->so_replay;
1387 nfsd4_encode_replay(&resp->xdr, op);
1388 status = op->status = op->replay->rp_status;
1390 nfsd4_encode_operation(resp, op);
1391 status = op->status;
1394 dprintk("nfsv4 compound op %p opcnt %d #%d: %d: status %d\n",
1395 args->ops, args->opcnt, resp->opcnt, op->opnum,
1396 be32_to_cpu(status));
/* A replay owner left set by the op is released here, together with the state lock. */
1398 if (cstate->replay_owner) {
1399 nfs4_unlock_state();
1400 cstate->replay_owner = NULL;
1402 /* XXX Ugh, we need to get rid of this kind of special case: */
1403 if (op->opnum == OP_READ && op->u.read.rd_filp)
1404 fput(op->u.read.rd_filp);
1406 nfsd4_increment_op_stats(op->opnum);
1409 cstate->status = status;
/* No replay owner may still be set once the compound has been processed. */
1412 BUG_ON(cstate->replay_owner);
1414 /* Reset deferral mechanism for RPC deferrals */
1415 rqstp->rq_usedeferral = true;
1416 dprintk("nfsv4 compound returned %d\n", ntohl(status));
/*
 * Upper bounds on pieces of an encoded operation reply, counted in
 * 4-byte XDR words.  The *_rsize() estimators in this file add these up
 * and scale the sum by sizeof(__be32) to obtain a size in bytes.
 */
#define op_encode_hdr_size		(2)
#define op_encode_stateid_maxsz		(XDR_QUADLEN(NFS4_STATEID_SIZE))
#define op_encode_verifier_maxsz	(XDR_QUADLEN(NFS4_VERIFIER_SIZE))
#define op_encode_change_info_maxsz	(5)
#define nfs4_fattr_bitmap_maxsz		(4)

/* We'll fall back on returning no lockowner if we run out of space: */
#define op_encode_lockowner_maxsz	(0)
#define op_encode_lock_denied_maxsz	(8 + op_encode_lockowner_maxsz)

/* One word in front of an owner name of at most IDMAP_NAMESZ bytes. */
#define nfs4_owner_maxsz		(1 + XDR_QUADLEN(IDMAP_NAMESZ))

#define op_encode_ace_maxsz		(3 + nfs4_owner_maxsz)
#define op_encode_delegation_maxsz	(1 + op_encode_stateid_maxsz + 1 + \
					 op_encode_ace_maxsz)

#define op_encode_channel_attrs_maxsz	(6 + 1 + 1)
1438 static inline u32 nfsd4_only_status_rsize(struct svc_rqst *rqstp, struct nfsd4_op *op)
1440 return (op_encode_hdr_size) * sizeof(__be32);
1443 static inline u32 nfsd4_status_stateid_rsize(struct svc_rqst *rqstp, struct nfsd4_op *op)
1445 return (op_encode_hdr_size + op_encode_stateid_maxsz)* sizeof(__be32);
1448 static inline u32 nfsd4_commit_rsize(struct svc_rqst *rqstp, struct nfsd4_op *op)
1450 return (op_encode_hdr_size + op_encode_verifier_maxsz) * sizeof(__be32);
1453 static inline u32 nfsd4_create_rsize(struct svc_rqst *rqstp, struct nfsd4_op *op)
1455 return (op_encode_hdr_size + op_encode_change_info_maxsz
1456 + nfs4_fattr_bitmap_maxsz) * sizeof(__be32);
/*
 * nfsd4_getattr_rsize - estimate the size of a GETATTR reply from the
 * attribute bitmap requested in @op.
 *
 * A request for the ACL or FS_LOCATIONS attribute is answered with
 * svc_max_payload(rqstp) straight away.  Otherwise the variable-length
 * attributes handled below (owner, owner group, filehandle, security
 * label) are charged at their maximum size and removed from the local
 * bitmap copies, and each attribute bit still set is charged 16 bytes.
 *
 * NOTE(review): the declaration of ret, the addend that follows the
 * "bitmask, length" remark and the final return are not part of this
 * listing; confirm them against the complete file.
 */
1460 * Note since this is an idempotent operation we won't insist on failing
1461 * the op prematurely if the estimate is too large. We may turn off splice
1462 * reads unnecessarily.
1464 static inline u32 nfsd4_getattr_rsize(struct svc_rqst *rqstp,
1465 struct nfsd4_op *op)
1467 u32 *bmap = op->u.getattr.ga_bmval;
/* Work on copies so that the request's own bitmap is left untouched. */
1468 u32 bmap0 = bmap[0], bmap1 = bmap[1], bmap2 = bmap[2];
/* These two attributes get the transport's maximum payload as the estimate. */
1471 if (bmap0 & FATTR4_WORD0_ACL)
1472 return svc_max_payload(rqstp);
1473 if (bmap0 & FATTR4_WORD0_FS_LOCATIONS)
1474 return svc_max_payload(rqstp);
/* Each bit charged below is cleared so the generic count does not charge it again. */
1476 if (bmap1 & FATTR4_WORD1_OWNER) {
1477 ret += IDMAP_NAMESZ + 4;
1478 bmap1 &= ~FATTR4_WORD1_OWNER;
1480 if (bmap1 & FATTR4_WORD1_OWNER_GROUP) {
1481 ret += IDMAP_NAMESZ + 4;
1482 bmap1 &= ~FATTR4_WORD1_OWNER_GROUP;
1484 if (bmap0 & FATTR4_WORD0_FILEHANDLE) {
1485 ret += NFS4_FHSIZE + 4;
1486 bmap0 &= ~FATTR4_WORD0_FILEHANDLE;
1488 if (bmap2 & FATTR4_WORD2_SECURITY_LABEL) {
1489 ret += NFSD4_MAX_SEC_LABEL_LEN + 12;
1490 bmap2 &= ~FATTR4_WORD2_SECURITY_LABEL;
1493 * Largest of remaining attributes are 16 bytes (e.g.,
1494 * supported_attributes)
1496 ret += 16 * (hweight32(bmap0) + hweight32(bmap1) + hweight32(bmap2));
1497 /* bitmask, length */
1502 static inline u32 nfsd4_link_rsize(struct svc_rqst *rqstp, struct nfsd4_op *op)
1504 return (op_encode_hdr_size + op_encode_change_info_maxsz)
1508 static inline u32 nfsd4_lock_rsize(struct svc_rqst *rqstp, struct nfsd4_op *op)
1510 return (op_encode_hdr_size + op_encode_lock_denied_maxsz)
1514 static inline u32 nfsd4_open_rsize(struct svc_rqst *rqstp, struct nfsd4_op *op)
1516 return (op_encode_hdr_size + op_encode_stateid_maxsz
1517 + op_encode_change_info_maxsz + 1
1518 + nfs4_fattr_bitmap_maxsz
1519 + op_encode_delegation_maxsz) * sizeof(__be32);
1522 static inline u32 nfsd4_read_rsize(struct svc_rqst *rqstp, struct nfsd4_op *op)
1524 u32 maxcount = 0, rlen = 0;
1526 maxcount = svc_max_payload(rqstp);
1527 rlen = min(op->u.read.rd_length, maxcount);
1529 return (op_encode_hdr_size + 2 + XDR_QUADLEN(rlen)) * sizeof(__be32);
1532 static inline u32 nfsd4_readdir_rsize(struct svc_rqst *rqstp, struct nfsd4_op *op)
1534 u32 maxcount = 0, rlen = 0;
1536 maxcount = svc_max_payload(rqstp);
1537 rlen = min(op->u.readdir.rd_maxcount, maxcount);
1539 return (op_encode_hdr_size + op_encode_verifier_maxsz +
1540 XDR_QUADLEN(rlen)) * sizeof(__be32);
1543 static inline u32 nfsd4_remove_rsize(struct svc_rqst *rqstp, struct nfsd4_op *op)
1545 return (op_encode_hdr_size + op_encode_change_info_maxsz)
1549 static inline u32 nfsd4_rename_rsize(struct svc_rqst *rqstp, struct nfsd4_op *op)
1551 return (op_encode_hdr_size + op_encode_change_info_maxsz
1552 + op_encode_change_info_maxsz) * sizeof(__be32);
1555 static inline u32 nfsd4_sequence_rsize(struct svc_rqst *rqstp,
1556 struct nfsd4_op *op)
1558 return NFS4_MAX_SESSIONID_LEN + 20;
1561 static inline u32 nfsd4_setattr_rsize(struct svc_rqst *rqstp, struct nfsd4_op *op)
1563 return (op_encode_hdr_size + nfs4_fattr_bitmap_maxsz) * sizeof(__be32);
1566 static inline u32 nfsd4_setclientid_rsize(struct svc_rqst *rqstp, struct nfsd4_op *op)
1568 return (op_encode_hdr_size + 2 + XDR_QUADLEN(NFS4_VERIFIER_SIZE)) *
1572 static inline u32 nfsd4_write_rsize(struct svc_rqst *rqstp, struct nfsd4_op *op)
1574 return (op_encode_hdr_size + 2 + op_encode_verifier_maxsz) * sizeof(__be32);
1577 static inline u32 nfsd4_exchange_id_rsize(struct svc_rqst *rqstp, struct nfsd4_op *op)
1579 return (op_encode_hdr_size + 2 + 1 + /* eir_clientid, eir_sequenceid */\
1580 1 + 1 + /* eir_flags, spr_how */\
1581 4 + /* spo_must_enforce & _allow with bitmap */\
1582 2 + /*eir_server_owner.so_minor_id */\
1583 /* eir_server_owner.so_major_id<> */\
1584 XDR_QUADLEN(NFS4_OPAQUE_LIMIT) + 1 +\
1585 /* eir_server_scope<> */\
1586 XDR_QUADLEN(NFS4_OPAQUE_LIMIT) + 1 +\
1587 1 + /* eir_server_impl_id array length */\
1588 0 /* ignored eir_server_impl_id contents */) * sizeof(__be32);
1591 static inline u32 nfsd4_bind_conn_to_session_rsize(struct svc_rqst *rqstp, struct nfsd4_op *op)
1593 return (op_encode_hdr_size + \
1594 XDR_QUADLEN(NFS4_MAX_SESSIONID_LEN) + /* bctsr_sessid */\
1595 2 /* bctsr_dir, use_conn_in_rdma_mode */) * sizeof(__be32);
1598 static inline u32 nfsd4_create_session_rsize(struct svc_rqst *rqstp, struct nfsd4_op *op)
1600 return (op_encode_hdr_size + \
1601 XDR_QUADLEN(NFS4_MAX_SESSIONID_LEN) + /* sessionid */\
1602 2 + /* csr_sequence, csr_flags */\
1603 op_encode_channel_attrs_maxsz + \
1604 op_encode_channel_attrs_maxsz) * sizeof(__be32);
/*
 * nfsd4_ops - per-operation descriptor table.
 *
 * OPDESC() indexes this array directly with op->opnum, and
 * nfsd4_op_name() bounds-checks against ARRAY_SIZE(nfsd4_ops).
 * Fields set in the entries below:
 *
 *   op_func                 handler called by nfsd4_proc_compound()
 *   op_flags                ALLOWED_*, OP_* behaviour flags tested by the
 *                           compound loop and its helpers
 *   op_name                 string returned by nfsd4_op_name()
 *   op_rsize_bop            reply-size estimator; used by
 *                           nfsd4_max_reply() and, for ops flagged
 *                           OP_MODIFIES_SOMETHING, called by the compound
 *                           loop without a NULL check, so such entries
 *                           must provide one
 *   op_get_currentstateid,
 *   op_set_currentstateid   optional hooks called before op_func and on
 *                           the path after it
 *
 * NOTE(review): in this listing the "[OP_xxx] = {" designator of many
 * entries is not shown; the op_name string identifies the entry.
 */
1607 static struct nfsd4_operation nfsd4_ops[] = {
1609 .op_func = (nfsd4op_func)nfsd4_access,
1610 .op_name = "OP_ACCESS",
1613 .op_func = (nfsd4op_func)nfsd4_close,
1614 .op_flags = OP_MODIFIES_SOMETHING,
1615 .op_name = "OP_CLOSE",
1616 .op_rsize_bop = (nfsd4op_rsize)nfsd4_status_stateid_rsize,
1617 .op_get_currentstateid = (stateid_getter)nfsd4_get_closestateid,
1618 .op_set_currentstateid = (stateid_setter)nfsd4_set_closestateid,
1621 .op_func = (nfsd4op_func)nfsd4_commit,
1622 .op_flags = OP_MODIFIES_SOMETHING,
1623 .op_name = "OP_COMMIT",
1624 .op_rsize_bop = (nfsd4op_rsize)nfsd4_commit_rsize,
1627 .op_func = (nfsd4op_func)nfsd4_create,
1628 .op_flags = OP_MODIFIES_SOMETHING | OP_CACHEME | OP_CLEAR_STATEID,
1629 .op_name = "OP_CREATE",
1630 .op_rsize_bop = (nfsd4op_rsize)nfsd4_create_rsize,
1632 [OP_DELEGRETURN] = {
1633 .op_func = (nfsd4op_func)nfsd4_delegreturn,
1634 .op_flags = OP_MODIFIES_SOMETHING,
1635 .op_name = "OP_DELEGRETURN",
1636 .op_rsize_bop = nfsd4_only_status_rsize,
1637 .op_get_currentstateid = (stateid_getter)nfsd4_get_delegreturnstateid,
1640 .op_func = (nfsd4op_func)nfsd4_getattr,
1641 .op_flags = ALLOWED_ON_ABSENT_FS,
1642 .op_rsize_bop = nfsd4_getattr_rsize,
1643 .op_name = "OP_GETATTR",
1646 .op_func = (nfsd4op_func)nfsd4_getfh,
1647 .op_name = "OP_GETFH",
1650 .op_func = (nfsd4op_func)nfsd4_link,
1651 .op_flags = ALLOWED_ON_ABSENT_FS | OP_MODIFIES_SOMETHING
1653 .op_name = "OP_LINK",
1654 .op_rsize_bop = (nfsd4op_rsize)nfsd4_link_rsize,
1657 .op_func = (nfsd4op_func)nfsd4_lock,
1658 .op_flags = OP_MODIFIES_SOMETHING,
1659 .op_name = "OP_LOCK",
1660 .op_rsize_bop = (nfsd4op_rsize)nfsd4_lock_rsize,
1661 .op_set_currentstateid = (stateid_setter)nfsd4_set_lockstateid,
1664 .op_func = (nfsd4op_func)nfsd4_lockt,
1665 .op_name = "OP_LOCKT",
1668 .op_func = (nfsd4op_func)nfsd4_locku,
1669 .op_flags = OP_MODIFIES_SOMETHING,
1670 .op_name = "OP_LOCKU",
1671 .op_rsize_bop = (nfsd4op_rsize)nfsd4_status_stateid_rsize,
1672 .op_get_currentstateid = (stateid_getter)nfsd4_get_lockustateid,
1675 .op_func = (nfsd4op_func)nfsd4_lookup,
1676 .op_flags = OP_HANDLES_WRONGSEC | OP_CLEAR_STATEID,
1677 .op_name = "OP_LOOKUP",
1680 .op_func = (nfsd4op_func)nfsd4_lookupp,
1681 .op_flags = OP_HANDLES_WRONGSEC | OP_CLEAR_STATEID,
1682 .op_name = "OP_LOOKUPP",
1685 .op_func = (nfsd4op_func)nfsd4_nverify,
1686 .op_name = "OP_NVERIFY",
1689 .op_func = (nfsd4op_func)nfsd4_open,
1690 .op_flags = OP_HANDLES_WRONGSEC | OP_MODIFIES_SOMETHING,
1691 .op_name = "OP_OPEN",
1692 .op_rsize_bop = (nfsd4op_rsize)nfsd4_open_rsize,
1693 .op_set_currentstateid = (stateid_setter)nfsd4_set_openstateid,
1695 [OP_OPEN_CONFIRM] = {
1696 .op_func = (nfsd4op_func)nfsd4_open_confirm,
1697 .op_flags = OP_MODIFIES_SOMETHING,
1698 .op_name = "OP_OPEN_CONFIRM",
1699 .op_rsize_bop = (nfsd4op_rsize)nfsd4_status_stateid_rsize,
1701 [OP_OPEN_DOWNGRADE] = {
1702 .op_func = (nfsd4op_func)nfsd4_open_downgrade,
1703 .op_flags = OP_MODIFIES_SOMETHING,
1704 .op_name = "OP_OPEN_DOWNGRADE",
1705 .op_rsize_bop = (nfsd4op_rsize)nfsd4_status_stateid_rsize,
1706 .op_get_currentstateid = (stateid_getter)nfsd4_get_opendowngradestateid,
1707 .op_set_currentstateid = (stateid_setter)nfsd4_set_opendowngradestateid,
1710 .op_func = (nfsd4op_func)nfsd4_putfh,
1711 .op_flags = ALLOWED_WITHOUT_FH | ALLOWED_ON_ABSENT_FS
1712 | OP_IS_PUTFH_LIKE | OP_CLEAR_STATEID,
1713 .op_name = "OP_PUTFH",
1714 .op_rsize_bop = (nfsd4op_rsize)nfsd4_only_status_rsize,
/* The entry named OP_PUTPUBFH uses the same handler as OP_PUTROOTFH below. */
1717 .op_func = (nfsd4op_func)nfsd4_putrootfh,
1718 .op_flags = ALLOWED_WITHOUT_FH | ALLOWED_ON_ABSENT_FS
1719 | OP_IS_PUTFH_LIKE | OP_CLEAR_STATEID,
1720 .op_name = "OP_PUTPUBFH",
1721 .op_rsize_bop = (nfsd4op_rsize)nfsd4_only_status_rsize,
1724 .op_func = (nfsd4op_func)nfsd4_putrootfh,
1725 .op_flags = ALLOWED_WITHOUT_FH | ALLOWED_ON_ABSENT_FS
1726 | OP_IS_PUTFH_LIKE | OP_CLEAR_STATEID,
1727 .op_name = "OP_PUTROOTFH",
1728 .op_rsize_bop = (nfsd4op_rsize)nfsd4_only_status_rsize,
1731 .op_func = (nfsd4op_func)nfsd4_read,
1732 .op_name = "OP_READ",
1733 .op_rsize_bop = (nfsd4op_rsize)nfsd4_read_rsize,
1734 .op_get_currentstateid = (stateid_getter)nfsd4_get_readstateid,
1737 .op_func = (nfsd4op_func)nfsd4_readdir,
1738 .op_name = "OP_READDIR",
1739 .op_rsize_bop = (nfsd4op_rsize)nfsd4_readdir_rsize,
1742 .op_func = (nfsd4op_func)nfsd4_readlink,
1743 .op_name = "OP_READLINK",
1746 .op_func = (nfsd4op_func)nfsd4_remove,
1747 .op_flags = OP_MODIFIES_SOMETHING | OP_CACHEME,
1748 .op_name = "OP_REMOVE",
1749 .op_rsize_bop = (nfsd4op_rsize)nfsd4_remove_rsize,
1752 .op_func = (nfsd4op_func)nfsd4_rename,
1753 .op_flags = OP_MODIFIES_SOMETHING | OP_CACHEME,
1754 .op_name = "OP_RENAME",
1755 .op_rsize_bop = (nfsd4op_rsize)nfsd4_rename_rsize,
1758 .op_func = (nfsd4op_func)nfsd4_renew,
1759 .op_flags = ALLOWED_WITHOUT_FH | ALLOWED_ON_ABSENT_FS
1760 | OP_MODIFIES_SOMETHING,
1761 .op_name = "OP_RENEW",
1762 .op_rsize_bop = (nfsd4op_rsize)nfsd4_only_status_rsize,
1766 .op_func = (nfsd4op_func)nfsd4_restorefh,
1767 .op_flags = ALLOWED_WITHOUT_FH | ALLOWED_ON_ABSENT_FS
1768 | OP_IS_PUTFH_LIKE | OP_MODIFIES_SOMETHING,
1769 .op_name = "OP_RESTOREFH",
1770 .op_rsize_bop = (nfsd4op_rsize)nfsd4_only_status_rsize,
1773 .op_func = (nfsd4op_func)nfsd4_savefh,
1774 .op_flags = OP_HANDLES_WRONGSEC | OP_MODIFIES_SOMETHING,
1775 .op_name = "OP_SAVEFH",
1776 .op_rsize_bop = (nfsd4op_rsize)nfsd4_only_status_rsize,
1779 .op_func = (nfsd4op_func)nfsd4_secinfo,
1780 .op_flags = OP_HANDLES_WRONGSEC,
1781 .op_name = "OP_SECINFO",
1784 .op_func = (nfsd4op_func)nfsd4_setattr,
1785 .op_name = "OP_SETATTR",
1786 .op_flags = OP_MODIFIES_SOMETHING | OP_CACHEME,
1787 .op_rsize_bop = (nfsd4op_rsize)nfsd4_setattr_rsize,
1788 .op_get_currentstateid = (stateid_getter)nfsd4_get_setattrstateid,
1790 [OP_SETCLIENTID] = {
1791 .op_func = (nfsd4op_func)nfsd4_setclientid,
1792 .op_flags = ALLOWED_WITHOUT_FH | ALLOWED_ON_ABSENT_FS
1793 | OP_MODIFIES_SOMETHING | OP_CACHEME,
1794 .op_name = "OP_SETCLIENTID",
1795 .op_rsize_bop = (nfsd4op_rsize)nfsd4_setclientid_rsize,
1797 [OP_SETCLIENTID_CONFIRM] = {
1798 .op_func = (nfsd4op_func)nfsd4_setclientid_confirm,
1799 .op_flags = ALLOWED_WITHOUT_FH | ALLOWED_ON_ABSENT_FS
1800 | OP_MODIFIES_SOMETHING | OP_CACHEME,
1801 .op_name = "OP_SETCLIENTID_CONFIRM",
1802 .op_rsize_bop = (nfsd4op_rsize)nfsd4_only_status_rsize,
1805 .op_func = (nfsd4op_func)nfsd4_verify,
1806 .op_name = "OP_VERIFY",
1809 .op_func = (nfsd4op_func)nfsd4_write,
1810 .op_flags = OP_MODIFIES_SOMETHING | OP_CACHEME,
1811 .op_name = "OP_WRITE",
1812 .op_rsize_bop = (nfsd4op_rsize)nfsd4_write_rsize,
1813 .op_get_currentstateid = (stateid_getter)nfsd4_get_writestateid,
1815 [OP_RELEASE_LOCKOWNER] = {
1816 .op_func = (nfsd4op_func)nfsd4_release_lockowner,
1817 .op_flags = ALLOWED_WITHOUT_FH | ALLOWED_ON_ABSENT_FS
1818 | OP_MODIFIES_SOMETHING,
1819 .op_name = "OP_RELEASE_LOCKOWNER",
1820 .op_rsize_bop = (nfsd4op_rsize)nfsd4_only_status_rsize,
1823 /* NFSv4.1 operations */
1824 [OP_EXCHANGE_ID] = {
1825 .op_func = (nfsd4op_func)nfsd4_exchange_id,
1826 .op_flags = ALLOWED_WITHOUT_FH | ALLOWED_AS_FIRST_OP
1827 | OP_MODIFIES_SOMETHING,
1828 .op_name = "OP_EXCHANGE_ID",
1829 .op_rsize_bop = (nfsd4op_rsize)nfsd4_exchange_id_rsize,
1831 [OP_BACKCHANNEL_CTL] = {
1832 .op_func = (nfsd4op_func)nfsd4_backchannel_ctl,
1833 .op_flags = ALLOWED_WITHOUT_FH | OP_MODIFIES_SOMETHING,
1834 .op_name = "OP_BACKCHANNEL_CTL",
1835 .op_rsize_bop = (nfsd4op_rsize)nfsd4_only_status_rsize,
1837 [OP_BIND_CONN_TO_SESSION] = {
1838 .op_func = (nfsd4op_func)nfsd4_bind_conn_to_session,
1839 .op_flags = ALLOWED_WITHOUT_FH | ALLOWED_AS_FIRST_OP
1840 | OP_MODIFIES_SOMETHING,
1841 .op_name = "OP_BIND_CONN_TO_SESSION",
1842 .op_rsize_bop = (nfsd4op_rsize)nfsd4_bind_conn_to_session_rsize,
1844 [OP_CREATE_SESSION] = {
1845 .op_func = (nfsd4op_func)nfsd4_create_session,
1846 .op_flags = ALLOWED_WITHOUT_FH | ALLOWED_AS_FIRST_OP
1847 | OP_MODIFIES_SOMETHING,
1848 .op_name = "OP_CREATE_SESSION",
1849 .op_rsize_bop = (nfsd4op_rsize)nfsd4_create_session_rsize,
1851 [OP_DESTROY_SESSION] = {
1852 .op_func = (nfsd4op_func)nfsd4_destroy_session,
1853 .op_flags = ALLOWED_WITHOUT_FH | ALLOWED_AS_FIRST_OP
1854 | OP_MODIFIES_SOMETHING,
1855 .op_name = "OP_DESTROY_SESSION",
1856 .op_rsize_bop = (nfsd4op_rsize)nfsd4_only_status_rsize,
/* The OP_SEQUENCE entry sets no op_rsize_bop, so nfsd4_max_reply() uses PAGE_SIZE for it. */
1859 .op_func = (nfsd4op_func)nfsd4_sequence,
1860 .op_flags = ALLOWED_WITHOUT_FH | ALLOWED_AS_FIRST_OP,
1861 .op_name = "OP_SEQUENCE",
1863 [OP_DESTROY_CLIENTID] = {
1864 .op_func = (nfsd4op_func)nfsd4_destroy_clientid,
1865 .op_flags = ALLOWED_WITHOUT_FH | ALLOWED_AS_FIRST_OP
1866 | OP_MODIFIES_SOMETHING,
1867 .op_name = "OP_DESTROY_CLIENTID",
1868 .op_rsize_bop = (nfsd4op_rsize)nfsd4_only_status_rsize,
1870 [OP_RECLAIM_COMPLETE] = {
1871 .op_func = (nfsd4op_func)nfsd4_reclaim_complete,
1872 .op_flags = ALLOWED_WITHOUT_FH | OP_MODIFIES_SOMETHING,
1873 .op_name = "OP_RECLAIM_COMPLETE",
1874 .op_rsize_bop = (nfsd4op_rsize)nfsd4_only_status_rsize,
1876 [OP_SECINFO_NO_NAME] = {
1877 .op_func = (nfsd4op_func)nfsd4_secinfo_no_name,
1878 .op_flags = OP_HANDLES_WRONGSEC,
1879 .op_name = "OP_SECINFO_NO_NAME",
1881 [OP_TEST_STATEID] = {
1882 .op_func = (nfsd4op_func)nfsd4_test_stateid,
1883 .op_flags = ALLOWED_WITHOUT_FH,
1884 .op_name = "OP_TEST_STATEID",
1886 [OP_FREE_STATEID] = {
1887 .op_func = (nfsd4op_func)nfsd4_free_stateid,
1888 .op_flags = ALLOWED_WITHOUT_FH | OP_MODIFIES_SOMETHING,
1889 .op_name = "OP_FREE_STATEID",
1890 .op_get_currentstateid = (stateid_getter)nfsd4_get_freestateid,
1891 .op_rsize_bop = (nfsd4op_rsize)nfsd4_only_status_rsize,
1895 int nfsd4_max_reply(struct svc_rqst *rqstp, struct nfsd4_op *op)
1897 struct nfsd4_operation *opdesc;
1898 nfsd4op_rsize estimator;
1900 if (op->opnum == OP_ILLEGAL)
1901 return op_encode_hdr_size * sizeof(__be32);
1902 opdesc = OPDESC(op);
1903 estimator = opdesc->op_rsize_bop;
1904 return estimator ? estimator(rqstp, op) : PAGE_SIZE;
/*
 * warn_on_nonidempotent_op - complain when the reply to an operation
 * flagged OP_MODIFIES_SOMETHING could not be encoded.
 *
 * Logs the operation number and name with pr_err(); ops without that
 * flag produce no message.
 *
 * NOTE(review): OPDESC() does no range check, so @op must carry an opnum
 * that is a valid index into nfsd4_ops[] (presumably never OP_ILLEGAL --
 * confirm at the call site).  The end of the body is not part of this
 * listing.
 */
1907 void warn_on_nonidempotent_op(struct nfsd4_op *op)
1909 if (OPDESC(op)->op_flags & OP_MODIFIES_SOMETHING) {
1910 pr_err("unable to encode reply to nonidempotent op %d (%s)\n",
1911 op->opnum, nfsd4_op_name(op->opnum));
1916 static const char *nfsd4_op_name(unsigned opnum)
1918 if (opnum < ARRAY_SIZE(nfsd4_ops))
1919 return nfsd4_ops[opnum].op_name;
1920 return "unknown_operation";
/*
 * Placeholder argument type whose size is recorded in the procedure
 * table entry served by nfsd4_proc_null.  The result type is the same
 * structure under a second name.
 */
struct nfsd4_voidargs {
	int dummy;
};
#define nfsd4_voidres nfsd4_voidargs
/*
 * nfsd_procedures4 - RPC procedure table for NFSv4 (two entries, per the
 * array bound).
 *
 * The first entry shown is served by nfsd4_proc_null and sized with the
 * dummy void argument/result structs.  NFSPROC4_COMPOUND is served by
 * nfsd4_proc_compound, uses the compound XDR decode and encode routines,
 * and names nfsd4_release_compoundargs as its release hook.  Both entries
 * are marked RC_NOCACHE.
 *
 * NOTE(review): some short lines of the initializer (entry designators,
 * closing braces, possibly further fields) are not part of this listing.
 */
1926 static struct svc_procedure nfsd_procedures4[2] = {
1928 .pc_func = (svc_procfunc) nfsd4_proc_null,
1929 .pc_encode = (kxdrproc_t) nfs4svc_encode_voidres,
1930 .pc_argsize = sizeof(struct nfsd4_voidargs),
1931 .pc_ressize = sizeof(struct nfsd4_voidres),
1932 .pc_cachetype = RC_NOCACHE,
1935 [NFSPROC4_COMPOUND] = {
1936 .pc_func = (svc_procfunc) nfsd4_proc_compound,
1937 .pc_decode = (kxdrproc_t) nfs4svc_decode_compoundargs,
1938 .pc_encode = (kxdrproc_t) nfs4svc_encode_compoundres,
1939 .pc_argsize = sizeof(struct nfsd4_compoundargs),
1940 .pc_ressize = sizeof(struct nfsd4_compoundres),
1941 .pc_release = nfsd4_release_compoundargs,
1942 .pc_cachetype = RC_NOCACHE,
1943 .pc_xdrressize = NFSD_BUFSIZE/4,
1947 struct svc_version nfsd_version4 = {
1950 .vs_proc = nfsd_procedures4,
1951 .vs_dispatch = nfsd_dispatch,
1952 .vs_xdrsize = NFS4_SVC_XDRSIZE,