2005-04-17 05:20:36 +07:00
|
|
|
/*
|
|
|
|
* fs/nfs/nfs4proc.c
|
|
|
|
*
|
|
|
|
* Client-side procedure declarations for NFSv4.
|
|
|
|
*
|
|
|
|
* Copyright (c) 2002 The Regents of the University of Michigan.
|
|
|
|
* All rights reserved.
|
|
|
|
*
|
|
|
|
* Kendrick Smith <kmsmith@umich.edu>
|
|
|
|
* Andy Adamson <andros@umich.edu>
|
|
|
|
*
|
|
|
|
* Redistribution and use in source and binary forms, with or without
|
|
|
|
* modification, are permitted provided that the following conditions
|
|
|
|
* are met:
|
|
|
|
*
|
|
|
|
* 1. Redistributions of source code must retain the above copyright
|
|
|
|
* notice, this list of conditions and the following disclaimer.
|
|
|
|
* 2. Redistributions in binary form must reproduce the above copyright
|
|
|
|
* notice, this list of conditions and the following disclaimer in the
|
|
|
|
* documentation and/or other materials provided with the distribution.
|
|
|
|
* 3. Neither the name of the University nor the names of its
|
|
|
|
* contributors may be used to endorse or promote products derived
|
|
|
|
* from this software without specific prior written permission.
|
|
|
|
*
|
|
|
|
* THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED
|
|
|
|
* WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
|
|
|
|
* MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
|
|
|
|
* DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
|
|
|
|
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
|
|
|
* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
|
|
|
* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
|
|
|
|
* BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
|
|
|
|
* LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
|
|
|
|
* NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
|
|
|
|
* SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include <linux/mm.h>
|
|
|
|
#include <linux/delay.h>
|
|
|
|
#include <linux/errno.h>
|
|
|
|
#include <linux/string.h>
|
2011-12-10 07:05:58 +07:00
|
|
|
#include <linux/ratelimit.h>
|
|
|
|
#include <linux/printk.h>
|
include cleanup: Update gfp.h and slab.h includes to prepare for breaking implicit slab.h inclusion from percpu.h
percpu.h is included by sched.h and module.h and thus ends up being
included when building most .c files. percpu.h includes slab.h which
in turn includes gfp.h making everything defined by the two files
universally available and complicating inclusion dependencies.
percpu.h -> slab.h dependency is about to be removed. Prepare for
this change by updating users of gfp and slab facilities include those
headers directly instead of assuming availability. As this conversion
needs to touch large number of source files, the following script is
used as the basis of conversion.
http://userweb.kernel.org/~tj/misc/slabh-sweep.py
The script does the following.
* Scan files for gfp and slab usages and update includes such that
only the necessary includes are there. ie. if only gfp is used,
gfp.h, if slab is used, slab.h.
* When the script inserts a new include, it looks at the include
blocks and try to put the new include such that its order conforms
to its surrounding. It's put in the include block which contains
core kernel includes, in the same order that the rest are ordered -
alphabetical, Christmas tree, rev-Xmas-tree or at the end if there
doesn't seem to be any matching order.
* If the script can't find a place to put a new include (mostly
because the file doesn't have fitting include block), it prints out
an error message indicating which .h file needs to be added to the
file.
The conversion was done in the following steps.
1. The initial automatic conversion of all .c files updated slightly
over 4000 files, deleting around 700 includes and adding ~480 gfp.h
and ~3000 slab.h inclusions. The script emitted errors for ~400
files.
2. Each error was manually checked. Some didn't need the inclusion,
some needed manual addition while adding it to implementation .h or
embedding .c file was more appropriate for others. This step added
inclusions to around 150 files.
3. The script was run again and the output was compared to the edits
from #2 to make sure no file was left behind.
4. Several build tests were done and a couple of problems were fixed.
e.g. lib/decompress_*.c used malloc/free() wrappers around slab
APIs requiring slab.h to be added manually.
5. The script was run on all .h files but without automatically
editing them as sprinkling gfp.h and slab.h inclusions around .h
files could easily lead to inclusion dependency hell. Most gfp.h
inclusion directives were ignored as stuff from gfp.h was usually
widely available and often used in preprocessor macros. Each
slab.h inclusion directive was examined and added manually as
necessary.
6. percpu.h was updated not to include slab.h.
7. Build tests were done on the following configurations and failures
were fixed. CONFIG_GCOV_KERNEL was turned off for all tests (as my
distributed build env didn't work with gcov compiles) and a few
more options had to be turned off depending on archs to make things
build (like ipr on powerpc/64 which failed due to missing writeq).
* x86 and x86_64 UP and SMP allmodconfig and a custom test config.
* powerpc and powerpc64 SMP allmodconfig
* sparc and sparc64 SMP allmodconfig
* ia64 SMP allmodconfig
* s390 SMP allmodconfig
* alpha SMP allmodconfig
* um on x86_64 SMP allmodconfig
8. percpu.h modifications were reverted so that it could be applied as
a separate patch and serve as bisection point.
Given the fact that I had only a couple of failures from tests on step
6, I'm fairly confident about the coverage of this conversion patch.
If there is a breakage, it's likely to be something in one of the arch
headers which should be easily discoverable on most builds of
the specific arch.
Signed-off-by: Tejun Heo <tj@kernel.org>
Guess-its-ok-by: Christoph Lameter <cl@linux-foundation.org>
Cc: Ingo Molnar <mingo@redhat.com>
Cc: Lee Schermerhorn <Lee.Schermerhorn@hp.com>
2010-03-24 15:04:11 +07:00
|
|
|
#include <linux/slab.h>
|
2005-04-17 05:20:36 +07:00
|
|
|
#include <linux/sunrpc/clnt.h>
|
|
|
|
#include <linux/nfs.h>
|
|
|
|
#include <linux/nfs4.h>
|
|
|
|
#include <linux/nfs_fs.h>
|
|
|
|
#include <linux/nfs_page.h>
|
2011-04-14 01:31:30 +07:00
|
|
|
#include <linux/nfs_mount.h>
|
2005-04-17 05:20:36 +07:00
|
|
|
#include <linux/namei.h>
|
2005-10-19 04:20:17 +07:00
|
|
|
#include <linux/mount.h>
|
2009-04-01 20:22:29 +07:00
|
|
|
#include <linux/module.h>
|
2010-12-09 18:35:25 +07:00
|
|
|
#include <linux/xattr.h>
|
2011-01-26 07:15:32 +07:00
|
|
|
#include <linux/utsname.h>
|
2011-12-02 04:44:39 +07:00
|
|
|
#include <linux/freezer.h>
|
2018-01-09 20:21:17 +07:00
|
|
|
#include <linux/iversion.h>
|
2005-04-17 05:20:36 +07:00
|
|
|
|
2005-06-23 00:16:21 +07:00
|
|
|
#include "nfs4_fs.h"
|
2005-04-17 05:20:36 +07:00
|
|
|
#include "delegation.h"
|
2008-02-20 08:04:23 +07:00
|
|
|
#include "internal.h"
|
2006-03-21 01:44:14 +07:00
|
|
|
#include "iostat.h"
|
2009-04-01 20:22:31 +07:00
|
|
|
#include "callback.h"
|
2010-10-20 11:18:03 +07:00
|
|
|
#include "pnfs.h"
|
NFS: Always use the same SETCLIENTID boot verifier
Currently our NFS client assigns a unique SETCLIENTID boot verifier
for each server IP address it knows about. It's set to CURRENT_TIME
when the struct nfs_client for that server IP is created.
During the SETCLIENTID operation, our client also presents an
nfs_client_id4 string to servers, as an identifier on which the server
can hang all of this client's NFSv4 state. Our client's
nfs_client_id4 string is unique for each server IP address.
An NFSv4 server is obligated to wipe all NFSv4 state associated with
an nfs_client_id4 string when the client presents the same
nfs_client_id4 string along with a changed SETCLIENTID boot verifier.
When our client unmounts the last of a server's shares, it destroys
that server's struct nfs_client. The next time the client mounts that
NFS server, it creates a fresh struct nfs_client with a fresh boot
verifier. On seeing the fresh verifier, the server wipes any previous
NFSv4 state associated with that nfs_client_id4.
However, NFSv4.1 clients are supposed to present the same
nfs_client_id4 string to all servers. And, to support Transparent
State Migration, the same nfs_client_id4 string should be presented
to all NFSv4.0 servers so they recognize that migrated state for this
client belongs with state a server may already have for this client.
(This is known as the Uniform Client String model).
If the nfs_client_id4 string is the same but the boot verifier changes
for each server IP address, SETCLIENTID and EXCHANGE_ID operations
from such a client could unintentionally result in a server wiping a
client's previously obtained lease.
Thus, if our NFS client is going to use a fixed nfs_client_id4 string,
either for NFSv4.0 or NFSv4.1 mounts, our NFS client should use a
boot verifier that does not change depending on server IP address.
Replace our current per-nfs_client boot verifier with a per-nfs_net
boot verifier.
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
2012-05-22 09:45:41 +07:00
|
|
|
#include "netns.h"
|
2015-04-16 00:00:05 +07:00
|
|
|
#include "nfs4idmap.h"
|
2012-11-27 00:49:34 +07:00
|
|
|
#include "nfs4session.h"
|
2012-12-21 04:52:38 +07:00
|
|
|
#include "fscache.h"
|
2005-04-17 05:20:36 +07:00
|
|
|
|
2013-08-09 22:51:26 +07:00
|
|
|
#include "nfs4trace.h"
|
|
|
|
|
2005-04-17 05:20:36 +07:00
|
|
|
#define NFSDBG_FACILITY NFSDBG_PROC
|
|
|
|
|
2018-04-08 00:44:28 +07:00
|
|
|
#define NFS4_BITMASK_SZ 3
|
|
|
|
|
2006-09-15 19:30:46 +07:00
|
|
|
#define NFS4_POLL_RETRY_MIN (HZ/10)
|
2005-04-17 05:20:36 +07:00
|
|
|
#define NFS4_POLL_RETRY_MAX (15*HZ)
|
|
|
|
|
2016-05-12 16:16:38 +07:00
|
|
|
/* file attributes which can be mapped to nfs attributes */
|
|
|
|
#define NFS4_VALID_ATTRS (ATTR_MODE \
|
|
|
|
| ATTR_UID \
|
|
|
|
| ATTR_GID \
|
|
|
|
| ATTR_SIZE \
|
|
|
|
| ATTR_ATIME \
|
|
|
|
| ATTR_MTIME \
|
|
|
|
| ATTR_CTIME \
|
|
|
|
| ATTR_ATIME_SET \
|
|
|
|
| ATTR_MTIME_SET)
|
|
|
|
|
2006-01-03 15:55:12 +07:00
|
|
|
struct nfs4_opendata;
|
2009-12-15 12:27:57 +07:00
|
|
|
static int _nfs4_recover_proc_open(struct nfs4_opendata *data);
|
2005-04-17 05:20:36 +07:00
|
|
|
static int nfs4_do_fsinfo(struct nfs_server *, struct nfs_fh *, struct nfs_fsinfo *);
|
2012-03-02 05:01:57 +07:00
|
|
|
static void nfs_fixup_referral_attributes(struct nfs_fattr *fattr);
|
2018-04-08 00:50:59 +07:00
|
|
|
static int nfs4_proc_getattr(struct nfs_server *, struct nfs_fh *, struct nfs_fattr *, struct nfs4_label *label, struct inode *inode);
|
|
|
|
static int _nfs4_proc_getattr(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fattr *fattr, struct nfs4_label *label, struct inode *inode);
|
2010-04-17 03:22:51 +07:00
|
|
|
static int nfs4_do_setattr(struct inode *inode, struct rpc_cred *cred,
|
|
|
|
struct nfs_fattr *fattr, struct iattr *sattr,
|
2016-10-13 11:26:47 +07:00
|
|
|
struct nfs_open_context *ctx, struct nfs4_label *ilabel,
|
2013-05-22 23:50:42 +07:00
|
|
|
struct nfs4_label *olabel);
|
2011-06-03 01:59:10 +07:00
|
|
|
#ifdef CONFIG_NFS_V4_1
|
2017-10-20 02:46:45 +07:00
|
|
|
static struct rpc_task *_nfs41_proc_sequence(struct nfs_client *clp,
|
|
|
|
struct rpc_cred *cred,
|
|
|
|
struct nfs4_slot *slot,
|
|
|
|
bool is_privileged);
|
2013-05-20 22:20:27 +07:00
|
|
|
static int nfs41_test_stateid(struct nfs_server *, nfs4_stateid *,
|
|
|
|
struct rpc_cred *);
|
2016-09-23 00:39:04 +07:00
|
|
|
static int nfs41_free_stateid(struct nfs_server *, const nfs4_stateid *,
|
|
|
|
struct rpc_cred *, bool);
|
2011-06-03 01:59:10 +07:00
|
|
|
#endif
|
2013-05-22 23:50:44 +07:00
|
|
|
|
|
|
|
#ifdef CONFIG_NFS_V4_SECURITY_LABEL
|
|
|
|
static inline struct nfs4_label *
|
|
|
|
nfs4_label_init_security(struct inode *dir, struct dentry *dentry,
|
|
|
|
struct iattr *sattr, struct nfs4_label *label)
|
|
|
|
{
|
|
|
|
int err;
|
|
|
|
|
|
|
|
if (label == NULL)
|
|
|
|
return NULL;
|
|
|
|
|
|
|
|
if (nfs_server_capable(dir, NFS_CAP_SECURITY_LABEL) == 0)
|
|
|
|
return NULL;
|
|
|
|
|
|
|
|
err = security_dentry_init_security(dentry, sattr->ia_mode,
|
|
|
|
&dentry->d_name, (void **)&label->label, &label->len);
|
|
|
|
if (err == 0)
|
|
|
|
return label;
|
|
|
|
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
static inline void
|
|
|
|
nfs4_label_release_security(struct nfs4_label *label)
|
|
|
|
{
|
|
|
|
if (label)
|
|
|
|
security_release_secctx(label->label, label->len);
|
|
|
|
}
|
|
|
|
static inline u32 *nfs4_bitmask(struct nfs_server *server, struct nfs4_label *label)
|
|
|
|
{
|
|
|
|
if (label)
|
|
|
|
return server->attr_bitmask;
|
|
|
|
|
|
|
|
return server->attr_bitmask_nl;
|
|
|
|
}
|
|
|
|
#else
|
|
|
|
static inline struct nfs4_label *
|
|
|
|
nfs4_label_init_security(struct inode *dir, struct dentry *dentry,
|
|
|
|
struct iattr *sattr, struct nfs4_label *l)
|
|
|
|
{ return NULL; }
|
|
|
|
/* Variant built without CONFIG_NFS_V4_SECURITY_LABEL: nothing to release. */
static inline void
nfs4_label_release_security(struct nfs4_label *label)
{
}
|
|
|
|
static inline u32 *
|
|
|
|
nfs4_bitmask(struct nfs_server *server, struct nfs4_label *label)
|
|
|
|
{ return server->attr_bitmask; }
|
|
|
|
#endif
|
|
|
|
|
2005-04-17 05:20:36 +07:00
|
|
|
/* Prevent leaks of NFSv4 errors into userland */
|
2008-12-31 04:35:55 +07:00
|
|
|
static int nfs4_map_errors(int err)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
2009-10-24 01:46:42 +07:00
|
|
|
if (err >= -1000)
|
|
|
|
return err;
|
|
|
|
switch (err) {
|
|
|
|
case -NFS4ERR_RESOURCE:
|
2013-03-01 08:30:10 +07:00
|
|
|
case -NFS4ERR_LAYOUTTRYLATER:
|
|
|
|
case -NFS4ERR_RECALLCONFLICT:
|
2009-10-24 01:46:42 +07:00
|
|
|
return -EREMOTEIO;
|
2011-03-25 00:12:30 +07:00
|
|
|
case -NFS4ERR_WRONGSEC:
|
2013-08-14 03:37:38 +07:00
|
|
|
case -NFS4ERR_WRONG_CRED:
|
2011-03-25 00:12:30 +07:00
|
|
|
return -EPERM;
|
2011-02-23 06:44:31 +07:00
|
|
|
case -NFS4ERR_BADOWNER:
|
|
|
|
case -NFS4ERR_BADNAME:
|
|
|
|
return -EINVAL;
|
2012-05-28 22:36:28 +07:00
|
|
|
case -NFS4ERR_SHARE_DENIED:
|
|
|
|
return -EACCES;
|
2012-06-07 01:12:07 +07:00
|
|
|
case -NFS4ERR_MINOR_VERS_MISMATCH:
|
|
|
|
return -EPROTONOSUPPORT;
|
2013-03-24 02:22:45 +07:00
|
|
|
case -NFS4ERR_FILE_OPEN:
|
|
|
|
return -EBUSY;
|
2009-10-24 01:46:42 +07:00
|
|
|
default:
|
2005-04-17 05:20:36 +07:00
|
|
|
dprintk("%s could not handle NFSv4 error %d\n",
|
2008-05-03 03:42:44 +07:00
|
|
|
__func__, -err);
|
2009-10-24 01:46:42 +07:00
|
|
|
break;
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
2009-10-24 01:46:42 +07:00
|
|
|
return -EIO;
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* This is our standard bitmap for GETATTR requests.
|
|
|
|
*/
|
2012-06-05 20:16:47 +07:00
|
|
|
const u32 nfs4_fattr_bitmap[3] = {
|
2005-04-17 05:20:36 +07:00
|
|
|
FATTR4_WORD0_TYPE
|
|
|
|
| FATTR4_WORD0_CHANGE
|
|
|
|
| FATTR4_WORD0_SIZE
|
|
|
|
| FATTR4_WORD0_FSID
|
|
|
|
| FATTR4_WORD0_FILEID,
|
|
|
|
FATTR4_WORD1_MODE
|
|
|
|
| FATTR4_WORD1_NUMLINKS
|
|
|
|
| FATTR4_WORD1_OWNER
|
|
|
|
| FATTR4_WORD1_OWNER_GROUP
|
|
|
|
| FATTR4_WORD1_RAWDEV
|
|
|
|
| FATTR4_WORD1_SPACE_USED
|
|
|
|
| FATTR4_WORD1_TIME_ACCESS
|
|
|
|
| FATTR4_WORD1_TIME_METADATA
|
nfs: Fetch MOUNTED_ON_FILEID when updating an inode
2ef47eb1 (NFS: Fix use of nfs_attr_use_mounted_on_fileid()) was a good
start to fixing a circular directory structure warning for NFS v4
"junctioned" mountpoints. Unfortunately, further testing continued to
generate this error.
My server is configured like this:
anna@nfsd ~ % df
Filesystem Size Used Avail Use% Mounted on
/dev/vda1 9.1G 2.0G 6.5G 24% /
/dev/vdc1 1014M 33M 982M 4% /exports
/dev/vdc2 1014M 33M 982M 4% /exports/vol1
/dev/vdc3 1014M 33M 982M 4% /exports/vol1/vol2
anna@nfsd ~ % cat /etc/exports
/exports/ *(rw,async,no_subtree_check,no_root_squash)
/exports/vol1/ *(rw,async,no_subtree_check,no_root_squash)
/exports/vol1/vol2 *(rw,async,no_subtree_check,no_root_squash)
I've been running chown across the entire mountpoint twice in a row to
hit this problem. The first run succeeds, but the second one fails with
the circular directory warning along with:
anna@client ~ % dmesg
[Apr 3 14:28] NFS: server 192.168.100.204 error: fileid changed
fsid 0:39: expected fileid 0x100080, got 0x80
WHere 0x80 is the mountpoint's fileid and 0x100080 is the mounted-on
fileid.
This patch fixes the issue by requesting an updated mounted-on fileid
from the server during nfs_update_inode(), and then checking that the
fileid stored in the nfs_inode matches either the fileid or mounted-on
fileid returned by the server.
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
2015-04-04 01:35:59 +07:00
|
|
|
| FATTR4_WORD1_TIME_MODIFY
|
|
|
|
| FATTR4_WORD1_MOUNTED_ON_FILEID,
|
2013-05-22 23:50:44 +07:00
|
|
|
#ifdef CONFIG_NFS_V4_SECURITY_LABEL
|
|
|
|
FATTR4_WORD2_SECURITY_LABEL
|
|
|
|
#endif
|
2005-04-17 05:20:36 +07:00
|
|
|
};
|
|
|
|
|
2012-06-05 20:16:47 +07:00
|
|
|
static const u32 nfs4_pnfs_open_bitmap[3] = {
|
|
|
|
FATTR4_WORD0_TYPE
|
|
|
|
| FATTR4_WORD0_CHANGE
|
|
|
|
| FATTR4_WORD0_SIZE
|
|
|
|
| FATTR4_WORD0_FSID
|
|
|
|
| FATTR4_WORD0_FILEID,
|
|
|
|
FATTR4_WORD1_MODE
|
|
|
|
| FATTR4_WORD1_NUMLINKS
|
|
|
|
| FATTR4_WORD1_OWNER
|
|
|
|
| FATTR4_WORD1_OWNER_GROUP
|
|
|
|
| FATTR4_WORD1_RAWDEV
|
|
|
|
| FATTR4_WORD1_SPACE_USED
|
|
|
|
| FATTR4_WORD1_TIME_ACCESS
|
|
|
|
| FATTR4_WORD1_TIME_METADATA
|
|
|
|
| FATTR4_WORD1_TIME_MODIFY,
|
|
|
|
FATTR4_WORD2_MDSTHRESHOLD
|
2015-12-27 03:06:03 +07:00
|
|
|
#ifdef CONFIG_NFS_V4_SECURITY_LABEL
|
|
|
|
| FATTR4_WORD2_SECURITY_LABEL
|
|
|
|
#endif
|
2012-06-05 20:16:47 +07:00
|
|
|
};
|
|
|
|
|
2012-10-03 08:07:32 +07:00
|
|
|
static const u32 nfs4_open_noattr_bitmap[3] = {
|
|
|
|
FATTR4_WORD0_TYPE
|
|
|
|
| FATTR4_WORD0_FILEID,
|
|
|
|
};
|
|
|
|
|
2013-05-22 23:50:41 +07:00
|
|
|
const u32 nfs4_statfs_bitmap[3] = {
|
2005-04-17 05:20:36 +07:00
|
|
|
FATTR4_WORD0_FILES_AVAIL
|
|
|
|
| FATTR4_WORD0_FILES_FREE
|
|
|
|
| FATTR4_WORD0_FILES_TOTAL,
|
|
|
|
FATTR4_WORD1_SPACE_AVAIL
|
|
|
|
| FATTR4_WORD1_SPACE_FREE
|
|
|
|
| FATTR4_WORD1_SPACE_TOTAL
|
|
|
|
};
|
|
|
|
|
2013-05-22 23:50:41 +07:00
|
|
|
const u32 nfs4_pathconf_bitmap[3] = {
|
2005-04-17 05:20:36 +07:00
|
|
|
FATTR4_WORD0_MAXLINK
|
|
|
|
| FATTR4_WORD0_MAXNAME,
|
|
|
|
0
|
|
|
|
};
|
|
|
|
|
2011-07-31 07:52:37 +07:00
|
|
|
const u32 nfs4_fsinfo_bitmap[3] = { FATTR4_WORD0_MAXFILESIZE
|
2005-04-17 05:20:36 +07:00
|
|
|
| FATTR4_WORD0_MAXREAD
|
|
|
|
| FATTR4_WORD0_MAXWRITE
|
|
|
|
| FATTR4_WORD0_LEASE_TIME,
|
2010-10-13 06:30:06 +07:00
|
|
|
FATTR4_WORD1_TIME_DELTA
|
2011-07-31 07:52:37 +07:00
|
|
|
| FATTR4_WORD1_FS_LAYOUT_TYPES,
|
|
|
|
FATTR4_WORD2_LAYOUT_BLKSIZE
|
2015-09-26 01:24:37 +07:00
|
|
|
| FATTR4_WORD2_CLONE_BLKSIZE
|
2005-04-17 05:20:36 +07:00
|
|
|
};
|
|
|
|
|
2013-05-22 23:50:41 +07:00
|
|
|
const u32 nfs4_fs_locations_bitmap[3] = {
|
2017-11-06 03:45:22 +07:00
|
|
|
FATTR4_WORD0_CHANGE
|
2006-06-09 20:34:25 +07:00
|
|
|
| FATTR4_WORD0_SIZE
|
|
|
|
| FATTR4_WORD0_FSID
|
|
|
|
| FATTR4_WORD0_FILEID
|
|
|
|
| FATTR4_WORD0_FS_LOCATIONS,
|
2017-11-06 03:45:22 +07:00
|
|
|
FATTR4_WORD1_OWNER
|
2006-06-09 20:34:25 +07:00
|
|
|
| FATTR4_WORD1_OWNER_GROUP
|
|
|
|
| FATTR4_WORD1_RAWDEV
|
|
|
|
| FATTR4_WORD1_SPACE_USED
|
|
|
|
| FATTR4_WORD1_TIME_ACCESS
|
|
|
|
| FATTR4_WORD1_TIME_METADATA
|
|
|
|
| FATTR4_WORD1_TIME_MODIFY
|
2013-05-22 23:50:41 +07:00
|
|
|
| FATTR4_WORD1_MOUNTED_ON_FILEID,
|
2006-06-09 20:34:25 +07:00
|
|
|
};
|
|
|
|
|
2018-04-08 00:44:28 +07:00
|
|
|
/*
 * Copy the NFS4_BITMASK_SZ-word attribute bitmap @src into @dst, then
 * drop the SIZE and CHANGE bits from word 0 when they do not need to be
 * requested.
 *
 * Nothing is dropped when @inode is NULL or when no read delegation is
 * held for it.  With a delegation and without NFS_INO_REVAL_FORCED set
 * in the inode's cache_validity, both bits are dropped.  When
 * revalidation is forced, each bit is dropped only if the matching
 * NFS_INO_INVALID_* flag is clear.
 */
static void nfs4_bitmap_copy_adjust(__u32 *dst, const __u32 *src,
		struct inode *inode)
{
	unsigned long validity;

	memcpy(dst, src, NFS4_BITMASK_SZ * sizeof(dst[0]));

	if (inode == NULL)
		return;
	if (!nfs4_have_delegation(inode, FMODE_READ))
		return;

	validity = READ_ONCE(NFS_I(inode)->cache_validity);

	if ((validity & NFS_INO_REVAL_FORCED) == 0) {
		/* Not forced: size and change are both treated as valid. */
		dst[0] &= ~FATTR4_WORD0_SIZE;
		dst[0] &= ~FATTR4_WORD0_CHANGE;
		return;
	}

	if ((validity & NFS_INO_INVALID_SIZE) == 0)
		dst[0] &= ~FATTR4_WORD0_SIZE;
	if ((validity & NFS_INO_INVALID_CHANGE) == 0)
		dst[0] &= ~FATTR4_WORD0_CHANGE;
}
|
|
|
|
|
|
|
|
/*
 * Bitmap copy helper with a SETATTR-specific name.  It simply forwards
 * to nfs4_bitmap_copy_adjust() with the same arguments.
 */
static void nfs4_bitmap_copy_adjust_setattr(__u32 *dst, const __u32 *src,
		struct inode *inode)
{
	nfs4_bitmap_copy_adjust(dst, src, inode);
}
|
|
|
|
|
2006-10-20 13:28:51 +07:00
|
|
|
/*
 * Write one synthetic directory entry at @p in XDR form and return the
 * position just past it.
 *
 * @cookie_lo: low word of the entry cookie (the high word is zero)
 * @namelen:   XDR-encoded length of the name
 * @name_word: the name padded with NULs to exactly four bytes
 * @attrs:     word-0 attribute bitmap advertised for the entry
 * @fileid:    file id encoded after the NF4DIR type
 */
static __be32 *nfs4_readdir_fake_entry(__be32 *p, __be32 cookie_lo,
		__be32 namelen, const char *name_word,
		unsigned int attrs, u64 fileid)
{
	*p++ = xdr_one;			/* next */
	*p++ = xdr_zero;		/* cookie, first word */
	*p++ = cookie_lo;		/* cookie, second word */
	*p++ = namelen;			/* entry len */
	memcpy(p, name_word, 4);	/* entry */
	p++;
	*p++ = xdr_one;			/* bitmap length */
	*p++ = htonl(attrs);		/* bitmap */
	*p++ = htonl(12);		/* attribute buffer length */
	*p++ = htonl(NF4DIR);
	return xdr_encode_hyper(p, fileid);
}

/*
 * Prepare @readdir for a READDIR starting at @cookie.
 *
 * For cookies above 2 the cookie and @verifier are passed through
 * unchanged.  Otherwise the request uses cookie 0 with a zeroed
 * verifier.
 *
 * NFSv4 servers do not return entries for '.' and '..', so they are
 * faked here at the start of the first reply page: '.' gets cookie 1
 * and '..' gets cookie 2.  A caller cookie of 0 gets both entries, a
 * cookie of 1 gets only '..', and a cookie of 2 gets neither.  pgbase
 * and count are then adjusted to skip the synthetic data.
 */
static void nfs4_setup_readdir(u64 cookie, __be32 *verifier, struct dentry *dentry,
		struct nfs4_readdir_arg *readdir)
{
	const unsigned int attrs = FATTR4_WORD0_FILEID | FATTR4_WORD0_TYPE;
	__be32 *base, *cur;

	if (cookie > 2) {
		readdir->cookie = cookie;
		memcpy(&readdir->verifier, verifier, sizeof(readdir->verifier));
		return;
	}

	readdir->cookie = 0;
	memset(&readdir->verifier, 0, sizeof(readdir->verifier));
	if (cookie == 2)
		return;

	base = kmap_atomic(*readdir->pages);
	cur = base;

	if (cookie == 0)
		cur = nfs4_readdir_fake_entry(cur, xdr_one, xdr_one,
				".\0\0\0", attrs,
				NFS_FILEID(d_inode(dentry)));

	cur = nfs4_readdir_fake_entry(cur, xdr_two, xdr_two,
			"..\0\0", attrs,
			NFS_FILEID(d_inode(dentry->d_parent)));

	readdir->pgbase = (char *)cur - (char *)base;
	readdir->count -= readdir->pgbase;
	kunmap_atomic(base);
}
|
|
|
|
|
2016-09-23 00:39:05 +07:00
|
|
|
static void nfs4_test_and_free_stateid(struct nfs_server *server,
|
|
|
|
nfs4_stateid *stateid,
|
|
|
|
struct rpc_cred *cred)
|
|
|
|
{
|
|
|
|
const struct nfs4_minor_version_ops *ops = server->nfs_client->cl_mvops;
|
|
|
|
|
|
|
|
ops->test_and_free_expired(server, stateid, cred);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void __nfs4_free_revoked_stateid(struct nfs_server *server,
|
|
|
|
nfs4_stateid *stateid,
|
|
|
|
struct rpc_cred *cred)
|
|
|
|
{
|
|
|
|
stateid->type = NFS4_REVOKED_STATEID_TYPE;
|
|
|
|
nfs4_test_and_free_stateid(server, stateid, cred);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void nfs4_free_revoked_stateid(struct nfs_server *server,
|
|
|
|
const nfs4_stateid *stateid,
|
|
|
|
struct rpc_cred *cred)
|
|
|
|
{
|
|
|
|
nfs4_stateid tmp;
|
|
|
|
|
|
|
|
nfs4_stateid_copy(&tmp, stateid);
|
|
|
|
__nfs4_free_revoked_stateid(server, &tmp, cred);
|
|
|
|
}
|
|
|
|
|
2014-09-18 13:09:27 +07:00
|
|
|
static long nfs4_update_delay(long *timeout)
|
|
|
|
{
|
|
|
|
long ret;
|
|
|
|
if (!timeout)
|
|
|
|
return NFS4_POLL_RETRY_MAX;
|
|
|
|
if (*timeout <= 0)
|
|
|
|
*timeout = NFS4_POLL_RETRY_MIN;
|
|
|
|
if (*timeout > NFS4_POLL_RETRY_MAX)
|
|
|
|
*timeout = NFS4_POLL_RETRY_MAX;
|
|
|
|
ret = *timeout;
|
|
|
|
*timeout <<= 1;
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2008-12-24 03:21:44 +07:00
|
|
|
static int nfs4_delay(struct rpc_clnt *clnt, long *timeout)
|
|
|
|
{
|
|
|
|
int res = 0;
|
|
|
|
|
|
|
|
might_sleep();
|
|
|
|
|
2014-09-18 13:09:27 +07:00
|
|
|
freezable_schedule_timeout_killable_unsafe(
|
|
|
|
nfs4_update_delay(timeout));
|
2008-12-24 03:21:44 +07:00
|
|
|
if (fatal_signal_pending(current))
|
|
|
|
res = -ERESTARTSYS;
|
|
|
|
return res;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* This is the error handling routine for processes that are allowed
|
|
|
|
* to sleep.
|
|
|
|
*/
|
2015-09-21 01:32:45 +07:00
|
|
|
static int nfs4_do_handle_exception(struct nfs_server *server,
|
|
|
|
int errorcode, struct nfs4_exception *exception)
|
2008-12-24 03:21:44 +07:00
|
|
|
{
|
|
|
|
struct nfs_client *clp = server->nfs_client;
|
2008-12-24 03:21:46 +07:00
|
|
|
struct nfs4_state *state = exception->state;
|
2016-06-26 19:44:35 +07:00
|
|
|
const nfs4_stateid *stateid = exception->stateid;
|
2012-03-08 04:39:06 +07:00
|
|
|
struct inode *inode = exception->inode;
|
2008-12-24 03:21:44 +07:00
|
|
|
int ret = errorcode;
|
|
|
|
|
2015-09-21 01:32:45 +07:00
|
|
|
exception->delay = 0;
|
|
|
|
exception->recovering = 0;
|
2008-12-24 03:21:44 +07:00
|
|
|
exception->retry = 0;
|
2016-09-23 00:39:15 +07:00
|
|
|
|
|
|
|
if (stateid == NULL && state != NULL)
|
|
|
|
stateid = &state->stateid;
|
|
|
|
|
2008-12-24 03:21:44 +07:00
|
|
|
switch(errorcode) {
|
|
|
|
case 0:
|
|
|
|
return 0;
|
2018-05-30 09:06:08 +07:00
|
|
|
case -NFS4ERR_BADHANDLE:
|
|
|
|
case -ESTALE:
|
|
|
|
if (inode != NULL && S_ISREG(inode->i_mode))
|
|
|
|
pnfs_destroy_layout(NFS_I(inode));
|
|
|
|
break;
|
2015-06-16 22:26:35 +07:00
|
|
|
case -NFS4ERR_DELEG_REVOKED:
|
|
|
|
case -NFS4ERR_ADMIN_REVOKED:
|
2016-09-23 00:39:15 +07:00
|
|
|
case -NFS4ERR_EXPIRED:
|
2015-06-16 22:26:35 +07:00
|
|
|
case -NFS4ERR_BAD_STATEID:
|
2016-09-23 00:39:15 +07:00
|
|
|
if (inode != NULL && stateid != NULL) {
|
|
|
|
nfs_inode_find_state_and_recover(inode,
|
|
|
|
stateid);
|
|
|
|
goto wait_on_recovery;
|
|
|
|
}
|
|
|
|
case -NFS4ERR_OPENMODE:
|
2016-06-26 19:44:35 +07:00
|
|
|
if (inode) {
|
|
|
|
int err;
|
|
|
|
|
|
|
|
err = nfs_async_inode_return_delegation(inode,
|
|
|
|
stateid);
|
|
|
|
if (err == 0)
|
|
|
|
goto wait_on_recovery;
|
|
|
|
if (stateid != NULL && stateid->type == NFS4_DELEGATION_STATEID_TYPE) {
|
|
|
|
exception->retry = 1;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
2012-03-08 04:39:06 +07:00
|
|
|
if (state == NULL)
|
|
|
|
break;
|
2013-03-15 03:57:48 +07:00
|
|
|
ret = nfs4_schedule_stateid_recovery(server, state);
|
|
|
|
if (ret < 0)
|
|
|
|
break;
|
2012-03-08 04:39:06 +07:00
|
|
|
goto wait_on_recovery;
|
2008-12-24 03:21:44 +07:00
|
|
|
case -NFS4ERR_STALE_STATEID:
|
2010-01-27 03:42:47 +07:00
|
|
|
case -NFS4ERR_STALE_CLIENTID:
|
2011-03-10 04:00:53 +07:00
|
|
|
nfs4_schedule_lease_recovery(clp);
|
|
|
|
goto wait_on_recovery;
|
2013-10-18 01:13:19 +07:00
|
|
|
case -NFS4ERR_MOVED:
|
|
|
|
ret = nfs4_schedule_migration_recovery(server);
|
|
|
|
if (ret < 0)
|
|
|
|
break;
|
|
|
|
goto wait_on_recovery;
|
2013-10-18 01:13:41 +07:00
|
|
|
case -NFS4ERR_LEASE_MOVED:
|
|
|
|
nfs4_schedule_lease_moved_recovery(clp);
|
|
|
|
goto wait_on_recovery;
|
2010-01-27 03:42:38 +07:00
|
|
|
#if defined(CONFIG_NFS_V4_1)
|
nfs41: kick start nfs41 session recovery when handling errors
Remove checking for any errors that the SEQUENCE operation does not return.
-NFS4ERR_STALE_CLIENTID, NFS4ERR_EXPIRED, NFS4ERR_CB_PATH_DOWN, NFS4ERR_BACK_CHAN_BUSY, NFS4ERR_OP_NOT_IN_SESSION.
SEQUENCE operation error recovery is very primitive, we only reset the session.
Remove checking for any errors that are returned by the SEQUENCE operation, but
that resetting the session won't address.
NFS4ERR_RETRY_UNCACHED_REP, NFS4ERR_SEQUENCE_POS,NFS4ERR_TOO_MANY_OPS.
Add error checking for missing SEQUENCE errors that a session reset will
address.
NFS4ERR_BAD_HIGH_SLOT, NFS4ERR_DEADSESSION, NFS4ERR_SEQ_FALSE_RETRY.
A reset of the session is currently our only response to a SEQUENCE operation
error. Don't reset the session on errors where a new session won't help.
Don't reset the session on errors where a new session won't help.
[nfs41: nfs4_async_handle_error update error checking]
Signed-off-by: Andy Adamson <andros@netapp.com>
Signed-off-by: Benny Halevy <bhalevy@panasas.com>
[nfs41: trigger the state manager for session reset]
Replace session state bit with nfs_client state bit. Set the
NFS4CLNT_SESSION_SETUP bit upon a session related error in the sync/async
error handlers.
[nfs41: _nfs4_async_handle_error fix session reset error list]
Sequence operation errors that session reset could help.
NFS4ERR_BADSESSION
NFS4ERR_BADSLOT
NFS4ERR_BAD_HIGH_SLOT
NFS4ERR_DEADSESSION
NFS4ERR_CONN_NOT_BOUND_TO_SESSION
NFS4ERR_SEQ_FALSE_RETRY
NFS4ERR_SEQ_MISORDERED
Sequence operation errors that a session reset would not help
NFS4ERR_BADXDR
NFS4ERR_DELAY
NFS4ERR_REP_TOO_BIG
NFS4ERR_REP_TOO_BIG_TO_CACHE
NFS4ERR_REQ_TOO_BIG
NFS4ERR_RETRY_UNCACHED_REP
NFS4ERR_SEQUENCE_POS
NFS4ERR_TOO_MANY_OPS
Signed-off-by: Andy Adamson <andros@netapp.com>
[nfs41 nfs4_handle_exception fix session reset error list]
Signed-off-by: Andy Adamson <andros@netapp.com>
Signed-off-by: Benny Halevy <bhalevy@panasas.com>
[moved nfs41_sequece_call_done code to nfs41: sequence operation]
Signed-off-by: Andy Adamson <andros@netapp.com>
Signed-off-by: Benny Halevy <bhalevy@panasas.com>
Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
2009-04-01 20:22:42 +07:00
|
|
|
case -NFS4ERR_BADSESSION:
|
|
|
|
case -NFS4ERR_BADSLOT:
|
|
|
|
case -NFS4ERR_BAD_HIGH_SLOT:
|
|
|
|
case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION:
|
|
|
|
case -NFS4ERR_DEADSESSION:
|
|
|
|
case -NFS4ERR_SEQ_FALSE_RETRY:
|
|
|
|
case -NFS4ERR_SEQ_MISORDERED:
|
|
|
|
dprintk("%s ERROR: %d Reset session\n", __func__,
|
|
|
|
errorcode);
|
2012-05-28 00:02:53 +07:00
|
|
|
nfs4_schedule_session_recovery(clp->cl_session, errorcode);
|
2012-10-31 03:06:35 +07:00
|
|
|
goto wait_on_recovery;
|
2010-01-27 03:42:38 +07:00
|
|
|
#endif /* defined(CONFIG_NFS_V4_1) */
|
2008-12-24 03:21:44 +07:00
|
|
|
case -NFS4ERR_FILE_OPEN:
|
2009-12-04 03:58:56 +07:00
|
|
|
if (exception->timeout > HZ) {
|
|
|
|
/* We have retried a decent amount, time to
|
|
|
|
* fail
|
|
|
|
*/
|
|
|
|
ret = -EBUSY;
|
|
|
|
break;
|
|
|
|
}
|
2008-12-24 03:21:44 +07:00
|
|
|
case -NFS4ERR_DELAY:
|
2015-09-21 03:10:18 +07:00
|
|
|
nfs_inc_server_stats(server, NFSIOS_DELAY);
|
|
|
|
case -NFS4ERR_GRACE:
|
2016-07-15 05:46:24 +07:00
|
|
|
case -NFS4ERR_LAYOUTTRYLATER:
|
pnfs: rework LAYOUTGET retry handling
There are several problems in the way a stateid is selected for a
LAYOUTGET operation:
We pick a stateid to use in the RPC prepare op, but that makes
it difficult to serialize LAYOUTGETs that use the open stateid. That
serialization is done in pnfs_update_layout, which occurs well before
the rpc_prepare operation.
Between those two events, the i_lock is dropped and reacquired.
pnfs_update_layout can find that the list has lsegs in it and not do any
serialization, but then later pnfs_choose_layoutget_stateid ends up
choosing the open stateid.
This patch changes the client to select the stateid to use in the
LAYOUTGET earlier, when we're searching for a usable layout segment.
This way we can do it all while holding the i_lock the first time, and
ensure that we serialize any LAYOUTGET call that uses a non-layout
stateid.
This also means a rework of how LAYOUTGET replies are handled, as we
must now get the latest stateid if we want to retransmit in response
to a retryable error.
Most of those errors boil down to the fact that the layout state has
changed in some fashion. Thus, what we really want to do is to re-search
for a layout when it fails with a retryable error, so that we can avoid
reissuing the RPC at all if possible.
While the LAYOUTGET RPC is async, the initiating thread always waits for
it to complete, so it's effectively synchronous anyway. Currently, when
we need to retry a LAYOUTGET because of an error, we drive that retry
via the rpc state machine.
This means that once the call has been submitted, it runs until it
completes. So, we must move the error handling for this RPC out of the
rpc_call_done operation and into the caller.
In order to handle errors like NFS4ERR_DELAY properly, we must also
pass a pointer to the sliding timeout, which is now moved to the stack
in pnfs_update_layout.
The complicating errors are -NFS4ERR_RECALLCONFLICT and
-NFS4ERR_LAYOUTTRYLATER, as those involve a timeout after which we give
up and return NULL back to the caller. So, there is some special
handling for those errors to ensure that the layers driving the retries
can handle that appropriately.
Signed-off-by: Jeff Layton <jeff.layton@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2016-05-17 23:28:47 +07:00
|
|
|
case -NFS4ERR_RECALLCONFLICT:
|
2015-09-21 01:32:45 +07:00
|
|
|
exception->delay = 1;
|
|
|
|
return 0;
|
|
|
|
|
2011-05-04 00:43:03 +07:00
|
|
|
case -NFS4ERR_RETRY_UNCACHED_REP:
|
2008-12-24 03:21:44 +07:00
|
|
|
case -NFS4ERR_OLD_STATEID:
|
|
|
|
exception->retry = 1;
|
2011-02-23 06:44:32 +07:00
|
|
|
break;
|
|
|
|
case -NFS4ERR_BADOWNER:
|
|
|
|
/* The following works around a Linux server bug! */
|
|
|
|
case -NFS4ERR_BADNAME:
|
|
|
|
if (server->caps & NFS_CAP_UIDGID_NOMAP) {
|
|
|
|
server->caps &= ~NFS_CAP_UIDGID_NOMAP;
|
|
|
|
exception->retry = 1;
|
|
|
|
printk(KERN_WARNING "NFS: v4 server %s "
|
|
|
|
"does not accept raw "
|
|
|
|
"uid/gids. "
|
|
|
|
"Reenabling the idmapper.\n",
|
|
|
|
server->nfs_client->cl_hostname);
|
|
|
|
}
|
2008-12-24 03:21:44 +07:00
|
|
|
}
|
|
|
|
/* We failed to handle the error */
|
|
|
|
return nfs4_map_errors(ret);
|
2011-03-10 04:00:53 +07:00
|
|
|
wait_on_recovery:
|
2015-09-21 01:32:45 +07:00
|
|
|
exception->recovering = 1;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* This is the error handling routine for processes that are allowed
|
|
|
|
* to sleep.
|
|
|
|
*/
|
|
|
|
int nfs4_handle_exception(struct nfs_server *server, int errorcode, struct nfs4_exception *exception)
|
|
|
|
{
|
|
|
|
struct nfs_client *clp = server->nfs_client;
|
|
|
|
int ret;
|
|
|
|
|
|
|
|
ret = nfs4_do_handle_exception(server, errorcode, exception);
|
|
|
|
if (exception->delay) {
|
|
|
|
ret = nfs4_delay(server->client, &exception->timeout);
|
|
|
|
goto out_retry;
|
|
|
|
}
|
|
|
|
if (exception->recovering) {
|
|
|
|
ret = nfs4_wait_clnt_recover(clp);
|
|
|
|
if (test_bit(NFS_MIG_FAILED, &server->mig_status))
|
|
|
|
return -EIO;
|
|
|
|
goto out_retry;
|
|
|
|
}
|
|
|
|
return ret;
|
|
|
|
out_retry:
|
2010-01-27 03:42:47 +07:00
|
|
|
if (ret == 0)
|
|
|
|
exception->retry = 1;
|
|
|
|
return ret;
|
2008-12-24 03:21:44 +07:00
|
|
|
}
|
|
|
|
|
2015-09-21 02:51:00 +07:00
|
|
|
static int
|
|
|
|
nfs4_async_handle_exception(struct rpc_task *task, struct nfs_server *server,
|
|
|
|
int errorcode, struct nfs4_exception *exception)
|
|
|
|
{
|
|
|
|
struct nfs_client *clp = server->nfs_client;
|
|
|
|
int ret;
|
|
|
|
|
|
|
|
ret = nfs4_do_handle_exception(server, errorcode, exception);
|
|
|
|
if (exception->delay) {
|
|
|
|
rpc_delay(task, nfs4_update_delay(&exception->timeout));
|
|
|
|
goto out_retry;
|
|
|
|
}
|
|
|
|
if (exception->recovering) {
|
|
|
|
rpc_sleep_on(&clp->cl_rpcwaitq, task, NULL);
|
|
|
|
if (test_bit(NFS4CLNT_MANAGER_RUNNING, &clp->cl_state) == 0)
|
|
|
|
rpc_wake_up_queued_task(&clp->cl_rpcwaitq, task);
|
|
|
|
goto out_retry;
|
|
|
|
}
|
2013-10-18 01:13:19 +07:00
|
|
|
if (test_bit(NFS_MIG_FAILED, &server->mig_status))
|
2015-09-21 02:51:00 +07:00
|
|
|
ret = -EIO;
|
|
|
|
return ret;
|
|
|
|
out_retry:
|
2010-01-27 03:42:47 +07:00
|
|
|
if (ret == 0)
|
|
|
|
exception->retry = 1;
|
|
|
|
return ret;
|
2008-12-24 03:21:44 +07:00
|
|
|
}
|
|
|
|
|
2015-09-21 02:51:00 +07:00
|
|
|
static int
|
|
|
|
nfs4_async_handle_error(struct rpc_task *task, struct nfs_server *server,
|
|
|
|
struct nfs4_state *state, long *timeout)
|
|
|
|
{
|
|
|
|
struct nfs4_exception exception = {
|
|
|
|
.state = state,
|
|
|
|
};
|
|
|
|
|
|
|
|
if (task->tk_status >= 0)
|
|
|
|
return 0;
|
|
|
|
if (timeout)
|
|
|
|
exception.timeout = *timeout;
|
|
|
|
task->tk_status = nfs4_async_handle_exception(task, server,
|
|
|
|
task->tk_status,
|
|
|
|
&exception);
|
|
|
|
if (exception.delay && timeout)
|
|
|
|
*timeout = exception.timeout;
|
|
|
|
if (exception.retry)
|
|
|
|
return -EAGAIN;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2013-09-04 02:18:49 +07:00
|
|
|
/*
|
|
|
|
* Return 'true' if 'clp' is using an rpc_client that is integrity protected
|
|
|
|
* or 'false' otherwise.
|
|
|
|
*/
|
|
|
|
static bool _nfs4_is_integrity_protected(struct nfs_client *clp)
|
|
|
|
{
|
|
|
|
rpc_authflavor_t flavor = clp->cl_rpcclient->cl_auth->au_flavor;
|
2017-01-12 04:01:21 +07:00
|
|
|
return (flavor == RPC_AUTH_GSS_KRB5I) || (flavor == RPC_AUTH_GSS_KRB5P);
|
2013-09-04 02:18:49 +07:00
|
|
|
}
|
2008-12-24 03:21:44 +07:00
|
|
|
|
2010-08-01 01:29:06 +07:00
|
|
|
static void do_renew_lease(struct nfs_client *clp, unsigned long timestamp)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
|
|
|
spin_lock(&clp->cl_lock);
|
|
|
|
if (time_before(clp->cl_last_renewal,timestamp))
|
|
|
|
clp->cl_last_renewal = timestamp;
|
|
|
|
spin_unlock(&clp->cl_lock);
|
|
|
|
}
|
|
|
|
|
2010-08-01 01:29:06 +07:00
|
|
|
static void renew_lease(const struct nfs_server *server, unsigned long timestamp)
|
|
|
|
{
|
2015-07-06 01:50:46 +07:00
|
|
|
struct nfs_client *clp = server->nfs_client;
|
|
|
|
|
|
|
|
if (!nfs4_has_session(clp))
|
|
|
|
do_renew_lease(clp, timestamp);
|
2010-08-01 01:29:06 +07:00
|
|
|
}
|
|
|
|
|
2013-08-09 23:48:00 +07:00
|
|
|
/*
 * Callback data for the call_sync rpc_call_ops: the prepare/done
 * callbacks receive a pointer to this as their 'calldata'.
 */
struct nfs4_call_sync_data {
	/* server whose nfs_client is used to set up the sequence */
	const struct nfs_server *seq_server;
	/* sequence arguments passed to nfs4_setup_sequence() */
	struct nfs4_sequence_args *seq_args;
	/* sequence result passed to setup and to the *_sequence_done() call */
	struct nfs4_sequence_res *seq_res;
};
|
|
|
|
|
2015-06-23 18:51:55 +07:00
|
|
|
void nfs4_init_sequence(struct nfs4_sequence_args *args,
|
2018-05-05 03:22:50 +07:00
|
|
|
struct nfs4_sequence_res *res, int cache_reply,
|
|
|
|
int privileged)
|
2013-08-09 23:48:18 +07:00
|
|
|
{
|
|
|
|
args->sa_slot = NULL;
|
|
|
|
args->sa_cache_this = cache_reply;
|
2018-05-05 03:22:50 +07:00
|
|
|
args->sa_privileged = privileged;
|
2013-08-09 23:48:18 +07:00
|
|
|
|
|
|
|
res->sr_slot = NULL;
|
|
|
|
}
|
|
|
|
|
2016-08-28 22:50:26 +07:00
|
|
|
static void nfs40_sequence_free_slot(struct nfs4_sequence_res *res)
|
2013-08-09 23:49:19 +07:00
|
|
|
{
|
|
|
|
struct nfs4_slot *slot = res->sr_slot;
|
|
|
|
struct nfs4_slot_table *tbl;
|
|
|
|
|
|
|
|
tbl = slot->table;
|
|
|
|
spin_lock(&tbl->slot_tbl_lock);
|
|
|
|
if (!nfs41_wake_and_assign_slot(tbl, slot))
|
|
|
|
nfs4_free_slot(tbl, slot);
|
|
|
|
spin_unlock(&tbl->slot_tbl_lock);
|
|
|
|
|
|
|
|
res->sr_slot = NULL;
|
2016-08-28 22:50:26 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
static int nfs40_sequence_done(struct rpc_task *task,
|
|
|
|
struct nfs4_sequence_res *res)
|
|
|
|
{
|
|
|
|
if (res->sr_slot != NULL)
|
|
|
|
nfs40_sequence_free_slot(res);
|
2013-08-09 23:49:19 +07:00
|
|
|
return 1;
|
|
|
|
}
|
|
|
|
|
2009-04-01 20:22:03 +07:00
|
|
|
#if defined(CONFIG_NFS_V4_1)
|
|
|
|
|
2017-10-20 02:46:45 +07:00
|
|
|
static void nfs41_release_slot(struct nfs4_slot *slot)
|
2009-04-01 20:22:17 +07:00
|
|
|
{
|
2012-11-17 00:25:01 +07:00
|
|
|
struct nfs4_session *session;
|
2009-04-01 20:22:17 +07:00
|
|
|
struct nfs4_slot_table *tbl;
|
2012-11-27 04:16:54 +07:00
|
|
|
bool send_new_highest_used_slotid = false;
|
2009-04-01 20:22:17 +07:00
|
|
|
|
2017-10-20 02:46:45 +07:00
|
|
|
if (!slot)
|
|
|
|
return;
|
2014-01-30 00:24:03 +07:00
|
|
|
tbl = slot->table;
|
2012-11-17 00:25:01 +07:00
|
|
|
session = tbl->session;
|
2009-12-05 03:55:38 +07:00
|
|
|
|
2016-08-28 21:28:25 +07:00
|
|
|
/* Bump the slot sequence number */
|
|
|
|
if (slot->seq_done)
|
|
|
|
slot->seq_nr++;
|
|
|
|
slot->seq_done = 0;
|
|
|
|
|
2009-12-06 07:32:19 +07:00
|
|
|
spin_lock(&tbl->slot_tbl_lock);
|
2012-11-27 04:16:54 +07:00
|
|
|
/* Be nice to the server: try to ensure that the last transmitted
|
|
|
|
* value for highest_user_slotid <= target_highest_slotid
|
|
|
|
*/
|
|
|
|
if (tbl->highest_used_slotid > tbl->target_highest_slotid)
|
|
|
|
send_new_highest_used_slotid = true;
|
|
|
|
|
2014-01-30 00:24:03 +07:00
|
|
|
if (nfs41_wake_and_assign_slot(tbl, slot)) {
|
2012-11-30 05:27:47 +07:00
|
|
|
send_new_highest_used_slotid = false;
|
|
|
|
goto out_unlock;
|
|
|
|
}
|
2014-01-30 00:24:03 +07:00
|
|
|
nfs4_free_slot(tbl, slot);
|
2012-11-27 04:16:54 +07:00
|
|
|
|
|
|
|
if (tbl->highest_used_slotid != NFS4_NO_SLOT)
|
|
|
|
send_new_highest_used_slotid = false;
|
2012-11-30 05:27:47 +07:00
|
|
|
out_unlock:
|
2009-12-06 07:32:19 +07:00
|
|
|
spin_unlock(&tbl->slot_tbl_lock);
|
2012-11-27 04:16:54 +07:00
|
|
|
if (send_new_highest_used_slotid)
|
2015-07-14 01:01:31 +07:00
|
|
|
nfs41_notify_server(session->clp);
|
2016-08-29 00:25:43 +07:00
|
|
|
if (waitqueue_active(&tbl->slot_waitq))
|
|
|
|
wake_up_all(&tbl->slot_waitq);
|
2009-04-01 20:22:17 +07:00
|
|
|
}
|
|
|
|
|
2017-10-20 02:46:45 +07:00
|
|
|
static void nfs41_sequence_free_slot(struct nfs4_sequence_res *res)
|
|
|
|
{
|
|
|
|
nfs41_release_slot(res->sr_slot);
|
|
|
|
res->sr_slot = NULL;
|
|
|
|
}
|
|
|
|
|
2016-08-28 22:50:26 +07:00
|
|
|
static int nfs41_sequence_process(struct rpc_task *task,
|
|
|
|
struct nfs4_sequence_res *res)
|
2009-04-01 20:22:18 +07:00
|
|
|
{
|
2012-11-17 00:25:01 +07:00
|
|
|
struct nfs4_session *session;
|
2014-01-30 00:24:03 +07:00
|
|
|
struct nfs4_slot *slot = res->sr_slot;
|
2010-08-01 01:29:06 +07:00
|
|
|
struct nfs_client *clp;
|
2012-12-16 03:36:07 +07:00
|
|
|
bool interrupted = false;
|
2012-12-11 22:31:12 +07:00
|
|
|
int ret = 1;
|
2009-04-01 20:22:18 +07:00
|
|
|
|
2014-01-30 00:24:03 +07:00
|
|
|
if (slot == NULL)
|
|
|
|
goto out_noaction;
|
2011-04-19 02:57:32 +07:00
|
|
|
/* don't increment the sequence number if the task wasn't sent */
|
|
|
|
if (!RPC_WAS_SENT(task))
|
2009-04-01 20:22:18 +07:00
|
|
|
goto out;
|
|
|
|
|
2012-11-17 00:25:01 +07:00
|
|
|
session = slot->table->session;
|
2012-11-17 00:12:38 +07:00
|
|
|
|
2012-12-16 03:36:07 +07:00
|
|
|
if (slot->interrupted) {
|
2017-04-27 01:21:22 +07:00
|
|
|
if (res->sr_status != -NFS4ERR_DELAY)
|
|
|
|
slot->interrupted = 0;
|
2012-12-16 03:36:07 +07:00
|
|
|
interrupted = true;
|
|
|
|
}
|
|
|
|
|
2013-08-15 04:58:28 +07:00
|
|
|
trace_nfs4_sequence_done(session, res);
|
2009-12-05 03:55:39 +07:00
|
|
|
/* Check the SEQUENCE operation status */
|
2010-08-01 01:29:06 +07:00
|
|
|
switch (res->sr_status) {
|
|
|
|
case 0:
|
2009-04-01 20:22:18 +07:00
|
|
|
/* Update the slot's sequence and clientid lease timer */
|
2016-08-28 21:28:25 +07:00
|
|
|
slot->seq_done = 1;
|
2012-11-17 00:25:01 +07:00
|
|
|
clp = session->clp;
|
2012-12-16 03:21:52 +07:00
|
|
|
do_renew_lease(clp, res->sr_timestamp);
|
2009-12-06 01:46:14 +07:00
|
|
|
/* Check sequence flags */
|
2016-09-23 00:38:51 +07:00
|
|
|
nfs41_handle_sequence_flag_errors(clp, res->sr_status_flags,
|
|
|
|
!!slot->privileged);
|
2012-11-21 00:49:27 +07:00
|
|
|
nfs41_update_target_slotid(slot->table, slot, res);
|
2010-08-01 01:29:06 +07:00
|
|
|
break;
|
2012-12-16 03:36:07 +07:00
|
|
|
case 1:
|
|
|
|
/*
|
|
|
|
* sr_status remains 1 if an RPC level error occurred.
|
|
|
|
* The server may or may not have processed the sequence
|
|
|
|
* operation..
|
|
|
|
* Mark the slot as having hosted an interrupted RPC call.
|
|
|
|
*/
|
|
|
|
slot->interrupted = 1;
|
|
|
|
goto out;
|
2010-08-01 01:29:06 +07:00
|
|
|
case -NFS4ERR_DELAY:
|
|
|
|
/* The server detected a resend of the RPC call and
|
|
|
|
* returned NFS4ERR_DELAY as per Section 2.10.6.2
|
|
|
|
* of RFC5661.
|
|
|
|
*/
|
2012-11-17 00:45:06 +07:00
|
|
|
dprintk("%s: slot=%u seq=%u: Operation in progress\n",
|
2010-09-24 20:17:01 +07:00
|
|
|
__func__,
|
2012-11-17 00:45:06 +07:00
|
|
|
slot->slot_nr,
|
2012-11-17 00:12:38 +07:00
|
|
|
slot->seq_nr);
|
2010-08-01 01:29:06 +07:00
|
|
|
goto out_retry;
|
2018-06-10 06:10:31 +07:00
|
|
|
case -NFS4ERR_RETRY_UNCACHED_REP:
|
|
|
|
case -NFS4ERR_SEQ_FALSE_RETRY:
|
|
|
|
/*
|
|
|
|
* The server thinks we tried to replay a request.
|
|
|
|
* Retry the call after bumping the sequence ID.
|
|
|
|
*/
|
|
|
|
goto retry_new_seq;
|
2012-12-11 22:31:12 +07:00
|
|
|
case -NFS4ERR_BADSLOT:
|
|
|
|
/*
|
|
|
|
* The slot id we used was probably retired. Try again
|
|
|
|
* using a different slot id.
|
|
|
|
*/
|
2018-06-09 23:50:50 +07:00
|
|
|
if (slot->slot_nr < slot->table->target_highest_slotid)
|
2017-10-20 02:46:45 +07:00
|
|
|
goto session_recover;
|
2012-12-16 01:56:18 +07:00
|
|
|
goto retry_nowait;
|
|
|
|
case -NFS4ERR_SEQ_MISORDERED:
|
2012-12-16 03:36:07 +07:00
|
|
|
/*
|
|
|
|
* Was the last operation on this sequence interrupted?
|
|
|
|
* If so, retry after bumping the sequence number.
|
|
|
|
*/
|
2017-10-20 02:46:45 +07:00
|
|
|
if (interrupted)
|
|
|
|
goto retry_new_seq;
|
2012-12-16 01:56:18 +07:00
|
|
|
/*
|
|
|
|
* Could this slot have been previously retired?
|
|
|
|
* If so, then the server may be expecting seq_nr = 1!
|
|
|
|
*/
|
2012-12-16 03:21:52 +07:00
|
|
|
if (slot->seq_nr != 1) {
|
|
|
|
slot->seq_nr = 1;
|
|
|
|
goto retry_nowait;
|
|
|
|
}
|
2017-10-20 02:46:45 +07:00
|
|
|
goto session_recover;
|
2010-08-01 01:29:06 +07:00
|
|
|
default:
|
|
|
|
/* Just update the slot sequence no. */
|
2016-08-28 21:28:25 +07:00
|
|
|
slot->seq_done = 1;
|
2009-04-01 20:22:18 +07:00
|
|
|
}
|
|
|
|
out:
|
|
|
|
/* The session may be reset by one of the error handlers. */
|
|
|
|
dprintk("%s: Error %d free the slot \n", __func__, res->sr_status);
|
2014-01-30 00:24:03 +07:00
|
|
|
out_noaction:
|
2012-12-11 22:31:12 +07:00
|
|
|
return ret;
|
2017-10-20 02:46:45 +07:00
|
|
|
session_recover:
|
|
|
|
nfs4_schedule_session_recovery(session, res->sr_status);
|
|
|
|
goto retry_nowait;
|
|
|
|
retry_new_seq:
|
|
|
|
++slot->seq_nr;
|
2012-12-16 01:56:18 +07:00
|
|
|
retry_nowait:
|
|
|
|
if (rpc_restart_call_prepare(task)) {
|
2016-08-28 22:50:26 +07:00
|
|
|
nfs41_sequence_free_slot(res);
|
2012-12-16 01:56:18 +07:00
|
|
|
task->tk_status = 0;
|
|
|
|
ret = 0;
|
|
|
|
}
|
|
|
|
goto out;
|
2010-08-01 01:29:06 +07:00
|
|
|
out_retry:
|
2010-08-01 01:29:07 +07:00
|
|
|
if (!rpc_restart_call(task))
|
2010-08-01 01:29:06 +07:00
|
|
|
goto out;
|
|
|
|
rpc_delay(task, NFS4_POLL_RETRY_MAX);
|
|
|
|
return 0;
|
2009-04-01 20:22:18 +07:00
|
|
|
}
|
2016-08-28 22:50:26 +07:00
|
|
|
|
|
|
|
int nfs41_sequence_done(struct rpc_task *task, struct nfs4_sequence_res *res)
|
|
|
|
{
|
|
|
|
if (!nfs41_sequence_process(task, res))
|
|
|
|
return 0;
|
|
|
|
if (res->sr_slot != NULL)
|
|
|
|
nfs41_sequence_free_slot(res);
|
|
|
|
return 1;
|
|
|
|
|
|
|
|
}
|
2014-01-29 23:34:38 +07:00
|
|
|
EXPORT_SYMBOL_GPL(nfs41_sequence_done);
|
2009-04-01 20:22:18 +07:00
|
|
|
|
2016-08-28 22:50:26 +07:00
|
|
|
static int nfs4_sequence_process(struct rpc_task *task, struct nfs4_sequence_res *res)
|
|
|
|
{
|
|
|
|
if (res->sr_slot == NULL)
|
|
|
|
return 1;
|
|
|
|
if (res->sr_slot->table->session != NULL)
|
|
|
|
return nfs41_sequence_process(task, res);
|
|
|
|
return nfs40_sequence_done(task, res);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void nfs4_sequence_free_slot(struct nfs4_sequence_res *res)
|
|
|
|
{
|
|
|
|
if (res->sr_slot != NULL) {
|
|
|
|
if (res->sr_slot->table->session != NULL)
|
|
|
|
nfs41_sequence_free_slot(res);
|
|
|
|
else
|
|
|
|
nfs40_sequence_free_slot(res);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-06-11 04:24:16 +07:00
|
|
|
int nfs4_sequence_done(struct rpc_task *task, struct nfs4_sequence_res *res)
|
2010-06-16 20:52:26 +07:00
|
|
|
{
|
2012-11-17 00:25:01 +07:00
|
|
|
if (res->sr_slot == NULL)
|
2010-08-01 01:29:06 +07:00
|
|
|
return 1;
|
2013-08-09 23:49:19 +07:00
|
|
|
if (!res->sr_slot->table->session)
|
|
|
|
return nfs40_sequence_done(task, res);
|
2010-08-01 01:29:06 +07:00
|
|
|
return nfs41_sequence_done(task, res);
|
2010-06-16 20:52:26 +07:00
|
|
|
}
|
2014-06-11 04:24:16 +07:00
|
|
|
EXPORT_SYMBOL_GPL(nfs4_sequence_done);
|
2010-06-16 20:52:26 +07:00
|
|
|
|
2009-04-01 20:22:13 +07:00
|
|
|
static void nfs41_call_sync_prepare(struct rpc_task *task, void *calldata)
|
|
|
|
{
|
2013-08-09 23:48:00 +07:00
|
|
|
struct nfs4_call_sync_data *data = calldata;
|
2009-04-01 20:22:13 +07:00
|
|
|
|
2010-06-16 20:52:26 +07:00
|
|
|
dprintk("--> %s data->seq_server %p\n", __func__, data->seq_server);
|
|
|
|
|
2017-01-10 23:39:53 +07:00
|
|
|
nfs4_setup_sequence(data->seq_server->nfs_client,
|
|
|
|
data->seq_args, data->seq_res, task);
|
2009-04-01 20:22:13 +07:00
|
|
|
}
|
|
|
|
|
2009-04-01 20:22:19 +07:00
|
|
|
static void nfs41_call_sync_done(struct rpc_task *task, void *calldata)
|
|
|
|
{
|
2013-08-09 23:48:00 +07:00
|
|
|
struct nfs4_call_sync_data *data = calldata;
|
2009-04-01 20:22:19 +07:00
|
|
|
|
2010-08-01 01:29:06 +07:00
|
|
|
nfs41_sequence_done(task, data->seq_res);
|
2009-04-01 20:22:19 +07:00
|
|
|
}
|
|
|
|
|
2012-03-12 00:11:00 +07:00
|
|
|
static const struct rpc_call_ops nfs41_call_sync_ops = {
|
2009-04-01 20:22:13 +07:00
|
|
|
.rpc_call_prepare = nfs41_call_sync_prepare,
|
2009-04-01 20:22:19 +07:00
|
|
|
.rpc_call_done = nfs41_call_sync_done,
|
2009-04-01 20:22:13 +07:00
|
|
|
};
|
|
|
|
|
2017-10-20 02:46:45 +07:00
|
|
|
static void
|
|
|
|
nfs4_sequence_process_interrupted(struct nfs_client *client,
|
|
|
|
struct nfs4_slot *slot, struct rpc_cred *cred)
|
|
|
|
{
|
|
|
|
struct rpc_task *task;
|
|
|
|
|
|
|
|
task = _nfs41_proc_sequence(client, cred, slot, true);
|
|
|
|
if (!IS_ERR(task))
|
|
|
|
rpc_put_task_async(task);
|
|
|
|
}
|
|
|
|
|
2013-08-09 23:49:19 +07:00
|
|
|
#else /* !CONFIG_NFS_V4_1 */
|
|
|
|
|
2016-08-28 22:50:26 +07:00
|
|
|
/*
 * Without CONFIG_NFS_V4_1 there are no sessions: sequence processing
 * is simply the NFSv4.0 completion.
 */
static int nfs4_sequence_process(struct rpc_task *task, struct nfs4_sequence_res *res)
{
	int done = nfs40_sequence_done(task, res);

	return done;
}
|
|
|
|
|
|
|
|
static void nfs4_sequence_free_slot(struct nfs4_sequence_res *res)
|
|
|
|
{
|
|
|
|
if (res->sr_slot != NULL)
|
|
|
|
nfs40_sequence_free_slot(res);
|
|
|
|
}
|
|
|
|
|
2014-06-11 04:24:16 +07:00
|
|
|
/*
 * Without CONFIG_NFS_V4_1: sequence completion is always the NFSv4.0
 * variant.
 */
int nfs4_sequence_done(struct rpc_task *task,
		       struct nfs4_sequence_res *res)
{
	int done = nfs40_sequence_done(task, res);

	return done;
}
EXPORT_SYMBOL_GPL(nfs4_sequence_done);
|
2013-08-09 23:49:19 +07:00
|
|
|
|
2017-10-20 02:46:45 +07:00
|
|
|
static void
|
|
|
|
nfs4_sequence_process_interrupted(struct nfs_client *client,
|
|
|
|
struct nfs4_slot *slot, struct rpc_cred *cred)
|
|
|
|
{
|
|
|
|
WARN_ON_ONCE(1);
|
|
|
|
slot->interrupted = 0;
|
|
|
|
}
|
|
|
|
|
2013-08-09 23:49:19 +07:00
|
|
|
#endif /* !CONFIG_NFS_V4_1 */
|
2013-08-09 23:48:27 +07:00
|
|
|
|
2017-10-20 02:46:45 +07:00
|
|
|
static
|
|
|
|
void nfs4_sequence_attach_slot(struct nfs4_sequence_args *args,
|
|
|
|
struct nfs4_sequence_res *res,
|
|
|
|
struct nfs4_slot *slot)
|
|
|
|
{
|
|
|
|
if (!slot)
|
|
|
|
return;
|
|
|
|
slot->privileged = args->sa_privileged ? 1 : 0;
|
|
|
|
args->sa_slot = slot;
|
|
|
|
|
|
|
|
res->sr_slot = slot;
|
|
|
|
res->sr_timestamp = jiffies;
|
|
|
|
res->sr_status_flags = 0;
|
|
|
|
res->sr_status = 1;
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
int nfs4_setup_sequence(struct nfs_client *client,
|
2017-01-10 23:39:53 +07:00
|
|
|
struct nfs4_sequence_args *args,
|
|
|
|
struct nfs4_sequence_res *res,
|
|
|
|
struct rpc_task *task)
|
|
|
|
{
|
|
|
|
struct nfs4_session *session = nfs4_get_session(client);
|
2017-01-11 04:49:31 +07:00
|
|
|
struct nfs4_slot_table *tbl = client->cl_slot_tbl;
|
2017-01-11 22:54:04 +07:00
|
|
|
struct nfs4_slot *slot;
|
2017-01-10 23:39:53 +07:00
|
|
|
|
2017-01-11 00:01:46 +07:00
|
|
|
/* slot already allocated? */
|
|
|
|
if (res->sr_slot != NULL)
|
|
|
|
goto out_start;
|
|
|
|
|
2017-01-11 04:49:31 +07:00
|
|
|
if (session) {
|
|
|
|
tbl = &session->fc_slot_table;
|
|
|
|
task->tk_timeout = 0;
|
|
|
|
}
|
|
|
|
|
2017-10-20 02:46:45 +07:00
|
|
|
for (;;) {
|
|
|
|
spin_lock(&tbl->slot_tbl_lock);
|
|
|
|
/* The state manager will wait until the slot table is empty */
|
|
|
|
if (nfs4_slot_tbl_draining(tbl) && !args->sa_privileged)
|
|
|
|
goto out_sleep;
|
|
|
|
|
|
|
|
slot = nfs4_alloc_slot(tbl);
|
|
|
|
if (IS_ERR(slot)) {
|
|
|
|
/* Try again in 1/4 second */
|
|
|
|
if (slot == ERR_PTR(-ENOMEM))
|
|
|
|
task->tk_timeout = HZ >> 2;
|
|
|
|
goto out_sleep;
|
|
|
|
}
|
|
|
|
spin_unlock(&tbl->slot_tbl_lock);
|
2017-01-11 04:13:27 +07:00
|
|
|
|
2017-10-20 02:46:45 +07:00
|
|
|
if (likely(!slot->interrupted))
|
|
|
|
break;
|
|
|
|
nfs4_sequence_process_interrupted(client,
|
|
|
|
slot, task->tk_msg.rpc_cred);
|
2017-01-11 22:54:04 +07:00
|
|
|
}
|
|
|
|
|
2017-10-20 02:46:45 +07:00
|
|
|
nfs4_sequence_attach_slot(args, res, slot);
|
2017-01-11 22:54:04 +07:00
|
|
|
|
2017-01-12 01:37:06 +07:00
|
|
|
trace_nfs4_setup_sequence(session, args);
|
2017-01-11 00:01:46 +07:00
|
|
|
out_start:
|
|
|
|
rpc_call_start(task);
|
|
|
|
return 0;
|
2017-01-11 04:29:54 +07:00
|
|
|
|
|
|
|
out_sleep:
|
|
|
|
if (args->sa_privileged)
|
|
|
|
rpc_sleep_on_priority(&tbl->slot_tbl_waitq, task,
|
|
|
|
NULL, RPC_PRIORITY_PRIVILEGED);
|
|
|
|
else
|
|
|
|
rpc_sleep_on(&tbl->slot_tbl_waitq, task, NULL);
|
|
|
|
spin_unlock(&tbl->slot_tbl_lock);
|
|
|
|
return -EAGAIN;
|
2017-01-10 23:39:53 +07:00
|
|
|
}
|
|
|
|
EXPORT_SYMBOL_GPL(nfs4_setup_sequence);
|
|
|
|
|
2013-08-09 23:48:27 +07:00
|
|
|
static void nfs40_call_sync_prepare(struct rpc_task *task, void *calldata)
|
|
|
|
{
|
|
|
|
struct nfs4_call_sync_data *data = calldata;
|
2017-01-10 03:48:22 +07:00
|
|
|
nfs4_setup_sequence(data->seq_server->nfs_client,
|
2013-08-09 23:48:27 +07:00
|
|
|
data->seq_args, data->seq_res, task);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void nfs40_call_sync_done(struct rpc_task *task, void *calldata)
|
|
|
|
{
|
|
|
|
struct nfs4_call_sync_data *data = calldata;
|
|
|
|
nfs4_sequence_done(task, data->seq_res);
|
|
|
|
}
|
|
|
|
|
|
|
|
static const struct rpc_call_ops nfs40_call_sync_ops = {
|
|
|
|
.rpc_call_prepare = nfs40_call_sync_prepare,
|
|
|
|
.rpc_call_done = nfs40_call_sync_done,
|
|
|
|
};
|
|
|
|
|
2011-03-25 00:12:24 +07:00
|
|
|
static int nfs4_call_sync_sequence(struct rpc_clnt *clnt,
|
|
|
|
struct nfs_server *server,
|
2009-04-01 20:22:13 +07:00
|
|
|
struct rpc_message *msg,
|
|
|
|
struct nfs4_sequence_args *args,
|
2012-10-30 06:02:20 +07:00
|
|
|
struct nfs4_sequence_res *res)
|
2009-04-01 20:22:13 +07:00
|
|
|
{
|
|
|
|
int ret;
|
|
|
|
struct rpc_task *task;
|
2013-08-09 23:48:27 +07:00
|
|
|
struct nfs_client *clp = server->nfs_client;
|
2013-08-09 23:48:00 +07:00
|
|
|
struct nfs4_call_sync_data data = {
|
2010-06-16 20:52:26 +07:00
|
|
|
.seq_server = server,
|
2009-04-01 20:22:13 +07:00
|
|
|
.seq_args = args,
|
|
|
|
.seq_res = res,
|
|
|
|
};
|
|
|
|
struct rpc_task_setup task_setup = {
|
2011-03-25 00:12:24 +07:00
|
|
|
.rpc_client = clnt,
|
2009-04-01 20:22:13 +07:00
|
|
|
.rpc_message = msg,
|
2013-08-09 23:48:27 +07:00
|
|
|
.callback_ops = clp->cl_mvops->call_sync_ops,
|
2009-04-01 20:22:13 +07:00
|
|
|
.callback_data = &data
|
|
|
|
};
|
|
|
|
|
|
|
|
task = rpc_run_task(&task_setup);
|
|
|
|
if (IS_ERR(task))
|
|
|
|
ret = PTR_ERR(task);
|
|
|
|
else {
|
|
|
|
ret = task->tk_status;
|
|
|
|
rpc_put_task(task);
|
|
|
|
}
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2011-03-25 00:12:24 +07:00
|
|
|
/*
 * Initialise the sequence args/res pair as unprivileged, with the
 * given cache_reply setting, and then run the call through
 * nfs4_call_sync_sequence().  Returns that function's result.
 */
int nfs4_call_sync(struct rpc_clnt *clnt,
		   struct nfs_server *server,
		   struct rpc_message *msg,
		   struct nfs4_sequence_args *args,
		   struct nfs4_sequence_res *res,
		   int cache_reply)
{
	int status;

	nfs4_init_sequence(args, res, cache_reply, 0);
	status = nfs4_call_sync_sequence(clnt, server, msg, args, res);
	return status;
}
|
2009-04-01 20:22:03 +07:00
|
|
|
|
2017-01-12 10:07:28 +07:00
|
|
|
static void update_changeattr(struct inode *dir, struct nfs4_change_info *cinfo,
|
|
|
|
unsigned long timestamp)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
2006-05-25 12:40:57 +07:00
|
|
|
struct nfs_inode *nfsi = NFS_I(dir);
|
2005-04-17 05:20:36 +07:00
|
|
|
|
2006-05-25 12:40:57 +07:00
|
|
|
spin_lock(&dir->i_lock);
|
2018-03-21 03:53:31 +07:00
|
|
|
nfsi->cache_validity |= NFS_INO_INVALID_CTIME
|
|
|
|
| NFS_INO_INVALID_MTIME
|
|
|
|
| NFS_INO_INVALID_DATA;
|
2018-01-09 20:21:17 +07:00
|
|
|
if (cinfo->atomic && cinfo->before == inode_peek_iversion_raw(dir)) {
|
2016-12-17 04:55:55 +07:00
|
|
|
nfsi->cache_validity &= ~NFS_INO_REVAL_PAGECACHE;
|
|
|
|
nfsi->attrtimeo_timestamp = jiffies;
|
|
|
|
} else {
|
2007-10-16 05:18:29 +07:00
|
|
|
nfs_force_lookup_revalidate(dir);
|
2018-01-09 20:21:17 +07:00
|
|
|
if (cinfo->before != inode_peek_iversion_raw(dir))
|
2016-12-17 04:55:55 +07:00
|
|
|
nfsi->cache_validity |= NFS_INO_INVALID_ACCESS |
|
|
|
|
NFS_INO_INVALID_ACL;
|
|
|
|
}
|
2018-01-09 20:21:17 +07:00
|
|
|
inode_set_iversion_raw(dir, cinfo->after);
|
2017-01-12 10:07:28 +07:00
|
|
|
nfsi->read_cache_jiffies = timestamp;
|
2015-02-27 07:52:06 +07:00
|
|
|
nfsi->attr_gencount = nfs_inc_attr_generation_counter();
|
2012-12-21 04:52:38 +07:00
|
|
|
nfs_fscache_invalidate(dir);
|
2006-05-25 12:40:57 +07:00
|
|
|
spin_unlock(&dir->i_lock);
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
2017-11-07 03:28:03 +07:00
|
|
|
struct nfs4_open_createattrs {
|
|
|
|
struct nfs4_label *label;
|
|
|
|
struct iattr *sattr;
|
|
|
|
const __u32 verf[2];
|
|
|
|
};
|
|
|
|
|
2013-03-16 03:44:28 +07:00
|
|
|
static bool nfs4_clear_cap_atomic_open_v1(struct nfs_server *server,
|
|
|
|
int err, struct nfs4_exception *exception)
|
|
|
|
{
|
|
|
|
if (err != -EINVAL)
|
|
|
|
return false;
|
|
|
|
if (!(server->caps & NFS_CAP_ATOMIC_OPEN_V1))
|
|
|
|
return false;
|
|
|
|
server->caps &= ~NFS_CAP_ATOMIC_OPEN_V1;
|
|
|
|
exception->retry = 1;
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2015-01-31 02:21:14 +07:00
|
|
|
static u32
|
|
|
|
nfs4_map_atomic_open_share(struct nfs_server *server,
|
|
|
|
fmode_t fmode, int openflags)
|
|
|
|
{
|
|
|
|
u32 res = 0;
|
|
|
|
|
|
|
|
switch (fmode & (FMODE_READ | FMODE_WRITE)) {
|
|
|
|
case FMODE_READ:
|
|
|
|
res = NFS4_SHARE_ACCESS_READ;
|
|
|
|
break;
|
|
|
|
case FMODE_WRITE:
|
|
|
|
res = NFS4_SHARE_ACCESS_WRITE;
|
|
|
|
break;
|
|
|
|
case FMODE_READ|FMODE_WRITE:
|
|
|
|
res = NFS4_SHARE_ACCESS_BOTH;
|
|
|
|
}
|
|
|
|
if (!(server->caps & NFS_CAP_ATOMIC_OPEN_V1))
|
|
|
|
goto out;
|
|
|
|
/* Want no delegation if we're using O_DIRECT */
|
|
|
|
if (openflags & O_DIRECT)
|
|
|
|
res |= NFS4_SHARE_WANT_NO_DELEG;
|
|
|
|
out:
|
|
|
|
return res;
|
|
|
|
}
|
|
|
|
|
2013-03-16 03:44:28 +07:00
|
|
|
static enum open_claim_type4
|
|
|
|
nfs4_map_atomic_open_claim(struct nfs_server *server,
|
|
|
|
enum open_claim_type4 claim)
|
|
|
|
{
|
|
|
|
if (server->caps & NFS_CAP_ATOMIC_OPEN_V1)
|
|
|
|
return claim;
|
|
|
|
switch (claim) {
|
|
|
|
default:
|
|
|
|
return claim;
|
|
|
|
case NFS4_OPEN_CLAIM_FH:
|
|
|
|
return NFS4_OPEN_CLAIM_NULL;
|
|
|
|
case NFS4_OPEN_CLAIM_DELEG_CUR_FH:
|
|
|
|
return NFS4_OPEN_CLAIM_DELEGATE_CUR;
|
|
|
|
case NFS4_OPEN_CLAIM_DELEG_PREV_FH:
|
|
|
|
return NFS4_OPEN_CLAIM_DELEGATE_PREV;
|
|
|
|
}
|
|
|
|
}
|
2007-07-04 10:48:13 +07:00
|
|
|
|
|
|
|
static void nfs4_init_opendata_res(struct nfs4_opendata *p)
|
|
|
|
{
|
|
|
|
p->o_res.f_attr = &p->f_attr;
|
2013-05-22 23:50:42 +07:00
|
|
|
p->o_res.f_label = p->f_label;
|
2008-04-08 00:20:54 +07:00
|
|
|
p->o_res.seqid = p->o_arg.seqid;
|
|
|
|
p->c_res.seqid = p->c_arg.seqid;
|
2007-07-04 10:48:13 +07:00
|
|
|
p->o_res.server = p->o_arg.server;
|
2012-10-03 13:39:34 +07:00
|
|
|
p->o_res.access_request = p->o_arg.access;
|
2007-07-04 10:48:13 +07:00
|
|
|
nfs_fattr_init(&p->f_attr);
|
2012-01-08 01:22:46 +07:00
|
|
|
nfs_fattr_init_names(&p->f_attr, &p->owner_name, &p->group_name);
|
2007-07-04 10:48:13 +07:00
|
|
|
}
|
|
|
|
|
2011-06-23 05:30:55 +07:00
|
|
|
static struct nfs4_opendata *nfs4_opendata_alloc(struct dentry *dentry,
|
2008-12-24 03:21:56 +07:00
|
|
|
struct nfs4_state_owner *sp, fmode_t fmode, int flags,
|
2017-11-07 03:28:03 +07:00
|
|
|
const struct nfs4_open_createattrs *c,
|
2013-03-16 01:57:33 +07:00
|
|
|
enum open_claim_type4 claim,
|
2010-05-13 23:51:01 +07:00
|
|
|
gfp_t gfp_mask)
|
2006-01-03 15:55:08 +07:00
|
|
|
{
|
2011-06-23 05:30:55 +07:00
|
|
|
struct dentry *parent = dget_parent(dentry);
|
2015-03-18 05:25:59 +07:00
|
|
|
struct inode *dir = d_inode(parent);
|
2006-01-03 15:55:08 +07:00
|
|
|
struct nfs_server *server = NFS_SERVER(dir);
|
2015-01-24 07:19:25 +07:00
|
|
|
struct nfs_seqid *(*alloc_seqid)(struct nfs_seqid_counter *, gfp_t);
|
2017-11-07 03:28:03 +07:00
|
|
|
struct nfs4_label *label = (c != NULL) ? c->label : NULL;
|
2006-01-03 15:55:08 +07:00
|
|
|
struct nfs4_opendata *p;
|
|
|
|
|
2010-05-13 23:51:01 +07:00
|
|
|
p = kzalloc(sizeof(*p), gfp_mask);
|
2006-01-03 15:55:08 +07:00
|
|
|
if (p == NULL)
|
|
|
|
goto err;
|
2013-05-22 23:50:43 +07:00
|
|
|
|
|
|
|
p->f_label = nfs4_label_alloc(server, gfp_mask);
|
|
|
|
if (IS_ERR(p->f_label))
|
|
|
|
goto err_free_p;
|
|
|
|
|
2015-07-27 14:31:38 +07:00
|
|
|
p->a_label = nfs4_label_alloc(server, gfp_mask);
|
|
|
|
if (IS_ERR(p->a_label))
|
|
|
|
goto err_free_f;
|
|
|
|
|
2015-01-24 07:19:25 +07:00
|
|
|
alloc_seqid = server->nfs_client->cl_mvops->alloc_seqid;
|
|
|
|
p->o_arg.seqid = alloc_seqid(&sp->so_seqid, gfp_mask);
|
2015-01-24 06:48:00 +07:00
|
|
|
if (IS_ERR(p->o_arg.seqid))
|
2013-05-22 23:50:43 +07:00
|
|
|
goto err_free_label;
|
2011-06-23 05:30:55 +07:00
|
|
|
nfs_sb_active(dentry->d_sb);
|
|
|
|
p->dentry = dget(dentry);
|
2006-01-03 15:55:08 +07:00
|
|
|
p->dir = parent;
|
|
|
|
p->owner = sp;
|
|
|
|
atomic_inc(&sp->so_count);
|
2008-12-24 03:21:56 +07:00
|
|
|
p->o_arg.open_flags = flags;
|
|
|
|
p->o_arg.fmode = fmode & (FMODE_READ|FMODE_WRITE);
|
2016-12-03 10:53:30 +07:00
|
|
|
p->o_arg.umask = current_umask();
|
2016-11-11 03:40:34 +07:00
|
|
|
p->o_arg.claim = nfs4_map_atomic_open_claim(server, claim);
|
2015-01-31 02:21:14 +07:00
|
|
|
p->o_arg.share_access = nfs4_map_atomic_open_share(server,
|
|
|
|
fmode, flags);
|
2012-10-03 04:49:52 +07:00
|
|
|
/* don't put an ACCESS op in OPEN compound if O_EXCL, because ACCESS
|
|
|
|
* will return permission denied for all bits until close */
|
|
|
|
if (!(flags & O_EXCL)) {
|
|
|
|
/* ask server to check for all possible rights as results
|
|
|
|
* are cached */
|
2016-11-11 03:40:34 +07:00
|
|
|
switch (p->o_arg.claim) {
|
|
|
|
default:
|
|
|
|
break;
|
|
|
|
case NFS4_OPEN_CLAIM_NULL:
|
|
|
|
case NFS4_OPEN_CLAIM_FH:
|
|
|
|
p->o_arg.access = NFS4_ACCESS_READ |
|
|
|
|
NFS4_ACCESS_MODIFY |
|
|
|
|
NFS4_ACCESS_EXTEND |
|
|
|
|
NFS4_ACCESS_EXECUTE;
|
|
|
|
}
|
2012-10-03 04:49:52 +07:00
|
|
|
}
|
2006-08-23 07:06:09 +07:00
|
|
|
p->o_arg.clientid = server->nfs_client->cl_clientid;
|
2012-04-21 06:24:51 +07:00
|
|
|
p->o_arg.id.create_time = ktime_to_ns(sp->so_seqid.create_time);
|
|
|
|
p->o_arg.id.uniquifier = sp->so_seqid.owner_id;
|
2011-06-23 05:30:55 +07:00
|
|
|
p->o_arg.name = &dentry->d_name;
|
2006-01-03 15:55:08 +07:00
|
|
|
p->o_arg.server = server;
|
2013-05-22 23:50:44 +07:00
|
|
|
p->o_arg.bitmask = nfs4_bitmask(server, label);
|
2012-06-05 20:16:47 +07:00
|
|
|
p->o_arg.open_bitmap = &nfs4_fattr_bitmap[0];
|
2015-07-27 14:31:38 +07:00
|
|
|
p->o_arg.label = nfs4_label_copy(p->a_label, label);
|
2013-03-16 03:44:28 +07:00
|
|
|
switch (p->o_arg.claim) {
|
2013-03-16 01:57:33 +07:00
|
|
|
case NFS4_OPEN_CLAIM_NULL:
|
|
|
|
case NFS4_OPEN_CLAIM_DELEGATE_CUR:
|
|
|
|
case NFS4_OPEN_CLAIM_DELEGATE_PREV:
|
|
|
|
p->o_arg.fh = NFS_FH(dir);
|
|
|
|
break;
|
|
|
|
case NFS4_OPEN_CLAIM_PREVIOUS:
|
|
|
|
case NFS4_OPEN_CLAIM_FH:
|
|
|
|
case NFS4_OPEN_CLAIM_DELEG_CUR_FH:
|
|
|
|
case NFS4_OPEN_CLAIM_DELEG_PREV_FH:
|
2015-03-18 05:25:59 +07:00
|
|
|
p->o_arg.fh = NFS_FH(d_inode(dentry));
|
2013-03-16 01:57:33 +07:00
|
|
|
}
|
2017-11-07 03:28:03 +07:00
|
|
|
if (c != NULL && c->sattr != NULL && c->sattr->ia_valid != 0) {
|
2006-01-03 15:55:08 +07:00
|
|
|
p->o_arg.u.attrs = &p->attrs;
|
2017-11-07 03:28:03 +07:00
|
|
|
memcpy(&p->attrs, c->sattr, sizeof(p->attrs));
|
2012-03-03 05:14:31 +07:00
|
|
|
|
2017-11-07 03:28:03 +07:00
|
|
|
memcpy(p->o_arg.u.verifier.data, c->verf,
|
2012-03-03 05:14:31 +07:00
|
|
|
sizeof(p->o_arg.u.verifier.data));
|
2006-01-03 15:55:08 +07:00
|
|
|
}
|
2006-01-03 15:55:12 +07:00
|
|
|
p->c_arg.fh = &p->o_res.fh;
|
|
|
|
p->c_arg.stateid = &p->o_res.stateid;
|
|
|
|
p->c_arg.seqid = p->o_arg.seqid;
|
2007-07-04 10:48:13 +07:00
|
|
|
nfs4_init_opendata_res(p);
|
2007-06-18 03:02:44 +07:00
|
|
|
kref_init(&p->kref);
|
2006-01-03 15:55:08 +07:00
|
|
|
return p;
|
2013-05-22 23:50:43 +07:00
|
|
|
|
|
|
|
err_free_label:
|
2015-07-27 14:31:38 +07:00
|
|
|
nfs4_label_free(p->a_label);
|
|
|
|
err_free_f:
|
2013-05-22 23:50:43 +07:00
|
|
|
nfs4_label_free(p->f_label);
|
|
|
|
err_free_p:
|
2006-01-03 15:55:08 +07:00
|
|
|
kfree(p);
|
|
|
|
err:
|
|
|
|
dput(parent);
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
2007-06-18 03:02:44 +07:00
|
|
|
static void nfs4_opendata_free(struct kref *kref)
|
2006-01-03 15:55:08 +07:00
|
|
|
{
|
2007-06-18 03:02:44 +07:00
|
|
|
struct nfs4_opendata *p = container_of(kref,
|
|
|
|
struct nfs4_opendata, kref);
|
2011-06-23 05:30:55 +07:00
|
|
|
struct super_block *sb = p->dentry->d_sb;
|
2007-06-18 03:02:44 +07:00
|
|
|
|
2016-10-19 00:39:51 +07:00
|
|
|
nfs4_lgopen_release(p->lgp);
|
2007-06-18 03:02:44 +07:00
|
|
|
nfs_free_seqid(p->o_arg.seqid);
|
2016-08-28 22:50:26 +07:00
|
|
|
nfs4_sequence_free_slot(&p->o_res.seq_res);
|
2007-07-06 06:02:21 +07:00
|
|
|
if (p->state != NULL)
|
|
|
|
nfs4_put_open_state(p->state);
|
2007-06-18 03:02:44 +07:00
|
|
|
nfs4_put_state_owner(p->owner);
|
2013-05-22 23:50:43 +07:00
|
|
|
|
2015-07-27 14:31:38 +07:00
|
|
|
nfs4_label_free(p->a_label);
|
2013-05-22 23:50:43 +07:00
|
|
|
nfs4_label_free(p->f_label);
|
|
|
|
|
2007-06-18 03:02:44 +07:00
|
|
|
dput(p->dir);
|
2011-06-23 05:30:55 +07:00
|
|
|
dput(p->dentry);
|
|
|
|
nfs_sb_deactive(sb);
|
2012-01-08 01:22:46 +07:00
|
|
|
nfs_fattr_free_names(&p->f_attr);
|
2014-03-27 03:24:37 +07:00
|
|
|
kfree(p->f_attr.mdsthreshold);
|
2007-06-18 03:02:44 +07:00
|
|
|
kfree(p);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void nfs4_opendata_put(struct nfs4_opendata *p)
|
|
|
|
{
|
|
|
|
if (p != NULL)
|
|
|
|
kref_put(&p->kref, nfs4_opendata_free);
|
2006-01-03 15:55:08 +07:00
|
|
|
}
|
|
|
|
|
2015-09-20 21:50:17 +07:00
|
|
|
static bool nfs4_mode_match_open_stateid(struct nfs4_state *state,
|
|
|
|
fmode_t fmode)
|
|
|
|
{
|
|
|
|
switch(fmode & (FMODE_READ|FMODE_WRITE)) {
|
|
|
|
case FMODE_READ|FMODE_WRITE:
|
|
|
|
return state->n_rdwr != 0;
|
|
|
|
case FMODE_WRITE:
|
|
|
|
return state->n_wronly != 0;
|
|
|
|
case FMODE_READ:
|
|
|
|
return state->n_rdonly != 0;
|
|
|
|
}
|
|
|
|
WARN_ON_ONCE(1);
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2008-12-24 03:21:56 +07:00
|
|
|
/*
 * Decide whether an open for @mode can be satisfied from @state without
 * a new OPEN call.
 *
 * Returns 1 when the state flag for that mode is set and the matching
 * open count is non-zero; returns 0 otherwise, and always when
 * @open_mode contains O_EXCL or O_TRUNC.
 */
static int can_open_cached(struct nfs4_state *state, fmode_t mode, int open_mode)
{
	if (open_mode & (O_EXCL|O_TRUNC))
		return 0;

	switch (mode & (FMODE_READ|FMODE_WRITE)) {
	case FMODE_READ:
		return test_bit(NFS_O_RDONLY_STATE, &state->flags) &&
		       state->n_rdonly != 0;
	case FMODE_WRITE:
		return test_bit(NFS_O_WRONLY_STATE, &state->flags) &&
		       state->n_wronly != 0;
	case FMODE_READ|FMODE_WRITE:
		return test_bit(NFS_O_RDWR_STATE, &state->flags) &&
		       state->n_rdwr != 0;
	}
	return 0;
}
|
|
|
|
|
2015-08-20 10:30:00 +07:00
|
|
|
/*
 * Decide whether @delegation can be used to satisfy an open for @fmode
 * with claim type @claim.
 *
 * Returns 0 when there is no delegation, when its type does not cover
 * every bit of @fmode, when it is flagged NFS_DELEGATION_RETURNING, or
 * when the claim type does not permit it.  Otherwise marks the
 * delegation as referenced and returns 1.
 */
static int can_open_delegated(struct nfs_delegation *delegation, fmode_t fmode,
		enum open_claim_type4 claim)
{
	if (delegation == NULL ||
	    (delegation->type & fmode) != fmode ||
	    test_bit(NFS_DELEGATION_RETURNING, &delegation->flags))
		return 0;

	switch (claim) {
	case NFS4_OPEN_CLAIM_NULL:
	case NFS4_OPEN_CLAIM_FH:
		break;
	case NFS4_OPEN_CLAIM_PREVIOUS:
		/* Rejected while the delegation is flagged NEED_RECLAIM. */
		if (test_bit(NFS_DELEGATION_NEED_RECLAIM, &delegation->flags))
			return 0;
		break;
	default:
		return 0;
	}

	nfs_mark_delegation_referenced(delegation);
	return 1;
}
|
|
|
|
|
2008-12-24 03:21:56 +07:00
|
|
|
/*
 * Account for one more open of @state in mode @fmode: bump the counter
 * matching that exact mode, then fold @fmode into the state's mode via
 * nfs4_state_set_mode_locked().  A mode that is not exactly read, write
 * or read|write bumps no counter.
 */
static void update_open_stateflags(struct nfs4_state *state, fmode_t fmode)
{
	if (fmode == FMODE_WRITE)
		state->n_wronly++;
	else if (fmode == FMODE_READ)
		state->n_rdonly++;
	else if (fmode == (FMODE_READ|FMODE_WRITE))
		state->n_rdwr++;

	nfs4_state_set_mode_locked(state, state->state | fmode);
}
|
|
|
|
|
2016-09-23 00:39:21 +07:00
|
|
|
#ifdef CONFIG_NFS_V4_1
/*
 * Return true if @state has opens counted for some mode (read-only,
 * write-only or read-write) whose corresponding NFS_O_*_STATE flag is
 * not set.
 */
static bool nfs_open_stateid_recover_openmode(struct nfs4_state *state)
{
	return (state->n_rdonly &&
		!test_bit(NFS_O_RDONLY_STATE, &state->flags)) ||
	       (state->n_wronly &&
		!test_bit(NFS_O_WRONLY_STATE, &state->flags)) ||
	       (state->n_rdwr &&
		!test_bit(NFS_O_RDWR_STATE, &state->flags));
}
#endif /* CONFIG_NFS_V4_1 */
|
|
|
|
|
NFSv4: Fix OPEN / CLOSE race
Ben Coddington has noted the following race between OPEN and CLOSE
on a single client.
    Process 1               Process 2               Server
    =========               =========               ======
    1)  OPEN file
    2)                      OPEN file
    3)                                              Process OPEN (1) seqid=1
    4)                                              Process OPEN (2) seqid=2
    5)                                              Reply OPEN (2)
    6)                      Receive reply (2)
    7)                      new stateid, seqid=2
    8)                      CLOSE file, using
                            stateid w/ seqid=2
    9)                                              Reply OPEN (1)
    10)                                             Process CLOSE (8)
    11)                                             Reply CLOSE (8)
    12)                                             Forget stateid
                                                    file closed
    13)                     Receive reply (7)
    14)                     Forget stateid
                            file closed.
    15) Receive reply (1).
    16) New stateid seqid=1
        is really the same
        stateid that was
        closed.
IOW: the reply to the first OPEN is delayed. Since "Process 2" does
not wait before closing the file, and it does not cache the closed
stateid, then when the delayed reply is finally received, it is treated
as setting up a new stateid by the client.
The fix is to ensure that the client processes the OPEN and CLOSE calls
in the same order in which the server processed them.
This commit ensures that we examine the seqid of the stateid
returned by OPEN. If it is a new stateid, we assume the seqid
must be equal to the value 1, and that each state transition
increments the seqid value by 1 (See RFC7530, Section 9.1.4.2,
and RFC5661, Section 8.2.2).
If the tracker sees that an OPEN returns with a seqid that is greater
than the cached seqid + 1, then it bumps a flag to ensure that the
caller waits for the RPCs carrying the missing seqids to complete.
Note that there can still be pathologies where the server crashes before
it can even send us the missing seqids. Since the OPEN call is still
holding a slot when it waits here, that could cause the recovery to
stall forever. To avoid that, we time out after a 5 second wait.
Reported-by: Benjamin Coddington <bcodding@redhat.com>
Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2017-11-07 03:28:01 +07:00
|
|
|
static void nfs_state_log_update_open_stateid(struct nfs4_state *state)
|
|
|
|
{
|
|
|
|
if (test_and_clear_bit(NFS_STATE_CHANGE_WAIT, &state->flags))
|
|
|
|
wake_up_all(&state->waitq);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void nfs_state_log_out_of_order_open_stateid(struct nfs4_state *state,
|
|
|
|
const nfs4_stateid *stateid)
|
|
|
|
{
|
|
|
|
u32 state_seqid = be32_to_cpu(state->open_stateid.seqid);
|
|
|
|
u32 stateid_seqid = be32_to_cpu(stateid->seqid);
|
|
|
|
|
|
|
|
if (stateid_seqid == state_seqid + 1U ||
|
|
|
|
(stateid_seqid == 1U && state_seqid == 0xffffffffU))
|
|
|
|
nfs_state_log_update_open_stateid(state);
|
|
|
|
else
|
|
|
|
set_bit(NFS_STATE_CHANGE_WAIT, &state->flags);
|
|
|
|
}
|
|
|
|
|
2014-02-13 07:15:06 +07:00
|
|
|
static void nfs_test_and_clear_all_open_stateid(struct nfs4_state *state)
|
|
|
|
{
|
|
|
|
struct nfs_client *clp = state->owner->so_server->nfs_client;
|
|
|
|
bool need_recover = false;
|
|
|
|
|
|
|
|
if (test_and_clear_bit(NFS_O_RDONLY_STATE, &state->flags) && state->n_rdonly)
|
|
|
|
need_recover = true;
|
|
|
|
if (test_and_clear_bit(NFS_O_WRONLY_STATE, &state->flags) && state->n_wronly)
|
|
|
|
need_recover = true;
|
|
|
|
if (test_and_clear_bit(NFS_O_RDWR_STATE, &state->flags) && state->n_rdwr)
|
|
|
|
need_recover = true;
|
|
|
|
if (need_recover)
|
|
|
|
nfs4_state_mark_reclaim_nograce(clp, state);
|
|
|
|
}
|
|
|
|
|
NFSv4: Fix OPEN / CLOSE race
Ben Coddington has noted the following race between OPEN and CLOSE
on a single client.
    Process 1               Process 2               Server
    =========               =========               ======
    1)  OPEN file
    2)                      OPEN file
    3)                                              Process OPEN (1) seqid=1
    4)                                              Process OPEN (2) seqid=2
    5)                                              Reply OPEN (2)
    6)                      Receive reply (2)
    7)                      new stateid, seqid=2
    8)                      CLOSE file, using
                            stateid w/ seqid=2
    9)                                              Reply OPEN (1)
    10)                                             Process CLOSE (8)
    11)                                             Reply CLOSE (8)
    12)                                             Forget stateid
                                                    file closed
    13)                     Receive reply (7)
    14)                     Forget stateid
                            file closed.
    15) Receive reply (1).
    16) New stateid seqid=1
        is really the same
        stateid that was
        closed.
IOW: the reply to the first OPEN is delayed. Since "Process 2" does
not wait before closing the file, and it does not cache the closed
stateid, then when the delayed reply is finally received, it is treated
as setting up a new stateid by the client.
The fix is to ensure that the client processes the OPEN and CLOSE calls
in the same order in which the server processed them.
This commit ensures that we examine the seqid of the stateid
returned by OPEN. If it is a new stateid, we assume the seqid
must be equal to the value 1, and that each state transition
increments the seqid value by 1 (See RFC7530, Section 9.1.4.2,
and RFC5661, Section 8.2.2).
If the tracker sees that an OPEN returns with a seqid that is greater
than the cached seqid + 1, then it bumps a flag to ensure that the
caller waits for the RPCs carrying the missing seqids to complete.
Note that there can still be pathologies where the server crashes before
it can even send us the missing seqids. Since the OPEN call is still
holding a slot when it waits here, that could cause the recovery to
stall forever. To avoid that, we time out after a 5 second wait.
Reported-by: Benjamin Coddington <bcodding@redhat.com>
Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2017-11-07 03:28:01 +07:00
|
|
|
/*
|
|
|
|
* Check for whether or not the caller may update the open stateid
|
|
|
|
* to the value passed in by stateid.
|
|
|
|
*
|
|
|
|
* Note: This function relies heavily on the server implementing
|
|
|
|
* RFC7530 Section 9.1.4.2, and RFC5661 Section 8.2.2
|
|
|
|
* correctly.
|
|
|
|
* i.e. The stateid seqids have to be initialised to 1, and
|
|
|
|
* are then incremented on every state transition.
|
|
|
|
*/
|
2014-02-11 06:20:47 +07:00
|
|
|
static bool nfs_need_update_open_stateid(struct nfs4_state *state,
|
NFSv4: Fix OPEN / CLOSE race
Ben Coddington has noted the following race between OPEN and CLOSE
on a single client.
Process 1 Process 2 Server
========= ========= ======
1) OPEN file
2) OPEN file
3) Process OPEN (1) seqid=1
4) Process OPEN (2) seqid=2
5) Reply OPEN (2)
6) Receive reply (2)
7) new stateid, seqid=2
8) CLOSE file, using
stateid w/ seqid=2
9) Reply OPEN (1)
10( Process CLOSE (8)
11) Reply CLOSE (8)
12) Forget stateid
file closed
13) Receive reply (7)
14) Forget stateid
file closed.
15) Receive reply (1).
16) New stateid seqid=1
is really the same
stateid that was
closed.
IOW: the reply to the first OPEN is delayed. Since "Process 2" does
not wait before closing the file, and it does not cache the closed
stateid, then when the delayed reply is finally received, it is treated
as setting up a new stateid by the client.
The fix is to ensure that the client processes the OPEN and CLOSE calls
in the same order in which the server processed them.
This commit ensures that we examine the seqid of the stateid
returned by OPEN. If it is a new stateid, we assume the seqid
must be equal to the value 1, and that each state transition
increments the seqid value by 1 (See RFC7530, Section 9.1.4.2,
and RFC5661, Section 8.2.2).
If the tracker sees that an OPEN returns with a seqid that is greater
than the cached seqid + 1, then it bumps a flag to ensure that the
caller waits for the RPCs carrying the missing seqids to complete.
Note that there can still be pathologies where the server crashes before
it can even send us the missing seqids. Since the OPEN call is still
holding a slot when it waits here, that could cause the recovery to
stall forever. To avoid that, we time out after a 5 second wait.
Reported-by: Benjamin Coddington <bcodding@redhat.com>
Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2017-11-07 03:28:01 +07:00
|
|
|
const nfs4_stateid *stateid)
|
2014-02-11 06:20:47 +07:00
|
|
|
{
|
NFSv4: Fix OPEN / CLOSE race
Ben Coddington has noted the following race between OPEN and CLOSE
on a single client.
Process 1 Process 2 Server
========= ========= ======
1) OPEN file
2) OPEN file
3) Process OPEN (1) seqid=1
4) Process OPEN (2) seqid=2
5) Reply OPEN (2)
6) Receive reply (2)
7) new stateid, seqid=2
8) CLOSE file, using
stateid w/ seqid=2
9) Reply OPEN (1)
10( Process CLOSE (8)
11) Reply CLOSE (8)
12) Forget stateid
file closed
13) Receive reply (7)
14) Forget stateid
file closed.
15) Receive reply (1).
16) New stateid seqid=1
is really the same
stateid that was
closed.
IOW: the reply to the first OPEN is delayed. Since "Process 2" does
not wait before closing the file, and it does not cache the closed
stateid, then when the delayed reply is finally received, it is treated
as setting up a new stateid by the client.
The fix is to ensure that the client processes the OPEN and CLOSE calls
in the same order in which the server processed them.
This commit ensures that we examine the seqid of the stateid
returned by OPEN. If it is a new stateid, we assume the seqid
must be equal to the value 1, and that each state transition
increments the seqid value by 1 (See RFC7530, Section 9.1.4.2,
and RFC5661, Section 8.2.2).
If the tracker sees that an OPEN returns with a seqid that is greater
than the cached seqid + 1, then it bumps a flag to ensure that the
caller waits for the RPCs carrying the missing seqids to complete.
Note that there can still be pathologies where the server crashes before
it can even send us the missing seqids. Since the OPEN call is still
holding a slot when it waits here, that could cause the recovery to
stall forever. To avoid that, we time out after a 5 second wait.
Reported-by: Benjamin Coddington <bcodding@redhat.com>
Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2017-11-07 03:28:01 +07:00
|
|
|
if (test_bit(NFS_OPEN_STATE, &state->flags) == 0 ||
|
|
|
|
!nfs4_stateid_match_other(stateid, &state->open_stateid)) {
|
|
|
|
if (stateid->seqid == cpu_to_be32(1))
|
|
|
|
nfs_state_log_update_open_stateid(state);
|
|
|
|
else
|
|
|
|
set_bit(NFS_STATE_CHANGE_WAIT, &state->flags);
|
2014-02-11 06:20:47 +07:00
|
|
|
return true;
|
2014-02-13 07:15:06 +07:00
|
|
|
}
|
NFSv4: Fix OPEN / CLOSE race
Ben Coddington has noted the following race between OPEN and CLOSE
on a single client.
Process 1 Process 2 Server
========= ========= ======
1) OPEN file
2) OPEN file
3) Process OPEN (1) seqid=1
4) Process OPEN (2) seqid=2
5) Reply OPEN (2)
6) Receive reply (2)
7) new stateid, seqid=2
8) CLOSE file, using
stateid w/ seqid=2
9) Reply OPEN (1)
10( Process CLOSE (8)
11) Reply CLOSE (8)
12) Forget stateid
file closed
13) Receive reply (7)
14) Forget stateid
file closed.
15) Receive reply (1).
16) New stateid seqid=1
is really the same
stateid that was
closed.
IOW: the reply to the first OPEN is delayed. Since "Process 2" does
not wait before closing the file, and it does not cache the closed
stateid, then when the delayed reply is finally received, it is treated
as setting up a new stateid by the client.
The fix is to ensure that the client processes the OPEN and CLOSE calls
in the same order in which the server processed them.
This commit ensures that we examine the seqid of the stateid
returned by OPEN. If it is a new stateid, we assume the seqid
must be equal to the value 1, and that each state transition
increments the seqid value by 1 (See RFC7530, Section 9.1.4.2,
and RFC5661, Section 8.2.2).
If the tracker sees that an OPEN returns with a seqid that is greater
than the cached seqid + 1, then it bumps a flag to ensure that the
caller waits for the RPCs carrying the missing seqids to complete.
Note that there can still be pathologies where the server crashes before
it can even send us the missing seqids. Since the OPEN call is still
holding a slot when it waits here, that could cause the recovery to
stall forever. To avoid that, we time out after a 5 second wait.
Reported-by: Benjamin Coddington <bcodding@redhat.com>
Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2017-11-07 03:28:01 +07:00
|
|
|
|
|
|
|
if (nfs4_stateid_is_newer(stateid, &state->open_stateid)) {
|
|
|
|
nfs_state_log_out_of_order_open_stateid(state, stateid);
|
2014-02-11 06:20:47 +07:00
|
|
|
return true;
|
NFSv4: Fix OPEN / CLOSE race
Ben Coddington has noted the following race between OPEN and CLOSE
on a single client.
Process 1 Process 2 Server
========= ========= ======
1) OPEN file
2) OPEN file
3) Process OPEN (1) seqid=1
4) Process OPEN (2) seqid=2
5) Reply OPEN (2)
6) Receive reply (2)
7) new stateid, seqid=2
8) CLOSE file, using
stateid w/ seqid=2
9) Reply OPEN (1)
10( Process CLOSE (8)
11) Reply CLOSE (8)
12) Forget stateid
file closed
13) Receive reply (7)
14) Forget stateid
file closed.
15) Receive reply (1).
16) New stateid seqid=1
is really the same
stateid that was
closed.
IOW: the reply to the first OPEN is delayed. Since "Process 2" does
not wait before closing the file, and it does not cache the closed
stateid, then when the delayed reply is finally received, it is treated
as setting up a new stateid by the client.
The fix is to ensure that the client processes the OPEN and CLOSE calls
in the same order in which the server processed them.
This commit ensures that we examine the seqid of the stateid
returned by OPEN. If it is a new stateid, we assume the seqid
must be equal to the value 1, and that each state transition
increments the seqid value by 1 (See RFC7530, Section 9.1.4.2,
and RFC5661, Section 8.2.2).
If the tracker sees that an OPEN returns with a seqid that is greater
than the cached seqid + 1, then it bumps a flag to ensure that the
caller waits for the RPCs carrying the missing seqids to complete.
Note that there can still be pathologies where the server crashes before
it can even send us the missing seqids. Since the OPEN call is still
holding a slot when it waits here, that could cause the recovery to
stall forever. To avoid that, we time out after a 5 second wait.
Reported-by: Benjamin Coddington <bcodding@redhat.com>
Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2017-11-07 03:28:01 +07:00
|
|
|
}
|
2014-02-11 06:20:47 +07:00
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2015-01-24 06:06:09 +07:00
|
|
|
static void nfs_resync_open_stateid_locked(struct nfs4_state *state)
|
|
|
|
{
|
2015-07-23 00:46:13 +07:00
|
|
|
if (!(state->n_wronly || state->n_rdonly || state->n_rdwr))
|
|
|
|
return;
|
2015-01-24 06:06:09 +07:00
|
|
|
if (state->n_wronly)
|
|
|
|
set_bit(NFS_O_WRONLY_STATE, &state->flags);
|
|
|
|
if (state->n_rdonly)
|
|
|
|
set_bit(NFS_O_RDONLY_STATE, &state->flags);
|
|
|
|
if (state->n_rdwr)
|
|
|
|
set_bit(NFS_O_RDWR_STATE, &state->flags);
|
2015-07-23 00:46:13 +07:00
|
|
|
set_bit(NFS_OPEN_STATE, &state->flags);
|
2015-01-24 06:06:09 +07:00
|
|
|
}
|
|
|
|
|
2014-02-11 22:41:07 +07:00
|
|
|
static void nfs_clear_open_stateid_locked(struct nfs4_state *state,
|
|
|
|
nfs4_stateid *stateid, fmode_t fmode)
|
2007-07-06 05:07:55 +07:00
|
|
|
{
|
2014-02-11 22:41:07 +07:00
|
|
|
clear_bit(NFS_O_RDWR_STATE, &state->flags);
|
|
|
|
switch (fmode & (FMODE_READ|FMODE_WRITE)) {
|
|
|
|
case FMODE_WRITE:
|
|
|
|
clear_bit(NFS_O_RDONLY_STATE, &state->flags);
|
|
|
|
break;
|
|
|
|
case FMODE_READ:
|
|
|
|
clear_bit(NFS_O_WRONLY_STATE, &state->flags);
|
|
|
|
break;
|
|
|
|
case 0:
|
|
|
|
clear_bit(NFS_O_RDONLY_STATE, &state->flags);
|
|
|
|
clear_bit(NFS_O_WRONLY_STATE, &state->flags);
|
|
|
|
clear_bit(NFS_OPEN_STATE, &state->flags);
|
|
|
|
}
|
|
|
|
if (stateid == NULL)
|
|
|
|
return;
|
2016-11-14 23:19:55 +07:00
|
|
|
/* Handle OPEN+OPEN_DOWNGRADE races */
|
|
|
|
if (nfs4_stateid_match_other(stateid, &state->open_stateid) &&
|
|
|
|
!nfs4_stateid_is_newer(stateid, &state->open_stateid)) {
|
2015-01-24 06:06:09 +07:00
|
|
|
nfs_resync_open_stateid_locked(state);
|
NFSv4: Fix OPEN / CLOSE race
Ben Coddington has noted the following race between OPEN and CLOSE
on a single client.
Process 1 Process 2 Server
========= ========= ======
1) OPEN file
2) OPEN file
3) Process OPEN (1) seqid=1
4) Process OPEN (2) seqid=2
5) Reply OPEN (2)
6) Receive reply (2)
7) new stateid, seqid=2
8) CLOSE file, using
stateid w/ seqid=2
9) Reply OPEN (1)
10( Process CLOSE (8)
11) Reply CLOSE (8)
12) Forget stateid
file closed
13) Receive reply (7)
14) Forget stateid
file closed.
15) Receive reply (1).
16) New stateid seqid=1
is really the same
stateid that was
closed.
IOW: the reply to the first OPEN is delayed. Since "Process 2" does
not wait before closing the file, and it does not cache the closed
stateid, then when the delayed reply is finally received, it is treated
as setting up a new stateid by the client.
The fix is to ensure that the client processes the OPEN and CLOSE calls
in the same order in which the server processed them.
This commit ensures that we examine the seqid of the stateid
returned by OPEN. If it is a new stateid, we assume the seqid
must be equal to the value 1, and that each state transition
increments the seqid value by 1 (See RFC7530, Section 9.1.4.2,
and RFC5661, Section 8.2.2).
If the tracker sees that an OPEN returns with a seqid that is greater
than the cached seqid + 1, then it bumps a flag to ensure that the
caller waits for the RPCs carrying the missing seqids to complete.
Note that there can still be pathologies where the server crashes before
it can even send us the missing seqids. Since the OPEN call is still
holding a slot when it waits here, that could cause the recovery to
stall forever. To avoid that, we time out after a 5 second wait.
Reported-by: Benjamin Coddington <bcodding@redhat.com>
Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2017-11-07 03:28:01 +07:00
|
|
|
goto out;
|
2015-01-24 06:06:09 +07:00
|
|
|
}
|
2007-07-06 05:07:55 +07:00
|
|
|
if (test_bit(NFS_DELEGATED_STATE, &state->flags) == 0)
|
2012-03-05 06:13:56 +07:00
|
|
|
nfs4_stateid_copy(&state->stateid, stateid);
|
|
|
|
nfs4_stateid_copy(&state->open_stateid, stateid);
|
2017-11-07 03:28:02 +07:00
|
|
|
trace_nfs4_open_stateid_update(state->inode, stateid, 0);
|
NFSv4: Fix OPEN / CLOSE race
Ben Coddington has noted the following race between OPEN and CLOSE
on a single client.
Process 1 Process 2 Server
========= ========= ======
1) OPEN file
2) OPEN file
3) Process OPEN (1) seqid=1
4) Process OPEN (2) seqid=2
5) Reply OPEN (2)
6) Receive reply (2)
7) new stateid, seqid=2
8) CLOSE file, using
stateid w/ seqid=2
9) Reply OPEN (1)
10( Process CLOSE (8)
11) Reply CLOSE (8)
12) Forget stateid
file closed
13) Receive reply (7)
14) Forget stateid
file closed.
15) Receive reply (1).
16) New stateid seqid=1
is really the same
stateid that was
closed.
IOW: the reply to the first OPEN is delayed. Since "Process 2" does
not wait before closing the file, and it does not cache the closed
stateid, then when the delayed reply is finally received, it is treated
as setting up a new stateid by the client.
The fix is to ensure that the client processes the OPEN and CLOSE calls
in the same order in which the server processed them.
This commit ensures that we examine the seqid of the stateid
returned by OPEN. If it is a new stateid, we assume the seqid
must be equal to the value 1, and that each state transition
increments the seqid value by 1 (See RFC7530, Section 9.1.4.2,
and RFC5661, Section 8.2.2).
If the tracker sees that an OPEN returns with a seqid that is greater
than the cached seqid + 1, then it bumps a flag to ensure that the
caller waits for the RPCs carrying the missing seqids to complete.
Note that there can still be pathologies where the server crashes before
it can even send us the missing seqids. Since the OPEN call is still
holding a slot when it waits here, that could cause the recovery to
stall forever. To avoid that, we time out after a 5 second wait.
Reported-by: Benjamin Coddington <bcodding@redhat.com>
Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2017-11-07 03:28:01 +07:00
|
|
|
out:
|
|
|
|
nfs_state_log_update_open_stateid(state);
|
2014-02-11 22:41:07 +07:00
|
|
|
}
|
|
|
|
|
2015-08-31 08:37:59 +07:00
|
|
|
static void nfs_clear_open_stateid(struct nfs4_state *state,
|
|
|
|
nfs4_stateid *arg_stateid,
|
|
|
|
nfs4_stateid *stateid, fmode_t fmode)
|
2014-02-11 22:41:07 +07:00
|
|
|
{
|
|
|
|
write_seqlock(&state->seqlock);
|
2016-11-14 23:19:55 +07:00
|
|
|
/* Ignore, if the CLOSE argment doesn't match the current stateid */
|
|
|
|
if (nfs4_state_match_open_stateid_other(state, arg_stateid))
|
|
|
|
nfs_clear_open_stateid_locked(state, stateid, fmode);
|
2014-02-11 22:41:07 +07:00
|
|
|
write_sequnlock(&state->seqlock);
|
2014-02-13 07:15:06 +07:00
|
|
|
if (test_bit(NFS_STATE_RECLAIM_NOGRACE, &state->flags))
|
|
|
|
nfs4_schedule_state_manager(state->owner->so_server->nfs_client);
|
2014-02-11 22:41:07 +07:00
|
|
|
}
|
|
|
|
|
2016-09-23 00:39:13 +07:00
|
|
|
static void nfs_set_open_stateid_locked(struct nfs4_state *state,
|
NFSv4: Fix OPEN / CLOSE race
Ben Coddington has noted the following race between OPEN and CLOSE
on a single client.
Process 1 Process 2 Server
========= ========= ======
1) OPEN file
2) OPEN file
3) Process OPEN (1) seqid=1
4) Process OPEN (2) seqid=2
5) Reply OPEN (2)
6) Receive reply (2)
7) new stateid, seqid=2
8) CLOSE file, using
stateid w/ seqid=2
9) Reply OPEN (1)
10( Process CLOSE (8)
11) Reply CLOSE (8)
12) Forget stateid
file closed
13) Receive reply (7)
14) Forget stateid
file closed.
15) Receive reply (1).
16) New stateid seqid=1
is really the same
stateid that was
closed.
IOW: the reply to the first OPEN is delayed. Since "Process 2" does
not wait before closing the file, and it does not cache the closed
stateid, then when the delayed reply is finally received, it is treated
as setting up a new stateid by the client.
The fix is to ensure that the client processes the OPEN and CLOSE calls
in the same order in which the server processed them.
This commit ensures that we examine the seqid of the stateid
returned by OPEN. If it is a new stateid, we assume the seqid
must be equal to the value 1, and that each state transition
increments the seqid value by 1 (See RFC7530, Section 9.1.4.2,
and RFC5661, Section 8.2.2).
If the tracker sees that an OPEN returns with a seqid that is greater
than the cached seqid + 1, then it bumps a flag to ensure that the
caller waits for the RPCs carrying the missing seqids to complete.
Note that there can still be pathologies where the server crashes before
it can even send us the missing seqids. Since the OPEN call is still
holding a slot when it waits here, that could cause the recovery to
stall forever. To avoid that, we time out after a 5 second wait.
Reported-by: Benjamin Coddington <bcodding@redhat.com>
Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2017-11-07 03:28:01 +07:00
|
|
|
const nfs4_stateid *stateid, nfs4_stateid *freeme)
|
2007-07-06 05:07:55 +07:00
|
|
|
{
|
NFSv4: Fix OPEN / CLOSE race
Ben Coddington has noted the following race between OPEN and CLOSE
on a single client.
Process 1 Process 2 Server
========= ========= ======
1) OPEN file
2) OPEN file
3) Process OPEN (1) seqid=1
4) Process OPEN (2) seqid=2
5) Reply OPEN (2)
6) Receive reply (2)
7) new stateid, seqid=2
8) CLOSE file, using
stateid w/ seqid=2
9) Reply OPEN (1)
10( Process CLOSE (8)
11) Reply CLOSE (8)
12) Forget stateid
file closed
13) Receive reply (7)
14) Forget stateid
file closed.
15) Receive reply (1).
16) New stateid seqid=1
is really the same
stateid that was
closed.
IOW: the reply to the first OPEN is delayed. Since "Process 2" does
not wait before closing the file, and it does not cache the closed
stateid, then when the delayed reply is finally received, it is treated
as setting up a new stateid by the client.
The fix is to ensure that the client processes the OPEN and CLOSE calls
in the same order in which the server processed them.
This commit ensures that we examine the seqid of the stateid
returned by OPEN. If it is a new stateid, we assume the seqid
must be equal to the value 1, and that each state transition
increments the seqid value by 1 (See RFC7530, Section 9.1.4.2,
and RFC5661, Section 8.2.2).
If the tracker sees that an OPEN returns with a seqid that is greater
than the cached seqid + 1, then it bumps a flag to ensure that the
caller waits for the RPCs carrying the missing seqids to complete.
Note that there can still be pathologies where the server crashes before
it can even send us the missing seqids. Since the OPEN call is still
holding a slot when it waits here, that could cause the recovery to
stall forever. To avoid that, we time out after a 5 second wait.
Reported-by: Benjamin Coddington <bcodding@redhat.com>
Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2017-11-07 03:28:01 +07:00
|
|
|
DEFINE_WAIT(wait);
|
|
|
|
int status = 0;
|
|
|
|
for (;;) {
|
|
|
|
|
|
|
|
if (!nfs_need_update_open_stateid(state, stateid))
|
|
|
|
return;
|
|
|
|
if (!test_bit(NFS_STATE_CHANGE_WAIT, &state->flags))
|
2007-07-06 05:07:55 +07:00
|
|
|
break;
|
NFSv4: Fix OPEN / CLOSE race
Ben Coddington has noted the following race between OPEN and CLOSE
on a single client.
Process 1 Process 2 Server
========= ========= ======
1) OPEN file
2) OPEN file
3) Process OPEN (1) seqid=1
4) Process OPEN (2) seqid=2
5) Reply OPEN (2)
6) Receive reply (2)
7) new stateid, seqid=2
8) CLOSE file, using
stateid w/ seqid=2
9) Reply OPEN (1)
10( Process CLOSE (8)
11) Reply CLOSE (8)
12) Forget stateid
file closed
13) Receive reply (7)
14) Forget stateid
file closed.
15) Receive reply (1).
16) New stateid seqid=1
is really the same
stateid that was
closed.
IOW: the reply to the first OPEN is delayed. Since "Process 2" does
not wait before closing the file, and it does not cache the closed
stateid, then when the delayed reply is finally received, it is treated
as setting up a new stateid by the client.
The fix is to ensure that the client processes the OPEN and CLOSE calls
in the same order in which the server processed them.
This commit ensures that we examine the seqid of the stateid
returned by OPEN. If it is a new stateid, we assume the seqid
must be equal to the value 1, and that each state transition
increments the seqid value by 1 (See RFC7530, Section 9.1.4.2,
and RFC5661, Section 8.2.2).
If the tracker sees that an OPEN returns with a seqid that is greater
than the cached seqid + 1, then it bumps a flag to ensure that the
caller waits for the RPCs carrying the missing seqids to complete.
Note that there can still be pathologies where the server crashes before
it can even send us the missing seqids. Since the OPEN call is still
holding a slot when it waits here, that could cause the recovery to
stall forever. To avoid that, we time out after a 5 second wait.
Reported-by: Benjamin Coddington <bcodding@redhat.com>
Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2017-11-07 03:28:01 +07:00
|
|
|
if (status)
|
2007-07-06 05:07:55 +07:00
|
|
|
break;
|
NFSv4: Fix OPEN / CLOSE race
Ben Coddington has noted the following race between OPEN and CLOSE
on a single client.
Process 1 Process 2 Server
========= ========= ======
1) OPEN file
2) OPEN file
3) Process OPEN (1) seqid=1
4) Process OPEN (2) seqid=2
5) Reply OPEN (2)
6) Receive reply (2)
7) new stateid, seqid=2
8) CLOSE file, using
stateid w/ seqid=2
9) Reply OPEN (1)
10( Process CLOSE (8)
11) Reply CLOSE (8)
12) Forget stateid
file closed
13) Receive reply (7)
14) Forget stateid
file closed.
15) Receive reply (1).
16) New stateid seqid=1
is really the same
stateid that was
closed.
IOW: the reply to the first OPEN is delayed. Since "Process 2" does
not wait before closing the file, and it does not cache the closed
stateid, then when the delayed reply is finally received, it is treated
as setting up a new stateid by the client.
The fix is to ensure that the client processes the OPEN and CLOSE calls
in the same order in which the server processed them.
This commit ensures that we examine the seqid of the stateid
returned by OPEN. If it is a new stateid, we assume the seqid
must be equal to the value 1, and that each state transition
increments the seqid value by 1 (See RFC7530, Section 9.1.4.2,
and RFC5661, Section 8.2.2).
If the tracker sees that an OPEN returns with a seqid that is greater
than the cached seqid + 1, then it bumps a flag to ensure that the
caller waits for the RPCs carrying the missing seqids to complete.
Note that there can still be pathologies where the server crashes before
it can even send us the missing seqids. Since the OPEN call is still
holding a slot when it waits here, that could cause the recovery to
stall forever. To avoid that, we time out after a 5 second wait.
Reported-by: Benjamin Coddington <bcodding@redhat.com>
Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2017-11-07 03:28:01 +07:00
|
|
|
/* Rely on seqids for serialisation with NFSv4.0 */
|
|
|
|
if (!nfs4_has_session(NFS_SERVER(state->inode)->nfs_client))
|
|
|
|
break;
|
|
|
|
|
|
|
|
prepare_to_wait(&state->waitq, &wait, TASK_KILLABLE);
|
|
|
|
/*
|
|
|
|
* Ensure we process the state changes in the same order
|
|
|
|
* in which the server processed them by delaying the
|
|
|
|
* update of the stateid until we are in sequence.
|
|
|
|
*/
|
|
|
|
write_sequnlock(&state->seqlock);
|
|
|
|
spin_unlock(&state->owner->so_lock);
|
|
|
|
rcu_read_unlock();
|
2017-11-07 03:28:02 +07:00
|
|
|
trace_nfs4_open_stateid_update_wait(state->inode, stateid, 0);
|
NFSv4: Fix OPEN / CLOSE race
Ben Coddington has noted the following race between OPEN and CLOSE
on a single client.
Process 1 Process 2 Server
========= ========= ======
1) OPEN file
2) OPEN file
3) Process OPEN (1) seqid=1
4) Process OPEN (2) seqid=2
5) Reply OPEN (2)
6) Receive reply (2)
7) new stateid, seqid=2
8) CLOSE file, using
stateid w/ seqid=2
9) Reply OPEN (1)
10( Process CLOSE (8)
11) Reply CLOSE (8)
12) Forget stateid
file closed
13) Receive reply (7)
14) Forget stateid
file closed.
15) Receive reply (1).
16) New stateid seqid=1
is really the same
stateid that was
closed.
IOW: the reply to the first OPEN is delayed. Since "Process 2" does
not wait before closing the file, and it does not cache the closed
stateid, then when the delayed reply is finally received, it is treated
as setting up a new stateid by the client.
The fix is to ensure that the client processes the OPEN and CLOSE calls
in the same order in which the server processed them.
This commit ensures that we examine the seqid of the stateid
returned by OPEN. If it is a new stateid, we assume the seqid
must be equal to the value 1, and that each state transition
increments the seqid value by 1 (See RFC7530, Section 9.1.4.2,
and RFC5661, Section 8.2.2).
If the tracker sees that an OPEN returns with a seqid that is greater
than the cached seqid + 1, then it bumps a flag to ensure that the
caller waits for the RPCs carrying the missing seqids to complete.
Note that there can still be pathologies where the server crashes before
it can even send us the missing seqids. Since the OPEN call is still
holding a slot when it waits here, that could cause the recovery to
stall forever. To avoid that, we time out after a 5 second wait.
Reported-by: Benjamin Coddington <bcodding@redhat.com>
Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2017-11-07 03:28:01 +07:00
|
|
|
if (!signal_pending(current)) {
|
|
|
|
if (schedule_timeout(5*HZ) == 0)
|
|
|
|
status = -EAGAIN;
|
|
|
|
else
|
|
|
|
status = 0;
|
|
|
|
} else
|
|
|
|
status = -EINTR;
|
|
|
|
finish_wait(&state->waitq, &wait);
|
|
|
|
rcu_read_lock();
|
|
|
|
spin_lock(&state->owner->so_lock);
|
|
|
|
write_seqlock(&state->seqlock);
|
2007-07-06 05:07:55 +07:00
|
|
|
}
|
NFSv4: Fix OPEN / CLOSE race
Ben Coddington has noted the following race between OPEN and CLOSE
on a single client.
Process 1 Process 2 Server
========= ========= ======
1) OPEN file
2) OPEN file
3) Process OPEN (1) seqid=1
4) Process OPEN (2) seqid=2
5) Reply OPEN (2)
6) Receive reply (2)
7) new stateid, seqid=2
8) CLOSE file, using
stateid w/ seqid=2
9) Reply OPEN (1)
10( Process CLOSE (8)
11) Reply CLOSE (8)
12) Forget stateid
file closed
13) Receive reply (7)
14) Forget stateid
file closed.
15) Receive reply (1).
16) New stateid seqid=1
is really the same
stateid that was
closed.
IOW: the reply to the first OPEN is delayed. Since "Process 2" does
not wait before closing the file, and it does not cache the closed
stateid, then when the delayed reply is finally received, it is treated
as setting up a new stateid by the client.
The fix is to ensure that the client processes the OPEN and CLOSE calls
in the same order in which the server processed them.
This commit ensures that we examine the seqid of the stateid
returned by OPEN. If it is a new stateid, we assume the seqid
must be equal to the value 1, and that each state transition
increments the seqid value by 1 (See RFC7530, Section 9.1.4.2,
and RFC5661, Section 8.2.2).
If the tracker sees that an OPEN returns with a seqid that is greater
than the cached seqid + 1, then it bumps a flag to ensure that the
caller waits for the RPCs carrying the missing seqids to complete.
Note that there can still be pathologies where the server crashes before
it can even send us the missing seqids. Since the OPEN call is still
holding a slot when it waits here, that could cause the recovery to
stall forever. To avoid that, we time out after a 5 second wait.
Reported-by: Benjamin Coddington <bcodding@redhat.com>
Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2017-11-07 03:28:01 +07:00
|
|
|
|
2017-11-08 01:10:46 +07:00
|
|
|
if (test_bit(NFS_OPEN_STATE, &state->flags) &&
|
|
|
|
!nfs4_stateid_match_other(stateid, &state->open_stateid)) {
|
NFSv4: Fix OPEN / CLOSE race
Ben Coddington has noted the following race between OPEN and CLOSE
on a single client.
Process 1 Process 2 Server
========= ========= ======
1) OPEN file
2) OPEN file
3) Process OPEN (1) seqid=1
4) Process OPEN (2) seqid=2
5) Reply OPEN (2)
6) Receive reply (2)
7) new stateid, seqid=2
8) CLOSE file, using
stateid w/ seqid=2
9) Reply OPEN (1)
10( Process CLOSE (8)
11) Reply CLOSE (8)
12) Forget stateid
file closed
13) Receive reply (7)
14) Forget stateid
file closed.
15) Receive reply (1).
16) New stateid seqid=1
is really the same
stateid that was
closed.
IOW: the reply to the first OPEN is delayed. Since "Process 2" does
not wait before closing the file, and it does not cache the closed
stateid, then when the delayed reply is finally received, it is treated
as setting up a new stateid by the client.
The fix is to ensure that the client processes the OPEN and CLOSE calls
in the same order in which the server processed them.
This commit ensures that we examine the seqid of the stateid
returned by OPEN. If it is a new stateid, we assume the seqid
must be equal to the value 1, and that each state transition
increments the seqid value by 1 (See RFC7530, Section 9.1.4.2,
and RFC5661, Section 8.2.2).
If the tracker sees that an OPEN returns with a seqid that is greater
than the cached seqid + 1, then it bumps a flag to ensure that the
caller waits for the RPCs carrying the missing seqids to complete.
Note that there can still be pathologies where the server crashes before
it can even send us the missing seqids. Since the OPEN call is still
holding a slot when it waits here, that could cause the recovery to
stall forever. To avoid that, we time out after a 5 second wait.
Reported-by: Benjamin Coddington <bcodding@redhat.com>
Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2017-11-07 03:28:01 +07:00
|
|
|
nfs4_stateid_copy(freeme, &state->open_stateid);
|
|
|
|
nfs_test_and_clear_all_open_stateid(state);
|
|
|
|
}
|
|
|
|
|
2014-02-11 06:20:47 +07:00
|
|
|
if (test_bit(NFS_DELEGATED_STATE, &state->flags) == 0)
|
|
|
|
nfs4_stateid_copy(&state->stateid, stateid);
|
|
|
|
nfs4_stateid_copy(&state->open_stateid, stateid);
|
2017-11-07 03:28:02 +07:00
|
|
|
trace_nfs4_open_stateid_update(state->inode, stateid, status);
|
NFSv4: Fix OPEN / CLOSE race
Ben Coddington has noted the following race between OPEN and CLOSE
on a single client.
Process 1 Process 2 Server
========= ========= ======
1) OPEN file
2) OPEN file
3) Process OPEN (1) seqid=1
4) Process OPEN (2) seqid=2
5) Reply OPEN (2)
6) Receive reply (2)
7) new stateid, seqid=2
8) CLOSE file, using
stateid w/ seqid=2
9) Reply OPEN (1)
10( Process CLOSE (8)
11) Reply CLOSE (8)
12) Forget stateid
file closed
13) Receive reply (7)
14) Forget stateid
file closed.
15) Receive reply (1).
16) New stateid seqid=1
is really the same
stateid that was
closed.
IOW: the reply to the first OPEN is delayed. Since "Process 2" does
not wait before closing the file, and it does not cache the closed
stateid, then when the delayed reply is finally received, it is treated
as setting up a new stateid by the client.
The fix is to ensure that the client processes the OPEN and CLOSE calls
in the same order in which the server processed them.
This commit ensures that we examine the seqid of the stateid
returned by OPEN. If it is a new stateid, we assume the seqid
must be equal to the value 1, and that each state transition
increments the seqid value by 1 (See RFC7530, Section 9.1.4.2,
and RFC5661, Section 8.2.2).
If the tracker sees that an OPEN returns with a seqid that is greater
than the cached seqid + 1, then it bumps a flag to ensure that the
caller waits for the RPCs carrying the missing seqids to complete.
Note that there can still be pathologies where the server crashes before
it can even send us the missing seqids. Since the OPEN call is still
holding a slot when it waits here, that could cause the recovery to
stall forever. To avoid that, we time out after a 5 second wait.
Reported-by: Benjamin Coddington <bcodding@redhat.com>
Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2017-11-07 03:28:01 +07:00
|
|
|
nfs_state_log_update_open_stateid(state);
|
2007-07-06 05:07:55 +07:00
|
|
|
}
|
|
|
|
|
NFSv4: Fix OPEN / CLOSE race
Ben Coddington has noted the following race between OPEN and CLOSE
on a single client.
Process 1 Process 2 Server
========= ========= ======
1) OPEN file
2) OPEN file
3) Process OPEN (1) seqid=1
4) Process OPEN (2) seqid=2
5) Reply OPEN (2)
6) Receive reply (2)
7) new stateid, seqid=2
8) CLOSE file, using
stateid w/ seqid=2
9) Reply OPEN (1)
10) Process CLOSE (8)
11) Reply CLOSE (8)
12) Forget stateid
file closed
13) Receive reply (7)
14) Forget stateid
file closed.
15) Receive reply (1).
16) New stateid seqid=1
is really the same
stateid that was
closed.
IOW: the reply to the first OPEN is delayed. Since "Process 2" does
not wait before closing the file, and it does not cache the closed
stateid, then when the delayed reply is finally received, it is treated
as setting up a new stateid by the client.
The fix is to ensure that the client processes the OPEN and CLOSE calls
in the same order in which the server processed them.
This commit ensures that we examine the seqid of the stateid
returned by OPEN. If it is a new stateid, we assume the seqid
must be equal to the value 1, and that each state transition
increments the seqid value by 1 (See RFC7530, Section 9.1.4.2,
and RFC5661, Section 8.2.2).
If the tracker sees that an OPEN returns with a seqid that is greater
than the cached seqid + 1, then it bumps a flag to ensure that the
caller waits for the RPCs carrying the missing seqids to complete.
Note that there can still be pathologies where the server crashes before
it can even send us the missing seqids. Since the OPEN call is still
holding a slot when it waits here, that could cause the recovery to
stall forever. To avoid that, we time out after a 5 second wait.
Reported-by: Benjamin Coddington <bcodding@redhat.com>
Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2017-11-07 03:28:01 +07:00
|
|
|
static void nfs_state_set_open_stateid(struct nfs4_state *state,
|
2016-09-23 00:39:13 +07:00
|
|
|
const nfs4_stateid *open_stateid,
|
|
|
|
fmode_t fmode,
|
|
|
|
nfs4_stateid *freeme)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
2007-07-09 21:45:42 +07:00
|
|
|
/*
|
|
|
|
* Protect the call to nfs4_state_set_mode_locked and
|
|
|
|
* serialise the stateid update
|
|
|
|
*/
|
|
|
|
write_seqlock(&state->seqlock);
|
NFSv4: Fix OPEN / CLOSE race
Ben Coddington has noted the following race between OPEN and CLOSE
on a single client.
Process 1 Process 2 Server
========= ========= ======
1) OPEN file
2) OPEN file
3) Process OPEN (1) seqid=1
4) Process OPEN (2) seqid=2
5) Reply OPEN (2)
6) Receive reply (2)
7) new stateid, seqid=2
8) CLOSE file, using
stateid w/ seqid=2
9) Reply OPEN (1)
10( Process CLOSE (8)
11) Reply CLOSE (8)
12) Forget stateid
file closed
13) Receive reply (7)
14) Forget stateid
file closed.
15) Receive reply (1).
16) New stateid seqid=1
is really the same
stateid that was
closed.
IOW: the reply to the first OPEN is delayed. Since "Process 2" does
not wait before closing the file, and it does not cache the closed
stateid, then when the delayed reply is finally received, it is treated
as setting up a new stateid by the client.
The fix is to ensure that the client processes the OPEN and CLOSE calls
in the same order in which the server processed them.
This commit ensures that we examine the seqid of the stateid
returned by OPEN. If it is a new stateid, we assume the seqid
must be equal to the value 1, and that each state transition
increments the seqid value by 1 (See RFC7530, Section 9.1.4.2,
and RFC5661, Section 8.2.2).
If the tracker sees that an OPEN returns with a seqid that is greater
than the cached seqid + 1, then it bumps a flag to ensure that the
caller waits for the RPCs carrying the missing seqids to complete.
Note that there can still be pathologies where the server crashes before
it can even send us the missing seqids. Since the OPEN call is still
holding a slot when it waits here, that could cause the recovery to
stall forever. To avoid that, we time out after a 5 second wait.
Reported-by: Benjamin Coddington <bcodding@redhat.com>
Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2017-11-07 03:28:01 +07:00
|
|
|
nfs_set_open_stateid_locked(state, open_stateid, freeme);
|
|
|
|
switch (fmode) {
|
|
|
|
case FMODE_READ:
|
|
|
|
set_bit(NFS_O_RDONLY_STATE, &state->flags);
|
|
|
|
break;
|
|
|
|
case FMODE_WRITE:
|
|
|
|
set_bit(NFS_O_WRONLY_STATE, &state->flags);
|
|
|
|
break;
|
|
|
|
case FMODE_READ|FMODE_WRITE:
|
|
|
|
set_bit(NFS_O_RDWR_STATE, &state->flags);
|
2007-07-06 05:07:55 +07:00
|
|
|
}
|
NFSv4: Fix OPEN / CLOSE race
Ben Coddington has noted the following race between OPEN and CLOSE
on a single client.
Process 1 Process 2 Server
========= ========= ======
1) OPEN file
2) OPEN file
3) Process OPEN (1) seqid=1
4) Process OPEN (2) seqid=2
5) Reply OPEN (2)
6) Receive reply (2)
7) new stateid, seqid=2
8) CLOSE file, using
stateid w/ seqid=2
9) Reply OPEN (1)
10( Process CLOSE (8)
11) Reply CLOSE (8)
12) Forget stateid
file closed
13) Receive reply (7)
14) Forget stateid
file closed.
15) Receive reply (1).
16) New stateid seqid=1
is really the same
stateid that was
closed.
IOW: the reply to the first OPEN is delayed. Since "Process 2" does
not wait before closing the file, and it does not cache the closed
stateid, then when the delayed reply is finally received, it is treated
as setting up a new stateid by the client.
The fix is to ensure that the client processes the OPEN and CLOSE calls
in the same order in which the server processed them.
This commit ensures that we examine the seqid of the stateid
returned by OPEN. If it is a new stateid, we assume the seqid
must be equal to the value 1, and that each state transition
increments the seqid value by 1 (See RFC7530, Section 9.1.4.2,
and RFC5661, Section 8.2.2).
If the tracker sees that an OPEN returns with a seqid that is greater
than the cached seqid + 1, then it bumps a flag to ensure that the
caller waits for the RPCs carrying the missing seqids to complete.
Note that there can still be pathologies where the server crashes before
it can even send us the missing seqids. Since the OPEN call is still
holding a slot when it waits here, that could cause the recovery to
stall forever. To avoid that, we time out after a 5 second wait.
Reported-by: Benjamin Coddington <bcodding@redhat.com>
Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2017-11-07 03:28:01 +07:00
|
|
|
set_bit(NFS_OPEN_STATE, &state->flags);
|
|
|
|
write_sequnlock(&state->seqlock);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void nfs_state_set_delegation(struct nfs4_state *state,
|
|
|
|
const nfs4_stateid *deleg_stateid,
|
|
|
|
fmode_t fmode)
|
|
|
|
{
|
|
|
|
/*
|
|
|
|
* Protect the call to nfs4_state_set_mode_locked and
|
|
|
|
* serialise the stateid update
|
|
|
|
*/
|
|
|
|
write_seqlock(&state->seqlock);
|
|
|
|
nfs4_stateid_copy(&state->stateid, deleg_stateid);
|
|
|
|
set_bit(NFS_DELEGATED_STATE, &state->flags);
|
2007-07-09 21:45:42 +07:00
|
|
|
write_sequnlock(&state->seqlock);
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
2016-09-23 00:39:13 +07:00
|
|
|
static int update_open_stateid(struct nfs4_state *state,
|
|
|
|
const nfs4_stateid *open_stateid,
|
|
|
|
const nfs4_stateid *delegation,
|
|
|
|
fmode_t fmode)
|
2008-12-24 03:21:38 +07:00
|
|
|
{
|
2016-09-23 00:39:13 +07:00
|
|
|
struct nfs_server *server = NFS_SERVER(state->inode);
|
|
|
|
struct nfs_client *clp = server->nfs_client;
|
2008-12-24 03:21:38 +07:00
|
|
|
struct nfs_inode *nfsi = NFS_I(state->inode);
|
|
|
|
struct nfs_delegation *deleg_cur;
|
2016-10-18 22:21:30 +07:00
|
|
|
nfs4_stateid freeme = { };
|
2008-12-24 03:21:38 +07:00
|
|
|
int ret = 0;
|
|
|
|
|
2008-12-24 03:21:56 +07:00
|
|
|
fmode &= (FMODE_READ|FMODE_WRITE);
|
2008-12-24 03:21:38 +07:00
|
|
|
|
|
|
|
rcu_read_lock();
|
NFSv4: Fix OPEN / CLOSE race
Ben Coddington has noted the following race between OPEN and CLOSE
on a single client.
Process 1 Process 2 Server
========= ========= ======
1) OPEN file
2) OPEN file
3) Process OPEN (1) seqid=1
4) Process OPEN (2) seqid=2
5) Reply OPEN (2)
6) Receive reply (2)
7) new stateid, seqid=2
8) CLOSE file, using
stateid w/ seqid=2
9) Reply OPEN (1)
10( Process CLOSE (8)
11) Reply CLOSE (8)
12) Forget stateid
file closed
13) Receive reply (7)
14) Forget stateid
file closed.
15) Receive reply (1).
16) New stateid seqid=1
is really the same
stateid that was
closed.
IOW: the reply to the first OPEN is delayed. Since "Process 2" does
not wait before closing the file, and it does not cache the closed
stateid, then when the delayed reply is finally received, it is treated
as setting up a new stateid by the client.
The fix is to ensure that the client processes the OPEN and CLOSE calls
in the same order in which the server processed them.
This commit ensures that we examine the seqid of the stateid
returned by OPEN. If it is a new stateid, we assume the seqid
must be equal to the value 1, and that each state transition
increments the seqid value by 1 (See RFC7530, Section 9.1.4.2,
and RFC5661, Section 8.2.2).
If the tracker sees that an OPEN returns with a seqid that is greater
than the cached seqid + 1, then it bumps a flag to ensure that the
caller waits for the RPCs carrying the missing seqids to complete.
Note that there can still be pathologies where the server crashes before
it can even send us the missing seqids. Since the OPEN call is still
holding a slot when it waits here, that could cause the recovery to
stall forever. To avoid that, we time out after a 5 second wait.
Reported-by: Benjamin Coddington <bcodding@redhat.com>
Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2017-11-07 03:28:01 +07:00
|
|
|
spin_lock(&state->owner->so_lock);
|
|
|
|
if (open_stateid != NULL) {
|
|
|
|
nfs_state_set_open_stateid(state, open_stateid, fmode, &freeme);
|
|
|
|
ret = 1;
|
|
|
|
}
|
|
|
|
|
2008-12-24 03:21:38 +07:00
|
|
|
deleg_cur = rcu_dereference(nfsi->delegation);
|
|
|
|
if (deleg_cur == NULL)
|
|
|
|
goto no_delegation;
|
|
|
|
|
|
|
|
spin_lock(&deleg_cur->lock);
|
2013-08-22 02:48:42 +07:00
|
|
|
if (rcu_dereference(nfsi->delegation) != deleg_cur ||
|
2013-02-05 23:43:28 +07:00
|
|
|
test_bit(NFS_DELEGATION_RETURNING, &deleg_cur->flags) ||
|
2008-12-24 03:21:56 +07:00
|
|
|
(deleg_cur->type & fmode) != fmode)
|
2008-12-24 03:21:38 +07:00
|
|
|
goto no_delegation_unlock;
|
|
|
|
|
|
|
|
if (delegation == NULL)
|
|
|
|
delegation = &deleg_cur->stateid;
|
2012-03-05 06:13:56 +07:00
|
|
|
else if (!nfs4_stateid_match(&deleg_cur->stateid, delegation))
|
2008-12-24 03:21:38 +07:00
|
|
|
goto no_delegation_unlock;
|
|
|
|
|
2008-12-24 03:21:52 +07:00
|
|
|
nfs_mark_delegation_referenced(deleg_cur);
|
NFSv4: Fix OPEN / CLOSE race
Ben Coddington has noted the following race between OPEN and CLOSE
on a single client.
Process 1 Process 2 Server
========= ========= ======
1) OPEN file
2) OPEN file
3) Process OPEN (1) seqid=1
4) Process OPEN (2) seqid=2
5) Reply OPEN (2)
6) Receive reply (2)
7) new stateid, seqid=2
8) CLOSE file, using
stateid w/ seqid=2
9) Reply OPEN (1)
10( Process CLOSE (8)
11) Reply CLOSE (8)
12) Forget stateid
file closed
13) Receive reply (7)
14) Forget stateid
file closed.
15) Receive reply (1).
16) New stateid seqid=1
is really the same
stateid that was
closed.
IOW: the reply to the first OPEN is delayed. Since "Process 2" does
not wait before closing the file, and it does not cache the closed
stateid, then when the delayed reply is finally received, it is treated
as setting up a new stateid by the client.
The fix is to ensure that the client processes the OPEN and CLOSE calls
in the same order in which the server processed them.
This commit ensures that we examine the seqid of the stateid
returned by OPEN. If it is a new stateid, we assume the seqid
must be equal to the value 1, and that each state transition
increments the seqid value by 1 (See RFC7530, Section 9.1.4.2,
and RFC5661, Section 8.2.2).
If the tracker sees that an OPEN returns with a seqid that is greater
than the cached seqid + 1, then it bumps a flag to ensure that the
caller waits for the RPCs carrying the missing seqids to complete.
Note that there can still be pathologies where the server crashes before
it can even send us the missing seqids. Since the OPEN call is still
holding a slot when it waits here, that could cause the recovery to
stall forever. To avoid that, we time out after a 5 second wait.
Reported-by: Benjamin Coddington <bcodding@redhat.com>
Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2017-11-07 03:28:01 +07:00
|
|
|
nfs_state_set_delegation(state, &deleg_cur->stateid, fmode);
|
2008-12-24 03:21:38 +07:00
|
|
|
ret = 1;
|
|
|
|
no_delegation_unlock:
|
|
|
|
spin_unlock(&deleg_cur->lock);
|
|
|
|
no_delegation:
|
NFSv4: Fix OPEN / CLOSE race
Ben Coddington has noted the following race between OPEN and CLOSE
on a single client.
Process 1 Process 2 Server
========= ========= ======
1) OPEN file
2) OPEN file
3) Process OPEN (1) seqid=1
4) Process OPEN (2) seqid=2
5) Reply OPEN (2)
6) Receive reply (2)
7) new stateid, seqid=2
8) CLOSE file, using
stateid w/ seqid=2
9) Reply OPEN (1)
10( Process CLOSE (8)
11) Reply CLOSE (8)
12) Forget stateid
file closed
13) Receive reply (7)
14) Forget stateid
file closed.
15) Receive reply (1).
16) New stateid seqid=1
is really the same
stateid that was
closed.
IOW: the reply to the first OPEN is delayed. Since "Process 2" does
not wait before closing the file, and it does not cache the closed
stateid, then when the delayed reply is finally received, it is treated
as setting up a new stateid by the client.
The fix is to ensure that the client processes the OPEN and CLOSE calls
in the same order in which the server processed them.
This commit ensures that we examine the seqid of the stateid
returned by OPEN. If it is a new stateid, we assume the seqid
must be equal to the value 1, and that each state transition
increments the seqid value by 1 (See RFC7530, Section 9.1.4.2,
and RFC5661, Section 8.2.2).
If the tracker sees that an OPEN returns with a seqid that is greater
than the cached seqid + 1, then it bumps a flag to ensure that the
caller waits for the RPCs carrying the missing seqids to complete.
Note that there can still be pathologies where the server crashes before
it can even send us the missing seqids. Since the OPEN call is still
holding a slot when it waits here, that could cause the recovery to
stall forever. To avoid that, we time out after a 5 second wait.
Reported-by: Benjamin Coddington <bcodding@redhat.com>
Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2017-11-07 03:28:01 +07:00
|
|
|
if (ret)
|
|
|
|
update_open_stateflags(state, fmode);
|
|
|
|
spin_unlock(&state->owner->so_lock);
|
2008-12-24 03:21:38 +07:00
|
|
|
rcu_read_unlock();
|
|
|
|
|
2014-02-13 07:15:06 +07:00
|
|
|
if (test_bit(NFS_STATE_RECLAIM_NOGRACE, &state->flags))
|
2016-09-23 00:39:13 +07:00
|
|
|
nfs4_schedule_state_manager(clp);
|
|
|
|
if (freeme.type != 0)
|
|
|
|
nfs4_test_and_free_stateid(server, &freeme,
|
|
|
|
state->owner->so_cred);
|
2008-12-24 03:21:38 +07:00
|
|
|
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2015-01-25 03:07:56 +07:00
|
|
|
static bool nfs4_update_lock_stateid(struct nfs4_lock_state *lsp,
|
|
|
|
const nfs4_stateid *stateid)
|
|
|
|
{
|
|
|
|
struct nfs4_state *state = lsp->ls_state;
|
|
|
|
bool ret = false;
|
|
|
|
|
|
|
|
spin_lock(&state->state_lock);
|
|
|
|
if (!nfs4_stateid_match_other(stateid, &lsp->ls_stateid))
|
|
|
|
goto out_noupdate;
|
|
|
|
if (!nfs4_stateid_is_newer(stateid, &lsp->ls_stateid))
|
|
|
|
goto out_noupdate;
|
|
|
|
nfs4_stateid_copy(&lsp->ls_stateid, stateid);
|
|
|
|
ret = true;
|
|
|
|
out_noupdate:
|
|
|
|
spin_unlock(&state->state_lock);
|
|
|
|
return ret;
|
|
|
|
}
|
2008-12-24 03:21:38 +07:00
|
|
|
|
2008-12-24 03:21:56 +07:00
|
|
|
/*
 * nfs4_return_incompatible_delegation - return a delegation that does not
 * cover the requested open mode
 * @inode: inode whose delegation is examined
 * @fmode: requested open mode (masked to FMODE_READ|FMODE_WRITE)
 *
 * Does nothing when the inode has no delegation or when the delegation's
 * type already includes every bit of @fmode; otherwise calls
 * nfs4_inode_return_delegation() after leaving the RCU read section.
 */
static void nfs4_return_incompatible_delegation(struct inode *inode, fmode_t fmode)
{
	struct nfs_delegation *delegation;
	bool compatible;

	fmode &= FMODE_READ|FMODE_WRITE;

	rcu_read_lock();
	delegation = rcu_dereference(NFS_I(inode)->delegation);
	compatible = delegation == NULL ||
		     (delegation->type & fmode) == fmode;
	rcu_read_unlock();

	if (!compatible)
		nfs4_inode_return_delegation(inode);
}
|
|
|
|
|
2007-07-09 01:11:36 +07:00
|
|
|
static struct nfs4_state *nfs4_try_open_cached(struct nfs4_opendata *opendata)
|
2007-07-06 06:02:21 +07:00
|
|
|
{
|
|
|
|
struct nfs4_state *state = opendata->state;
|
|
|
|
struct nfs_inode *nfsi = NFS_I(state->inode);
|
|
|
|
struct nfs_delegation *delegation;
|
2013-05-30 02:36:40 +07:00
|
|
|
int open_mode = opendata->o_arg.open_flags;
|
2008-12-24 03:21:56 +07:00
|
|
|
fmode_t fmode = opendata->o_arg.fmode;
|
2015-08-20 10:30:00 +07:00
|
|
|
enum open_claim_type4 claim = opendata->o_arg.claim;
|
2007-07-06 06:02:21 +07:00
|
|
|
nfs4_stateid stateid;
|
|
|
|
int ret = -EAGAIN;
|
|
|
|
|
|
|
|
for (;;) {
|
2014-09-04 01:15:40 +07:00
|
|
|
spin_lock(&state->owner->so_lock);
|
2008-12-24 03:21:56 +07:00
|
|
|
if (can_open_cached(state, fmode, open_mode)) {
|
2014-09-04 01:15:40 +07:00
|
|
|
update_open_stateflags(state, fmode);
|
2007-07-09 01:11:36 +07:00
|
|
|
spin_unlock(&state->owner->so_lock);
|
2014-09-04 01:15:40 +07:00
|
|
|
goto out_return_state;
|
2007-07-09 01:11:36 +07:00
|
|
|
}
|
2014-09-04 01:15:40 +07:00
|
|
|
spin_unlock(&state->owner->so_lock);
|
2008-12-24 03:21:38 +07:00
|
|
|
rcu_read_lock();
|
|
|
|
delegation = rcu_dereference(nfsi->delegation);
|
2015-08-20 10:30:00 +07:00
|
|
|
if (!can_open_delegated(delegation, fmode, claim)) {
|
2008-12-24 03:21:38 +07:00
|
|
|
rcu_read_unlock();
|
2007-07-06 06:02:21 +07:00
|
|
|
break;
|
2008-12-24 03:21:38 +07:00
|
|
|
}
|
2007-07-06 06:02:21 +07:00
|
|
|
/* Save the delegation */
|
2012-03-05 06:13:56 +07:00
|
|
|
nfs4_stateid_copy(&stateid, &delegation->stateid);
|
2007-07-06 06:02:21 +07:00
|
|
|
rcu_read_unlock();
|
2013-04-09 23:56:52 +07:00
|
|
|
nfs_release_seqid(opendata->o_arg.seqid);
|
2013-04-24 01:52:44 +07:00
|
|
|
if (!opendata->is_recover) {
|
|
|
|
ret = nfs_may_open(state->inode, state->owner->so_cred, open_mode);
|
|
|
|
if (ret != 0)
|
|
|
|
goto out;
|
|
|
|
}
|
2007-07-06 06:02:21 +07:00
|
|
|
ret = -EAGAIN;
|
2008-12-24 03:21:38 +07:00
|
|
|
|
|
|
|
/* Try to update the stateid using the delegation */
|
2008-12-24 03:21:56 +07:00
|
|
|
if (update_open_stateid(state, NULL, &stateid, fmode))
|
2008-12-24 03:21:38 +07:00
|
|
|
goto out_return_state;
|
2007-07-06 06:02:21 +07:00
|
|
|
}
|
|
|
|
out:
|
|
|
|
return ERR_PTR(ret);
|
|
|
|
out_return_state:
|
|
|
|
atomic_inc(&state->count);
|
|
|
|
return state;
|
|
|
|
}
|
|
|
|
|
2012-10-03 08:07:32 +07:00
|
|
|
static void
|
|
|
|
nfs4_opendata_check_deleg(struct nfs4_opendata *data, struct nfs4_state *state)
|
|
|
|
{
|
|
|
|
struct nfs_client *clp = NFS_SERVER(state->inode)->nfs_client;
|
|
|
|
struct nfs_delegation *delegation;
|
|
|
|
int delegation_flags = 0;
|
|
|
|
|
|
|
|
rcu_read_lock();
|
|
|
|
delegation = rcu_dereference(NFS_I(state->inode)->delegation);
|
|
|
|
if (delegation)
|
|
|
|
delegation_flags = delegation->flags;
|
|
|
|
rcu_read_unlock();
|
2015-10-02 22:44:54 +07:00
|
|
|
switch (data->o_arg.claim) {
|
|
|
|
default:
|
|
|
|
break;
|
|
|
|
case NFS4_OPEN_CLAIM_DELEGATE_CUR:
|
|
|
|
case NFS4_OPEN_CLAIM_DELEG_CUR_FH:
|
2012-10-03 08:07:32 +07:00
|
|
|
pr_err_ratelimited("NFS: Broken NFSv4 server %s is "
|
|
|
|
"returning a delegation for "
|
|
|
|
"OPEN(CLAIM_DELEGATE_CUR)\n",
|
|
|
|
clp->cl_hostname);
|
2015-10-02 22:44:54 +07:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
if ((delegation_flags & 1UL<<NFS_DELEGATION_NEED_RECLAIM) == 0)
|
2012-10-03 08:07:32 +07:00
|
|
|
nfs_inode_set_delegation(state->inode,
|
2018-03-21 04:03:13 +07:00
|
|
|
data->owner->so_cred,
|
|
|
|
data->o_res.delegation_type,
|
|
|
|
&data->o_res.delegation,
|
|
|
|
data->o_res.pagemod_limit);
|
2012-10-03 08:07:32 +07:00
|
|
|
else
|
|
|
|
nfs_inode_reclaim_delegation(state->inode,
|
2018-03-21 04:03:13 +07:00
|
|
|
data->owner->so_cred,
|
|
|
|
data->o_res.delegation_type,
|
|
|
|
&data->o_res.delegation,
|
|
|
|
data->o_res.pagemod_limit);
|
2012-10-03 08:07:32 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Check the inode attributes against the CLAIM_PREVIOUS returned attributes
|
|
|
|
* and update the nfs4_state.
|
|
|
|
*/
|
|
|
|
static struct nfs4_state *
|
|
|
|
_nfs4_opendata_reclaim_to_nfs4_state(struct nfs4_opendata *data)
|
|
|
|
{
|
|
|
|
struct inode *inode = data->state->inode;
|
|
|
|
struct nfs4_state *state = data->state;
|
|
|
|
int ret;
|
|
|
|
|
2013-10-22 00:10:13 +07:00
|
|
|
if (!data->rpc_done) {
|
2017-01-12 04:08:35 +07:00
|
|
|
if (data->rpc_status)
|
|
|
|
return ERR_PTR(data->rpc_status);
|
2013-10-22 00:10:13 +07:00
|
|
|
/* cached opens have already been processed */
|
|
|
|
goto update;
|
2012-10-03 08:07:32 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
ret = nfs_refresh_inode(inode, &data->f_attr);
|
|
|
|
if (ret)
|
2017-01-12 04:08:35 +07:00
|
|
|
return ERR_PTR(ret);
|
2012-10-03 08:07:32 +07:00
|
|
|
|
|
|
|
if (data->o_res.delegation_type != 0)
|
|
|
|
nfs4_opendata_check_deleg(data, state);
|
2013-10-22 00:10:13 +07:00
|
|
|
update:
|
2012-10-03 08:07:32 +07:00
|
|
|
update_open_stateid(state, &data->o_res.stateid, NULL,
|
|
|
|
data->o_arg.fmode);
|
2013-10-29 01:57:12 +07:00
|
|
|
atomic_inc(&state->count);
|
2012-10-03 08:07:32 +07:00
|
|
|
|
|
|
|
return state;
|
|
|
|
}
|
|
|
|
|
2017-08-08 20:06:18 +07:00
|
|
|
static struct inode *
|
|
|
|
nfs4_opendata_get_inode(struct nfs4_opendata *data)
|
|
|
|
{
|
|
|
|
struct inode *inode;
|
|
|
|
|
|
|
|
switch (data->o_arg.claim) {
|
|
|
|
case NFS4_OPEN_CLAIM_NULL:
|
|
|
|
case NFS4_OPEN_CLAIM_DELEGATE_CUR:
|
|
|
|
case NFS4_OPEN_CLAIM_DELEGATE_PREV:
|
|
|
|
if (!(data->f_attr.valid & NFS_ATTR_FATTR))
|
|
|
|
return ERR_PTR(-EAGAIN);
|
|
|
|
inode = nfs_fhget(data->dir->d_sb, &data->o_res.fh,
|
|
|
|
&data->f_attr, data->f_label);
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
inode = d_inode(data->dentry);
|
|
|
|
ihold(inode);
|
|
|
|
nfs_refresh_inode(inode, &data->f_attr);
|
|
|
|
}
|
|
|
|
return inode;
|
|
|
|
}
|
|
|
|
|
2012-10-03 08:07:32 +07:00
|
|
|
static struct nfs4_state *
|
2017-08-08 21:38:07 +07:00
|
|
|
nfs4_opendata_find_nfs4_state(struct nfs4_opendata *data)
|
2006-01-03 15:55:11 +07:00
|
|
|
{
|
2017-08-08 21:38:07 +07:00
|
|
|
struct nfs4_state *state;
|
2006-01-03 15:55:11 +07:00
|
|
|
struct inode *inode;
|
2017-08-08 21:38:07 +07:00
|
|
|
|
|
|
|
inode = nfs4_opendata_get_inode(data);
|
|
|
|
if (IS_ERR(inode))
|
|
|
|
return ERR_CAST(inode);
|
|
|
|
if (data->state != NULL && data->state->inode == inode) {
|
|
|
|
state = data->state;
|
|
|
|
atomic_inc(&state->count);
|
|
|
|
} else
|
|
|
|
state = nfs4_get_open_state(inode, data->owner);
|
|
|
|
iput(inode);
|
|
|
|
if (state == NULL)
|
|
|
|
state = ERR_PTR(-ENOMEM);
|
|
|
|
return state;
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct nfs4_state *
|
|
|
|
_nfs4_opendata_to_nfs4_state(struct nfs4_opendata *data)
|
|
|
|
{
|
|
|
|
struct nfs4_state *state;
|
2006-01-03 15:55:11 +07:00
|
|
|
|
2007-07-06 06:02:21 +07:00
|
|
|
if (!data->rpc_done) {
|
2007-07-09 01:11:36 +07:00
|
|
|
state = nfs4_try_open_cached(data);
|
2015-11-25 01:29:42 +07:00
|
|
|
trace_nfs4_cached_open(data->state);
|
2007-07-06 06:02:21 +07:00
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
|
2017-08-08 21:38:07 +07:00
|
|
|
state = nfs4_opendata_find_nfs4_state(data);
|
|
|
|
if (IS_ERR(state))
|
|
|
|
goto out;
|
|
|
|
|
2012-10-03 08:07:32 +07:00
|
|
|
if (data->o_res.delegation_type != 0)
|
|
|
|
nfs4_opendata_check_deleg(data, state);
|
2008-12-24 03:21:38 +07:00
|
|
|
update_open_stateid(state, &data->o_res.stateid, NULL,
|
2008-12-24 03:21:56 +07:00
|
|
|
data->o_arg.fmode);
|
2007-07-06 06:02:21 +07:00
|
|
|
out:
|
2013-03-01 07:19:59 +07:00
|
|
|
nfs_release_seqid(data->o_arg.seqid);
|
2006-01-03 15:55:11 +07:00
|
|
|
return state;
|
|
|
|
}
|
|
|
|
|
2012-10-03 08:07:32 +07:00
|
|
|
static struct nfs4_state *
|
|
|
|
nfs4_opendata_to_nfs4_state(struct nfs4_opendata *data)
|
|
|
|
{
|
2016-08-28 22:50:26 +07:00
|
|
|
struct nfs4_state *ret;
|
|
|
|
|
2012-10-03 08:07:32 +07:00
|
|
|
if (data->o_arg.claim == NFS4_OPEN_CLAIM_PREVIOUS)
|
2016-08-28 22:50:26 +07:00
|
|
|
ret =_nfs4_opendata_reclaim_to_nfs4_state(data);
|
|
|
|
else
|
|
|
|
ret = _nfs4_opendata_to_nfs4_state(data);
|
|
|
|
nfs4_sequence_free_slot(&data->o_res.seq_res);
|
|
|
|
return ret;
|
2012-10-03 08:07:32 +07:00
|
|
|
}
|
|
|
|
|
2006-01-03 15:55:15 +07:00
|
|
|
static struct nfs_open_context *nfs4_state_find_open_context(struct nfs4_state *state)
|
|
|
|
{
|
|
|
|
struct nfs_inode *nfsi = NFS_I(state->inode);
|
|
|
|
struct nfs_open_context *ctx;
|
|
|
|
|
|
|
|
spin_lock(&state->inode->i_lock);
|
|
|
|
list_for_each_entry(ctx, &nfsi->open_files, list) {
|
|
|
|
if (ctx->state != state)
|
|
|
|
continue;
|
|
|
|
get_nfs_open_context(ctx);
|
|
|
|
spin_unlock(&state->inode->i_lock);
|
|
|
|
return ctx;
|
|
|
|
}
|
|
|
|
spin_unlock(&state->inode->i_lock);
|
|
|
|
return ERR_PTR(-ENOENT);
|
|
|
|
}
|
|
|
|
|
2013-03-16 01:57:33 +07:00
|
|
|
static struct nfs4_opendata *nfs4_open_recoverdata_alloc(struct nfs_open_context *ctx,
|
|
|
|
struct nfs4_state *state, enum open_claim_type4 claim)
|
2007-07-18 08:50:45 +07:00
|
|
|
{
|
|
|
|
struct nfs4_opendata *opendata;
|
|
|
|
|
2013-03-16 01:57:33 +07:00
|
|
|
opendata = nfs4_opendata_alloc(ctx->dentry, state->owner, 0, 0,
|
2017-11-07 03:28:03 +07:00
|
|
|
NULL, claim, GFP_NOFS);
|
2007-07-18 08:50:45 +07:00
|
|
|
if (opendata == NULL)
|
|
|
|
return ERR_PTR(-ENOMEM);
|
|
|
|
opendata->state = state;
|
|
|
|
atomic_inc(&state->count);
|
|
|
|
return opendata;
|
|
|
|
}
|
|
|
|
|
2015-09-20 21:50:17 +07:00
|
|
|
static int nfs4_open_recover_helper(struct nfs4_opendata *opendata,
|
|
|
|
fmode_t fmode)
|
2006-01-03 15:55:15 +07:00
|
|
|
{
|
2007-07-04 10:48:13 +07:00
|
|
|
struct nfs4_state *newstate;
|
2006-01-03 15:55:15 +07:00
|
|
|
int ret;
|
|
|
|
|
2015-09-20 21:50:17 +07:00
|
|
|
if (!nfs4_mode_match_open_stateid(opendata->state, fmode))
|
NFSv4: When returning a delegation, don't reclaim an incompatible open mode.
It is possible to have an active open with one mode, and a delegation
for the same file with a different mode.
In particular, a WR_ONLY open and an RD_ONLY delegation.
This happens if a WR_ONLY open is followed by a RD_ONLY open which
provides a delegation, but is then close.
When returning the delegation, we currently try to claim opens for
every open type (n_rdwr, n_rdonly, n_wronly). As there is no harm
in claiming an open for a mode that we already have, this is often
simplest.
However if the delegation only provides a subset of the modes that we
currently have open, this will produce an error from the server.
So when claiming open modes prior to returning a delegation, skip the
open request if the mode is not covered by the delegation - the open_stateid
must already cover that mode, so there is nothing to do.
Signed-off-by: NeilBrown <neilb@suse.de>
Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
2015-06-29 11:28:54 +07:00
|
|
|
return 0;
|
2008-12-24 03:21:56 +07:00
|
|
|
opendata->o_arg.open_flags = 0;
|
|
|
|
opendata->o_arg.fmode = fmode;
|
2015-02-28 05:04:17 +07:00
|
|
|
opendata->o_arg.share_access = nfs4_map_atomic_open_share(
|
|
|
|
NFS_SB(opendata->dentry->d_sb),
|
|
|
|
fmode, 0);
|
2007-07-04 10:48:13 +07:00
|
|
|
memset(&opendata->o_res, 0, sizeof(opendata->o_res));
|
|
|
|
memset(&opendata->c_res, 0, sizeof(opendata->c_res));
|
|
|
|
nfs4_init_opendata_res(opendata);
|
2009-12-15 12:27:57 +07:00
|
|
|
ret = _nfs4_recover_proc_open(opendata);
|
2006-01-03 15:55:15 +07:00
|
|
|
if (ret != 0)
|
|
|
|
return ret;
|
2007-07-04 10:48:13 +07:00
|
|
|
newstate = nfs4_opendata_to_nfs4_state(opendata);
|
2007-07-07 19:04:47 +07:00
|
|
|
if (IS_ERR(newstate))
|
|
|
|
return PTR_ERR(newstate);
|
2015-09-20 21:50:17 +07:00
|
|
|
if (newstate != opendata->state)
|
|
|
|
ret = -ESTALE;
|
2011-06-23 05:20:23 +07:00
|
|
|
nfs4_close_state(newstate, fmode);
|
2015-09-20 21:50:17 +07:00
|
|
|
return ret;
|
2006-01-03 15:55:15 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
static int nfs4_open_recover(struct nfs4_opendata *opendata, struct nfs4_state *state)
|
|
|
|
{
|
|
|
|
int ret;
|
|
|
|
|
2014-02-13 07:15:06 +07:00
|
|
|
/* Don't trigger recovery in nfs_test_and_clear_all_open_stateid */
|
|
|
|
clear_bit(NFS_O_RDWR_STATE, &state->flags);
|
|
|
|
clear_bit(NFS_O_WRONLY_STATE, &state->flags);
|
|
|
|
clear_bit(NFS_O_RDONLY_STATE, &state->flags);
|
2006-01-03 15:55:15 +07:00
|
|
|
/* memory barrier prior to reading state->n_* */
|
2007-07-04 10:48:13 +07:00
|
|
|
clear_bit(NFS_DELEGATED_STATE, &state->flags);
|
2013-04-22 22:29:51 +07:00
|
|
|
clear_bit(NFS_OPEN_STATE, &state->flags);
|
2006-01-03 15:55:15 +07:00
|
|
|
smp_rmb();
|
2015-09-20 21:50:17 +07:00
|
|
|
ret = nfs4_open_recover_helper(opendata, FMODE_READ|FMODE_WRITE);
|
|
|
|
if (ret != 0)
|
|
|
|
return ret;
|
|
|
|
ret = nfs4_open_recover_helper(opendata, FMODE_WRITE);
|
|
|
|
if (ret != 0)
|
|
|
|
return ret;
|
|
|
|
ret = nfs4_open_recover_helper(opendata, FMODE_READ);
|
|
|
|
if (ret != 0)
|
|
|
|
return ret;
|
2007-07-09 08:04:15 +07:00
|
|
|
/*
|
|
|
|
* We may have performed cached opens for all three recoveries.
|
|
|
|
* Check if we need to update the current stateid.
|
|
|
|
*/
|
|
|
|
if (test_bit(NFS_DELEGATED_STATE, &state->flags) == 0 &&
|
2012-03-05 06:13:56 +07:00
|
|
|
!nfs4_stateid_match(&state->stateid, &state->open_stateid)) {
|
2007-07-09 21:45:42 +07:00
|
|
|
write_seqlock(&state->seqlock);
|
2007-07-09 08:04:15 +07:00
|
|
|
if (test_bit(NFS_DELEGATED_STATE, &state->flags) == 0)
|
2012-03-05 06:13:56 +07:00
|
|
|
nfs4_stateid_copy(&state->stateid, &state->open_stateid);
|
2007-07-09 21:45:42 +07:00
|
|
|
write_sequnlock(&state->seqlock);
|
2007-07-09 08:04:15 +07:00
|
|
|
}
|
2006-01-03 15:55:15 +07:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2005-04-17 05:20:36 +07:00
|
|
|
/*
|
|
|
|
* OPEN_RECLAIM:
|
|
|
|
* reclaim state on the server after a reboot.
|
|
|
|
*/
|
2007-06-05 22:46:42 +07:00
|
|
|
static int _nfs4_do_open_reclaim(struct nfs_open_context *ctx, struct nfs4_state *state)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
2007-07-09 08:04:15 +07:00
|
|
|
struct nfs_delegation *delegation;
|
2006-01-03 15:55:15 +07:00
|
|
|
struct nfs4_opendata *opendata;
|
2008-12-24 03:21:56 +07:00
|
|
|
fmode_t delegation_type = 0;
|
2005-04-17 05:20:36 +07:00
|
|
|
int status;
|
|
|
|
|
2013-03-16 01:57:33 +07:00
|
|
|
opendata = nfs4_open_recoverdata_alloc(ctx, state,
|
|
|
|
NFS4_OPEN_CLAIM_PREVIOUS);
|
2007-07-18 08:50:45 +07:00
|
|
|
if (IS_ERR(opendata))
|
|
|
|
return PTR_ERR(opendata);
|
2007-07-09 08:04:15 +07:00
|
|
|
rcu_read_lock();
|
|
|
|
delegation = rcu_dereference(NFS_I(state->inode)->delegation);
|
2008-12-24 03:21:39 +07:00
|
|
|
if (delegation != NULL && test_bit(NFS_DELEGATION_NEED_RECLAIM, &delegation->flags) != 0)
|
2007-08-27 20:57:46 +07:00
|
|
|
delegation_type = delegation->type;
|
2007-07-09 08:04:15 +07:00
|
|
|
rcu_read_unlock();
|
2006-01-03 15:55:15 +07:00
|
|
|
opendata->o_arg.u.delegation_type = delegation_type;
|
|
|
|
status = nfs4_open_recover(opendata, state);
|
2007-06-18 03:02:44 +07:00
|
|
|
nfs4_opendata_put(opendata);
|
2005-04-17 05:20:36 +07:00
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
2007-06-05 22:46:42 +07:00
|
|
|
static int nfs4_do_open_reclaim(struct nfs_open_context *ctx, struct nfs4_state *state)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
|
|
|
struct nfs_server *server = NFS_SERVER(state->inode);
|
|
|
|
struct nfs4_exception exception = { };
|
|
|
|
int err;
|
|
|
|
do {
|
2007-06-05 22:46:42 +07:00
|
|
|
err = _nfs4_do_open_reclaim(ctx, state);
|
2013-08-13 03:19:27 +07:00
|
|
|
trace_nfs4_open_reclaim(ctx, 0, err);
|
2013-03-16 03:44:28 +07:00
|
|
|
if (nfs4_clear_cap_atomic_open_v1(server, err, &exception))
|
|
|
|
continue;
|
2010-10-20 06:47:49 +07:00
|
|
|
if (err != -NFS4ERR_DELAY)
|
2005-06-23 00:16:29 +07:00
|
|
|
break;
|
|
|
|
nfs4_handle_exception(server, err, &exception);
|
2005-04-17 05:20:36 +07:00
|
|
|
} while (exception.retry);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
2006-01-03 15:55:15 +07:00
|
|
|
static int nfs4_open_reclaim(struct nfs4_state_owner *sp, struct nfs4_state *state)
|
|
|
|
{
|
|
|
|
struct nfs_open_context *ctx;
|
|
|
|
int ret;
|
|
|
|
|
|
|
|
ctx = nfs4_state_find_open_context(state);
|
|
|
|
if (IS_ERR(ctx))
|
2013-03-29 01:01:33 +07:00
|
|
|
return -EAGAIN;
|
2007-06-05 22:46:42 +07:00
|
|
|
ret = nfs4_do_open_reclaim(ctx, state);
|
2006-01-03 15:55:15 +07:00
|
|
|
put_nfs_open_context(ctx);
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2017-12-13 05:57:09 +07:00
|
|
|
static int nfs4_handle_delegation_recall_error(struct nfs_server *server, struct nfs4_state *state, const nfs4_stateid *stateid, struct file_lock *fl, int err)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
2013-04-02 02:40:44 +07:00
|
|
|
switch (err) {
|
|
|
|
default:
|
|
|
|
printk(KERN_ERR "NFS: %s: unhandled error "
|
|
|
|
"%d.\n", __func__, err);
|
|
|
|
case 0:
|
|
|
|
case -ENOENT:
|
2015-06-05 00:51:13 +07:00
|
|
|
case -EAGAIN:
|
2013-04-02 02:40:44 +07:00
|
|
|
case -ESTALE:
|
|
|
|
break;
|
|
|
|
case -NFS4ERR_BADSESSION:
|
|
|
|
case -NFS4ERR_BADSLOT:
|
|
|
|
case -NFS4ERR_BAD_HIGH_SLOT:
|
|
|
|
case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION:
|
|
|
|
case -NFS4ERR_DEADSESSION:
|
|
|
|
set_bit(NFS_DELEGATED_STATE, &state->flags);
|
|
|
|
nfs4_schedule_session_recovery(server->nfs_client->cl_session, err);
|
|
|
|
return -EAGAIN;
|
|
|
|
case -NFS4ERR_STALE_CLIENTID:
|
|
|
|
case -NFS4ERR_STALE_STATEID:
|
|
|
|
set_bit(NFS_DELEGATED_STATE, &state->flags);
|
|
|
|
/* Don't recall a delegation if it was lost */
|
|
|
|
nfs4_schedule_lease_recovery(server->nfs_client);
|
|
|
|
return -EAGAIN;
|
2013-10-18 01:13:24 +07:00
|
|
|
case -NFS4ERR_MOVED:
|
|
|
|
nfs4_schedule_migration_recovery(server);
|
|
|
|
return -EAGAIN;
|
2013-10-18 01:13:41 +07:00
|
|
|
case -NFS4ERR_LEASE_MOVED:
|
|
|
|
nfs4_schedule_lease_moved_recovery(server->nfs_client);
|
|
|
|
return -EAGAIN;
|
2013-04-02 02:40:44 +07:00
|
|
|
case -NFS4ERR_DELEG_REVOKED:
|
|
|
|
case -NFS4ERR_ADMIN_REVOKED:
|
2016-09-23 00:39:08 +07:00
|
|
|
case -NFS4ERR_EXPIRED:
|
2013-04-02 02:40:44 +07:00
|
|
|
case -NFS4ERR_BAD_STATEID:
|
2013-04-02 02:56:46 +07:00
|
|
|
case -NFS4ERR_OPENMODE:
|
2013-04-02 02:40:44 +07:00
|
|
|
nfs_inode_find_state_and_recover(state->inode,
|
|
|
|
stateid);
|
|
|
|
nfs4_schedule_stateid_recovery(server, state);
|
2014-11-11 06:43:56 +07:00
|
|
|
return -EAGAIN;
|
2013-04-02 02:40:44 +07:00
|
|
|
case -NFS4ERR_DELAY:
|
|
|
|
case -NFS4ERR_GRACE:
|
|
|
|
set_bit(NFS_DELEGATED_STATE, &state->flags);
|
|
|
|
ssleep(1);
|
|
|
|
return -EAGAIN;
|
2013-04-02 02:56:46 +07:00
|
|
|
case -ENOMEM:
|
|
|
|
case -NFS4ERR_DENIED:
|
2017-12-13 05:57:09 +07:00
|
|
|
if (fl) {
|
|
|
|
struct nfs4_lock_state *lsp = fl->fl_u.nfs4_fl.owner;
|
|
|
|
if (lsp)
|
|
|
|
set_bit(NFS_LOCK_LOST, &lsp->ls_flags);
|
|
|
|
}
|
2013-04-02 02:56:46 +07:00
|
|
|
return 0;
|
2013-04-02 02:40:44 +07:00
|
|
|
}
|
2005-04-17 05:20:36 +07:00
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
2015-09-20 21:50:17 +07:00
|
|
|
int nfs4_open_delegation_recall(struct nfs_open_context *ctx,
|
|
|
|
struct nfs4_state *state, const nfs4_stateid *stateid,
|
|
|
|
fmode_t type)
|
2013-04-02 02:56:46 +07:00
|
|
|
{
|
|
|
|
struct nfs_server *server = NFS_SERVER(state->inode);
|
|
|
|
struct nfs4_opendata *opendata;
|
2015-09-20 21:50:17 +07:00
|
|
|
int err = 0;
|
2013-04-02 02:56:46 +07:00
|
|
|
|
|
|
|
opendata = nfs4_open_recoverdata_alloc(ctx, state,
|
|
|
|
NFS4_OPEN_CLAIM_DELEG_CUR_FH);
|
|
|
|
if (IS_ERR(opendata))
|
|
|
|
return PTR_ERR(opendata);
|
|
|
|
nfs4_stateid_copy(&opendata->o_arg.u.delegation, stateid);
|
2015-10-03 00:14:37 +07:00
|
|
|
write_seqlock(&state->seqlock);
|
|
|
|
nfs4_stateid_copy(&state->stateid, &state->open_stateid);
|
|
|
|
write_sequnlock(&state->seqlock);
|
2015-09-20 21:50:17 +07:00
|
|
|
clear_bit(NFS_DELEGATED_STATE, &state->flags);
|
|
|
|
switch (type & (FMODE_READ|FMODE_WRITE)) {
|
|
|
|
case FMODE_READ|FMODE_WRITE:
|
|
|
|
case FMODE_WRITE:
|
|
|
|
err = nfs4_open_recover_helper(opendata, FMODE_READ|FMODE_WRITE);
|
|
|
|
if (err)
|
|
|
|
break;
|
|
|
|
err = nfs4_open_recover_helper(opendata, FMODE_WRITE);
|
|
|
|
if (err)
|
|
|
|
break;
|
|
|
|
case FMODE_READ:
|
|
|
|
err = nfs4_open_recover_helper(opendata, FMODE_READ);
|
|
|
|
}
|
2013-04-02 02:56:46 +07:00
|
|
|
nfs4_opendata_put(opendata);
|
2017-12-13 05:57:09 +07:00
|
|
|
return nfs4_handle_delegation_recall_error(server, state, stateid, NULL, err);
|
2013-04-02 02:56:46 +07:00
|
|
|
}
|
|
|
|
|
2013-08-09 23:49:47 +07:00
|
|
|
static void nfs4_open_confirm_prepare(struct rpc_task *task, void *calldata)
|
|
|
|
{
|
|
|
|
struct nfs4_opendata *data = calldata;
|
|
|
|
|
2017-01-10 23:39:53 +07:00
|
|
|
nfs4_setup_sequence(data->o_arg.server->nfs_client,
|
|
|
|
&data->c_arg.seq_args, &data->c_res.seq_res, task);
|
2013-08-09 23:49:47 +07:00
|
|
|
}
|
|
|
|
|
2006-01-03 15:55:12 +07:00
|
|
|
static void nfs4_open_confirm_done(struct rpc_task *task, void *calldata)
|
|
|
|
{
|
|
|
|
struct nfs4_opendata *data = calldata;
|
|
|
|
|
2014-02-02 02:53:23 +07:00
|
|
|
nfs40_sequence_done(task, &data->c_res.seq_res);
|
2013-08-09 23:49:47 +07:00
|
|
|
|
2006-01-03 15:55:12 +07:00
|
|
|
data->rpc_status = task->tk_status;
|
2006-01-03 15:55:21 +07:00
|
|
|
if (data->rpc_status == 0) {
|
2012-03-05 06:13:56 +07:00
|
|
|
nfs4_stateid_copy(&data->o_res.stateid, &data->c_res.stateid);
|
2008-01-03 03:19:18 +07:00
|
|
|
nfs_confirm_seqid(&data->owner->so_seqid, 0);
|
2006-01-03 15:55:21 +07:00
|
|
|
renew_lease(data->o_res.server, data->timestamp);
|
2017-06-20 19:33:44 +07:00
|
|
|
data->rpc_done = true;
|
2006-01-03 15:55:21 +07:00
|
|
|
}
|
2006-01-03 15:55:12 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
static void nfs4_open_confirm_release(void *calldata)
|
|
|
|
{
|
|
|
|
struct nfs4_opendata *data = calldata;
|
|
|
|
struct nfs4_state *state = NULL;
|
|
|
|
|
|
|
|
/* If this request hasn't been cancelled, do nothing */
|
2017-06-20 19:33:44 +07:00
|
|
|
if (!data->cancelled)
|
2006-01-03 15:55:12 +07:00
|
|
|
goto out_free;
|
|
|
|
/* In case of error, no cleanup! */
|
2007-07-08 00:19:59 +07:00
|
|
|
if (!data->rpc_done)
|
2006-01-03 15:55:12 +07:00
|
|
|
goto out_free;
|
|
|
|
state = nfs4_opendata_to_nfs4_state(data);
|
2007-07-07 19:04:47 +07:00
|
|
|
if (!IS_ERR(state))
|
2011-06-23 05:20:23 +07:00
|
|
|
nfs4_close_state(state, data->o_arg.fmode);
|
2006-01-03 15:55:12 +07:00
|
|
|
out_free:
|
2007-06-18 03:02:44 +07:00
|
|
|
nfs4_opendata_put(data);
|
2006-01-03 15:55:12 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
/* RPC callbacks used by the asynchronous OPEN_CONFIRM task. */
static const struct rpc_call_ops nfs4_open_confirm_ops = {
	.rpc_call_prepare = nfs4_open_confirm_prepare,
	.rpc_call_done = nfs4_open_confirm_done,
	.rpc_release = nfs4_open_confirm_release,
};
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Note: On error, nfs4_proc_open_confirm will free the struct nfs4_opendata
|
|
|
|
*/
|
|
|
|
static int _nfs4_proc_open_confirm(struct nfs4_opendata *data)
|
|
|
|
{
|
2015-03-18 05:25:59 +07:00
|
|
|
struct nfs_server *server = NFS_SERVER(d_inode(data->dir));
|
2006-01-03 15:55:12 +07:00
|
|
|
struct rpc_task *task;
|
2007-07-15 02:40:01 +07:00
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_OPEN_CONFIRM],
|
|
|
|
.rpc_argp = &data->c_arg,
|
|
|
|
.rpc_resp = &data->c_res,
|
|
|
|
.rpc_cred = data->owner->so_cred,
|
|
|
|
};
|
2007-07-15 02:39:59 +07:00
|
|
|
struct rpc_task_setup task_setup_data = {
|
|
|
|
.rpc_client = server->client,
|
2007-07-15 02:40:01 +07:00
|
|
|
.rpc_message = &msg,
|
2007-07-15 02:39:59 +07:00
|
|
|
.callback_ops = &nfs4_open_confirm_ops,
|
|
|
|
.callback_data = data,
|
2008-02-20 08:04:23 +07:00
|
|
|
.workqueue = nfsiod_workqueue,
|
2007-07-15 02:39:59 +07:00
|
|
|
.flags = RPC_TASK_ASYNC,
|
|
|
|
};
|
2005-04-17 05:20:36 +07:00
|
|
|
int status;
|
|
|
|
|
2018-05-05 03:22:50 +07:00
|
|
|
nfs4_init_sequence(&data->c_arg.seq_args, &data->c_res.seq_res, 1,
|
|
|
|
data->is_recover);
|
2007-06-18 03:02:44 +07:00
|
|
|
kref_get(&data->kref);
|
2017-06-20 19:33:44 +07:00
|
|
|
data->rpc_done = false;
|
2007-07-08 00:19:59 +07:00
|
|
|
data->rpc_status = 0;
|
2007-07-15 02:40:01 +07:00
|
|
|
data->timestamp = jiffies;
|
2007-07-15 02:39:59 +07:00
|
|
|
task = rpc_run_task(&task_setup_data);
|
2006-03-21 06:11:10 +07:00
|
|
|
if (IS_ERR(task))
|
2006-01-03 15:55:12 +07:00
|
|
|
return PTR_ERR(task);
|
2017-01-12 03:01:43 +07:00
|
|
|
status = rpc_wait_for_completion_task(task);
|
2006-01-03 15:55:12 +07:00
|
|
|
if (status != 0) {
|
2017-06-20 19:33:44 +07:00
|
|
|
data->cancelled = true;
|
2006-01-03 15:55:12 +07:00
|
|
|
smp_wmb();
|
|
|
|
} else
|
|
|
|
status = data->rpc_status;
|
2006-11-12 10:18:03 +07:00
|
|
|
rpc_put_task(task);
|
2005-04-17 05:20:36 +07:00
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
2006-01-03 15:55:11 +07:00
|
|
|
static void nfs4_open_prepare(struct rpc_task *task, void *calldata)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
2006-01-03 15:55:11 +07:00
|
|
|
struct nfs4_opendata *data = calldata;
|
|
|
|
struct nfs4_state_owner *sp = data->owner;
|
2013-04-17 05:42:34 +07:00
|
|
|
struct nfs_client *clp = sp->so_server->nfs_client;
|
2015-08-20 10:30:00 +07:00
|
|
|
enum open_claim_type4 claim = data->o_arg.claim;
|
2007-07-15 02:40:01 +07:00
|
|
|
|
2006-01-03 15:55:11 +07:00
|
|
|
if (nfs_wait_on_sequence(data->o_arg.seqid, task) != 0)
|
2013-02-12 07:01:21 +07:00
|
|
|
goto out_wait;
|
2007-07-06 06:02:21 +07:00
|
|
|
/*
|
|
|
|
* Check if we still need to send an OPEN call, or if we can use
|
|
|
|
* a delegation instead.
|
|
|
|
*/
|
|
|
|
if (data->state != NULL) {
|
|
|
|
struct nfs_delegation *delegation;
|
|
|
|
|
2008-12-24 03:21:56 +07:00
|
|
|
if (can_open_cached(data->state, data->o_arg.fmode, data->o_arg.open_flags))
|
2007-07-09 01:11:36 +07:00
|
|
|
goto out_no_action;
|
2007-07-06 06:02:21 +07:00
|
|
|
rcu_read_lock();
|
|
|
|
delegation = rcu_dereference(NFS_I(data->state->inode)->delegation);
|
2015-08-20 10:30:00 +07:00
|
|
|
if (can_open_delegated(delegation, data->o_arg.fmode, claim))
|
2011-12-10 07:05:58 +07:00
|
|
|
goto unlock_no_action;
|
2007-07-06 06:02:21 +07:00
|
|
|
rcu_read_unlock();
|
|
|
|
}
|
2012-04-21 06:24:51 +07:00
|
|
|
/* Update client id. */
|
2013-04-17 05:42:34 +07:00
|
|
|
data->o_arg.clientid = clp->cl_clientid;
|
2015-08-20 10:30:00 +07:00
|
|
|
switch (claim) {
|
|
|
|
default:
|
|
|
|
break;
|
2013-04-24 01:31:19 +07:00
|
|
|
case NFS4_OPEN_CLAIM_PREVIOUS:
|
|
|
|
case NFS4_OPEN_CLAIM_DELEG_CUR_FH:
|
|
|
|
case NFS4_OPEN_CLAIM_DELEG_PREV_FH:
|
2012-10-03 08:07:32 +07:00
|
|
|
data->o_arg.open_bitmap = &nfs4_open_noattr_bitmap[0];
|
2013-04-24 01:31:19 +07:00
|
|
|
case NFS4_OPEN_CLAIM_FH:
|
|
|
|
task->tk_msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_OPEN_NOATTR];
|
2007-07-18 08:50:45 +07:00
|
|
|
}
|
2006-01-03 15:55:21 +07:00
|
|
|
data->timestamp = jiffies;
|
2017-01-10 03:48:22 +07:00
|
|
|
if (nfs4_setup_sequence(data->o_arg.server->nfs_client,
|
2009-04-01 20:22:21 +07:00
|
|
|
&data->o_arg.seq_args,
|
2012-10-30 05:37:40 +07:00
|
|
|
&data->o_res.seq_res,
|
|
|
|
task) != 0)
|
|
|
|
nfs_release_seqid(data->o_arg.seqid);
|
2013-04-17 05:42:34 +07:00
|
|
|
|
|
|
|
/* Set the create mode (note dependency on the session type) */
|
|
|
|
data->o_arg.createmode = NFS4_CREATE_UNCHECKED;
|
|
|
|
if (data->o_arg.open_flags & O_EXCL) {
|
|
|
|
data->o_arg.createmode = NFS4_CREATE_EXCLUSIVE;
|
|
|
|
if (nfs4_has_persistent_session(clp))
|
|
|
|
data->o_arg.createmode = NFS4_CREATE_GUARDED;
|
|
|
|
else if (clp->cl_mvops->minor_version > 0)
|
|
|
|
data->o_arg.createmode = NFS4_CREATE_EXCLUSIVE4_1;
|
|
|
|
}
|
2007-07-09 01:11:36 +07:00
|
|
|
return;
|
2011-12-10 07:05:58 +07:00
|
|
|
unlock_no_action:
|
2015-11-25 01:29:42 +07:00
|
|
|
trace_nfs4_cached_open(data->state);
|
2011-12-10 07:05:58 +07:00
|
|
|
rcu_read_unlock();
|
2007-07-09 01:11:36 +07:00
|
|
|
out_no_action:
|
|
|
|
task->tk_action = NULL;
|
2013-02-12 07:01:21 +07:00
|
|
|
out_wait:
|
2012-11-30 05:27:47 +07:00
|
|
|
nfs4_sequence_done(task, &data->o_res.seq_res);
|
2009-12-15 12:27:57 +07:00
|
|
|
}
|
|
|
|
|
2006-01-03 15:55:11 +07:00
|
|
|
static void nfs4_open_done(struct rpc_task *task, void *calldata)
|
|
|
|
{
|
|
|
|
struct nfs4_opendata *data = calldata;
|
2005-04-17 05:20:36 +07:00
|
|
|
|
2006-01-03 15:55:11 +07:00
|
|
|
data->rpc_status = task->tk_status;
|
2009-04-01 20:22:21 +07:00
|
|
|
|
2016-08-28 22:50:26 +07:00
|
|
|
if (!nfs4_sequence_process(task, &data->o_res.seq_res))
|
2010-08-01 01:29:06 +07:00
|
|
|
return;
|
2009-04-01 20:22:21 +07:00
|
|
|
|
2006-01-03 15:55:11 +07:00
|
|
|
if (task->tk_status == 0) {
|
2012-10-03 07:09:00 +07:00
|
|
|
if (data->o_res.f_attr->valid & NFS_ATTR_FATTR_TYPE) {
|
|
|
|
switch (data->o_res.f_attr->mode & S_IFMT) {
|
2005-10-19 04:20:18 +07:00
|
|
|
case S_IFREG:
|
|
|
|
break;
|
|
|
|
case S_IFLNK:
|
2006-01-03 15:55:11 +07:00
|
|
|
data->rpc_status = -ELOOP;
|
2005-10-19 04:20:18 +07:00
|
|
|
break;
|
|
|
|
case S_IFDIR:
|
2006-01-03 15:55:11 +07:00
|
|
|
data->rpc_status = -EISDIR;
|
2005-10-19 04:20:18 +07:00
|
|
|
break;
|
|
|
|
default:
|
2006-01-03 15:55:11 +07:00
|
|
|
data->rpc_status = -ENOTDIR;
|
2012-10-03 07:09:00 +07:00
|
|
|
}
|
2005-10-19 04:20:18 +07:00
|
|
|
}
|
2006-01-03 15:55:21 +07:00
|
|
|
renew_lease(data->o_res.server, data->timestamp);
|
2007-07-09 03:19:56 +07:00
|
|
|
if (!(data->o_res.rflags & NFS4_OPEN_RESULT_CONFIRM))
|
|
|
|
nfs_confirm_seqid(&data->owner->so_seqid, 0);
|
2005-10-19 04:20:18 +07:00
|
|
|
}
|
2017-06-20 19:33:44 +07:00
|
|
|
data->rpc_done = true;
|
2006-01-03 15:55:11 +07:00
|
|
|
}
|
2005-10-19 04:20:18 +07:00
|
|
|
|
2006-01-03 15:55:11 +07:00
|
|
|
static void nfs4_open_release(void *calldata)
|
|
|
|
{
|
|
|
|
struct nfs4_opendata *data = calldata;
|
|
|
|
struct nfs4_state *state = NULL;
|
|
|
|
|
|
|
|
/* If this request hasn't been cancelled, do nothing */
|
2017-06-20 19:33:44 +07:00
|
|
|
if (!data->cancelled)
|
2006-01-03 15:55:11 +07:00
|
|
|
goto out_free;
|
|
|
|
/* In case of error, no cleanup! */
|
2007-07-08 00:19:59 +07:00
|
|
|
if (data->rpc_status != 0 || !data->rpc_done)
|
2006-01-03 15:55:11 +07:00
|
|
|
goto out_free;
|
|
|
|
/* In case we need an open_confirm, no cleanup! */
|
|
|
|
if (data->o_res.rflags & NFS4_OPEN_RESULT_CONFIRM)
|
|
|
|
goto out_free;
|
|
|
|
state = nfs4_opendata_to_nfs4_state(data);
|
2007-07-07 19:04:47 +07:00
|
|
|
if (!IS_ERR(state))
|
2011-06-23 05:20:23 +07:00
|
|
|
nfs4_close_state(state, data->o_arg.fmode);
|
2006-01-03 15:55:11 +07:00
|
|
|
out_free:
|
2007-06-18 03:02:44 +07:00
|
|
|
nfs4_opendata_put(data);
|
2006-01-03 15:55:11 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
/* RPC callbacks used by the asynchronous OPEN task. */
static const struct rpc_call_ops nfs4_open_ops = {
	.rpc_call_prepare = nfs4_open_prepare,
	.rpc_call_done = nfs4_open_done,
	.rpc_release = nfs4_open_release,
};
|
|
|
|
|
2016-09-19 21:06:49 +07:00
|
|
|
static int nfs4_run_open_task(struct nfs4_opendata *data,
|
|
|
|
struct nfs_open_context *ctx)
|
2006-01-03 15:55:11 +07:00
|
|
|
{
|
2015-03-18 05:25:59 +07:00
|
|
|
struct inode *dir = d_inode(data->dir);
|
2006-01-03 15:55:11 +07:00
|
|
|
struct nfs_server *server = NFS_SERVER(dir);
|
|
|
|
struct nfs_openargs *o_arg = &data->o_arg;
|
|
|
|
struct nfs_openres *o_res = &data->o_res;
|
|
|
|
struct rpc_task *task;
|
2007-07-15 02:40:01 +07:00
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_OPEN],
|
|
|
|
.rpc_argp = o_arg,
|
|
|
|
.rpc_resp = o_res,
|
|
|
|
.rpc_cred = data->owner->so_cred,
|
|
|
|
};
|
2007-07-15 02:39:59 +07:00
|
|
|
struct rpc_task_setup task_setup_data = {
|
|
|
|
.rpc_client = server->client,
|
2007-07-15 02:40:01 +07:00
|
|
|
.rpc_message = &msg,
|
2007-07-15 02:39:59 +07:00
|
|
|
.callback_ops = &nfs4_open_ops,
|
|
|
|
.callback_data = data,
|
2008-02-20 08:04:23 +07:00
|
|
|
.workqueue = nfsiod_workqueue,
|
2007-07-15 02:39:59 +07:00
|
|
|
.flags = RPC_TASK_ASYNC,
|
|
|
|
};
|
2006-01-03 15:55:11 +07:00
|
|
|
int status;
|
|
|
|
|
2007-06-18 03:02:44 +07:00
|
|
|
kref_get(&data->kref);
|
2017-06-20 19:33:44 +07:00
|
|
|
data->rpc_done = false;
|
2007-07-08 00:19:59 +07:00
|
|
|
data->rpc_status = 0;
|
2017-06-20 19:33:44 +07:00
|
|
|
data->cancelled = false;
|
|
|
|
data->is_recover = false;
|
2016-09-19 21:06:49 +07:00
|
|
|
if (!ctx) {
|
|
|
|
nfs4_init_sequence(&o_arg->seq_args, &o_res->seq_res, 1, 1);
|
2017-06-20 19:33:44 +07:00
|
|
|
data->is_recover = true;
|
2016-10-06 23:11:21 +07:00
|
|
|
} else {
|
2016-09-19 21:06:49 +07:00
|
|
|
nfs4_init_sequence(&o_arg->seq_args, &o_res->seq_res, 1, 0);
|
2016-10-06 23:11:21 +07:00
|
|
|
pnfs_lgopen_prepare(data, ctx);
|
|
|
|
}
|
2007-07-15 02:39:59 +07:00
|
|
|
task = rpc_run_task(&task_setup_data);
|
2017-01-12 03:04:25 +07:00
|
|
|
if (IS_ERR(task))
|
|
|
|
return PTR_ERR(task);
|
2017-01-12 03:01:43 +07:00
|
|
|
status = rpc_wait_for_completion_task(task);
|
2017-01-12 03:04:25 +07:00
|
|
|
if (status != 0) {
|
2017-06-20 19:33:44 +07:00
|
|
|
data->cancelled = true;
|
2017-01-12 03:04:25 +07:00
|
|
|
smp_wmb();
|
|
|
|
} else
|
|
|
|
status = data->rpc_status;
|
|
|
|
rpc_put_task(task);
|
2009-12-15 12:27:57 +07:00
|
|
|
|
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int _nfs4_recover_proc_open(struct nfs4_opendata *data)
|
|
|
|
{
|
2015-03-18 05:25:59 +07:00
|
|
|
struct inode *dir = d_inode(data->dir);
|
2009-12-15 12:27:57 +07:00
|
|
|
struct nfs_openres *o_res = &data->o_res;
|
2017-01-12 03:04:25 +07:00
|
|
|
int status;
|
2009-12-15 12:27:57 +07:00
|
|
|
|
2016-09-19 21:06:49 +07:00
|
|
|
status = nfs4_run_open_task(data, NULL);
|
2009-12-15 12:27:57 +07:00
|
|
|
if (status != 0 || !data->rpc_done)
|
|
|
|
return status;
|
|
|
|
|
2012-01-08 01:22:46 +07:00
|
|
|
nfs_fattr_map_and_free_names(NFS_SERVER(dir), &data->f_attr);
|
|
|
|
|
2017-01-12 04:13:29 +07:00
|
|
|
if (o_res->rflags & NFS4_OPEN_RESULT_CONFIRM)
|
2009-12-15 12:27:57 +07:00
|
|
|
status = _nfs4_proc_open_confirm(data);
|
|
|
|
|
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
2014-07-10 19:54:32 +07:00
|
|
|
/*
|
|
|
|
* Additional permission checks in order to distinguish between an
|
|
|
|
* open for read, and an open for execute. This works around the
|
|
|
|
* fact that NFSv4 OPEN treats read and execute permissions as being
|
|
|
|
* the same.
|
|
|
|
* Note that in the non-execute case, we want to turn off permission
|
|
|
|
* checking if we just created a new file (POSIX open() semantics).
|
|
|
|
*/
|
2012-09-11 01:00:46 +07:00
|
|
|
static int nfs4_opendata_access(struct rpc_cred *cred,
|
|
|
|
struct nfs4_opendata *opendata,
|
2013-01-04 04:42:29 +07:00
|
|
|
struct nfs4_state *state, fmode_t fmode,
|
|
|
|
int openflags)
|
2012-09-11 01:00:46 +07:00
|
|
|
{
|
|
|
|
struct nfs_access_entry cache;
|
2017-07-26 03:10:47 +07:00
|
|
|
u32 mask, flags;
|
2012-09-11 01:00:46 +07:00
|
|
|
|
|
|
|
/* access call failed or for some reason the server doesn't
|
|
|
|
* support any access modes -- defer access call until later */
|
|
|
|
if (opendata->o_res.access_supported == 0)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
mask = 0;
|
2014-07-10 19:54:32 +07:00
|
|
|
/*
|
|
|
|
* Use openflags to check for exec, because fmode won't
|
|
|
|
* always have FMODE_EXEC set when file open for exec.
|
|
|
|
*/
|
2013-01-04 04:42:29 +07:00
|
|
|
if (openflags & __FMODE_EXEC) {
|
|
|
|
/* ONLY check for exec rights */
|
2017-07-26 03:10:47 +07:00
|
|
|
if (S_ISDIR(state->inode->i_mode))
|
|
|
|
mask = NFS4_ACCESS_LOOKUP;
|
|
|
|
else
|
|
|
|
mask = NFS4_ACCESS_EXECUTE;
|
2014-07-10 19:54:32 +07:00
|
|
|
} else if ((fmode & FMODE_READ) && !opendata->file_created)
|
2017-07-26 03:10:47 +07:00
|
|
|
mask = NFS4_ACCESS_READ;
|
2012-09-11 01:00:46 +07:00
|
|
|
|
|
|
|
cache.cred = cred;
|
|
|
|
nfs_access_set_mask(&cache, opendata->o_res.access_result);
|
|
|
|
nfs_access_add_cache(state->inode, &cache);
|
|
|
|
|
2017-07-26 03:10:47 +07:00
|
|
|
flags = NFS4_ACCESS_READ | NFS4_ACCESS_EXECUTE | NFS4_ACCESS_LOOKUP;
|
|
|
|
if ((mask & ~cache.mask & flags) == 0)
|
2012-09-11 01:00:46 +07:00
|
|
|
return 0;
|
|
|
|
|
2012-11-03 05:00:56 +07:00
|
|
|
return -EACCES;
|
2012-09-11 01:00:46 +07:00
|
|
|
}
|
|
|
|
|
2009-12-15 12:27:57 +07:00
|
|
|
/*
|
|
|
|
* Note: On error, nfs4_proc_open will free the struct nfs4_opendata
|
|
|
|
*/
|
2016-09-19 21:06:49 +07:00
|
|
|
static int _nfs4_proc_open(struct nfs4_opendata *data,
|
|
|
|
struct nfs_open_context *ctx)
|
2009-12-15 12:27:57 +07:00
|
|
|
{
|
2015-03-18 05:25:59 +07:00
|
|
|
struct inode *dir = d_inode(data->dir);
|
2009-12-15 12:27:57 +07:00
|
|
|
struct nfs_server *server = NFS_SERVER(dir);
|
|
|
|
struct nfs_openargs *o_arg = &data->o_arg;
|
|
|
|
struct nfs_openres *o_res = &data->o_res;
|
|
|
|
int status;
|
|
|
|
|
2016-09-19 21:06:49 +07:00
|
|
|
status = nfs4_run_open_task(data, ctx);
|
2011-10-19 06:11:49 +07:00
|
|
|
if (!data->rpc_done)
|
|
|
|
return status;
|
|
|
|
if (status != 0) {
|
|
|
|
if (status == -NFS4ERR_BADNAME &&
|
|
|
|
!(o_arg->open_flags & O_CREAT))
|
|
|
|
return -ENOENT;
|
2006-01-03 15:55:11 +07:00
|
|
|
return status;
|
2011-10-19 06:11:49 +07:00
|
|
|
}
|
2006-01-03 15:55:11 +07:00
|
|
|
|
2012-01-08 01:22:46 +07:00
|
|
|
nfs_fattr_map_and_free_names(server, &data->f_attr);
|
|
|
|
|
2013-09-24 05:01:28 +07:00
|
|
|
if (o_arg->open_flags & O_CREAT) {
|
|
|
|
if (o_arg->open_flags & O_EXCL)
|
2017-06-20 19:33:44 +07:00
|
|
|
data->file_created = true;
|
2013-09-24 05:01:28 +07:00
|
|
|
else if (o_res->cinfo.before != o_res->cinfo.after)
|
2017-06-20 19:33:44 +07:00
|
|
|
data->file_created = true;
|
2018-01-09 20:21:17 +07:00
|
|
|
if (data->file_created ||
|
|
|
|
inode_peek_iversion_raw(dir) != o_res->cinfo.after)
|
2017-01-12 10:07:28 +07:00
|
|
|
update_changeattr(dir, &o_res->cinfo,
|
|
|
|
o_res->f_attr->time_start);
|
2013-09-24 05:01:28 +07:00
|
|
|
}
|
2010-04-12 03:48:44 +07:00
|
|
|
if ((o_res->rflags & NFS4_OPEN_RESULT_LOCKTYPE_POSIX) == 0)
|
|
|
|
server->caps &= ~NFS_CAP_POSIX_LOCK;
|
2005-04-17 05:20:36 +07:00
|
|
|
if(o_res->rflags & NFS4_OPEN_RESULT_CONFIRM) {
|
2006-01-03 15:55:12 +07:00
|
|
|
status = _nfs4_proc_open_confirm(data);
|
2005-04-17 05:20:36 +07:00
|
|
|
if (status != 0)
|
2006-01-03 15:55:11 +07:00
|
|
|
return status;
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
2017-04-16 06:20:01 +07:00
|
|
|
if (!(o_res->f_attr->valid & NFS_ATTR_FATTR)) {
|
|
|
|
nfs4_sequence_free_slot(&o_res->seq_res);
|
2018-04-08 00:50:59 +07:00
|
|
|
nfs4_proc_getattr(server, &o_res->fh, o_res->f_attr,
|
|
|
|
o_res->f_label, NULL);
|
2017-04-16 06:20:01 +07:00
|
|
|
}
|
2006-01-03 15:55:11 +07:00
|
|
|
return 0;
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* OPEN_EXPIRED:
|
|
|
|
* reclaim state on the server after a network partition.
|
|
|
|
* Assumes caller holds the appropriate lock
|
|
|
|
*/
|
2007-06-05 22:46:42 +07:00
|
|
|
static int _nfs4_open_expired(struct nfs_open_context *ctx, struct nfs4_state *state)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
2006-01-03 15:55:08 +07:00
|
|
|
struct nfs4_opendata *opendata;
|
2006-01-03 15:55:15 +07:00
|
|
|
int ret;
|
2005-04-17 05:20:36 +07:00
|
|
|
|
2013-03-16 01:57:33 +07:00
|
|
|
opendata = nfs4_open_recoverdata_alloc(ctx, state,
|
2013-03-16 03:44:28 +07:00
|
|
|
NFS4_OPEN_CLAIM_FH);
|
2007-07-18 08:50:45 +07:00
|
|
|
if (IS_ERR(opendata))
|
|
|
|
return PTR_ERR(opendata);
|
2006-01-03 15:55:15 +07:00
|
|
|
ret = nfs4_open_recover(opendata, state);
|
2008-04-06 02:54:17 +07:00
|
|
|
if (ret == -ESTALE)
|
2011-06-23 05:40:12 +07:00
|
|
|
d_drop(ctx->dentry);
|
2007-06-18 03:02:44 +07:00
|
|
|
nfs4_opendata_put(opendata);
|
2006-01-03 15:55:15 +07:00
|
|
|
return ret;
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
2009-12-04 03:53:21 +07:00
|
|
|
static int nfs4_do_open_expired(struct nfs_open_context *ctx, struct nfs4_state *state)
|
2005-06-23 00:16:29 +07:00
|
|
|
{
|
2007-06-05 22:46:42 +07:00
|
|
|
struct nfs_server *server = NFS_SERVER(state->inode);
|
2005-06-23 00:16:29 +07:00
|
|
|
struct nfs4_exception exception = { };
|
|
|
|
int err;
|
|
|
|
|
|
|
|
do {
|
2007-06-05 22:46:42 +07:00
|
|
|
err = _nfs4_open_expired(ctx, state);
|
2013-08-13 03:19:27 +07:00
|
|
|
trace_nfs4_open_expired(ctx, 0, err);
|
2013-03-16 03:44:28 +07:00
|
|
|
if (nfs4_clear_cap_atomic_open_v1(server, err, &exception))
|
|
|
|
continue;
|
2009-12-04 03:53:21 +07:00
|
|
|
switch (err) {
|
|
|
|
default:
|
|
|
|
goto out;
|
|
|
|
case -NFS4ERR_GRACE:
|
|
|
|
case -NFS4ERR_DELAY:
|
|
|
|
nfs4_handle_exception(server, err, &exception);
|
|
|
|
err = 0;
|
|
|
|
}
|
2005-06-23 00:16:29 +07:00
|
|
|
} while (exception.retry);
|
2009-12-04 03:53:21 +07:00
|
|
|
out:
|
2005-06-23 00:16:29 +07:00
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
2005-04-17 05:20:36 +07:00
|
|
|
static int nfs4_open_expired(struct nfs4_state_owner *sp, struct nfs4_state *state)
|
|
|
|
{
|
|
|
|
struct nfs_open_context *ctx;
|
2006-01-03 15:55:15 +07:00
|
|
|
int ret;
|
2005-04-17 05:20:36 +07:00
|
|
|
|
2006-01-03 15:55:15 +07:00
|
|
|
ctx = nfs4_state_find_open_context(state);
|
|
|
|
if (IS_ERR(ctx))
|
2013-03-29 01:01:33 +07:00
|
|
|
return -EAGAIN;
|
2007-06-05 22:46:42 +07:00
|
|
|
ret = nfs4_do_open_expired(ctx, state);
|
2006-01-03 15:55:15 +07:00
|
|
|
put_nfs_open_context(ctx);
|
|
|
|
return ret;
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
2016-09-23 00:38:58 +07:00
|
|
|
static void nfs_finish_clear_delegation_stateid(struct nfs4_state *state,
|
|
|
|
const nfs4_stateid *stateid)
|
2014-10-17 19:10:25 +07:00
|
|
|
{
|
2016-09-23 00:38:58 +07:00
|
|
|
nfs_remove_bad_delegation(state->inode, stateid);
|
2014-10-17 19:10:25 +07:00
|
|
|
write_seqlock(&state->seqlock);
|
|
|
|
nfs4_stateid_copy(&state->stateid, &state->open_stateid);
|
|
|
|
write_sequnlock(&state->seqlock);
|
|
|
|
clear_bit(NFS_DELEGATED_STATE, &state->flags);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void nfs40_clear_delegation_stateid(struct nfs4_state *state)
|
|
|
|
{
|
|
|
|
if (rcu_access_pointer(NFS_I(state->inode)->delegation) != NULL)
|
2016-09-23 00:38:58 +07:00
|
|
|
nfs_finish_clear_delegation_stateid(state, NULL);
|
2014-10-17 19:10:25 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * NFSv4.0 open-expired recovery: delegations cannot be recovered on open
 * expiry in NFSv4.0, so the delegation stateid is cleared first and the
 * open itself is then recovered.
 */
static int nfs40_open_expired(struct nfs4_state_owner *sp, struct nfs4_state *state)
{
	int err;

	nfs40_clear_delegation_stateid(state);
	err = nfs4_open_expired(sp, state);

	return err;
}
|
|
|
|
|
2016-09-23 00:38:59 +07:00
|
|
|
static int nfs40_test_and_free_expired_stateid(struct nfs_server *server,
|
|
|
|
nfs4_stateid *stateid,
|
|
|
|
struct rpc_cred *cred)
|
|
|
|
{
|
|
|
|
return -NFS4ERR_BAD_STATEID;
|
|
|
|
}
|
|
|
|
|
2011-06-03 01:59:10 +07:00
|
|
|
#if defined(CONFIG_NFS_V4_1)
|
2016-09-23 00:38:57 +07:00
|
|
|
static int nfs41_test_and_free_expired_stateid(struct nfs_server *server,
|
|
|
|
nfs4_stateid *stateid,
|
|
|
|
struct rpc_cred *cred)
|
|
|
|
{
|
|
|
|
int status;
|
|
|
|
|
2016-09-23 00:39:02 +07:00
|
|
|
switch (stateid->type) {
|
|
|
|
default:
|
|
|
|
break;
|
|
|
|
case NFS4_INVALID_STATEID_TYPE:
|
|
|
|
case NFS4_SPECIAL_STATEID_TYPE:
|
|
|
|
return -NFS4ERR_BAD_STATEID;
|
|
|
|
case NFS4_REVOKED_STATEID_TYPE:
|
|
|
|
goto out_free;
|
|
|
|
}
|
2016-09-23 00:38:57 +07:00
|
|
|
|
2016-09-23 00:39:02 +07:00
|
|
|
status = nfs41_test_stateid(server, stateid, cred);
|
2016-09-23 00:38:57 +07:00
|
|
|
switch (status) {
|
|
|
|
case -NFS4ERR_EXPIRED:
|
|
|
|
case -NFS4ERR_ADMIN_REVOKED:
|
|
|
|
case -NFS4ERR_DELEG_REVOKED:
|
2016-09-23 00:39:02 +07:00
|
|
|
break;
|
|
|
|
default:
|
2016-09-23 00:38:57 +07:00
|
|
|
return status;
|
|
|
|
}
|
2016-09-23 00:39:02 +07:00
|
|
|
out_free:
|
|
|
|
/* Ack the revoked state to the server */
|
2016-09-23 00:39:04 +07:00
|
|
|
nfs41_free_stateid(server, stateid, cred, true);
|
2016-09-23 00:39:02 +07:00
|
|
|
return -NFS4ERR_EXPIRED;
|
2016-09-23 00:38:57 +07:00
|
|
|
}
|
|
|
|
|
2014-11-13 02:44:49 +07:00
|
|
|
static void nfs41_check_delegation_stateid(struct nfs4_state *state)
|
2011-06-03 01:59:10 +07:00
|
|
|
{
|
|
|
|
struct nfs_server *server = NFS_SERVER(state->inode);
|
2014-11-13 02:44:49 +07:00
|
|
|
nfs4_stateid stateid;
|
2013-05-20 22:20:27 +07:00
|
|
|
struct nfs_delegation *delegation;
|
2014-11-13 02:44:49 +07:00
|
|
|
struct rpc_cred *cred;
|
|
|
|
int status;
|
2012-07-12 03:30:14 +07:00
|
|
|
|
2013-05-20 22:20:27 +07:00
|
|
|
/* Get the delegation credential for use by test/free_stateid */
|
|
|
|
rcu_read_lock();
|
|
|
|
delegation = rcu_dereference(NFS_I(state->inode)->delegation);
|
2014-11-13 02:44:49 +07:00
|
|
|
if (delegation == NULL) {
|
2013-05-20 22:20:27 +07:00
|
|
|
rcu_read_unlock();
|
2014-11-13 02:44:49 +07:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
nfs4_stateid_copy(&stateid, &delegation->stateid);
|
2017-03-31 00:49:03 +07:00
|
|
|
if (test_bit(NFS_DELEGATION_REVOKED, &delegation->flags) ||
|
|
|
|
!test_and_clear_bit(NFS_DELEGATION_TEST_EXPIRED,
|
|
|
|
&delegation->flags)) {
|
2016-09-23 00:38:55 +07:00
|
|
|
rcu_read_unlock();
|
2016-09-23 00:38:58 +07:00
|
|
|
nfs_finish_clear_delegation_stateid(state, &stateid);
|
2016-09-23 00:38:55 +07:00
|
|
|
return;
|
|
|
|
}
|
2014-11-13 02:44:49 +07:00
|
|
|
|
|
|
|
cred = get_rpccred(delegation->cred);
|
|
|
|
rcu_read_unlock();
|
2016-09-23 00:38:57 +07:00
|
|
|
status = nfs41_test_and_free_expired_stateid(server, &stateid, cred);
|
2014-11-13 02:44:49 +07:00
|
|
|
trace_nfs4_test_delegation_stateid(state, NULL, status);
|
2016-09-23 00:39:02 +07:00
|
|
|
if (status == -NFS4ERR_EXPIRED || status == -NFS4ERR_BAD_STATEID)
|
2016-09-23 00:38:58 +07:00
|
|
|
nfs_finish_clear_delegation_stateid(state, &stateid);
|
2013-05-20 22:20:27 +07:00
|
|
|
|
2014-11-13 02:44:49 +07:00
|
|
|
put_rpccred(cred);
|
2012-07-12 03:30:14 +07:00
|
|
|
}
|
|
|
|
|
2016-09-23 00:39:03 +07:00
|
|
|
/**
|
|
|
|
* nfs41_check_expired_locks - possibly free a lock stateid
|
|
|
|
*
|
|
|
|
* @state: NFSv4 state for an inode
|
|
|
|
*
|
|
|
|
* Returns NFS_OK if recovery for this stateid is now finished.
|
|
|
|
* Otherwise a negative NFS4ERR value is returned.
|
|
|
|
*/
|
|
|
|
static int nfs41_check_expired_locks(struct nfs4_state *state)
|
|
|
|
{
|
|
|
|
int status, ret = NFS_OK;
|
2016-11-19 09:11:39 +07:00
|
|
|
struct nfs4_lock_state *lsp, *prev = NULL;
|
2016-09-23 00:39:03 +07:00
|
|
|
struct nfs_server *server = NFS_SERVER(state->inode);
|
|
|
|
|
|
|
|
if (!test_bit(LK_STATE_IN_USE, &state->flags))
|
|
|
|
goto out;
|
2016-11-19 09:11:39 +07:00
|
|
|
|
|
|
|
spin_lock(&state->state_lock);
|
2016-09-23 00:39:03 +07:00
|
|
|
list_for_each_entry(lsp, &state->lock_states, ls_locks) {
|
|
|
|
if (test_bit(NFS_LOCK_INITIALIZED, &lsp->ls_flags)) {
|
|
|
|
struct rpc_cred *cred = lsp->ls_state->owner->so_cred;
|
|
|
|
|
2017-10-20 16:53:36 +07:00
|
|
|
refcount_inc(&lsp->ls_count);
|
2016-11-19 09:11:39 +07:00
|
|
|
spin_unlock(&state->state_lock);
|
|
|
|
|
|
|
|
nfs4_put_lock_state(prev);
|
|
|
|
prev = lsp;
|
|
|
|
|
2016-09-23 00:39:03 +07:00
|
|
|
status = nfs41_test_and_free_expired_stateid(server,
|
|
|
|
&lsp->ls_stateid,
|
|
|
|
cred);
|
|
|
|
trace_nfs4_test_lock_stateid(state, lsp, status);
|
|
|
|
if (status == -NFS4ERR_EXPIRED ||
|
|
|
|
status == -NFS4ERR_BAD_STATEID) {
|
|
|
|
clear_bit(NFS_LOCK_INITIALIZED, &lsp->ls_flags);
|
2016-09-23 00:39:17 +07:00
|
|
|
lsp->ls_stateid.type = NFS4_INVALID_STATEID_TYPE;
|
2016-09-23 00:39:03 +07:00
|
|
|
if (!recover_lost_locks)
|
|
|
|
set_bit(NFS_LOCK_LOST, &lsp->ls_flags);
|
|
|
|
} else if (status != NFS_OK) {
|
|
|
|
ret = status;
|
2016-11-19 09:11:39 +07:00
|
|
|
nfs4_put_lock_state(prev);
|
|
|
|
goto out;
|
2016-09-23 00:39:03 +07:00
|
|
|
}
|
2016-11-19 09:11:39 +07:00
|
|
|
spin_lock(&state->state_lock);
|
2016-09-23 00:39:03 +07:00
|
|
|
}
|
2016-11-19 09:11:39 +07:00
|
|
|
}
|
|
|
|
spin_unlock(&state->state_lock);
|
|
|
|
nfs4_put_lock_state(prev);
|
2016-09-23 00:39:03 +07:00
|
|
|
out:
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2012-07-12 03:30:14 +07:00
|
|
|
/**
|
|
|
|
* nfs41_check_open_stateid - possibly free an open stateid
|
|
|
|
*
|
|
|
|
* @state: NFSv4 state for an inode
|
|
|
|
*
|
|
|
|
* Returns NFS_OK if recovery for this stateid is now finished.
|
|
|
|
* Otherwise a negative NFS4ERR value is returned.
|
|
|
|
*/
|
|
|
|
static int nfs41_check_open_stateid(struct nfs4_state *state)
|
|
|
|
{
|
|
|
|
struct nfs_server *server = NFS_SERVER(state->inode);
|
2012-09-27 02:25:53 +07:00
|
|
|
nfs4_stateid *stateid = &state->open_stateid;
|
2013-05-20 22:20:27 +07:00
|
|
|
struct rpc_cred *cred = state->owner->so_cred;
|
2012-07-12 03:30:14 +07:00
|
|
|
int status;
|
|
|
|
|
2016-09-23 00:39:16 +07:00
|
|
|
if (test_bit(NFS_OPEN_STATE, &state->flags) == 0) {
|
2016-09-23 00:39:21 +07:00
|
|
|
if (test_bit(NFS_DELEGATED_STATE, &state->flags) == 0) {
|
|
|
|
if (nfs4_have_delegation(state->inode, state->state))
|
|
|
|
return NFS_OK;
|
|
|
|
return -NFS4ERR_OPENMODE;
|
|
|
|
}
|
2012-07-12 03:30:14 +07:00
|
|
|
return -NFS4ERR_BAD_STATEID;
|
2016-09-23 00:39:16 +07:00
|
|
|
}
|
2016-09-23 00:38:57 +07:00
|
|
|
status = nfs41_test_and_free_expired_stateid(server, stateid, cred);
|
2013-08-21 08:59:40 +07:00
|
|
|
trace_nfs4_test_open_stateid(state, NULL, status);
|
2016-09-23 00:39:02 +07:00
|
|
|
if (status == -NFS4ERR_EXPIRED || status == -NFS4ERR_BAD_STATEID) {
|
2012-07-12 03:30:14 +07:00
|
|
|
clear_bit(NFS_O_RDONLY_STATE, &state->flags);
|
|
|
|
clear_bit(NFS_O_WRONLY_STATE, &state->flags);
|
|
|
|
clear_bit(NFS_O_RDWR_STATE, &state->flags);
|
2013-04-22 22:29:51 +07:00
|
|
|
clear_bit(NFS_OPEN_STATE, &state->flags);
|
2016-09-23 00:39:17 +07:00
|
|
|
stateid->type = NFS4_INVALID_STATEID_TYPE;
|
2016-09-23 00:39:21 +07:00
|
|
|
return status;
|
2017-08-09 08:39:28 +07:00
|
|
|
}
|
2016-09-23 00:39:21 +07:00
|
|
|
if (nfs_open_stateid_recover_openmode(state))
|
|
|
|
return -NFS4ERR_OPENMODE;
|
|
|
|
return NFS_OK;
|
2012-01-31 22:39:30 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
static int nfs41_open_expired(struct nfs4_state_owner *sp, struct nfs4_state *state)
|
|
|
|
{
|
2012-07-12 03:30:05 +07:00
|
|
|
int status;
|
2012-01-31 22:39:30 +07:00
|
|
|
|
2014-11-13 02:44:49 +07:00
|
|
|
nfs41_check_delegation_stateid(state);
|
2016-09-23 00:39:03 +07:00
|
|
|
status = nfs41_check_expired_locks(state);
|
|
|
|
if (status != NFS_OK)
|
|
|
|
return status;
|
2012-07-12 03:30:14 +07:00
|
|
|
status = nfs41_check_open_stateid(state);
|
2012-07-12 03:30:05 +07:00
|
|
|
if (status != NFS_OK)
|
|
|
|
status = nfs4_open_expired(sp, state);
|
|
|
|
return status;
|
2011-06-03 01:59:10 +07:00
|
|
|
}
|
|
|
|
#endif
|
|
|
|
|
2007-06-06 01:49:03 +07:00
|
|
|
/*
|
|
|
|
* on an EXCLUSIVE create, the server should send back a bitmask with FATTR4-*
|
|
|
|
* fields corresponding to attributes that were used to store the verifier.
|
|
|
|
* Make sure we clobber those fields in the later setattr call
|
|
|
|
*/
|
2018-03-29 03:18:17 +07:00
|
|
|
static unsigned nfs4_exclusive_attrset(struct nfs4_opendata *opendata,
|
2015-08-26 20:13:37 +07:00
|
|
|
struct iattr *sattr, struct nfs4_label **label)
|
2007-06-06 01:49:03 +07:00
|
|
|
{
|
2018-03-29 03:18:17 +07:00
|
|
|
const __u32 *bitmask = opendata->o_arg.server->exclcreat_bitmask;
|
|
|
|
__u32 attrset[3];
|
|
|
|
unsigned ret;
|
|
|
|
unsigned i;
|
2015-08-26 20:13:37 +07:00
|
|
|
|
2018-03-29 03:18:17 +07:00
|
|
|
for (i = 0; i < ARRAY_SIZE(attrset); i++) {
|
|
|
|
attrset[i] = opendata->o_res.attrset[i];
|
|
|
|
if (opendata->o_arg.createmode == NFS4_CREATE_EXCLUSIVE4_1)
|
|
|
|
attrset[i] &= ~bitmask[i];
|
|
|
|
}
|
|
|
|
|
|
|
|
ret = (opendata->o_arg.createmode == NFS4_CREATE_EXCLUSIVE) ?
|
|
|
|
sattr->ia_valid : 0;
|
2007-06-06 01:49:03 +07:00
|
|
|
|
2018-03-29 03:18:17 +07:00
|
|
|
if ((attrset[1] & (FATTR4_WORD1_TIME_ACCESS|FATTR4_WORD1_TIME_ACCESS_SET))) {
|
|
|
|
if (sattr->ia_valid & ATTR_ATIME_SET)
|
|
|
|
ret |= ATTR_ATIME_SET;
|
|
|
|
else
|
|
|
|
ret |= ATTR_ATIME;
|
|
|
|
}
|
2015-08-26 20:13:37 +07:00
|
|
|
|
2018-03-29 03:18:17 +07:00
|
|
|
if ((attrset[1] & (FATTR4_WORD1_TIME_MODIFY|FATTR4_WORD1_TIME_MODIFY_SET))) {
|
|
|
|
if (sattr->ia_valid & ATTR_MTIME_SET)
|
|
|
|
ret |= ATTR_MTIME_SET;
|
|
|
|
else
|
|
|
|
ret |= ATTR_MTIME;
|
|
|
|
}
|
2015-08-26 20:13:37 +07:00
|
|
|
|
2018-03-29 03:18:17 +07:00
|
|
|
if (!(attrset[2] & FATTR4_WORD2_SECURITY_LABEL))
|
2015-08-26 20:13:37 +07:00
|
|
|
*label = NULL;
|
2018-03-29 03:18:17 +07:00
|
|
|
return ret;
|
2007-06-06 01:49:03 +07:00
|
|
|
}
|
|
|
|
|
2013-02-08 02:26:21 +07:00
|
|
|
static int _nfs4_open_and_get_state(struct nfs4_opendata *opendata,
|
|
|
|
fmode_t fmode,
|
|
|
|
int flags,
|
2013-05-30 00:17:04 +07:00
|
|
|
struct nfs_open_context *ctx)
|
2013-02-08 02:26:21 +07:00
|
|
|
{
|
|
|
|
struct nfs4_state_owner *sp = opendata->owner;
|
|
|
|
struct nfs_server *server = sp->so_server;
|
2013-05-30 00:11:28 +07:00
|
|
|
struct dentry *dentry;
|
2013-02-08 02:26:21 +07:00
|
|
|
struct nfs4_state *state;
|
|
|
|
unsigned int seq;
|
|
|
|
int ret;
|
|
|
|
|
|
|
|
seq = raw_seqcount_begin(&sp->so_reclaim_seqcount);
|
|
|
|
|
2016-09-19 21:06:49 +07:00
|
|
|
ret = _nfs4_proc_open(opendata, ctx);
|
2014-10-23 23:23:03 +07:00
|
|
|
if (ret != 0)
|
2013-02-08 02:26:21 +07:00
|
|
|
goto out;
|
|
|
|
|
2018-05-22 22:17:16 +07:00
|
|
|
state = _nfs4_opendata_to_nfs4_state(opendata);
|
2013-02-08 02:26:21 +07:00
|
|
|
ret = PTR_ERR(state);
|
|
|
|
if (IS_ERR(state))
|
|
|
|
goto out;
|
2017-02-08 23:29:46 +07:00
|
|
|
ctx->state = state;
|
2013-02-08 02:26:21 +07:00
|
|
|
if (server->caps & NFS_CAP_POSIX_LOCK)
|
|
|
|
set_bit(NFS_STATE_POSIX_LOCKS, &state->flags);
|
2016-09-18 05:17:35 +07:00
|
|
|
if (opendata->o_res.rflags & NFS4_OPEN_RESULT_MAY_NOTIFY_LOCK)
|
|
|
|
set_bit(NFS_STATE_MAY_NOTIFY_LOCK, &state->flags);
|
2013-02-08 02:26:21 +07:00
|
|
|
|
2013-05-30 00:11:28 +07:00
|
|
|
dentry = opendata->dentry;
|
2015-03-18 05:25:59 +07:00
|
|
|
if (d_really_is_negative(dentry)) {
|
2016-03-09 00:44:17 +07:00
|
|
|
struct dentry *alias;
|
2013-05-30 00:11:28 +07:00
|
|
|
d_drop(dentry);
|
2016-03-09 00:44:17 +07:00
|
|
|
alias = d_exact_alias(dentry, state->inode);
|
|
|
|
if (!alias)
|
|
|
|
alias = d_splice_alias(igrab(state->inode), dentry);
|
|
|
|
/* d_splice_alias() can't fail here - it's a non-directory */
|
|
|
|
if (alias) {
|
2013-05-30 00:11:28 +07:00
|
|
|
dput(ctx->dentry);
|
2016-03-09 00:44:17 +07:00
|
|
|
ctx->dentry = dentry = alias;
|
2013-05-30 00:11:28 +07:00
|
|
|
}
|
|
|
|
nfs_set_verifier(dentry,
|
2015-03-18 05:25:59 +07:00
|
|
|
nfs_save_change_attribute(d_inode(opendata->dir)));
|
2013-05-30 00:11:28 +07:00
|
|
|
}
|
|
|
|
|
2013-02-08 02:26:21 +07:00
|
|
|
ret = nfs4_opendata_access(sp->so_cred, opendata, state, fmode, flags);
|
|
|
|
if (ret != 0)
|
|
|
|
goto out;
|
|
|
|
|
2015-03-18 05:25:59 +07:00
|
|
|
if (d_inode(dentry) == state->inode) {
|
2013-05-30 00:34:46 +07:00
|
|
|
nfs_inode_attach_open_context(ctx);
|
|
|
|
if (read_seqcount_retry(&sp->so_reclaim_seqcount, seq))
|
|
|
|
nfs4_schedule_stateid_recovery(server, state);
|
2016-10-06 23:11:21 +07:00
|
|
|
else
|
|
|
|
pnfs_parse_lgopen(state->inode, opendata->lgp, ctx);
|
2013-05-30 00:34:46 +07:00
|
|
|
}
|
2016-10-06 23:11:21 +07:00
|
|
|
|
2013-02-08 02:26:21 +07:00
|
|
|
out:
|
2018-05-22 22:17:16 +07:00
|
|
|
nfs4_sequence_free_slot(&opendata->o_res.seq_res);
|
2013-02-08 02:26:21 +07:00
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2005-04-17 05:20:36 +07:00
|
|
|
/*
|
2006-01-03 15:55:11 +07:00
|
|
|
* Returns a referenced nfs4_state
|
2005-04-17 05:20:36 +07:00
|
|
|
*/
|
2012-05-23 16:02:35 +07:00
|
|
|
static int _nfs4_do_open(struct inode *dir,
|
2013-05-29 23:37:49 +07:00
|
|
|
struct nfs_open_context *ctx,
|
2012-05-23 16:02:35 +07:00
|
|
|
int flags,
|
2017-11-07 03:28:03 +07:00
|
|
|
const struct nfs4_open_createattrs *c,
|
2013-09-24 05:01:28 +07:00
|
|
|
int *opened)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
|
|
|
struct nfs4_state_owner *sp;
|
|
|
|
struct nfs4_state *state = NULL;
|
|
|
|
struct nfs_server *server = NFS_SERVER(dir);
|
2006-01-03 15:55:08 +07:00
|
|
|
struct nfs4_opendata *opendata;
|
2013-05-29 23:37:49 +07:00
|
|
|
struct dentry *dentry = ctx->dentry;
|
|
|
|
struct rpc_cred *cred = ctx->cred;
|
|
|
|
struct nfs4_threshold **ctx_th = &ctx->mdsthreshold;
|
|
|
|
fmode_t fmode = ctx->mode & (FMODE_READ|FMODE_WRITE|FMODE_EXEC);
|
2013-03-16 03:44:28 +07:00
|
|
|
enum open_claim_type4 claim = NFS4_OPEN_CLAIM_NULL;
|
2017-11-07 03:28:03 +07:00
|
|
|
struct iattr *sattr = c->sattr;
|
|
|
|
struct nfs4_label *label = c->label;
|
2013-05-22 23:50:42 +07:00
|
|
|
struct nfs4_label *olabel = NULL;
|
2007-07-06 06:02:21 +07:00
|
|
|
int status;
|
2005-04-17 05:20:36 +07:00
|
|
|
|
|
|
|
/* Protect against reboot recovery conflicts */
|
|
|
|
status = -ENOMEM;
|
2012-01-18 10:04:24 +07:00
|
|
|
sp = nfs4_get_state_owner(server, cred, GFP_KERNEL);
|
|
|
|
if (sp == NULL) {
|
2005-04-17 05:20:36 +07:00
|
|
|
dprintk("nfs4_do_open: nfs4_get_state_owner failed!\n");
|
|
|
|
goto out_err;
|
|
|
|
}
|
2017-01-12 04:17:17 +07:00
|
|
|
status = nfs4_client_recover_expired_lease(server->nfs_client);
|
2006-01-03 15:55:24 +07:00
|
|
|
if (status != 0)
|
2006-01-03 15:55:25 +07:00
|
|
|
goto err_put_state_owner;
|
2015-03-18 05:25:59 +07:00
|
|
|
if (d_really_is_positive(dentry))
|
|
|
|
nfs4_return_incompatible_delegation(d_inode(dentry), fmode);
|
2006-01-03 15:55:24 +07:00
|
|
|
status = -ENOMEM;
|
2015-03-18 05:25:59 +07:00
|
|
|
if (d_really_is_positive(dentry))
|
2013-03-16 03:44:28 +07:00
|
|
|
claim = NFS4_OPEN_CLAIM_FH;
|
2017-11-07 03:28:03 +07:00
|
|
|
opendata = nfs4_opendata_alloc(dentry, sp, fmode, flags,
|
|
|
|
c, claim, GFP_KERNEL);
|
2006-01-03 15:55:08 +07:00
|
|
|
if (opendata == NULL)
|
2008-12-24 03:21:45 +07:00
|
|
|
goto err_put_state_owner;
|
2005-04-17 05:20:36 +07:00
|
|
|
|
2013-05-22 23:50:43 +07:00
|
|
|
if (label) {
|
|
|
|
olabel = nfs4_label_alloc(server, GFP_KERNEL);
|
|
|
|
if (IS_ERR(olabel)) {
|
|
|
|
status = PTR_ERR(olabel);
|
|
|
|
goto err_opendata_put;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-03-27 03:24:37 +07:00
|
|
|
if (server->attr_bitmask[2] & FATTR4_WORD2_MDSTHRESHOLD) {
|
|
|
|
if (!opendata->f_attr.mdsthreshold) {
|
|
|
|
opendata->f_attr.mdsthreshold = pnfs_mdsthreshold_alloc();
|
|
|
|
if (!opendata->f_attr.mdsthreshold)
|
|
|
|
goto err_free_label;
|
|
|
|
}
|
2012-06-05 20:16:47 +07:00
|
|
|
opendata->o_arg.open_bitmap = &nfs4_pnfs_open_bitmap[0];
|
2012-05-23 16:02:35 +07:00
|
|
|
}
|
2015-03-18 05:25:59 +07:00
|
|
|
if (d_really_is_positive(dentry))
|
|
|
|
opendata->state = nfs4_get_open_state(d_inode(dentry), sp);
|
2007-07-06 06:02:21 +07:00
|
|
|
|
2013-05-30 00:17:04 +07:00
|
|
|
status = _nfs4_open_and_get_state(opendata, fmode, flags, ctx);
|
2012-09-11 01:00:46 +07:00
|
|
|
if (status != 0)
|
2013-05-22 23:50:43 +07:00
|
|
|
goto err_free_label;
|
2013-05-30 00:17:04 +07:00
|
|
|
state = ctx->state;
|
2012-09-11 01:00:46 +07:00
|
|
|
|
NFSv4: don't set SETATTR for O_RDONLY|O_EXCL
It is unusual to combine the open flags O_RDONLY and O_EXCL, but
it appears that libre-office does just that.
[pid 3250] stat("/home/USER/.config", {st_mode=S_IFDIR|0700, st_size=8192, ...}) = 0
[pid 3250] open("/home/USER/.config/libreoffice/4-suse/user/extensions/buildid", O_RDONLY|O_EXCL <unfinished ...>
NFSv4 takes O_EXCL as a sign that a setattr command should be sent,
probably to reset the timestamps.
When it was an O_RDONLY open, the SETATTR command does not
identify any actual attributes to change.
If no delegation was provided to the open, the SETATTR uses the
all-zeros stateid and the request is accepted (at least by the
Linux NFS server - no harm, no foul).
If a read-delegation was provided, this is used in the SETATTR
request, and a Netapp filer will justifiably claim
NFS4ERR_BAD_STATEID, which the Linux client takes as a sign
to retry - indefinitely.
So only treat O_EXCL specially if O_CREAT was also given.
Signed-off-by: NeilBrown <neilb@suse.com>
Cc: stable@vger.kernel.org
Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
2015-07-30 10:00:56 +07:00
|
|
|
if ((opendata->o_arg.open_flags & (O_CREAT|O_EXCL)) == (O_CREAT|O_EXCL) &&
|
2013-04-17 05:42:34 +07:00
|
|
|
(opendata->o_arg.createmode != NFS4_CREATE_GUARDED)) {
|
2018-03-29 03:18:17 +07:00
|
|
|
unsigned attrs = nfs4_exclusive_attrset(opendata, sattr, &label);
|
2016-05-12 16:16:38 +07:00
|
|
|
/*
|
|
|
|
* send create attributes which was not set by open
|
|
|
|
* with an extra setattr.
|
|
|
|
*/
|
2018-03-29 03:18:17 +07:00
|
|
|
if (attrs || label) {
|
|
|
|
unsigned ia_old = sattr->ia_valid;
|
|
|
|
|
|
|
|
sattr->ia_valid = attrs;
|
2016-05-12 16:16:38 +07:00
|
|
|
nfs_fattr_init(opendata->o_res.f_attr);
|
|
|
|
status = nfs4_do_setattr(state->inode, cred,
|
|
|
|
opendata->o_res.f_attr, sattr,
|
2016-10-13 11:26:47 +07:00
|
|
|
ctx, label, olabel);
|
2016-05-12 16:16:38 +07:00
|
|
|
if (status == 0) {
|
|
|
|
nfs_setattr_update_inode(state->inode, sattr,
|
|
|
|
opendata->o_res.f_attr);
|
|
|
|
nfs_setsecurity(state->inode, opendata->o_res.f_attr, olabel);
|
|
|
|
}
|
2018-03-29 03:18:17 +07:00
|
|
|
sattr->ia_valid = ia_old;
|
2013-05-22 23:50:42 +07:00
|
|
|
}
|
2010-04-17 03:22:51 +07:00
|
|
|
}
|
2015-08-26 20:11:39 +07:00
|
|
|
if (opened && opendata->file_created)
|
2013-09-24 05:01:28 +07:00
|
|
|
*opened |= FILE_CREATED;
|
2012-05-23 16:02:35 +07:00
|
|
|
|
2014-03-27 03:24:37 +07:00
|
|
|
if (pnfs_use_threshold(ctx_th, opendata->f_attr.mdsthreshold, server)) {
|
2012-05-23 16:02:35 +07:00
|
|
|
*ctx_th = opendata->f_attr.mdsthreshold;
|
2014-03-27 03:24:37 +07:00
|
|
|
opendata->f_attr.mdsthreshold = NULL;
|
|
|
|
}
|
2012-05-23 16:02:35 +07:00
|
|
|
|
2013-05-22 23:50:43 +07:00
|
|
|
nfs4_label_free(olabel);
|
|
|
|
|
2007-06-18 03:02:44 +07:00
|
|
|
nfs4_opendata_put(opendata);
|
2005-04-17 05:20:36 +07:00
|
|
|
nfs4_put_state_owner(sp);
|
|
|
|
return 0;
|
2013-05-22 23:50:43 +07:00
|
|
|
err_free_label:
|
|
|
|
nfs4_label_free(olabel);
|
2007-06-18 03:02:44 +07:00
|
|
|
err_opendata_put:
|
|
|
|
nfs4_opendata_put(opendata);
|
2006-01-03 15:55:08 +07:00
|
|
|
err_put_state_owner:
|
|
|
|
nfs4_put_state_owner(sp);
|
2005-04-17 05:20:36 +07:00
|
|
|
out_err:
|
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2012-05-23 16:02:35 +07:00
|
|
|
static struct nfs4_state *nfs4_do_open(struct inode *dir,
|
2013-05-29 23:37:49 +07:00
|
|
|
struct nfs_open_context *ctx,
|
2012-05-23 16:02:35 +07:00
|
|
|
int flags,
|
|
|
|
struct iattr *sattr,
|
2013-09-24 05:01:28 +07:00
|
|
|
struct nfs4_label *label,
|
|
|
|
int *opened)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
2013-03-16 03:44:28 +07:00
|
|
|
struct nfs_server *server = NFS_SERVER(dir);
|
2005-04-17 05:20:36 +07:00
|
|
|
struct nfs4_exception exception = { };
|
|
|
|
struct nfs4_state *res;
|
2017-11-07 03:28:03 +07:00
|
|
|
struct nfs4_open_createattrs c = {
|
|
|
|
.label = label,
|
|
|
|
.sattr = sattr,
|
|
|
|
.verf = {
|
|
|
|
[0] = (__u32)jiffies,
|
|
|
|
[1] = (__u32)current->pid,
|
|
|
|
},
|
|
|
|
};
|
2005-04-17 05:20:36 +07:00
|
|
|
int status;
|
|
|
|
|
|
|
|
do {
|
2017-11-07 03:28:03 +07:00
|
|
|
status = _nfs4_do_open(dir, ctx, flags, &c, opened);
|
2013-05-30 00:17:04 +07:00
|
|
|
res = ctx->state;
|
2013-08-13 03:19:27 +07:00
|
|
|
trace_nfs4_open_file(ctx, flags, status);
|
2005-04-17 05:20:36 +07:00
|
|
|
if (status == 0)
|
|
|
|
break;
|
|
|
|
/* NOTE: BAD_SEQID means the server and client disagree about the
|
|
|
|
* book-keeping w.r.t. state-changing operations
|
|
|
|
* (OPEN/CLOSE/LOCK/LOCKU...)
|
|
|
|
* It is actually a sign of a bug on the client or on the server.
|
|
|
|
*
|
|
|
|
* If we receive a BAD_SEQID error in the particular case of
|
NFSv4: Add functions to order RPC calls
NFSv4 file state-changing functions such as OPEN, CLOSE, LOCK,... are all
labelled with "sequence identifiers" in order to prevent the server from
reordering RPC requests, as this could cause its file state to
become out of sync with the client.
Currently the NFS client code enforces this ordering locally using
semaphores to restrict access to structures until the RPC call is done.
This, of course, only works with synchronous RPC calls, since the
user process must first grab the semaphore.
By dropping semaphores, and instead teaching the RPC engine to hold
the RPC calls until they are ready to be sent, we can extend this
process to work nicely with asynchronous RPC calls too.
This patch adds a new list called "rpc_sequence" that defines the order
of the RPC calls to be sent. We add one such list for each state_owner.
When an RPC call is ready to be sent, it checks if it is top of the
rpc_sequence list. If so, it proceeds. If not, it goes back to sleep,
and loops until it hits top of the list.
Once the RPC call has completed, it can then bump the sequence id counter,
and remove itself from the rpc_sequence list, and then wake up the next
sleeper.
Note that the state_owner sequence ids and lock_owner sequence ids are
all indexed to the same rpc_sequence list, so OPEN, LOCK,... requests
are all ordered w.r.t. each other.
Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
2005-10-19 04:20:12 +07:00
|
|
|
* doing an OPEN, we assume that nfs_increment_open_seqid() will
|
2005-04-17 05:20:36 +07:00
|
|
|
* have unhashed the old state_owner for us, and that we can
|
|
|
|
* therefore safely retry using a new one. We should still warn
|
|
|
|
* the user though...
|
|
|
|
*/
|
|
|
|
if (status == -NFS4ERR_BAD_SEQID) {
|
2012-03-13 05:01:48 +07:00
|
|
|
pr_warn_ratelimited("NFS: v4 server %s "
|
2007-07-09 03:49:11 +07:00
|
|
|
" returned a bad sequence-id error!\n",
|
|
|
|
NFS_SERVER(dir)->nfs_client->cl_hostname);
|
2005-04-17 05:20:36 +07:00
|
|
|
exception.retry = 1;
|
|
|
|
continue;
|
|
|
|
}
|
2005-10-19 04:20:21 +07:00
|
|
|
/*
|
|
|
|
* BAD_STATEID on OPEN means that the server cancelled our
|
|
|
|
* state before it received the OPEN_CONFIRM.
|
|
|
|
* Recover by retrying the request as per the discussion
|
|
|
|
* on Page 181 of RFC3530.
|
|
|
|
*/
|
|
|
|
if (status == -NFS4ERR_BAD_STATEID) {
|
|
|
|
exception.retry = 1;
|
|
|
|
continue;
|
|
|
|
}
|
2007-07-06 06:02:21 +07:00
|
|
|
if (status == -EAGAIN) {
|
|
|
|
/* We must have found a delegation */
|
|
|
|
exception.retry = 1;
|
|
|
|
continue;
|
|
|
|
}
|
2013-03-16 03:44:28 +07:00
|
|
|
if (nfs4_clear_cap_atomic_open_v1(server, status, &exception))
|
|
|
|
continue;
|
|
|
|
res = ERR_PTR(nfs4_handle_exception(server,
|
2005-04-17 05:20:36 +07:00
|
|
|
status, &exception));
|
|
|
|
} while (exception.retry);
|
|
|
|
return res;
|
|
|
|
}
|
|
|
|
|
2016-06-26 19:44:35 +07:00
|
|
|
static int _nfs4_do_setattr(struct inode *inode,
|
|
|
|
struct nfs_setattrargs *arg,
|
|
|
|
struct nfs_setattrres *res,
|
|
|
|
struct rpc_cred *cred,
|
2016-10-13 11:26:47 +07:00
|
|
|
struct nfs_open_context *ctx)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
2006-03-21 01:44:46 +07:00
|
|
|
struct nfs_server *server = NFS_SERVER(inode);
|
2017-01-12 03:04:25 +07:00
|
|
|
struct rpc_message msg = {
|
2008-06-11 06:39:41 +07:00
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SETATTR],
|
2016-06-26 19:44:35 +07:00
|
|
|
.rpc_argp = arg,
|
|
|
|
.rpc_resp = res,
|
2008-06-11 06:39:41 +07:00
|
|
|
.rpc_cred = cred,
|
2017-01-12 03:04:25 +07:00
|
|
|
};
|
2016-05-17 04:42:44 +07:00
|
|
|
struct rpc_cred *delegation_cred = NULL;
|
2006-01-03 15:55:21 +07:00
|
|
|
unsigned long timestamp = jiffies;
|
2013-04-29 21:35:36 +07:00
|
|
|
bool truncate;
|
2005-08-16 22:49:44 +07:00
|
|
|
int status;
|
2005-04-17 05:20:36 +07:00
|
|
|
|
2016-06-26 19:44:35 +07:00
|
|
|
nfs_fattr_init(res->fattr);
|
2005-04-17 05:20:36 +07:00
|
|
|
|
2013-04-29 21:35:36 +07:00
|
|
|
/* Servers should only apply open mode checks for file size changes */
|
2016-06-26 19:44:35 +07:00
|
|
|
truncate = (arg->iap->ia_valid & ATTR_SIZE) ? true : false;
|
2018-04-09 22:15:30 +07:00
|
|
|
if (!truncate)
|
|
|
|
goto zero_stateid;
|
2013-04-29 21:35:36 +07:00
|
|
|
|
2018-04-09 22:15:30 +07:00
|
|
|
if (nfs4_copy_delegation_stateid(inode, FMODE_WRITE, &arg->stateid, &delegation_cred)) {
|
2013-04-29 21:35:36 +07:00
|
|
|
/* Use that stateid */
|
2018-04-09 22:15:30 +07:00
|
|
|
} else if (ctx != NULL) {
|
2016-10-13 11:26:47 +07:00
|
|
|
struct nfs_lock_context *l_ctx;
|
2016-10-13 11:26:47 +07:00
|
|
|
if (!nfs4_valid_open_stateid(ctx->state))
|
2014-03-05 01:48:16 +07:00
|
|
|
return -EBADF;
|
2016-10-13 11:26:47 +07:00
|
|
|
l_ctx = nfs_get_lock_context(ctx);
|
|
|
|
if (IS_ERR(l_ctx))
|
|
|
|
return PTR_ERR(l_ctx);
|
2016-12-07 03:50:06 +07:00
|
|
|
status = nfs4_select_rw_stateid(ctx->state, FMODE_WRITE, l_ctx,
|
|
|
|
&arg->stateid, &delegation_cred);
|
|
|
|
nfs_put_lock_context(l_ctx);
|
|
|
|
if (status == -EIO)
|
2014-03-05 01:48:16 +07:00
|
|
|
return -EBADF;
|
2018-04-09 22:15:30 +07:00
|
|
|
} else {
|
|
|
|
zero_stateid:
|
2016-06-26 19:44:35 +07:00
|
|
|
nfs4_stateid_copy(&arg->stateid, &zero_stateid);
|
2018-04-09 22:15:30 +07:00
|
|
|
}
|
2016-05-17 04:42:44 +07:00
|
|
|
if (delegation_cred)
|
|
|
|
msg.rpc_cred = delegation_cred;
|
2005-04-17 05:20:36 +07:00
|
|
|
|
2016-06-26 19:44:35 +07:00
|
|
|
status = nfs4_call_sync(server->client, server, &msg, &arg->seq_args, &res->seq_res, 1);
|
2016-05-17 04:42:44 +07:00
|
|
|
|
|
|
|
put_rpccred(delegation_cred);
|
2016-10-13 11:26:47 +07:00
|
|
|
if (status == 0 && ctx != NULL)
|
2006-01-03 15:55:21 +07:00
|
|
|
renew_lease(server, timestamp);
|
2016-06-26 19:44:35 +07:00
|
|
|
trace_nfs4_setattr(inode, &arg->stateid, status);
|
2005-08-16 22:49:44 +07:00
|
|
|
return status;
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
2008-06-11 06:39:41 +07:00
|
|
|
static int nfs4_do_setattr(struct inode *inode, struct rpc_cred *cred,
|
|
|
|
struct nfs_fattr *fattr, struct iattr *sattr,
|
2016-10-13 11:26:47 +07:00
|
|
|
struct nfs_open_context *ctx, struct nfs4_label *ilabel,
|
2013-05-22 23:50:42 +07:00
|
|
|
struct nfs4_label *olabel)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
2006-03-21 01:44:46 +07:00
|
|
|
struct nfs_server *server = NFS_SERVER(inode);
|
2018-04-08 00:44:28 +07:00
|
|
|
__u32 bitmask[NFS4_BITMASK_SZ];
|
2016-10-13 11:26:47 +07:00
|
|
|
struct nfs4_state *state = ctx ? ctx->state : NULL;
|
2017-01-12 03:04:25 +07:00
|
|
|
struct nfs_setattrargs arg = {
|
|
|
|
.fh = NFS_FH(inode),
|
|
|
|
.iap = sattr,
|
2016-06-26 19:44:35 +07:00
|
|
|
.server = server,
|
2018-04-08 00:44:28 +07:00
|
|
|
.bitmask = bitmask,
|
2016-06-26 19:44:35 +07:00
|
|
|
.label = ilabel,
|
2017-01-12 03:04:25 +07:00
|
|
|
};
|
|
|
|
struct nfs_setattrres res = {
|
2016-06-26 19:44:35 +07:00
|
|
|
.fattr = fattr,
|
|
|
|
.label = olabel,
|
|
|
|
.server = server,
|
2017-01-12 03:04:25 +07:00
|
|
|
};
|
2012-03-06 07:56:44 +07:00
|
|
|
struct nfs4_exception exception = {
|
|
|
|
.state = state,
|
2012-03-08 04:39:06 +07:00
|
|
|
.inode = inode,
|
2016-06-26 19:44:35 +07:00
|
|
|
.stateid = &arg.stateid,
|
2012-03-06 07:56:44 +07:00
|
|
|
};
|
2005-04-17 05:20:36 +07:00
|
|
|
int err;
|
2016-06-26 19:44:35 +07:00
|
|
|
|
2005-04-17 05:20:36 +07:00
|
|
|
do {
|
2018-04-08 00:44:28 +07:00
|
|
|
nfs4_bitmap_copy_adjust_setattr(bitmask,
|
|
|
|
nfs4_bitmask(server, olabel),
|
|
|
|
inode);
|
|
|
|
|
2016-10-13 11:26:47 +07:00
|
|
|
err = _nfs4_do_setattr(inode, &arg, &res, cred, ctx);
|
2012-04-19 03:29:11 +07:00
|
|
|
switch (err) {
|
|
|
|
case -NFS4ERR_OPENMODE:
|
2013-04-29 22:11:58 +07:00
|
|
|
if (!(sattr->ia_valid & ATTR_SIZE)) {
|
|
|
|
pr_warn_once("NFSv4: server %s is incorrectly "
|
|
|
|
"applying open mode checks to "
|
|
|
|
"a SETATTR that is not "
|
|
|
|
"changing file size.\n",
|
|
|
|
server->nfs_client->cl_hostname);
|
|
|
|
}
|
2012-04-19 03:29:11 +07:00
|
|
|
if (state && !(state->state & FMODE_WRITE)) {
|
|
|
|
err = -EBADF;
|
|
|
|
if (sattr->ia_valid & ATTR_OPEN)
|
|
|
|
err = -EACCES;
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
err = nfs4_handle_exception(server, err, &exception);
|
2005-04-17 05:20:36 +07:00
|
|
|
} while (exception.retry);
|
2012-04-19 03:29:11 +07:00
|
|
|
out:
|
2005-04-17 05:20:36 +07:00
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
2015-09-22 10:35:22 +07:00
|
|
|
static bool
|
|
|
|
nfs4_wait_on_layoutreturn(struct inode *inode, struct rpc_task *task)
|
|
|
|
{
|
|
|
|
if (inode == NULL || !nfs_have_layout(inode))
|
|
|
|
return false;
|
|
|
|
|
|
|
|
return pnfs_wait_on_layoutreturn(inode, task);
|
|
|
|
}
|
|
|
|
|
2005-04-17 05:20:36 +07:00
|
|
|
struct nfs4_closedata {
|
|
|
|
struct inode *inode;
|
|
|
|
struct nfs4_state *state;
|
|
|
|
struct nfs_closeargs arg;
|
|
|
|
struct nfs_closeres res;
|
2016-11-16 02:56:07 +07:00
|
|
|
struct {
|
|
|
|
struct nfs4_layoutreturn_args arg;
|
|
|
|
struct nfs4_layoutreturn_res res;
|
2016-09-23 22:38:08 +07:00
|
|
|
struct nfs4_xdr_opaque_data ld_private;
|
2016-11-16 02:56:07 +07:00
|
|
|
u32 roc_barrier;
|
|
|
|
bool roc;
|
|
|
|
} lr;
|
2005-10-28 09:12:41 +07:00
|
|
|
struct nfs_fattr fattr;
|
2006-01-03 15:55:21 +07:00
|
|
|
unsigned long timestamp;
|
2005-04-17 05:20:36 +07:00
|
|
|
};
|
|
|
|
|
2006-01-03 15:55:04 +07:00
|
|
|
static void nfs4_free_closedata(void *data)
|
2005-10-19 04:20:12 +07:00
|
|
|
{
|
2006-01-03 15:55:04 +07:00
|
|
|
struct nfs4_closedata *calldata = data;
|
|
|
|
struct nfs4_state_owner *sp = calldata->state->owner;
|
2011-06-23 05:20:23 +07:00
|
|
|
struct super_block *sb = calldata->state->inode->i_sb;
|
2005-10-19 04:20:12 +07:00
|
|
|
|
2016-11-16 02:56:07 +07:00
|
|
|
if (calldata->lr.roc)
|
2016-11-16 13:11:25 +07:00
|
|
|
pnfs_roc_release(&calldata->lr.arg, &calldata->lr.res,
|
|
|
|
calldata->res.lr_ret);
|
2005-10-19 04:20:12 +07:00
|
|
|
nfs4_put_open_state(calldata->state);
|
|
|
|
nfs_free_seqid(calldata->arg.seqid);
|
|
|
|
nfs4_put_state_owner(sp);
|
2013-01-12 04:39:51 +07:00
|
|
|
nfs_sb_deactive(sb);
|
2005-10-19 04:20:12 +07:00
|
|
|
kfree(calldata);
|
|
|
|
}
|
|
|
|
|
2006-01-03 15:55:04 +07:00
|
|
|
static void nfs4_close_done(struct rpc_task *task, void *data)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
2006-01-03 15:55:04 +07:00
|
|
|
struct nfs4_closedata *calldata = data;
|
2005-04-17 05:20:36 +07:00
|
|
|
struct nfs4_state *state = calldata->state;
|
|
|
|
struct nfs_server *server = NFS_SERVER(calldata->inode);
|
2014-08-26 09:09:08 +07:00
|
|
|
nfs4_stateid *res_stateid = NULL;
|
2017-11-07 22:51:37 +07:00
|
|
|
struct nfs4_exception exception = {
|
|
|
|
.state = state,
|
|
|
|
.inode = calldata->inode,
|
|
|
|
.stateid = &calldata->arg.stateid,
|
|
|
|
};
|
2005-04-17 05:20:36 +07:00
|
|
|
|
2012-03-02 05:00:40 +07:00
|
|
|
dprintk("%s: begin!\n", __func__);
|
2010-08-01 01:29:06 +07:00
|
|
|
if (!nfs4_sequence_done(task, &calldata->res.seq_res))
|
|
|
|
return;
|
2013-08-13 03:19:27 +07:00
|
|
|
trace_nfs4_close(state, &calldata->arg, &calldata->res, task->tk_status);
|
2016-11-16 02:56:07 +07:00
|
|
|
|
|
|
|
/* Handle Layoutreturn errors */
|
|
|
|
if (calldata->arg.lr_args && task->tk_status != 0) {
|
|
|
|
switch (calldata->res.lr_ret) {
|
|
|
|
default:
|
|
|
|
calldata->res.lr_ret = -NFS4ERR_NOMATCHING_LAYOUT;
|
|
|
|
break;
|
|
|
|
case 0:
|
|
|
|
calldata->arg.lr_args = NULL;
|
|
|
|
calldata->res.lr_res = NULL;
|
|
|
|
break;
|
2017-11-07 03:28:07 +07:00
|
|
|
case -NFS4ERR_OLD_STATEID:
|
|
|
|
if (nfs4_refresh_layout_stateid(&calldata->arg.lr_args->stateid,
|
2017-11-07 03:28:09 +07:00
|
|
|
calldata->inode))
|
|
|
|
goto lr_restart;
|
2017-11-07 03:28:07 +07:00
|
|
|
/* Fallthrough */
|
2016-11-16 02:56:07 +07:00
|
|
|
case -NFS4ERR_ADMIN_REVOKED:
|
|
|
|
case -NFS4ERR_DELEG_REVOKED:
|
|
|
|
case -NFS4ERR_EXPIRED:
|
|
|
|
case -NFS4ERR_BAD_STATEID:
|
|
|
|
case -NFS4ERR_UNKNOWN_LAYOUTTYPE:
|
|
|
|
case -NFS4ERR_WRONG_CRED:
|
|
|
|
calldata->arg.lr_args = NULL;
|
|
|
|
calldata->res.lr_res = NULL;
|
2017-11-07 03:28:09 +07:00
|
|
|
goto lr_restart;
|
2016-11-16 02:56:07 +07:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-01-12 03:04:25 +07:00
|
|
|
/* hmm. we are done with the inode, and in the process of freeing
|
2005-04-17 05:20:36 +07:00
|
|
|
* the state_owner. we keep this around to process errors
|
|
|
|
*/
|
|
|
|
switch (task->tk_status) {
|
|
|
|
case 0:
|
2014-08-26 09:09:08 +07:00
|
|
|
res_stateid = &calldata->res.stateid;
|
2006-01-03 15:55:21 +07:00
|
|
|
renew_lease(server, calldata->timestamp);
|
2014-08-26 09:09:08 +07:00
|
|
|
break;
|
2016-12-19 22:34:14 +07:00
|
|
|
case -NFS4ERR_ACCESS:
|
|
|
|
if (calldata->arg.bitmask != NULL) {
|
|
|
|
calldata->arg.bitmask = NULL;
|
|
|
|
calldata->res.fattr = NULL;
|
2017-11-07 03:28:09 +07:00
|
|
|
goto out_restart;
|
2016-12-19 22:34:14 +07:00
|
|
|
|
|
|
|
}
|
|
|
|
break;
|
2017-11-07 03:28:05 +07:00
|
|
|
case -NFS4ERR_OLD_STATEID:
|
|
|
|
/* Did we race with OPEN? */
|
|
|
|
if (nfs4_refresh_open_stateid(&calldata->arg.stateid,
|
2017-11-07 03:28:09 +07:00
|
|
|
state))
|
|
|
|
goto out_restart;
|
2017-11-07 03:28:05 +07:00
|
|
|
goto out_release;
|
2013-11-21 00:57:19 +07:00
|
|
|
case -NFS4ERR_ADMIN_REVOKED:
|
2005-04-17 05:20:36 +07:00
|
|
|
case -NFS4ERR_STALE_STATEID:
|
2016-09-23 00:39:05 +07:00
|
|
|
case -NFS4ERR_EXPIRED:
|
|
|
|
nfs4_free_revoked_stateid(server,
|
|
|
|
&calldata->arg.stateid,
|
|
|
|
task->tk_msg.rpc_cred);
|
2017-11-07 03:28:05 +07:00
|
|
|
/* Fallthrough */
|
2008-12-24 03:21:46 +07:00
|
|
|
case -NFS4ERR_BAD_STATEID:
|
2017-11-07 03:28:06 +07:00
|
|
|
break;
|
2005-04-17 05:20:36 +07:00
|
|
|
default:
|
2017-11-07 22:51:37 +07:00
|
|
|
task->tk_status = nfs4_async_handle_exception(task,
|
|
|
|
server, task->tk_status, &exception);
|
|
|
|
if (exception.retry)
|
2017-11-07 03:28:09 +07:00
|
|
|
goto out_restart;
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
2015-08-31 08:37:59 +07:00
|
|
|
nfs_clear_open_stateid(state, &calldata->arg.stateid,
|
|
|
|
res_stateid, calldata->arg.fmode);
|
2013-11-21 00:57:19 +07:00
|
|
|
out_release:
|
2017-11-07 03:28:09 +07:00
|
|
|
task->tk_status = 0;
|
2009-12-16 02:47:36 +07:00
|
|
|
nfs_release_seqid(calldata->arg.seqid);
|
2016-12-20 00:14:44 +07:00
|
|
|
nfs_refresh_inode(calldata->inode, &calldata->fattr);
|
2012-03-02 05:00:40 +07:00
|
|
|
dprintk("%s: done, ret = %d!\n", __func__, task->tk_status);
|
2017-11-07 03:28:09 +07:00
|
|
|
return;
|
|
|
|
lr_restart:
|
|
|
|
calldata->res.lr_ret = 0;
|
|
|
|
out_restart:
|
|
|
|
task->tk_status = 0;
|
|
|
|
rpc_restart_call_prepare(task);
|
|
|
|
goto out_release;
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
2006-01-03 15:55:05 +07:00
|
|
|
static void nfs4_close_prepare(struct rpc_task *task, void *data)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
2006-01-03 15:55:05 +07:00
|
|
|
struct nfs4_closedata *calldata = data;
|
2005-10-19 04:20:12 +07:00
|
|
|
struct nfs4_state *state = calldata->state;
|
2012-09-21 07:15:57 +07:00
|
|
|
struct inode *inode = calldata->inode;
|
2014-08-26 09:33:12 +07:00
|
|
|
bool is_rdonly, is_wronly, is_rdwr;
|
2009-12-08 20:33:16 +07:00
|
|
|
int call_close = 0;
|
2005-10-19 04:20:12 +07:00
|
|
|
|
2012-03-02 05:00:40 +07:00
|
|
|
dprintk("%s: begin!\n", __func__);
|
2006-01-03 15:55:04 +07:00
|
|
|
if (nfs_wait_on_sequence(calldata->arg.seqid, task) != 0)
|
2013-02-12 07:01:21 +07:00
|
|
|
goto out_wait;
|
2007-07-06 05:07:55 +07:00
|
|
|
|
2009-12-08 20:33:16 +07:00
|
|
|
task->tk_msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_OPEN_DOWNGRADE];
|
2005-11-05 03:32:58 +07:00
|
|
|
spin_lock(&state->owner->so_lock);
|
2014-08-26 09:33:12 +07:00
|
|
|
is_rdwr = test_bit(NFS_O_RDWR_STATE, &state->flags);
|
|
|
|
is_rdonly = test_bit(NFS_O_RDONLY_STATE, &state->flags);
|
|
|
|
is_wronly = test_bit(NFS_O_WRONLY_STATE, &state->flags);
|
2007-07-06 05:07:55 +07:00
|
|
|
/* Calculate the change in open mode */
|
2014-09-18 22:51:32 +07:00
|
|
|
calldata->arg.fmode = 0;
|
2006-01-03 15:55:13 +07:00
|
|
|
if (state->n_rdwr == 0) {
|
2014-09-18 22:51:32 +07:00
|
|
|
if (state->n_rdonly == 0)
|
|
|
|
call_close |= is_rdonly;
|
|
|
|
else if (is_rdonly)
|
|
|
|
calldata->arg.fmode |= FMODE_READ;
|
|
|
|
if (state->n_wronly == 0)
|
|
|
|
call_close |= is_wronly;
|
|
|
|
else if (is_wronly)
|
|
|
|
calldata->arg.fmode |= FMODE_WRITE;
|
2016-06-26 06:19:28 +07:00
|
|
|
if (calldata->arg.fmode != (FMODE_READ|FMODE_WRITE))
|
|
|
|
call_close |= is_rdwr;
|
2014-09-18 22:51:32 +07:00
|
|
|
} else if (is_rdwr)
|
|
|
|
calldata->arg.fmode |= FMODE_READ|FMODE_WRITE;
|
|
|
|
|
2016-11-14 23:19:56 +07:00
|
|
|
if (!nfs4_valid_open_stateid(state) ||
|
2017-11-07 03:28:06 +07:00
|
|
|
!nfs4_refresh_open_stateid(&calldata->arg.stateid, state))
|
2013-03-15 03:57:48 +07:00
|
|
|
call_close = 0;
|
2005-11-05 03:32:58 +07:00
|
|
|
spin_unlock(&state->owner->so_lock);
|
2009-12-08 20:33:16 +07:00
|
|
|
|
|
|
|
if (!call_close) {
|
2006-01-03 15:55:04 +07:00
|
|
|
/* Note: exit _without_ calling nfs4_close_done */
|
2013-02-12 07:01:21 +07:00
|
|
|
goto out_no_action;
|
2005-10-19 04:20:12 +07:00
|
|
|
}
|
2009-12-08 20:33:16 +07:00
|
|
|
|
2016-11-16 13:11:25 +07:00
|
|
|
if (!calldata->lr.roc && nfs4_wait_on_layoutreturn(inode, task)) {
|
2015-09-22 10:35:22 +07:00
|
|
|
nfs_release_seqid(calldata->arg.seqid);
|
|
|
|
goto out_wait;
|
|
|
|
}
|
|
|
|
|
2016-12-19 23:36:41 +07:00
|
|
|
if (calldata->arg.fmode == 0)
|
2009-12-08 20:33:16 +07:00
|
|
|
task->tk_msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_CLOSE];
|
2016-10-28 05:25:04 +07:00
|
|
|
|
2016-12-19 23:36:41 +07:00
|
|
|
if (calldata->arg.fmode == 0 || calldata->arg.fmode == FMODE_READ) {
|
2016-10-28 05:25:04 +07:00
|
|
|
/* Close-to-open cache consistency revalidation */
|
|
|
|
if (!nfs4_have_delegation(inode, FMODE_READ))
|
|
|
|
calldata->arg.bitmask = NFS_SERVER(inode)->cache_consistency_bitmask;
|
|
|
|
else
|
|
|
|
calldata->arg.bitmask = NULL;
|
|
|
|
}
|
2015-08-19 11:45:13 +07:00
|
|
|
|
2015-01-31 02:21:14 +07:00
|
|
|
calldata->arg.share_access =
|
|
|
|
nfs4_map_atomic_open_share(NFS_SERVER(inode),
|
|
|
|
calldata->arg.fmode, 0);
|
2009-12-08 20:33:16 +07:00
|
|
|
|
2016-12-20 00:14:44 +07:00
|
|
|
if (calldata->res.fattr == NULL)
|
|
|
|
calldata->arg.bitmask = NULL;
|
|
|
|
else if (calldata->arg.bitmask == NULL)
|
|
|
|
calldata->res.fattr = NULL;
|
2006-01-03 15:55:21 +07:00
|
|
|
calldata->timestamp = jiffies;
|
2017-01-10 03:48:22 +07:00
|
|
|
if (nfs4_setup_sequence(NFS_SERVER(inode)->nfs_client,
|
2012-01-18 10:04:25 +07:00
|
|
|
&calldata->arg.seq_args,
|
|
|
|
&calldata->res.seq_res,
|
2012-10-30 05:37:40 +07:00
|
|
|
task) != 0)
|
|
|
|
nfs_release_seqid(calldata->arg.seqid);
|
2012-03-02 05:00:40 +07:00
|
|
|
dprintk("%s: done!\n", __func__);
|
2013-02-12 07:01:21 +07:00
|
|
|
return;
|
|
|
|
out_no_action:
|
|
|
|
task->tk_action = NULL;
|
|
|
|
out_wait:
|
|
|
|
nfs4_sequence_done(task, &calldata->res.seq_res);
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
2006-01-03 15:55:04 +07:00
|
|
|
static const struct rpc_call_ops nfs4_close_ops = {
|
2006-01-03 15:55:05 +07:00
|
|
|
.rpc_call_prepare = nfs4_close_prepare,
|
2006-01-03 15:55:04 +07:00
|
|
|
.rpc_call_done = nfs4_close_done,
|
|
|
|
.rpc_release = nfs4_free_closedata,
|
|
|
|
};
|
|
|
|
|
2005-04-17 05:20:36 +07:00
|
|
|
/*
|
|
|
|
* It is possible for data to be read/written from a mem-mapped file
|
|
|
|
* after the sys_close call (which hits the vfs layer as a flush).
|
|
|
|
* This means that we can't safely call nfsv4 close on a file until
|
|
|
|
* the inode is cleared. This in turn means that we are not good
|
|
|
|
* NFSv4 citizens - we do not indicate to the server to update the file's
|
|
|
|
* share state even when we are done with one of the three share
|
|
|
|
* stateid's in the inode.
|
|
|
|
*
|
|
|
|
* NOTE: Caller must be holding the sp->so_owner semaphore!
|
|
|
|
*/
|
2012-09-21 07:31:51 +07:00
|
|
|
int nfs4_do_close(struct nfs4_state *state, gfp_t gfp_mask, int wait)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
2007-06-05 21:31:33 +07:00
|
|
|
struct nfs_server *server = NFS_SERVER(state->inode);
|
2015-01-24 07:19:25 +07:00
|
|
|
struct nfs_seqid *(*alloc_seqid)(struct nfs_seqid_counter *, gfp_t);
|
2005-04-17 05:20:36 +07:00
|
|
|
struct nfs4_closedata *calldata;
|
2007-06-12 10:05:07 +07:00
|
|
|
struct nfs4_state_owner *sp = state->owner;
|
|
|
|
struct rpc_task *task;
|
2007-07-15 02:40:01 +07:00
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_CLOSE],
|
|
|
|
.rpc_cred = state->owner->so_cred,
|
|
|
|
};
|
2007-07-15 02:39:59 +07:00
|
|
|
struct rpc_task_setup task_setup_data = {
|
|
|
|
.rpc_client = server->client,
|
2007-07-15 02:40:01 +07:00
|
|
|
.rpc_message = &msg,
|
2007-07-15 02:39:59 +07:00
|
|
|
.callback_ops = &nfs4_close_ops,
|
2008-02-20 08:04:23 +07:00
|
|
|
.workqueue = nfsiod_workqueue,
|
2007-07-15 02:39:59 +07:00
|
|
|
.flags = RPC_TASK_ASYNC,
|
|
|
|
};
|
2005-10-19 04:20:12 +07:00
|
|
|
int status = -ENOMEM;
|
2005-04-17 05:20:36 +07:00
|
|
|
|
2013-08-14 03:37:34 +07:00
|
|
|
nfs4_state_protect(server->nfs_client, NFS_SP4_MACH_CRED_CLEANUP,
|
|
|
|
&task_setup_data.rpc_client, &msg);
|
|
|
|
|
2010-05-13 23:51:01 +07:00
|
|
|
calldata = kzalloc(sizeof(*calldata), gfp_mask);
|
2005-04-17 05:20:36 +07:00
|
|
|
if (calldata == NULL)
|
2005-10-19 04:20:12 +07:00
|
|
|
goto out;
|
2018-05-05 03:22:50 +07:00
|
|
|
nfs4_init_sequence(&calldata->arg.seq_args, &calldata->res.seq_res, 1, 0);
|
2007-06-05 21:31:33 +07:00
|
|
|
calldata->inode = state->inode;
|
2005-04-17 05:20:36 +07:00
|
|
|
calldata->state = state;
|
2007-06-05 21:31:33 +07:00
|
|
|
calldata->arg.fh = NFS_FH(state->inode);
|
2017-11-07 03:28:06 +07:00
|
|
|
if (!nfs4_copy_open_stateid(&calldata->arg.stateid, state))
|
|
|
|
goto out_free_calldata;
|
2005-04-17 05:20:36 +07:00
|
|
|
/* Serialization for the sequence id */
|
2015-01-24 07:19:25 +07:00
|
|
|
alloc_seqid = server->nfs_client->cl_mvops->alloc_seqid;
|
|
|
|
calldata->arg.seqid = alloc_seqid(&state->owner->so_seqid, gfp_mask);
|
2015-01-24 06:48:00 +07:00
|
|
|
if (IS_ERR(calldata->arg.seqid))
|
2005-10-19 04:20:12 +07:00
|
|
|
goto out_free_calldata;
|
2016-12-20 00:14:44 +07:00
|
|
|
nfs_fattr_init(&calldata->fattr);
|
2008-12-24 03:21:56 +07:00
|
|
|
calldata->arg.fmode = 0;
|
2016-09-23 22:38:08 +07:00
|
|
|
calldata->lr.arg.ld_private = &calldata->lr.ld_private;
|
2005-10-28 09:12:41 +07:00
|
|
|
calldata->res.fattr = &calldata->fattr;
|
2008-04-08 00:20:54 +07:00
|
|
|
calldata->res.seqid = calldata->arg.seqid;
|
2005-10-28 09:12:41 +07:00
|
|
|
calldata->res.server = server;
|
2016-11-16 02:56:07 +07:00
|
|
|
calldata->res.lr_ret = -NFS4ERR_NOMATCHING_LAYOUT;
|
2016-11-16 13:11:25 +07:00
|
|
|
calldata->lr.roc = pnfs_roc(state->inode,
|
|
|
|
&calldata->lr.arg, &calldata->lr.res, msg.rpc_cred);
|
|
|
|
if (calldata->lr.roc) {
|
|
|
|
calldata->arg.lr_args = &calldata->lr.arg;
|
|
|
|
calldata->res.lr_res = &calldata->lr.res;
|
|
|
|
}
|
2011-06-23 05:20:23 +07:00
|
|
|
nfs_sb_active(calldata->inode->i_sb);
|
2005-10-19 04:20:12 +07:00
|
|
|
|
2010-12-21 22:52:24 +07:00
|
|
|
msg.rpc_argp = &calldata->arg;
|
|
|
|
msg.rpc_resp = &calldata->res;
|
2007-07-15 02:39:59 +07:00
|
|
|
task_setup_data.callback_data = calldata;
|
|
|
|
task = rpc_run_task(&task_setup_data);
|
2007-06-12 10:05:07 +07:00
|
|
|
if (IS_ERR(task))
|
|
|
|
return PTR_ERR(task);
|
2007-10-19 05:03:27 +07:00
|
|
|
status = 0;
|
|
|
|
if (wait)
|
|
|
|
status = rpc_wait_for_completion_task(task);
|
2007-06-12 10:05:07 +07:00
|
|
|
rpc_put_task(task);
|
2007-10-19 05:03:27 +07:00
|
|
|
return status;
|
2005-10-19 04:20:12 +07:00
|
|
|
out_free_calldata:
|
|
|
|
kfree(calldata);
|
|
|
|
out:
|
2007-06-12 10:05:07 +07:00
|
|
|
nfs4_put_open_state(state);
|
|
|
|
nfs4_put_state_owner(sp);
|
2005-10-19 04:20:12 +07:00
|
|
|
return status;
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
2010-09-17 21:56:51 +07:00
|
|
|
static struct inode *
|
2013-09-24 05:01:28 +07:00
|
|
|
nfs4_atomic_open(struct inode *dir, struct nfs_open_context *ctx,
|
|
|
|
int open_flags, struct iattr *attr, int *opened)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
|
|
|
struct nfs4_state *state;
|
2013-05-22 23:50:44 +07:00
|
|
|
struct nfs4_label l = {0, 0, 0, NULL}, *label = NULL;
|
|
|
|
|
|
|
|
label = nfs4_label_init_security(dir, ctx->dentry, attr, &l);
|
2005-04-17 05:20:36 +07:00
|
|
|
|
2007-10-16 05:17:53 +07:00
|
|
|
/* Protect against concurrent sillydeletes */
|
2013-09-24 05:01:28 +07:00
|
|
|
state = nfs4_do_open(dir, ctx, open_flags, attr, label, opened);
|
2013-05-22 23:50:44 +07:00
|
|
|
|
|
|
|
nfs4_label_release_security(label);
|
|
|
|
|
2010-09-17 21:56:50 +07:00
|
|
|
if (IS_ERR(state))
|
|
|
|
return ERR_CAST(state);
|
2013-05-30 00:11:28 +07:00
|
|
|
return state->inode;
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
2009-12-04 03:54:02 +07:00
|
|
|
static void nfs4_close_context(struct nfs_open_context *ctx, int is_sync)
|
2009-03-20 02:35:50 +07:00
|
|
|
{
|
|
|
|
if (ctx->state == NULL)
|
|
|
|
return;
|
|
|
|
if (is_sync)
|
2011-06-23 05:20:23 +07:00
|
|
|
nfs4_close_sync(ctx->state, ctx->mode);
|
2009-03-20 02:35:50 +07:00
|
|
|
else
|
2011-06-23 05:20:23 +07:00
|
|
|
nfs4_close_state(ctx->state, ctx->mode);
|
2009-03-20 02:35:50 +07:00
|
|
|
}
|
2005-04-17 05:20:36 +07:00
|
|
|
|
2013-11-05 03:20:20 +07:00
|
|
|
/*
 * Per-minor-version masks applied to the attribute bitmap words returned by
 * the server (see _nfs4_server_capabilities()).  Each is 2 * FLAG - 1, which
 * covers FLAG and every lower bit provided FLAG is a single bit -- presumably
 * the highest attribute defined for that minor version; TODO confirm against
 * the FATTR4_* definitions.
 */
#define FATTR4_WORD1_NFS40_MASK (2*FATTR4_WORD1_MOUNTED_ON_FILEID - 1UL)
#define FATTR4_WORD2_NFS41_MASK (2*FATTR4_WORD2_SUPPATTR_EXCLCREAT - 1UL)
#define FATTR4_WORD2_NFS42_MASK (2*FATTR4_WORD2_MODE_UMASK - 1UL)
|
2013-11-05 03:20:20 +07:00
|
|
|
|
2005-04-17 05:20:36 +07:00
|
|
|
static int _nfs4_server_capabilities(struct nfs_server *server, struct nfs_fh *fhandle)
|
|
|
|
{
|
2015-08-26 20:12:58 +07:00
|
|
|
u32 bitmask[3] = {}, minorversion = server->nfs_client->cl_minorversion;
|
2009-04-01 20:21:54 +07:00
|
|
|
struct nfs4_server_caps_arg args = {
|
|
|
|
.fhandle = fhandle,
|
2015-08-26 20:12:58 +07:00
|
|
|
.bitmask = bitmask,
|
2009-04-01 20:21:54 +07:00
|
|
|
};
|
2005-04-17 05:20:36 +07:00
|
|
|
struct nfs4_server_caps_res res = {};
|
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SERVER_CAPS],
|
2009-04-01 20:21:54 +07:00
|
|
|
.rpc_argp = &args,
|
2005-04-17 05:20:36 +07:00
|
|
|
.rpc_resp = &res,
|
|
|
|
};
|
|
|
|
int status;
|
2017-05-10 02:47:15 +07:00
|
|
|
int i;
|
2005-04-17 05:20:36 +07:00
|
|
|
|
2015-08-26 20:12:58 +07:00
|
|
|
bitmask[0] = FATTR4_WORD0_SUPPORTED_ATTRS |
|
|
|
|
FATTR4_WORD0_FH_EXPIRE_TYPE |
|
|
|
|
FATTR4_WORD0_LINK_SUPPORT |
|
|
|
|
FATTR4_WORD0_SYMLINK_SUPPORT |
|
|
|
|
FATTR4_WORD0_ACLSUPPORT;
|
|
|
|
if (minorversion)
|
|
|
|
bitmask[2] = FATTR4_WORD2_SUPPATTR_EXCLCREAT;
|
|
|
|
|
2011-03-25 00:12:24 +07:00
|
|
|
status = nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
|
2005-04-17 05:20:36 +07:00
|
|
|
if (status == 0) {
|
2013-11-05 03:20:20 +07:00
|
|
|
/* Sanity check the server answers */
|
2015-08-26 20:12:58 +07:00
|
|
|
switch (minorversion) {
|
2013-11-05 03:20:20 +07:00
|
|
|
case 0:
|
|
|
|
res.attr_bitmask[1] &= FATTR4_WORD1_NFS40_MASK;
|
|
|
|
res.attr_bitmask[2] = 0;
|
|
|
|
break;
|
|
|
|
case 1:
|
|
|
|
res.attr_bitmask[2] &= FATTR4_WORD2_NFS41_MASK;
|
|
|
|
break;
|
|
|
|
case 2:
|
|
|
|
res.attr_bitmask[2] &= FATTR4_WORD2_NFS42_MASK;
|
|
|
|
}
|
2005-04-17 05:20:36 +07:00
|
|
|
memcpy(server->attr_bitmask, res.attr_bitmask, sizeof(server->attr_bitmask));
|
2009-08-10 02:06:19 +07:00
|
|
|
server->caps &= ~(NFS_CAP_ACLS|NFS_CAP_HARDLINKS|
|
|
|
|
NFS_CAP_SYMLINKS|NFS_CAP_FILEID|
|
|
|
|
NFS_CAP_MODE|NFS_CAP_NLINK|NFS_CAP_OWNER|
|
|
|
|
NFS_CAP_OWNER_GROUP|NFS_CAP_ATIME|
|
2013-11-05 03:20:20 +07:00
|
|
|
NFS_CAP_CTIME|NFS_CAP_MTIME|
|
|
|
|
NFS_CAP_SECURITY_LABEL);
|
2014-01-23 21:54:55 +07:00
|
|
|
if (res.attr_bitmask[0] & FATTR4_WORD0_ACL &&
|
|
|
|
res.acl_bitmask & ACL4_SUPPORT_ALLOW_ACL)
|
2005-04-17 05:20:36 +07:00
|
|
|
server->caps |= NFS_CAP_ACLS;
|
|
|
|
if (res.has_links != 0)
|
|
|
|
server->caps |= NFS_CAP_HARDLINKS;
|
|
|
|
if (res.has_symlinks != 0)
|
|
|
|
server->caps |= NFS_CAP_SYMLINKS;
|
2009-08-10 02:06:19 +07:00
|
|
|
if (res.attr_bitmask[0] & FATTR4_WORD0_FILEID)
|
|
|
|
server->caps |= NFS_CAP_FILEID;
|
|
|
|
if (res.attr_bitmask[1] & FATTR4_WORD1_MODE)
|
|
|
|
server->caps |= NFS_CAP_MODE;
|
|
|
|
if (res.attr_bitmask[1] & FATTR4_WORD1_NUMLINKS)
|
|
|
|
server->caps |= NFS_CAP_NLINK;
|
|
|
|
if (res.attr_bitmask[1] & FATTR4_WORD1_OWNER)
|
|
|
|
server->caps |= NFS_CAP_OWNER;
|
|
|
|
if (res.attr_bitmask[1] & FATTR4_WORD1_OWNER_GROUP)
|
|
|
|
server->caps |= NFS_CAP_OWNER_GROUP;
|
|
|
|
if (res.attr_bitmask[1] & FATTR4_WORD1_TIME_ACCESS)
|
|
|
|
server->caps |= NFS_CAP_ATIME;
|
|
|
|
if (res.attr_bitmask[1] & FATTR4_WORD1_TIME_METADATA)
|
|
|
|
server->caps |= NFS_CAP_CTIME;
|
|
|
|
if (res.attr_bitmask[1] & FATTR4_WORD1_TIME_MODIFY)
|
|
|
|
server->caps |= NFS_CAP_MTIME;
|
2013-05-22 23:50:44 +07:00
|
|
|
#ifdef CONFIG_NFS_V4_SECURITY_LABEL
|
|
|
|
if (res.attr_bitmask[2] & FATTR4_WORD2_SECURITY_LABEL)
|
|
|
|
server->caps |= NFS_CAP_SECURITY_LABEL;
|
|
|
|
#endif
|
|
|
|
memcpy(server->attr_bitmask_nl, res.attr_bitmask,
|
|
|
|
sizeof(server->attr_bitmask));
|
2013-11-05 03:20:20 +07:00
|
|
|
server->attr_bitmask_nl[2] &= ~FATTR4_WORD2_SECURITY_LABEL;
|
2009-08-10 02:06:19 +07:00
|
|
|
|
2009-03-12 01:10:28 +07:00
|
|
|
memcpy(server->cache_consistency_bitmask, res.attr_bitmask, sizeof(server->cache_consistency_bitmask));
|
|
|
|
server->cache_consistency_bitmask[0] &= FATTR4_WORD0_CHANGE|FATTR4_WORD0_SIZE;
|
|
|
|
server->cache_consistency_bitmask[1] &= FATTR4_WORD1_TIME_METADATA|FATTR4_WORD1_TIME_MODIFY;
|
2013-11-05 03:20:20 +07:00
|
|
|
server->cache_consistency_bitmask[2] = 0;
|
2017-05-10 02:47:15 +07:00
|
|
|
|
|
|
|
/* Avoid a regression due to buggy server */
|
|
|
|
for (i = 0; i < ARRAY_SIZE(res.exclcreat_bitmask); i++)
|
|
|
|
res.exclcreat_bitmask[i] &= res.attr_bitmask[i];
|
2015-08-26 20:12:58 +07:00
|
|
|
memcpy(server->exclcreat_bitmask, res.exclcreat_bitmask,
|
|
|
|
sizeof(server->exclcreat_bitmask));
|
2017-05-10 02:47:15 +07:00
|
|
|
|
2005-04-17 05:20:36 +07:00
|
|
|
server->acl_bitmask = res.acl_bitmask;
|
2012-03-02 05:02:05 +07:00
|
|
|
server->fh_expire_type = res.fh_expire_type;
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
2009-04-01 20:22:03 +07:00
|
|
|
|
2005-04-17 05:20:36 +07:00
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
2006-06-09 20:34:19 +07:00
|
|
|
int nfs4_server_capabilities(struct nfs_server *server, struct nfs_fh *fhandle)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
|
|
|
struct nfs4_exception exception = { };
|
|
|
|
int err;
|
|
|
|
do {
|
|
|
|
err = nfs4_handle_exception(server,
|
|
|
|
_nfs4_server_capabilities(server, fhandle),
|
|
|
|
&exception);
|
|
|
|
} while (exception.retry);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int _nfs4_lookup_root(struct nfs_server *server, struct nfs_fh *fhandle,
|
|
|
|
struct nfs_fsinfo *info)
|
|
|
|
{
|
2013-05-22 23:50:44 +07:00
|
|
|
u32 bitmask[3];
|
2005-04-17 05:20:36 +07:00
|
|
|
struct nfs4_lookup_root_arg args = {
|
2013-05-22 23:50:44 +07:00
|
|
|
.bitmask = bitmask,
|
2005-04-17 05:20:36 +07:00
|
|
|
};
|
|
|
|
struct nfs4_lookup_res res = {
|
|
|
|
.server = server,
|
2005-10-28 09:12:38 +07:00
|
|
|
.fattr = info->fattr,
|
2005-04-17 05:20:36 +07:00
|
|
|
.fh = fhandle,
|
|
|
|
};
|
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LOOKUP_ROOT],
|
|
|
|
.rpc_argp = &args,
|
|
|
|
.rpc_resp = &res,
|
|
|
|
};
|
2009-04-01 20:22:50 +07:00
|
|
|
|
2013-05-22 23:50:44 +07:00
|
|
|
bitmask[0] = nfs4_fattr_bitmap[0];
|
|
|
|
bitmask[1] = nfs4_fattr_bitmap[1];
|
|
|
|
/*
|
|
|
|
* Process the label in the upcoming getfattr
|
|
|
|
*/
|
|
|
|
bitmask[2] = nfs4_fattr_bitmap[2] & ~FATTR4_WORD2_SECURITY_LABEL;
|
|
|
|
|
2005-10-28 09:12:38 +07:00
|
|
|
nfs_fattr_init(info->fattr);
|
2011-03-25 00:12:24 +07:00
|
|
|
return nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
static int nfs4_lookup_root(struct nfs_server *server, struct nfs_fh *fhandle,
|
|
|
|
struct nfs_fsinfo *info)
|
|
|
|
{
|
|
|
|
struct nfs4_exception exception = { };
|
|
|
|
int err;
|
|
|
|
do {
|
2011-04-19 03:52:25 +07:00
|
|
|
err = _nfs4_lookup_root(server, fhandle, info);
|
2013-08-14 00:01:39 +07:00
|
|
|
trace_nfs4_lookup_root(server, fhandle, info->fattr, err);
|
2011-04-19 03:52:25 +07:00
|
|
|
switch (err) {
|
|
|
|
case 0:
|
|
|
|
case -NFS4ERR_WRONGSEC:
|
2012-03-28 05:13:02 +07:00
|
|
|
goto out;
|
2011-04-19 03:52:25 +07:00
|
|
|
default:
|
|
|
|
err = nfs4_handle_exception(server, err, &exception);
|
|
|
|
}
|
2005-04-17 05:20:36 +07:00
|
|
|
} while (exception.retry);
|
2012-03-28 05:13:02 +07:00
|
|
|
out:
|
2005-04-17 05:20:36 +07:00
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
2011-03-25 00:12:31 +07:00
|
|
|
/*
 * Create an RPC auth handle for @flavor on server->client, then perform the
 * root lookup.
 *
 * Returns -EACCES if rpcauth_create() fails, otherwise the result of
 * nfs4_lookup_root().
 */
static int nfs4_lookup_root_sec(struct nfs_server *server, struct nfs_fh *fhandle,
				struct nfs_fsinfo *info, rpc_authflavor_t flavor)
{
	struct rpc_auth_create_args create_args = {
		.pseudoflavor = flavor,
	};

	if (IS_ERR(rpcauth_create(&create_args, server->client)))
		return -EACCES;

	return nfs4_lookup_root(server, fhandle, info);
}
|
|
|
|
|
NFS: Use static list of security flavors during root FH lookup recovery
If the Linux NFS client receives an NFS4ERR_WRONGSEC error while
trying to look up an NFS server's root file handle, it retries the
lookup operation with various security flavors to see what flavor
the NFS server will accept for pseudo-fs access.
The list of flavors the client uses during retry consists only of
flavors that are currently registered in the kernel RPC client.
This list may not include any GSS pseudoflavors if auth_rpcgss.ko
has not yet been loaded.
Let's instead use a static list of security flavors that the NFS
standard requires the server to implement (RFC 3530bis, section
3.2.1). The RPC client should now be able to load support for
these dynamically; if not, they are skipped.
Recovery behavior here is prescribed by RFC 3530bis, section
15.33.5:
> For LOOKUPP, PUTROOTFH and PUTPUBFH, the client will be unable to
> use the SECINFO operation since SECINFO requires a current
> filehandle and none exist for these two [sic] operations. Therefore,
> the client must iterate through the security triples available at
> the client and reattempt the PUTROOTFH or PUTPUBFH operation. In
> the unfortunate event none of the MANDATORY security triples are
> supported by the client and server, the client SHOULD try using
> others that support integrity. Failing that, the client can try
> using AUTH_NONE, but because such forms lack integrity checks,
> this puts the client at risk.
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
Cc: Bryan Schumaker <bjschuma@netapp.com>
Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
2013-03-17 02:56:02 +07:00
|
|
|
/*
|
|
|
|
* Retry pseudoroot lookup with various security flavors. We do this when:
|
|
|
|
*
|
|
|
|
* NFSv4.0: the PUTROOTFH operation returns NFS4ERR_WRONGSEC
|
|
|
|
* NFSv4.1: the server does not support the SECINFO_NO_NAME operation
|
|
|
|
*
|
|
|
|
* Returns zero on success, or a negative NFS4ERR value, or a
|
|
|
|
* negative errno value.
|
|
|
|
*/
|
2011-04-14 01:31:30 +07:00
|
|
|
static int nfs4_find_root_sec(struct nfs_server *server, struct nfs_fh *fhandle,
|
NFS: Share NFS superblocks per-protocol per-server per-FSID
The attached patch makes NFS share superblocks between mounts from the same
server and FSID over the same protocol.
It does this by creating each superblock with a false root and returning the
real root dentry in the vfsmount presented by get_sb(). The root dentry set
starts off as an anonymous dentry if we don't already have the dentry for its
inode, otherwise it simply returns the dentry we already have.
We may thus end up with several trees of dentries in the superblock, and if at
some later point one of anonymous tree roots is discovered by normal filesystem
activity to be located in another tree within the superblock, the anonymous
root is named and materialises attached to the second tree at the appropriate
point.
Why do it this way? Why not pass an extra argument to the mount() syscall to
indicate the subpath and then pathwalk from the server root to the desired
directory? You can't guarantee this will work for two reasons:
(1) The root and intervening nodes may not be accessible to the client.
With NFS2 and NFS3, for instance, mountd is called on the server to get
the filehandle for the tip of a path. mountd won't give us handles for
anything we don't have permission to access, and so we can't set up NFS
inodes for such nodes, and so can't easily set up dentries (we'd have to
have ghost inodes or something).
With this patch we don't actually create dentries until we get handles
from the server that we can use to set up their inodes, and we don't
actually bind them into the tree until we know for sure where they go.
(2) Inaccessible symbolic links.
If we're asked to mount two exports from the server, eg:
mount warthog:/warthog/aaa/xxx /mmm
mount warthog:/warthog/bbb/yyy /nnn
We may not be able to access anything nearer the root than xxx and yyy,
but we may find out later that /mmm/www/yyy, say, is actually the same
directory as the one mounted on /nnn. What we might then find out, for
example, is that /warthog/bbb was actually a symbolic link to
/warthog/aaa/xxx/www, but we can't actually determine that by talking to
the server until /warthog is made available by NFS.
This would lead to having constructed an errneous dentry tree which we
can't easily fix. We can end up with a dentry marked as a directory when
it should actually be a symlink, or we could end up with an apparently
hardlinked directory.
With this patch we need not make assumptions about the type of a dentry
for which we can't retrieve information, nor need we assume we know its
place in the grand scheme of things until we actually see that place.
This patch reduces the possibility of aliasing in the inode and page caches for
inodes that may be accessed by more than one NFS export. It also reduces the
number of superblocks required for NFS where there are many NFS exports being
used from a server (home directory server + autofs for example).
This in turn makes it simpler to do local caching of network filesystems, as it
can then be guaranteed that there won't be links from multiple inodes in
separate superblocks to the same cache file.
Obviously, cache aliasing between different levels of NFS protocol could still
be a problem, but at least that gives us another key to use when indexing the
cache.
This patch makes the following changes:
(1) The server record construction/destruction has been abstracted out into
its own set of functions to make things easier to get right. These have
been moved into fs/nfs/client.c.
All the code in fs/nfs/client.c has to do with the management of
connections to servers, and doesn't touch superblocks in any way; the
remaining code in fs/nfs/super.c has to do with VFS superblock management.
(2) The sequence of events undertaken by NFS mount is now reordered:
(a) A volume representation (struct nfs_server) is allocated.
(b) A server representation (struct nfs_client) is acquired. This may be
allocated or shared, and is keyed on server address, port and NFS
version.
(c) If allocated, the client representation is initialised. The state
member variable of nfs_client is used to prevent a race during
initialisation from two mounts.
(d) For NFS4 a simple pathwalk is performed, walking from FH to FH to find
the root filehandle for the mount (fs/nfs/getroot.c). For NFS2/3 we
are given the root FH in advance.
(e) The volume FSID is probed for on the root FH.
(f) The volume representation is initialised from the FSINFO record
retrieved on the root FH.
(g) sget() is called to acquire a superblock. This may be allocated or
shared, keyed on client pointer and FSID.
(h) If allocated, the superblock is initialised.
(i) If the superblock is shared, then the new nfs_server record is
discarded.
(j) The root dentry for this mount is looked up from the root FH.
(k) The root dentry for this mount is assigned to the vfsmount.
(3) nfs_readdir_lookup() creates dentries for each of the entries readdir()
returns; this function now attaches disconnected trees from alternate
roots that happen to be discovered attached to a directory being read (in
the same way nfs_lookup() is made to do for lookup ops).
The new d_materialise_unique() function is now used to do this, thus
permitting the whole thing to be done under one set of locks, and thus
avoiding any race between mount and lookup operations on the same
directory.
(4) The client management code uses a new debug facility: NFSDBG_CLIENT which
is set by echoing 1024 to /proc/net/sunrpc/nfs_debug.
(5) Clone mounts are now called xdev mounts.
(6) Use the dentry passed to the statfs() op as the handle for retrieving fs
statistics rather than the root dentry of the superblock (which is now a
dummy).
Signed-Off-By: David Howells <dhowells@redhat.com>
Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
2006-08-23 07:06:13 +07:00
|
|
|
struct nfs_fsinfo *info)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
NFS: Use static list of security flavors during root FH lookup recovery
If the Linux NFS client receives an NFS4ERR_WRONGSEC error while
trying to look up an NFS server's root file handle, it retries the
lookup operation with various security flavors to see what flavor
the NFS server will accept for pseudo-fs access.
The list of flavors the client uses during retry consists only of
flavors that are currently registered in the kernel RPC client.
This list may not include any GSS pseudoflavors if auth_rpcgss.ko
has not yet been loaded.
Let's instead use a static list of security flavors that the NFS
standard requires the server to implement (RFC 3530bis, section
3.2.1). The RPC client should now be able to load support for
these dynamically; if not, they are skipped.
Recovery behavior here is prescribed by RFC 3530bis, section
15.33.5:
> For LOOKUPP, PUTROOTFH and PUTPUBFH, the client will be unable to
> use the SECINFO operation since SECINFO requires a current
> filehandle and none exist for these two [sic] operations. Therefore,
> the client must iterate through the security triples available at
> the client and reattempt the PUTROOTFH or PUTPUBFH operation. In
> the unfortunate event none of the MANDATORY security triples are
> supported by the client and server, the client SHOULD try using
> others that support integrity. Failing that, the client can try
> using AUTH_NONE, but because such forms lack integrity checks,
> this puts the client at risk.
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
Cc: Bryan Schumaker <bjschuma@netapp.com>
Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
2013-03-17 02:56:02 +07:00
|
|
|
/* Per 3530bis 15.33.5 */
|
|
|
|
static const rpc_authflavor_t flav_array[] = {
|
|
|
|
RPC_AUTH_GSS_KRB5P,
|
|
|
|
RPC_AUTH_GSS_KRB5I,
|
|
|
|
RPC_AUTH_GSS_KRB5,
|
2013-03-17 02:56:11 +07:00
|
|
|
RPC_AUTH_UNIX, /* courtesy */
|
NFS: Use static list of security flavors during root FH lookup recovery
If the Linux NFS client receives an NFS4ERR_WRONGSEC error while
trying to look up an NFS server's root file handle, it retries the
lookup operation with various security flavors to see what flavor
the NFS server will accept for pseudo-fs access.
The list of flavors the client uses during retry consists only of
flavors that are currently registered in the kernel RPC client.
This list may not include any GSS pseudoflavors if auth_rpcgss.ko
has not yet been loaded.
Let's instead use a static list of security flavors that the NFS
standard requires the server to implement (RFC 3530bis, section
3.2.1). The RPC client should now be able to load support for
these dynamically; if not, they are skipped.
Recovery behavior here is prescribed by RFC 3530bis, section
15.33.5:
> For LOOKUPP, PUTROOTFH and PUTPUBFH, the client will be unable to
> use the SECINFO operation since SECINFO requires a current
> filehandle and none exist for these two [sic] operations. Therefore,
> the client must iterate through the security triples available at
> the client and reattempt the PUTROOTFH or PUTPUBFH operation. In
> the unfortunate event none of the MANDATORY security triples are
> supported by the client and server, the client SHOULD try using
> others that support integrity. Failing that, the client can try
> using AUTH_NONE, but because such forms lack integrity checks,
> this puts the client at risk.
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
Cc: Bryan Schumaker <bjschuma@netapp.com>
Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
2013-03-17 02:56:02 +07:00
|
|
|
RPC_AUTH_NULL,
|
|
|
|
};
|
|
|
|
int status = -EPERM;
|
|
|
|
size_t i;
|
2012-07-12 03:31:08 +07:00
|
|
|
|
2013-10-19 02:15:19 +07:00
|
|
|
if (server->auth_info.flavor_len > 0) {
|
|
|
|
/* try each flavor specified by user */
|
|
|
|
for (i = 0; i < server->auth_info.flavor_len; i++) {
|
|
|
|
status = nfs4_lookup_root_sec(server, fhandle, info,
|
|
|
|
server->auth_info.flavors[i]);
|
|
|
|
if (status == -NFS4ERR_WRONGSEC || status == -EACCES)
|
|
|
|
continue;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
/* no flavors specified by user, try default list */
|
|
|
|
for (i = 0; i < ARRAY_SIZE(flav_array); i++) {
|
|
|
|
status = nfs4_lookup_root_sec(server, fhandle, info,
|
|
|
|
flav_array[i]);
|
|
|
|
if (status == -NFS4ERR_WRONGSEC || status == -EACCES)
|
|
|
|
continue;
|
|
|
|
break;
|
|
|
|
}
|
2011-03-25 00:12:31 +07:00
|
|
|
}
|
NFS: Use static list of security flavors during root FH lookup recovery
If the Linux NFS client receives an NFS4ERR_WRONGSEC error while
trying to look up an NFS server's root file handle, it retries the
lookup operation with various security flavors to see what flavor
the NFS server will accept for pseudo-fs access.
The list of flavors the client uses during retry consists only of
flavors that are currently registered in the kernel RPC client.
This list may not include any GSS pseudoflavors if auth_rpcgss.ko
has not yet been loaded.
Let's instead use a static list of security flavors that the NFS
standard requires the server to implement (RFC 3530bis, section
3.2.1). The RPC client should now be able to load support for
these dynamically; if not, they are skipped.
Recovery behavior here is prescribed by RFC 3530bis, section
15.33.5:
> For LOOKUPP, PUTROOTFH and PUTPUBFH, the client will be unable to
> use the SECINFO operation since SECINFO requires a current
> filehandle and none exist for these two [sic] operations. Therefore,
> the client must iterate through the security triples available at
> the client and reattempt the PUTROOTFH or PUTPUBFH operation. In
> the unfortunate event none of the MANDATORY security triples are
> supported by the client and server, the client SHOULD try using
> others that support integrity. Failing that, the client can try
> using AUTH_NONE, but because such forms lack integrity checks,
> this puts the client at risk.
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
Cc: Bryan Schumaker <bjschuma@netapp.com>
Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
2013-03-17 02:56:02 +07:00
|
|
|
|
2011-04-19 03:52:25 +07:00
|
|
|
/*
|
|
|
|
* -EACCESS could mean that the user doesn't have correct permissions
|
|
|
|
* to access the mount. It could also mean that we tried to mount
|
|
|
|
* with a gss auth flavor, but rpc.gssd isn't running. Either way,
|
|
|
|
* existing mount programs don't handle -EACCES very well so it should
|
|
|
|
* be mapped to -EPERM instead.
|
|
|
|
*/
|
|
|
|
if (status == -EACCES)
|
|
|
|
status = -EPERM;
|
2011-04-14 01:31:30 +07:00
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
2013-03-17 02:55:45 +07:00
|
|
|
/**
|
|
|
|
* nfs4_proc_get_rootfh - get file handle for server's pseudoroot
|
|
|
|
* @server: initialized nfs_server handle
|
|
|
|
* @fhandle: we fill in the pseudo-fs root file handle
|
|
|
|
* @info: we fill in an FSINFO struct
|
2013-09-07 23:58:57 +07:00
|
|
|
* @auth_probe: probe the auth flavours
|
2013-03-17 02:55:45 +07:00
|
|
|
*
|
|
|
|
* Returns zero on success, or a negative errno.
|
2011-04-14 01:31:30 +07:00
|
|
|
*/
|
2012-05-11 02:07:30 +07:00
|
|
|
int nfs4_proc_get_rootfh(struct nfs_server *server, struct nfs_fh *fhandle,
|
2013-09-07 23:58:57 +07:00
|
|
|
struct nfs_fsinfo *info,
|
|
|
|
bool auth_probe)
|
2011-04-14 01:31:30 +07:00
|
|
|
{
|
2015-04-23 23:17:40 +07:00
|
|
|
int status = 0;
|
2013-03-17 02:55:45 +07:00
|
|
|
|
2015-04-23 23:17:40 +07:00
|
|
|
if (!auth_probe)
|
2013-09-07 23:58:57 +07:00
|
|
|
status = nfs4_lookup_root(server, fhandle, info);
|
2015-04-23 23:17:40 +07:00
|
|
|
|
|
|
|
if (auth_probe || status == NFS4ERR_WRONGSEC)
|
2016-07-26 00:31:14 +07:00
|
|
|
status = server->nfs_client->cl_mvops->find_root_sec(server,
|
|
|
|
fhandle, info);
|
2013-03-17 02:55:45 +07:00
|
|
|
|
2005-04-17 05:20:36 +07:00
|
|
|
if (status == 0)
|
|
|
|
status = nfs4_server_capabilities(server, fhandle);
|
|
|
|
if (status == 0)
|
|
|
|
status = nfs4_do_fsinfo(server, fhandle, info);
|
2013-03-17 02:55:45 +07:00
|
|
|
|
2006-03-14 12:20:47 +07:00
|
|
|
return nfs4_map_errors(status);
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
2012-05-11 02:07:31 +07:00
|
|
|
static int nfs4_proc_get_root(struct nfs_server *server, struct nfs_fh *mntfh,
|
|
|
|
struct nfs_fsinfo *info)
|
|
|
|
{
|
|
|
|
int error;
|
|
|
|
struct nfs_fattr *fattr = info->fattr;
|
2013-05-22 23:50:42 +07:00
|
|
|
struct nfs4_label *label = NULL;
|
2012-05-11 02:07:31 +07:00
|
|
|
|
|
|
|
error = nfs4_server_capabilities(server, mntfh);
|
|
|
|
if (error < 0) {
|
|
|
|
dprintk("nfs4_get_root: getcaps error = %d\n", -error);
|
|
|
|
return error;
|
|
|
|
}
|
|
|
|
|
2013-05-22 23:50:43 +07:00
|
|
|
label = nfs4_label_alloc(server, GFP_KERNEL);
|
|
|
|
if (IS_ERR(label))
|
|
|
|
return PTR_ERR(label);
|
|
|
|
|
2018-04-08 00:50:59 +07:00
|
|
|
error = nfs4_proc_getattr(server, mntfh, fattr, label, NULL);
|
2012-05-11 02:07:31 +07:00
|
|
|
if (error < 0) {
|
|
|
|
dprintk("nfs4_get_root: getattr error = %d\n", -error);
|
2013-05-22 23:50:43 +07:00
|
|
|
goto err_free_label;
|
2012-05-11 02:07:31 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
if (fattr->valid & NFS_ATTR_FATTR_FSID &&
|
|
|
|
!nfs_fsid_equal(&server->fsid, &fattr->fsid))
|
|
|
|
memcpy(&server->fsid, &fattr->fsid, sizeof(server->fsid));
|
|
|
|
|
2013-05-22 23:50:43 +07:00
|
|
|
err_free_label:
|
|
|
|
nfs4_label_free(label);
|
|
|
|
|
2012-05-11 02:07:31 +07:00
|
|
|
return error;
|
|
|
|
}
|
|
|
|
|
2006-06-09 20:34:29 +07:00
|
|
|
/*
|
|
|
|
* Get locations and (maybe) other attributes of a referral.
|
|
|
|
* Note that we'll actually follow the referral later when
|
|
|
|
* we detect fsid mismatch in inode revalidation
|
|
|
|
*/
|
2012-04-28 00:27:41 +07:00
|
|
|
static int nfs4_get_referral(struct rpc_clnt *client, struct inode *dir,
|
|
|
|
const struct qstr *name, struct nfs_fattr *fattr,
|
|
|
|
struct nfs_fh *fhandle)
|
2006-06-09 20:34:29 +07:00
|
|
|
{
|
|
|
|
int status = -ENOMEM;
|
|
|
|
struct page *page = NULL;
|
|
|
|
struct nfs4_fs_locations *locations = NULL;
|
|
|
|
|
|
|
|
page = alloc_page(GFP_KERNEL);
|
|
|
|
if (page == NULL)
|
|
|
|
goto out;
|
|
|
|
locations = kmalloc(sizeof(struct nfs4_fs_locations), GFP_KERNEL);
|
|
|
|
if (locations == NULL)
|
|
|
|
goto out;
|
|
|
|
|
2012-04-28 00:27:41 +07:00
|
|
|
status = nfs4_proc_fs_locations(client, dir, name, locations, page);
|
2006-06-09 20:34:29 +07:00
|
|
|
if (status != 0)
|
|
|
|
goto out;
|
2013-10-18 01:13:19 +07:00
|
|
|
|
|
|
|
/*
|
|
|
|
* If the fsid didn't change, this is a migration event, not a
|
|
|
|
* referral. Cause us to drop into the exception handler, which
|
|
|
|
* will kick off migration recovery.
|
|
|
|
*/
|
2006-06-09 20:34:29 +07:00
|
|
|
if (nfs_fsid_equal(&NFS_SERVER(dir)->fsid, &locations->fattr.fsid)) {
|
2011-06-14 05:25:56 +07:00
|
|
|
dprintk("%s: server did not return a different fsid for"
|
|
|
|
" a referral at %s\n", __func__, name->name);
|
2013-10-18 01:13:19 +07:00
|
|
|
status = -NFS4ERR_MOVED;
|
2006-06-09 20:34:29 +07:00
|
|
|
goto out;
|
|
|
|
}
|
2011-06-14 05:25:56 +07:00
|
|
|
/* Fixup attributes for the nfs_lookup() call to nfs_fhget() */
|
|
|
|
nfs_fixup_referral_attributes(&locations->fattr);
|
2006-06-09 20:34:29 +07:00
|
|
|
|
2011-06-14 05:25:56 +07:00
|
|
|
/* replace the lookup nfs_fattr with the locations nfs_fattr */
|
2006-06-09 20:34:29 +07:00
|
|
|
memcpy(fattr, &locations->fattr, sizeof(struct nfs_fattr));
|
|
|
|
memset(fhandle, 0, sizeof(struct nfs_fh));
|
|
|
|
out:
|
|
|
|
if (page)
|
|
|
|
__free_page(page);
|
2010-08-11 23:42:15 +07:00
|
|
|
kfree(locations);
|
2006-06-09 20:34:29 +07:00
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
2013-05-22 23:50:42 +07:00
|
|
|
static int _nfs4_proc_getattr(struct nfs_server *server, struct nfs_fh *fhandle,
|
2018-04-08 00:50:59 +07:00
|
|
|
struct nfs_fattr *fattr, struct nfs4_label *label,
|
|
|
|
struct inode *inode)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
2018-04-08 00:54:23 +07:00
|
|
|
__u32 bitmask[NFS4_BITMASK_SZ];
|
2005-04-17 05:20:36 +07:00
|
|
|
struct nfs4_getattr_arg args = {
|
|
|
|
.fh = fhandle,
|
2018-04-08 00:54:23 +07:00
|
|
|
.bitmask = bitmask,
|
2005-04-17 05:20:36 +07:00
|
|
|
};
|
|
|
|
struct nfs4_getattr_res res = {
|
|
|
|
.fattr = fattr,
|
2013-05-22 23:50:42 +07:00
|
|
|
.label = label,
|
2005-04-17 05:20:36 +07:00
|
|
|
.server = server,
|
|
|
|
};
|
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_GETATTR],
|
|
|
|
.rpc_argp = &args,
|
|
|
|
.rpc_resp = &res,
|
|
|
|
};
|
2013-05-22 23:50:44 +07:00
|
|
|
|
2018-04-08 00:54:23 +07:00
|
|
|
nfs4_bitmap_copy_adjust(bitmask, nfs4_bitmask(server, label), inode);
|
2013-05-22 23:50:44 +07:00
|
|
|
|
2005-10-28 09:12:38 +07:00
|
|
|
nfs_fattr_init(fattr);
|
2011-03-25 00:12:24 +07:00
|
|
|
return nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
2013-05-22 23:50:42 +07:00
|
|
|
static int nfs4_proc_getattr(struct nfs_server *server, struct nfs_fh *fhandle,
|
2018-04-08 00:50:59 +07:00
|
|
|
struct nfs_fattr *fattr, struct nfs4_label *label,
|
|
|
|
struct inode *inode)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
|
|
|
struct nfs4_exception exception = { };
|
|
|
|
int err;
|
|
|
|
do {
|
2018-04-08 00:50:59 +07:00
|
|
|
err = _nfs4_proc_getattr(server, fhandle, fattr, label, inode);
|
2013-08-14 00:01:39 +07:00
|
|
|
trace_nfs4_getattr(server, fhandle, fattr, err);
|
|
|
|
err = nfs4_handle_exception(server, err,
|
2005-04-17 05:20:36 +07:00
|
|
|
&exception);
|
|
|
|
} while (exception.retry);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* The file is not closed if it is opened due to the a request to change
|
|
|
|
* the size of the file. The open call will not be needed once the
|
|
|
|
* VFS layer lookup-intents are implemented.
|
|
|
|
*
|
|
|
|
* Close is called when the inode is destroyed.
|
|
|
|
* If we haven't opened the file for O_WRONLY, we
|
|
|
|
* need to in the size_change case to obtain a stateid.
|
|
|
|
*
|
|
|
|
* Got race?
|
|
|
|
* Because OPEN is always done by name in nfsv4, it is
|
|
|
|
* possible that we opened a different file by the same
|
|
|
|
* name. We can recognize this race condition, but we
|
|
|
|
* can't do anything about it besides returning an error.
|
|
|
|
*
|
|
|
|
* This will be fixed with VFS changes (lookup-intent).
|
|
|
|
*/
|
|
|
|
static int
|
|
|
|
nfs4_proc_setattr(struct dentry *dentry, struct nfs_fattr *fattr,
|
|
|
|
struct iattr *sattr)
|
|
|
|
{
|
2015-03-18 05:25:59 +07:00
|
|
|
struct inode *inode = d_inode(dentry);
|
2008-06-11 06:39:41 +07:00
|
|
|
struct rpc_cred *cred = NULL;
|
2016-10-13 11:26:47 +07:00
|
|
|
struct nfs_open_context *ctx = NULL;
|
2013-05-22 23:50:43 +07:00
|
|
|
struct nfs4_label *label = NULL;
|
2005-04-17 05:20:36 +07:00
|
|
|
int status;
|
|
|
|
|
2014-09-12 10:04:10 +07:00
|
|
|
if (pnfs_ld_layoutret_on_setattr(inode) &&
|
|
|
|
sattr->ia_valid & ATTR_SIZE &&
|
|
|
|
sattr->ia_size < i_size_read(inode))
|
2013-03-21 00:23:33 +07:00
|
|
|
pnfs_commit_and_return_layout(inode);
|
2010-07-15 02:43:57 +07:00
|
|
|
|
2005-10-28 09:12:38 +07:00
|
|
|
nfs_fattr_init(fattr);
|
2005-04-17 05:20:36 +07:00
|
|
|
|
2012-05-31 03:12:24 +07:00
|
|
|
/* Deal with open(O_TRUNC) */
|
|
|
|
if (sattr->ia_valid & ATTR_OPEN)
|
2013-07-21 21:21:43 +07:00
|
|
|
sattr->ia_valid &= ~(ATTR_MTIME|ATTR_CTIME);
|
2012-05-31 03:12:24 +07:00
|
|
|
|
|
|
|
/* Optimization: if the end result is no change, don't RPC */
|
2013-07-21 21:21:43 +07:00
|
|
|
if ((sattr->ia_valid & ~(ATTR_FILE|ATTR_OPEN)) == 0)
|
2012-05-31 03:12:24 +07:00
|
|
|
return 0;
|
|
|
|
|
2005-11-05 03:33:38 +07:00
|
|
|
/* Search for an existing open(O_WRITE) file */
|
2008-06-11 06:39:41 +07:00
|
|
|
if (sattr->ia_valid & ATTR_FILE) {
|
|
|
|
|
|
|
|
ctx = nfs_file_open_context(sattr->ia_file);
|
2016-10-13 11:26:47 +07:00
|
|
|
if (ctx)
|
2008-10-16 10:15:16 +07:00
|
|
|
cred = ctx->cred;
|
2008-06-11 06:39:41 +07:00
|
|
|
}
|
2005-06-23 00:16:29 +07:00
|
|
|
|
2013-05-22 23:50:43 +07:00
|
|
|
label = nfs4_label_alloc(NFS_SERVER(inode), GFP_KERNEL);
|
|
|
|
if (IS_ERR(label))
|
|
|
|
return PTR_ERR(label);
|
|
|
|
|
2018-03-21 03:43:18 +07:00
|
|
|
/* Return any delegations if we're going to change ACLs */
|
|
|
|
if ((sattr->ia_valid & (ATTR_MODE|ATTR_UID|ATTR_GID)) != 0)
|
2018-03-21 03:43:20 +07:00
|
|
|
nfs4_inode_make_writeable(inode);
|
2018-03-21 03:43:18 +07:00
|
|
|
|
2016-10-13 11:26:47 +07:00
|
|
|
status = nfs4_do_setattr(inode, cred, fattr, sattr, ctx, NULL, label);
|
2013-05-22 23:50:44 +07:00
|
|
|
if (status == 0) {
|
2015-02-27 04:09:04 +07:00
|
|
|
nfs_setattr_update_inode(inode, sattr, fattr);
|
2013-05-22 23:50:44 +07:00
|
|
|
nfs_setsecurity(inode, fattr, label);
|
|
|
|
}
|
2013-05-22 23:50:43 +07:00
|
|
|
nfs4_label_free(label);
|
2005-04-17 05:20:36 +07:00
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
2011-10-19 06:11:22 +07:00
|
|
|
static int _nfs4_proc_lookup(struct rpc_clnt *clnt, struct inode *dir,
|
|
|
|
const struct qstr *name, struct nfs_fh *fhandle,
|
2013-05-22 23:50:42 +07:00
|
|
|
struct nfs_fattr *fattr, struct nfs4_label *label)
|
2006-08-23 07:06:09 +07:00
|
|
|
{
|
2011-10-19 06:11:22 +07:00
|
|
|
struct nfs_server *server = NFS_SERVER(dir);
|
2006-08-23 07:06:09 +07:00
|
|
|
int status;
|
|
|
|
struct nfs4_lookup_arg args = {
|
|
|
|
.bitmask = server->attr_bitmask,
|
2011-10-19 06:11:22 +07:00
|
|
|
.dir_fh = NFS_FH(dir),
|
2006-08-23 07:06:09 +07:00
|
|
|
.name = name,
|
|
|
|
};
|
|
|
|
struct nfs4_lookup_res res = {
|
|
|
|
.server = server,
|
|
|
|
.fattr = fattr,
|
2013-05-22 23:50:44 +07:00
|
|
|
.label = label,
|
2006-08-23 07:06:09 +07:00
|
|
|
.fh = fhandle,
|
|
|
|
};
|
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LOOKUP],
|
|
|
|
.rpc_argp = &args,
|
|
|
|
.rpc_resp = &res,
|
|
|
|
};
|
|
|
|
|
2013-05-22 23:50:44 +07:00
|
|
|
args.bitmask = nfs4_bitmask(server, label);
|
|
|
|
|
2006-08-23 07:06:09 +07:00
|
|
|
nfs_fattr_init(fattr);
|
|
|
|
|
2005-04-17 05:20:36 +07:00
|
|
|
dprintk("NFS call lookup %s\n", name->name);
|
2011-10-19 06:11:22 +07:00
|
|
|
status = nfs4_call_sync(clnt, server, &msg, &args.seq_args, &res.seq_res, 0);
|
2005-04-17 05:20:36 +07:00
|
|
|
dprintk("NFS reply lookup: %d\n", status);
|
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
2012-04-28 00:27:40 +07:00
|
|
|
static void nfs_fixup_secinfo_attributes(struct nfs_fattr *fattr)
|
2011-03-25 00:12:30 +07:00
|
|
|
{
|
|
|
|
fattr->valid |= NFS_ATTR_FATTR_TYPE | NFS_ATTR_FATTR_MODE |
|
2012-04-28 00:27:40 +07:00
|
|
|
NFS_ATTR_FATTR_NLINK | NFS_ATTR_FATTR_MOUNTPOINT;
|
2011-03-25 00:12:30 +07:00
|
|
|
fattr->mode = S_IFDIR | S_IRUGO | S_IXUGO;
|
|
|
|
fattr->nlink = 2;
|
|
|
|
}
|
|
|
|
|
2012-04-28 00:27:40 +07:00
|
|
|
static int nfs4_proc_lookup_common(struct rpc_clnt **clnt, struct inode *dir,
|
2016-07-21 03:34:42 +07:00
|
|
|
const struct qstr *name, struct nfs_fh *fhandle,
|
2013-05-22 23:50:42 +07:00
|
|
|
struct nfs_fattr *fattr, struct nfs4_label *label)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
|
|
|
struct nfs4_exception exception = { };
|
2012-04-28 00:27:40 +07:00
|
|
|
struct rpc_clnt *client = *clnt;
|
2005-04-17 05:20:36 +07:00
|
|
|
int err;
|
|
|
|
do {
|
2013-05-22 23:50:42 +07:00
|
|
|
err = _nfs4_proc_lookup(client, dir, name, fhandle, fattr, label);
|
2013-08-13 03:45:55 +07:00
|
|
|
trace_nfs4_lookup(dir, name, err);
|
2012-04-28 00:27:40 +07:00
|
|
|
switch (err) {
|
2011-10-19 06:11:49 +07:00
|
|
|
case -NFS4ERR_BADNAME:
|
2012-04-28 00:27:40 +07:00
|
|
|
err = -ENOENT;
|
|
|
|
goto out;
|
2011-10-19 06:11:22 +07:00
|
|
|
case -NFS4ERR_MOVED:
|
2012-04-28 00:27:41 +07:00
|
|
|
err = nfs4_get_referral(client, dir, name, fattr, fhandle);
|
2015-06-04 22:04:17 +07:00
|
|
|
if (err == -NFS4ERR_MOVED)
|
|
|
|
err = nfs4_handle_exception(NFS_SERVER(dir), err, &exception);
|
2012-04-28 00:27:40 +07:00
|
|
|
goto out;
|
2011-10-19 06:11:22 +07:00
|
|
|
case -NFS4ERR_WRONGSEC:
|
2012-04-28 00:27:40 +07:00
|
|
|
err = -EPERM;
|
|
|
|
if (client != *clnt)
|
|
|
|
goto out;
|
2014-06-13 02:02:32 +07:00
|
|
|
client = nfs4_negotiate_security(client, dir, name);
|
2012-04-28 00:27:40 +07:00
|
|
|
if (IS_ERR(client))
|
|
|
|
return PTR_ERR(client);
|
|
|
|
|
|
|
|
exception.retry = 1;
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
err = nfs4_handle_exception(NFS_SERVER(dir), err, &exception);
|
2011-10-19 06:11:22 +07:00
|
|
|
}
|
2005-04-17 05:20:36 +07:00
|
|
|
} while (exception.retry);
|
2012-04-28 00:27:40 +07:00
|
|
|
|
|
|
|
out:
|
|
|
|
if (err == 0)
|
|
|
|
*clnt = client;
|
|
|
|
else if (client != *clnt)
|
|
|
|
rpc_shutdown_client(client);
|
|
|
|
|
2005-04-17 05:20:36 +07:00
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
2016-07-21 03:34:42 +07:00
|
|
|
/*
 * Look up @name in @dir, starting on the directory's own RPC client.
 *
 * If nfs4_proc_lookup_common() hands back a client other than
 * NFS_CLIENT(dir), that client is shut down and @fattr is patched up with
 * nfs_fixup_secinfo_attributes().
 *
 * Returns the status of nfs4_proc_lookup_common().
 */
static int nfs4_proc_lookup(struct inode *dir, const struct qstr *name,
			    struct nfs_fh *fhandle, struct nfs_fattr *fattr,
			    struct nfs4_label *label)
{
	struct rpc_clnt *used = NFS_CLIENT(dir);
	int rc;

	rc = nfs4_proc_lookup_common(&used, dir, name, fhandle, fattr, label);
	if (used == NFS_CLIENT(dir))
		return rc;

	rpc_shutdown_client(used);
	nfs_fixup_secinfo_attributes(fattr);
	return rc;
}
|
|
|
|
|
2012-04-28 00:27:41 +07:00
|
|
|
struct rpc_clnt *
|
2016-07-21 03:34:42 +07:00
|
|
|
nfs4_proc_lookup_mountpoint(struct inode *dir, const struct qstr *name,
|
2012-04-28 00:27:41 +07:00
|
|
|
struct nfs_fh *fhandle, struct nfs_fattr *fattr)
|
|
|
|
{
|
2013-08-08 07:38:07 +07:00
|
|
|
struct rpc_clnt *client = NFS_CLIENT(dir);
|
2012-04-28 00:27:41 +07:00
|
|
|
int status;
|
|
|
|
|
2013-05-22 23:50:42 +07:00
|
|
|
status = nfs4_proc_lookup_common(&client, dir, name, fhandle, fattr, NULL);
|
2013-08-08 07:38:07 +07:00
|
|
|
if (status < 0)
|
2012-04-28 00:27:41 +07:00
|
|
|
return ERR_PTR(status);
|
2013-08-08 07:38:07 +07:00
|
|
|
return (client == NFS_CLIENT(dir)) ? rpc_clone_client(client) : client;
|
2012-04-28 00:27:41 +07:00
|
|
|
}
|
|
|
|
|
2017-06-29 20:34:52 +07:00
|
|
|
static int _nfs4_proc_lookupp(struct inode *inode,
|
|
|
|
struct nfs_fh *fhandle, struct nfs_fattr *fattr,
|
|
|
|
struct nfs4_label *label)
|
|
|
|
{
|
|
|
|
struct rpc_clnt *clnt = NFS_CLIENT(inode);
|
|
|
|
struct nfs_server *server = NFS_SERVER(inode);
|
|
|
|
int status;
|
|
|
|
struct nfs4_lookupp_arg args = {
|
|
|
|
.bitmask = server->attr_bitmask,
|
|
|
|
.fh = NFS_FH(inode),
|
|
|
|
};
|
|
|
|
struct nfs4_lookupp_res res = {
|
|
|
|
.server = server,
|
|
|
|
.fattr = fattr,
|
|
|
|
.label = label,
|
|
|
|
.fh = fhandle,
|
|
|
|
};
|
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LOOKUPP],
|
|
|
|
.rpc_argp = &args,
|
|
|
|
.rpc_resp = &res,
|
|
|
|
};
|
|
|
|
|
|
|
|
args.bitmask = nfs4_bitmask(server, label);
|
|
|
|
|
|
|
|
nfs_fattr_init(fattr);
|
|
|
|
|
|
|
|
dprintk("NFS call lookupp ino=0x%lx\n", inode->i_ino);
|
|
|
|
status = nfs4_call_sync(clnt, server, &msg, &args.seq_args,
|
|
|
|
&res.seq_res, 0);
|
|
|
|
dprintk("NFS reply lookupp: %d\n", status);
|
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int nfs4_proc_lookupp(struct inode *inode, struct nfs_fh *fhandle,
|
|
|
|
struct nfs_fattr *fattr, struct nfs4_label *label)
|
|
|
|
{
|
|
|
|
struct nfs4_exception exception = { };
|
|
|
|
int err;
|
|
|
|
do {
|
|
|
|
err = _nfs4_proc_lookupp(inode, fhandle, fattr, label);
|
|
|
|
trace_nfs4_lookupp(inode, err);
|
|
|
|
err = nfs4_handle_exception(NFS_SERVER(inode), err,
|
|
|
|
&exception);
|
|
|
|
} while (exception.retry);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
2005-04-17 05:20:36 +07:00
|
|
|
static int _nfs4_proc_access(struct inode *inode, struct nfs_access_entry *entry)
|
|
|
|
{
|
2007-08-11 04:45:11 +07:00
|
|
|
struct nfs_server *server = NFS_SERVER(inode);
|
2005-04-17 05:20:36 +07:00
|
|
|
struct nfs4_accessargs args = {
|
|
|
|
.fh = NFS_FH(inode),
|
2017-07-26 23:00:21 +07:00
|
|
|
.access = entry->mask,
|
2007-08-11 04:45:11 +07:00
|
|
|
};
|
|
|
|
struct nfs4_accessres res = {
|
|
|
|
.server = server,
|
2005-04-17 05:20:36 +07:00
|
|
|
};
|
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_ACCESS],
|
|
|
|
.rpc_argp = &args,
|
|
|
|
.rpc_resp = &res,
|
|
|
|
.rpc_cred = entry->cred,
|
|
|
|
};
|
2013-05-22 23:50:44 +07:00
|
|
|
int status = 0;
|
2005-04-17 05:20:36 +07:00
|
|
|
|
2018-06-05 02:00:53 +07:00
|
|
|
if (!nfs4_have_delegation(inode, FMODE_READ)) {
|
2018-03-21 04:03:11 +07:00
|
|
|
res.fattr = nfs_alloc_fattr();
|
|
|
|
if (res.fattr == NULL)
|
|
|
|
return -ENOMEM;
|
|
|
|
args.bitmask = server->cache_consistency_bitmask;
|
|
|
|
}
|
2010-04-17 03:22:48 +07:00
|
|
|
|
2011-03-25 00:12:24 +07:00
|
|
|
status = nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
|
2005-04-17 05:20:36 +07:00
|
|
|
if (!status) {
|
2012-09-11 01:00:46 +07:00
|
|
|
nfs_access_set_mask(entry, res.access);
|
2018-03-21 04:03:11 +07:00
|
|
|
if (res.fattr)
|
|
|
|
nfs_refresh_inode(inode, res.fattr);
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
2010-04-17 03:22:48 +07:00
|
|
|
nfs_free_fattr(res.fattr);
|
2005-04-17 05:20:36 +07:00
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int nfs4_proc_access(struct inode *inode, struct nfs_access_entry *entry)
|
|
|
|
{
|
|
|
|
struct nfs4_exception exception = { };
|
|
|
|
int err;
|
|
|
|
do {
|
2013-08-13 03:58:42 +07:00
|
|
|
err = _nfs4_proc_access(inode, entry);
|
|
|
|
trace_nfs4_access(inode, err);
|
|
|
|
err = nfs4_handle_exception(NFS_SERVER(inode), err,
|
2005-04-17 05:20:36 +07:00
|
|
|
&exception);
|
|
|
|
} while (exception.retry);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* TODO: For the time being, we don't try to get any attributes
|
|
|
|
* along with any of the zero-copy operations READ, READDIR,
|
|
|
|
* READLINK, WRITE.
|
|
|
|
*
|
|
|
|
* In the case of the first three, we want to put the GETATTR
|
|
|
|
* after the read-type operation -- this is because it is hard
|
|
|
|
* to predict the length of a GETATTR response in v4, and thus
|
|
|
|
* align the READ data correctly. This means that the GETATTR
|
|
|
|
* may end up partially falling into the page cache, and we should
|
|
|
|
* shift it into the 'tail' of the xdr_buf before processing.
|
|
|
|
* To do this efficiently, we need to know the total length
|
|
|
|
* of data received, which doesn't seem to be available outside
|
|
|
|
* of the RPC layer.
|
|
|
|
*
|
|
|
|
* In the case of WRITE, we also want to put the GETATTR after
|
|
|
|
* the operation -- in this case because we want to make sure
|
2012-06-06 02:20:25 +07:00
|
|
|
* we get the post-operation mtime and size.
|
2005-04-17 05:20:36 +07:00
|
|
|
*
|
|
|
|
* Both of these changes to the XDR layer would in fact be quite
|
|
|
|
* minor, but I decided to leave them for a subsequent patch.
|
|
|
|
*/
|
|
|
|
static int _nfs4_proc_readlink(struct inode *inode, struct page *page,
|
|
|
|
unsigned int pgbase, unsigned int pglen)
|
|
|
|
{
|
|
|
|
struct nfs4_readlink args = {
|
|
|
|
.fh = NFS_FH(inode),
|
|
|
|
.pgbase = pgbase,
|
|
|
|
.pglen = pglen,
|
|
|
|
.pages = &page,
|
|
|
|
};
|
2009-04-01 20:21:55 +07:00
|
|
|
struct nfs4_readlink_res res;
|
2005-04-17 05:20:36 +07:00
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_READLINK],
|
|
|
|
.rpc_argp = &args,
|
2009-04-01 20:21:55 +07:00
|
|
|
.rpc_resp = &res,
|
2005-04-17 05:20:36 +07:00
|
|
|
};
|
|
|
|
|
2011-03-25 00:12:24 +07:00
|
|
|
return nfs4_call_sync(NFS_SERVER(inode)->client, NFS_SERVER(inode), &msg, &args.seq_args, &res.seq_res, 0);
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
static int nfs4_proc_readlink(struct inode *inode, struct page *page,
|
|
|
|
unsigned int pgbase, unsigned int pglen)
|
|
|
|
{
|
|
|
|
struct nfs4_exception exception = { };
|
|
|
|
int err;
|
|
|
|
do {
|
2013-08-13 03:58:42 +07:00
|
|
|
err = _nfs4_proc_readlink(inode, page, pgbase, pglen);
|
|
|
|
trace_nfs4_readlink(inode, err);
|
|
|
|
err = nfs4_handle_exception(NFS_SERVER(inode), err,
|
2005-04-17 05:20:36 +07:00
|
|
|
&exception);
|
|
|
|
} while (exception.retry);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
2012-06-05 20:10:19 +07:00
|
|
|
* This is just for mknod. open(O_CREAT) will always do ->open_context().
|
2005-04-17 05:20:36 +07:00
|
|
|
*/
|
|
|
|
static int
|
|
|
|
nfs4_proc_create(struct inode *dir, struct dentry *dentry, struct iattr *sattr,
|
2012-06-05 20:10:19 +07:00
|
|
|
int flags)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
2016-12-03 10:53:30 +07:00
|
|
|
struct nfs_server *server = NFS_SERVER(dir);
|
2013-05-22 23:50:44 +07:00
|
|
|
struct nfs4_label l, *ilabel = NULL;
|
2012-06-05 20:10:19 +07:00
|
|
|
struct nfs_open_context *ctx;
|
2005-04-17 05:20:36 +07:00
|
|
|
struct nfs4_state *state;
|
|
|
|
int status = 0;
|
|
|
|
|
2016-10-13 11:26:47 +07:00
|
|
|
ctx = alloc_nfs_open_context(dentry, FMODE_READ, NULL);
|
2012-06-05 20:10:19 +07:00
|
|
|
if (IS_ERR(ctx))
|
|
|
|
return PTR_ERR(ctx);
|
|
|
|
|
2013-05-22 23:50:44 +07:00
|
|
|
ilabel = nfs4_label_init_security(dir, dentry, sattr, &l);
|
|
|
|
|
2016-12-03 10:53:30 +07:00
|
|
|
if (!(server->attr_bitmask[2] & FATTR4_WORD2_MODE_UMASK))
|
|
|
|
sattr->ia_mode &= ~current_umask();
|
2015-08-26 20:11:39 +07:00
|
|
|
state = nfs4_do_open(dir, ctx, flags, sattr, ilabel, NULL);
|
2005-04-17 05:20:36 +07:00
|
|
|
if (IS_ERR(state)) {
|
|
|
|
status = PTR_ERR(state);
|
2010-09-17 21:56:51 +07:00
|
|
|
goto out;
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
out:
|
2013-05-22 23:50:44 +07:00
|
|
|
nfs4_label_release_security(ilabel);
|
2012-06-05 20:10:19 +07:00
|
|
|
put_nfs_open_context(ctx);
|
2005-04-17 05:20:36 +07:00
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
2016-07-21 03:34:42 +07:00
|
|
|
static int _nfs4_proc_remove(struct inode *dir, const struct qstr *name)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
2005-10-28 09:12:44 +07:00
|
|
|
struct nfs_server *server = NFS_SERVER(dir);
|
2007-07-15 02:39:57 +07:00
|
|
|
struct nfs_removeargs args = {
|
2005-04-17 05:20:36 +07:00
|
|
|
.fh = NFS_FH(dir),
|
2012-05-11 03:14:12 +07:00
|
|
|
.name = *name,
|
2005-10-28 09:12:44 +07:00
|
|
|
};
|
2007-07-15 02:39:57 +07:00
|
|
|
struct nfs_removeres res = {
|
2005-10-28 09:12:44 +07:00
|
|
|
.server = server,
|
2005-04-17 05:20:36 +07:00
|
|
|
};
|
|
|
|
struct rpc_message msg = {
|
2007-07-15 02:39:57 +07:00
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_REMOVE],
|
|
|
|
.rpc_argp = &args,
|
|
|
|
.rpc_resp = &res,
|
2005-04-17 05:20:36 +07:00
|
|
|
};
|
2017-01-12 10:07:28 +07:00
|
|
|
unsigned long timestamp = jiffies;
|
2012-04-28 00:48:19 +07:00
|
|
|
int status;
|
2005-04-17 05:20:36 +07:00
|
|
|
|
2011-03-25 00:12:24 +07:00
|
|
|
status = nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 1);
|
2012-04-28 00:48:19 +07:00
|
|
|
if (status == 0)
|
2017-01-12 10:07:28 +07:00
|
|
|
update_changeattr(dir, &res.cinfo, timestamp);
|
2005-04-17 05:20:36 +07:00
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
2018-03-21 03:43:15 +07:00
|
|
|
static int nfs4_proc_remove(struct inode *dir, struct dentry *dentry)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
|
|
|
struct nfs4_exception exception = { };
|
2018-03-21 03:43:15 +07:00
|
|
|
struct inode *inode = d_inode(dentry);
|
2005-04-17 05:20:36 +07:00
|
|
|
int err;
|
2018-03-21 03:43:15 +07:00
|
|
|
|
2018-03-21 03:43:20 +07:00
|
|
|
if (inode) {
|
|
|
|
if (inode->i_nlink == 1)
|
|
|
|
nfs4_inode_return_delegation(inode);
|
|
|
|
else
|
|
|
|
nfs4_inode_make_writeable(inode);
|
|
|
|
}
|
2018-03-21 03:43:15 +07:00
|
|
|
do {
|
|
|
|
err = _nfs4_proc_remove(dir, &dentry->d_name);
|
|
|
|
trace_nfs4_remove(dir, &dentry->d_name, err);
|
|
|
|
err = nfs4_handle_exception(NFS_SERVER(dir), err,
|
|
|
|
&exception);
|
|
|
|
} while (exception.retry);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int nfs4_proc_rmdir(struct inode *dir, const struct qstr *name)
|
|
|
|
{
|
|
|
|
struct nfs4_exception exception = { };
|
|
|
|
int err;
|
|
|
|
|
2005-04-17 05:20:36 +07:00
|
|
|
do {
|
2013-08-13 03:45:55 +07:00
|
|
|
err = _nfs4_proc_remove(dir, name);
|
|
|
|
trace_nfs4_remove(dir, name, err);
|
|
|
|
err = nfs4_handle_exception(NFS_SERVER(dir), err,
|
2005-04-17 05:20:36 +07:00
|
|
|
&exception);
|
|
|
|
} while (exception.retry);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
2018-05-31 03:11:52 +07:00
|
|
|
static void nfs4_proc_unlink_setup(struct rpc_message *msg,
|
|
|
|
struct dentry *dentry,
|
|
|
|
struct inode *inode)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
2007-07-15 02:39:58 +07:00
|
|
|
struct nfs_removeargs *args = msg->rpc_argp;
|
|
|
|
struct nfs_removeres *res = msg->rpc_resp;
|
2005-04-17 05:20:36 +07:00
|
|
|
|
2018-03-21 03:43:17 +07:00
|
|
|
res->server = NFS_SB(dentry->d_sb);
|
2005-04-17 05:20:36 +07:00
|
|
|
msg->rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_REMOVE];
|
2018-05-05 03:22:50 +07:00
|
|
|
nfs4_init_sequence(&args->seq_args, &res->seq_res, 1, 0);
|
2013-05-22 23:50:44 +07:00
|
|
|
|
|
|
|
nfs_fattr_init(res->dir_attr);
|
2018-03-21 03:43:17 +07:00
|
|
|
|
|
|
|
if (inode)
|
|
|
|
nfs4_inode_return_delegation(inode);
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
2012-03-20 01:54:41 +07:00
|
|
|
static void nfs4_proc_unlink_rpc_prepare(struct rpc_task *task, struct nfs_unlinkdata *data)
|
|
|
|
{
|
2017-01-10 03:48:22 +07:00
|
|
|
nfs4_setup_sequence(NFS_SB(data->dentry->d_sb)->nfs_client,
|
2012-10-23 07:28:44 +07:00
|
|
|
&data->args.seq_args,
|
|
|
|
&data->res.seq_res,
|
|
|
|
task);
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
2007-07-15 02:39:58 +07:00
|
|
|
static int nfs4_proc_unlink_done(struct rpc_task *task, struct inode *dir)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
2013-08-13 03:45:55 +07:00
|
|
|
struct nfs_unlinkdata *data = task->tk_calldata;
|
|
|
|
struct nfs_removeres *res = &data->res;
|
2007-07-15 02:39:58 +07:00
|
|
|
|
2010-08-01 01:29:06 +07:00
|
|
|
if (!nfs4_sequence_done(task, &res->seq_res))
|
|
|
|
return 0;
|
2014-09-18 13:09:27 +07:00
|
|
|
if (nfs4_async_handle_error(task, res->server, NULL,
|
|
|
|
&data->timeout) == -EAGAIN)
|
2007-07-15 02:39:58 +07:00
|
|
|
return 0;
|
2017-01-12 00:36:11 +07:00
|
|
|
if (task->tk_status == 0)
|
2017-01-12 10:07:28 +07:00
|
|
|
update_changeattr(dir, &res->cinfo, res->dir_attr->time_start);
|
2007-07-15 02:39:58 +07:00
|
|
|
return 1;
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
2018-03-21 03:43:16 +07:00
|
|
|
static void nfs4_proc_rename_setup(struct rpc_message *msg,
|
|
|
|
struct dentry *old_dentry,
|
|
|
|
struct dentry *new_dentry)
|
2010-09-18 04:31:57 +07:00
|
|
|
{
|
|
|
|
struct nfs_renameargs *arg = msg->rpc_argp;
|
|
|
|
struct nfs_renameres *res = msg->rpc_resp;
|
2018-03-21 03:43:16 +07:00
|
|
|
struct inode *old_inode = d_inode(old_dentry);
|
|
|
|
struct inode *new_inode = d_inode(new_dentry);
|
2010-09-18 04:31:57 +07:00
|
|
|
|
2018-03-21 03:43:16 +07:00
|
|
|
if (old_inode)
|
2018-03-21 03:43:20 +07:00
|
|
|
nfs4_inode_make_writeable(old_inode);
|
2018-03-21 03:43:16 +07:00
|
|
|
if (new_inode)
|
|
|
|
nfs4_inode_return_delegation(new_inode);
|
2010-09-18 04:31:57 +07:00
|
|
|
msg->rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_RENAME];
|
2018-03-21 03:43:16 +07:00
|
|
|
res->server = NFS_SB(old_dentry->d_sb);
|
2018-05-05 03:22:50 +07:00
|
|
|
nfs4_init_sequence(&arg->seq_args, &res->seq_res, 1, 0);
|
2010-09-18 04:31:57 +07:00
|
|
|
}
|
|
|
|
|
2012-03-20 01:54:42 +07:00
|
|
|
static void nfs4_proc_rename_rpc_prepare(struct rpc_task *task, struct nfs_renamedata *data)
|
|
|
|
{
|
2017-01-10 03:48:22 +07:00
|
|
|
nfs4_setup_sequence(NFS_SERVER(data->old_dir)->nfs_client,
|
2012-10-23 07:28:44 +07:00
|
|
|
&data->args.seq_args,
|
|
|
|
&data->res.seq_res,
|
|
|
|
task);
|
2010-09-18 04:31:57 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
static int nfs4_proc_rename_done(struct rpc_task *task, struct inode *old_dir,
|
|
|
|
struct inode *new_dir)
|
|
|
|
{
|
2013-08-13 04:08:26 +07:00
|
|
|
struct nfs_renamedata *data = task->tk_calldata;
|
|
|
|
struct nfs_renameres *res = &data->res;
|
2010-09-18 04:31:57 +07:00
|
|
|
|
|
|
|
if (!nfs4_sequence_done(task, &res->seq_res))
|
|
|
|
return 0;
|
2014-09-18 13:09:27 +07:00
|
|
|
if (nfs4_async_handle_error(task, res->server, NULL, &data->timeout) == -EAGAIN)
|
2010-09-18 04:31:57 +07:00
|
|
|
return 0;
|
|
|
|
|
2017-01-12 00:32:26 +07:00
|
|
|
if (task->tk_status == 0) {
|
2017-01-12 10:07:28 +07:00
|
|
|
update_changeattr(old_dir, &res->old_cinfo, res->old_fattr->time_start);
|
2017-01-12 00:32:26 +07:00
|
|
|
if (new_dir != old_dir)
|
2017-01-12 10:07:28 +07:00
|
|
|
update_changeattr(new_dir, &res->new_cinfo, res->new_fattr->time_start);
|
2017-01-12 00:32:26 +07:00
|
|
|
}
|
2010-09-18 04:31:57 +07:00
|
|
|
return 1;
|
|
|
|
}
|
|
|
|
|
2016-07-21 03:34:42 +07:00
|
|
|
static int _nfs4_proc_link(struct inode *inode, struct inode *dir, const struct qstr *name)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
2005-10-28 09:12:42 +07:00
|
|
|
struct nfs_server *server = NFS_SERVER(inode);
|
2018-04-09 08:06:40 +07:00
|
|
|
__u32 bitmask[NFS4_BITMASK_SZ];
|
2005-04-17 05:20:36 +07:00
|
|
|
struct nfs4_link_arg arg = {
|
|
|
|
.fh = NFS_FH(inode),
|
|
|
|
.dir_fh = NFS_FH(dir),
|
|
|
|
.name = name,
|
2018-04-09 08:06:40 +07:00
|
|
|
.bitmask = bitmask,
|
2005-10-28 09:12:42 +07:00
|
|
|
};
|
|
|
|
struct nfs4_link_res res = {
|
|
|
|
.server = server,
|
2013-05-22 23:50:42 +07:00
|
|
|
.label = NULL,
|
2005-04-17 05:20:36 +07:00
|
|
|
};
|
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LINK],
|
|
|
|
.rpc_argp = &arg,
|
2005-10-28 09:12:42 +07:00
|
|
|
.rpc_resp = &res,
|
2005-04-17 05:20:36 +07:00
|
|
|
};
|
2010-04-17 03:22:49 +07:00
|
|
|
int status = -ENOMEM;
|
|
|
|
|
|
|
|
res.fattr = nfs_alloc_fattr();
|
2012-04-28 00:48:19 +07:00
|
|
|
if (res.fattr == NULL)
|
2010-04-17 03:22:49 +07:00
|
|
|
goto out;
|
2005-04-17 05:20:36 +07:00
|
|
|
|
2013-05-22 23:50:43 +07:00
|
|
|
res.label = nfs4_label_alloc(server, GFP_KERNEL);
|
|
|
|
if (IS_ERR(res.label)) {
|
|
|
|
status = PTR_ERR(res.label);
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
|
2018-03-21 03:43:20 +07:00
|
|
|
nfs4_inode_make_writeable(inode);
|
2018-04-09 08:06:40 +07:00
|
|
|
nfs4_bitmap_copy_adjust_setattr(bitmask, nfs4_bitmask(server, res.label), inode);
|
2018-03-21 03:43:14 +07:00
|
|
|
|
2011-03-25 00:12:24 +07:00
|
|
|
status = nfs4_call_sync(server->client, server, &msg, &arg.seq_args, &res.seq_res, 1);
|
2005-10-28 09:12:42 +07:00
|
|
|
if (!status) {
|
2017-01-12 10:07:28 +07:00
|
|
|
update_changeattr(dir, &res.cinfo, res.fattr->time_start);
|
2013-05-22 23:50:44 +07:00
|
|
|
status = nfs_post_op_update_inode(inode, res.fattr);
|
|
|
|
if (!status)
|
|
|
|
nfs_setsecurity(inode, res.fattr, res.label);
|
2005-10-28 09:12:42 +07:00
|
|
|
}
|
2013-05-22 23:50:43 +07:00
|
|
|
|
|
|
|
|
|
|
|
nfs4_label_free(res.label);
|
|
|
|
|
2010-04-17 03:22:49 +07:00
|
|
|
out:
|
|
|
|
nfs_free_fattr(res.fattr);
|
2005-04-17 05:20:36 +07:00
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
2016-07-21 03:34:42 +07:00
|
|
|
static int nfs4_proc_link(struct inode *inode, struct inode *dir, const struct qstr *name)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
|
|
|
struct nfs4_exception exception = { };
|
|
|
|
int err;
|
|
|
|
do {
|
|
|
|
err = nfs4_handle_exception(NFS_SERVER(inode),
|
|
|
|
_nfs4_proc_link(inode, dir, name),
|
|
|
|
&exception);
|
|
|
|
} while (exception.retry);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
2008-06-21 02:35:32 +07:00
|
|
|
struct nfs4_createdata {
|
|
|
|
struct rpc_message msg;
|
|
|
|
struct nfs4_create_arg arg;
|
|
|
|
struct nfs4_create_res res;
|
|
|
|
struct nfs_fh fh;
|
|
|
|
struct nfs_fattr fattr;
|
2013-05-22 23:50:42 +07:00
|
|
|
struct nfs4_label *label;
|
2008-06-21 02:35:32 +07:00
|
|
|
};
|
|
|
|
|
|
|
|
/*
 * Allocate and initialise an nfs4_createdata for creating @name of type
 * @ftype in @dir with attributes @sattr.
 *
 * The message is set up for NFSPROC4_CLNT_CREATE with the argument and
 * result wired to the embedded structures, and the caller's current
 * umask is recorded in the arguments.
 *
 * Returns the new structure, or NULL if either the structure or its
 * label could not be allocated.
 */
static struct nfs4_createdata *nfs4_alloc_createdata(struct inode *dir,
		const struct qstr *name, struct iattr *sattr, u32 ftype)
{
	struct nfs_server *server;
	struct nfs4_createdata *cd;

	cd = kzalloc(sizeof(*cd), GFP_KERNEL);
	if (cd == NULL)
		return NULL;

	server = NFS_SERVER(dir);

	cd->label = nfs4_label_alloc(server, GFP_KERNEL);
	if (IS_ERR(cd->label)) {
		kfree(cd);
		return NULL;
	}

	/* RPC message: argument and result live inside the same allocation. */
	cd->msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_CREATE];
	cd->msg.rpc_argp = &cd->arg;
	cd->msg.rpc_resp = &cd->res;

	/* Request side. */
	cd->arg.dir_fh = NFS_FH(dir);
	cd->arg.server = server;
	cd->arg.name = name;
	cd->arg.attrs = sattr;
	cd->arg.ftype = ftype;
	cd->arg.bitmask = nfs4_bitmask(server, cd->label);
	cd->arg.umask = current_umask();

	/* Reply side. */
	cd->res.server = server;
	cd->res.fh = &cd->fh;
	cd->res.fattr = &cd->fattr;
	cd->res.label = cd->label;
	nfs_fattr_init(cd->res.fattr);

	return cd;
}
|
|
|
|
|
|
|
|
static int nfs4_do_create(struct inode *dir, struct dentry *dentry, struct nfs4_createdata *data)
|
|
|
|
{
|
2011-03-25 00:12:24 +07:00
|
|
|
int status = nfs4_call_sync(NFS_SERVER(dir)->client, NFS_SERVER(dir), &data->msg,
|
2011-03-25 00:12:23 +07:00
|
|
|
&data->arg.seq_args, &data->res.seq_res, 1);
|
2008-06-21 02:35:32 +07:00
|
|
|
if (status == 0) {
|
2017-01-12 10:07:28 +07:00
|
|
|
update_changeattr(dir, &data->res.dir_cinfo,
|
|
|
|
data->res.fattr->time_start);
|
2013-05-22 23:50:42 +07:00
|
|
|
status = nfs_instantiate(dentry, data->res.fh, data->res.fattr, data->res.label);
|
2008-06-21 02:35:32 +07:00
|
|
|
}
|
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void nfs4_free_createdata(struct nfs4_createdata *data)
|
|
|
|
{
|
2013-05-22 23:50:43 +07:00
|
|
|
nfs4_label_free(data->label);
|
2008-06-21 02:35:32 +07:00
|
|
|
kfree(data);
|
|
|
|
}
|
|
|
|
|
2006-08-23 07:06:22 +07:00
|
|
|
static int _nfs4_proc_symlink(struct inode *dir, struct dentry *dentry,
|
2013-05-22 23:50:42 +07:00
|
|
|
struct page *page, unsigned int len, struct iattr *sattr,
|
|
|
|
struct nfs4_label *label)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
2008-06-21 02:35:32 +07:00
|
|
|
struct nfs4_createdata *data;
|
|
|
|
int status = -ENAMETOOLONG;
|
2005-04-17 05:20:36 +07:00
|
|
|
|
2006-08-23 07:06:23 +07:00
|
|
|
if (len > NFS4_MAXPATHLEN)
|
2008-06-21 02:35:32 +07:00
|
|
|
goto out;
|
2006-08-23 07:06:22 +07:00
|
|
|
|
2008-06-21 02:35:32 +07:00
|
|
|
status = -ENOMEM;
|
|
|
|
data = nfs4_alloc_createdata(dir, &dentry->d_name, sattr, NF4LNK);
|
|
|
|
if (data == NULL)
|
|
|
|
goto out;
|
|
|
|
|
|
|
|
data->msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SYMLINK];
|
|
|
|
data->arg.u.symlink.pages = &page;
|
|
|
|
data->arg.u.symlink.len = len;
|
2013-05-22 23:50:42 +07:00
|
|
|
data->arg.label = label;
|
2005-04-17 05:20:36 +07:00
|
|
|
|
2008-06-21 02:35:32 +07:00
|
|
|
status = nfs4_do_create(dir, dentry, data);
|
|
|
|
|
|
|
|
nfs4_free_createdata(data);
|
|
|
|
out:
|
2005-04-17 05:20:36 +07:00
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
2006-08-23 07:06:22 +07:00
|
|
|
static int nfs4_proc_symlink(struct inode *dir, struct dentry *dentry,
|
2006-08-23 07:06:23 +07:00
|
|
|
struct page *page, unsigned int len, struct iattr *sattr)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
|
|
|
struct nfs4_exception exception = { };
|
2013-05-22 23:50:44 +07:00
|
|
|
struct nfs4_label l, *label = NULL;
|
2005-04-17 05:20:36 +07:00
|
|
|
int err;
|
2013-05-22 23:50:44 +07:00
|
|
|
|
|
|
|
label = nfs4_label_init_security(dir, dentry, sattr, &l);
|
|
|
|
|
2005-04-17 05:20:36 +07:00
|
|
|
do {
|
2013-08-13 03:45:55 +07:00
|
|
|
err = _nfs4_proc_symlink(dir, dentry, page, len, sattr, label);
|
|
|
|
trace_nfs4_symlink(dir, &dentry->d_name, err);
|
|
|
|
err = nfs4_handle_exception(NFS_SERVER(dir), err,
|
2005-04-17 05:20:36 +07:00
|
|
|
&exception);
|
|
|
|
} while (exception.retry);
|
2013-05-22 23:50:44 +07:00
|
|
|
|
|
|
|
nfs4_label_release_security(label);
|
2005-04-17 05:20:36 +07:00
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int _nfs4_proc_mkdir(struct inode *dir, struct dentry *dentry,
|
2013-05-22 23:50:42 +07:00
|
|
|
struct iattr *sattr, struct nfs4_label *label)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
2008-06-21 02:35:32 +07:00
|
|
|
struct nfs4_createdata *data;
|
|
|
|
int status = -ENOMEM;
|
2005-04-17 05:20:36 +07:00
|
|
|
|
2008-06-21 02:35:32 +07:00
|
|
|
data = nfs4_alloc_createdata(dir, &dentry->d_name, sattr, NF4DIR);
|
|
|
|
if (data == NULL)
|
|
|
|
goto out;
|
|
|
|
|
2013-05-22 23:50:42 +07:00
|
|
|
data->arg.label = label;
|
2008-06-21 02:35:32 +07:00
|
|
|
status = nfs4_do_create(dir, dentry, data);
|
|
|
|
|
|
|
|
nfs4_free_createdata(data);
|
|
|
|
out:
|
2005-04-17 05:20:36 +07:00
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int nfs4_proc_mkdir(struct inode *dir, struct dentry *dentry,
|
|
|
|
struct iattr *sattr)
|
|
|
|
{
|
2016-12-03 10:53:30 +07:00
|
|
|
struct nfs_server *server = NFS_SERVER(dir);
|
2005-04-17 05:20:36 +07:00
|
|
|
struct nfs4_exception exception = { };
|
2013-05-22 23:50:44 +07:00
|
|
|
struct nfs4_label l, *label = NULL;
|
2005-04-17 05:20:36 +07:00
|
|
|
int err;
|
2010-12-09 18:35:14 +07:00
|
|
|
|
2013-05-22 23:50:44 +07:00
|
|
|
label = nfs4_label_init_security(dir, dentry, sattr, &l);
|
|
|
|
|
2016-12-03 10:53:30 +07:00
|
|
|
if (!(server->attr_bitmask[2] & FATTR4_WORD2_MODE_UMASK))
|
|
|
|
sattr->ia_mode &= ~current_umask();
|
2005-04-17 05:20:36 +07:00
|
|
|
do {
|
2013-08-13 03:45:55 +07:00
|
|
|
err = _nfs4_proc_mkdir(dir, dentry, sattr, label);
|
|
|
|
trace_nfs4_mkdir(dir, &dentry->d_name, err);
|
|
|
|
err = nfs4_handle_exception(NFS_SERVER(dir), err,
|
2005-04-17 05:20:36 +07:00
|
|
|
&exception);
|
|
|
|
} while (exception.retry);
|
2013-05-22 23:50:44 +07:00
|
|
|
nfs4_label_release_security(label);
|
|
|
|
|
2005-04-17 05:20:36 +07:00
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int _nfs4_proc_readdir(struct dentry *dentry, struct rpc_cred *cred,
|
2017-06-20 19:33:44 +07:00
|
|
|
u64 cookie, struct page **pages, unsigned int count, bool plus)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
2015-03-18 05:25:59 +07:00
|
|
|
struct inode *dir = d_inode(dentry);
|
2005-04-17 05:20:36 +07:00
|
|
|
struct nfs4_readdir_arg args = {
|
|
|
|
.fh = NFS_FH(dir),
|
2010-10-21 02:44:37 +07:00
|
|
|
.pages = pages,
|
2005-04-17 05:20:36 +07:00
|
|
|
.pgbase = 0,
|
|
|
|
.count = count,
|
2015-03-18 05:25:59 +07:00
|
|
|
.bitmask = NFS_SERVER(d_inode(dentry))->attr_bitmask,
|
NFS: Readdir plus in v4
By requsting more attributes during a readdir, we can mimic the readdir plus
operation that was in NFSv3.
To test, I ran the command `ls -lU --color=none` on directories with various
numbers of files. Without readdir plus, I see this:
n files | 100 | 1,000 | 10,000 | 100,000 | 1,000,000
--------+-----------+-----------+-----------+-----------+----------
real | 0m00.153s | 0m00.589s | 0m05.601s | 0m56.691s | 9m59.128s
user | 0m00.007s | 0m00.007s | 0m00.077s | 0m00.703s | 0m06.800s
sys | 0m00.010s | 0m00.070s | 0m00.633s | 0m06.423s | 1m10.005s
access | 3 | 1 | 1 | 4 | 31
getattr | 2 | 1 | 1 | 1 | 1
lookup | 104 | 1,003 | 10,003 | 100,003 | 1,000,003
readdir | 2 | 16 | 158 | 1,575 | 15,749
total | 111 | 1,021 | 10,163 | 101,583 | 1,015,784
With readdir plus enabled, I see this:
n files | 100 | 1,000 | 10,000 | 100,000 | 1,000,000
--------+-----------+-----------+-----------+-----------+----------
real | 0m00.115s | 0m00.206s | 0m01.079s | 0m12.521s | 2m07.528s
user | 0m00.003s | 0m00.003s | 0m00.040s | 0m00.290s | 0m03.296s
sys | 0m00.007s | 0m00.020s | 0m00.120s | 0m01.357s | 0m17.556s
access | 3 | 1 | 1 | 1 | 7
getattr | 2 | 1 | 1 | 1 | 1
lookup | 4 | 3 | 3 | 3 | 3
readdir | 6 | 62 | 630 | 6,300 | 62,993
total | 15 | 67 | 635 | 6,305 | 63,004
Readdir plus disabled has about a 16x increase in the number of rpc calls and
is 4 - 5 times slower on large directories.
Signed-off-by: Bryan Schumaker <bjschuma@netapp.com>
Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
2010-10-22 03:33:18 +07:00
|
|
|
.plus = plus,
|
2005-04-17 05:20:36 +07:00
|
|
|
};
|
|
|
|
struct nfs4_readdir_res res;
|
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_READDIR],
|
|
|
|
.rpc_argp = &args,
|
|
|
|
.rpc_resp = &res,
|
|
|
|
.rpc_cred = cred,
|
|
|
|
};
|
|
|
|
int status;
|
|
|
|
|
2013-09-16 21:53:17 +07:00
|
|
|
dprintk("%s: dentry = %pd2, cookie = %Lu\n", __func__,
|
|
|
|
dentry,
|
2005-06-23 00:16:39 +07:00
|
|
|
(unsigned long long)cookie);
|
2012-09-04 01:56:02 +07:00
|
|
|
nfs4_setup_readdir(cookie, NFS_I(dir)->cookieverf, dentry, &args);
|
2005-04-17 05:20:36 +07:00
|
|
|
res.pgbase = args.pgbase;
|
2011-03-25 00:12:24 +07:00
|
|
|
status = nfs4_call_sync(NFS_SERVER(dir)->client, NFS_SERVER(dir), &msg, &args.seq_args, &res.seq_res, 0);
|
2010-11-16 08:26:22 +07:00
|
|
|
if (status >= 0) {
|
2012-09-04 01:56:02 +07:00
|
|
|
memcpy(NFS_I(dir)->cookieverf, res.verifier.data, NFS4_VERIFIER_SIZE);
|
2010-11-16 08:26:22 +07:00
|
|
|
status += args.pgbase;
|
|
|
|
}
|
2007-09-29 04:11:45 +07:00
|
|
|
|
|
|
|
nfs_invalidate_atime(dir);
|
|
|
|
|
2008-05-03 03:42:44 +07:00
|
|
|
dprintk("%s: returns %d\n", __func__, status);
|
2005-04-17 05:20:36 +07:00
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int nfs4_proc_readdir(struct dentry *dentry, struct rpc_cred *cred,
|
2017-06-20 19:33:44 +07:00
|
|
|
u64 cookie, struct page **pages, unsigned int count, bool plus)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
|
|
|
struct nfs4_exception exception = { };
|
|
|
|
int err;
|
|
|
|
do {
|
2013-08-13 03:58:42 +07:00
|
|
|
err = _nfs4_proc_readdir(dentry, cred, cookie,
|
|
|
|
pages, count, plus);
|
2015-03-18 05:25:59 +07:00
|
|
|
trace_nfs4_readdir(d_inode(dentry), err);
|
|
|
|
err = nfs4_handle_exception(NFS_SERVER(d_inode(dentry)), err,
|
2005-04-17 05:20:36 +07:00
|
|
|
&exception);
|
|
|
|
} while (exception.retry);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * Make one attempt at creating the special file @dentry in @dir.
 *
 * The create data starts out typed as a socket (NF4SOCK) and is then
 * adjusted from the file-type bits of @sattr->ia_mode: FIFOs become
 * NF4FIFO; block and character devices become NF4BLK / NF4CHR and carry
 * the major and minor numbers of @rdev.  Any other non-socket type is
 * rejected.
 *
 * Returns -ENOMEM if the create data cannot be allocated, -EINVAL for an
 * unsupported file type, otherwise the result of nfs4_do_create().
 */
static int _nfs4_proc_mknod(struct inode *dir, struct dentry *dentry,
			    struct iattr *sattr, struct nfs4_label *label, dev_t rdev)
{
	struct nfs4_createdata *cd;
	int mode = sattr->ia_mode;
	int ret = -ENOMEM;

	cd = nfs4_alloc_createdata(dir, &dentry->d_name, sattr, NF4SOCK);
	if (cd == NULL)
		return ret;

	switch (mode & S_IFMT) {
	case S_IFIFO:
		cd->arg.ftype = NF4FIFO;
		break;
	case S_IFBLK:
		cd->arg.ftype = NF4BLK;
		cd->arg.u.device.specdata1 = MAJOR(rdev);
		cd->arg.u.device.specdata2 = MINOR(rdev);
		break;
	case S_IFCHR:
		cd->arg.ftype = NF4CHR;
		cd->arg.u.device.specdata1 = MAJOR(rdev);
		cd->arg.u.device.specdata2 = MINOR(rdev);
		break;
	case S_IFSOCK:
		/* Already set up as NF4SOCK by the allocation above. */
		break;
	default:
		ret = -EINVAL;
		goto release;
	}

	cd->arg.label = label;
	ret = nfs4_do_create(dir, dentry, cd);
release:
	nfs4_free_createdata(cd);
	return ret;
}
|
|
|
|
|
|
|
|
/*
 * Create a special file with exception handling.
 *
 * A security label is set up once.  If the server does not advertise
 * FATTR4_WORD2_MODE_UMASK, the caller's umask is applied to
 * @sattr->ia_mode on the client.  _nfs4_proc_mknod() is then repeated
 * for as long as nfs4_handle_exception() asks for a retry.
 */
static int nfs4_proc_mknod(struct inode *dir, struct dentry *dentry,
			   struct iattr *sattr, dev_t rdev)
{
	struct nfs_server *server = NFS_SERVER(dir);
	struct nfs4_exception exc = { };
	struct nfs4_label l, *label = NULL;
	int ret;

	label = nfs4_label_init_security(dir, dentry, sattr, &l);

	if ((server->attr_bitmask[2] & FATTR4_WORD2_MODE_UMASK) == 0)
		sattr->ia_mode &= ~current_umask();

	do {
		ret = _nfs4_proc_mknod(dir, dentry, sattr, label, rdev);
		trace_nfs4_mknod(dir, &dentry->d_name, ret);
		ret = nfs4_handle_exception(server, ret, &exc);
	} while (exc.retry);

	nfs4_label_release_security(label);
	return ret;
}
|
|
|
|
|
|
|
|
static int _nfs4_proc_statfs(struct nfs_server *server, struct nfs_fh *fhandle,
|
|
|
|
struct nfs_fsstat *fsstat)
|
|
|
|
{
|
|
|
|
struct nfs4_statfs_arg args = {
|
|
|
|
.fh = fhandle,
|
|
|
|
.bitmask = server->attr_bitmask,
|
|
|
|
};
|
2009-04-01 20:21:56 +07:00
|
|
|
struct nfs4_statfs_res res = {
|
|
|
|
.fsstat = fsstat,
|
|
|
|
};
|
2005-04-17 05:20:36 +07:00
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_STATFS],
|
|
|
|
.rpc_argp = &args,
|
2009-04-01 20:21:56 +07:00
|
|
|
.rpc_resp = &res,
|
2005-04-17 05:20:36 +07:00
|
|
|
};
|
|
|
|
|
2005-10-28 09:12:38 +07:00
|
|
|
nfs_fattr_init(fsstat->fattr);
|
2011-03-25 00:12:24 +07:00
|
|
|
return nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
static int nfs4_proc_statfs(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fsstat *fsstat)
|
|
|
|
{
|
|
|
|
struct nfs4_exception exception = { };
|
|
|
|
int err;
|
|
|
|
do {
|
|
|
|
err = nfs4_handle_exception(server,
|
|
|
|
_nfs4_proc_statfs(server, fhandle, fsstat),
|
|
|
|
&exception);
|
|
|
|
} while (exception.retry);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int _nfs4_do_fsinfo(struct nfs_server *server, struct nfs_fh *fhandle,
|
|
|
|
struct nfs_fsinfo *fsinfo)
|
|
|
|
{
|
|
|
|
struct nfs4_fsinfo_arg args = {
|
|
|
|
.fh = fhandle,
|
|
|
|
.bitmask = server->attr_bitmask,
|
|
|
|
};
|
2009-04-01 20:21:57 +07:00
|
|
|
struct nfs4_fsinfo_res res = {
|
|
|
|
.fsinfo = fsinfo,
|
|
|
|
};
|
2005-04-17 05:20:36 +07:00
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_FSINFO],
|
|
|
|
.rpc_argp = &args,
|
2009-04-01 20:21:57 +07:00
|
|
|
.rpc_resp = &res,
|
2005-04-17 05:20:36 +07:00
|
|
|
};
|
|
|
|
|
2011-03-25 00:12:24 +07:00
|
|
|
return nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
static int nfs4_do_fsinfo(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fsinfo *fsinfo)
|
|
|
|
{
|
|
|
|
struct nfs4_exception exception = { };
|
2013-03-17 02:55:53 +07:00
|
|
|
unsigned long now = jiffies;
|
2005-04-17 05:20:36 +07:00
|
|
|
int err;
|
|
|
|
|
|
|
|
do {
|
2013-03-17 02:55:53 +07:00
|
|
|
err = _nfs4_do_fsinfo(server, fhandle, fsinfo);
|
2013-08-14 00:01:39 +07:00
|
|
|
trace_nfs4_fsinfo(server, fhandle, fsinfo->fattr, err);
|
2013-03-17 02:55:53 +07:00
|
|
|
if (err == 0) {
|
2016-08-06 06:13:08 +07:00
|
|
|
nfs4_set_lease_period(server->nfs_client,
|
|
|
|
fsinfo->lease_time * HZ,
|
|
|
|
now);
|
2013-03-17 02:55:53 +07:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
err = nfs4_handle_exception(server, err, &exception);
|
2005-04-17 05:20:36 +07:00
|
|
|
} while (exception.retry);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int nfs4_proc_fsinfo(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fsinfo *fsinfo)
|
|
|
|
{
|
2012-06-21 02:53:40 +07:00
|
|
|
int error;
|
|
|
|
|
2005-10-28 09:12:38 +07:00
|
|
|
nfs_fattr_init(fsinfo->fattr);
|
2012-06-21 02:53:40 +07:00
|
|
|
error = nfs4_do_fsinfo(server, fhandle, fsinfo);
|
2012-08-23 23:27:49 +07:00
|
|
|
if (error == 0) {
|
|
|
|
/* block layout checks this! */
|
|
|
|
server->pnfs_blksize = fsinfo->blksize;
|
2016-09-16 01:40:49 +07:00
|
|
|
set_pnfs_layoutdriver(server, fhandle, fsinfo);
|
2012-08-23 23:27:49 +07:00
|
|
|
}
|
2012-06-21 02:53:40 +07:00
|
|
|
|
|
|
|
return error;
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
static int _nfs4_proc_pathconf(struct nfs_server *server, struct nfs_fh *fhandle,
|
|
|
|
struct nfs_pathconf *pathconf)
|
|
|
|
{
|
|
|
|
struct nfs4_pathconf_arg args = {
|
|
|
|
.fh = fhandle,
|
|
|
|
.bitmask = server->attr_bitmask,
|
|
|
|
};
|
2009-04-01 20:21:58 +07:00
|
|
|
struct nfs4_pathconf_res res = {
|
|
|
|
.pathconf = pathconf,
|
|
|
|
};
|
2005-04-17 05:20:36 +07:00
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_PATHCONF],
|
|
|
|
.rpc_argp = &args,
|
2009-04-01 20:21:58 +07:00
|
|
|
.rpc_resp = &res,
|
2005-04-17 05:20:36 +07:00
|
|
|
};
|
|
|
|
|
|
|
|
/* None of the pathconf attributes are mandatory to implement */
|
|
|
|
if ((args.bitmask[0] & nfs4_pathconf_bitmap[0]) == 0) {
|
|
|
|
memset(pathconf, 0, sizeof(*pathconf));
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2005-10-28 09:12:38 +07:00
|
|
|
nfs_fattr_init(pathconf->fattr);
|
2011-03-25 00:12:24 +07:00
|
|
|
return nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
static int nfs4_proc_pathconf(struct nfs_server *server, struct nfs_fh *fhandle,
|
|
|
|
struct nfs_pathconf *pathconf)
|
|
|
|
{
|
|
|
|
struct nfs4_exception exception = { };
|
|
|
|
int err;
|
|
|
|
|
|
|
|
do {
|
|
|
|
err = nfs4_handle_exception(server,
|
|
|
|
_nfs4_proc_pathconf(server, fhandle, pathconf),
|
|
|
|
&exception);
|
|
|
|
} while (exception.retry);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
2013-03-17 07:54:34 +07:00
|
|
|
int nfs4_set_rw_stateid(nfs4_stateid *stateid,
|
2013-03-18 02:52:00 +07:00
|
|
|
const struct nfs_open_context *ctx,
|
|
|
|
const struct nfs_lock_context *l_ctx,
|
|
|
|
fmode_t fmode)
|
|
|
|
{
|
2016-10-13 11:26:47 +07:00
|
|
|
return nfs4_select_rw_stateid(ctx->state, fmode, l_ctx, stateid, NULL);
|
2013-03-18 02:52:00 +07:00
|
|
|
}
|
|
|
|
EXPORT_SYMBOL_GPL(nfs4_set_rw_stateid);
|
|
|
|
|
2013-03-17 07:54:34 +07:00
|
|
|
static bool nfs4_stateid_is_current(nfs4_stateid *stateid,
|
|
|
|
const struct nfs_open_context *ctx,
|
|
|
|
const struct nfs_lock_context *l_ctx,
|
|
|
|
fmode_t fmode)
|
|
|
|
{
|
|
|
|
nfs4_stateid current_stateid;
|
|
|
|
|
2014-03-05 20:44:23 +07:00
|
|
|
/* If the current stateid represents a lost lock, then exit */
|
|
|
|
if (nfs4_set_rw_stateid(¤t_stateid, ctx, l_ctx, fmode) == -EIO)
|
|
|
|
return true;
|
2013-03-17 07:54:34 +07:00
|
|
|
return nfs4_stateid_match(stateid, ¤t_stateid);
|
|
|
|
}
|
|
|
|
|
|
|
|
static bool nfs4_error_stateid_expired(int err)
|
|
|
|
{
|
|
|
|
switch (err) {
|
|
|
|
case -NFS4ERR_DELEG_REVOKED:
|
|
|
|
case -NFS4ERR_ADMIN_REVOKED:
|
|
|
|
case -NFS4ERR_BAD_STATEID:
|
|
|
|
case -NFS4ERR_STALE_STATEID:
|
|
|
|
case -NFS4ERR_OLD_STATEID:
|
|
|
|
case -NFS4ERR_OPENMODE:
|
|
|
|
case -NFS4ERR_EXPIRED:
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2014-06-09 22:48:35 +07:00
|
|
|
static int nfs4_read_done_cb(struct rpc_task *task, struct nfs_pgio_header *hdr)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
2014-06-09 22:48:35 +07:00
|
|
|
struct nfs_server *server = NFS_SERVER(hdr->inode);
|
2005-04-17 05:20:36 +07:00
|
|
|
|
2014-06-09 22:48:35 +07:00
|
|
|
trace_nfs4_read(hdr, task->tk_status);
|
2016-09-23 00:39:11 +07:00
|
|
|
if (task->tk_status < 0) {
|
|
|
|
struct nfs4_exception exception = {
|
|
|
|
.inode = hdr->inode,
|
|
|
|
.state = hdr->args.context->state,
|
|
|
|
.stateid = &hdr->args.stateid,
|
|
|
|
};
|
|
|
|
task->tk_status = nfs4_async_handle_exception(task,
|
|
|
|
server, task->tk_status, &exception);
|
|
|
|
if (exception.retry) {
|
|
|
|
rpc_restart_call_prepare(task);
|
|
|
|
return -EAGAIN;
|
|
|
|
}
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
2007-09-29 04:20:07 +07:00
|
|
|
|
2005-04-17 05:20:36 +07:00
|
|
|
if (task->tk_status > 0)
|
2014-06-09 22:48:35 +07:00
|
|
|
renew_lease(server, hdr->timestamp);
|
2006-03-21 01:44:27 +07:00
|
|
|
return 0;
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
2013-03-17 07:54:34 +07:00
|
|
|
static bool nfs4_read_stateid_changed(struct rpc_task *task,
|
2014-05-06 20:12:24 +07:00
|
|
|
struct nfs_pgio_args *args)
|
2013-03-17 07:54:34 +07:00
|
|
|
{
|
|
|
|
|
|
|
|
if (!nfs4_error_stateid_expired(task->tk_status) ||
|
|
|
|
nfs4_stateid_is_current(&args->stateid,
|
|
|
|
args->context,
|
|
|
|
args->lock_context,
|
|
|
|
FMODE_READ))
|
|
|
|
return false;
|
|
|
|
rpc_restart_call_prepare(task);
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2014-06-09 22:48:35 +07:00
|
|
|
static int nfs4_read_done(struct rpc_task *task, struct nfs_pgio_header *hdr)
|
2011-03-01 08:34:20 +07:00
|
|
|
{
|
|
|
|
|
|
|
|
dprintk("--> %s\n", __func__);
|
|
|
|
|
2014-06-09 22:48:35 +07:00
|
|
|
if (!nfs4_sequence_done(task, &hdr->res.seq_res))
|
2011-03-01 08:34:20 +07:00
|
|
|
return -EAGAIN;
|
2014-06-09 22:48:35 +07:00
|
|
|
if (nfs4_read_stateid_changed(task, &hdr->args))
|
2013-03-17 07:54:34 +07:00
|
|
|
return -EAGAIN;
|
2016-09-16 05:26:05 +07:00
|
|
|
if (task->tk_status > 0)
|
|
|
|
nfs_invalidate_atime(hdr->inode);
|
2014-06-09 22:48:35 +07:00
|
|
|
return hdr->pgio_done_cb ? hdr->pgio_done_cb(task, hdr) :
|
|
|
|
nfs4_read_done_cb(task, hdr);
|
2011-03-01 08:34:20 +07:00
|
|
|
}
|
|
|
|
|
2014-06-09 22:48:35 +07:00
|
|
|
static void nfs4_proc_read_setup(struct nfs_pgio_header *hdr,
|
|
|
|
struct rpc_message *msg)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
2014-06-09 22:48:35 +07:00
|
|
|
hdr->timestamp = jiffies;
|
2016-06-29 00:54:09 +07:00
|
|
|
if (!hdr->pgio_done_cb)
|
|
|
|
hdr->pgio_done_cb = nfs4_read_done_cb;
|
2007-07-15 02:40:00 +07:00
|
|
|
msg->rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_READ];
|
2018-05-05 03:22:50 +07:00
|
|
|
nfs4_init_sequence(&hdr->args.seq_args, &hdr->res.seq_res, 0, 0);
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
2014-06-09 22:48:35 +07:00
|
|
|
static int nfs4_proc_pgio_rpc_prepare(struct rpc_task *task,
|
|
|
|
struct nfs_pgio_header *hdr)
|
2012-03-20 01:54:40 +07:00
|
|
|
{
|
2017-01-10 03:48:22 +07:00
|
|
|
if (nfs4_setup_sequence(NFS_SERVER(hdr->inode)->nfs_client,
|
2014-06-09 22:48:35 +07:00
|
|
|
&hdr->args.seq_args,
|
|
|
|
&hdr->res.seq_res,
|
2013-03-18 02:52:00 +07:00
|
|
|
task))
|
2013-09-04 14:04:49 +07:00
|
|
|
return 0;
|
2014-06-09 22:48:35 +07:00
|
|
|
if (nfs4_set_rw_stateid(&hdr->args.stateid, hdr->args.context,
|
|
|
|
hdr->args.lock_context,
|
2017-04-19 21:11:35 +07:00
|
|
|
hdr->rw_mode) == -EIO)
|
2013-09-04 14:04:49 +07:00
|
|
|
return -EIO;
|
2014-06-09 22:48:35 +07:00
|
|
|
if (unlikely(test_bit(NFS_CONTEXT_BAD, &hdr->args.context->flags)))
|
2013-09-04 14:04:49 +07:00
|
|
|
return -EIO;
|
|
|
|
return 0;
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
2014-06-09 22:48:35 +07:00
|
|
|
static int nfs4_write_done_cb(struct rpc_task *task,
|
|
|
|
struct nfs_pgio_header *hdr)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
2014-06-09 22:48:35 +07:00
|
|
|
struct inode *inode = hdr->inode;
|
2014-09-18 13:09:27 +07:00
|
|
|
|
2014-06-09 22:48:35 +07:00
|
|
|
trace_nfs4_write(hdr, task->tk_status);
|
2016-09-23 00:39:11 +07:00
|
|
|
if (task->tk_status < 0) {
|
|
|
|
struct nfs4_exception exception = {
|
|
|
|
.inode = hdr->inode,
|
|
|
|
.state = hdr->args.context->state,
|
|
|
|
.stateid = &hdr->args.stateid,
|
|
|
|
};
|
|
|
|
task->tk_status = nfs4_async_handle_exception(task,
|
|
|
|
NFS_SERVER(inode), task->tk_status,
|
|
|
|
&exception);
|
|
|
|
if (exception.retry) {
|
|
|
|
rpc_restart_call_prepare(task);
|
|
|
|
return -EAGAIN;
|
|
|
|
}
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
2005-10-28 09:12:44 +07:00
|
|
|
if (task->tk_status >= 0) {
|
2014-06-09 22:48:35 +07:00
|
|
|
renew_lease(NFS_SERVER(inode), hdr->timestamp);
|
2015-02-27 05:36:09 +07:00
|
|
|
nfs_writeback_update_inode(hdr);
|
2005-10-28 09:12:44 +07:00
|
|
|
}
|
2006-03-21 01:44:27 +07:00
|
|
|
return 0;
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
2013-03-17 07:54:34 +07:00
|
|
|
static bool nfs4_write_stateid_changed(struct rpc_task *task,
|
2014-05-06 20:12:24 +07:00
|
|
|
struct nfs_pgio_args *args)
|
2013-03-17 07:54:34 +07:00
|
|
|
{
|
|
|
|
|
|
|
|
if (!nfs4_error_stateid_expired(task->tk_status) ||
|
|
|
|
nfs4_stateid_is_current(&args->stateid,
|
|
|
|
args->context,
|
|
|
|
args->lock_context,
|
|
|
|
FMODE_WRITE))
|
|
|
|
return false;
|
|
|
|
rpc_restart_call_prepare(task);
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2014-06-09 22:48:35 +07:00
|
|
|
static int nfs4_write_done(struct rpc_task *task, struct nfs_pgio_header *hdr)
|
2011-03-03 22:13:42 +07:00
|
|
|
{
|
2014-06-09 22:48:35 +07:00
|
|
|
if (!nfs4_sequence_done(task, &hdr->res.seq_res))
|
2011-03-03 22:13:42 +07:00
|
|
|
return -EAGAIN;
|
2014-06-09 22:48:35 +07:00
|
|
|
if (nfs4_write_stateid_changed(task, &hdr->args))
|
2013-03-17 07:54:34 +07:00
|
|
|
return -EAGAIN;
|
2014-06-09 22:48:35 +07:00
|
|
|
return hdr->pgio_done_cb ? hdr->pgio_done_cb(task, hdr) :
|
|
|
|
nfs4_write_done_cb(task, hdr);
|
2011-03-03 22:13:42 +07:00
|
|
|
}
|
|
|
|
|
2012-04-29 01:55:16 +07:00
|
|
|
static
|
2014-06-09 22:48:35 +07:00
|
|
|
bool nfs4_write_need_cache_consistency_data(struct nfs_pgio_header *hdr)
|
2011-03-03 22:13:47 +07:00
|
|
|
{
|
2012-04-29 01:55:16 +07:00
|
|
|
/* Don't request attributes for pNFS or O_DIRECT writes */
|
2014-06-09 22:48:35 +07:00
|
|
|
if (hdr->ds_clp != NULL || hdr->dreq != NULL)
|
2012-04-29 01:55:16 +07:00
|
|
|
return false;
|
|
|
|
/* Otherwise, request attributes if and only if we don't hold
|
|
|
|
* a delegation
|
|
|
|
*/
|
2012-06-21 02:53:43 +07:00
|
|
|
return nfs4_have_delegation(hdr->inode, FMODE_READ) == 0;
|
2011-03-03 22:13:47 +07:00
|
|
|
}
|
|
|
|
|
2014-06-09 22:48:35 +07:00
|
|
|
static void nfs4_proc_write_setup(struct nfs_pgio_header *hdr,
|
2018-05-05 03:22:48 +07:00
|
|
|
struct rpc_message *msg,
|
|
|
|
struct rpc_clnt **clnt)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
2014-06-09 22:48:35 +07:00
|
|
|
struct nfs_server *server = NFS_SERVER(hdr->inode);
|
2007-07-15 02:40:00 +07:00
|
|
|
|
2014-06-09 22:48:35 +07:00
|
|
|
if (!nfs4_write_need_cache_consistency_data(hdr)) {
|
|
|
|
hdr->args.bitmask = NULL;
|
|
|
|
hdr->res.fattr = NULL;
|
2011-03-03 22:13:46 +07:00
|
|
|
} else
|
2014-06-09 22:48:35 +07:00
|
|
|
hdr->args.bitmask = server->cache_consistency_bitmask;
|
2012-04-29 01:55:16 +07:00
|
|
|
|
2014-06-09 22:48:35 +07:00
|
|
|
if (!hdr->pgio_done_cb)
|
|
|
|
hdr->pgio_done_cb = nfs4_write_done_cb;
|
|
|
|
hdr->res.server = server;
|
|
|
|
hdr->timestamp = jiffies;
|
2005-04-17 05:20:36 +07:00
|
|
|
|
2007-07-15 02:40:00 +07:00
|
|
|
msg->rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_WRITE];
|
2018-05-05 03:22:50 +07:00
|
|
|
nfs4_init_sequence(&hdr->args.seq_args, &hdr->res.seq_res, 1, 0);
|
2018-05-05 03:22:48 +07:00
|
|
|
nfs4_state_protect_write(server->nfs_client, clnt, msg, hdr);
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
2012-04-21 01:47:39 +07:00
|
|
|
static void nfs4_proc_commit_rpc_prepare(struct rpc_task *task, struct nfs_commit_data *data)
|
2012-03-20 01:54:39 +07:00
|
|
|
{
|
2017-01-10 03:48:22 +07:00
|
|
|
nfs4_setup_sequence(NFS_SERVER(data->inode)->nfs_client,
|
2012-10-23 07:28:44 +07:00
|
|
|
&data->args.seq_args,
|
|
|
|
&data->res.seq_res,
|
|
|
|
task);
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
2012-04-21 01:47:39 +07:00
|
|
|
static int nfs4_commit_done_cb(struct rpc_task *task, struct nfs_commit_data *data)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
|
|
|
struct inode *inode = data->inode;
|
2010-08-01 01:29:06 +07:00
|
|
|
|
2013-08-15 02:31:28 +07:00
|
|
|
trace_nfs4_commit(data, task->tk_status);
|
2014-09-18 13:09:27 +07:00
|
|
|
if (nfs4_async_handle_error(task, NFS_SERVER(inode),
|
|
|
|
NULL, NULL) == -EAGAIN) {
|
2011-10-20 02:17:29 +07:00
|
|
|
rpc_restart_call_prepare(task);
|
2006-03-21 01:44:27 +07:00
|
|
|
return -EAGAIN;
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
2006-03-21 01:44:27 +07:00
|
|
|
return 0;
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
2012-04-21 01:47:39 +07:00
|
|
|
static int nfs4_commit_done(struct rpc_task *task, struct nfs_commit_data *data)
|
2011-03-23 20:27:46 +07:00
|
|
|
{
|
|
|
|
if (!nfs4_sequence_done(task, &data->res.seq_res))
|
|
|
|
return -EAGAIN;
|
2012-04-21 01:47:39 +07:00
|
|
|
return data->commit_done_cb(task, data);
|
2011-03-23 20:27:46 +07:00
|
|
|
}
|
|
|
|
|
2018-05-05 03:22:49 +07:00
|
|
|
static void nfs4_proc_commit_setup(struct nfs_commit_data *data, struct rpc_message *msg,
|
|
|
|
struct rpc_clnt **clnt)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
2006-03-21 01:44:27 +07:00
|
|
|
struct nfs_server *server = NFS_SERVER(data->inode);
|
2011-03-23 20:27:52 +07:00
|
|
|
|
2012-04-21 01:47:39 +07:00
|
|
|
if (data->commit_done_cb == NULL)
|
|
|
|
data->commit_done_cb = nfs4_commit_done_cb;
|
2005-10-28 09:12:44 +07:00
|
|
|
data->res.server = server;
|
2007-07-15 02:40:00 +07:00
|
|
|
msg->rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_COMMIT];
|
2018-05-05 03:22:50 +07:00
|
|
|
nfs4_init_sequence(&data->args.seq_args, &data->res.seq_res, 1, 0);
|
2018-05-05 03:22:49 +07:00
|
|
|
nfs4_state_protect(server->nfs_client, NFS_SP4_MACH_CRED_COMMIT, clnt, msg);
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
2010-05-08 00:34:17 +07:00
|
|
|
/* Per-call state handed to the asynchronous RENEW callbacks. */
struct nfs4_renewdata {
	/* Client being renewed; a reference is held for the call's lifetime. */
	struct nfs_client	*client;
	/* jiffies value sampled when the RENEW was queued. */
	unsigned long		timestamp;
};
|
|
|
|
|
2005-04-17 05:20:36 +07:00
|
|
|
/*
|
|
|
|
* nfs4_proc_async_renew(): This is not one of the nfs_rpc_ops; it is a special
|
|
|
|
* standalone procedure for queueing an asynchronous RENEW.
|
|
|
|
*/
|
2010-05-08 00:34:17 +07:00
|
|
|
static void nfs4_renew_release(void *calldata)
|
2010-02-05 18:45:04 +07:00
|
|
|
{
|
2010-05-08 00:34:17 +07:00
|
|
|
struct nfs4_renewdata *data = calldata;
|
|
|
|
struct nfs_client *clp = data->client;
|
2010-02-05 18:45:04 +07:00
|
|
|
|
2017-10-20 16:53:38 +07:00
|
|
|
if (refcount_read(&clp->cl_count) > 1)
|
2010-02-05 18:45:06 +07:00
|
|
|
nfs4_schedule_state_renewal(clp);
|
|
|
|
nfs_put_client(clp);
|
2010-05-08 00:34:17 +07:00
|
|
|
kfree(data);
|
2010-02-05 18:45:04 +07:00
|
|
|
}
|
|
|
|
|
2010-05-08 00:34:17 +07:00
|
|
|
static void nfs4_renew_done(struct rpc_task *task, void *calldata)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
2010-05-08 00:34:17 +07:00
|
|
|
struct nfs4_renewdata *data = calldata;
|
|
|
|
struct nfs_client *clp = data->client;
|
|
|
|
unsigned long timestamp = data->timestamp;
|
2005-04-17 05:20:36 +07:00
|
|
|
|
2013-08-09 22:51:26 +07:00
|
|
|
trace_nfs4_renew_async(clp, task->tk_status);
|
2013-10-18 01:13:53 +07:00
|
|
|
switch (task->tk_status) {
|
|
|
|
case 0:
|
|
|
|
break;
|
|
|
|
case -NFS4ERR_LEASE_MOVED:
|
|
|
|
nfs4_schedule_lease_moved_recovery(clp);
|
|
|
|
break;
|
|
|
|
default:
|
2009-05-27 01:51:00 +07:00
|
|
|
/* Unless we're shutting down, schedule state recovery! */
|
2011-08-25 02:07:37 +07:00
|
|
|
if (test_bit(NFS_CS_RENEWD, &clp->cl_res_state) == 0)
|
|
|
|
return;
|
|
|
|
if (task->tk_status != NFS4ERR_CB_PATH_DOWN) {
|
2011-03-10 04:00:53 +07:00
|
|
|
nfs4_schedule_lease_recovery(clp);
|
2011-08-25 02:07:37 +07:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
nfs4_schedule_path_down_recovery(clp);
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
2010-08-01 01:29:06 +07:00
|
|
|
do_renew_lease(clp, timestamp);
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
2006-01-03 15:55:04 +07:00
|
|
|
static const struct rpc_call_ops nfs4_renew_ops = {
|
|
|
|
.rpc_call_done = nfs4_renew_done,
|
2010-02-05 18:45:04 +07:00
|
|
|
.rpc_release = nfs4_renew_release,
|
2006-01-03 15:55:04 +07:00
|
|
|
};
|
|
|
|
|
2011-08-25 02:07:37 +07:00
|
|
|
static int nfs4_proc_async_renew(struct nfs_client *clp, struct rpc_cred *cred, unsigned renew_flags)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_RENEW],
|
|
|
|
.rpc_argp = clp,
|
2006-01-03 15:55:25 +07:00
|
|
|
.rpc_cred = cred,
|
2005-04-17 05:20:36 +07:00
|
|
|
};
|
2010-05-08 00:34:17 +07:00
|
|
|
struct nfs4_renewdata *data;
|
2005-04-17 05:20:36 +07:00
|
|
|
|
2011-08-25 02:07:37 +07:00
|
|
|
if (renew_flags == 0)
|
|
|
|
return 0;
|
2017-10-20 16:53:38 +07:00
|
|
|
if (!refcount_inc_not_zero(&clp->cl_count))
|
2010-02-05 18:45:06 +07:00
|
|
|
return -EIO;
|
2011-08-25 02:07:35 +07:00
|
|
|
data = kmalloc(sizeof(*data), GFP_NOFS);
|
2017-04-27 21:45:15 +07:00
|
|
|
if (data == NULL) {
|
|
|
|
nfs_put_client(clp);
|
2010-05-08 00:34:17 +07:00
|
|
|
return -ENOMEM;
|
2017-04-27 21:45:15 +07:00
|
|
|
}
|
2010-05-08 00:34:17 +07:00
|
|
|
data->client = clp;
|
|
|
|
data->timestamp = jiffies;
|
2013-04-09 04:50:28 +07:00
|
|
|
return rpc_call_async(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT,
|
2010-05-08 00:34:17 +07:00
|
|
|
&nfs4_renew_ops, data);
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
2011-08-25 02:07:37 +07:00
|
|
|
static int nfs4_proc_renew(struct nfs_client *clp, struct rpc_cred *cred)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_RENEW],
|
|
|
|
.rpc_argp = clp,
|
2006-01-03 15:55:25 +07:00
|
|
|
.rpc_cred = cred,
|
2005-04-17 05:20:36 +07:00
|
|
|
};
|
|
|
|
unsigned long now = jiffies;
|
|
|
|
int status;
|
|
|
|
|
2013-04-09 04:50:28 +07:00
|
|
|
status = rpc_call_sync(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
|
2005-04-17 05:20:36 +07:00
|
|
|
if (status < 0)
|
|
|
|
return status;
|
2010-08-01 01:29:06 +07:00
|
|
|
do_renew_lease(clp, now);
|
2005-04-17 05:20:36 +07:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2005-06-23 00:16:22 +07:00
|
|
|
static inline int nfs4_server_supports_acls(struct nfs_server *server)
|
|
|
|
{
|
2014-01-23 21:54:55 +07:00
|
|
|
return server->caps & NFS_CAP_ACLS;
|
2005-06-23 00:16:22 +07:00
|
|
|
}
|
|
|
|
|
2012-08-24 21:59:25 +07:00
|
|
|
/* Assuming that XATTR_SIZE_MAX is a multiple of PAGE_SIZE, and that
|
|
|
|
 * it's OK to put sizeof(void *) * (XATTR_SIZE_MAX/PAGE_SIZE) bytes on
|
2005-06-23 00:16:22 +07:00
|
|
|
* the stack.
|
|
|
|
*/
|
2012-08-24 21:59:25 +07:00
|
|
|
#define NFS4ACL_MAXPAGES DIV_ROUND_UP(XATTR_SIZE_MAX, PAGE_SIZE)
|
2005-06-23 00:16:22 +07:00
|
|
|
|
nfs4: Ensure that ACL pages sent over NFS were not allocated from the slab (v3)
The "bad_page()" page allocator sanity check was reported recently (call
chain as follows):
bad_page+0x69/0x91
free_hot_cold_page+0x81/0x144
skb_release_data+0x5f/0x98
__kfree_skb+0x11/0x1a
tcp_ack+0x6a3/0x1868
tcp_rcv_established+0x7a6/0x8b9
tcp_v4_do_rcv+0x2a/0x2fa
tcp_v4_rcv+0x9a2/0x9f6
do_timer+0x2df/0x52c
ip_local_deliver+0x19d/0x263
ip_rcv+0x539/0x57c
netif_receive_skb+0x470/0x49f
:virtio_net:virtnet_poll+0x46b/0x5c5
net_rx_action+0xac/0x1b3
__do_softirq+0x89/0x133
call_softirq+0x1c/0x28
do_softirq+0x2c/0x7d
do_IRQ+0xec/0xf5
default_idle+0x0/0x50
ret_from_intr+0x0/0xa
default_idle+0x29/0x50
cpu_idle+0x95/0xb8
start_kernel+0x220/0x225
_sinittext+0x22f/0x236
It occurs because an skb with a fraglist was freed from the tcp
retransmit queue when it was acked, but a page on that fraglist had
PG_Slab set (indicating it was allocated from the Slab allocator (which
means the free path above can't safely free it via put_page.
We tracked this back to an nfsv4 setacl operation, in which the nfs code
attempted to fill convert the passed in buffer to an array of pages in
__nfs4_proc_set_acl, which gets used by the skb->frags list in
xs_sendpages. __nfs4_proc_set_acl just converts each page in the buffer
to a page struct via virt_to_page, but the vfs allocates the buffer via
kmalloc, meaning the PG_slab bit is set. We can't create a buffer with
kmalloc and free it later in the tcp ack path with put_page, so we need
to either:
1) ensure that when we create the list of pages, no page struct has
PG_Slab set
or
2) not use a page list to send this data
Given that these buffers can be multiple pages and arbitrarily sized, I
think (1) is the right way to go. I've written the below patch to
allocate a page from the buddy allocator directly and copy the data over
to it. This ensures that we have a put_page free-able page for every
entry that winds up on an skb frag list, so it can be safely freed when
the frame is acked. We do a put page on each entry after the
rpc_call_sync call so as to drop our own reference count to the page,
leaving only the ref count taken by tcp_sendpages. This way the data
will be properly freed when the ack comes in
Successfully tested by myself to solve the above oops.
Note, as this is the result of a setacl operation that exceeded a page
of data, I think this amounts to a local DOS triggerable by an
uprivlidged user, so I'm CCing security on this as well.
Signed-off-by: Neil Horman <nhorman@tuxdriver.com>
CC: Trond Myklebust <Trond.Myklebust@netapp.com>
CC: security@kernel.org
CC: Jeff Layton <jlayton@redhat.com>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2011-03-05 07:26:03 +07:00
|
|
|
/*
 * Copy @buflen bytes from @buf into freshly allocated pages.
 *
 * Each page comes from alloc_page() rather than the slab, and its
 * pointer is stored in consecutive slots of @pages.  At least one page
 * is always allocated, even when @buflen is 0.  No bound on the number
 * of slots is checked here, so the caller must size @pages for @buflen.
 *
 * Returns the number of pages filled in, or -ENOMEM after freeing every
 * page allocated so far.
 */
static int buf_to_pages_noslab(const void *buf, size_t buflen,
		struct page **pages)
{
	struct page *pg;
	size_t chunk;
	int npages = 0;

	do {
		chunk = min_t(size_t, PAGE_SIZE, buflen);
		pg = alloc_page(GFP_KERNEL);
		if (pg == NULL)
			goto free_pages;

		memcpy(page_address(pg), buf, chunk);
		buf += chunk;
		buflen -= chunk;
		pages[npages] = pg;
		npages++;
	} while (buflen != 0);

	return npages;

free_pages:
	/* Release in reverse order of allocation. */
	while (npages > 0) {
		npages--;
		__free_page(pages[npages]);
	}
	return -ENOMEM;
}
|
|
|
|
|
2005-06-23 00:16:23 +07:00
|
|
|
/*
 * Per-inode cache entry for an NFSv4 ACL.
 *
 * The entry is allocated with room for the ACL bytes only when the whole
 * entry fits in a page; otherwise just the header is allocated and only
 * the length is remembered.
 */
struct nfs4_cached_acl {
	int cached;	/* 1: data[] holds the ACL bytes, 0: only len is valid */
	size_t len;	/* length of the ACL in bytes */
	char data[];	/* ACL bytes (C99 flexible array member) */
};
|
|
|
|
|
|
|
|
static void nfs4_set_cached_acl(struct inode *inode, struct nfs4_cached_acl *acl)
|
|
|
|
{
|
|
|
|
struct nfs_inode *nfsi = NFS_I(inode);
|
|
|
|
|
|
|
|
spin_lock(&inode->i_lock);
|
|
|
|
kfree(nfsi->nfs4_acl);
|
|
|
|
nfsi->nfs4_acl = acl;
|
|
|
|
spin_unlock(&inode->i_lock);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void nfs4_zap_acl_attr(struct inode *inode)
|
|
|
|
{
|
|
|
|
nfs4_set_cached_acl(inode, NULL);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * Try to satisfy an ACL read from the per-inode cache.
 *
 * @buf may be NULL, in which case only the ACL length is requested and
 * a length-only cache entry is sufficient.
 *
 * Returns the ACL length on success, -ENOENT when nothing is cached (or
 * when data was requested but only the length is cached), and -ERANGE
 * when @buflen is smaller than the cached ACL.
 */
static inline ssize_t nfs4_read_cached_acl(struct inode *inode, char *buf, size_t buflen)
{
	struct nfs_inode *nfsi = NFS_I(inode);
	struct nfs4_cached_acl *acl;
	/* ssize_t, not int: the value returned is a size_t length */
	ssize_t ret = -ENOENT;

	spin_lock(&inode->i_lock);
	acl = nfsi->nfs4_acl;
	if (acl == NULL)
		goto out;
	if (buf != NULL) {
		/* caller wants the data, a length-only entry cannot help */
		if (acl->cached == 0)
			goto out;
		if (acl->len > buflen) {
			ret = -ERANGE; /* see getxattr(2) man page */
			goto out;
		}
		memcpy(buf, acl->data, acl->len);
	}
	/* buf == NULL: user is just asking for length */
	ret = acl->len;
out:
	spin_unlock(&inode->i_lock);
	return ret;
}
|
|
|
|
|
2012-04-17 20:36:40 +07:00
|
|
|
/*
 * Record a freshly fetched ACL in the inode's cache.
 *
 * When header plus ACL fit in one page the ACL bytes are copied out of
 * @pages (starting at @pgbase) and cached; otherwise only the length is
 * cached.  On allocation failure the cache is simply cleared.
 */
static void nfs4_write_cached_acl(struct inode *inode, struct page **pages, size_t pgbase, size_t acl_len)
{
	struct nfs4_cached_acl *entry;
	size_t total = sizeof(*entry) + acl_len;
	int keep_data = total <= PAGE_SIZE;

	entry = kmalloc(keep_data ? total : sizeof(*entry), GFP_KERNEL);
	if (entry != NULL) {
		entry->cached = keep_data ? 1 : 0;
		if (keep_data)
			_copy_from_pages(entry->data, pages, pgbase, acl_len);
		entry->len = acl_len;
	}
	/* entry is NULL here when kmalloc failed: that zaps the cache */
	nfs4_set_cached_acl(inode, entry);
}
|
|
|
|
|
2011-12-07 23:55:27 +07:00
|
|
|
/*
|
|
|
|
* The getxattr API returns the required buffer length when called with a
|
|
|
|
* NULL buf. The NFSv4 acl tool then calls getxattr again after allocating
|
|
|
|
* the required buf. On a NULL buf, we send a page of data to the server
|
|
|
|
* guessing that the ACL request can be serviced by a page. If so, we cache
|
|
|
|
* up to the page of ACL data, and the 2nd call to getxattr is serviced by
|
|
|
|
* the cache. If not so, we throw away the page, and cache the required
|
|
|
|
* length. The next getxattr call will then produce another round trip to
|
|
|
|
* the server, this time with the input buf of the required size.
|
|
|
|
*/
|
2006-08-24 23:27:15 +07:00
|
|
|
static ssize_t __nfs4_get_acl_uncached(struct inode *inode, void *buf, size_t buflen)
|
2005-06-23 00:16:22 +07:00
|
|
|
{
|
2017-02-24 02:54:21 +07:00
|
|
|
struct page *pages[NFS4ACL_MAXPAGES + 1] = {NULL, };
|
2005-06-23 00:16:22 +07:00
|
|
|
struct nfs_getaclargs args = {
|
|
|
|
.fh = NFS_FH(inode),
|
|
|
|
.acl_pages = pages,
|
|
|
|
.acl_len = buflen,
|
|
|
|
};
|
2009-04-01 20:21:59 +07:00
|
|
|
struct nfs_getaclres res = {
|
|
|
|
.acl_len = buflen,
|
|
|
|
};
|
2005-06-23 00:16:22 +07:00
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_GETACL],
|
|
|
|
.rpc_argp = &args,
|
2009-04-01 20:21:59 +07:00
|
|
|
.rpc_resp = &res,
|
2005-06-23 00:16:22 +07:00
|
|
|
};
|
2017-02-24 02:54:21 +07:00
|
|
|
unsigned int npages = DIV_ROUND_UP(buflen, PAGE_SIZE) + 1;
|
2012-08-24 21:59:25 +07:00
|
|
|
int ret = -ENOMEM, i;
|
2005-06-23 00:16:22 +07:00
|
|
|
|
2012-08-24 21:59:25 +07:00
|
|
|
if (npages > ARRAY_SIZE(pages))
|
|
|
|
return -ERANGE;
|
2012-04-17 20:35:39 +07:00
|
|
|
|
2011-12-07 23:55:27 +07:00
|
|
|
for (i = 0; i < npages; i++) {
|
|
|
|
pages[i] = alloc_page(GFP_KERNEL);
|
|
|
|
if (!pages[i])
|
|
|
|
goto out_free;
|
2005-06-23 00:16:23 +07:00
|
|
|
}
|
2012-04-17 20:35:39 +07:00
|
|
|
|
|
|
|
/* for decoding across pages */
|
|
|
|
res.acl_scratch = alloc_page(GFP_KERNEL);
|
|
|
|
if (!res.acl_scratch)
|
|
|
|
goto out_free;
|
|
|
|
|
2011-12-07 23:55:27 +07:00
|
|
|
args.acl_len = npages * PAGE_SIZE;
|
2012-04-17 20:35:39 +07:00
|
|
|
|
2012-01-10 21:42:47 +07:00
|
|
|
dprintk("%s buf %p buflen %zu npages %d args.acl_len %zu\n",
|
2011-12-07 23:55:27 +07:00
|
|
|
__func__, buf, buflen, npages, args.acl_len);
|
|
|
|
ret = nfs4_call_sync(NFS_SERVER(inode)->client, NFS_SERVER(inode),
|
|
|
|
&msg, &args.seq_args, &res.seq_res, 0);
|
2005-06-23 00:16:23 +07:00
|
|
|
if (ret)
|
|
|
|
goto out_free;
|
2011-12-07 23:55:27 +07:00
|
|
|
|
2012-08-27 01:44:43 +07:00
|
|
|
/* Handle the case where the passed-in buffer is too short */
|
|
|
|
if (res.acl_flags & NFS4_ACL_TRUNC) {
|
|
|
|
/* Did the user only issue a request for the acl length? */
|
|
|
|
if (buf == NULL)
|
|
|
|
goto out_ok;
|
2005-06-23 00:16:23 +07:00
|
|
|
ret = -ERANGE;
|
2012-08-27 01:44:43 +07:00
|
|
|
goto out_free;
|
2005-06-23 00:16:23 +07:00
|
|
|
}
|
2012-08-27 01:44:43 +07:00
|
|
|
nfs4_write_cached_acl(inode, pages, res.acl_data_offset, res.acl_len);
|
2012-12-08 21:30:18 +07:00
|
|
|
if (buf) {
|
|
|
|
if (res.acl_len > buflen) {
|
|
|
|
ret = -ERANGE;
|
|
|
|
goto out_free;
|
|
|
|
}
|
2012-08-27 01:44:43 +07:00
|
|
|
_copy_from_pages(buf, pages, res.acl_data_offset, res.acl_len);
|
2012-12-08 21:30:18 +07:00
|
|
|
}
|
2012-08-27 01:44:43 +07:00
|
|
|
out_ok:
|
|
|
|
ret = res.acl_len;
|
2005-06-23 00:16:23 +07:00
|
|
|
out_free:
|
2011-12-07 23:55:27 +07:00
|
|
|
for (i = 0; i < npages; i++)
|
|
|
|
if (pages[i])
|
|
|
|
__free_page(pages[i]);
|
2012-02-04 06:30:53 +07:00
|
|
|
if (res.acl_scratch)
|
|
|
|
__free_page(res.acl_scratch);
|
2005-06-23 00:16:22 +07:00
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2006-08-24 23:27:15 +07:00
|
|
|
/*
 * Fetch the ACL from the server, retrying for as long as the NFSv4
 * exception handler asks for a retry.  Any non-negative result (the ACL
 * length) ends the loop immediately.
 */
static ssize_t nfs4_get_acl_uncached(struct inode *inode, void *buf, size_t buflen)
{
	struct nfs4_exception exception = { };
	ssize_t ret;

	for (;;) {
		ret = __nfs4_get_acl_uncached(inode, buf, buflen);
		trace_nfs4_get_acl(inode, ret);
		if (ret >= 0)
			return ret;
		ret = nfs4_handle_exception(NFS_SERVER(inode), ret, &exception);
		if (!exception.retry)
			return ret;
	}
}
|
|
|
|
|
2005-06-23 00:16:23 +07:00
|
|
|
/*
 * Read the NFSv4 ACL of @inode, using the cached copy when possible.
 *
 * Returns -EOPNOTSUPP when the server does not support ACLs, a negative
 * error from inode revalidation, the result of the cache lookup when it
 * is anything other than -ENOENT, and otherwise the result of fetching
 * the ACL from the server.
 */
static ssize_t nfs4_proc_get_acl(struct inode *inode, void *buf, size_t buflen)
{
	struct nfs_server *server = NFS_SERVER(inode);
	/* ssize_t, not int: carries the ssize_t result of the cache lookup */
	ssize_t ret;

	if (!nfs4_server_supports_acls(server))
		return -EOPNOTSUPP;
	ret = nfs_revalidate_inode(server, inode);
	if (ret < 0)
		return ret;
	if (NFS_I(inode)->cache_validity & NFS_INO_INVALID_ACL)
		nfs_zap_acl_cache(inode);
	ret = nfs4_read_cached_acl(inode, buf, buflen);
	/*
	 * -ENOENT is returned if there is no ACL or if there is an ACL
	 * but no cached acl data, just the acl length
	 */
	if (ret != -ENOENT)
		return ret;
	return nfs4_get_acl_uncached(inode, buf, buflen);
}
|
|
|
|
|
2006-08-24 23:27:15 +07:00
|
|
|
/*
 * Send one SETACL request carrying the @buflen bytes at @buf.
 *
 * The ACL is first copied into freshly allocated, non-slab pages by
 * buf_to_pages_noslab(), because those pages end up being released by
 * the network stack with put_page().
 *
 * Returns -EOPNOTSUPP when the server has no ACL support, -ERANGE when
 * the ACL needs more than NFS4ACL_MAXPAGES pages, a negative error from
 * the page copy, or the status of the SETACL call.
 */
static int __nfs4_proc_set_acl(struct inode *inode, const void *buf, size_t buflen)
{
	struct nfs_server *server = NFS_SERVER(inode);
	struct page *pages[NFS4ACL_MAXPAGES];
	struct nfs_setaclargs arg = {
		.fh		= NFS_FH(inode),
		.acl_pages	= pages,
		.acl_len	= buflen,
	};
	struct nfs_setaclres res;
	struct rpc_message msg = {
		.rpc_proc	= &nfs4_procedures[NFSPROC4_CLNT_SETACL],
		.rpc_argp	= &arg,
		.rpc_resp	= &res,
	};
	unsigned int npages = DIV_ROUND_UP(buflen, PAGE_SIZE);
	int status;
	int filled;

	if (!nfs4_server_supports_acls(server))
		return -EOPNOTSUPP;
	if (npages > ARRAY_SIZE(pages))
		return -ERANGE;

	filled = buf_to_pages_noslab(buf, buflen, arg.acl_pages);
	if (filled < 0)
		return filled;

	nfs4_inode_make_writeable(inode);
	status = nfs4_call_sync(server->client, server, &msg, &arg.seq_args, &res.seq_res, 1);

	/*
	 * Free each page after tx, so the only ref left is
	 * held by the network stack
	 */
	while (filled > 0)
		put_page(pages[--filled]);

	/*
	 * Acl update can result in inode attribute update.
	 * so mark the attribute cache invalid.
	 */
	spin_lock(&inode->i_lock);
	NFS_I(inode)->cache_validity |= NFS_INO_INVALID_CHANGE
		| NFS_INO_INVALID_CTIME
		| NFS_INO_REVAL_FORCED;
	spin_unlock(&inode->i_lock);

	nfs_access_zap_cache(inode);
	nfs_zap_acl_cache(inode);
	return status;
}
|
|
|
|
|
2006-08-24 23:27:15 +07:00
|
|
|
/*
 * Set the NFSv4 ACL of @inode, re-issuing the request for as long as the
 * NFSv4 exception handler asks for a retry.  Returns the status produced
 * by the exception handler for the last attempt.
 */
static int nfs4_proc_set_acl(struct inode *inode, const void *buf, size_t buflen)
{
	struct nfs4_exception exception = { };
	int status;
	int err;

	do {
		status = __nfs4_proc_set_acl(inode, buf, buflen);
		trace_nfs4_set_acl(inode, status);
		err = nfs4_handle_exception(NFS_SERVER(inode), status,
					    &exception);
	} while (exception.retry);

	return err;
}
|
|
|
|
|
2013-05-22 23:50:44 +07:00
|
|
|
#ifdef CONFIG_NFS_V4_SECURITY_LABEL
|
|
|
|
static int _nfs4_get_security_label(struct inode *inode, void *buf,
|
|
|
|
size_t buflen)
|
|
|
|
{
|
|
|
|
struct nfs_server *server = NFS_SERVER(inode);
|
|
|
|
struct nfs_fattr fattr;
|
|
|
|
struct nfs4_label label = {0, 0, buflen, buf};
|
|
|
|
|
|
|
|
u32 bitmask[3] = { 0, 0, FATTR4_WORD2_SECURITY_LABEL };
|
2013-11-01 23:42:25 +07:00
|
|
|
struct nfs4_getattr_arg arg = {
|
2013-05-22 23:50:44 +07:00
|
|
|
.fh = NFS_FH(inode),
|
|
|
|
.bitmask = bitmask,
|
|
|
|
};
|
|
|
|
struct nfs4_getattr_res res = {
|
|
|
|
.fattr = &fattr,
|
|
|
|
.label = &label,
|
|
|
|
.server = server,
|
|
|
|
};
|
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_GETATTR],
|
2013-11-01 23:42:25 +07:00
|
|
|
.rpc_argp = &arg,
|
2013-05-22 23:50:44 +07:00
|
|
|
.rpc_resp = &res,
|
|
|
|
};
|
|
|
|
int ret;
|
|
|
|
|
|
|
|
nfs_fattr_init(&fattr);
|
|
|
|
|
2013-11-01 23:42:25 +07:00
|
|
|
ret = nfs4_call_sync(server->client, server, &msg, &arg.seq_args, &res.seq_res, 0);
|
2013-05-22 23:50:44 +07:00
|
|
|
if (ret)
|
|
|
|
return ret;
|
|
|
|
if (!(fattr.valid & NFS_ATTR_FATTR_V4_SECURITY_LABEL))
|
|
|
|
return -ENOENT;
|
|
|
|
if (buflen < label.len)
|
|
|
|
return -ERANGE;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int nfs4_get_security_label(struct inode *inode, void *buf,
|
|
|
|
size_t buflen)
|
|
|
|
{
|
|
|
|
struct nfs4_exception exception = { };
|
|
|
|
int err;
|
|
|
|
|
|
|
|
if (!nfs_server_capable(inode, NFS_CAP_SECURITY_LABEL))
|
|
|
|
return -EOPNOTSUPP;
|
|
|
|
|
|
|
|
do {
|
2013-08-13 03:58:42 +07:00
|
|
|
err = _nfs4_get_security_label(inode, buf, buflen);
|
|
|
|
trace_nfs4_get_security_label(inode, err);
|
|
|
|
err = nfs4_handle_exception(NFS_SERVER(inode), err,
|
2013-05-22 23:50:44 +07:00
|
|
|
&exception);
|
|
|
|
} while (exception.retry);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int _nfs4_do_set_security_label(struct inode *inode,
|
|
|
|
struct nfs4_label *ilabel,
|
|
|
|
struct nfs_fattr *fattr,
|
|
|
|
struct nfs4_label *olabel)
|
|
|
|
{
|
|
|
|
|
|
|
|
struct iattr sattr = {0};
|
|
|
|
struct nfs_server *server = NFS_SERVER(inode);
|
|
|
|
const u32 bitmask[3] = { 0, 0, FATTR4_WORD2_SECURITY_LABEL };
|
2013-11-01 21:49:32 +07:00
|
|
|
struct nfs_setattrargs arg = {
|
2017-01-12 03:04:25 +07:00
|
|
|
.fh = NFS_FH(inode),
|
|
|
|
.iap = &sattr,
|
2013-05-22 23:50:44 +07:00
|
|
|
.server = server,
|
|
|
|
.bitmask = bitmask,
|
|
|
|
.label = ilabel,
|
|
|
|
};
|
|
|
|
struct nfs_setattrres res = {
|
|
|
|
.fattr = fattr,
|
|
|
|
.label = olabel,
|
|
|
|
.server = server,
|
|
|
|
};
|
|
|
|
struct rpc_message msg = {
|
2017-01-12 03:04:25 +07:00
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SETATTR],
|
|
|
|
.rpc_argp = &arg,
|
|
|
|
.rpc_resp = &res,
|
2013-05-22 23:50:44 +07:00
|
|
|
};
|
|
|
|
int status;
|
|
|
|
|
2013-11-01 21:49:32 +07:00
|
|
|
nfs4_stateid_copy(&arg.stateid, &zero_stateid);
|
2013-05-22 23:50:44 +07:00
|
|
|
|
2013-11-01 21:49:32 +07:00
|
|
|
status = nfs4_call_sync(server->client, server, &msg, &arg.seq_args, &res.seq_res, 1);
|
2013-05-22 23:50:44 +07:00
|
|
|
if (status)
|
|
|
|
dprintk("%s failed: %d\n", __func__, status);
|
|
|
|
|
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int nfs4_do_set_security_label(struct inode *inode,
|
|
|
|
struct nfs4_label *ilabel,
|
|
|
|
struct nfs_fattr *fattr,
|
|
|
|
struct nfs4_label *olabel)
|
|
|
|
{
|
|
|
|
struct nfs4_exception exception = { };
|
|
|
|
int err;
|
|
|
|
|
|
|
|
do {
|
2013-08-13 03:58:42 +07:00
|
|
|
err = _nfs4_do_set_security_label(inode, ilabel,
|
|
|
|
fattr, olabel);
|
|
|
|
trace_nfs4_set_security_label(inode, err);
|
|
|
|
err = nfs4_handle_exception(NFS_SERVER(inode), err,
|
2013-05-22 23:50:44 +07:00
|
|
|
&exception);
|
|
|
|
} while (exception.retry);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int
|
2016-05-27 21:19:30 +07:00
|
|
|
nfs4_set_security_label(struct inode *inode, const void *buf, size_t buflen)
|
2013-05-22 23:50:44 +07:00
|
|
|
{
|
|
|
|
struct nfs4_label ilabel, *olabel = NULL;
|
|
|
|
struct nfs_fattr fattr;
|
|
|
|
struct rpc_cred *cred;
|
|
|
|
int status;
|
|
|
|
|
|
|
|
if (!nfs_server_capable(inode, NFS_CAP_SECURITY_LABEL))
|
|
|
|
return -EOPNOTSUPP;
|
|
|
|
|
|
|
|
nfs_fattr_init(&fattr);
|
|
|
|
|
|
|
|
ilabel.pi = 0;
|
|
|
|
ilabel.lfs = 0;
|
|
|
|
ilabel.label = (char *)buf;
|
|
|
|
ilabel.len = buflen;
|
|
|
|
|
|
|
|
cred = rpc_lookup_cred();
|
|
|
|
if (IS_ERR(cred))
|
|
|
|
return PTR_ERR(cred);
|
|
|
|
|
|
|
|
olabel = nfs4_label_alloc(NFS_SERVER(inode), GFP_KERNEL);
|
|
|
|
if (IS_ERR(olabel)) {
|
|
|
|
status = -PTR_ERR(olabel);
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
|
|
|
|
status = nfs4_do_set_security_label(inode, &ilabel, &fattr, olabel);
|
|
|
|
if (status == 0)
|
|
|
|
nfs_setsecurity(inode, &fattr, olabel);
|
|
|
|
|
|
|
|
nfs4_label_free(olabel);
|
|
|
|
out:
|
|
|
|
put_rpccred(cred);
|
|
|
|
return status;
|
|
|
|
}
|
|
|
|
#endif /* CONFIG_NFS_V4_SECURITY_LABEL */
|
|
|
|
|
|
|
|
|
NFS: Always use the same SETCLIENTID boot verifier
Currently our NFS client assigns a unique SETCLIENTID boot verifier
for each server IP address it knows about. It's set to CURRENT_TIME
when the struct nfs_client for that server IP is created.
During the SETCLIENTID operation, our client also presents an
nfs_client_id4 string to servers, as an identifier on which the server
can hang all of this client's NFSv4 state. Our client's
nfs_client_id4 string is unique for each server IP address.
An NFSv4 server is obligated to wipe all NFSv4 state associated with
an nfs_client_id4 string when the client presents the same
nfs_client_id4 string along with a changed SETCLIENTID boot verifier.
When our client unmounts the last of a server's shares, it destroys
that server's struct nfs_client. The next time the client mounts that
NFS server, it creates a fresh struct nfs_client with a fresh boot
verifier.  On seeing the fresh verifier, the server wipes any previous
NFSv4 state associated with that nfs_client_id4.
However, NFSv4.1 clients are supposed to present the same
nfs_client_id4 string to all servers. And, to support Transparent
State Migration, the same nfs_client_id4 string should be presented
to all NFSv4.0 servers so they recognize that migrated state for this
client belongs with state a server may already have for this client.
(This is known as the Uniform Client String model).
If the nfs_client_id4 string is the same but the boot verifier changes
for each server IP address, SETCLIENTID and EXCHANGE_ID operations
from such a client could unintentionally result in a server wiping a
client's previously obtained lease.
Thus, if our NFS client is going to use a fixed nfs_client_id4 string,
either for NFSv4.0 or NFSv4.1 mounts, our NFS client should use a
boot verifier that does not change depending on server IP address.
Replace our current per-nfs_client boot verifier with a per-nfs_net
boot verifier.
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
2012-05-22 09:45:41 +07:00
|
|
|
static void nfs4_init_boot_verifier(const struct nfs_client *clp,
|
|
|
|
nfs4_verifier *bootverf)
|
2012-03-03 05:14:31 +07:00
|
|
|
{
|
|
|
|
__be32 verf[2];
|
|
|
|
|
2012-05-22 09:45:33 +07:00
|
|
|
if (test_bit(NFS4CLNT_PURGE_STATE, &clp->cl_state)) {
|
|
|
|
/* An impossible timestamp guarantees this value
|
|
|
|
* will never match a generated boot time. */
|
2016-10-02 06:46:26 +07:00
|
|
|
verf[0] = cpu_to_be32(U32_MAX);
|
|
|
|
verf[1] = cpu_to_be32(U32_MAX);
|
2012-05-22 09:45:33 +07:00
|
|
|
} else {
|
NFS: Always use the same SETCLIENTID boot verifier
Currently our NFS client assigns a unique SETCLIENTID boot verifier
for each server IP address it knows about. It's set to CURRENT_TIME
when the struct nfs_client for that server IP is created.
During the SETCLIENTID operation, our client also presents an
nfs_client_id4 string to servers, as an identifier on which the server
can hang all of this client's NFSv4 state. Our client's
nfs_client_id4 string is unique for each server IP address.
An NFSv4 server is obligated to wipe all NFSv4 state associated with
an nfs_client_id4 string when the client presents the same
nfs_client_id4 string along with a changed SETCLIENTID boot verifier.
When our client unmounts the last of a server's shares, it destroys
that server's struct nfs_client. The next time the client mounts that
NFS server, it creates a fresh struct nfs_client with a fresh boot
verifier. On seeing the fresh verifer, the server wipes any previous
NFSv4 state associated with that nfs_client_id4.
However, NFSv4.1 clients are supposed to present the same
nfs_client_id4 string to all servers. And, to support Transparent
State Migration, the same nfs_client_id4 string should be presented
to all NFSv4.0 servers so they recognize that migrated state for this
client belongs with state a server may already have for this client.
(This is known as the Uniform Client String model).
If the nfs_client_id4 string is the same but the boot verifier changes
for each server IP address, SETCLIENTID and EXCHANGE_ID operations
from such a client could unintentionally result in a server wiping a
client's previously obtained lease.
Thus, if our NFS client is going to use a fixed nfs_client_id4 string,
either for NFSv4.0 or NFSv4.1 mounts, our NFS client should use a
boot verifier that does not change depending on server IP address.
Replace our current per-nfs_client boot verifier with a per-nfs_net
boot verifier.
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
2012-05-22 09:45:41 +07:00
|
|
|
struct nfs_net *nn = net_generic(clp->cl_net, nfs_net_id);
|
2016-10-02 06:46:26 +07:00
|
|
|
u64 ns = ktime_to_ns(nn->boot_time);
|
|
|
|
|
|
|
|
verf[0] = cpu_to_be32(ns >> 32);
|
|
|
|
verf[1] = cpu_to_be32(ns);
|
2012-05-22 09:45:33 +07:00
|
|
|
}
|
2012-03-03 05:14:31 +07:00
|
|
|
memcpy(bootverf->data, verf, sizeof(bootverf->data));
|
|
|
|
}
|
|
|
|
|
2015-06-10 06:43:59 +07:00
|
|
|
static int
|
|
|
|
nfs4_init_nonuniform_client_string(struct nfs_client *clp)
|
NFS: Use the same nfs_client_id4 for every server
Currently, when identifying itself to NFS servers, the Linux NFS
client uses a unique nfs_client_id4.id string for each server IP
address it talks with. For example, when client A talks to server X,
the client identifies itself using a string like "AX". The
requirements for these strings are specified in detail by RFC 3530
(and bis).
This form of client identification presents a problem for Transparent
State Migration. When client A's state on server X is migrated to
server Y, it continues to be associated with string "AX." But,
according to the rules of client string construction above, client
A will present string "AY" when communicating with server Y.
Server Y thus has no way to know that client A should be associated
with the state migrated from server X. "AX" is all but abandoned,
interfering with establishing fresh state for client A on server Y.
To support transparent state migration, then, NFSv4.0 clients must
instead use the same nfs_client_id4.id string to identify themselves
to every NFS server; something like "A".
Now a client identifies itself as "A" to server X. When a file
system on server X transitions to server Y, and client A identifies
itself as "A" to server Y, Y will know immediately that the state
associated with "A," whether it is native or migrated, is owned by
the client, and can merge both into a single lease.
As a pre-requisite to adding support for NFSv4 migration to the Linux
NFS client, this patch changes the way Linux identifies itself to NFS
servers via the SETCLIENTID (NFSv4 minor version 0) and EXCHANGE_ID
(NFSv4 minor version 1) operations.
In addition to removing the server's IP address from nfs_client_id4,
the Linux NFS client will also no longer use its own source IP address
as part of the nfs_client_id4 string. On multi-homed clients, the
value of this address depends on the address family and network
routing used to contact the server, thus it can be different for each
server.
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
2012-09-15 04:24:21 +07:00
|
|
|
{
|
2015-06-10 06:43:59 +07:00
|
|
|
size_t len;
|
|
|
|
char *str;
|
NFS: Use the same nfs_client_id4 for every server
Currently, when identifying itself to NFS servers, the Linux NFS
client uses a unique nfs_client_id4.id string for each server IP
address it talks with. For example, when client A talks to server X,
the client identifies itself using a string like "AX". The
requirements for these strings are specified in detail by RFC 3530
(and bis).
This form of client identification presents a problem for Transparent
State Migration. When client A's state on server X is migrated to
server Y, it continues to be associated with string "AX." But,
according to the rules of client string construction above, client
A will present string "AY" when communicating with server Y.
Server Y thus has no way to know that client A should be associated
with the state migrated from server X. "AX" is all but abandoned,
interfering with establishing fresh state for client A on server Y.
To support transparent state migration, then, NFSv4.0 clients must
instead use the same nfs_client_id4.id string to identify themselves
to every NFS server; something like "A".
Now a client identifies itself as "A" to server X. When a file
system on server X transitions to server Y, and client A identifies
itself as "A" to server Y, Y will know immediately that the state
associated with "A," whether it is native or migrated, is owned by
the client, and can merge both into a single lease.
As a pre-requisite to adding support for NFSv4 migration to the Linux
NFS client, this patch changes the way Linux identifies itself to NFS
servers via the SETCLIENTID (NFSv4 minor version 0) and EXCHANGE_ID
(NFSv4 minor version 1) operations.
In addition to removing the server's IP address from nfs_client_id4,
the Linux NFS client will also no longer use its own source IP address
as part of the nfs_client_id4 string. On multi-homed clients, the
value of this address depends on the address family and network
routing used to contact the server, thus it can be different for each
server.
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
2012-09-15 04:24:21 +07:00
|
|
|
|
2015-01-04 03:16:04 +07:00
|
|
|
if (clp->cl_owner_id != NULL)
|
2015-06-10 06:43:59 +07:00
|
|
|
return 0;
|
2015-08-31 09:53:43 +07:00
|
|
|
|
2015-06-10 06:43:59 +07:00
|
|
|
rcu_read_lock();
|
NFSv4.0: Remove cl_ipaddr from non-UCS client ID
It is possible for two distinct clients to have the same cl_ipaddr:
- if the client admin disables callback with clientaddr=0.0.0.0 on
more than one client
- if two clients behind separate NATs use the same private subnet
number
- if the client admin specifies the same address via clientaddr=
mount option (pointing the server at the same NAT box, for
example)
Because of the way the Linux NFSv4.0 client constructs its client
ID string by default, such clients could interfere with each others'
lease state when mounting the same server:
scnprintf(str, len, "Linux NFSv4.0 %s/%s %s",
clp->cl_ipaddr,
rpc_peeraddr2str(clp->cl_rpcclient, RPC_DISPLAY_ADDR),
rpc_peeraddr2str(clp->cl_rpcclient, RPC_DISPLAY_PROTO));
cl_ipaddr is set to the value of the clientaddr= mount option. Two
clients whose addresses are 192.168.3.77 that mount the same server
(whose public IP address is, say, 3.4.5.6) would both generate the
same client ID string when sending a SETCLIENTID:
Linux NFSv4.0 192.168.3.77/3.4.5.6 tcp
and thus the server would not be able to distinguish the clients'
leases. If both clients are using AUTH_SYS when sending SETCLIENTID
then the server could possibly permit the two clients to interfere
with or purge each others' leases.
To better ensure that Linux's NFSv4.0 client ID strings are distinct
in these cases, remove cl_ipaddr from the client ID string and
replace it with something more likely to be unique. Note that the
replacement looks a lot like the uniform client ID string.
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
Signed-off-by: Trond Myklebust <trond.myklebust@hammerspace.com>
2018-06-04 21:53:29 +07:00
|
|
|
len = 14 +
|
|
|
|
strlen(clp->cl_rpcclient->cl_nodename) +
|
|
|
|
1 +
|
2015-06-10 06:43:59 +07:00
|
|
|
strlen(rpc_peeraddr2str(clp->cl_rpcclient, RPC_DISPLAY_ADDR)) +
|
|
|
|
1;
|
|
|
|
rcu_read_unlock();
|
NFSv4.0: Remove cl_ipaddr from non-UCS client ID
It is possible for two distinct clients to have the same cl_ipaddr:
- if the client admin disables callback with clientaddr=0.0.0.0 on
more than one client
- if two clients behind separate NATs use the same private subnet
number
- if the client admin specifies the same address via clientaddr=
mount option (pointing the server at the same NAT box, for
example)
Because of the way the Linux NFSv4.0 client constructs its client
ID string by default, such clients could interfere with each others'
lease state when mounting the same server:
scnprintf(str, len, "Linux NFSv4.0 %s/%s %s",
clp->cl_ipaddr,
rpc_peeraddr2str(clp->cl_rpcclient, RPC_DISPLAY_ADDR),
rpc_peeraddr2str(clp->cl_rpcclient, RPC_DISPLAY_PROTO));
cl_ipaddr is set to the value of the clientaddr= mount option. Two
clients whose addresses are 192.168.3.77 that mount the same server
(whose public IP address is, say, 3.4.5.6) would both generate the
same client ID string when sending a SETCLIENTID:
Linux NFSv4.0 192.168.3.77/3.4.5.6 tcp
and thus the server would not be able to distinguish the clients'
leases. If both clients are using AUTH_SYS when sending SETCLIENTID
then the server could possibly permit the two clients to interfere
with or purge each others' leases.
To better ensure that Linux's NFSv4.0 client ID strings are distinct
in these cases, remove cl_ipaddr from the client ID string and
replace it with something more likely to be unique. Note that the
replacement looks a lot like the uniform client ID string.
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
Signed-off-by: Trond Myklebust <trond.myklebust@hammerspace.com>
2018-06-04 21:53:29 +07:00
|
|
|
if (nfs4_client_id_uniquifier[0] != '\0')
|
|
|
|
len += strlen(nfs4_client_id_uniquifier) + 1;
|
2015-06-10 06:43:59 +07:00
|
|
|
if (len > NFS4_OPAQUE_LIMIT + 1)
|
|
|
|
return -EINVAL;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Since this string is allocated at mount time, and held until the
|
|
|
|
* nfs_client is destroyed, we can use GFP_KERNEL here w/o worrying
|
|
|
|
* about a memory-reclaim deadlock.
|
|
|
|
*/
|
|
|
|
str = kmalloc(len, GFP_KERNEL);
|
|
|
|
if (!str)
|
|
|
|
return -ENOMEM;
|
2015-01-04 03:16:04 +07:00
|
|
|
|
NFS: Use the same nfs_client_id4 for every server
Currently, when identifying itself to NFS servers, the Linux NFS
client uses a unique nfs_client_id4.id string for each server IP
address it talks with. For example, when client A talks to server X,
the client identifies itself using a string like "AX". The
requirements for these strings are specified in detail by RFC 3530
(and bis).
This form of client identification presents a problem for Transparent
State Migration. When client A's state on server X is migrated to
server Y, it continues to be associated with string "AX." But,
according to the rules of client string construction above, client
A will present string "AY" when communicating with server Y.
Server Y thus has no way to know that client A should be associated
with the state migrated from server X. "AX" is all but abandoned,
interfering with establishing fresh state for client A on server Y.
To support transparent state migration, then, NFSv4.0 clients must
instead use the same nfs_client_id4.id string to identify themselves
to every NFS server; something like "A".
Now a client identifies itself as "A" to server X. When a file
system on server X transitions to server Y, and client A identifies
itself as "A" to server Y, Y will know immediately that the state
associated with "A," whether it is native or migrated, is owned by
the client, and can merge both into a single lease.
As a pre-requisite to adding support for NFSv4 migration to the Linux
NFS client, this patch changes the way Linux identifies itself to NFS
servers via the SETCLIENTID (NFSv4 minor version 0) and EXCHANGE_ID
(NFSv4 minor version 1) operations.
In addition to removing the server's IP address from nfs_client_id4,
the Linux NFS client will also no longer use its own source IP address
as part of the nfs_client_id4 string. On multi-homed clients, the
value of this address depends on the address family and network
routing used to contact the server, thus it can be different for each
server.
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
2012-09-15 04:24:21 +07:00
|
|
|
rcu_read_lock();
|
NFSv4.0: Remove cl_ipaddr from non-UCS client ID
It is possible for two distinct clients to have the same cl_ipaddr:
- if the client admin disables callback with clientaddr=0.0.0.0 on
more than one client
- if two clients behind separate NATs use the same private subnet
number
- if the client admin specifies the same address via clientaddr=
mount option (pointing the server at the same NAT box, for
example)
Because of the way the Linux NFSv4.0 client constructs its client
ID string by default, such clients could interfere with each others'
lease state when mounting the same server:
scnprintf(str, len, "Linux NFSv4.0 %s/%s %s",
clp->cl_ipaddr,
rpc_peeraddr2str(clp->cl_rpcclient, RPC_DISPLAY_ADDR),
rpc_peeraddr2str(clp->cl_rpcclient, RPC_DISPLAY_PROTO));
cl_ipaddr is set to the value of the clientaddr= mount option. Two
clients whose addresses are 192.168.3.77 that mount the same server
(whose public IP address is, say, 3.4.5.6) would both generate the
same client ID string when sending a SETCLIENTID:
Linux NFSv4.0 192.168.3.77/3.4.5.6 tcp
and thus the server would not be able to distinguish the clients'
leases. If both clients are using AUTH_SYS when sending SETCLIENTID
then the server could possibly permit the two clients to interfere
with or purge each others' leases.
To better ensure that Linux's NFSv4.0 client ID strings are distinct
in these cases, remove cl_ipaddr from the client ID string and
replace it with something more likely to be unique. Note that the
replacement looks a lot like the uniform client ID string.
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
Signed-off-by: Trond Myklebust <trond.myklebust@hammerspace.com>
2018-06-04 21:53:29 +07:00
|
|
|
if (nfs4_client_id_uniquifier[0] != '\0')
|
2018-06-04 21:53:34 +07:00
|
|
|
scnprintf(str, len, "Linux NFSv4.0 %s/%s/%s",
|
NFSv4.0: Remove cl_ipaddr from non-UCS client ID
It is possible for two distinct clients to have the same cl_ipaddr:
- if the client admin disables callback with clientaddr=0.0.0.0 on
more than one client
- if two clients behind separate NATs use the same private subnet
number
- if the client admin specifies the same address via clientaddr=
mount option (pointing the server at the same NAT box, for
example)
Because of the way the Linux NFSv4.0 client constructs its client
ID string by default, such clients could interfere with each others'
lease state when mounting the same server:
scnprintf(str, len, "Linux NFSv4.0 %s/%s %s",
clp->cl_ipaddr,
rpc_peeraddr2str(clp->cl_rpcclient, RPC_DISPLAY_ADDR),
rpc_peeraddr2str(clp->cl_rpcclient, RPC_DISPLAY_PROTO));
cl_ipaddr is set to the value of the clientaddr= mount option. Two
clients whose addresses are 192.168.3.77 that mount the same server
(whose public IP address is, say, 3.4.5.6) would both generate the
same client ID string when sending a SETCLIENTID:
Linux NFSv4.0 192.168.3.77/3.4.5.6 tcp
and thus the server would not be able to distinguish the clients'
leases. If both clients are using AUTH_SYS when sending SETCLIENTID
then the server could possibly permit the two clients to interfere
with or purge each others' leases.
To better ensure that Linux's NFSv4.0 client ID strings are distinct
in these cases, remove cl_ipaddr from the client ID string and
replace it with something more likely to be unique. Note that the
replacement looks a lot like the uniform client ID string.
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
Signed-off-by: Trond Myklebust <trond.myklebust@hammerspace.com>
2018-06-04 21:53:29 +07:00
|
|
|
clp->cl_rpcclient->cl_nodename,
|
|
|
|
nfs4_client_id_uniquifier,
|
|
|
|
rpc_peeraddr2str(clp->cl_rpcclient,
|
2018-06-04 21:53:34 +07:00
|
|
|
RPC_DISPLAY_ADDR));
|
NFSv4.0: Remove cl_ipaddr from non-UCS client ID
It is possible for two distinct clients to have the same cl_ipaddr:
- if the client admin disables callback with clientaddr=0.0.0.0 on
more than one client
- if two clients behind separate NATs use the same private subnet
number
- if the client admin specifies the same address via clientaddr=
mount option (pointing the server at the same NAT box, for
example)
Because of the way the Linux NFSv4.0 client constructs its client
ID string by default, such clients could interfere with each others'
lease state when mounting the same server:
scnprintf(str, len, "Linux NFSv4.0 %s/%s %s",
clp->cl_ipaddr,
rpc_peeraddr2str(clp->cl_rpcclient, RPC_DISPLAY_ADDR),
rpc_peeraddr2str(clp->cl_rpcclient, RPC_DISPLAY_PROTO));
cl_ipaddr is set to the value of the clientaddr= mount option. Two
clients whose addresses are 192.168.3.77 that mount the same server
(whose public IP address is, say, 3.4.5.6) would both generate the
same client ID string when sending a SETCLIENTID:
Linux NFSv4.0 192.168.3.77/3.4.5.6 tcp
and thus the server would not be able to distinguish the clients'
leases. If both clients are using AUTH_SYS when sending SETCLIENTID
then the server could possibly permit the two clients to interfere
with or purge each others' leases.
To better ensure that Linux's NFSv4.0 client ID strings are distinct
in these cases, remove cl_ipaddr from the client ID string and
replace it with something more likely to be unique. Note that the
replacement looks a lot like the uniform client ID string.
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
Signed-off-by: Trond Myklebust <trond.myklebust@hammerspace.com>
2018-06-04 21:53:29 +07:00
|
|
|
else
|
2018-06-04 21:53:34 +07:00
|
|
|
scnprintf(str, len, "Linux NFSv4.0 %s/%s",
|
NFSv4.0: Remove cl_ipaddr from non-UCS client ID
It is possible for two distinct clients to have the same cl_ipaddr:
- if the client admin disables callback with clientaddr=0.0.0.0 on
more than one client
- if two clients behind separate NATs use the same private subnet
number
- if the client admin specifies the same address via clientaddr=
mount option (pointing the server at the same NAT box, for
example)
Because of the way the Linux NFSv4.0 client constructs its client
ID string by default, such clients could interfere with each others'
lease state when mounting the same server:
scnprintf(str, len, "Linux NFSv4.0 %s/%s %s",
clp->cl_ipaddr,
rpc_peeraddr2str(clp->cl_rpcclient, RPC_DISPLAY_ADDR),
rpc_peeraddr2str(clp->cl_rpcclient, RPC_DISPLAY_PROTO));
cl_ipaddr is set to the value of the clientaddr= mount option. Two
clients whose addresses are 192.168.3.77 that mount the same server
(whose public IP address is, say, 3.4.5.6) would both generate the
same client ID string when sending a SETCLIENTID:
Linux NFSv4.0 192.168.3.77/3.4.5.6 tcp
and thus the server would not be able to distinguish the clients'
leases. If both clients are using AUTH_SYS when sending SETCLIENTID
then the server could possibly permit the two clients to interfere
with or purge each others' leases.
To better ensure that Linux's NFSv4.0 client ID strings are distinct
in these cases, remove cl_ipaddr from the client ID string and
replace it with something more likely to be unique. Note that the
replacement looks a lot like the uniform client ID string.
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
Signed-off-by: Trond Myklebust <trond.myklebust@hammerspace.com>
2018-06-04 21:53:29 +07:00
|
|
|
clp->cl_rpcclient->cl_nodename,
|
|
|
|
rpc_peeraddr2str(clp->cl_rpcclient,
|
2018-06-04 21:53:34 +07:00
|
|
|
RPC_DISPLAY_ADDR));
|
NFS: Use the same nfs_client_id4 for every server
Currently, when identifying itself to NFS servers, the Linux NFS
client uses a unique nfs_client_id4.id string for each server IP
address it talks with. For example, when client A talks to server X,
the client identifies itself using a string like "AX". The
requirements for these strings are specified in detail by RFC 3530
(and bis).
This form of client identification presents a problem for Transparent
State Migration. When client A's state on server X is migrated to
server Y, it continues to be associated with string "AX." But,
according to the rules of client string construction above, client
A will present string "AY" when communicating with server Y.
Server Y thus has no way to know that client A should be associated
with the state migrated from server X. "AX" is all but abandoned,
interfering with establishing fresh state for client A on server Y.
To support transparent state migration, then, NFSv4.0 clients must
instead use the same nfs_client_id4.id string to identify themselves
to every NFS server; something like "A".
Now a client identifies itself as "A" to server X. When a file
system on server X transitions to server Y, and client A identifies
itself as "A" to server Y, Y will know immediately that the state
associated with "A," whether it is native or migrated, is owned by
the client, and can merge both into a single lease.
As a pre-requisite to adding support for NFSv4 migration to the Linux
NFS client, this patch changes the way Linux identifies itself to NFS
servers via the SETCLIENTID (NFSv4 minor version 0) and EXCHANGE_ID
(NFSv4 minor version 1) operations.
In addition to removing the server's IP address from nfs_client_id4,
the Linux NFS client will also no longer use its own source IP address
as part of the nfs_client_id4 string. On multi-homed clients, the
value of this address depends on the address family and network
routing used to contact the server, thus it can be different for each
server.
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
2012-09-15 04:24:21 +07:00
|
|
|
rcu_read_unlock();
|
2015-06-10 06:43:59 +07:00
|
|
|
|
|
|
|
clp->cl_owner_id = str;
|
|
|
|
return 0;
|
NFS: Use the same nfs_client_id4 for every server
Currently, when identifying itself to NFS servers, the Linux NFS
client uses a unique nfs_client_id4.id string for each server IP
address it talks with. For example, when client A talks to server X,
the client identifies itself using a string like "AX". The
requirements for these strings are specified in detail by RFC 3530
(and bis).
This form of client identification presents a problem for Transparent
State Migration. When client A's state on server X is migrated to
server Y, it continues to be associated with string "AX." But,
according to the rules of client string construction above, client
A will present string "AY" when communicating with server Y.
Server Y thus has no way to know that client A should be associated
with the state migrated from server X. "AX" is all but abandoned,
interfering with establishing fresh state for client A on server Y.
To support transparent state migration, then, NFSv4.0 clients must
instead use the same nfs_client_id4.id string to identify themselves
to every NFS server; something like "A".
Now a client identifies itself as "A" to server X. When a file
system on server X transitions to server Y, and client A identifies
itself as "A" to server Y, Y will know immediately that the state
associated with "A," whether it is native or migrated, is owned by
the client, and can merge both into a single lease.
As a pre-requisite to adding support for NFSv4 migration to the Linux
NFS client, this patch changes the way Linux identifies itself to NFS
servers via the SETCLIENTID (NFSv4 minor version 0) and EXCHANGE_ID
(NFSv4 minor version 1) operations.
In addition to removing the server's IP address from nfs_client_id4,
the Linux NFS client will also no longer use its own source IP address
as part of the nfs_client_id4 string. On multi-homed clients, the
value of this address depends on the address family and network
routing used to contact the server, thus it can be different for each
server.
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
2012-09-15 04:24:21 +07:00
|
|
|
}
|
|
|
|
|
2015-06-10 06:44:00 +07:00
|
|
|
static int
|
|
|
|
nfs4_init_uniquifier_client_string(struct nfs_client *clp)
|
|
|
|
{
|
|
|
|
size_t len;
|
|
|
|
char *str;
|
|
|
|
|
|
|
|
len = 10 + 10 + 1 + 10 + 1 +
|
|
|
|
strlen(nfs4_client_id_uniquifier) + 1 +
|
|
|
|
strlen(clp->cl_rpcclient->cl_nodename) + 1;
|
|
|
|
|
|
|
|
if (len > NFS4_OPAQUE_LIMIT + 1)
|
|
|
|
return -EINVAL;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Since this string is allocated at mount time, and held until the
|
|
|
|
* nfs_client is destroyed, we can use GFP_KERNEL here w/o worrying
|
|
|
|
* about a memory-reclaim deadlock.
|
|
|
|
*/
|
|
|
|
str = kmalloc(len, GFP_KERNEL);
|
|
|
|
if (!str)
|
|
|
|
return -ENOMEM;
|
|
|
|
|
2015-10-08 22:33:17 +07:00
|
|
|
scnprintf(str, len, "Linux NFSv%u.%u %s/%s",
|
2015-06-10 06:44:00 +07:00
|
|
|
clp->rpc_ops->version, clp->cl_minorversion,
|
|
|
|
nfs4_client_id_uniquifier,
|
|
|
|
clp->cl_rpcclient->cl_nodename);
|
|
|
|
clp->cl_owner_id = str;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int
|
|
|
|
nfs4_init_uniform_client_string(struct nfs_client *clp)
|
NFS: Use the same nfs_client_id4 for every server
Currently, when identifying itself to NFS servers, the Linux NFS
client uses a unique nfs_client_id4.id string for each server IP
address it talks with. For example, when client A talks to server X,
the client identifies itself using a string like "AX". The
requirements for these strings are specified in detail by RFC 3530
(and bis).
This form of client identification presents a problem for Transparent
State Migration. When client A's state on server X is migrated to
server Y, it continues to be associated with string "AX." But,
according to the rules of client string construction above, client
A will present string "AY" when communicating with server Y.
Server Y thus has no way to know that client A should be associated
with the state migrated from server X. "AX" is all but abandoned,
interfering with establishing fresh state for client A on server Y.
To support transparent state migration, then, NFSv4.0 clients must
instead use the same nfs_client_id4.id string to identify themselves
to every NFS server; something like "A".
Now a client identifies itself as "A" to server X. When a file
system on server X transitions to server Y, and client A identifies
itself as "A" to server Y, Y will know immediately that the state
associated with "A," whether it is native or migrated, is owned by
the client, and can merge both into a single lease.
As a pre-requisite to adding support for NFSv4 migration to the Linux
NFS client, this patch changes the way Linux identifies itself to NFS
servers via the SETCLIENTID (NFSv4 minor version 0) and EXCHANGE_ID
(NFSv4 minor version 1) operations.
In addition to removing the server's IP address from nfs_client_id4,
the Linux NFS client will also no longer use its own source IP address
as part of the nfs_client_id4 string. On multi-homed clients, the
value of this address depends on the address family and network
routing used to contact the server, thus it can be different for each
server.
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
2012-09-15 04:24:21 +07:00
|
|
|
{
|
2015-06-10 06:44:00 +07:00
|
|
|
size_t len;
|
|
|
|
char *str;
|
2015-01-04 03:16:04 +07:00
|
|
|
|
|
|
|
if (clp->cl_owner_id != NULL)
|
2015-06-10 06:44:00 +07:00
|
|
|
return 0;
|
2012-09-15 04:24:41 +07:00
|
|
|
|
|
|
|
if (nfs4_client_id_uniquifier[0] != '\0')
|
2015-06-10 06:44:00 +07:00
|
|
|
return nfs4_init_uniquifier_client_string(clp);
|
|
|
|
|
|
|
|
len = 10 + 10 + 1 + 10 + 1 +
|
|
|
|
strlen(clp->cl_rpcclient->cl_nodename) + 1;
|
|
|
|
|
|
|
|
if (len > NFS4_OPAQUE_LIMIT + 1)
|
|
|
|
return -EINVAL;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Since this string is allocated at mount time, and held until the
|
|
|
|
* nfs_client is destroyed, we can use GFP_KERNEL here w/o worrying
|
|
|
|
* about a memory-reclaim deadlock.
|
|
|
|
*/
|
|
|
|
str = kmalloc(len, GFP_KERNEL);
|
|
|
|
if (!str)
|
|
|
|
return -ENOMEM;
|
|
|
|
|
2015-10-08 22:33:17 +07:00
|
|
|
scnprintf(str, len, "Linux NFSv%u.%u %s",
|
2015-06-10 06:44:00 +07:00
|
|
|
clp->rpc_ops->version, clp->cl_minorversion,
|
|
|
|
clp->cl_rpcclient->cl_nodename);
|
|
|
|
clp->cl_owner_id = str;
|
|
|
|
return 0;
|
NFS: Use the same nfs_client_id4 for every server
Currently, when identifying itself to NFS servers, the Linux NFS
client uses a unique nfs_client_id4.id string for each server IP
address it talks with. For example, when client A talks to server X,
the client identifies itself using a string like "AX". The
requirements for these strings are specified in detail by RFC 3530
(and bis).
This form of client identification presents a problem for Transparent
State Migration. When client A's state on server X is migrated to
server Y, it continues to be associated with string "AX." But,
according to the rules of client string construction above, client
A will present string "AY" when communicating with server Y.
Server Y thus has no way to know that client A should be associated
with the state migrated from server X. "AX" is all but abandoned,
interfering with establishing fresh state for client A on server Y.
To support transparent state migration, then, NFSv4.0 clients must
instead use the same nfs_client_id4.id string to identify themselves
to every NFS server; something like "A".
Now a client identifies itself as "A" to server X. When a file
system on server X transitions to server Y, and client A identifies
itself as "A" to server Y, Y will know immediately that the state
associated with "A," whether it is native or migrated, is owned by
the client, and can merge both into a single lease.
As a pre-requisite to adding support for NFSv4 migration to the Linux
NFS client, this patch changes the way Linux identifies itself to NFS
servers via the SETCLIENTID (NFSv4 minor version 0) and EXCHANGE_ID
(NFSv4 minor version 1) operations.
In addition to removing the server's IP address from nfs_client_id4,
the Linux NFS client will also no longer use its own source IP address
as part of the nfs_client_id4 string. On multi-homed clients, the
value of this address depends on the address family and network
routing used to contact the server, thus it can be different for each
server.
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
2012-09-15 04:24:21 +07:00
|
|
|
}
|
|
|
|
|
2014-03-12 23:51:47 +07:00
|
|
|
/*
|
|
|
|
* nfs4_callback_up_net() starts only "tcp" and "tcp6" callback
|
|
|
|
* services. Advertise one based on the address family of the
|
|
|
|
* clientaddr.
|
|
|
|
*/
|
|
|
|
static unsigned int
|
|
|
|
nfs4_init_callback_netid(const struct nfs_client *clp, char *buf, size_t len)
|
|
|
|
{
|
|
|
|
if (strchr(clp->cl_ipaddr, ':') != NULL)
|
|
|
|
return scnprintf(buf, len, "tcp6");
|
|
|
|
else
|
|
|
|
return scnprintf(buf, len, "tcp");
|
|
|
|
}
|
|
|
|
|
2014-06-22 07:52:17 +07:00
|
|
|
static void nfs4_setclientid_done(struct rpc_task *task, void *calldata)
|
|
|
|
{
|
|
|
|
struct nfs4_setclientid *sc = calldata;
|
|
|
|
|
|
|
|
if (task->tk_status == 0)
|
|
|
|
sc->sc_cred = get_rpccred(task->tk_rqstp->rq_cred);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * RPC callback table for the SETCLIENTID task.  Only rpc_call_done is
 * provided; it points at nfs4_setclientid_done().
 */
static const struct rpc_call_ops nfs4_setclientid_ops = {
|
|
|
|
.rpc_call_done = nfs4_setclientid_done,
|
|
|
|
};
|
|
|
|
|
2012-07-12 03:30:59 +07:00
|
|
|
/**
|
|
|
|
* nfs4_proc_setclientid - Negotiate client ID
|
|
|
|
* @clp: state data structure
|
|
|
|
* @program: RPC program for NFSv4 callback service
|
|
|
|
* @port: IP port number for NFS4 callback service
|
|
|
|
* @cred: RPC credential to use for this call
|
|
|
|
* @res: where to place the result
|
|
|
|
*
|
|
|
|
* Returns zero, a negative errno, or a negative NFS4ERR status code.
|
|
|
|
*/
|
2010-04-17 03:43:06 +07:00
|
|
|
int nfs4_proc_setclientid(struct nfs_client *clp, u32 program,
|
|
|
|
unsigned short port, struct rpc_cred *cred,
|
|
|
|
struct nfs4_setclientid_res *res)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
|
|
|
nfs4_verifier sc_verifier;
|
|
|
|
struct nfs4_setclientid setclientid = {
|
|
|
|
.sc_verifier = &sc_verifier,
|
|
|
|
.sc_prog = program,
|
2015-06-10 06:43:57 +07:00
|
|
|
.sc_clnt = clp,
|
2005-04-17 05:20:36 +07:00
|
|
|
};
|
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SETCLIENTID],
|
|
|
|
.rpc_argp = &setclientid,
|
2010-04-17 03:43:06 +07:00
|
|
|
.rpc_resp = res,
|
2006-01-03 15:55:26 +07:00
|
|
|
.rpc_cred = cred,
|
2005-04-17 05:20:36 +07:00
|
|
|
};
|
2014-06-22 07:52:17 +07:00
|
|
|
struct rpc_task *task;
|
|
|
|
struct rpc_task_setup task_setup_data = {
|
|
|
|
.rpc_client = clp->cl_rpcclient,
|
|
|
|
.rpc_message = &msg,
|
|
|
|
.callback_ops = &nfs4_setclientid_ops,
|
|
|
|
.callback_data = &setclientid,
|
|
|
|
.flags = RPC_TASK_TIMEOUT,
|
|
|
|
};
|
2012-07-12 03:30:59 +07:00
|
|
|
int status;
|
2005-04-17 05:20:36 +07:00
|
|
|
|
2012-07-12 03:30:50 +07:00
|
|
|
/* nfs_client_id4 */
|
NFS: Always use the same SETCLIENTID boot verifier
Currently our NFS client assigns a unique SETCLIENTID boot verifier
for each server IP address it knows about. It's set to CURRENT_TIME
when the struct nfs_client for that server IP is created.
During the SETCLIENTID operation, our client also presents an
nfs_client_id4 string to servers, as an identifier on which the server
can hang all of this client's NFSv4 state. Our client's
nfs_client_id4 string is unique for each server IP address.
An NFSv4 server is obligated to wipe all NFSv4 state associated with
an nfs_client_id4 string when the client presents the same
nfs_client_id4 string along with a changed SETCLIENTID boot verifier.
When our client unmounts the last of a server's shares, it destroys
that server's struct nfs_client. The next time the client mounts that
NFS server, it creates a fresh struct nfs_client with a fresh boot
verifier. On seeing the fresh verifier, the server wipes any previous
NFSv4 state associated with that nfs_client_id4.
However, NFSv4.1 clients are supposed to present the same
nfs_client_id4 string to all servers. And, to support Transparent
State Migration, the same nfs_client_id4 string should be presented
to all NFSv4.0 servers so they recognize that migrated state for this
client belongs with state a server may already have for this client.
(This is known as the Uniform Client String model).
If the nfs_client_id4 string is the same but the boot verifier changes
for each server IP address, SETCLIENTID and EXCHANGE_ID operations
from such a client could unintentionally result in a server wiping a
client's previously obtained lease.
Thus, if our NFS client is going to use a fixed nfs_client_id4 string,
either for NFSv4.0 or NFSv4.1 mounts, our NFS client should use a
boot verifier that does not change depending on server IP address.
Replace our current per-nfs_client boot verifier with a per-nfs_net
boot verifier.
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
2012-05-22 09:45:41 +07:00
|
|
|
nfs4_init_boot_verifier(clp, &sc_verifier);
|
2015-06-10 06:44:00 +07:00
|
|
|
|
|
|
|
if (test_bit(NFS_CS_MIGRATION, &clp->cl_flags))
|
|
|
|
status = nfs4_init_uniform_client_string(clp);
|
|
|
|
else
|
2015-06-10 06:43:59 +07:00
|
|
|
status = nfs4_init_nonuniform_client_string(clp);
|
2015-06-10 06:44:00 +07:00
|
|
|
|
|
|
|
if (status)
|
|
|
|
goto out;
|
2015-06-10 06:43:57 +07:00
|
|
|
|
2012-07-12 03:30:50 +07:00
|
|
|
/* cb_client4 */
|
2014-03-12 23:51:47 +07:00
|
|
|
setclientid.sc_netid_len =
|
|
|
|
nfs4_init_callback_netid(clp,
|
|
|
|
setclientid.sc_netid,
|
|
|
|
sizeof(setclientid.sc_netid));
|
2012-07-12 03:30:50 +07:00
|
|
|
setclientid.sc_uaddr_len = scnprintf(setclientid.sc_uaddr,
|
2007-12-11 02:57:09 +07:00
|
|
|
sizeof(setclientid.sc_uaddr), "%s.%u.%u",
|
2005-04-17 05:20:36 +07:00
|
|
|
clp->cl_ipaddr, port >> 8, port & 255);
|
|
|
|
|
2015-06-10 06:43:57 +07:00
|
|
|
dprintk("NFS call setclientid auth=%s, '%s'\n",
|
2012-07-12 03:30:59 +07:00
|
|
|
clp->cl_rpcclient->cl_auth->au_ops->au_name,
|
2015-06-10 06:43:57 +07:00
|
|
|
clp->cl_owner_id);
|
2014-06-22 07:52:17 +07:00
|
|
|
task = rpc_run_task(&task_setup_data);
|
|
|
|
if (IS_ERR(task)) {
|
|
|
|
status = PTR_ERR(task);
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
status = task->tk_status;
|
|
|
|
if (setclientid.sc_cred) {
|
|
|
|
clp->cl_acceptor = rpcauth_stringify_acceptor(setclientid.sc_cred);
|
|
|
|
put_rpccred(setclientid.sc_cred);
|
|
|
|
}
|
|
|
|
rpc_put_task(task);
|
|
|
|
out:
|
2013-08-09 22:51:26 +07:00
|
|
|
trace_nfs4_setclientid(clp, status);
|
2012-07-12 03:30:59 +07:00
|
|
|
dprintk("NFS reply setclientid: %d\n", status);
|
|
|
|
return status;
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
2012-07-12 03:30:59 +07:00
|
|
|
/**
|
|
|
|
* nfs4_proc_setclientid_confirm - Confirm client ID
|
|
|
|
* @clp: state data structure
|
|
|
|
* @res: result of a previous SETCLIENTID
|
|
|
|
* @cred: RPC credential to use for this call
|
|
|
|
*
|
|
|
|
* Returns zero, a negative errno, or a negative NFS4ERR status code.
|
|
|
|
*/
|
2011-04-25 01:28:18 +07:00
|
|
|
int nfs4_proc_setclientid_confirm(struct nfs_client *clp,
|
2010-04-17 03:43:06 +07:00
|
|
|
struct nfs4_setclientid_res *arg,
|
|
|
|
struct rpc_cred *cred)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SETCLIENTID_CONFIRM],
|
2010-04-17 03:43:06 +07:00
|
|
|
.rpc_argp = arg,
|
2006-01-03 15:55:26 +07:00
|
|
|
.rpc_cred = cred,
|
2005-04-17 05:20:36 +07:00
|
|
|
};
|
|
|
|
int status;
|
|
|
|
|
2012-07-12 03:30:59 +07:00
|
|
|
dprintk("NFS call setclientid_confirm auth=%s, (client ID %llx)\n",
|
|
|
|
clp->cl_rpcclient->cl_auth->au_ops->au_name,
|
|
|
|
clp->cl_clientid);
|
2011-04-25 01:29:33 +07:00
|
|
|
status = rpc_call_sync(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
|
2013-08-09 22:51:26 +07:00
|
|
|
trace_nfs4_setclientid_confirm(clp, status);
|
2012-07-12 03:30:59 +07:00
|
|
|
dprintk("NFS reply setclientid_confirm: %d\n", status);
|
2005-04-17 05:20:36 +07:00
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
2006-01-03 15:55:18 +07:00
|
|
|
struct nfs4_delegreturndata {
|
|
|
|
struct nfs4_delegreturnargs args;
|
2006-01-03 15:55:38 +07:00
|
|
|
struct nfs4_delegreturnres res;
|
2006-01-03 15:55:18 +07:00
|
|
|
struct nfs_fh fh;
|
|
|
|
nfs4_stateid stateid;
|
2006-01-03 15:55:21 +07:00
|
|
|
unsigned long timestamp;
|
2016-11-16 03:03:33 +07:00
|
|
|
struct {
|
|
|
|
struct nfs4_layoutreturn_args arg;
|
|
|
|
struct nfs4_layoutreturn_res res;
|
2016-09-23 22:38:08 +07:00
|
|
|
struct nfs4_xdr_opaque_data ld_private;
|
2016-11-16 03:03:33 +07:00
|
|
|
u32 roc_barrier;
|
|
|
|
bool roc;
|
|
|
|
} lr;
|
2006-01-03 15:55:38 +07:00
|
|
|
struct nfs_fattr fattr;
|
2006-01-03 15:55:18 +07:00
|
|
|
int rpc_status;
|
2014-07-03 12:05:02 +07:00
|
|
|
struct inode *inode;
|
2006-01-03 15:55:18 +07:00
|
|
|
};
|
|
|
|
|
|
|
|
static void nfs4_delegreturn_done(struct rpc_task *task, void *calldata)
|
|
|
|
{
|
|
|
|
struct nfs4_delegreturndata *data = calldata;
|
2017-11-07 23:02:32 +07:00
|
|
|
struct nfs4_exception exception = {
|
|
|
|
.inode = data->inode,
|
|
|
|
.stateid = &data->stateid,
|
|
|
|
};
|
2009-04-01 20:22:28 +07:00
|
|
|
|
2010-08-01 01:29:06 +07:00
|
|
|
if (!nfs4_sequence_done(task, &data->res.seq_res))
|
|
|
|
return;
|
2009-04-01 20:22:28 +07:00
|
|
|
|
2013-08-13 21:36:56 +07:00
|
|
|
trace_nfs4_delegreturn_exit(&data->args, &data->res, task->tk_status);
|
2016-11-16 03:03:33 +07:00
|
|
|
|
|
|
|
/* Handle Layoutreturn errors */
|
|
|
|
if (data->args.lr_args && task->tk_status != 0) {
|
|
|
|
switch(data->res.lr_ret) {
|
|
|
|
default:
|
|
|
|
data->res.lr_ret = -NFS4ERR_NOMATCHING_LAYOUT;
|
|
|
|
break;
|
|
|
|
case 0:
|
|
|
|
data->args.lr_args = NULL;
|
|
|
|
data->res.lr_res = NULL;
|
|
|
|
break;
|
2017-11-07 03:28:07 +07:00
|
|
|
case -NFS4ERR_OLD_STATEID:
|
|
|
|
if (nfs4_refresh_layout_stateid(&data->args.lr_args->stateid,
|
2017-11-07 03:28:10 +07:00
|
|
|
data->inode))
|
|
|
|
goto lr_restart;
|
2017-11-07 03:28:07 +07:00
|
|
|
/* Fallthrough */
|
2016-11-16 03:03:33 +07:00
|
|
|
case -NFS4ERR_ADMIN_REVOKED:
|
|
|
|
case -NFS4ERR_DELEG_REVOKED:
|
|
|
|
case -NFS4ERR_EXPIRED:
|
|
|
|
case -NFS4ERR_BAD_STATEID:
|
|
|
|
case -NFS4ERR_UNKNOWN_LAYOUTTYPE:
|
|
|
|
case -NFS4ERR_WRONG_CRED:
|
|
|
|
data->args.lr_args = NULL;
|
|
|
|
data->res.lr_res = NULL;
|
2017-11-07 03:28:10 +07:00
|
|
|
goto lr_restart;
|
2016-11-16 03:03:33 +07:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2009-12-07 21:23:21 +07:00
|
|
|
switch (task->tk_status) {
|
|
|
|
case 0:
|
2006-01-03 15:55:38 +07:00
|
|
|
renew_lease(data->res.server, data->timestamp);
|
2016-11-11 04:06:28 +07:00
|
|
|
break;
|
2013-11-20 04:34:14 +07:00
|
|
|
case -NFS4ERR_ADMIN_REVOKED:
|
|
|
|
case -NFS4ERR_DELEG_REVOKED:
|
2016-09-23 00:39:05 +07:00
|
|
|
case -NFS4ERR_EXPIRED:
|
|
|
|
nfs4_free_revoked_stateid(data->res.server,
|
|
|
|
data->args.stateid,
|
|
|
|
task->tk_msg.rpc_cred);
|
2017-11-07 03:28:05 +07:00
|
|
|
/* Fallthrough */
|
2013-11-20 04:34:14 +07:00
|
|
|
case -NFS4ERR_BAD_STATEID:
|
|
|
|
case -NFS4ERR_STALE_STATEID:
|
|
|
|
task->tk_status = 0;
|
|
|
|
break;
|
2017-11-07 03:28:05 +07:00
|
|
|
case -NFS4ERR_OLD_STATEID:
|
2017-11-07 03:28:10 +07:00
|
|
|
if (nfs4_refresh_delegation_stateid(&data->stateid, data->inode))
|
|
|
|
goto out_restart;
|
2017-11-07 03:28:05 +07:00
|
|
|
task->tk_status = 0;
|
|
|
|
break;
|
2016-12-19 22:23:10 +07:00
|
|
|
case -NFS4ERR_ACCESS:
|
|
|
|
if (data->args.bitmask) {
|
|
|
|
data->args.bitmask = NULL;
|
|
|
|
data->res.fattr = NULL;
|
2017-11-07 03:28:10 +07:00
|
|
|
goto out_restart;
|
2016-12-19 22:23:10 +07:00
|
|
|
}
|
2017-11-07 03:28:10 +07:00
|
|
|
/* Fallthrough */
|
2009-12-07 21:23:21 +07:00
|
|
|
default:
|
2017-11-07 23:02:32 +07:00
|
|
|
task->tk_status = nfs4_async_handle_exception(task,
|
|
|
|
data->res.server, task->tk_status,
|
|
|
|
&exception);
|
|
|
|
if (exception.retry)
|
2017-11-07 03:28:10 +07:00
|
|
|
goto out_restart;
|
2009-12-07 21:23:21 +07:00
|
|
|
}
|
|
|
|
data->rpc_status = task->tk_status;
|
2017-11-07 03:28:10 +07:00
|
|
|
return;
|
|
|
|
lr_restart:
|
|
|
|
data->res.lr_ret = 0;
|
|
|
|
out_restart:
|
|
|
|
task->tk_status = 0;
|
|
|
|
rpc_restart_call_prepare(task);
|
2006-01-03 15:55:18 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
static void nfs4_delegreturn_release(void *calldata)
|
|
|
|
{
|
2014-07-03 12:05:02 +07:00
|
|
|
struct nfs4_delegreturndata *data = calldata;
|
2015-02-06 03:13:24 +07:00
|
|
|
struct inode *inode = data->inode;
|
2014-07-03 12:05:02 +07:00
|
|
|
|
2015-02-06 03:13:24 +07:00
|
|
|
if (inode) {
|
2016-11-16 03:03:33 +07:00
|
|
|
if (data->lr.roc)
|
2016-11-16 13:11:25 +07:00
|
|
|
pnfs_roc_release(&data->lr.arg, &data->lr.res,
|
|
|
|
data->res.lr_ret);
|
2016-12-17 07:48:09 +07:00
|
|
|
nfs_post_op_update_inode_force_wcc(inode, &data->fattr);
|
2015-02-06 03:13:24 +07:00
|
|
|
nfs_iput_and_deactive(inode);
|
|
|
|
}
|
2006-01-03 15:55:18 +07:00
|
|
|
kfree(calldata);
|
|
|
|
}
|
|
|
|
|
2009-04-01 20:22:28 +07:00
|
|
|
static void nfs4_delegreturn_prepare(struct rpc_task *task, void *data)
|
|
|
|
{
|
|
|
|
struct nfs4_delegreturndata *d_data;
|
|
|
|
|
|
|
|
d_data = (struct nfs4_delegreturndata *)data;
|
|
|
|
|
2016-11-16 13:11:25 +07:00
|
|
|
if (!d_data->lr.roc && nfs4_wait_on_layoutreturn(d_data->inode, task))
|
2015-09-22 10:35:22 +07:00
|
|
|
return;
|
|
|
|
|
2017-01-10 03:48:22 +07:00
|
|
|
nfs4_setup_sequence(d_data->res.server->nfs_client,
|
2012-10-23 07:28:44 +07:00
|
|
|
&d_data->args.seq_args,
|
|
|
|
&d_data->res.seq_res,
|
|
|
|
task);
|
2009-04-01 20:22:28 +07:00
|
|
|
}
|
|
|
|
|
2006-03-21 01:44:07 +07:00
|
|
|
static const struct rpc_call_ops nfs4_delegreturn_ops = {
|
2009-04-01 20:22:28 +07:00
|
|
|
.rpc_call_prepare = nfs4_delegreturn_prepare,
|
2006-01-03 15:55:18 +07:00
|
|
|
.rpc_call_done = nfs4_delegreturn_done,
|
|
|
|
.rpc_release = nfs4_delegreturn_release,
|
|
|
|
};
|
|
|
|
|
2008-01-25 06:14:34 +07:00
|
|
|
static int _nfs4_proc_delegreturn(struct inode *inode, struct rpc_cred *cred, const nfs4_stateid *stateid, int issync)
|
2006-01-03 15:55:18 +07:00
|
|
|
{
|
|
|
|
struct nfs4_delegreturndata *data;
|
2006-01-03 15:55:38 +07:00
|
|
|
struct nfs_server *server = NFS_SERVER(inode);
|
2006-01-03 15:55:18 +07:00
|
|
|
struct rpc_task *task;
|
2007-07-15 02:40:01 +07:00
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_DELEGRETURN],
|
|
|
|
.rpc_cred = cred,
|
|
|
|
};
|
2007-07-15 02:39:59 +07:00
|
|
|
struct rpc_task_setup task_setup_data = {
|
|
|
|
.rpc_client = server->client,
|
2007-07-15 02:40:01 +07:00
|
|
|
.rpc_message = &msg,
|
2007-07-15 02:39:59 +07:00
|
|
|
.callback_ops = &nfs4_delegreturn_ops,
|
|
|
|
.flags = RPC_TASK_ASYNC,
|
|
|
|
};
|
2008-01-25 06:14:34 +07:00
|
|
|
int status = 0;
|
2006-01-03 15:55:18 +07:00
|
|
|
|
2010-05-13 23:51:01 +07:00
|
|
|
data = kzalloc(sizeof(*data), GFP_NOFS);
|
2006-01-03 15:55:18 +07:00
|
|
|
if (data == NULL)
|
|
|
|
return -ENOMEM;
|
2018-05-05 03:22:50 +07:00
|
|
|
nfs4_init_sequence(&data->args.seq_args, &data->res.seq_res, 1, 0);
|
2015-12-02 21:39:51 +07:00
|
|
|
|
|
|
|
nfs4_state_protect(server->nfs_client,
|
|
|
|
NFS_SP4_MACH_CRED_CLEANUP,
|
|
|
|
&task_setup_data.rpc_client, &msg);
|
|
|
|
|
2006-01-03 15:55:18 +07:00
|
|
|
data->args.fhandle = &data->fh;
|
|
|
|
data->args.stateid = &data->stateid;
|
2012-04-28 00:48:17 +07:00
|
|
|
data->args.bitmask = server->cache_consistency_bitmask;
|
2006-01-03 15:55:18 +07:00
|
|
|
nfs_copy_fh(&data->fh, NFS_FH(inode));
|
2012-03-05 06:13:56 +07:00
|
|
|
nfs4_stateid_copy(&data->stateid, stateid);
|
2006-01-03 15:55:38 +07:00
|
|
|
data->res.fattr = &data->fattr;
|
|
|
|
data->res.server = server;
|
2016-11-16 03:03:33 +07:00
|
|
|
data->res.lr_ret = -NFS4ERR_NOMATCHING_LAYOUT;
|
2016-09-23 22:38:08 +07:00
|
|
|
data->lr.arg.ld_private = &data->lr.ld_private;
|
2007-07-15 02:40:01 +07:00
|
|
|
nfs_fattr_init(data->res.fattr);
|
2006-01-03 15:55:21 +07:00
|
|
|
data->timestamp = jiffies;
|
2006-01-03 15:55:18 +07:00
|
|
|
data->rpc_status = 0;
|
2016-11-19 20:48:47 +07:00
|
|
|
data->lr.roc = pnfs_roc(inode, &data->lr.arg, &data->lr.res, cred);
|
2015-02-06 03:13:24 +07:00
|
|
|
data->inode = nfs_igrab_and_active(inode);
|
2016-11-16 13:11:25 +07:00
|
|
|
if (data->inode) {
|
|
|
|
if (data->lr.roc) {
|
|
|
|
data->args.lr_args = &data->lr.arg;
|
|
|
|
data->res.lr_res = &data->lr.res;
|
|
|
|
}
|
2016-11-19 20:48:47 +07:00
|
|
|
} else if (data->lr.roc) {
|
|
|
|
pnfs_roc_release(&data->lr.arg, &data->lr.res, 0);
|
|
|
|
data->lr.roc = false;
|
2016-11-16 13:11:25 +07:00
|
|
|
}
|
2006-01-03 15:55:18 +07:00
|
|
|
|
2007-07-15 02:39:59 +07:00
|
|
|
task_setup_data.callback_data = data;
|
2010-12-21 22:52:24 +07:00
|
|
|
msg.rpc_argp = &data->args;
|
|
|
|
msg.rpc_resp = &data->res;
|
2007-07-15 02:39:59 +07:00
|
|
|
task = rpc_run_task(&task_setup_data);
|
2006-03-21 06:11:10 +07:00
|
|
|
if (IS_ERR(task))
|
2006-01-03 15:55:18 +07:00
|
|
|
return PTR_ERR(task);
|
2008-01-25 06:14:34 +07:00
|
|
|
if (!issync)
|
|
|
|
goto out;
|
2017-01-12 03:01:43 +07:00
|
|
|
status = rpc_wait_for_completion_task(task);
|
2008-01-25 06:14:34 +07:00
|
|
|
if (status != 0)
|
|
|
|
goto out;
|
|
|
|
status = data->rpc_status;
|
|
|
|
out:
|
2006-11-12 10:18:03 +07:00
|
|
|
rpc_put_task(task);
|
2006-01-03 15:55:18 +07:00
|
|
|
return status;
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
2008-01-25 06:14:34 +07:00
|
|
|
int nfs4_proc_delegreturn(struct inode *inode, struct rpc_cred *cred, const nfs4_stateid *stateid, int issync)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
|
|
|
struct nfs_server *server = NFS_SERVER(inode);
|
|
|
|
struct nfs4_exception exception = { };
|
|
|
|
int err;
|
|
|
|
do {
|
2008-01-25 06:14:34 +07:00
|
|
|
err = _nfs4_proc_delegreturn(inode, cred, stateid, issync);
|
Adding stateid information to tracepoints
Operations to which stateid information is added:
close, delegreturn, open, read, setattr, layoutget, layoutcommit, test_stateid,
write, lock, locku, lockt
Format is "stateid=<seqid>:<crc32 hash stateid.other>", also "openstateid=",
"layoutstateid=", and "lockstateid=" for open_file, layoutget, set_lock
tracepoints.
New function is added to internal.h, nfs_stateid_hash(), to compute the hash
trace_nfs4_setattr() is moved from nfs4_do_setattr() to _nfs4_do_setattr()
to get access to stateid.
trace_nfs4_setattr and trace_nfs4_delegreturn are changed from INODE_EVENT
to new event type, INODE_STATEID_EVENT which is same as INODE_EVENT but adds
stateid information
for locking tracepoints, moved trace_nfs4_set_lock() into _nfs4_do_setlk()
to get access to stateid information, and removed trace_nfs4_lock_reclaim(),
trace_nfs4_lock_expired() as they call into _nfs4_do_setlk() and both were
previously same LOCK_EVENT type.
Signed-off-by: Olga Kornievskaia <kolga@netapp.com>
Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
2015-11-25 01:29:41 +07:00
|
|
|
trace_nfs4_delegreturn(inode, stateid, err);
|
2005-04-17 05:20:36 +07:00
|
|
|
switch (err) {
|
|
|
|
case -NFS4ERR_STALE_STATEID:
|
|
|
|
case -NFS4ERR_EXPIRED:
|
|
|
|
case 0:
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
err = nfs4_handle_exception(server, err, &exception);
|
|
|
|
} while (exception.retry);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int _nfs4_proc_getlk(struct nfs4_state *state, int cmd, struct file_lock *request)
|
|
|
|
{
|
|
|
|
struct inode *inode = state->inode;
|
|
|
|
struct nfs_server *server = NFS_SERVER(inode);
|
2006-08-23 07:06:09 +07:00
|
|
|
struct nfs_client *clp = server->nfs_client;
|
2006-01-03 15:55:16 +07:00
|
|
|
struct nfs_lockt_args arg = {
|
2005-04-17 05:20:36 +07:00
|
|
|
.fh = NFS_FH(inode),
|
2006-01-03 15:55:16 +07:00
|
|
|
.fl = request,
|
2005-04-17 05:20:36 +07:00
|
|
|
};
|
2006-01-03 15:55:16 +07:00
|
|
|
struct nfs_lockt_res res = {
|
|
|
|
.denied = request,
|
2005-04-17 05:20:36 +07:00
|
|
|
};
|
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LOCKT],
|
2017-01-12 03:04:25 +07:00
|
|
|
.rpc_argp = &arg,
|
|
|
|
.rpc_resp = &res,
|
2005-04-17 05:20:36 +07:00
|
|
|
.rpc_cred = state->owner->so_cred,
|
|
|
|
};
|
|
|
|
struct nfs4_lock_state *lsp;
|
|
|
|
int status;
|
|
|
|
|
2006-01-03 15:55:16 +07:00
|
|
|
arg.lock_owner.clientid = clp->cl_clientid;
|
2005-06-23 00:16:32 +07:00
|
|
|
status = nfs4_set_lock_state(state, request);
|
|
|
|
if (status != 0)
|
|
|
|
goto out;
|
|
|
|
lsp = request->fl_u.nfs4_fl.owner;
|
2012-01-18 10:04:25 +07:00
|
|
|
arg.lock_owner.id = lsp->ls_seqid.owner_id;
|
2010-12-21 22:45:27 +07:00
|
|
|
arg.lock_owner.s_dev = server->s_dev;
|
2011-03-25 00:12:24 +07:00
|
|
|
status = nfs4_call_sync(server->client, server, &msg, &arg.seq_args, &res.seq_res, 1);
|
2006-01-03 15:55:16 +07:00
|
|
|
switch (status) {
|
|
|
|
case 0:
|
|
|
|
request->fl_type = F_UNLCK;
|
|
|
|
break;
|
|
|
|
case -NFS4ERR_DENIED:
|
|
|
|
status = 0;
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
2007-02-23 06:48:53 +07:00
|
|
|
request->fl_ops->fl_release_private(request);
|
2013-10-02 01:24:58 +07:00
|
|
|
request->fl_ops = NULL;
|
2005-06-23 00:16:32 +07:00
|
|
|
out:
|
2005-04-17 05:20:36 +07:00
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int nfs4_proc_getlk(struct nfs4_state *state, int cmd, struct file_lock *request)
|
|
|
|
{
|
|
|
|
struct nfs4_exception exception = { };
|
|
|
|
int err;
|
|
|
|
|
|
|
|
do {
|
2013-08-13 03:35:20 +07:00
|
|
|
err = _nfs4_proc_getlk(state, cmd, request);
|
|
|
|
trace_nfs4_get_lock(request, state, cmd, err);
|
|
|
|
err = nfs4_handle_exception(NFS_SERVER(state->inode), err,
|
2005-04-17 05:20:36 +07:00
|
|
|
&exception);
|
|
|
|
} while (exception.retry);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
2005-10-19 04:20:15 +07:00
|
|
|
struct nfs4_unlockdata {
|
2006-01-03 15:55:16 +07:00
|
|
|
struct nfs_locku_args arg;
|
|
|
|
struct nfs_locku_res res;
|
2005-10-19 04:20:15 +07:00
|
|
|
struct nfs4_lock_state *lsp;
|
|
|
|
struct nfs_open_context *ctx;
|
2017-04-11 23:50:12 +07:00
|
|
|
struct nfs_lock_context *l_ctx;
|
2006-01-03 15:55:16 +07:00
|
|
|
struct file_lock fl;
|
2015-09-21 03:15:24 +07:00
|
|
|
struct nfs_server *server;
|
2006-01-03 15:55:21 +07:00
|
|
|
unsigned long timestamp;
|
2005-10-19 04:20:15 +07:00
|
|
|
};
|
|
|
|
|
2006-01-03 15:55:16 +07:00
|
|
|
static struct nfs4_unlockdata *nfs4_alloc_unlockdata(struct file_lock *fl,
|
|
|
|
struct nfs_open_context *ctx,
|
|
|
|
struct nfs4_lock_state *lsp,
|
|
|
|
struct nfs_seqid *seqid)
|
|
|
|
{
|
|
|
|
struct nfs4_unlockdata *p;
|
|
|
|
struct inode *inode = lsp->ls_state->inode;
|
|
|
|
|
2010-05-13 23:51:01 +07:00
|
|
|
p = kzalloc(sizeof(*p), GFP_NOFS);
|
2006-01-03 15:55:16 +07:00
|
|
|
if (p == NULL)
|
|
|
|
return NULL;
|
|
|
|
p->arg.fh = NFS_FH(inode);
|
|
|
|
p->arg.fl = &p->fl;
|
|
|
|
p->arg.seqid = seqid;
|
2008-04-08 00:20:54 +07:00
|
|
|
p->res.seqid = seqid;
|
2006-01-03 15:55:16 +07:00
|
|
|
p->lsp = lsp;
|
2017-10-20 16:53:36 +07:00
|
|
|
refcount_inc(&lsp->ls_count);
|
2006-01-03 15:55:16 +07:00
|
|
|
/* Ensure we don't close file until we're done freeing locks! */
|
|
|
|
p->ctx = get_nfs_open_context(ctx);
|
2017-04-11 23:50:12 +07:00
|
|
|
p->l_ctx = nfs_get_lock_context(ctx);
|
2006-01-03 15:55:16 +07:00
|
|
|
memcpy(&p->fl, fl, sizeof(p->fl));
|
|
|
|
p->server = NFS_SERVER(inode);
|
|
|
|
return p;
|
|
|
|
}
|
|
|
|
|
2006-01-03 15:55:07 +07:00
|
|
|
static void nfs4_locku_release_calldata(void *data)
|
2005-10-19 04:20:15 +07:00
|
|
|
{
|
2006-01-03 15:55:04 +07:00
|
|
|
struct nfs4_unlockdata *calldata = data;
|
2006-01-03 15:55:16 +07:00
|
|
|
nfs_free_seqid(calldata->arg.seqid);
|
2006-01-03 15:55:07 +07:00
|
|
|
nfs4_put_lock_state(calldata->lsp);
|
2017-04-11 23:50:12 +07:00
|
|
|
nfs_put_lock_context(calldata->l_ctx);
|
2006-01-03 15:55:07 +07:00
|
|
|
put_nfs_open_context(calldata->ctx);
|
|
|
|
kfree(calldata);
|
2005-10-19 04:20:15 +07:00
|
|
|
}
|
|
|
|
|
2006-01-03 15:55:04 +07:00
|
|
|
static void nfs4_locku_done(struct rpc_task *task, void *data)
|
2005-10-19 04:20:15 +07:00
|
|
|
{
|
2006-01-03 15:55:04 +07:00
|
|
|
struct nfs4_unlockdata *calldata = data;
|
2017-11-07 23:14:49 +07:00
|
|
|
struct nfs4_exception exception = {
|
|
|
|
.inode = calldata->lsp->ls_state->inode,
|
|
|
|
.stateid = &calldata->arg.stateid,
|
|
|
|
};
|
2005-10-19 04:20:15 +07:00
|
|
|
|
2010-08-01 01:29:06 +07:00
|
|
|
if (!nfs4_sequence_done(task, &calldata->res.seq_res))
|
|
|
|
return;
|
2005-10-19 04:20:15 +07:00
|
|
|
switch (task->tk_status) {
|
|
|
|
case 0:
|
2006-01-03 15:55:21 +07:00
|
|
|
renew_lease(calldata->server, calldata->timestamp);
|
2016-09-18 05:17:32 +07:00
|
|
|
locks_lock_inode_wait(calldata->lsp->ls_state->inode, &calldata->fl);
|
2015-01-25 04:03:52 +07:00
|
|
|
if (nfs4_update_lock_stateid(calldata->lsp,
|
|
|
|
&calldata->res.stateid))
|
|
|
|
break;
|
2016-09-23 00:39:05 +07:00
|
|
|
case -NFS4ERR_ADMIN_REVOKED:
|
|
|
|
case -NFS4ERR_EXPIRED:
|
|
|
|
nfs4_free_revoked_stateid(calldata->server,
|
|
|
|
&calldata->arg.stateid,
|
|
|
|
task->tk_msg.rpc_cred);
|
2008-12-24 03:21:46 +07:00
|
|
|
case -NFS4ERR_BAD_STATEID:
|
|
|
|
case -NFS4ERR_OLD_STATEID:
|
2005-10-19 04:20:15 +07:00
|
|
|
case -NFS4ERR_STALE_STATEID:
|
2015-01-25 02:57:53 +07:00
|
|
|
if (!nfs4_stateid_match(&calldata->arg.stateid,
|
|
|
|
&calldata->lsp->ls_stateid))
|
|
|
|
rpc_restart_call_prepare(task);
|
2005-10-19 04:20:15 +07:00
|
|
|
break;
|
|
|
|
default:
|
2017-11-07 23:14:49 +07:00
|
|
|
task->tk_status = nfs4_async_handle_exception(task,
|
|
|
|
calldata->server, task->tk_status,
|
|
|
|
&exception);
|
|
|
|
if (exception.retry)
|
2011-10-20 02:17:29 +07:00
|
|
|
rpc_restart_call_prepare(task);
|
2005-10-19 04:20:15 +07:00
|
|
|
}
|
2012-10-30 05:53:23 +07:00
|
|
|
nfs_release_seqid(calldata->arg.seqid);
|
2005-10-19 04:20:15 +07:00
|
|
|
}
|
|
|
|
|
2006-01-03 15:55:05 +07:00
|
|
|
static void nfs4_locku_prepare(struct rpc_task *task, void *data)
|
2005-10-19 04:20:15 +07:00
|
|
|
{
|
2006-01-03 15:55:05 +07:00
|
|
|
struct nfs4_unlockdata *calldata = data;
|
2005-10-19 04:20:15 +07:00
|
|
|
|
2017-04-11 23:50:12 +07:00
|
|
|
if (test_bit(NFS_CONTEXT_UNLOCK, &calldata->l_ctx->open_context->flags) &&
|
|
|
|
nfs_async_iocounter_wait(task, calldata->l_ctx))
|
|
|
|
return;
|
|
|
|
|
2006-01-03 15:55:16 +07:00
|
|
|
if (nfs_wait_on_sequence(calldata->arg.seqid, task) != 0)
|
2013-02-12 07:01:21 +07:00
|
|
|
goto out_wait;
|
2015-01-25 02:57:53 +07:00
|
|
|
nfs4_stateid_copy(&calldata->arg.stateid, &calldata->lsp->ls_stateid);
|
2012-09-11 00:26:49 +07:00
|
|
|
if (test_bit(NFS_LOCK_INITIALIZED, &calldata->lsp->ls_flags) == 0) {
|
2006-01-03 15:55:04 +07:00
|
|
|
/* Note: exit _without_ running nfs4_locku_done */
|
2013-02-12 07:01:21 +07:00
|
|
|
goto out_no_action;
|
2005-10-19 04:20:15 +07:00
|
|
|
}
|
2006-01-03 15:55:21 +07:00
|
|
|
calldata->timestamp = jiffies;
|
2017-01-10 03:48:22 +07:00
|
|
|
if (nfs4_setup_sequence(calldata->server->nfs_client,
|
2009-04-01 20:22:23 +07:00
|
|
|
&calldata->arg.seq_args,
|
2012-10-30 05:37:40 +07:00
|
|
|
&calldata->res.seq_res,
|
|
|
|
task) != 0)
|
|
|
|
nfs_release_seqid(calldata->arg.seqid);
|
2013-02-12 07:01:21 +07:00
|
|
|
return;
|
|
|
|
out_no_action:
|
|
|
|
task->tk_action = NULL;
|
|
|
|
out_wait:
|
|
|
|
nfs4_sequence_done(task, &calldata->res.seq_res);
|
2005-10-19 04:20:15 +07:00
|
|
|
}
|
|
|
|
|
2006-01-03 15:55:04 +07:00
|
|
|
static const struct rpc_call_ops nfs4_locku_ops = {
|
2006-01-03 15:55:05 +07:00
|
|
|
.rpc_call_prepare = nfs4_locku_prepare,
|
2006-01-03 15:55:04 +07:00
|
|
|
.rpc_call_done = nfs4_locku_done,
|
2006-01-03 15:55:07 +07:00
|
|
|
.rpc_release = nfs4_locku_release_calldata,
|
2006-01-03 15:55:04 +07:00
|
|
|
};
|
|
|
|
|
2006-01-03 15:55:17 +07:00
|
|
|
static struct rpc_task *nfs4_do_unlck(struct file_lock *fl,
|
|
|
|
struct nfs_open_context *ctx,
|
|
|
|
struct nfs4_lock_state *lsp,
|
|
|
|
struct nfs_seqid *seqid)
|
|
|
|
{
|
|
|
|
struct nfs4_unlockdata *data;
|
2007-07-15 02:40:01 +07:00
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LOCKU],
|
|
|
|
.rpc_cred = ctx->cred,
|
|
|
|
};
|
2007-07-15 02:39:59 +07:00
|
|
|
struct rpc_task_setup task_setup_data = {
|
|
|
|
.rpc_client = NFS_CLIENT(lsp->ls_state->inode),
|
2007-07-15 02:40:01 +07:00
|
|
|
.rpc_message = &msg,
|
2007-07-15 02:39:59 +07:00
|
|
|
.callback_ops = &nfs4_locku_ops,
|
2008-02-20 08:04:23 +07:00
|
|
|
.workqueue = nfsiod_workqueue,
|
2007-07-15 02:39:59 +07:00
|
|
|
.flags = RPC_TASK_ASYNC,
|
|
|
|
};
|
2006-01-03 15:55:17 +07:00
|
|
|
|
2013-08-14 03:37:34 +07:00
|
|
|
nfs4_state_protect(NFS_SERVER(lsp->ls_state->inode)->nfs_client,
|
|
|
|
NFS_SP4_MACH_CRED_CLEANUP, &task_setup_data.rpc_client, &msg);
|
|
|
|
|
NFSv4: Make sure unlock is really an unlock when cancelling a lock
I ran into a curious issue when a lock is being canceled. The
cancellation results in a lock request to the vfs layer instead of an
unlock request. This is particularly insidious when the process that
owns the lock is exiting. In that case, sometimes the erroneous lock is
applied AFTER the process has entered zombie state, preventing the lock
from ever being released. Eventually other processes block on the lock
causing a slow degredation of the system. In the 2.6.16 kernel this was
investigated on, the problem is compounded by the fact that the cl_sem
is held while blocking on the vfs lock, which results in most processes
accessing the nfs file system in question hanging.
In more detail, here is how the situation occurs:
first _nfs4_do_setlk():
static int _nfs4_do_setlk(struct nfs4_state *state, int cmd, struct file_lock *fl, int reclaim)
...
ret = nfs4_wait_for_completion_rpc_task(task);
if (ret == 0) {
...
} else
data->cancelled = 1;
then nfs4_lock_release():
static void nfs4_lock_release(void *calldata)
...
if (data->cancelled != 0) {
struct rpc_task *task;
task = nfs4_do_unlck(&data->fl, data->ctx, data->lsp,
data->arg.lock_seqid);
The problem is the same file_lock that was passed in to _nfs4_do_setlk()
gets passed to nfs4_do_unlck() from nfs4_lock_release(). So the type is
still F_RDLCK or FWRLCK, not F_UNLCK. At some point, when cancelling the
lock, the type needs to be changed to F_UNLCK. It seemed easiest to do
that in nfs4_do_unlck(), but it could be done in nfs4_lock_release().
The concern I had with doing it there was if something still needed the
original file_lock, though it turns out the original file_lock still
needs to be modified by nfs4_do_unlck() because nfs4_do_unlck() uses the
original file_lock to pass to the vfs layer, and a copy of the original
file_lock for the RPC request.
It seems like the simplest solution is to force all situations where
nfs4_do_unlck() is being used to result in an unlock, so with that in
mind, I made the following change:
Signed-off-by: Frank Filz <ffilzlnx@us.ibm.com>
Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
2007-07-10 05:32:29 +07:00
|
|
|
/* Ensure this is an unlock - when canceling a lock, the
|
|
|
|
* canceled lock is passed in, and it won't be an unlock.
|
|
|
|
*/
|
|
|
|
fl->fl_type = F_UNLCK;
|
2017-04-11 23:50:12 +07:00
|
|
|
if (fl->fl_flags & FL_CLOSE)
|
|
|
|
set_bit(NFS_CONTEXT_UNLOCK, &ctx->flags);
|
NFSv4: Make sure unlock is really an unlock when cancelling a lock
I ran into a curious issue when a lock is being canceled. The
cancellation results in a lock request to the vfs layer instead of an
unlock request. This is particularly insidious when the process that
owns the lock is exiting. In that case, sometimes the erroneous lock is
applied AFTER the process has entered zombie state, preventing the lock
from ever being released. Eventually other processes block on the lock
causing a slow degredation of the system. In the 2.6.16 kernel this was
investigated on, the problem is compounded by the fact that the cl_sem
is held while blocking on the vfs lock, which results in most processes
accessing the nfs file system in question hanging.
In more detail, here is how the situation occurs:
first _nfs4_do_setlk():
static int _nfs4_do_setlk(struct nfs4_state *state, int cmd, struct file_lock *fl, int reclaim)
...
ret = nfs4_wait_for_completion_rpc_task(task);
if (ret == 0) {
...
} else
data->cancelled = 1;
then nfs4_lock_release():
static void nfs4_lock_release(void *calldata)
...
if (data->cancelled != 0) {
struct rpc_task *task;
task = nfs4_do_unlck(&data->fl, data->ctx, data->lsp,
data->arg.lock_seqid);
The problem is the same file_lock that was passed in to _nfs4_do_setlk()
gets passed to nfs4_do_unlck() from nfs4_lock_release(). So the type is
still F_RDLCK or FWRLCK, not F_UNLCK. At some point, when cancelling the
lock, the type needs to be changed to F_UNLCK. It seemed easiest to do
that in nfs4_do_unlck(), but it could be done in nfs4_lock_release().
The concern I had with doing it there was if something still needed the
original file_lock, though it turns out the original file_lock still
needs to be modified by nfs4_do_unlck() because nfs4_do_unlck() uses the
original file_lock to pass to the vfs layer, and a copy of the original
file_lock for the RPC request.
It seems like the simplest solution is to force all situations where
nfs4_do_unlck() is being used to result in an unlock, so with that in
mind, I made the following change:
Signed-off-by: Frank Filz <ffilzlnx@us.ibm.com>
Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
2007-07-10 05:32:29 +07:00
|
|
|
|
2006-01-03 15:55:17 +07:00
|
|
|
data = nfs4_alloc_unlockdata(fl, ctx, lsp, seqid);
|
|
|
|
if (data == NULL) {
|
|
|
|
nfs_free_seqid(seqid);
|
|
|
|
return ERR_PTR(-ENOMEM);
|
|
|
|
}
|
|
|
|
|
2018-05-05 03:22:50 +07:00
|
|
|
nfs4_init_sequence(&data->arg.seq_args, &data->res.seq_res, 1, 0);
|
2010-12-21 22:52:24 +07:00
|
|
|
msg.rpc_argp = &data->arg;
|
|
|
|
msg.rpc_resp = &data->res;
|
2007-07-15 02:39:59 +07:00
|
|
|
task_setup_data.callback_data = data;
|
|
|
|
return rpc_run_task(&task_setup_data);
|
2006-01-03 15:55:17 +07:00
|
|
|
}
|
|
|
|
|
2005-10-19 04:20:15 +07:00
|
|
|
static int nfs4_proc_unlck(struct nfs4_state *state, int cmd, struct file_lock *request)
|
|
|
|
{
|
2013-02-07 22:54:07 +07:00
|
|
|
struct inode *inode = state->inode;
|
|
|
|
struct nfs4_state_owner *sp = state->owner;
|
|
|
|
struct nfs_inode *nfsi = NFS_I(inode);
|
2006-01-03 15:55:16 +07:00
|
|
|
struct nfs_seqid *seqid;
|
2005-04-17 05:20:36 +07:00
|
|
|
struct nfs4_lock_state *lsp;
|
2006-01-03 15:55:07 +07:00
|
|
|
struct rpc_task *task;
|
2015-01-25 02:19:19 +07:00
|
|
|
struct nfs_seqid *(*alloc_seqid)(struct nfs_seqid_counter *, gfp_t);
|
2006-01-03 15:55:07 +07:00
|
|
|
int status = 0;
|
2008-04-05 02:08:02 +07:00
|
|
|
unsigned char fl_flags = request->fl_flags;
|
2005-10-19 04:20:15 +07:00
|
|
|
|
2005-06-23 00:16:32 +07:00
|
|
|
status = nfs4_set_lock_state(state, request);
|
2006-06-30 03:38:34 +07:00
|
|
|
/* Unlock _before_ we do the RPC call */
|
|
|
|
request->fl_flags |= FL_EXISTS;
|
2013-02-07 22:54:07 +07:00
|
|
|
/* Exclude nfs_delegation_claim_locks() */
|
|
|
|
mutex_lock(&sp->so_delegreturn_mutex);
|
|
|
|
/* Exclude nfs4_reclaim_open_stateid() - note nesting! */
|
2008-12-24 03:21:44 +07:00
|
|
|
down_read(&nfsi->rwsem);
|
2016-09-18 05:17:32 +07:00
|
|
|
if (locks_lock_inode_wait(inode, request) == -ENOENT) {
|
2008-12-24 03:21:44 +07:00
|
|
|
up_read(&nfsi->rwsem);
|
2013-02-07 22:54:07 +07:00
|
|
|
mutex_unlock(&sp->so_delegreturn_mutex);
|
2006-06-30 03:38:34 +07:00
|
|
|
goto out;
|
2008-12-24 03:21:44 +07:00
|
|
|
}
|
|
|
|
up_read(&nfsi->rwsem);
|
2013-02-07 22:54:07 +07:00
|
|
|
mutex_unlock(&sp->so_delegreturn_mutex);
|
2005-06-23 00:16:32 +07:00
|
|
|
if (status != 0)
|
2006-06-30 03:38:34 +07:00
|
|
|
goto out;
|
|
|
|
/* Is this a delegated lock? */
|
2005-06-23 00:16:32 +07:00
|
|
|
lsp = request->fl_u.nfs4_fl.owner;
|
2013-04-30 23:43:42 +07:00
|
|
|
if (test_bit(NFS_LOCK_INITIALIZED, &lsp->ls_flags) == 0)
|
|
|
|
goto out;
|
2015-01-25 02:19:19 +07:00
|
|
|
alloc_seqid = NFS_SERVER(inode)->nfs_client->cl_mvops->alloc_seqid;
|
|
|
|
seqid = alloc_seqid(&lsp->ls_seqid, GFP_KERNEL);
|
2006-06-30 03:38:34 +07:00
|
|
|
status = -ENOMEM;
|
2015-01-24 06:48:00 +07:00
|
|
|
if (IS_ERR(seqid))
|
2006-06-30 03:38:34 +07:00
|
|
|
goto out;
|
2007-08-11 04:44:32 +07:00
|
|
|
task = nfs4_do_unlck(request, nfs_file_open_context(request->fl_file), lsp, seqid);
|
2006-01-03 15:55:17 +07:00
|
|
|
status = PTR_ERR(task);
|
|
|
|
if (IS_ERR(task))
|
2006-06-30 03:38:34 +07:00
|
|
|
goto out;
|
2017-01-12 03:01:43 +07:00
|
|
|
status = rpc_wait_for_completion_task(task);
|
2006-11-12 10:18:03 +07:00
|
|
|
rpc_put_task(task);
|
2006-06-30 03:38:34 +07:00
|
|
|
out:
|
2008-04-05 02:08:02 +07:00
|
|
|
request->fl_flags = fl_flags;
|
2013-08-13 03:35:20 +07:00
|
|
|
trace_nfs4_unlock(request, state, F_SETLK, status);
|
2005-04-17 05:20:36 +07:00
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
2006-01-03 15:55:17 +07:00
|
|
|
struct nfs4_lockdata {
|
|
|
|
struct nfs_lock_args arg;
|
|
|
|
struct nfs_lock_res res;
|
|
|
|
struct nfs4_lock_state *lsp;
|
|
|
|
struct nfs_open_context *ctx;
|
|
|
|
struct file_lock fl;
|
2006-01-03 15:55:21 +07:00
|
|
|
unsigned long timestamp;
|
2006-01-03 15:55:17 +07:00
|
|
|
int rpc_status;
|
|
|
|
int cancelled;
|
2009-04-01 20:22:22 +07:00
|
|
|
struct nfs_server *server;
|
2006-01-03 15:55:17 +07:00
|
|
|
};
|
|
|
|
|
|
|
|
static struct nfs4_lockdata *nfs4_alloc_lockdata(struct file_lock *fl,
|
2010-05-13 23:51:01 +07:00
|
|
|
struct nfs_open_context *ctx, struct nfs4_lock_state *lsp,
|
|
|
|
gfp_t gfp_mask)
|
2005-04-17 05:20:36 +07:00
|
|
|
{
|
2006-01-03 15:55:17 +07:00
|
|
|
struct nfs4_lockdata *p;
|
|
|
|
struct inode *inode = lsp->ls_state->inode;
|
2005-04-17 05:20:36 +07:00
|
|
|
struct nfs_server *server = NFS_SERVER(inode);
|
2015-01-25 02:19:19 +07:00
|
|
|
struct nfs_seqid *(*alloc_seqid)(struct nfs_seqid_counter *, gfp_t);
|
2006-01-03 15:55:17 +07:00
|
|
|
|
2010-05-13 23:51:01 +07:00
|
|
|
p = kzalloc(sizeof(*p), gfp_mask);
|
2006-01-03 15:55:17 +07:00
|
|
|
if (p == NULL)
|
|
|
|
return NULL;
|
|
|
|
|
|
|
|
p->arg.fh = NFS_FH(inode);
|
|
|
|
p->arg.fl = &p->fl;
|
2010-05-13 23:51:01 +07:00
|
|
|
p->arg.open_seqid = nfs_alloc_seqid(&lsp->ls_state->owner->so_seqid, gfp_mask);
|
2015-01-24 06:48:00 +07:00
|
|
|
if (IS_ERR(p->arg.open_seqid))
|
2008-01-09 05:56:07 +07:00
|
|
|
goto out_free;
|
2015-01-25 02:19:19 +07:00
|
|
|
alloc_seqid = server->nfs_client->cl_mvops->alloc_seqid;
|
|
|
|
p->arg.lock_seqid = alloc_seqid(&lsp->ls_seqid, gfp_mask);
|
2015-01-24 06:48:00 +07:00
|
|
|
if (IS_ERR(p->arg.lock_seqid))
|
2008-01-09 05:56:07 +07:00
|
|
|
goto out_free_seqid;
|
2006-08-23 07:06:09 +07:00
|
|
|
p->arg.lock_owner.clientid = server->nfs_client->cl_clientid;
|
2012-01-18 10:04:25 +07:00
|
|
|
p->arg.lock_owner.id = lsp->ls_seqid.owner_id;
|
2010-12-21 22:45:27 +07:00
|
|
|
p->arg.lock_owner.s_dev = server->s_dev;
|
2008-04-08 00:20:54 +07:00
|
|
|
p->res.lock_seqid = p->arg.lock_seqid;
|
2006-01-03 15:55:17 +07:00
|
|
|
p->lsp = lsp;
|
2009-04-01 20:22:22 +07:00
|
|
|
p->server = server;
|
2017-10-20 16:53:36 +07:00
|
|
|
refcount_inc(&lsp->ls_count);
|
2006-01-03 15:55:17 +07:00
|
|
|
p->ctx = get_nfs_open_context(ctx);
|
|
|
|
memcpy(&p->fl, fl, sizeof(p->fl));
|
|
|
|
return p;
|
2008-01-09 05:56:07 +07:00
|
|
|
out_free_seqid:
|
|
|
|
nfs_free_seqid(p->arg.open_seqid);
|
2006-01-03 15:55:17 +07:00
|
|
|
out_free:
|
|
|
|
kfree(p);
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void nfs4_lock_prepare(struct rpc_task *task, void *calldata)
|
|
|
|
{
|
|
|
|
struct nfs4_lockdata *data = calldata;
|
|
|
|
struct nfs4_state *state = data->lsp->ls_state;
|
2005-10-19 04:20:15 +07:00
|
|
|
|
2008-05-03 03:42:44 +07:00
|
|
|
dprintk("%s: begin!\n", __func__);
|
2008-01-09 05:56:07 +07:00
|
|
|
if (nfs_wait_on_sequence(data->arg.lock_seqid, task) != 0)
|
2013-02-12 07:01:21 +07:00
|
|
|
goto out_wait;
|
2006-01-03 15:55:17 +07:00
|
|
|
/* Do we need to do an open_to_lock_owner? */
|
2015-01-25 06:38:15 +07:00
|
|
|
if (!test_bit(NFS_LOCK_INITIALIZED, &data->lsp->ls_flags)) {
|
2012-10-30 06:02:20 +07:00
|
|
|
if (nfs_wait_on_sequence(data->arg.open_seqid, task) != 0) {
|
2012-10-30 05:37:40 +07:00
|
|
|
goto out_release_lock_seqid;
|
2012-10-30 06:02:20 +07:00
|
|
|
}
|
2015-01-25 02:57:53 +07:00
|
|
|
nfs4_stateid_copy(&data->arg.open_stateid,
|
|
|
|
&state->open_stateid);
|
2006-01-03 15:55:17 +07:00
|
|
|
data->arg.new_lock_owner = 1;
|
2008-04-08 00:20:54 +07:00
|
|
|
data->res.open_seqid = data->arg.open_seqid;
|
2015-01-25 02:57:53 +07:00
|
|
|
} else {
|
2008-01-09 05:56:07 +07:00
|
|
|
data->arg.new_lock_owner = 0;
|
2015-01-25 02:57:53 +07:00
|
|
|
nfs4_stateid_copy(&data->arg.lock_stateid,
|
|
|
|
&data->lsp->ls_stateid);
|
|
|
|
}
|
2013-03-15 03:57:48 +07:00
|
|
|
if (!nfs4_valid_open_stateid(state)) {
|
|
|
|
data->rpc_status = -EBADF;
|
|
|
|
task->tk_action = NULL;
|
|
|
|
goto out_release_open_seqid;
|
|
|
|
}
|
2006-01-03 15:55:21 +07:00
|
|
|
data->timestamp = jiffies;
|
2017-01-10 03:48:22 +07:00
|
|
|
if (nfs4_setup_sequence(data->server->nfs_client,
|
2010-06-16 20:52:26 +07:00
|
|
|
&data->arg.seq_args,
|
2012-10-30 05:37:40 +07:00
|
|
|
&data->res.seq_res,
|
2012-10-23 07:28:44 +07:00
|
|
|
task) == 0)
|
2009-04-01 20:22:22 +07:00
|
|
|
return;
|
2013-03-15 03:57:48 +07:00
|
|
|
out_release_open_seqid:
|
2012-10-30 05:37:40 +07:00
|
|
|
nfs_release_seqid(data->arg.open_seqid);
|
|
|
|
out_release_lock_seqid:
|
|
|
|
nfs_release_seqid(data->arg.lock_seqid);
|
2013-02-12 07:01:21 +07:00
|
|
|
out_wait:
|
|
|
|
nfs4_sequence_done(task, &data->res.seq_res);
|
2012-10-30 06:02:20 +07:00
|
|
|
dprintk("%s: done!, ret = %d\n", __func__, data->rpc_status);
|
2009-12-15 12:27:57 +07:00
|
|
|
}
|
|
|
|
|
2006-01-03 15:55:17 +07:00
|
|
|
static void nfs4_lock_done(struct rpc_task *task, void *calldata)
|
|
|
|
{
|
|
|
|
struct nfs4_lockdata *data = calldata;
|
2015-01-25 03:07:56 +07:00
|
|
|
struct nfs4_lock_state *lsp = data->lsp;
|
2006-01-03 15:55:17 +07:00
|
|
|
|
2008-05-03 03:42:44 +07:00
|
|
|
dprintk("%s: begin!\n", __func__);
|
2006-01-03 15:55:17 +07:00
|
|
|
|
2010-08-01 01:29:06 +07:00
|
|
|
if (!nfs4_sequence_done(task, &data->res.seq_res))
|
|
|
|
return;
|
2009-04-01 20:22:22 +07:00
|
|
|
|
2006-01-03 15:55:17 +07:00
|
|
|
data->rpc_status = task->tk_status;
|
2015-01-25 02:57:53 +07:00
|
|
|
switch (task->tk_status) {
|
|
|
|
case 0:
|
2015-03-18 05:25:59 +07:00
|
|
|
renew_lease(NFS_SERVER(d_inode(data->ctx->dentry)),
|
2015-01-25 03:07:56 +07:00
|
|
|
data->timestamp);
|
2018-05-03 18:12:57 +07:00
|
|
|
if (data->arg.new_lock && !data->cancelled) {
|
2015-01-25 04:03:52 +07:00
|
|
|
data->fl.fl_flags &= ~(FL_SLEEP | FL_ACCESS);
|
2018-05-03 18:12:57 +07:00
|
|
|
if (locks_lock_inode_wait(lsp->ls_state->inode, &data->fl) < 0)
|
2015-01-25 04:03:52 +07:00
|
|
|
break;
|
|
|
|
}
|
2018-05-03 18:12:57 +07:00
|
|
|
|
2015-01-25 03:07:56 +07:00
|
|
|
if (data->arg.new_lock_owner != 0) {
|
|
|
|
nfs_confirm_seqid(&lsp->ls_seqid, 0);
|
|
|
|
nfs4_stateid_copy(&lsp->ls_stateid, &data->res.stateid);
|
|
|
|
set_bit(NFS_LOCK_INITIALIZED, &lsp->ls_flags);
|
2018-05-03 18:12:57 +07:00
|
|
|
goto out_done;
|
|
|
|
} else if (nfs4_update_lock_stateid(lsp, &data->res.stateid))
|
|
|
|
goto out_done;
|
|
|
|
|
2015-01-25 02:57:53 +07:00
|
|
|
break;
|
|
|
|
case -NFS4ERR_BAD_STATEID:
|
|
|
|
case -NFS4ERR_OLD_STATEID:
|
|
|
|
case -NFS4ERR_STALE_STATEID:
|
|
|
|
case -NFS4ERR_EXPIRED:
|
|
|
|
if (data->arg.new_lock_owner != 0) {
|
2018-05-03 18:12:57 +07:00
|
|
|
if (nfs4_stateid_match(&data->arg.open_stateid,
|
2015-01-25 02:57:53 +07:00
|
|
|
&lsp->ls_state->open_stateid))
|
2018-05-03 18:12:57 +07:00
|
|
|
goto out_done;
|
|
|
|
} else if (nfs4_stateid_match(&data->arg.lock_stateid,
|
2015-01-25 02:57:53 +07:00
|
|
|
&lsp->ls_stateid))
|
2018-05-03 18:12:57 +07:00
|
|
|
goto out_done;
|
2006-01-03 15:55:17 +07:00
|
|
|
}
|
2018-05-03 18:12:57 +07:00
|
|
|
if (!data->cancelled)
|
|
|
|
rpc_restart_call_prepare(task);
|
|
|
|
out_done:
|
2008-05-03 03:42:44 +07:00
|
|
|
dprintk("%s: done, ret = %d!\n", __func__, data->rpc_status);
|
2006-01-03 15:55:17 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
static void nfs4_lock_release(void *calldata)
|
|
|
|
{
|
|
|
|
struct nfs4_lockdata *data = calldata;
|
|
|
|
|
2008-05-03 03:42:44 +07:00
|
|
|
dprintk("%s: begin!\n", __func__);
|
2008-01-09 05:56:07 +07:00
|
|
|
nfs_free_seqid(data->arg.open_seqid);
|
2017-06-20 19:33:44 +07:00
|
|
|
if (data->cancelled) {
|
2006-01-03 15:55:17 +07:00
|
|
|
struct rpc_task *task;
|
|
|
|
task = nfs4_do_unlck(&data->fl, data->ctx, data->lsp,
|
|
|
|
data->arg.lock_seqid);
|
|
|
|
if (!IS_ERR(task))
|
2011-02-22 02:05:41 +07:00
|
|
|
rpc_put_task_async(task);
|
2008-05-03 03:42:44 +07:00
|
|
|
dprintk("%s: cancelling lock!\n", __func__);
|
2006-01-03 15:55:17 +07:00
|
|
|
} else
|
|
|
|
nfs_free_seqid(data->arg.lock_seqid);
|
|
|
|
nfs4_put_lock_state(data->lsp);
|
|
|
|
put_nfs_open_context(data->ctx);
|
|
|
|
kfree(data);
|
2008-05-03 03:42:44 +07:00
|
|
|
dprintk("%s: done!\n", __func__);
|
2006-01-03 15:55:17 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
static const struct rpc_call_ops nfs4_lock_ops = {
|
|
|
|
.rpc_call_prepare = nfs4_lock_prepare,
|
|
|
|
.rpc_call_done = nfs4_lock_done,
|
|
|
|
.rpc_release = nfs4_lock_release,
|
|
|
|
};
|
|
|
|
|
2010-01-27 03:42:21 +07:00
|
|
|
static void nfs4_handle_setlk_error(struct nfs_server *server, struct nfs4_lock_state *lsp, int new_lock_owner, int error)
|
|
|
|
{
|
|
|
|
switch (error) {
|
|
|
|
case -NFS4ERR_ADMIN_REVOKED:
|
2016-09-23 00:39:09 +07:00
|
|
|
case -NFS4ERR_EXPIRED:
|
2010-01-27 03:42:21 +07:00
|
|
|
case -NFS4ERR_BAD_STATEID:
|
2011-03-10 04:00:56 +07:00
|
|
|
lsp->ls_seqid.flags &= ~NFS_SEQID_CONFIRMED;
|
2010-01-27 03:42:21 +07:00
|
|
|
if (new_lock_owner != 0 ||
|
2012-09-11 00:26:49 +07:00
|
|
|
test_bit(NFS_LOCK_INITIALIZED, &lsp->ls_flags) != 0)
|
2011-03-10 04:00:56 +07:00
|
|
|
nfs4_schedule_stateid_recovery(server, lsp->ls_state);
|
2010-01-27 03:42:47 +07:00
|
|
|
break;
|
|
|
|
case -NFS4ERR_STALE_STATEID:
|
|
|
|
lsp->ls_seqid.flags &= ~NFS_SEQID_CONFIRMED;
|
2011-03-10 04:00:56 +07:00
|
|
|
nfs4_schedule_lease_recovery(server->nfs_client);
|
2010-01-27 03:42:21 +07:00
|
|
|
};
|
|
|
|
}
|
|
|
|
|
2009-12-09 16:50:14 +07:00
|
|
|
static int _nfs4_do_setlk(struct nfs4_state *state, int cmd, struct file_lock *fl, int recovery_type)
|
2006-01-03 15:55:17 +07:00
|
|
|
{
|
|
|
|
struct nfs4_lockdata *data;
|
|
|
|
struct rpc_task *task;
|
2007-07-15 02:40:01 +07:00
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LOCK],
|
|
|
|
.rpc_cred = state->owner->so_cred,
|
|
|
|
};
|
2007-07-15 02:39:59 +07:00
|
|
|
struct rpc_task_setup task_setup_data = {
|
|
|
|
.rpc_client = NFS_CLIENT(state->inode),
|
2007-07-15 02:40:01 +07:00
|
|
|
.rpc_message = &msg,
|
2007-07-15 02:39:59 +07:00
|
|
|
.callback_ops = &nfs4_lock_ops,
|
2008-02-20 08:04:23 +07:00
|
|
|
.workqueue = nfsiod_workqueue,
|
2007-07-15 02:39:59 +07:00
|
|
|
.flags = RPC_TASK_ASYNC,
|
|
|
|
};
|
2006-01-03 15:55:17 +07:00
|
|
|
int ret;
|
|
|
|
|
2008-05-03 03:42:44 +07:00
|
|
|
dprintk("%s: begin!\n", __func__);
|
2007-08-11 04:44:32 +07:00
|
|
|
data = nfs4_alloc_lockdata(fl, nfs_file_open_context(fl->fl_file),
|
2010-05-13 23:51:01 +07:00
|
|
|
fl->fl_u.nfs4_fl.owner,
|
|
|
|
recovery_type == NFS_LOCK_NEW ? GFP_KERNEL : GFP_NOFS);
|
2006-01-03 15:55:17 +07:00
|
|
|
if (data == NULL)
|
|
|
|
return -ENOMEM;
|
|
|
|
if (IS_SETLKW(cmd))
|
|
|
|
data->arg.block = 1;
|
2018-05-05 03:22:50 +07:00
|
|
|
nfs4_init_sequence(&data->arg.seq_args, &data->res.seq_res, 1,
|
|
|
|
recovery_type > NFS_LOCK_NEW);
|
2010-12-21 22:52:24 +07:00
|
|
|
msg.rpc_argp = &data->arg;
|
|
|
|
msg.rpc_resp = &data->res;
|
2007-07-15 02:39:59 +07:00
|
|
|
task_setup_data.callback_data = data;
|
2012-10-30 06:02:20 +07:00
|
|
|
if (recovery_type > NFS_LOCK_NEW) {
|
|
|
|
if (recovery_type == NFS_LOCK_RECLAIM)
|
|
|
|
data->arg.reclaim = NFS_LOCK_RECLAIM;
|
2015-01-25 04:03:52 +07:00
|
|
|
} else
|
|
|
|
data->arg.new_lock = 1;
|
2007-07-15 02:39:59 +07:00
|
|
|
task = rpc_run_task(&task_setup_data);
|
2006-03-21 06:11:10 +07:00
|
|
|
if (IS_ERR(task))
|
2006-01-03 15:55:17 +07:00
|
|
|
return PTR_ERR(task);
|
2017-01-12 03:01:43 +07:00
|
|
|
ret = rpc_wait_for_completion_task(task);
|
2006-01-03 15:55:17 +07:00
|
|
|
if (ret == 0) {
|
|
|
|
ret = data->rpc_status;
|
2010-01-27 03:42:21 +07:00
|
|
|
if (ret)
|
|
|
|
nfs4_handle_setlk_error(data->server, data->lsp,
|
|
|
|
data->arg.new_lock_owner, ret);
|
2006-01-03 15:55:17 +07:00
|
|
|
} else
|
2017-06-20 19:33:44 +07:00
|
|
|
data->cancelled = true;
|
2006-11-12 10:18:03 +07:00
|
|
|
rpc_put_task(task);
|
2008-05-03 03:42:44 +07:00
|
|
|
dprintk("%s: done, ret = %d!\n", __func__, ret);
|
Adding stateid information to tracepoints
Operations to which stateid information is added:
close, delegreturn, open, read, setattr, layoutget, layoutcommit, test_stateid,
write, lock, locku, lockt
Format is "stateid=<seqid>:<crc32 hash stateid.other>", also "openstateid=",
"layoutstateid=", and "lockstateid=" for open_file, layoutget, set_lock
tracepoints.
New function is added to internal.h, nfs_stateid_hash(), to compute the hash
trace_nfs4_setattr() is moved from nfs4_do_setattr() to _nfs4_do_setattr()
to get access to stateid.
trace_nfs4_setattr and trace_nfs4_delegreturn are changed from INODE_EVENT
to new event type, INODE_STATEID_EVENT which is same as INODE_EVENT but adds
stateid information
for locking tracepoints, moved trace_nfs4_set_lock() into _nfs4_do_setlk()
to get access to stateid information, and removed trace_nfs4_lock_reclaim(),
trace_nfs4_lock_expired() as they call into _nfs4_do_setlk() and both were
previously same LOCK_EVENT type.
Signed-off-by: Olga Kornievskaia <kolga@netapp.com>
Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
2015-11-25 01:29:41 +07:00
|
|
|
trace_nfs4_set_lock(fl, state, &data->res.stateid, cmd, ret);
|
2006-01-03 15:55:17 +07:00
|
|
|
return ret;
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
static int nfs4_lock_reclaim(struct nfs4_state *state, struct file_lock *request)
|
|
|
|
{
|
2005-06-23 00:16:29 +07:00
|
|
|
struct nfs_server *server = NFS_SERVER(state->inode);
|
2012-04-18 23:20:10 +07:00
|
|
|
struct nfs4_exception exception = {
|
|
|
|
.inode = state->inode,
|
|
|
|
};
|
2005-06-23 00:16:29 +07:00
|
|
|
int err;
|
|
|
|
|
|
|
|
do {
|
2006-06-30 03:38:36 +07:00
|
|
|
/* Cache the lock if possible... */
|
|
|
|
if (test_bit(NFS_DELEGATED_STATE, &state->flags) != 0)
|
|
|
|
return 0;
|
2009-12-09 16:50:14 +07:00
|
|
|
err = _nfs4_do_setlk(state, F_SETLK, request, NFS_LOCK_RECLAIM);
|
2010-10-20 06:47:49 +07:00
|
|
|
if (err != -NFS4ERR_DELAY)
|
2005-06-23 00:16:29 +07:00
|
|
|
break;
|
|
|
|
nfs4_handle_exception(server, err, &exception);
|
|
|
|
} while (exception.retry);
|
|
|
|
return err;
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
static int nfs4_lock_expired(struct nfs4_state *state, struct file_lock *request)
|
|
|
|
{
|
2005-06-23 00:16:29 +07:00
|
|
|
struct nfs_server *server = NFS_SERVER(state->inode);
|
2012-04-18 23:20:10 +07:00
|
|
|
struct nfs4_exception exception = {
|
|
|
|
.inode = state->inode,
|
|
|
|
};
|
2005-06-23 00:16:29 +07:00
|
|
|
int err;
|
|
|
|
|
2005-11-05 03:39:36 +07:00
|
|
|
err = nfs4_set_lock_state(state, request);
|
|
|
|
if (err != 0)
|
|
|
|
return err;
|
2013-09-04 21:08:54 +07:00
|
|
|
if (!recover_lost_locks) {
|
2013-09-04 14:04:49 +07:00
|
|
|
set_bit(NFS_LOCK_LOST, &request->fl_u.nfs4_fl.owner->ls_flags);
|
|
|
|
return 0;
|
|
|
|
}
|
2005-06-23 00:16:29 +07:00
|
|
|
do {
|
2006-06-30 03:38:36 +07:00
|
|
|
if (test_bit(NFS_DELEGATED_STATE, &state->flags) != 0)
|
|
|
|
return 0;
|
2009-12-09 16:50:14 +07:00
|
|
|
err = _nfs4_do_setlk(state, F_SETLK, request, NFS_LOCK_EXPIRED);
|
2009-12-04 03:53:21 +07:00
|
|
|
switch (err) {
|
|
|
|
default:
|
|
|
|
goto out;
|
|
|
|
case -NFS4ERR_GRACE:
|
|
|
|
case -NFS4ERR_DELAY:
|
|
|
|
nfs4_handle_exception(server, err, &exception);
|
|
|
|
err = 0;
|
|
|
|
}
|
2005-06-23 00:16:29 +07:00
|
|
|
} while (exception.retry);
|
2009-12-04 03:53:21 +07:00
|
|
|
out:
|
2005-06-23 00:16:29 +07:00
|
|
|
return err;
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
2011-06-03 01:59:10 +07:00
|
|
|
#if defined(CONFIG_NFS_V4_1)
/*
 * NFSv4.1 variant of lock expiry handling: locks whose lock state is
 * already initialised, or already marked lost, need nothing further;
 * everything else goes through nfs4_lock_expired().
 */
static int nfs41_lock_expired(struct nfs4_state *state, struct file_lock *request)
{
	struct nfs4_lock_state *lsp;
	int status = nfs4_set_lock_state(state, request);

	if (status)
		return status;

	lsp = request->fl_u.nfs4_fl.owner;
	if (!test_bit(NFS_LOCK_INITIALIZED, &lsp->ls_flags) &&
	    !test_bit(NFS_LOCK_LOST, &lsp->ls_flags))
		return nfs4_lock_expired(state, request);
	return 0;
}
#endif
|
|
|
|
|
2005-04-17 05:20:36 +07:00
|
|
|
static int _nfs4_proc_setlk(struct nfs4_state *state, int cmd, struct file_lock *request)
|
|
|
|
{
|
2008-12-24 03:21:44 +07:00
|
|
|
struct nfs_inode *nfsi = NFS_I(state->inode);
|
2016-04-12 03:20:22 +07:00
|
|
|
struct nfs4_state_owner *sp = state->owner;
|
2006-06-30 03:38:39 +07:00
|
|
|
unsigned char fl_flags = request->fl_flags;
|
2016-09-18 05:17:37 +07:00
|
|
|
int status;
|
2005-04-17 05:20:36 +07:00
|
|
|
|
2006-06-30 03:38:39 +07:00
|
|
|
request->fl_flags |= FL_ACCESS;
|
2016-09-18 05:17:32 +07:00
|
|
|
status = locks_lock_inode_wait(state->inode, request);
|
2006-06-30 03:38:39 +07:00
|
|
|
if (status < 0)
|
|
|
|
goto out;
|
2016-04-12 03:20:22 +07:00
|
|
|
mutex_lock(&sp->so_delegreturn_mutex);
|
2008-12-24 03:21:44 +07:00
|
|
|
down_read(&nfsi->rwsem);
|
2006-06-30 03:38:39 +07:00
|
|
|
if (test_bit(NFS_DELEGATED_STATE, &state->flags)) {
|
|
|
|
/* Yes: cache locks! */
|
|
|
|
/* ...but avoid races with delegation recall... */
|
2008-12-24 03:21:44 +07:00
|
|
|
request->fl_flags = fl_flags & ~FL_SLEEP;
|
2016-09-18 05:17:32 +07:00
|
|
|
status = locks_lock_inode_wait(state->inode, request);
|
2015-01-25 04:03:52 +07:00
|
|
|
up_read(&nfsi->rwsem);
|
2016-04-12 03:20:22 +07:00
|
|
|
mutex_unlock(&sp->so_delegreturn_mutex);
|
2013-02-05 08:17:49 +07:00
|
|
|
goto out;
|
|
|
|
}
|
2008-12-24 03:21:44 +07:00
|
|
|
up_read(&nfsi->rwsem);
|
2016-04-12 03:20:22 +07:00
|
|
|
mutex_unlock(&sp->so_delegreturn_mutex);
|
2015-01-25 04:03:52 +07:00
|
|
|
status = _nfs4_do_setlk(state, cmd, request, NFS_LOCK_NEW);
|
2006-06-30 03:38:39 +07:00
|
|
|
out:
|
|
|
|
request->fl_flags = fl_flags;
|
2005-04-17 05:20:36 +07:00
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int nfs4_proc_setlk(struct nfs4_state *state, int cmd, struct file_lock *request)
|
|
|
|
{
|
2012-03-06 07:56:44 +07:00
|
|
|
struct nfs4_exception exception = {
|
|
|
|
.state = state,
|
2012-04-18 23:20:10 +07:00
|
|
|
.inode = state->inode,
|
2012-03-06 07:56:44 +07:00
|
|
|
};
|
2005-04-17 05:20:36 +07:00
|
|
|
int err;
|
|
|
|
|
|
|
|
do {
|
2009-06-18 03:22:59 +07:00
|
|
|
err = _nfs4_proc_setlk(state, cmd, request);
|
|
|
|
if (err == -NFS4ERR_DENIED)
|
|
|
|
err = -EAGAIN;
|
2005-04-17 05:20:36 +07:00
|
|
|
err = nfs4_handle_exception(NFS_SERVER(state->inode),
|
2009-06-18 03:22:59 +07:00
|
|
|
err, &exception);
|
2005-04-17 05:20:36 +07:00
|
|
|
} while (exception.retry);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
2016-09-18 05:17:38 +07:00
|
|
|
#define NFS4_LOCK_MINTIMEOUT (1 * HZ)
|
|
|
|
#define NFS4_LOCK_MAXTIMEOUT (30 * HZ)
|
|
|
|
|
|
|
|
static int
|
2016-09-18 05:17:39 +07:00
|
|
|
nfs4_retry_setlk_simple(struct nfs4_state *state, int cmd,
|
|
|
|
struct file_lock *request)
|
2016-09-18 05:17:38 +07:00
|
|
|
{
|
|
|
|
int status = -ERESTARTSYS;
|
|
|
|
unsigned long timeout = NFS4_LOCK_MINTIMEOUT;
|
|
|
|
|
|
|
|
while(!signalled()) {
|
|
|
|
status = nfs4_proc_setlk(state, cmd, request);
|
|
|
|
if ((status != -EAGAIN) || IS_SETLK(cmd))
|
|
|
|
break;
|
|
|
|
freezable_schedule_timeout_interruptible(timeout);
|
|
|
|
timeout *= 2;
|
|
|
|
timeout = min_t(unsigned long, NFS4_LOCK_MAXTIMEOUT, timeout);
|
|
|
|
status = -ERESTARTSYS;
|
|
|
|
}
|
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
2016-09-18 05:17:39 +07:00
|
|
|
#ifdef CONFIG_NFS_V4_1
|
|
|
|
struct nfs4_lock_waiter {
|
|
|
|
struct task_struct *task;
|
|
|
|
struct inode *inode;
|
|
|
|
struct nfs_lowner *owner;
|
|
|
|
bool notified;
|
|
|
|
};
|
|
|
|
|
|
|
|
static int
|
2017-06-20 17:06:13 +07:00
|
|
|
nfs4_wake_lock_waiter(wait_queue_entry_t *wait, unsigned int mode, int flags, void *key)
|
2016-09-18 05:17:39 +07:00
|
|
|
{
|
|
|
|
int ret;
|
|
|
|
struct nfs4_lock_waiter *waiter = wait->private;
|
|
|
|
|
2018-03-18 19:37:03 +07:00
|
|
|
/* NULL key means to wake up everyone */
|
|
|
|
if (key) {
|
|
|
|
struct cb_notify_lock_args *cbnl = key;
|
|
|
|
struct nfs_lowner *lowner = &cbnl->cbnl_owner,
|
|
|
|
*wowner = waiter->owner;
|
2016-09-18 05:17:39 +07:00
|
|
|
|
2018-03-18 19:37:03 +07:00
|
|
|
/* Only wake if the callback was for the same owner. */
|
|
|
|
if (lowner->id != wowner->id || lowner->s_dev != wowner->s_dev)
|
|
|
|
return 0;
|
2016-09-18 05:17:39 +07:00
|
|
|
|
2018-03-18 19:37:03 +07:00
|
|
|
/* Make sure it's for the right inode */
|
|
|
|
if (nfs_compare_fh(NFS_FH(waiter->inode), &cbnl->cbnl_fh))
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
waiter->notified = true;
|
|
|
|
}
|
2016-09-18 05:17:39 +07:00
|
|
|
|
|
|
|
/* override "private" so we can use default_wake_function */
|
|
|
|
wait->private = waiter->task;
|
|
|
|
ret = autoremove_wake_function(wait, mode, flags, key);
|
|
|
|
wait->private = waiter;
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int
|
|
|
|
nfs4_retry_setlk(struct nfs4_state *state, int cmd, struct file_lock *request)
|
|
|
|
{
|
|
|
|
int status = -ERESTARTSYS;
|
|
|
|
unsigned long flags;
|
|
|
|
struct nfs4_lock_state *lsp = request->fl_u.nfs4_fl.owner;
|
|
|
|
struct nfs_server *server = NFS_SERVER(state->inode);
|
|
|
|
struct nfs_client *clp = server->nfs_client;
|
|
|
|
wait_queue_head_t *q = &clp->cl_lock_waitq;
|
|
|
|
struct nfs_lowner owner = { .clientid = clp->cl_clientid,
|
|
|
|
.id = lsp->ls_seqid.owner_id,
|
|
|
|
.s_dev = server->s_dev };
|
|
|
|
struct nfs4_lock_waiter waiter = { .task = current,
|
|
|
|
.inode = state->inode,
|
|
|
|
.owner = &owner,
|
|
|
|
.notified = false };
|
2017-06-20 17:06:13 +07:00
|
|
|
wait_queue_entry_t wait;
|
2016-09-18 05:17:39 +07:00
|
|
|
|
|
|
|
/* Don't bother with waitqueue if we don't expect a callback */
|
|
|
|
if (!test_bit(NFS_STATE_MAY_NOTIFY_LOCK, &state->flags))
|
|
|
|
return nfs4_retry_setlk_simple(state, cmd, request);
|
|
|
|
|
|
|
|
init_wait(&wait);
|
|
|
|
wait.private = &waiter;
|
|
|
|
wait.func = nfs4_wake_lock_waiter;
|
|
|
|
add_wait_queue(q, &wait);
|
|
|
|
|
|
|
|
while(!signalled()) {
|
2018-03-18 19:37:01 +07:00
|
|
|
waiter.notified = false;
|
2016-09-18 05:17:39 +07:00
|
|
|
status = nfs4_proc_setlk(state, cmd, request);
|
|
|
|
if ((status != -EAGAIN) || IS_SETLK(cmd))
|
|
|
|
break;
|
|
|
|
|
|
|
|
status = -ERESTARTSYS;
|
|
|
|
spin_lock_irqsave(&q->lock, flags);
|
|
|
|
if (waiter.notified) {
|
|
|
|
spin_unlock_irqrestore(&q->lock, flags);
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
set_current_state(TASK_INTERRUPTIBLE);
|
|
|
|
spin_unlock_irqrestore(&q->lock, flags);
|
|
|
|
|
2017-07-28 23:33:54 +07:00
|
|
|
freezable_schedule_timeout(NFS4_LOCK_MAXTIMEOUT);
|
2016-09-18 05:17:39 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
finish_wait(q, &wait);
|
|
|
|
return status;
|
|
|
|
}
|
|
|
|
#else /* !CONFIG_NFS_V4_1 */
|
|
|
|
/* Without NFSv4.1 support, lock retries always use the polling loop. */
static inline int
nfs4_retry_setlk(struct nfs4_state *state, int cmd, struct file_lock *request)
{
	int status = nfs4_retry_setlk_simple(state, cmd, request);

	return status;
}
|
|
|
|
#endif
|
|
|
|
|
2005-04-17 05:20:36 +07:00
|
|
|
static int
|
|
|
|
nfs4_proc_lock(struct file *filp, int cmd, struct file_lock *request)
|
|
|
|
{
|
|
|
|
struct nfs_open_context *ctx;
|
|
|
|
struct nfs4_state *state;
|
|
|
|
int status;
|
|
|
|
|
|
|
|
/* verify open state */
|
2007-08-11 04:44:32 +07:00
|
|
|
ctx = nfs_file_open_context(filp);
|
2005-04-17 05:20:36 +07:00
|
|
|
state = ctx->state;
|
|
|
|
|
2009-07-22 06:22:38 +07:00
|
|
|
if (IS_GETLK(cmd)) {
|
|
|
|
if (state != NULL)
|
|
|
|
return nfs4_proc_getlk(state, F_GETLK, request);
|
|
|
|
return 0;
|
|
|
|
}
|
2005-04-17 05:20:36 +07:00
|
|
|
|
|
|
|
if (!(IS_SETLK(cmd) || IS_SETLKW(cmd)))
|
|
|
|
return -EINVAL;
|
|
|
|
|
2009-07-22 06:22:38 +07:00
|
|
|
if (request->fl_type == F_UNLCK) {
|
|
|
|
if (state != NULL)
|
|
|
|
return nfs4_proc_unlck(state, cmd, request);
|
|
|
|
return 0;
|
|
|
|
}
|
2005-04-17 05:20:36 +07:00
|
|
|
|
2009-07-22 06:22:38 +07:00
|
|
|
if (state == NULL)
|
|
|
|
return -ENOLCK;
|
2016-09-18 05:17:37 +07:00
|
|
|
|
|
|
|
if ((request->fl_flags & FL_POSIX) &&
|
|
|
|
!test_bit(NFS_STATE_POSIX_LOCKS, &state->flags))
|
|
|
|
return -ENOLCK;
|
|
|
|
|
2017-11-10 18:27:49 +07:00
|
|
|
/*
|
|
|
|
* Don't rely on the VFS having checked the file open mode,
|
|
|
|
* since it won't do this for flock() locks.
|
|
|
|
*/
|
|
|
|
switch (request->fl_type) {
|
|
|
|
case F_RDLCK:
|
|
|
|
if (!(filp->f_mode & FMODE_READ))
|
|
|
|
return -EBADF;
|
|
|
|
break;
|
|
|
|
case F_WRLCK:
|
|
|
|
if (!(filp->f_mode & FMODE_WRITE))
|
|
|
|
return -EBADF;
|
|
|
|
}
|
|
|
|
|
2016-09-18 05:17:37 +07:00
|
|
|
status = nfs4_set_lock_state(state, request);
|
|
|
|
if (status != 0)
|
|
|
|
return status;
|
|
|
|
|
2016-09-18 05:17:38 +07:00
|
|
|
return nfs4_retry_setlk(state, cmd, request);
|
2005-04-17 05:20:36 +07:00
|
|
|
}
|
|
|
|
|
2013-04-02 02:56:46 +07:00
|
|
|
int nfs4_lock_delegation_recall(struct file_lock *fl, struct nfs4_state *state, const nfs4_stateid *stateid)
|
2005-11-05 03:38:11 +07:00
|
|
|
{
|
|
|
|
struct nfs_server *server = NFS_SERVER(state->inode);
|
|
|
|
int err;
|
|
|
|
|
|
|
|
err = nfs4_set_lock_state(state, fl);
|
|
|
|
if (err != 0)
|
2013-04-02 02:56:46 +07:00
|
|
|
return err;
|
2013-04-02 01:47:22 +07:00
|
|
|
err = _nfs4_do_setlk(state, F_SETLK, fl, NFS_LOCK_NEW);
|
2017-12-13 05:57:09 +07:00
|
|
|
return nfs4_handle_delegation_recall_error(server, state, stateid, fl, err);
|
2005-11-05 03:38:11 +07:00
|
|
|
}
|
2005-06-23 00:16:22 +07:00
|
|
|
|
2012-03-08 01:49:12 +07:00
|
|
|
struct nfs_release_lockowner_data {
|
|
|
|
struct nfs4_lock_state *lsp;
|
2012-03-20 03:17:18 +07:00
|
|
|
struct nfs_server *server;
|
2012-03-08 01:49:12 +07:00
|
|
|
struct nfs_release_lockowner_args args;
|
2014-02-27 02:19:14 +07:00
|
|
|
struct nfs_release_lockowner_res res;
|
NFS: Migration support for RELEASE_LOCKOWNER
Currently the Linux NFS client ignores the operation status code for
the RELEASE_LOCKOWNER operation. Like NFSv3's UMNT operation,
RELEASE_LOCKOWNER is a courtesy to help servers manage their
resources, and the outcome is not consequential for the client.
During a migration, a server may report NFS4ERR_LEASE_MOVED, in
which case the client really should retry, since typically
LEASE_MOVED has nothing to do with the current operation, but does
prevent it from going forward.
Also, it's important for a client to respond as soon as possible to
a moved lease condition, since the client's lease could expire on
the destination without further action by the client.
NFS4ERR_DELAY is not included in the list of valid status codes for
RELEASE_LOCKOWNER in RFC 3530bis. However, rfc3530-migration-update
does permit migration-capable servers to return DELAY to clients,
but only in the context of an ongoing migration. In this case the
server has frozen lock state in preparation for migration, and a
client retry would help the destination server purge unneeded state
once migration recovery is complete.
Interestly, NFS4ERR_MOVED is not valid for RELEASE_LOCKOWNER, even
though lock owners can be migrated with Transparent State Migration.
Note that RFC 3530bis section 9.5 includes RELEASE_LOCKOWNER in the
list of operations that renew a client's lease on the server if they
succeed. Now that our client pays attention to the operation's
status code, we can note that renewal appropriately.
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
2013-10-18 01:13:47 +07:00
|
|
|
unsigned long timestamp;
|
2012-03-08 01:49:12 +07:00
|
|
|
};
|
|
|
|
|
2013-08-09 23:49:38 +07:00
|
|
|
static void nfs4_release_lockowner_prepare(struct rpc_task *task, void *calldata)
|
|
|
|
{
|
|
|
|
struct nfs_release_lockowner_data *data = calldata;
|
2014-08-04 15:18:16 +07:00
|
|
|
struct nfs_server *server = data->server;
|
2017-01-10 23:39:53 +07:00
|
|
|
nfs4_setup_sequence(server->nfs_client, &data->args.seq_args,
|
|
|
|
&data->res.seq_res, task);
|
2014-08-04 15:18:16 +07:00
|
|
|
data->args.lock_owner.clientid = server->nfs_client->cl_clientid;
|
NFS: Migration support for RELEASE_LOCKOWNER
Currently the Linux NFS client ignores the operation status code for
the RELEASE_LOCKOWNER operation. Like NFSv3's UMNT operation,
RELEASE_LOCKOWNER is a courtesy to help servers manage their
resources, and the outcome is not consequential for the client.
During a migration, a server may report NFS4ERR_LEASE_MOVED, in
which case the client really should retry, since typically
LEASE_MOVED has nothing to do with the current operation, but does
prevent it from going forward.
Also, it's important for a client to respond as soon as possible to
a moved lease condition, since the client's lease could expire on
the destination without further action by the client.
NFS4ERR_DELAY is not included in the list of valid status codes for
RELEASE_LOCKOWNER in RFC 3530bis. However, rfc3530-migration-update
does permit migration-capable servers to return DELAY to clients,
but only in the context of an ongoing migration. In this case the
server has frozen lock state in preparation for migration, and a
client retry would help the destination server purge unneeded state
once migration recovery is complete.
Interestly, NFS4ERR_MOVED is not valid for RELEASE_LOCKOWNER, even
though lock owners can be migrated with Transparent State Migration.
Note that RFC 3530bis section 9.5 includes RELEASE_LOCKOWNER in the
list of operations that renew a client's lease on the server if they
succeed. Now that our client pays attention to the operation's
status code, we can note that renewal appropriately.
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
2013-10-18 01:13:47 +07:00
|
|
|
data->timestamp = jiffies;
|
2013-08-09 23:49:38 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
static void nfs4_release_lockowner_done(struct rpc_task *task, void *calldata)
|
|
|
|
{
|
|
|
|
struct nfs_release_lockowner_data *data = calldata;
|
NFS: Migration support for RELEASE_LOCKOWNER
Currently the Linux NFS client ignores the operation status code for
the RELEASE_LOCKOWNER operation. Like NFSv3's UMNT operation,
RELEASE_LOCKOWNER is a courtesy to help servers manage their
resources, and the outcome is not consequential for the client.
During a migration, a server may report NFS4ERR_LEASE_MOVED, in
which case the client really should retry, since typically
LEASE_MOVED has nothing to do with the current operation, but does
prevent it from going forward.
Also, it's important for a client to respond as soon as possible to
a moved lease condition, since the client's lease could expire on
the destination without further action by the client.
NFS4ERR_DELAY is not included in the list of valid status codes for
RELEASE_LOCKOWNER in RFC 3530bis. However, rfc3530-migration-update
does permit migration-capable servers to return DELAY to clients,
but only in the context of an ongoing migration. In this case the
server has frozen lock state in preparation for migration, and a
client retry would help the destination server purge unneeded state
once migration recovery is complete.
Interestingly, NFS4ERR_MOVED is not valid for RELEASE_LOCKOWNER, even
though lock owners can be migrated with Transparent State Migration.
Note that RFC 3530bis section 9.5 includes RELEASE_LOCKOWNER in the
list of operations that renew a client's lease on the server if they
succeed. Now that our client pays attention to the operation's
status code, we can note that renewal appropriately.
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
2013-10-18 01:13:47 +07:00
|
|
|
struct nfs_server *server = data->server;
|
|
|
|
|
2014-02-27 02:19:14 +07:00
|
|
|
nfs40_sequence_done(task, &data->res.seq_res);
|
NFS: Migration support for RELEASE_LOCKOWNER
Currently the Linux NFS client ignores the operation status code for
the RELEASE_LOCKOWNER operation. Like NFSv3's UMNT operation,
RELEASE_LOCKOWNER is a courtesy to help servers manage their
resources, and the outcome is not consequential for the client.
During a migration, a server may report NFS4ERR_LEASE_MOVED, in
which case the client really should retry, since typically
LEASE_MOVED has nothing to do with the current operation, but does
prevent it from going forward.
Also, it's important for a client to respond as soon as possible to
a moved lease condition, since the client's lease could expire on
the destination without further action by the client.
NFS4ERR_DELAY is not included in the list of valid status codes for
RELEASE_LOCKOWNER in RFC 3530bis. However, rfc3530-migration-update
does permit migration-capable servers to return DELAY to clients,
but only in the context of an ongoing migration. In this case the
server has frozen lock state in preparation for migration, and a
client retry would help the destination server purge unneeded state
once migration recovery is complete.
Interestly, NFS4ERR_MOVED is not valid for RELEASE_LOCKOWNER, even
though lock owners can be migrated with Transparent State Migration.
Note that RFC 3530bis section 9.5 includes RELEASE_LOCKOWNER in the
list of operations that renew a client's lease on the server if they
succeed. Now that our client pays attention to the operation's
status code, we can note that renewal appropriately.
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
2013-10-18 01:13:47 +07:00
|
|
|
|
|
|
|
switch (task->tk_status) {
|
|
|
|
case 0:
|
|
|
|
renew_lease(server, data->timestamp);
|
|
|
|
break;
|
|
|
|
case -NFS4ERR_STALE_CLIENTID:
|
|
|
|
case -NFS4ERR_EXPIRED:
|
2014-08-04 15:18:16 +07:00
|
|
|
nfs4_schedule_lease_recovery(server->nfs_client);
|
|
|
|
break;
|
NFS: Migration support for RELEASE_LOCKOWNER
Currently the Linux NFS client ignores the operation status code for
the RELEASE_LOCKOWNER operation. Like NFSv3's UMNT operation,
RELEASE_LOCKOWNER is a courtesy to help servers manage their
resources, and the outcome is not consequential for the client.
During a migration, a server may report NFS4ERR_LEASE_MOVED, in
which case the client really should retry, since typically
LEASE_MOVED has nothing to do with the current operation, but does
prevent it from going forward.
Also, it's important for a client to respond as soon as possible to
a moved lease condition, since the client's lease could expire on
the destination without further action by the client.
NFS4ERR_DELAY is not included in the list of valid status codes for
RELEASE_LOCKOWNER in RFC 3530bis. However, rfc3530-migration-update
does permit migration-capable servers to return DELAY to clients,
but only in the context of an ongoing migration. In this case the
server has frozen lock state in preparation for migration, and a
client retry would help the destination server purge unneeded state
once migration recovery is complete.
Interestly, NFS4ERR_MOVED is not valid for RELEASE_LOCKOWNER, even
though lock owners can be migrated with Transparent State Migration.
Note that RFC 3530bis section 9.5 includes RELEASE_LOCKOWNER in the
list of operations that renew a client's lease on the server if they
succeed. Now that our client pays attention to the operation's
status code, we can note that renewal appropriately.
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
2013-10-18 01:13:47 +07:00
|
|
|
case -NFS4ERR_LEASE_MOVED:
|
|
|
|
case -NFS4ERR_DELAY:
|
2014-09-18 13:09:27 +07:00
|
|
|
if (nfs4_async_handle_error(task, server,
|
|
|
|
NULL, NULL) == -EAGAIN)
|
NFS: Migration support for RELEASE_LOCKOWNER
Currently the Linux NFS client ignores the operation status code for
the RELEASE_LOCKOWNER operation. Like NFSv3's UMNT operation,
RELEASE_LOCKOWNER is a courtesy to help servers manage their
resources, and the outcome is not consequential for the client.
During a migration, a server may report NFS4ERR_LEASE_MOVED, in
which case the client really should retry, since typically
LEASE_MOVED has nothing to do with the current operation, but does
prevent it from going forward.
Also, it's important for a client to respond as soon as possible to
a moved lease condition, since the client's lease could expire on
the destination without further action by the client.
NFS4ERR_DELAY is not included in the list of valid status codes for
RELEASE_LOCKOWNER in RFC 3530bis. However, rfc3530-migration-update
does permit migration-capable servers to return DELAY to clients,
but only in the context of an ongoing migration. In this case the
server has frozen lock state in preparation for migration, and a
client retry would help the destination server purge unneeded state
once migration recovery is complete.
Interestly, NFS4ERR_MOVED is not valid for RELEASE_LOCKOWNER, even
though lock owners can be migrated with Transparent State Migration.
Note that RFC 3530bis section 9.5 includes RELEASE_LOCKOWNER in the
list of operations that renew a client's lease on the server if they
succeed. Now that our client pays attention to the operation's
status code, we can note that renewal appropriately.
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
2013-10-18 01:13:47 +07:00
|
|
|
rpc_restart_call_prepare(task);
|
|
|
|
}
|
2013-08-09 23:49:38 +07:00
|
|
|
}
|
|
|
|
|
2010-07-01 23:49:01 +07:00
|
|
|
static void nfs4_release_lockowner_release(void *calldata)
|
|
|
|
{
|
2012-03-08 01:49:12 +07:00
|
|
|
struct nfs_release_lockowner_data *data = calldata;
|
2012-03-20 03:17:18 +07:00
|
|
|
nfs4_free_lock_state(data->server, data->lsp);
|
2010-07-01 23:49:01 +07:00
|
|
|
kfree(calldata);
|
|
|
|
}
|
|
|
|
|
2012-03-12 00:11:00 +07:00
|
|
|
static const struct rpc_call_ops nfs4_release_lockowner_ops = {
|
2013-08-09 23:49:38 +07:00
|
|
|
.rpc_call_prepare = nfs4_release_lockowner_prepare,
|
|
|
|
.rpc_call_done = nfs4_release_lockowner_done,
|
2010-07-01 23:49:01 +07:00
|
|
|
.rpc_release = nfs4_release_lockowner_release,
|
|
|
|
};
|
|
|
|
|
2014-05-01 17:28:47 +07:00
|
|
|
static void
|
|
|
|
nfs4_release_lockowner(struct nfs_server *server, struct nfs4_lock_state *lsp)
|
2010-07-01 23:49:01 +07:00
|
|
|
{
|
2012-03-08 01:49:12 +07:00
|
|
|
struct nfs_release_lockowner_data *data;
|
2010-07-01 23:49:01 +07:00
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_RELEASE_LOCKOWNER],
|
|
|
|
};
|
|
|
|
|
|
|
|
if (server->nfs_client->cl_mvops->minor_version != 0)
|
2014-05-01 17:28:47 +07:00
|
|
|
return;
|
2013-08-09 23:49:38 +07:00
|
|
|
|
2012-03-08 01:49:12 +07:00
|
|
|
data = kmalloc(sizeof(*data), GFP_NOFS);
|
|
|
|
if (!data)
|
2014-05-01 17:28:47 +07:00
|
|
|
return;
|
2012-03-08 01:49:12 +07:00
|
|
|
data->lsp = lsp;
|
2012-03-20 03:17:18 +07:00
|
|
|
data->server = server;
|
2012-03-08 01:49:12 +07:00
|
|
|
data->args.lock_owner.clientid = server->nfs_client->cl_clientid;
|
|
|
|
data->args.lock_owner.id = lsp->ls_seqid.owner_id;
|
|
|
|
data->args.lock_owner.s_dev = server->s_dev;
|
2013-08-09 23:49:38 +07:00
|
|
|
|
2012-03-08 01:49:12 +07:00
|
|
|
msg.rpc_argp = &data->args;
|
2014-02-27 02:19:14 +07:00
|
|
|
msg.rpc_resp = &data->res;
|
2018-05-05 03:22:50 +07:00
|
|
|
nfs4_init_sequence(&data->args.seq_args, &data->res.seq_res, 0, 0);
|
2012-03-08 01:49:12 +07:00
|
|
|
rpc_call_async(server->client, &msg, 0, &nfs4_release_lockowner_ops, data);
|
2010-07-01 23:49:01 +07:00
|
|
|
}
|
|
|
|
|
2005-06-23 00:16:22 +07:00
|
|
|
#define XATTR_NAME_NFSV4_ACL "system.nfs4_acl"
|
|
|
|
|
2015-10-05 00:18:51 +07:00
|
|
|
static int nfs4_xattr_set_nfs4_acl(const struct xattr_handler *handler,
|
2016-05-27 21:19:30 +07:00
|
|
|
struct dentry *unused, struct inode *inode,
|
|
|
|
const char *key, const void *buf,
|
|
|
|
size_t buflen, int flags)
|
2005-06-23 00:16:22 +07:00
|
|
|
{
|
2016-05-27 21:19:30 +07:00
|
|
|
return nfs4_proc_set_acl(inode, buf, buflen);
|
2005-06-23 00:16:22 +07:00
|
|
|
}
|
|
|
|
|
2015-10-05 00:18:51 +07:00
|
|
|
/*
 * xattr ->get handler for the NFSv4 ACL attribute.
 *
 * Only @inode, @buf and @buflen are used; they are passed straight to
 * nfs4_proc_get_acl() and its result is returned.
 */
static int
nfs4_xattr_get_nfs4_acl(const struct xattr_handler *handler,
			struct dentry *unused, struct inode *inode,
			const char *key, void *buf, size_t buflen)
{
	return nfs4_proc_get_acl(inode, buf, buflen);
}
|
|
|
|
|
2015-12-02 20:44:43 +07:00
|
|
|
/*
 * xattr ->list predicate for the NFSv4 ACL attribute: reports whatever
 * nfs4_server_supports_acls() says about the server backing @dentry's
 * inode.
 */
static bool nfs4_xattr_list_nfs4_acl(struct dentry *dentry)
{
	struct inode *inode = d_inode(dentry);

	return nfs4_server_supports_acls(NFS_SERVER(inode));
}
|
|
|
|
|
2013-05-22 23:50:45 +07:00
|
|
|
#ifdef CONFIG_NFS_V4_SECURITY_LABEL
|
|
|
|
|
2015-10-05 00:18:51 +07:00
|
|
|
static int nfs4_xattr_set_nfs4_label(const struct xattr_handler *handler,
|
2016-05-27 21:19:30 +07:00
|
|
|
struct dentry *unused, struct inode *inode,
|
|
|
|
const char *key, const void *buf,
|
|
|
|
size_t buflen, int flags)
|
2013-05-22 23:50:45 +07:00
|
|
|
{
|
|
|
|
if (security_ismaclabel(key))
|
2016-05-27 21:19:30 +07:00
|
|
|
return nfs4_set_security_label(inode, buf, buflen);
|
2013-05-22 23:50:45 +07:00
|
|
|
|
|
|
|
return -EOPNOTSUPP;
|
|
|
|
}
|
|
|
|
|
2015-10-05 00:18:51 +07:00
|
|
|
/*
 * xattr ->get handler for the security.* namespace.
 *
 * Returns the result of nfs4_get_security_label() when
 * security_ismaclabel() accepts @key, -EOPNOTSUPP otherwise.
 */
static int
nfs4_xattr_get_nfs4_label(const struct xattr_handler *handler,
			  struct dentry *unused, struct inode *inode,
			  const char *key, void *buf, size_t buflen)
{
	if (!security_ismaclabel(key))
		return -EOPNOTSUPP;

	return nfs4_get_security_label(inode, buf, buflen);
}
|
|
|
|
|
2015-12-02 20:44:41 +07:00
|
|
|
static ssize_t
|
|
|
|
nfs4_listxattr_nfs4_label(struct inode *inode, char *list, size_t list_len)
|
2013-05-22 23:50:45 +07:00
|
|
|
{
|
2015-12-02 20:44:41 +07:00
|
|
|
int len = 0;
|
2013-05-22 23:50:45 +07:00
|
|
|
|
2015-12-02 20:44:41 +07:00
|
|
|
if (nfs_server_capable(inode, NFS_CAP_SECURITY_LABEL)) {
|
|
|
|
len = security_inode_listsecurity(inode, list, list_len);
|
|
|
|
if (list_len && len > list_len)
|
|
|
|
return -ERANGE;
|
2013-05-22 23:50:45 +07:00
|
|
|
}
|
|
|
|
return len;
|
|
|
|
}
|
|
|
|
|
|
|
|
static const struct xattr_handler nfs4_xattr_nfs4_label_handler = {
|
|
|
|
.prefix = XATTR_SECURITY_PREFIX,
|
|
|
|
.get = nfs4_xattr_get_nfs4_label,
|
|
|
|
.set = nfs4_xattr_set_nfs4_label,
|
|
|
|
};
|
|
|
|
|
2015-12-02 20:44:41 +07:00
|
|
|
#else
|
|
|
|
|
|
|
|
static ssize_t
|
|
|
|
nfs4_listxattr_nfs4_label(struct inode *inode, char *list, size_t list_len)
|
|
|
|
{
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
#endif
|
2013-05-22 23:50:45 +07:00
|
|
|
|
2011-06-14 05:25:56 +07:00
|
|
|
/*
|
|
|
|
* nfs_fhget will use either the mounted_on_fileid or the fileid
|
|
|
|
*/
|
2009-03-12 01:10:28 +07:00
|
|
|
static void nfs_fixup_referral_attributes(struct nfs_fattr *fattr)
|
|
|
|
{
|
2011-06-14 05:25:56 +07:00
|
|
|
if (!(((fattr->valid & NFS_ATTR_FATTR_MOUNTED_ON_FILEID) ||
|
|
|
|
(fattr->valid & NFS_ATTR_FATTR_FILEID)) &&
|
|
|
|
(fattr->valid & NFS_ATTR_FATTR_FSID) &&
|
2012-03-02 05:01:57 +07:00
|
|
|
(fattr->valid & NFS_ATTR_FATTR_V4_LOCATIONS)))
|
2009-03-12 01:10:28 +07:00
|
|
|
return;
|
|
|
|
|
|
|
|
fattr->valid |= NFS_ATTR_FATTR_TYPE | NFS_ATTR_FATTR_MODE |
|
2012-03-02 05:01:57 +07:00
|
|
|
NFS_ATTR_FATTR_NLINK | NFS_ATTR_FATTR_V4_REFERRAL;
|
2009-03-12 01:10:28 +07:00
|
|
|
fattr->mode = S_IFDIR | S_IRUGO | S_IXUGO;
|
|
|
|
fattr->nlink = 2;
|
|
|
|
}
|
|
|
|
|
2012-04-28 00:27:41 +07:00
|
|
|
static int _nfs4_proc_fs_locations(struct rpc_clnt *client, struct inode *dir,
|
|
|
|
const struct qstr *name,
|
|
|
|
struct nfs4_fs_locations *fs_locations,
|
|
|
|
struct page *page)
|
2006-06-09 20:34:22 +07:00
|
|
|
{
|
|
|
|
struct nfs_server *server = NFS_SERVER(dir);
|
2017-11-06 03:45:22 +07:00
|
|
|
u32 bitmask[3];
|
2006-06-09 20:34:22 +07:00
|
|
|
struct nfs4_fs_locations_arg args = {
|
|
|
|
.dir_fh = NFS_FH(dir),
|
2007-01-13 14:28:11 +07:00
|
|
|
.name = name,
|
2006-06-09 20:34:22 +07:00
|
|
|
.page = page,
|
|
|
|
.bitmask = bitmask,
|
|
|
|
};
|
2009-04-01 20:22:02 +07:00
|
|
|
struct nfs4_fs_locations_res res = {
|
|
|
|
.fs_locations = fs_locations,
|
|
|
|
};
|
2006-06-09 20:34:22 +07:00
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_FS_LOCATIONS],
|
|
|
|
.rpc_argp = &args,
|
2009-04-01 20:22:02 +07:00
|
|
|
.rpc_resp = &res,
|
2006-06-09 20:34:22 +07:00
|
|
|
};
|
|
|
|
int status;
|
|
|
|
|
2008-05-03 03:42:44 +07:00
|
|
|
dprintk("%s: start\n", __func__);
|
2011-06-14 05:25:56 +07:00
|
|
|
|
2017-11-06 03:45:22 +07:00
|
|
|
bitmask[0] = nfs4_fattr_bitmap[0] | FATTR4_WORD0_FS_LOCATIONS;
|
|
|
|
bitmask[1] = nfs4_fattr_bitmap[1];
|
|
|
|
|
2011-06-14 05:25:56 +07:00
|
|
|
/* Ask for the fileid of the absent filesystem if mounted_on_fileid
|
|
|
|
* is not supported */
|
|
|
|
if (NFS_SERVER(dir)->attr_bitmask[1] & FATTR4_WORD1_MOUNTED_ON_FILEID)
|
2017-11-06 03:45:22 +07:00
|
|
|
bitmask[0] &= ~FATTR4_WORD0_FILEID;
|
2011-06-14 05:25:56 +07:00
|
|
|
else
|
2017-11-06 03:45:22 +07:00
|
|
|
bitmask[1] &= ~FATTR4_WORD1_MOUNTED_ON_FILEID;
|
2011-06-14 05:25:56 +07:00
|
|
|
|
2007-01-13 14:28:11 +07:00
|
|
|
nfs_fattr_init(&fs_locations->fattr);
|
2006-06-09 20:34:22 +07:00
|
|
|
fs_locations->server = server;
|
2006-06-09 20:34:25 +07:00
|
|
|
fs_locations->nlocations = 0;
|
2012-04-28 00:27:41 +07:00
|
|
|
status = nfs4_call_sync(client, server, &msg, &args.seq_args, &res.seq_res, 0);
|
2008-05-03 03:42:44 +07:00
|
|
|
dprintk("%s: returned status = %d\n", __func__, status);
|
2006-06-09 20:34:22 +07:00
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
2012-04-28 00:27:41 +07:00
|
|
|
int nfs4_proc_fs_locations(struct rpc_clnt *client, struct inode *dir,
|
|
|
|
const struct qstr *name,
|
|
|
|
struct nfs4_fs_locations *fs_locations,
|
|
|
|
struct page *page)
|
2012-04-28 00:27:39 +07:00
|
|
|
{
|
|
|
|
struct nfs4_exception exception = { };
|
|
|
|
int err;
|
|
|
|
do {
|
2013-08-13 03:45:55 +07:00
|
|
|
err = _nfs4_proc_fs_locations(client, dir, name,
|
|
|
|
fs_locations, page);
|
|
|
|
trace_nfs4_get_fs_locations(dir, name, err);
|
|
|
|
err = nfs4_handle_exception(NFS_SERVER(dir), err,
|
2012-04-28 00:27:39 +07:00
|
|
|
&exception);
|
|
|
|
} while (exception.retry);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
2013-10-18 01:12:50 +07:00
|
|
|
/*
|
|
|
|
* This operation also signals the server that this client is
|
|
|
|
* performing migration recovery. The server can stop returning
|
|
|
|
* NFS4ERR_LEASE_MOVED to this client. A RENEW operation is
|
|
|
|
* appended to this compound to identify the client ID which is
|
|
|
|
* performing recovery.
|
|
|
|
*/
|
|
|
|
static int _nfs40_proc_get_locations(struct inode *inode,
|
|
|
|
struct nfs4_fs_locations *locations,
|
|
|
|
struct page *page, struct rpc_cred *cred)
|
|
|
|
{
|
|
|
|
struct nfs_server *server = NFS_SERVER(inode);
|
|
|
|
struct rpc_clnt *clnt = server->client;
|
|
|
|
u32 bitmask[2] = {
|
|
|
|
[0] = FATTR4_WORD0_FSID | FATTR4_WORD0_FS_LOCATIONS,
|
|
|
|
};
|
|
|
|
struct nfs4_fs_locations_arg args = {
|
|
|
|
.clientid = server->nfs_client->cl_clientid,
|
|
|
|
.fh = NFS_FH(inode),
|
|
|
|
.page = page,
|
|
|
|
.bitmask = bitmask,
|
|
|
|
.migration = 1, /* skip LOOKUP */
|
|
|
|
.renew = 1, /* append RENEW */
|
|
|
|
};
|
|
|
|
struct nfs4_fs_locations_res res = {
|
|
|
|
.fs_locations = locations,
|
|
|
|
.migration = 1,
|
|
|
|
.renew = 1,
|
|
|
|
};
|
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_FS_LOCATIONS],
|
|
|
|
.rpc_argp = &args,
|
|
|
|
.rpc_resp = &res,
|
|
|
|
.rpc_cred = cred,
|
|
|
|
};
|
|
|
|
unsigned long now = jiffies;
|
|
|
|
int status;
|
|
|
|
|
|
|
|
nfs_fattr_init(&locations->fattr);
|
|
|
|
locations->server = server;
|
|
|
|
locations->nlocations = 0;
|
|
|
|
|
2018-05-05 03:22:50 +07:00
|
|
|
nfs4_init_sequence(&args.seq_args, &res.seq_res, 0, 1);
|
2013-10-18 01:12:50 +07:00
|
|
|
status = nfs4_call_sync_sequence(clnt, server, &msg,
|
|
|
|
&args.seq_args, &res.seq_res);
|
|
|
|
if (status)
|
|
|
|
return status;
|
|
|
|
|
|
|
|
renew_lease(server, now);
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
#ifdef CONFIG_NFS_V4_1
|
|
|
|
|
|
|
|
/*
|
|
|
|
* This operation also signals the server that this client is
|
|
|
|
* performing migration recovery. The server can stop asserting
|
|
|
|
* SEQ4_STATUS_LEASE_MOVED for this client. The client ID
|
|
|
|
* performing this operation is identified in the SEQUENCE
|
|
|
|
* operation in this compound.
|
|
|
|
*
|
|
|
|
* When the client supports GETATTR(fs_locations_info), it can
|
|
|
|
* be plumbed in here.
|
|
|
|
*/
|
|
|
|
static int _nfs41_proc_get_locations(struct inode *inode,
|
|
|
|
struct nfs4_fs_locations *locations,
|
|
|
|
struct page *page, struct rpc_cred *cred)
|
|
|
|
{
|
|
|
|
struct nfs_server *server = NFS_SERVER(inode);
|
|
|
|
struct rpc_clnt *clnt = server->client;
|
|
|
|
u32 bitmask[2] = {
|
|
|
|
[0] = FATTR4_WORD0_FSID | FATTR4_WORD0_FS_LOCATIONS,
|
|
|
|
};
|
|
|
|
struct nfs4_fs_locations_arg args = {
|
|
|
|
.fh = NFS_FH(inode),
|
|
|
|
.page = page,
|
|
|
|
.bitmask = bitmask,
|
|
|
|
.migration = 1, /* skip LOOKUP */
|
|
|
|
};
|
|
|
|
struct nfs4_fs_locations_res res = {
|
|
|
|
.fs_locations = locations,
|
|
|
|
.migration = 1,
|
|
|
|
};
|
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_FS_LOCATIONS],
|
|
|
|
.rpc_argp = &args,
|
|
|
|
.rpc_resp = &res,
|
|
|
|
.rpc_cred = cred,
|
|
|
|
};
|
|
|
|
int status;
|
|
|
|
|
|
|
|
nfs_fattr_init(&locations->fattr);
|
|
|
|
locations->server = server;
|
|
|
|
locations->nlocations = 0;
|
|
|
|
|
2018-05-05 03:22:50 +07:00
|
|
|
nfs4_init_sequence(&args.seq_args, &res.seq_res, 0, 1);
|
2013-10-18 01:12:50 +07:00
|
|
|
status = nfs4_call_sync_sequence(clnt, server, &msg,
|
|
|
|
&args.seq_args, &res.seq_res);
|
|
|
|
if (status == NFS4_OK &&
|
|
|
|
res.seq_res.sr_status_flags & SEQ4_STATUS_LEASE_MOVED)
|
|
|
|
status = -NFS4ERR_LEASE_MOVED;
|
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
|
|
|
#endif /* CONFIG_NFS_V4_1 */
|
|
|
|
|
|
|
|
/**
|
|
|
|
* nfs4_proc_get_locations - discover locations for a migrated FSID
|
|
|
|
* @inode: inode on FSID that is migrating
|
|
|
|
* @locations: result of query
|
|
|
|
* @page: buffer
|
|
|
|
* @cred: credential to use for this operation
|
|
|
|
*
|
|
|
|
* Returns NFS4_OK on success, a negative NFS4ERR status code if the
|
|
|
|
* operation failed, or a negative errno if a local error occurred.
|
|
|
|
*
|
|
|
|
* On success, "locations" is filled in, but if the server has
|
|
|
|
* no locations information, NFS_ATTR_FATTR_V4_LOCATIONS is not
|
|
|
|
* asserted.
|
|
|
|
*
|
|
|
|
* -NFS4ERR_LEASE_MOVED is returned if the server still has leases
|
|
|
|
* from this client that require migration recovery.
|
|
|
|
*/
|
|
|
|
int nfs4_proc_get_locations(struct inode *inode,
|
|
|
|
struct nfs4_fs_locations *locations,
|
|
|
|
struct page *page, struct rpc_cred *cred)
|
|
|
|
{
|
|
|
|
struct nfs_server *server = NFS_SERVER(inode);
|
|
|
|
struct nfs_client *clp = server->nfs_client;
|
|
|
|
const struct nfs4_mig_recovery_ops *ops =
|
|
|
|
clp->cl_mvops->mig_recovery_ops;
|
|
|
|
struct nfs4_exception exception = { };
|
|
|
|
int status;
|
|
|
|
|
|
|
|
dprintk("%s: FSID %llx:%llx on \"%s\"\n", __func__,
|
|
|
|
(unsigned long long)server->fsid.major,
|
|
|
|
(unsigned long long)server->fsid.minor,
|
|
|
|
clp->cl_hostname);
|
|
|
|
nfs_display_fhandle(NFS_FH(inode), __func__);
|
|
|
|
|
|
|
|
do {
|
|
|
|
status = ops->get_locations(inode, locations, page, cred);
|
|
|
|
if (status != -NFS4ERR_DELAY)
|
|
|
|
break;
|
|
|
|
nfs4_handle_exception(server, status, &exception);
|
|
|
|
} while (exception.retry);
|
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
2013-10-18 01:13:30 +07:00
|
|
|
/*
|
|
|
|
* This operation also signals the server that this client is
|
|
|
|
* performing "lease moved" recovery. The server can stop
|
|
|
|
* returning NFS4ERR_LEASE_MOVED to this client. A RENEW operation
|
|
|
|
* is appended to this compound to identify the client ID which is
|
|
|
|
* performing recovery.
|
|
|
|
*/
|
|
|
|
static int _nfs40_proc_fsid_present(struct inode *inode, struct rpc_cred *cred)
|
|
|
|
{
|
|
|
|
struct nfs_server *server = NFS_SERVER(inode);
|
|
|
|
struct nfs_client *clp = NFS_SERVER(inode)->nfs_client;
|
|
|
|
struct rpc_clnt *clnt = server->client;
|
|
|
|
struct nfs4_fsid_present_arg args = {
|
|
|
|
.fh = NFS_FH(inode),
|
|
|
|
.clientid = clp->cl_clientid,
|
|
|
|
.renew = 1, /* append RENEW */
|
|
|
|
};
|
|
|
|
struct nfs4_fsid_present_res res = {
|
|
|
|
.renew = 1,
|
|
|
|
};
|
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_FSID_PRESENT],
|
|
|
|
.rpc_argp = &args,
|
|
|
|
.rpc_resp = &res,
|
|
|
|
.rpc_cred = cred,
|
|
|
|
};
|
|
|
|
unsigned long now = jiffies;
|
|
|
|
int status;
|
|
|
|
|
|
|
|
res.fh = nfs_alloc_fhandle();
|
|
|
|
if (res.fh == NULL)
|
|
|
|
return -ENOMEM;
|
|
|
|
|
2018-05-05 03:22:50 +07:00
|
|
|
nfs4_init_sequence(&args.seq_args, &res.seq_res, 0, 1);
|
2013-10-18 01:13:30 +07:00
|
|
|
status = nfs4_call_sync_sequence(clnt, server, &msg,
|
|
|
|
&args.seq_args, &res.seq_res);
|
|
|
|
nfs_free_fhandle(res.fh);
|
|
|
|
if (status)
|
|
|
|
return status;
|
|
|
|
|
|
|
|
do_renew_lease(clp, now);
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
#ifdef CONFIG_NFS_V4_1
|
|
|
|
|
|
|
|
/*
|
|
|
|
* This operation also signals the server that this client is
|
|
|
|
* performing "lease moved" recovery. The server can stop asserting
|
|
|
|
* SEQ4_STATUS_LEASE_MOVED for this client. The client ID performing
|
|
|
|
* this operation is identified in the SEQUENCE operation in this
|
|
|
|
* compound.
|
|
|
|
*/
|
|
|
|
static int _nfs41_proc_fsid_present(struct inode *inode, struct rpc_cred *cred)
|
|
|
|
{
|
|
|
|
struct nfs_server *server = NFS_SERVER(inode);
|
|
|
|
struct rpc_clnt *clnt = server->client;
|
|
|
|
struct nfs4_fsid_present_arg args = {
|
|
|
|
.fh = NFS_FH(inode),
|
|
|
|
};
|
|
|
|
struct nfs4_fsid_present_res res = {
|
|
|
|
};
|
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_FSID_PRESENT],
|
|
|
|
.rpc_argp = &args,
|
|
|
|
.rpc_resp = &res,
|
|
|
|
.rpc_cred = cred,
|
|
|
|
};
|
|
|
|
int status;
|
|
|
|
|
|
|
|
res.fh = nfs_alloc_fhandle();
|
|
|
|
if (res.fh == NULL)
|
|
|
|
return -ENOMEM;
|
|
|
|
|
2018-05-05 03:22:50 +07:00
|
|
|
nfs4_init_sequence(&args.seq_args, &res.seq_res, 0, 1);
|
2013-10-18 01:13:30 +07:00
|
|
|
status = nfs4_call_sync_sequence(clnt, server, &msg,
|
|
|
|
&args.seq_args, &res.seq_res);
|
|
|
|
nfs_free_fhandle(res.fh);
|
|
|
|
if (status == NFS4_OK &&
|
|
|
|
res.seq_res.sr_status_flags & SEQ4_STATUS_LEASE_MOVED)
|
|
|
|
status = -NFS4ERR_LEASE_MOVED;
|
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
|
|
|
#endif /* CONFIG_NFS_V4_1 */
|
|
|
|
|
|
|
|
/**
|
|
|
|
* nfs4_proc_fsid_present - Is this FSID present or absent on server?
|
|
|
|
* @inode: inode on FSID to check
|
|
|
|
* @cred: credential to use for this operation
|
|
|
|
*
|
|
|
|
* Server indicates whether the FSID is present, moved, or not
|
|
|
|
* recognized. This operation is necessary to clear a LEASE_MOVED
|
|
|
|
* condition for this client ID.
|
|
|
|
*
|
|
|
|
* Returns NFS4_OK if the FSID is present on this server,
|
|
|
|
* -NFS4ERR_MOVED if the FSID is no longer present, a negative
|
|
|
|
* NFS4ERR code if some error occurred on the server, or a
|
|
|
|
* negative errno if a local failure occurred.
|
|
|
|
*/
|
|
|
|
int nfs4_proc_fsid_present(struct inode *inode, struct rpc_cred *cred)
|
|
|
|
{
|
|
|
|
struct nfs_server *server = NFS_SERVER(inode);
|
|
|
|
struct nfs_client *clp = server->nfs_client;
|
|
|
|
const struct nfs4_mig_recovery_ops *ops =
|
|
|
|
clp->cl_mvops->mig_recovery_ops;
|
|
|
|
struct nfs4_exception exception = { };
|
|
|
|
int status;
|
|
|
|
|
|
|
|
dprintk("%s: FSID %llx:%llx on \"%s\"\n", __func__,
|
|
|
|
(unsigned long long)server->fsid.major,
|
|
|
|
(unsigned long long)server->fsid.minor,
|
|
|
|
clp->cl_hostname);
|
|
|
|
nfs_display_fhandle(NFS_FH(inode), __func__);
|
|
|
|
|
|
|
|
do {
|
|
|
|
status = ops->fsid_present(inode, cred);
|
|
|
|
if (status != -NFS4ERR_DELAY)
|
|
|
|
break;
|
|
|
|
nfs4_handle_exception(server, status, &exception);
|
|
|
|
} while (exception.retry);
|
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
2013-08-08 21:57:55 +07:00
|
|
|
/**
|
2013-09-04 02:18:49 +07:00
|
|
|
* If 'use_integrity' is true and the state managment nfs_client
|
|
|
|
* cl_rpcclient is using krb5i/p, use the integrity protected cl_rpcclient
|
|
|
|
* and the machine credential as per RFC3530bis and RFC5661 Security
|
|
|
|
* Considerations sections. Otherwise, just use the user cred with the
|
|
|
|
* filesystem's rpc_client.
|
2013-08-08 21:57:55 +07:00
|
|
|
*/
|
2013-09-04 02:18:49 +07:00
|
|
|
static int _nfs4_proc_secinfo(struct inode *dir, const struct qstr *name, struct nfs4_secinfo_flavors *flavors, bool use_integrity)
|
2011-03-25 00:12:29 +07:00
|
|
|
{
|
|
|
|
int status;
|
|
|
|
struct nfs4_secinfo_arg args = {
|
|
|
|
.dir_fh = NFS_FH(dir),
|
|
|
|
.name = name,
|
|
|
|
};
|
|
|
|
struct nfs4_secinfo_res res = {
|
|
|
|
.flavors = flavors,
|
|
|
|
};
|
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SECINFO],
|
|
|
|
.rpc_argp = &args,
|
|
|
|
.rpc_resp = &res,
|
|
|
|
};
|
2013-09-04 02:18:49 +07:00
|
|
|
struct rpc_clnt *clnt = NFS_SERVER(dir)->client;
|
2013-09-11 05:44:31 +07:00
|
|
|
struct rpc_cred *cred = NULL;
|
2013-09-04 02:18:49 +07:00
|
|
|
|
|
|
|
if (use_integrity) {
|
|
|
|
clnt = NFS_SERVER(dir)->nfs_client->cl_rpcclient;
|
2013-09-11 05:44:31 +07:00
|
|
|
cred = nfs4_get_clid_cred(NFS_SERVER(dir)->nfs_client);
|
|
|
|
msg.rpc_cred = cred;
|
2013-09-04 02:18:49 +07:00
|
|
|
}
|
2011-03-25 00:12:29 +07:00
|
|
|
|
|
|
|
dprintk("NFS call secinfo %s\n", name->name);
|
2013-08-14 03:37:35 +07:00
|
|
|
|
|
|
|
nfs4_state_protect(NFS_SERVER(dir)->nfs_client,
|
|
|
|
NFS_SP4_MACH_CRED_SECINFO, &clnt, &msg);
|
|
|
|
|
2013-09-04 02:18:49 +07:00
|
|
|
status = nfs4_call_sync(clnt, NFS_SERVER(dir), &msg, &args.seq_args,
|
|
|
|
&res.seq_res, 0);
|
2011-03-25 00:12:29 +07:00
|
|
|
dprintk("NFS reply secinfo: %d\n", status);
|
2013-09-04 02:18:49 +07:00
|
|
|
|
2013-09-11 05:44:31 +07:00
|
|
|
if (cred)
|
|
|
|
put_rpccred(cred);
|
2013-09-04 02:18:49 +07:00
|
|
|
|
2011-03-25 00:12:29 +07:00
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
2012-04-28 00:27:40 +07:00
|
|
|
int nfs4_proc_secinfo(struct inode *dir, const struct qstr *name,
|
|
|
|
struct nfs4_secinfo_flavors *flavors)
|
2011-03-25 00:12:29 +07:00
|
|
|
{
|
|
|
|
struct nfs4_exception exception = { };
|
|
|
|
int err;
|
|
|
|
do {
|
2013-09-04 02:18:49 +07:00
|
|
|
err = -NFS4ERR_WRONGSEC;
|
|
|
|
|
|
|
|
/* try to use integrity protection with machine cred */
|
|
|
|
if (_nfs4_is_integrity_protected(NFS_SERVER(dir)->nfs_client))
|
|
|
|
err = _nfs4_proc_secinfo(dir, name, flavors, true);
|
|
|
|
|
|
|
|
/*
|
|
|
|
* if unable to use integrity protection, or SECINFO with
|
|
|
|
* integrity protection returns NFS4ERR_WRONGSEC (which is
|
|
|
|
* disallowed by spec, but exists in deployed servers) use
|
|
|
|
* the current filesystem's rpc_client and the user cred.
|
|
|
|
*/
|
|
|
|
if (err == -NFS4ERR_WRONGSEC)
|
|
|
|
err = _nfs4_proc_secinfo(dir, name, flavors, false);
|
|
|
|
|
2013-08-13 03:45:55 +07:00
|
|
|
trace_nfs4_secinfo(dir, name, err);
|
|
|
|
err = nfs4_handle_exception(NFS_SERVER(dir), err,
|
2011-03-25 00:12:29 +07:00
|
|
|
&exception);
|
|
|
|
} while (exception.retry);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
2009-04-01 20:21:53 +07:00
|
|
|
#ifdef CONFIG_NFS_V4_1
|
2010-12-14 22:11:57 +07:00
|
|
|
/*
|
|
|
|
* Check the exchange flags returned by the server for invalid flags, having
|
|
|
|
* both PNFS and NON_PNFS flags set, and not having one of NON_PNFS, PNFS, or
|
|
|
|
* DS flags set.
|
|
|
|
*/
|
|
|
|
static int nfs4_check_cl_exchange_flags(u32 flags)
|
|
|
|
{
|
|
|
|
if (flags & ~EXCHGID4_FLAG_MASK_R)
|
|
|
|
goto out_inval;
|
|
|
|
if ((flags & EXCHGID4_FLAG_USE_PNFS_MDS) &&
|
|
|
|
(flags & EXCHGID4_FLAG_USE_NON_PNFS))
|
|
|
|
goto out_inval;
|
|
|
|
if (!(flags & (EXCHGID4_FLAG_MASK_PNFS)))
|
|
|
|
goto out_inval;
|
|
|
|
return NFS_OK;
|
|
|
|
out_inval:
|
|
|
|
return -NFS4ERR_INVAL;
|
|
|
|
}
|
|
|
|
|
2011-06-01 06:05:47 +07:00
|
|
|
static bool
|
2012-05-22 09:44:31 +07:00
|
|
|
nfs41_same_server_scope(struct nfs41_server_scope *a,
|
|
|
|
struct nfs41_server_scope *b)
|
2011-06-01 06:05:47 +07:00
|
|
|
{
|
2017-01-12 04:51:59 +07:00
|
|
|
if (a->server_scope_sz != b->server_scope_sz)
|
|
|
|
return false;
|
|
|
|
return memcmp(a->server_scope, b->server_scope, a->server_scope_sz) == 0;
|
2011-06-01 06:05:47 +07:00
|
|
|
}
|
|
|
|
|
2016-02-06 04:08:37 +07:00
|
|
|
/*
 * Completion callback for BIND_CONN_TO_SESSION.  Intentionally empty:
 * the task status is examined by the code that started the task.
 */
static void
nfs4_bind_one_conn_to_session_done(struct rpc_task *task, void *calldata)
{
	/* nothing to do */
}
|
|
|
|
|
|
|
|
static const struct rpc_call_ops nfs4_bind_one_conn_to_session_ops = {
|
|
|
|
.rpc_call_done = &nfs4_bind_one_conn_to_session_done,
|
|
|
|
};
|
|
|
|
|
2012-05-25 00:22:50 +07:00
|
|
|
/*
|
2016-01-31 10:58:24 +07:00
|
|
|
* nfs4_proc_bind_one_conn_to_session()
|
2012-05-25 00:22:50 +07:00
|
|
|
*
|
|
|
|
* The 4.1 client currently uses the same TCP connection for the
|
|
|
|
* fore and backchannel.
|
|
|
|
*/
|
2016-01-31 10:58:24 +07:00
|
|
|
static
|
|
|
|
int nfs4_proc_bind_one_conn_to_session(struct rpc_clnt *clnt,
|
|
|
|
struct rpc_xprt *xprt,
|
|
|
|
struct nfs_client *clp,
|
|
|
|
struct rpc_cred *cred)
|
2012-05-25 00:22:50 +07:00
|
|
|
{
|
|
|
|
int status;
|
2015-02-19 00:27:18 +07:00
|
|
|
struct nfs41_bind_conn_to_session_args args = {
|
|
|
|
.client = clp,
|
|
|
|
.dir = NFS4_CDFC4_FORE_OR_BOTH,
|
|
|
|
};
|
2012-05-25 00:22:50 +07:00
|
|
|
struct nfs41_bind_conn_to_session_res res;
|
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc =
|
|
|
|
&nfs4_procedures[NFSPROC4_CLNT_BIND_CONN_TO_SESSION],
|
2015-02-19 00:27:18 +07:00
|
|
|
.rpc_argp = &args,
|
2012-05-25 00:22:50 +07:00
|
|
|
.rpc_resp = &res,
|
2012-05-26 04:57:41 +07:00
|
|
|
.rpc_cred = cred,
|
2012-05-25 00:22:50 +07:00
|
|
|
};
|
2016-01-31 10:58:24 +07:00
|
|
|
struct rpc_task_setup task_setup_data = {
|
|
|
|
.rpc_client = clnt,
|
|
|
|
.rpc_xprt = xprt,
|
2016-02-06 04:08:37 +07:00
|
|
|
.callback_ops = &nfs4_bind_one_conn_to_session_ops,
|
2016-01-31 10:58:24 +07:00
|
|
|
.rpc_message = &msg,
|
|
|
|
.flags = RPC_TASK_TIMEOUT,
|
|
|
|
};
|
|
|
|
struct rpc_task *task;
|
2012-05-25 00:22:50 +07:00
|
|
|
|
2015-02-19 00:27:18 +07:00
|
|
|
nfs4_copy_sessionid(&args.sessionid, &clp->cl_session->sess_id);
|
|
|
|
if (!(clp->cl_session->flags & SESSION4_BACK_CHAN))
|
|
|
|
args.dir = NFS4_CDFC4_FORE;
|
2012-05-25 00:22:50 +07:00
|
|
|
|
2016-01-31 10:58:24 +07:00
|
|
|
/* Do not set the backchannel flag unless this is clnt->cl_xprt */
|
|
|
|
if (xprt != rcu_access_pointer(clnt->cl_xprt))
|
|
|
|
args.dir = NFS4_CDFC4_FORE;
|
|
|
|
|
|
|
|
task = rpc_run_task(&task_setup_data);
|
|
|
|
if (!IS_ERR(task)) {
|
|
|
|
status = task->tk_status;
|
|
|
|
rpc_put_task(task);
|
|
|
|
} else
|
|
|
|
status = PTR_ERR(task);
|
2013-08-09 22:51:26 +07:00
|
|
|
trace_nfs4_bind_conn_to_session(clp, status);
|
2012-05-25 00:22:50 +07:00
|
|
|
if (status == 0) {
|
2015-02-19 00:27:18 +07:00
|
|
|
if (memcmp(res.sessionid.data,
|
2012-05-25 00:22:50 +07:00
|
|
|
clp->cl_session->sess_id.data, NFS4_MAX_SESSIONID_LEN)) {
|
|
|
|
dprintk("NFS: %s: Session ID mismatch\n", __func__);
|
2017-04-08 01:15:21 +07:00
|
|
|
return -EIO;
|
2012-05-25 00:22:50 +07:00
|
|
|
}
|
2015-02-19 00:27:18 +07:00
|
|
|
if ((res.dir & args.dir) != res.dir || res.dir == 0) {
|
2012-05-25 00:22:50 +07:00
|
|
|
dprintk("NFS: %s: Unexpected direction from server\n",
|
|
|
|
__func__);
|
2017-04-08 01:15:21 +07:00
|
|
|
return -EIO;
|
2012-05-25 00:22:50 +07:00
|
|
|
}
|
2015-02-19 00:27:18 +07:00
|
|
|
if (res.use_conn_in_rdma_mode != args.use_conn_in_rdma_mode) {
|
2012-05-25 00:22:50 +07:00
|
|
|
dprintk("NFS: %s: Server returned RDMA mode = true\n",
|
|
|
|
__func__);
|
2017-04-08 01:15:21 +07:00
|
|
|
return -EIO;
|
2012-05-25 00:22:50 +07:00
|
|
|
}
|
|
|
|
}
|
2017-04-08 01:15:21 +07:00
|
|
|
|
2012-05-25 00:22:50 +07:00
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
2016-01-31 10:58:24 +07:00
|
|
|
/*
 * Context handed to nfs4_proc_bind_conn_to_session_callback() for each
 * transport visited by rpc_clnt_iterate_for_each_xprt().
 */
struct rpc_bind_conn_calldata {
	struct nfs_client *clp;		/* client forwarded to the bind call */
	struct rpc_cred *cred;		/* credential forwarded to the bind call */
};
|
|
|
|
|
|
|
|
static int
|
|
|
|
nfs4_proc_bind_conn_to_session_callback(struct rpc_clnt *clnt,
|
|
|
|
struct rpc_xprt *xprt,
|
|
|
|
void *calldata)
|
|
|
|
{
|
|
|
|
struct rpc_bind_conn_calldata *p = calldata;
|
|
|
|
|
|
|
|
return nfs4_proc_bind_one_conn_to_session(clnt, xprt, p->clp, p->cred);
|
|
|
|
}
|
|
|
|
|
|
|
|
int nfs4_proc_bind_conn_to_session(struct nfs_client *clp, struct rpc_cred *cred)
|
|
|
|
{
|
|
|
|
struct rpc_bind_conn_calldata data = {
|
|
|
|
.clp = clp,
|
|
|
|
.cred = cred,
|
|
|
|
};
|
|
|
|
return rpc_clnt_iterate_for_each_xprt(clp->cl_rpcclient,
|
|
|
|
nfs4_proc_bind_conn_to_session_callback, &data);
|
|
|
|
}
|
|
|
|
|
2009-04-01 20:22:29 +07:00
|
|
|
/*
|
2013-08-14 03:37:34 +07:00
|
|
|
* Minimum set of SP4_MACH_CRED operations from RFC 5661 in the enforce map
|
|
|
|
* and operations we'd like to see to enable certain features in the allow map
|
2013-08-14 03:37:32 +07:00
|
|
|
*/
|
|
|
|
static const struct nfs41_state_protection nfs4_sp4_mach_cred_request = {
|
|
|
|
.how = SP4_MACH_CRED,
|
|
|
|
.enforce.u.words = {
|
|
|
|
[1] = 1 << (OP_BIND_CONN_TO_SESSION - 32) |
|
|
|
|
1 << (OP_EXCHANGE_ID - 32) |
|
|
|
|
1 << (OP_CREATE_SESSION - 32) |
|
|
|
|
1 << (OP_DESTROY_SESSION - 32) |
|
|
|
|
1 << (OP_DESTROY_CLIENTID - 32)
|
2013-08-14 03:37:34 +07:00
|
|
|
},
|
|
|
|
.allow.u.words = {
|
|
|
|
[0] = 1 << (OP_CLOSE) |
|
2015-12-02 21:39:51 +07:00
|
|
|
1 << (OP_OPEN_DOWNGRADE) |
|
2013-09-11 05:44:30 +07:00
|
|
|
1 << (OP_LOCKU) |
|
2015-12-02 21:39:51 +07:00
|
|
|
1 << (OP_DELEGRETURN) |
|
2013-09-11 05:44:30 +07:00
|
|
|
1 << (OP_COMMIT),
|
2013-08-14 03:37:35 +07:00
|
|
|
[1] = 1 << (OP_SECINFO - 32) |
|
2013-08-14 03:37:36 +07:00
|
|
|
1 << (OP_SECINFO_NO_NAME - 32) |
|
2015-12-02 21:39:51 +07:00
|
|
|
1 << (OP_LAYOUTRETURN - 32) |
|
2013-08-14 03:37:36 +07:00
|
|
|
1 << (OP_TEST_STATEID - 32) |
|
2013-09-11 05:44:30 +07:00
|
|
|
1 << (OP_FREE_STATEID - 32) |
|
|
|
|
1 << (OP_WRITE - 32)
|
2013-08-14 03:37:32 +07:00
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Select the state protection mode for client `clp' given the server results
|
|
|
|
* from exchange_id in `sp'.
|
2009-04-01 20:22:29 +07:00
|
|
|
*
|
2013-08-14 03:37:32 +07:00
|
|
|
* Returns 0 on success, negative errno otherwise.
|
|
|
|
*/
|
|
|
|
static int nfs4_sp4_select_mode(struct nfs_client *clp,
|
|
|
|
struct nfs41_state_protection *sp)
|
|
|
|
{
|
|
|
|
static const u32 supported_enforce[NFS4_OP_MAP_NUM_WORDS] = {
|
|
|
|
[1] = 1 << (OP_BIND_CONN_TO_SESSION - 32) |
|
|
|
|
1 << (OP_EXCHANGE_ID - 32) |
|
|
|
|
1 << (OP_CREATE_SESSION - 32) |
|
|
|
|
1 << (OP_DESTROY_SESSION - 32) |
|
|
|
|
1 << (OP_DESTROY_CLIENTID - 32)
|
|
|
|
};
|
2017-08-01 18:32:50 +07:00
|
|
|
unsigned long flags = 0;
|
2013-08-14 03:37:32 +07:00
|
|
|
unsigned int i;
|
2017-08-01 18:32:50 +07:00
|
|
|
int ret = 0;
|
2013-08-14 03:37:32 +07:00
|
|
|
|
|
|
|
if (sp->how == SP4_MACH_CRED) {
|
|
|
|
/* Print state protect result */
|
|
|
|
dfprintk(MOUNT, "Server SP4_MACH_CRED support:\n");
|
|
|
|
for (i = 0; i <= LAST_NFS4_OP; i++) {
|
|
|
|
if (test_bit(i, sp->enforce.u.longs))
|
|
|
|
dfprintk(MOUNT, " enforce op %d\n", i);
|
|
|
|
if (test_bit(i, sp->allow.u.longs))
|
|
|
|
dfprintk(MOUNT, " allow op %d\n", i);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* make sure nothing is on enforce list that isn't supported */
|
|
|
|
for (i = 0; i < NFS4_OP_MAP_NUM_WORDS; i++) {
|
|
|
|
if (sp->enforce.u.words[i] & ~supported_enforce[i]) {
|
|
|
|
dfprintk(MOUNT, "sp4_mach_cred: disabled\n");
|
2017-08-01 18:32:50 +07:00
|
|
|
ret = -EINVAL;
|
|
|
|
goto out;
|
2013-08-14 03:37:32 +07:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Minimal mode - state operations are allowed to use machine
|
|
|
|
* credential. Note this already happens by default, so the
|
|
|
|
* client doesn't have to do anything more than the negotiation.
|
|
|
|
*
|
|
|
|
* NOTE: we don't care if EXCHANGE_ID is in the list -
|
|
|
|
* we're already using the machine cred for exchange_id
|
|
|
|
* and will never use a different cred.
|
|
|
|
*/
|
|
|
|
if (test_bit(OP_BIND_CONN_TO_SESSION, sp->enforce.u.longs) &&
|
|
|
|
test_bit(OP_CREATE_SESSION, sp->enforce.u.longs) &&
|
|
|
|
test_bit(OP_DESTROY_SESSION, sp->enforce.u.longs) &&
|
|
|
|
test_bit(OP_DESTROY_CLIENTID, sp->enforce.u.longs)) {
|
|
|
|
dfprintk(MOUNT, "sp4_mach_cred:\n");
|
|
|
|
dfprintk(MOUNT, " minimal mode enabled\n");
|
2017-08-01 18:32:50 +07:00
|
|
|
__set_bit(NFS_SP4_MACH_CRED_MINIMAL, &flags);
|
2013-08-14 03:37:32 +07:00
|
|
|
} else {
|
|
|
|
dfprintk(MOUNT, "sp4_mach_cred: disabled\n");
|
2017-08-01 18:32:50 +07:00
|
|
|
ret = -EINVAL;
|
|
|
|
goto out;
|
2013-08-14 03:37:32 +07:00
|
|
|
}
|
2013-08-14 03:37:34 +07:00
|
|
|
|
|
|
|
if (test_bit(OP_CLOSE, sp->allow.u.longs) &&
|
2015-12-02 21:39:51 +07:00
|
|
|
test_bit(OP_OPEN_DOWNGRADE, sp->allow.u.longs) &&
|
|
|
|
test_bit(OP_DELEGRETURN, sp->allow.u.longs) &&
|
2013-08-14 03:37:34 +07:00
|
|
|
test_bit(OP_LOCKU, sp->allow.u.longs)) {
|
|
|
|
dfprintk(MOUNT, " cleanup mode enabled\n");
|
2017-08-01 18:32:50 +07:00
|
|
|
__set_bit(NFS_SP4_MACH_CRED_CLEANUP, &flags);
|
2013-08-14 03:37:34 +07:00
|
|
|
}
|
2013-08-14 03:37:35 +07:00
|
|
|
|
2015-12-02 21:39:51 +07:00
|
|
|
if (test_bit(OP_LAYOUTRETURN, sp->allow.u.longs)) {
|
|
|
|
dfprintk(MOUNT, " pnfs cleanup mode enabled\n");
|
2017-08-01 18:32:50 +07:00
|
|
|
__set_bit(NFS_SP4_MACH_CRED_PNFS_CLEANUP, &flags);
|
2015-12-02 21:39:51 +07:00
|
|
|
}
|
|
|
|
|
2013-08-14 03:37:35 +07:00
|
|
|
if (test_bit(OP_SECINFO, sp->allow.u.longs) &&
|
|
|
|
test_bit(OP_SECINFO_NO_NAME, sp->allow.u.longs)) {
|
|
|
|
dfprintk(MOUNT, " secinfo mode enabled\n");
|
2017-08-01 18:32:50 +07:00
|
|
|
__set_bit(NFS_SP4_MACH_CRED_SECINFO, &flags);
|
2013-08-14 03:37:35 +07:00
|
|
|
}
|
2013-08-14 03:37:36 +07:00
|
|
|
|
|
|
|
if (test_bit(OP_TEST_STATEID, sp->allow.u.longs) &&
|
|
|
|
test_bit(OP_FREE_STATEID, sp->allow.u.longs)) {
|
|
|
|
dfprintk(MOUNT, " stateid mode enabled\n");
|
2017-08-01 18:32:50 +07:00
|
|
|
__set_bit(NFS_SP4_MACH_CRED_STATEID, &flags);
|
2013-08-14 03:37:36 +07:00
|
|
|
}
|
2013-08-14 03:37:37 +07:00
|
|
|
|
|
|
|
if (test_bit(OP_WRITE, sp->allow.u.longs)) {
|
|
|
|
dfprintk(MOUNT, " write mode enabled\n");
|
2017-08-01 18:32:50 +07:00
|
|
|
__set_bit(NFS_SP4_MACH_CRED_WRITE, &flags);
|
2013-08-14 03:37:37 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
if (test_bit(OP_COMMIT, sp->allow.u.longs)) {
|
|
|
|
dfprintk(MOUNT, " commit mode enabled\n");
|
2017-08-01 18:32:50 +07:00
|
|
|
__set_bit(NFS_SP4_MACH_CRED_COMMIT, &flags);
|
2013-08-14 03:37:37 +07:00
|
|
|
}
|
2013-08-14 03:37:32 +07:00
|
|
|
}
|
2017-08-01 18:32:50 +07:00
|
|
|
out:
|
|
|
|
clp->cl_sp4_flags = flags;
|
2013-08-14 03:37:32 +07:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2016-09-09 20:22:18 +07:00
|
|
|
struct nfs41_exchange_id_data {
|
|
|
|
struct nfs41_exchange_id_res res;
|
|
|
|
struct nfs41_exchange_id_args args;
|
|
|
|
};
|
|
|
|
|
|
|
|
static void nfs4_exchange_id_release(void *data)
|
|
|
|
{
|
|
|
|
struct nfs41_exchange_id_data *cdata =
|
|
|
|
(struct nfs41_exchange_id_data *)data;
|
|
|
|
|
2017-03-13 21:36:19 +07:00
|
|
|
nfs_put_client(cdata->args.client);
|
2016-09-09 20:22:18 +07:00
|
|
|
kfree(cdata->res.impl_id);
|
|
|
|
kfree(cdata->res.server_scope);
|
|
|
|
kfree(cdata->res.server_owner);
|
|
|
|
kfree(cdata);
|
|
|
|
}
|
|
|
|
|
|
|
|
static const struct rpc_call_ops nfs4_exchange_id_call_ops = {
|
|
|
|
.rpc_release = nfs4_exchange_id_release,
|
|
|
|
};
|
|
|
|
|
2013-08-14 03:37:32 +07:00
|
|
|
/*
|
|
|
|
* _nfs4_proc_exchange_id()
|
2012-07-12 03:30:59 +07:00
|
|
|
*
|
2013-08-14 03:37:32 +07:00
|
|
|
* Wrapper for EXCHANGE_ID operation.
|
2009-04-01 20:22:29 +07:00
|
|
|
*/
|
2017-08-01 05:38:50 +07:00
|
|
|
static struct rpc_task *
|
|
|
|
nfs4_run_exchange_id(struct nfs_client *clp, struct rpc_cred *cred,
|
2016-09-09 20:22:28 +07:00
|
|
|
u32 sp4_how, struct rpc_xprt *xprt)
|
2009-04-01 20:22:29 +07:00
|
|
|
{
|
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_EXCHANGE_ID],
|
|
|
|
.rpc_cred = cred,
|
|
|
|
};
|
2016-09-09 20:22:18 +07:00
|
|
|
struct rpc_task_setup task_setup_data = {
|
|
|
|
.rpc_client = clp->cl_rpcclient,
|
|
|
|
.callback_ops = &nfs4_exchange_id_call_ops,
|
|
|
|
.rpc_message = &msg,
|
2017-08-02 03:02:48 +07:00
|
|
|
.flags = RPC_TASK_TIMEOUT,
|
2016-09-09 20:22:18 +07:00
|
|
|
};
|
|
|
|
struct nfs41_exchange_id_data *calldata;
|
2017-04-08 01:15:22 +07:00
|
|
|
int status;
|
2016-09-09 20:22:18 +07:00
|
|
|
|
2017-10-20 16:53:38 +07:00
|
|
|
if (!refcount_inc_not_zero(&clp->cl_count))
|
2017-08-01 05:38:50 +07:00
|
|
|
return ERR_PTR(-EIO);
|
2016-09-09 20:22:18 +07:00
|
|
|
|
2017-08-01 05:38:50 +07:00
|
|
|
status = -ENOMEM;
|
2016-09-09 20:22:18 +07:00
|
|
|
calldata = kzalloc(sizeof(*calldata), GFP_NOFS);
|
2017-08-01 05:38:50 +07:00
|
|
|
if (!calldata)
|
|
|
|
goto out;
|
2009-04-01 20:22:29 +07:00
|
|
|
|
2017-08-02 03:02:47 +07:00
|
|
|
nfs4_init_boot_verifier(clp, &calldata->args.verifier);
|
2015-06-10 06:44:00 +07:00
|
|
|
|
|
|
|
status = nfs4_init_uniform_client_string(clp);
|
|
|
|
if (status)
|
2016-09-09 20:22:18 +07:00
|
|
|
goto out_calldata;
|
2015-06-10 06:43:57 +07:00
|
|
|
|
2016-09-09 20:22:18 +07:00
|
|
|
calldata->res.server_owner = kzalloc(sizeof(struct nfs41_server_owner),
|
|
|
|
GFP_NOFS);
|
|
|
|
status = -ENOMEM;
|
|
|
|
if (unlikely(calldata->res.server_owner == NULL))
|
|
|
|
goto out_calldata;
|
2011-06-01 06:05:47 +07:00
|
|
|
|
2016-09-09 20:22:18 +07:00
|
|
|
calldata->res.server_scope = kzalloc(sizeof(struct nfs41_server_scope),
|
2012-05-25 03:31:39 +07:00
|
|
|
GFP_NOFS);
|
2016-09-09 20:22:18 +07:00
|
|
|
if (unlikely(calldata->res.server_scope == NULL))
|
2012-05-22 09:46:16 +07:00
|
|
|
goto out_server_owner;
|
2011-06-01 06:05:47 +07:00
|
|
|
|
2016-09-09 20:22:18 +07:00
|
|
|
calldata->res.impl_id = kzalloc(sizeof(struct nfs41_impl_id), GFP_NOFS);
|
|
|
|
if (unlikely(calldata->res.impl_id == NULL))
|
2012-02-18 03:20:26 +07:00
|
|
|
goto out_server_scope;
|
|
|
|
|
2013-08-14 03:37:32 +07:00
|
|
|
switch (sp4_how) {
|
|
|
|
case SP4_NONE:
|
2016-09-09 20:22:18 +07:00
|
|
|
calldata->args.state_protect.how = SP4_NONE;
|
2013-08-14 03:37:32 +07:00
|
|
|
break;
|
|
|
|
|
|
|
|
case SP4_MACH_CRED:
|
2016-09-09 20:22:18 +07:00
|
|
|
calldata->args.state_protect = nfs4_sp4_mach_cred_request;
|
2013-08-14 03:37:32 +07:00
|
|
|
break;
|
|
|
|
|
|
|
|
default:
|
|
|
|
/* unsupported! */
|
|
|
|
WARN_ON_ONCE(1);
|
|
|
|
status = -EINVAL;
|
2015-07-01 10:54:53 +07:00
|
|
|
goto out_impl_id;
|
2013-08-14 03:37:32 +07:00
|
|
|
}
|
2016-09-09 20:22:28 +07:00
|
|
|
if (xprt) {
|
|
|
|
task_setup_data.rpc_xprt = xprt;
|
2017-08-02 03:02:48 +07:00
|
|
|
task_setup_data.flags |= RPC_TASK_SOFTCONN;
|
2017-08-02 03:02:47 +07:00
|
|
|
memcpy(calldata->args.verifier.data, clp->cl_confirm.data,
|
|
|
|
sizeof(calldata->args.verifier.data));
|
2016-09-09 20:22:28 +07:00
|
|
|
}
|
2016-09-09 20:22:18 +07:00
|
|
|
calldata->args.client = clp;
|
|
|
|
calldata->args.flags = EXCHGID4_FLAG_SUPP_MOVED_REFER |
|
2017-08-01 19:17:34 +07:00
|
|
|
EXCHGID4_FLAG_BIND_PRINC_STATEID;
|
|
|
|
#ifdef CONFIG_NFS_V4_1_MIGRATION
|
|
|
|
calldata->args.flags |= EXCHGID4_FLAG_SUPP_MOVED_MIGR;
|
2016-09-09 20:22:18 +07:00
|
|
|
#endif
|
|
|
|
msg.rpc_argp = &calldata->args;
|
|
|
|
msg.rpc_resp = &calldata->res;
|
|
|
|
task_setup_data.callback_data = calldata;
|
2013-08-14 03:37:32 +07:00
|
|
|
|
2017-08-01 05:38:50 +07:00
|
|
|
return rpc_run_task(&task_setup_data);
|
2016-09-09 20:22:18 +07:00
|
|
|
|
|
|
|
out_impl_id:
|
|
|
|
kfree(calldata->res.impl_id);
|
|
|
|
out_server_scope:
|
|
|
|
kfree(calldata->res.server_scope);
|
|
|
|
out_server_owner:
|
|
|
|
kfree(calldata->res.server_owner);
|
|
|
|
out_calldata:
|
|
|
|
kfree(calldata);
|
2017-08-01 05:38:50 +07:00
|
|
|
out:
|
2017-03-13 21:36:19 +07:00
|
|
|
nfs_put_client(clp);
|
2017-08-01 05:38:50 +07:00
|
|
|
return ERR_PTR(status);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* _nfs4_proc_exchange_id()
|
|
|
|
*
|
|
|
|
* Wrapper for EXCHANGE_ID operation.
|
|
|
|
*/
|
|
|
|
static int _nfs4_proc_exchange_id(struct nfs_client *clp, struct rpc_cred *cred,
|
|
|
|
u32 sp4_how)
|
|
|
|
{
|
|
|
|
struct rpc_task *task;
|
|
|
|
struct nfs41_exchange_id_args *argp;
|
|
|
|
struct nfs41_exchange_id_res *resp;
|
|
|
|
int status;
|
|
|
|
|
|
|
|
task = nfs4_run_exchange_id(clp, cred, sp4_how, NULL);
|
|
|
|
if (IS_ERR(task))
|
|
|
|
return PTR_ERR(task);
|
|
|
|
|
|
|
|
argp = task->tk_msg.rpc_argp;
|
|
|
|
resp = task->tk_msg.rpc_resp;
|
|
|
|
status = task->tk_status;
|
|
|
|
if (status != 0)
|
|
|
|
goto out;
|
|
|
|
|
|
|
|
status = nfs4_check_cl_exchange_flags(resp->flags);
|
|
|
|
if (status != 0)
|
|
|
|
goto out;
|
|
|
|
|
|
|
|
status = nfs4_sp4_select_mode(clp, &resp->state_protect);
|
|
|
|
if (status != 0)
|
|
|
|
goto out;
|
|
|
|
|
|
|
|
clp->cl_clientid = resp->clientid;
|
|
|
|
clp->cl_exchange_flags = resp->flags;
|
|
|
|
clp->cl_seqid = resp->seqid;
|
|
|
|
/* Client ID is not confirmed */
|
|
|
|
if (!(resp->flags & EXCHGID4_FLAG_CONFIRMED_R))
|
|
|
|
clear_bit(NFS4_SESSION_ESTABLISHED,
|
|
|
|
&clp->cl_session->session_state);
|
|
|
|
|
|
|
|
if (clp->cl_serverscope != NULL &&
|
|
|
|
!nfs41_same_server_scope(clp->cl_serverscope,
|
|
|
|
resp->server_scope)) {
|
|
|
|
dprintk("%s: server_scope mismatch detected\n",
|
|
|
|
__func__);
|
|
|
|
set_bit(NFS4CLNT_SERVER_SCOPE_MISMATCH, &clp->cl_state);
|
|
|
|
}
|
|
|
|
|
|
|
|
swap(clp->cl_serverowner, resp->server_owner);
|
|
|
|
swap(clp->cl_serverscope, resp->server_scope);
|
|
|
|
swap(clp->cl_implid, resp->impl_id);
|
|
|
|
|
|
|
|
/* Save the EXCHANGE_ID verifier session trunk tests */
|
|
|
|
memcpy(clp->cl_confirm.data, argp->verifier.data,
|
|
|
|
sizeof(clp->cl_confirm.data));
|
|
|
|
out:
|
|
|
|
trace_nfs4_exchange_id(clp, status);
|
|
|
|
rpc_put_task(task);
|
|
|
|
return status;
|
2009-04-01 20:22:29 +07:00
|
|
|
}
|
|
|
|
|
2013-08-14 03:37:32 +07:00
|
|
|
/*
|
|
|
|
* nfs4_proc_exchange_id()
|
|
|
|
*
|
|
|
|
* Returns zero, a negative errno, or a negative NFS4ERR status code.
|
|
|
|
*
|
|
|
|
* Since the clientid has expired, all compounds using sessions
|
|
|
|
* associated with the stale clientid will be returning
|
|
|
|
* NFS4ERR_BADSESSION in the sequence operation, and will therefore
|
|
|
|
* be in some phase of session reset.
|
|
|
|
*
|
|
|
|
* Will attempt to negotiate SP4_MACH_CRED if krb5i / krb5p auth is used.
|
|
|
|
*/
|
|
|
|
int nfs4_proc_exchange_id(struct nfs_client *clp, struct rpc_cred *cred)
|
|
|
|
{
|
|
|
|
rpc_authflavor_t authflavor = clp->cl_rpcclient->cl_auth->au_flavor;
|
|
|
|
int status;
|
|
|
|
|
|
|
|
/* try SP4_MACH_CRED if krb5i/p */
|
|
|
|
if (authflavor == RPC_AUTH_GSS_KRB5I ||
|
|
|
|
authflavor == RPC_AUTH_GSS_KRB5P) {
|
2017-08-01 05:38:50 +07:00
|
|
|
status = _nfs4_proc_exchange_id(clp, cred, SP4_MACH_CRED);
|
2013-08-14 03:37:32 +07:00
|
|
|
if (!status)
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* try SP4_NONE */
|
2017-08-01 05:38:50 +07:00
|
|
|
return _nfs4_proc_exchange_id(clp, cred, SP4_NONE);
|
2013-08-14 03:37:32 +07:00
|
|
|
}
|
|
|
|
|
2016-09-09 20:22:29 +07:00
|
|
|
/**
|
|
|
|
* nfs4_test_session_trunk
|
|
|
|
*
|
|
|
|
* This is an add_xprt_test() test function called from
|
|
|
|
* rpc_clnt_setup_test_and_add_xprt.
|
|
|
|
*
|
|
|
|
* The rpc_xprt_switch is referrenced by rpc_clnt_setup_test_and_add_xprt
|
|
|
|
* and is dereferrenced in nfs4_exchange_id_release
|
|
|
|
*
|
|
|
|
* Upon success, add the new transport to the rpc_clnt
|
|
|
|
*
|
|
|
|
* @clnt: struct rpc_clnt to get new transport
|
|
|
|
* @xprt: the rpc_xprt to test
|
|
|
|
* @data: call data for _nfs4_proc_exchange_id.
|
|
|
|
*/
|
|
|
|
int nfs4_test_session_trunk(struct rpc_clnt *clnt, struct rpc_xprt *xprt,
|
|
|
|
void *data)
|
|
|
|
{
|
|
|
|
struct nfs4_add_xprt_data *adata = (struct nfs4_add_xprt_data *)data;
|
2017-08-01 05:38:50 +07:00
|
|
|
struct rpc_task *task;
|
|
|
|
int status;
|
|
|
|
|
2016-09-09 20:22:29 +07:00
|
|
|
u32 sp4_how;
|
|
|
|
|
|
|
|
dprintk("--> %s try %s\n", __func__,
|
|
|
|
xprt->address_strings[RPC_DISPLAY_ADDR]);
|
|
|
|
|
|
|
|
sp4_how = (adata->clp->cl_sp4_flags == 0 ? SP4_NONE : SP4_MACH_CRED);
|
|
|
|
|
|
|
|
/* Test connection for session trunking. Async exchange_id call */
|
2017-08-01 05:38:50 +07:00
|
|
|
task = nfs4_run_exchange_id(adata->clp, adata->cred, sp4_how, xprt);
|
|
|
|
if (IS_ERR(task))
|
|
|
|
return PTR_ERR(task);
|
|
|
|
|
|
|
|
status = task->tk_status;
|
|
|
|
if (status == 0)
|
|
|
|
status = nfs4_detect_session_trunking(adata->clp,
|
|
|
|
task->tk_msg.rpc_resp, xprt);
|
|
|
|
|
|
|
|
rpc_put_task(task);
|
|
|
|
return status;
|
2013-08-14 03:37:32 +07:00
|
|
|
}
|
2016-09-09 20:22:29 +07:00
|
|
|
EXPORT_SYMBOL_GPL(nfs4_test_session_trunk);
|
2013-08-14 03:37:32 +07:00
|
|
|
|
2012-05-26 04:18:09 +07:00
|
|
|
static int _nfs4_proc_destroy_clientid(struct nfs_client *clp,
|
|
|
|
struct rpc_cred *cred)
|
|
|
|
{
|
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_DESTROY_CLIENTID],
|
|
|
|
.rpc_argp = clp,
|
|
|
|
.rpc_cred = cred,
|
|
|
|
};
|
|
|
|
int status;
|
|
|
|
|
|
|
|
status = rpc_call_sync(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
|
2013-08-09 22:51:26 +07:00
|
|
|
trace_nfs4_destroy_clientid(clp, status);
|
2012-05-26 04:18:09 +07:00
|
|
|
if (status)
|
2012-06-08 00:45:53 +07:00
|
|
|
dprintk("NFS: Got error %d from the server %s on "
|
2012-05-26 04:18:09 +07:00
|
|
|
"DESTROY_CLIENTID.", status, clp->cl_hostname);
|
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int nfs4_proc_destroy_clientid(struct nfs_client *clp,
|
|
|
|
struct rpc_cred *cred)
|
|
|
|
{
|
|
|
|
unsigned int loop;
|
|
|
|
int ret;
|
|
|
|
|
|
|
|
for (loop = NFS4_MAX_LOOP_ON_RECOVER; loop != 0; loop--) {
|
|
|
|
ret = _nfs4_proc_destroy_clientid(clp, cred);
|
|
|
|
switch (ret) {
|
|
|
|
case -NFS4ERR_DELAY:
|
|
|
|
case -NFS4ERR_CLIENTID_BUSY:
|
|
|
|
ssleep(1);
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
int nfs4_destroy_clientid(struct nfs_client *clp)
|
|
|
|
{
|
|
|
|
struct rpc_cred *cred;
|
|
|
|
int ret = 0;
|
|
|
|
|
|
|
|
if (clp->cl_mvops->minor_version < 1)
|
|
|
|
goto out;
|
|
|
|
if (clp->cl_exchange_flags == 0)
|
|
|
|
goto out;
|
2012-09-15 04:24:32 +07:00
|
|
|
if (clp->cl_preserve_clid)
|
|
|
|
goto out;
|
2013-07-24 23:28:37 +07:00
|
|
|
cred = nfs4_get_clid_cred(clp);
|
2012-05-26 04:18:09 +07:00
|
|
|
ret = nfs4_proc_destroy_clientid(clp, cred);
|
|
|
|
if (cred)
|
|
|
|
put_rpccred(cred);
|
|
|
|
switch (ret) {
|
|
|
|
case 0:
|
|
|
|
case -NFS4ERR_STALE_CLIENTID:
|
|
|
|
clp->cl_exchange_flags = 0;
|
|
|
|
}
|
|
|
|
out:
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2009-04-01 20:22:30 +07:00
|
|
|
/* Call data shared by the GET_LEASE_TIME prepare and done callbacks. */
struct nfs4_get_lease_time_data {
	struct nfs4_get_lease_time_args *args;	/* holds la_seq_args */
	struct nfs4_get_lease_time_res *res;	/* holds lr_seq_res */
	struct nfs_client *clp;			/* passed to nfs4_setup_sequence() */
};
|
|
|
|
|
|
|
|
static void nfs4_get_lease_time_prepare(struct rpc_task *task,
|
|
|
|
void *calldata)
|
|
|
|
{
|
|
|
|
struct nfs4_get_lease_time_data *data =
|
|
|
|
(struct nfs4_get_lease_time_data *)calldata;
|
|
|
|
|
|
|
|
dprintk("--> %s\n", __func__);
|
|
|
|
/* just setup sequence, do not trigger session recovery
|
|
|
|
since we're invoked within one */
|
2017-01-10 23:39:53 +07:00
|
|
|
nfs4_setup_sequence(data->clp,
|
2012-10-23 07:28:44 +07:00
|
|
|
&data->args->la_seq_args,
|
|
|
|
&data->res->lr_seq_res,
|
|
|
|
task);
|
2009-04-01 20:22:30 +07:00
|
|
|
dprintk("<-- %s\n", __func__);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Called from nfs4_state_manager thread for session setup, so don't recover
|
|
|
|
* from sequence operation or clientid errors.
|
|
|
|
*/
|
|
|
|
static void nfs4_get_lease_time_done(struct rpc_task *task, void *calldata)
|
|
|
|
{
|
|
|
|
struct nfs4_get_lease_time_data *data =
|
|
|
|
(struct nfs4_get_lease_time_data *)calldata;
|
|
|
|
|
|
|
|
dprintk("--> %s\n", __func__);
|
2010-08-01 01:29:06 +07:00
|
|
|
if (!nfs41_sequence_done(task, &data->res->lr_seq_res))
|
|
|
|
return;
|
2009-04-01 20:22:30 +07:00
|
|
|
switch (task->tk_status) {
|
|
|
|
case -NFS4ERR_DELAY:
|
|
|
|
case -NFS4ERR_GRACE:
|
|
|
|
dprintk("%s Retry: tk_status %d\n", __func__, task->tk_status);
|
|
|
|
rpc_delay(task, NFS4_POLL_RETRY_MIN);
|
|
|
|
task->tk_status = 0;
|
2011-05-04 00:43:03 +07:00
|
|
|
/* fall through */
|
|
|
|
case -NFS4ERR_RETRY_UNCACHED_REP:
|
2011-10-20 02:17:29 +07:00
|
|
|
rpc_restart_call_prepare(task);
|
2009-04-01 20:22:30 +07:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
dprintk("<-- %s\n", __func__);
|
|
|
|
}
|
|
|
|
|
2012-03-12 00:11:00 +07:00
|
|
|
static const struct rpc_call_ops nfs4_get_lease_time_ops = {
|
2009-04-01 20:22:30 +07:00
|
|
|
.rpc_call_prepare = nfs4_get_lease_time_prepare,
|
|
|
|
.rpc_call_done = nfs4_get_lease_time_done,
|
|
|
|
};
|
|
|
|
|
|
|
|
int nfs4_proc_get_lease_time(struct nfs_client *clp, struct nfs_fsinfo *fsinfo)
|
|
|
|
{
|
|
|
|
struct rpc_task *task;
|
|
|
|
struct nfs4_get_lease_time_args args;
|
|
|
|
struct nfs4_get_lease_time_res res = {
|
|
|
|
.lr_fsinfo = fsinfo,
|
|
|
|
};
|
|
|
|
struct nfs4_get_lease_time_data data = {
|
|
|
|
.args = &args,
|
|
|
|
.res = &res,
|
|
|
|
.clp = clp,
|
|
|
|
};
|
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_GET_LEASE_TIME],
|
|
|
|
.rpc_argp = &args,
|
|
|
|
.rpc_resp = &res,
|
|
|
|
};
|
|
|
|
struct rpc_task_setup task_setup = {
|
|
|
|
.rpc_client = clp->cl_rpcclient,
|
|
|
|
.rpc_message = &msg,
|
|
|
|
.callback_ops = &nfs4_get_lease_time_ops,
|
2011-04-25 01:29:33 +07:00
|
|
|
.callback_data = &data,
|
|
|
|
.flags = RPC_TASK_TIMEOUT,
|
2009-04-01 20:22:30 +07:00
|
|
|
};
|
|
|
|
int status;
|
|
|
|
|
2018-05-05 03:22:50 +07:00
|
|
|
nfs4_init_sequence(&args.la_seq_args, &res.lr_seq_res, 0, 1);
|
2009-04-01 20:22:30 +07:00
|
|
|
task = rpc_run_task(&task_setup);
|
|
|
|
|
|
|
|
if (IS_ERR(task))
|
2017-04-08 01:15:23 +07:00
|
|
|
return PTR_ERR(task);
|
2009-04-01 20:22:30 +07:00
|
|
|
|
2017-04-08 01:15:23 +07:00
|
|
|
status = task->tk_status;
|
|
|
|
rpc_put_task(task);
|
2009-04-01 20:22:30 +07:00
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
2009-04-01 20:22:31 +07:00
|
|
|
/*
|
|
|
|
* Initialize the values to be used by the client in CREATE_SESSION
|
|
|
|
* If nfs4_init_session set the fore channel request and response sizes,
|
|
|
|
* use them.
|
|
|
|
*
|
|
|
|
* Set the back channel max_resp_sz_cached to zero to force the client to
|
|
|
|
* always set csa_cachethis to FALSE because the current implementation
|
|
|
|
* of the back channel DRC only supports caching the CB_SEQUENCE operation.
|
|
|
|
*/
|
2016-05-03 01:40:40 +07:00
|
|
|
static void nfs4_init_channel_attrs(struct nfs41_create_session_args *args,
|
|
|
|
struct rpc_clnt *clnt)
|
2009-04-01 20:22:31 +07:00
|
|
|
{
|
2013-06-26 23:21:49 +07:00
|
|
|
unsigned int max_rqst_sz, max_resp_sz;
|
2016-05-03 01:40:40 +07:00
|
|
|
unsigned int max_bc_payload = rpc_max_bc_payload(clnt);
|
2013-06-26 23:21:49 +07:00
|
|
|
|
|
|
|
max_rqst_sz = NFS_MAX_FILE_IO_SIZE + nfs41_maxwrite_overhead;
|
|
|
|
max_resp_sz = NFS_MAX_FILE_IO_SIZE + nfs41_maxread_overhead;
|
2009-04-01 20:22:31 +07:00
|
|
|
|
|
|
|
/* Fore channel attributes */
|
2013-06-26 23:21:49 +07:00
|
|
|
args->fc_attrs.max_rqst_sz = max_rqst_sz;
|
|
|
|
args->fc_attrs.max_resp_sz = max_resp_sz;
|
2009-04-01 20:22:31 +07:00
|
|
|
args->fc_attrs.max_ops = NFS4_MAX_OPS;
|
2012-02-07 07:50:40 +07:00
|
|
|
args->fc_attrs.max_reqs = max_session_slots;
|
2009-04-01 20:22:31 +07:00
|
|
|
|
|
|
|
dprintk("%s: Fore Channel : max_rqst_sz=%u max_resp_sz=%u "
|
2009-12-18 00:06:26 +07:00
|
|
|
"max_ops=%u max_reqs=%u\n",
|
2009-04-01 20:22:31 +07:00
|
|
|
__func__,
|
|
|
|
args->fc_attrs.max_rqst_sz, args->fc_attrs.max_resp_sz,
|
2009-12-18 00:06:26 +07:00
|
|
|
args->fc_attrs.max_ops, args->fc_attrs.max_reqs);
|
2009-04-01 20:22:31 +07:00
|
|
|
|
|
|
|
/* Back channel attributes */
|
2016-05-03 01:40:40 +07:00
|
|
|
args->bc_attrs.max_rqst_sz = max_bc_payload;
|
|
|
|
args->bc_attrs.max_resp_sz = max_bc_payload;
|
2009-04-01 20:22:31 +07:00
|
|
|
args->bc_attrs.max_resp_sz_cached = 0;
|
|
|
|
args->bc_attrs.max_ops = NFS4_MAX_BACK_CHANNEL_OPS;
|
2016-08-30 07:03:52 +07:00
|
|
|
args->bc_attrs.max_reqs = min_t(unsigned short, max_session_cb_slots, 1);
|
2009-04-01 20:22:31 +07:00
|
|
|
|
|
|
|
dprintk("%s: Back Channel : max_rqst_sz=%u max_resp_sz=%u "
|
|
|
|
"max_resp_sz_cached=%u max_ops=%u max_reqs=%u\n",
|
|
|
|
__func__,
|
|
|
|
args->bc_attrs.max_rqst_sz, args->bc_attrs.max_resp_sz,
|
|
|
|
args->bc_attrs.max_resp_sz_cached, args->bc_attrs.max_ops,
|
|
|
|
args->bc_attrs.max_reqs);
|
|
|
|
}
|
|
|
|
|
2015-02-19 02:30:18 +07:00
|
|
|
static int nfs4_verify_fore_channel_attrs(struct nfs41_create_session_args *args,
|
|
|
|
struct nfs41_create_session_res *res)
|
2009-04-01 20:22:32 +07:00
|
|
|
{
|
2010-10-03 02:19:01 +07:00
|
|
|
struct nfs4_channel_attrs *sent = &args->fc_attrs;
|
2015-02-19 02:30:18 +07:00
|
|
|
struct nfs4_channel_attrs *rcvd = &res->fc_attrs;
|
2010-10-03 02:19:01 +07:00
|
|
|
|
|
|
|
if (rcvd->max_resp_sz > sent->max_resp_sz)
|
|
|
|
return -EINVAL;
|
|
|
|
/*
|
|
|
|
* Our requested max_ops is the minimum we need; we're not
|
|
|
|
* prepared to break up compounds into smaller pieces than that.
|
|
|
|
* So, no point even trying to continue if the server won't
|
|
|
|
* cooperate:
|
|
|
|
*/
|
|
|
|
if (rcvd->max_ops < sent->max_ops)
|
|
|
|
return -EINVAL;
|
|
|
|
if (rcvd->max_reqs == 0)
|
|
|
|
return -EINVAL;
|
2012-02-15 22:38:25 +07:00
|
|
|
if (rcvd->max_reqs > NFS4_MAX_SLOT_TABLE)
|
|
|
|
rcvd->max_reqs = NFS4_MAX_SLOT_TABLE;
|
2010-10-03 02:19:01 +07:00
|
|
|
return 0;
|
2009-04-01 20:22:32 +07:00
|
|
|
}
|
|
|
|
|
2015-02-19 02:30:18 +07:00
|
|
|
static int nfs4_verify_back_channel_attrs(struct nfs41_create_session_args *args,
|
|
|
|
struct nfs41_create_session_res *res)
|
2010-10-03 02:19:01 +07:00
|
|
|
{
|
|
|
|
struct nfs4_channel_attrs *sent = &args->bc_attrs;
|
2015-02-19 02:30:18 +07:00
|
|
|
struct nfs4_channel_attrs *rcvd = &res->bc_attrs;
|
2009-04-01 20:22:32 +07:00
|
|
|
|
2015-02-19 02:34:58 +07:00
|
|
|
if (!(res->flags & SESSION4_BACK_CHAN))
|
|
|
|
goto out;
|
2010-10-03 02:19:01 +07:00
|
|
|
if (rcvd->max_rqst_sz > sent->max_rqst_sz)
|
|
|
|
return -EINVAL;
|
|
|
|
if (rcvd->max_resp_sz < sent->max_resp_sz)
|
|
|
|
return -EINVAL;
|
|
|
|
if (rcvd->max_resp_sz_cached > sent->max_resp_sz_cached)
|
|
|
|
return -EINVAL;
|
2016-08-30 07:03:52 +07:00
|
|
|
if (rcvd->max_ops > sent->max_ops)
|
2010-10-03 02:19:01 +07:00
|
|
|
return -EINVAL;
|
2016-08-30 07:03:52 +07:00
|
|
|
if (rcvd->max_reqs > sent->max_reqs)
|
2010-10-03 02:19:01 +07:00
|
|
|
return -EINVAL;
|
2015-02-19 02:34:58 +07:00
|
|
|
out:
|
2010-10-03 02:19:01 +07:00
|
|
|
return 0;
|
|
|
|
}
|
2009-04-01 20:22:32 +07:00
|
|
|
|
|
|
|
/*
 * Verify the negotiated fore channel attributes and, if those pass, the
 * back channel attributes.  Returns 0 or the first failing check's error.
 */
static int nfs4_verify_channel_attrs(struct nfs41_create_session_args *args,
				     struct nfs41_create_session_res *res)
{
	int ret = nfs4_verify_fore_channel_attrs(args, res);

	if (ret == 0)
		ret = nfs4_verify_back_channel_attrs(args, res);
	return ret;
}
|
|
|
|
|
|
|
|
static void nfs4_update_session(struct nfs4_session *session,
|
|
|
|
struct nfs41_create_session_res *res)
|
|
|
|
{
|
|
|
|
nfs4_copy_sessionid(&session->sess_id, &res->sessionid);
|
2015-03-04 08:35:31 +07:00
|
|
|
/* Mark client id and session as being confirmed */
|
|
|
|
session->clp->cl_exchange_flags |= EXCHGID4_FLAG_CONFIRMED_R;
|
|
|
|
set_bit(NFS4_SESSION_ESTABLISHED, &session->session_state);
|
2015-02-19 02:30:18 +07:00
|
|
|
session->flags = res->flags;
|
|
|
|
memcpy(&session->fc_attrs, &res->fc_attrs, sizeof(session->fc_attrs));
|
2015-02-19 02:34:58 +07:00
|
|
|
if (res->flags & SESSION4_BACK_CHAN)
|
|
|
|
memcpy(&session->bc_attrs, &res->bc_attrs,
|
|
|
|
sizeof(session->bc_attrs));
|
2009-04-01 20:22:32 +07:00
|
|
|
}
|
|
|
|
|
2012-05-26 04:51:23 +07:00
|
|
|
static int _nfs4_proc_create_session(struct nfs_client *clp,
|
|
|
|
struct rpc_cred *cred)
|
2009-04-01 20:22:31 +07:00
|
|
|
{
|
|
|
|
struct nfs4_session *session = clp->cl_session;
|
|
|
|
struct nfs41_create_session_args args = {
|
|
|
|
.client = clp,
|
2015-02-19 02:30:18 +07:00
|
|
|
.clientid = clp->cl_clientid,
|
|
|
|
.seqid = clp->cl_seqid,
|
2009-04-01 20:22:31 +07:00
|
|
|
.cb_program = NFS4_CALLBACK,
|
|
|
|
};
|
2015-02-19 02:30:18 +07:00
|
|
|
struct nfs41_create_session_res res;
|
|
|
|
|
2009-04-01 20:22:31 +07:00
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_CREATE_SESSION],
|
|
|
|
.rpc_argp = &args,
|
|
|
|
.rpc_resp = &res,
|
2012-05-26 04:51:23 +07:00
|
|
|
.rpc_cred = cred,
|
2009-04-01 20:22:31 +07:00
|
|
|
};
|
|
|
|
int status;
|
|
|
|
|
2016-05-03 01:40:40 +07:00
|
|
|
nfs4_init_channel_attrs(&args, clp->cl_rpcclient);
|
2009-04-01 20:23:16 +07:00
|
|
|
args.flags = (SESSION4_PERSIST | SESSION4_BACK_CHAN);
|
2009-04-01 20:22:31 +07:00
|
|
|
|
2011-04-25 01:29:33 +07:00
|
|
|
status = rpc_call_sync(session->clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
|
2013-08-09 22:51:26 +07:00
|
|
|
trace_nfs4_create_session(clp, status);
|
2009-04-01 20:22:31 +07:00
|
|
|
|
2016-09-12 01:50:01 +07:00
|
|
|
switch (status) {
|
|
|
|
case -NFS4ERR_STALE_CLIENTID:
|
|
|
|
case -NFS4ERR_DELAY:
|
|
|
|
case -ETIMEDOUT:
|
|
|
|
case -EACCES:
|
|
|
|
case -EAGAIN:
|
|
|
|
goto out;
|
|
|
|
};
|
|
|
|
|
|
|
|
clp->cl_seqid++;
|
2012-11-20 23:13:12 +07:00
|
|
|
if (!status) {
|
2009-04-01 20:22:32 +07:00
|
|
|
/* Verify the session's negotiated channel_attrs values */
|
2015-02-19 02:30:18 +07:00
|
|
|
status = nfs4_verify_channel_attrs(&args, &res);
|
2009-04-01 20:22:31 +07:00
|
|
|
/* Increment the clientid slot sequence id */
|
2015-02-19 02:30:18 +07:00
|
|
|
if (status)
|
|
|
|
goto out;
|
|
|
|
nfs4_update_session(session, &res);
|
2009-04-01 20:22:31 +07:00
|
|
|
}
|
2015-02-19 02:30:18 +07:00
|
|
|
out:
|
2009-04-01 20:22:31 +07:00
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Issues a CREATE_SESSION operation to the server.
|
|
|
|
* It is the responsibility of the caller to verify the session is
|
|
|
|
* expired before calling this routine.
|
|
|
|
*/
|
2012-05-26 04:51:23 +07:00
|
|
|
int nfs4_proc_create_session(struct nfs_client *clp, struct rpc_cred *cred)
|
2009-04-01 20:22:31 +07:00
|
|
|
{
|
|
|
|
int status;
|
|
|
|
unsigned *ptr;
|
|
|
|
struct nfs4_session *session = clp->cl_session;
|
|
|
|
|
|
|
|
dprintk("--> %s clp=%p session=%p\n", __func__, clp, session);
|
|
|
|
|
2012-05-26 04:51:23 +07:00
|
|
|
status = _nfs4_proc_create_session(clp, cred);
|
2009-04-01 20:22:31 +07:00
|
|
|
if (status)
|
|
|
|
goto out;
|
|
|
|
|
2011-11-10 01:58:21 +07:00
|
|
|
/* Init or reset the session slot tables */
|
|
|
|
status = nfs4_setup_session_slot_tables(session);
|
|
|
|
dprintk("slot table setup returned %d\n", status);
|
2009-04-01 20:22:31 +07:00
|
|
|
if (status)
|
|
|
|
goto out;
|
|
|
|
|
|
|
|
ptr = (unsigned *)&session->sess_id.data[0];
|
|
|
|
dprintk("%s client>seqid %d sessionid %u:%u:%u:%u\n", __func__,
|
|
|
|
clp->cl_seqid, ptr[0], ptr[1], ptr[2], ptr[3]);
|
|
|
|
out:
|
|
|
|
dprintk("<-- %s\n", __func__);
|
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
2009-04-01 20:22:34 +07:00
|
|
|
/*
|
|
|
|
* Issue the over-the-wire RPC DESTROY_SESSION.
|
|
|
|
* The caller must serialize access to this routine.
|
|
|
|
*/
|
2012-05-26 04:51:23 +07:00
|
|
|
int nfs4_proc_destroy_session(struct nfs4_session *session,
|
|
|
|
struct rpc_cred *cred)
|
2009-04-01 20:22:34 +07:00
|
|
|
{
|
2012-05-26 04:51:23 +07:00
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_DESTROY_SESSION],
|
|
|
|
.rpc_argp = session,
|
|
|
|
.rpc_cred = cred,
|
|
|
|
};
|
2009-04-01 20:22:34 +07:00
|
|
|
int status = 0;
|
|
|
|
|
|
|
|
dprintk("--> nfs4_proc_destroy_session\n");
|
|
|
|
|
|
|
|
/* session is still being setup */
|
2015-03-04 08:35:31 +07:00
|
|
|
if (!test_and_clear_bit(NFS4_SESSION_ESTABLISHED, &session->session_state))
|
|
|
|
return 0;
|
2009-04-01 20:22:34 +07:00
|
|
|
|
2011-04-25 01:29:33 +07:00
|
|
|
status = rpc_call_sync(session->clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
|
2013-08-09 22:51:26 +07:00
|
|
|
trace_nfs4_destroy_session(session->clp, status);
|
2009-04-01 20:22:34 +07:00
|
|
|
|
|
|
|
if (status)
|
2012-06-05 21:08:24 +07:00
|
|
|
dprintk("NFS: Got error %d from the server on DESTROY_SESSION. "
|
2009-04-01 20:22:34 +07:00
|
|
|
"Session has been destroyed regardless...\n", status);
|
|
|
|
|
|
|
|
dprintk("<-- nfs4_proc_destroy_session\n");
|
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
2009-04-01 20:22:36 +07:00
|
|
|
/*
|
|
|
|
* Renew the cl_session lease.
|
|
|
|
*/
|
2010-06-16 20:52:25 +07:00
|
|
|
struct nfs4_sequence_data {
|
|
|
|
struct nfs_client *clp;
|
|
|
|
struct nfs4_sequence_args args;
|
|
|
|
struct nfs4_sequence_res res;
|
|
|
|
};
|
|
|
|
|
2010-02-05 18:45:04 +07:00
|
|
|
static void nfs41_sequence_release(void *data)
|
|
|
|
{
|
2010-06-16 20:52:25 +07:00
|
|
|
struct nfs4_sequence_data *calldata = data;
|
|
|
|
struct nfs_client *clp = calldata->clp;
|
2010-02-05 18:45:04 +07:00
|
|
|
|
2017-10-20 16:53:38 +07:00
|
|
|
if (refcount_read(&clp->cl_count) > 1)
|
2010-02-05 18:45:05 +07:00
|
|
|
nfs4_schedule_state_renewal(clp);
|
|
|
|
nfs_put_client(clp);
|
2010-06-16 20:52:25 +07:00
|
|
|
kfree(calldata);
|
2010-02-05 18:45:04 +07:00
|
|
|
}
|
|
|
|
|
2010-06-16 20:52:25 +07:00
|
|
|
static int nfs41_sequence_handle_errors(struct rpc_task *task, struct nfs_client *clp)
|
|
|
|
{
|
|
|
|
switch(task->tk_status) {
|
|
|
|
case -NFS4ERR_DELAY:
|
|
|
|
rpc_delay(task, NFS4_POLL_RETRY_MAX);
|
|
|
|
return -EAGAIN;
|
|
|
|
default:
|
2011-03-10 04:00:53 +07:00
|
|
|
nfs4_schedule_lease_recovery(clp);
|
2010-06-16 20:52:25 +07:00
|
|
|
}
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2010-02-05 18:45:04 +07:00
|
|
|
static void nfs41_sequence_call_done(struct rpc_task *task, void *data)
|
2009-04-01 20:22:36 +07:00
|
|
|
{
|
2010-06-16 20:52:25 +07:00
|
|
|
struct nfs4_sequence_data *calldata = data;
|
|
|
|
struct nfs_client *clp = calldata->clp;
|
2009-04-01 20:22:36 +07:00
|
|
|
|
2010-08-01 01:29:06 +07:00
|
|
|
if (!nfs41_sequence_done(task, task->tk_msg.rpc_resp))
|
|
|
|
return;
|
2009-04-01 20:22:36 +07:00
|
|
|
|
2013-08-09 22:51:26 +07:00
|
|
|
trace_nfs4_sequence(clp, task->tk_status);
|
2009-04-01 20:22:36 +07:00
|
|
|
if (task->tk_status < 0) {
|
|
|
|
dprintk("%s ERROR %d\n", __func__, task->tk_status);
|
2017-10-20 16:53:38 +07:00
|
|
|
if (refcount_read(&clp->cl_count) == 1)
|
2010-02-05 18:45:05 +07:00
|
|
|
goto out;
|
2009-04-01 20:22:36 +07:00
|
|
|
|
2010-06-16 20:52:25 +07:00
|
|
|
if (nfs41_sequence_handle_errors(task, clp) == -EAGAIN) {
|
|
|
|
rpc_restart_call_prepare(task);
|
2009-04-01 20:22:36 +07:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
dprintk("%s rpc_cred %p\n", __func__, task->tk_msg.rpc_cred);
|
2010-02-05 18:45:05 +07:00
|
|
|
out:
|
2009-04-01 20:22:36 +07:00
|
|
|
dprintk("<-- %s\n", __func__);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void nfs41_sequence_prepare(struct rpc_task *task, void *data)
|
|
|
|
{
|
2010-06-16 20:52:25 +07:00
|
|
|
struct nfs4_sequence_data *calldata = data;
|
|
|
|
struct nfs_client *clp = calldata->clp;
|
2009-04-01 20:22:36 +07:00
|
|
|
struct nfs4_sequence_args *args;
|
|
|
|
struct nfs4_sequence_res *res;
|
|
|
|
|
|
|
|
args = task->tk_msg.rpc_argp;
|
|
|
|
res = task->tk_msg.rpc_resp;
|
|
|
|
|
2017-01-10 23:39:53 +07:00
|
|
|
nfs4_setup_sequence(clp, args, res, task);
|
2009-04-01 20:22:36 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
static const struct rpc_call_ops nfs41_sequence_ops = {
|
|
|
|
.rpc_call_done = nfs41_sequence_call_done,
|
|
|
|
.rpc_call_prepare = nfs41_sequence_prepare,
|
2010-02-05 18:45:04 +07:00
|
|
|
.rpc_release = nfs41_sequence_release,
|
2009-04-01 20:22:36 +07:00
|
|
|
};
|
|
|
|
|
2012-10-30 06:02:20 +07:00
|
|
|
static struct rpc_task *_nfs41_proc_sequence(struct nfs_client *clp,
|
|
|
|
struct rpc_cred *cred,
|
2017-10-20 02:46:45 +07:00
|
|
|
struct nfs4_slot *slot,
|
2012-10-30 06:02:20 +07:00
|
|
|
bool is_privileged)
|
2009-04-01 20:22:36 +07:00
|
|
|
{
|
2010-06-16 20:52:25 +07:00
|
|
|
struct nfs4_sequence_data *calldata;
|
2009-04-01 20:22:36 +07:00
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SEQUENCE],
|
|
|
|
.rpc_cred = cred,
|
|
|
|
};
|
2010-06-16 20:52:26 +07:00
|
|
|
struct rpc_task_setup task_setup_data = {
|
|
|
|
.rpc_client = clp->cl_rpcclient,
|
|
|
|
.rpc_message = &msg,
|
2012-10-30 06:02:20 +07:00
|
|
|
.callback_ops = &nfs41_sequence_ops,
|
2013-04-09 04:50:28 +07:00
|
|
|
.flags = RPC_TASK_ASYNC | RPC_TASK_TIMEOUT,
|
2010-06-16 20:52:26 +07:00
|
|
|
};
|
2017-10-20 02:46:45 +07:00
|
|
|
struct rpc_task *ret;
|
2009-04-01 20:22:36 +07:00
|
|
|
|
2017-10-20 02:46:45 +07:00
|
|
|
ret = ERR_PTR(-EIO);
|
2017-10-20 16:53:38 +07:00
|
|
|
if (!refcount_inc_not_zero(&clp->cl_count))
|
2017-10-20 02:46:45 +07:00
|
|
|
goto out_err;
|
|
|
|
|
|
|
|
ret = ERR_PTR(-ENOMEM);
|
2010-09-24 20:17:01 +07:00
|
|
|
calldata = kzalloc(sizeof(*calldata), GFP_NOFS);
|
2017-10-20 02:46:45 +07:00
|
|
|
if (calldata == NULL)
|
|
|
|
goto out_put_clp;
|
2018-05-05 03:22:50 +07:00
|
|
|
nfs4_init_sequence(&calldata->args, &calldata->res, 0, is_privileged);
|
2017-10-20 02:46:45 +07:00
|
|
|
nfs4_sequence_attach_slot(&calldata->args, &calldata->res, slot);
|
2010-06-16 20:52:25 +07:00
|
|
|
msg.rpc_argp = &calldata->args;
|
|
|
|
msg.rpc_resp = &calldata->res;
|
|
|
|
calldata->clp = clp;
|
2010-06-16 20:52:26 +07:00
|
|
|
task_setup_data.callback_data = calldata;
|
2009-04-01 20:22:36 +07:00
|
|
|
|
2017-10-20 02:46:45 +07:00
|
|
|
ret = rpc_run_task(&task_setup_data);
|
|
|
|
if (IS_ERR(ret))
|
|
|
|
goto out_err;
|
|
|
|
return ret;
|
|
|
|
out_put_clp:
|
|
|
|
nfs_put_client(clp);
|
|
|
|
out_err:
|
|
|
|
nfs41_release_slot(slot);
|
|
|
|
return ret;
|
2010-06-16 20:52:26 +07:00
|
|
|
}
|
|
|
|
|
2011-08-25 02:07:37 +07:00
|
|
|
static int nfs41_proc_async_sequence(struct nfs_client *clp, struct rpc_cred *cred, unsigned renew_flags)
|
2010-06-16 20:52:26 +07:00
|
|
|
{
|
|
|
|
struct rpc_task *task;
|
|
|
|
int ret = 0;
|
|
|
|
|
2011-08-25 02:07:37 +07:00
|
|
|
if ((renew_flags & NFS4_RENEW_TIMEOUT) == 0)
|
NFSv4.1: Fix an NFSv4.1 state renewal regression
Commit 2f60ea6b8ced ("NFSv4: The NFSv4.0 client must send RENEW calls if it holds a delegation") set the NFS4_RENEW_TIMEOUT flag in nfs4_renew_state, and does
not put an nfs41_proc_async_sequence call, the NFSv4.1 lease renewal heartbeat
call, on the wire to renew the NFSv4.1 state if the flag was not set.
The NFS4_RENEW_TIMEOUT flag is set when "now" is after the last renewal
(cl_last_renewal) plus the lease time divided by 3. This is arbitrary and
sometimes does the following:
In normal operation, the only way a future state renewal call is put on the
wire is via a call to nfs4_schedule_state_renewal, which schedules a
nfs4_renew_state workqueue task. nfs4_renew_state determines if the
NFS4_RENEW_TIMEOUT should be set, and the calls nfs41_proc_async_sequence,
which only gets sent if the NFS4_RENEW_TIMEOUT flag is set.
Then the nfs41_proc_async_sequence rpc_release function schedules
another state remewal via nfs4_schedule_state_renewal.
Without this change we can get into a state where an application stops
accessing the NFSv4.1 share, state renewal calls stop due to the
NFS4_RENEW_TIMEOUT flag _not_ being set. The only way to recover
from this situation is with a clientid re-establishment, once the application
resumes and the server has timed out the lease and so returns
NFS4ERR_BAD_SESSION on the subsequent SEQUENCE operation.
An example application:
open, lock, write a file.
sleep for 6 * lease (could be less)
ulock, close.
In the above example with NFSv4.1 delegations enabled, without this change,
there are no OP_SEQUENCE state renewal calls during the sleep, and the
clientid is recovered due to lease expiration on the close.
This issue does not occur with NFSv4.1 delegations disabled, nor with
NFSv4.0, with or without delegations enabled.
Signed-off-by: Andy Adamson <andros@netapp.com>
Link: http://lkml.kernel.org/r/1411486536-23401-1-git-send-email-andros@netapp.com
Fixes: 2f60ea6b8ced (NFSv4: The NFSv4.0 client must send RENEW calls...)
Cc: stable@vger.kernel.org # 3.2.x
Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
2014-09-29 23:31:57 +07:00
|
|
|
return -EAGAIN;
|
2017-10-20 02:46:45 +07:00
|
|
|
task = _nfs41_proc_sequence(clp, cred, NULL, false);
|
2010-06-16 20:52:26 +07:00
|
|
|
if (IS_ERR(task))
|
|
|
|
ret = PTR_ERR(task);
|
|
|
|
else
|
2011-02-22 02:05:41 +07:00
|
|
|
rpc_put_task_async(task);
|
2010-06-16 20:52:26 +07:00
|
|
|
dprintk("<-- %s status=%d\n", __func__, ret);
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int nfs4_proc_sequence(struct nfs_client *clp, struct rpc_cred *cred)
|
|
|
|
{
|
|
|
|
struct rpc_task *task;
|
|
|
|
int ret;
|
|
|
|
|
2017-10-20 02:46:45 +07:00
|
|
|
task = _nfs41_proc_sequence(clp, cred, NULL, true);
|
2010-06-16 20:52:26 +07:00
|
|
|
if (IS_ERR(task)) {
|
|
|
|
ret = PTR_ERR(task);
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
ret = rpc_wait_for_completion_task(task);
|
2015-07-06 01:50:46 +07:00
|
|
|
if (!ret)
|
2010-06-16 20:52:26 +07:00
|
|
|
ret = task->tk_status;
|
|
|
|
rpc_put_task(task);
|
|
|
|
out:
|
|
|
|
dprintk("<-- %s status=%d\n", __func__, ret);
|
|
|
|
return ret;
|
2009-04-01 20:22:36 +07:00
|
|
|
}
|
|
|
|
|
2009-12-06 04:08:41 +07:00
|
|
|
struct nfs4_reclaim_complete_data {
|
|
|
|
struct nfs_client *clp;
|
|
|
|
struct nfs41_reclaim_complete_args arg;
|
|
|
|
struct nfs41_reclaim_complete_res res;
|
|
|
|
};
|
|
|
|
|
|
|
|
static void nfs4_reclaim_complete_prepare(struct rpc_task *task, void *data)
|
|
|
|
{
|
|
|
|
struct nfs4_reclaim_complete_data *calldata = data;
|
|
|
|
|
2017-01-10 23:39:53 +07:00
|
|
|
nfs4_setup_sequence(calldata->clp,
|
2012-10-23 07:28:44 +07:00
|
|
|
&calldata->arg.seq_args,
|
|
|
|
&calldata->res.seq_res,
|
|
|
|
task);
|
2009-12-06 04:08:41 +07:00
|
|
|
}
|
|
|
|
|
2010-06-16 20:52:25 +07:00
|
|
|
static int nfs41_reclaim_complete_handle_errors(struct rpc_task *task, struct nfs_client *clp)
|
|
|
|
{
|
|
|
|
switch(task->tk_status) {
|
|
|
|
case 0:
|
2018-03-18 19:37:03 +07:00
|
|
|
wake_up_all(&clp->cl_lock_waitq);
|
|
|
|
/* Fallthrough */
|
2010-06-16 20:52:25 +07:00
|
|
|
case -NFS4ERR_COMPLETE_ALREADY:
|
|
|
|
case -NFS4ERR_WRONG_CRED: /* What to do here? */
|
|
|
|
break;
|
|
|
|
case -NFS4ERR_DELAY:
|
|
|
|
rpc_delay(task, NFS4_POLL_RETRY_MAX);
|
2011-05-04 00:43:03 +07:00
|
|
|
/* fall through */
|
|
|
|
case -NFS4ERR_RETRY_UNCACHED_REP:
|
2010-06-16 20:52:25 +07:00
|
|
|
return -EAGAIN;
|
2017-05-05 00:44:04 +07:00
|
|
|
case -NFS4ERR_BADSESSION:
|
|
|
|
case -NFS4ERR_DEADSESSION:
|
|
|
|
case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION:
|
|
|
|
nfs4_schedule_session_recovery(clp->cl_session,
|
|
|
|
task->tk_status);
|
|
|
|
break;
|
2010-06-16 20:52:25 +07:00
|
|
|
default:
|
2011-03-10 04:00:53 +07:00
|
|
|
nfs4_schedule_lease_recovery(clp);
|
2010-06-16 20:52:25 +07:00
|
|
|
}
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2009-12-06 04:08:41 +07:00
|
|
|
static void nfs4_reclaim_complete_done(struct rpc_task *task, void *data)
|
|
|
|
{
|
|
|
|
struct nfs4_reclaim_complete_data *calldata = data;
|
|
|
|
struct nfs_client *clp = calldata->clp;
|
|
|
|
struct nfs4_sequence_res *res = &calldata->res.seq_res;
|
|
|
|
|
|
|
|
dprintk("--> %s\n", __func__);
|
2010-08-01 01:29:06 +07:00
|
|
|
if (!nfs41_sequence_done(task, res))
|
|
|
|
return;
|
2009-12-06 04:08:41 +07:00
|
|
|
|
2013-08-09 22:51:26 +07:00
|
|
|
trace_nfs4_reclaim_complete(clp, task->tk_status);
|
2010-06-16 20:52:25 +07:00
|
|
|
if (nfs41_reclaim_complete_handle_errors(task, clp) == -EAGAIN) {
|
|
|
|
rpc_restart_call_prepare(task);
|
|
|
|
return;
|
|
|
|
}
|
2009-12-06 04:08:41 +07:00
|
|
|
dprintk("<-- %s\n", __func__);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* rpc_release callback for RECLAIM_COMPLETE: free the per-call data. */
static void nfs4_free_reclaim_complete_data(void *data)
{
	kfree(data);
}
|
|
|
|
|
|
|
|
static const struct rpc_call_ops nfs4_reclaim_complete_call_ops = {
|
|
|
|
.rpc_call_prepare = nfs4_reclaim_complete_prepare,
|
|
|
|
.rpc_call_done = nfs4_reclaim_complete_done,
|
|
|
|
.rpc_release = nfs4_free_reclaim_complete_data,
|
|
|
|
};
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Issue a global reclaim complete.
|
|
|
|
*/
|
2013-05-20 22:05:17 +07:00
|
|
|
static int nfs41_proc_reclaim_complete(struct nfs_client *clp,
|
|
|
|
struct rpc_cred *cred)
|
2009-12-06 04:08:41 +07:00
|
|
|
{
|
|
|
|
struct nfs4_reclaim_complete_data *calldata;
|
|
|
|
struct rpc_task *task;
|
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_RECLAIM_COMPLETE],
|
2013-05-20 22:05:17 +07:00
|
|
|
.rpc_cred = cred,
|
2009-12-06 04:08:41 +07:00
|
|
|
};
|
|
|
|
struct rpc_task_setup task_setup_data = {
|
|
|
|
.rpc_client = clp->cl_rpcclient,
|
|
|
|
.rpc_message = &msg,
|
|
|
|
.callback_ops = &nfs4_reclaim_complete_call_ops,
|
|
|
|
.flags = RPC_TASK_ASYNC,
|
|
|
|
};
|
|
|
|
int status = -ENOMEM;
|
|
|
|
|
|
|
|
dprintk("--> %s\n", __func__);
|
2010-05-13 23:51:01 +07:00
|
|
|
calldata = kzalloc(sizeof(*calldata), GFP_NOFS);
|
2009-12-06 04:08:41 +07:00
|
|
|
if (calldata == NULL)
|
|
|
|
goto out;
|
|
|
|
calldata->clp = clp;
|
|
|
|
calldata->arg.one_fs = 0;
|
|
|
|
|
2018-05-05 03:22:50 +07:00
|
|
|
nfs4_init_sequence(&calldata->arg.seq_args, &calldata->res.seq_res, 0, 1);
|
2009-12-06 04:08:41 +07:00
|
|
|
msg.rpc_argp = &calldata->arg;
|
|
|
|
msg.rpc_resp = &calldata->res;
|
|
|
|
task_setup_data.callback_data = calldata;
|
|
|
|
task = rpc_run_task(&task_setup_data);
|
2010-04-22 16:28:39 +07:00
|
|
|
if (IS_ERR(task)) {
|
2009-12-06 04:08:41 +07:00
|
|
|
status = PTR_ERR(task);
|
2010-04-22 16:28:39 +07:00
|
|
|
goto out;
|
|
|
|
}
|
2017-01-12 03:01:43 +07:00
|
|
|
status = rpc_wait_for_completion_task(task);
|
2011-03-10 01:13:46 +07:00
|
|
|
if (status == 0)
|
|
|
|
status = task->tk_status;
|
2009-12-06 04:08:41 +07:00
|
|
|
rpc_put_task(task);
|
|
|
|
out:
|
|
|
|
dprintk("<-- %s status=%d\n", __func__, status);
|
|
|
|
return status;
|
|
|
|
}
|
2010-10-20 11:18:03 +07:00
|
|
|
|
|
|
|
static void
|
|
|
|
nfs4_layoutget_prepare(struct rpc_task *task, void *calldata)
|
|
|
|
{
|
|
|
|
struct nfs4_layoutget *lgp = calldata;
|
2011-01-06 18:36:24 +07:00
|
|
|
struct nfs_server *server = NFS_SERVER(lgp->args.inode);
|
2010-10-20 11:18:03 +07:00
|
|
|
|
|
|
|
dprintk("--> %s\n", __func__);
|
2017-01-10 23:39:53 +07:00
|
|
|
nfs4_setup_sequence(server->nfs_client, &lgp->args.seq_args,
|
pnfs: rework LAYOUTGET retry handling
There are several problems in the way a stateid is selected for a
LAYOUTGET operation:
We pick a stateid to use in the RPC prepare op, but that makes
it difficult to serialize LAYOUTGETs that use the open stateid. That
serialization is done in pnfs_update_layout, which occurs well before
the rpc_prepare operation.
Between those two events, the i_lock is dropped and reacquired.
pnfs_update_layout can find that the list has lsegs in it and not do any
serialization, but then later pnfs_choose_layoutget_stateid ends up
choosing the open stateid.
This patch changes the client to select the stateid to use in the
LAYOUTGET earlier, when we're searching for a usable layout segment.
This way we can do it all while holding the i_lock the first time, and
ensure that we serialize any LAYOUTGET call that uses a non-layout
stateid.
This also means a rework of how LAYOUTGET replies are handled, as we
must now get the latest stateid if we want to retransmit in response
to a retryable error.
Most of those errors boil down to the fact that the layout state has
changed in some fashion. Thus, what we really want to do is to re-search
for a layout when it fails with a retryable error, so that we can avoid
reissuing the RPC at all if possible.
While the LAYOUTGET RPC is async, the initiating thread always waits for
it to complete, so it's effectively synchronous anyway. Currently, when
we need to retry a LAYOUTGET because of an error, we drive that retry
via the rpc state machine.
This means that once the call has been submitted, it runs until it
completes. So, we must move the error handling for this RPC out of the
rpc_call_done operation and into the caller.
In order to handle errors like NFS4ERR_DELAY properly, we must also
pass a pointer to the sliding timeout, which is now moved to the stack
in pnfs_update_layout.
The complicating errors are -NFS4ERR_RECALLCONFLICT and
-NFS4ERR_LAYOUTTRYLATER, as those involve a timeout after which we give
up and return NULL back to the caller. So, there is some special
handling for those errors to ensure that the layers driving the retries
can handle that appropriately.
Signed-off-by: Jeff Layton <jeff.layton@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2016-05-17 23:28:47 +07:00
|
|
|
&lgp->res.seq_res, task);
|
|
|
|
dprintk("<-- %s\n", __func__);
|
2010-10-20 11:18:03 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
static void nfs4_layoutget_done(struct rpc_task *task, void *calldata)
|
|
|
|
{
|
|
|
|
struct nfs4_layoutget *lgp = calldata;
|
pnfs: rework LAYOUTGET retry handling
There are several problems in the way a stateid is selected for a
LAYOUTGET operation:
We pick a stateid to use in the RPC prepare op, but that makes
it difficult to serialize LAYOUTGETs that use the open stateid. That
serialization is done in pnfs_update_layout, which occurs well before
the rpc_prepare operation.
Between those two events, the i_lock is dropped and reacquired.
pnfs_update_layout can find that the list has lsegs in it and not do any
serialization, but then later pnfs_choose_layoutget_stateid ends up
choosing the open stateid.
This patch changes the client to select the stateid to use in the
LAYOUTGET earlier, when we're searching for a usable layout segment.
This way we can do it all while holding the i_lock the first time, and
ensure that we serialize any LAYOUTGET call that uses a non-layout
stateid.
This also means a rework of how LAYOUTGET replies are handled, as we
must now get the latest stateid if we want to retransmit in response
to a retryable error.
Most of those errors boil down to the fact that the layout state has
changed in some fashion. Thus, what we really want to do is to re-search
for a layout when it fails with a retryable error, so that we can avoid
reissuing the RPC at all if possible.
While the LAYOUTGET RPC is async, the initiating thread always waits for
it to complete, so it's effectively synchronous anyway. Currently, when
we need to retry a LAYOUTGET because of an error, we drive that retry
via the rpc state machine.
This means that once the call has been submitted, it runs until it
completes. So, we must move the error handling for this RPC out of the
rpc_call_done operation and into the caller.
In order to handle errors like NFS4ERR_DELAY properly, we must also
pass a pointer to the sliding timeout, which is now moved to the stack
in pnfs_update_layout.
The complicating errors are -NFS4ERR_RECALLCONFLICT and
-NFS4ERR_LAYOUTTRYLATER, as those involve a timeout after which we give
up and return NULL back to the caller. So, there is some special
handling for those errors to ensure that the layers driving the retries
can handle that appropriately.
Signed-off-by: Jeff Layton <jeff.layton@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2016-05-17 23:28:47 +07:00
|
|
|
|
|
|
|
dprintk("--> %s\n", __func__);
|
2016-08-28 22:50:26 +07:00
|
|
|
nfs41_sequence_process(task, &lgp->res.seq_res);
|
pnfs: rework LAYOUTGET retry handling
There are several problems in the way a stateid is selected for a
LAYOUTGET operation:
We pick a stateid to use in the RPC prepare op, but that makes
it difficult to serialize LAYOUTGETs that use the open stateid. That
serialization is done in pnfs_update_layout, which occurs well before
the rpc_prepare operation.
Between those two events, the i_lock is dropped and reacquired.
pnfs_update_layout can find that the list has lsegs in it and not do any
serialization, but then later pnfs_choose_layoutget_stateid ends up
choosing the open stateid.
This patch changes the client to select the stateid to use in the
LAYOUTGET earlier, when we're searching for a usable layout segment.
This way we can do it all while holding the i_lock the first time, and
ensure that we serialize any LAYOUTGET call that uses a non-layout
stateid.
This also means a rework of how LAYOUTGET replies are handled, as we
must now get the latest stateid if we want to retransmit in response
to a retryable error.
Most of those errors boil down to the fact that the layout state has
changed in some fashion. Thus, what we really want to do is to re-search
for a layout when it fails with a retryable error, so that we can avoid
reissuing the RPC at all if possible.
While the LAYOUTGET RPC is async, the initiating thread always waits for
it to complete, so it's effectively synchronous anyway. Currently, when
we need to retry a LAYOUTGET because of an error, we drive that retry
via the rpc state machine.
This means that once the call has been submitted, it runs until it
completes. So, we must move the error handling for this RPC out of the
rpc_call_done operation and into the caller.
In order to handle errors like NFS4ERR_DELAY properly, we must also
pass a pointer to the sliding timeout, which is now moved to the stack
in pnfs_update_layout.
The complicating errors are -NFS4ERR_RECALLCONFLICT and
-NFS4ERR_LAYOUTTRYLATER, as those involve a timeout after which we give
up and return NULL back to the caller. So, there is some special
handling for those errors to ensure that the layers driving the retries
can handle that appropriately.
Signed-off-by: Jeff Layton <jeff.layton@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2016-05-17 23:28:47 +07:00
|
|
|
dprintk("<-- %s\n", __func__);
|
|
|
|
}
|
|
|
|
|
|
|
|
static int
|
|
|
|
nfs4_layoutget_handle_exception(struct rpc_task *task,
|
|
|
|
struct nfs4_layoutget *lgp, struct nfs4_exception *exception)
|
|
|
|
{
|
2012-10-02 07:25:48 +07:00
|
|
|
struct inode *inode = lgp->args.inode;
|
|
|
|
struct nfs_server *server = NFS_SERVER(inode);
|
|
|
|
struct pnfs_layout_hdr *lo;
|
2016-07-15 05:46:24 +07:00
|
|
|
int nfs4err = task->tk_status;
|
|
|
|
int err, status = 0;
|
2016-07-15 02:14:02 +07:00
|
|
|
LIST_HEAD(head);
|
2010-10-20 11:18:03 +07:00
|
|
|
|
2014-01-23 01:34:54 +07:00
|
|
|
dprintk("--> %s tk_status => %d\n", __func__, -task->tk_status);
|
2010-10-20 11:18:03 +07:00
|
|
|
|
2016-07-15 05:46:24 +07:00
|
|
|
switch (nfs4err) {
|
2010-10-20 11:18:03 +07:00
|
|
|
case 0:
|
2012-10-02 07:25:48 +07:00
|
|
|
goto out;
|
2015-12-05 16:01:01 +07:00
|
|
|
|
|
|
|
/*
|
|
|
|
* NFS4ERR_LAYOUTUNAVAILABLE means we are not supposed to use pnfs
|
|
|
|
* on the file. set tk_status to -ENODATA to tell upper layer to
|
|
|
|
* retry go inband.
|
|
|
|
*/
|
|
|
|
case -NFS4ERR_LAYOUTUNAVAILABLE:
|
pnfs: rework LAYOUTGET retry handling
There are several problems in the way a stateid is selected for a
LAYOUTGET operation:
We pick a stateid to use in the RPC prepare op, but that makes
it difficult to serialize LAYOUTGETs that use the open stateid. That
serialization is done in pnfs_update_layout, which occurs well before
the rpc_prepare operation.
Between those two events, the i_lock is dropped and reacquired.
pnfs_update_layout can find that the list has lsegs in it and not do any
serialization, but then later pnfs_choose_layoutget_stateid ends up
choosing the open stateid.
This patch changes the client to select the stateid to use in the
LAYOUTGET earlier, when we're searching for a usable layout segment.
This way we can do it all while holding the i_lock the first time, and
ensure that we serialize any LAYOUTGET call that uses a non-layout
stateid.
This also means a rework of how LAYOUTGET replies are handled, as we
must now get the latest stateid if we want to retransmit in response
to a retryable error.
Most of those errors boil down to the fact that the layout state has
changed in some fashion. Thus, what we really want to do is to re-search
for a layout when it fails with a retryable error, so that we can avoid
reissuing the RPC at all if possible.
While the LAYOUTGET RPC is async, the initiating thread always waits for
it to complete, so it's effectively synchronous anyway. Currently, when
we need to retry a LAYOUTGET because of an error, we drive that retry
via the rpc state machine.
This means that once the call has been submitted, it runs until it
completes. So, we must move the error handling for this RPC out of the
rpc_call_done operation and into the caller.
In order to handle errors like NFS4ERR_DELAY properly, we must also
pass a pointer to the sliding timeout, which is now moved to the stack
in pnfs_update_layout.
The complicating errors are -NFS4ERR_RECALLCONFLICT and
-NFS4ERR_LAYOUTTRYLATER, as those involve a timeout after which we give
up and return NULL back to the caller. So, there is some special
handling for those errors to ensure that the layers driving the retries
can handle that appropriately.
Signed-off-by: Jeff Layton <jeff.layton@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2016-05-17 23:28:47 +07:00
|
|
|
status = -ENODATA;
|
2015-12-05 16:01:01 +07:00
|
|
|
goto out;
|
2015-08-31 15:19:22 +07:00
|
|
|
/*
|
|
|
|
* NFS4ERR_BADLAYOUT means the MDS cannot return a layout of
|
|
|
|
* length lgp->args.minlength != 0 (see RFC5661 section 18.43.3).
|
|
|
|
*/
|
|
|
|
case -NFS4ERR_BADLAYOUT:
|
pnfs: rework LAYOUTGET retry handling
There are several problems in the way a stateid is selected for a
LAYOUTGET operation:
We pick a stateid to use in the RPC prepare op, but that makes
it difficult to serialize LAYOUTGETs that use the open stateid. That
serialization is done in pnfs_update_layout, which occurs well before
the rpc_prepare operation.
Between those two events, the i_lock is dropped and reacquired.
pnfs_update_layout can find that the list has lsegs in it and not do any
serialization, but then later pnfs_choose_layoutget_stateid ends up
choosing the open stateid.
This patch changes the client to select the stateid to use in the
LAYOUTGET earlier, when we're searching for a usable layout segment.
This way we can do it all while holding the i_lock the first time, and
ensure that we serialize any LAYOUTGET call that uses a non-layout
stateid.
This also means a rework of how LAYOUTGET replies are handled, as we
must now get the latest stateid if we want to retransmit in response
to a retryable error.
Most of those errors boil down to the fact that the layout state has
changed in some fashion. Thus, what we really want to do is to re-search
for a layout when it fails with a retryable error, so that we can avoid
reissuing the RPC at all if possible.
While the LAYOUTGET RPC is async, the initiating thread always waits for
it to complete, so it's effectively synchronous anyway. Currently, when
we need to retry a LAYOUTGET because of an error, we drive that retry
via the rpc state machine.
This means that once the call has been submitted, it runs until it
completes. So, we must move the error handling for this RPC out of the
rpc_call_done operation and into the caller.
In order to handle errors like NFS4ERR_DELAY properly, we must also
pass a pointer to the sliding timeout, which is now moved to the stack
in pnfs_update_layout.
The complicating errors are -NFS4ERR_RECALLCONFLICT and
-NFS4ERR_LAYOUTTRYLATER, as those involve a timeout after which we give
up and return NULL back to the caller. So, there is some special
handling for those errors to ensure that the layers driving the retries
can handle that appropriately.
Signed-off-by: Jeff Layton <jeff.layton@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2016-05-17 23:28:47 +07:00
|
|
|
status = -EOVERFLOW;
|
|
|
|
goto out;
|
2014-01-23 01:34:54 +07:00
|
|
|
/*
|
|
|
|
* NFS4ERR_LAYOUTTRYLATER is a conflict with another client
|
2015-08-31 15:19:22 +07:00
|
|
|
* (or clients) writing to the same RAID stripe except when
|
|
|
|
* the minlength argument is 0 (see RFC5661 section 18.43.3).
|
pnfs: rework LAYOUTGET retry handling
There are several problems in the way a stateid is selected for a
LAYOUTGET operation:
We pick a stateid to use in the RPC prepare op, but that makes
it difficult to serialize LAYOUTGETs that use the open stateid. That
serialization is done in pnfs_update_layout, which occurs well before
the rpc_prepare operation.
Between those two events, the i_lock is dropped and reacquired.
pnfs_update_layout can find that the list has lsegs in it and not do any
serialization, but then later pnfs_choose_layoutget_stateid ends up
choosing the open stateid.
This patch changes the client to select the stateid to use in the
LAYOUTGET earlier, when we're searching for a usable layout segment.
This way we can do it all while holding the i_lock the first time, and
ensure that we serialize any LAYOUTGET call that uses a non-layout
stateid.
This also means a rework of how LAYOUTGET replies are handled, as we
must now get the latest stateid if we want to retransmit in response
to a retryable error.
Most of those errors boil down to the fact that the layout state has
changed in some fashion. Thus, what we really want to do is to re-search
for a layout when it fails with a retryable error, so that we can avoid
reissuing the RPC at all if possible.
While the LAYOUTGET RPC is async, the initiating thread always waits for
it to complete, so it's effectively synchronous anyway. Currently, when
we need to retry a LAYOUTGET because of an error, we drive that retry
via the rpc state machine.
This means that once the call has been submitted, it runs until it
completes. So, we must move the error handling for this RPC out of the
rpc_call_done operation and into the caller.
In order to handle errors like NFS4ERR_DELAY properly, we must also
pass a pointer to the sliding timeout, which is now moved to the stack
in pnfs_update_layout.
The complicating errors are -NFS4ERR_RECALLCONFLICT and
-NFS4ERR_LAYOUTTRYLATER, as those involve a timeout after which we give
up and return NULL back to the caller. So, there is some special
handling for those errors to ensure that the layers driving the retries
can handle that appropriately.
Signed-off-by: Jeff Layton <jeff.layton@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2016-05-17 23:28:47 +07:00
|
|
|
*
|
|
|
|
* Treat it like we would RECALLCONFLICT -- we retry for a little
|
|
|
|
* while, and then eventually give up.
|
2014-01-23 01:34:54 +07:00
|
|
|
*/
|
2010-10-20 11:18:03 +07:00
|
|
|
case -NFS4ERR_LAYOUTTRYLATER:
|
pnfs: rework LAYOUTGET retry handling
There are several problems in the way a stateid is selected for a
LAYOUTGET operation:
We pick a stateid to use in the RPC prepare op, but that makes
it difficult to serialize LAYOUTGETs that use the open stateid. That
serialization is done in pnfs_update_layout, which occurs well before
the rpc_prepare operation.
Between those two events, the i_lock is dropped and reacquired.
pnfs_update_layout can find that the list has lsegs in it and not do any
serialization, but then later pnfs_choose_layoutget_stateid ends up
choosing the open stateid.
This patch changes the client to select the stateid to use in the
LAYOUTGET earlier, when we're searching for a usable layout segment.
This way we can do it all while holding the i_lock the first time, and
ensure that we serialize any LAYOUTGET call that uses a non-layout
stateid.
This also means a rework of how LAYOUTGET replies are handled, as we
must now get the latest stateid if we want to retransmit in response
to a retryable error.
Most of those errors boil down to the fact that the layout state has
changed in some fashion. Thus, what we really want to do is to re-search
for a layout when it fails with a retryable error, so that we can avoid
reissuing the RPC at all if possible.
While the LAYOUTGET RPC is async, the initiating thread always waits for
it to complete, so it's effectively synchronous anyway. Currently, when
we need to retry a LAYOUTGET because of an error, we drive that retry
via the rpc state machine.
This means that once the call has been submitted, it runs until it
completes. So, we must move the error handling for this RPC out of the
rpc_call_done operation and into the caller.
In order to handle errors like NFS4ERR_DELAY properly, we must also
pass a pointer to the sliding timeout, which is now moved to the stack
in pnfs_update_layout.
The complicating errors are -NFS4ERR_RECALLCONFLICT and
-NFS4ERR_LAYOUTTRYLATER, as those involve a timeout after which we give
up and return NULL back to the caller. So, there is some special
handling for those errors to ensure that the layers driving the retries
can handle that appropriately.
Signed-off-by: Jeff Layton <jeff.layton@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2016-05-17 23:28:47 +07:00
|
|
|
if (lgp->args.minlength == 0) {
|
|
|
|
status = -EOVERFLOW;
|
|
|
|
goto out;
|
2014-01-23 01:34:54 +07:00
|
|
|
}
|
2016-07-15 05:46:24 +07:00
|
|
|
status = -EBUSY;
|
|
|
|
break;
|
pnfs: rework LAYOUTGET retry handling
There are several problems in the way a stateid is selected for a
LAYOUTGET operation:
We pick a stateid to use in the RPC prepare op, but that makes
it difficult to serialize LAYOUTGETs that use the open stateid. That
serialization is done in pnfs_update_layout, which occurs well before
the rpc_prepare operation.
Between those two events, the i_lock is dropped and reacquired.
pnfs_update_layout can find that the list has lsegs in it and not do any
serialization, but then later pnfs_choose_layoutget_stateid ends up
choosing the open stateid.
This patch changes the client to select the stateid to use in the
LAYOUTGET earlier, when we're searching for a usable layout segment.
This way we can do it all while holding the i_lock the first time, and
ensure that we serialize any LAYOUTGET call that uses a non-layout
stateid.
This also means a rework of how LAYOUTGET replies are handled, as we
must now get the latest stateid if we want to retransmit in response
to a retryable error.
Most of those errors boil down to the fact that the layout state has
changed in some fashion. Thus, what we really want to do is to re-search
for a layout when it fails with a retryable error, so that we can avoid
reissuing the RPC at all if possible.
While the LAYOUTGET RPC is async, the initiating thread always waits for
it to complete, so it's effectively synchronous anyway. Currently, when
we need to retry a LAYOUTGET because of an error, we drive that retry
via the rpc state machine.
This means that once the call has been submitted, it runs until it
completes. So, we must move the error handling for this RPC out of the
rpc_call_done operation and into the caller.
In order to handle errors like NFS4ERR_DELAY properly, we must also
pass a pointer to the sliding timeout, which is now moved to the stack
in pnfs_update_layout.
The complicating errors are -NFS4ERR_RECALLCONFLICT and
-NFS4ERR_LAYOUTTRYLATER, as those involve a timeout after which we give
up and return NULL back to the caller. So, there is some special
handling for those errors to ensure that the layers driving the retries
can handle that appropriately.
Signed-off-by: Jeff Layton <jeff.layton@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2016-05-17 23:28:47 +07:00
|
|
|
case -NFS4ERR_RECALLCONFLICT:
|
|
|
|
status = -ERECALLCONFLICT;
|
2016-07-15 05:46:24 +07:00
|
|
|
break;
|
2016-09-23 00:39:10 +07:00
|
|
|
case -NFS4ERR_DELEG_REVOKED:
|
|
|
|
case -NFS4ERR_ADMIN_REVOKED:
|
2012-10-02 07:25:48 +07:00
|
|
|
case -NFS4ERR_EXPIRED:
|
|
|
|
case -NFS4ERR_BAD_STATEID:
|
pnfs: rework LAYOUTGET retry handling
There are several problems in the way a stateid is selected for a
LAYOUTGET operation:
We pick a stateid to use in the RPC prepare op, but that makes
it difficult to serialize LAYOUTGETs that use the open stateid. That
serialization is done in pnfs_update_layout, which occurs well before
the rpc_prepare operation.
Between those two events, the i_lock is dropped and reacquired.
pnfs_update_layout can find that the list has lsegs in it and not do any
serialization, but then later pnfs_choose_layoutget_stateid ends up
choosing the open stateid.
This patch changes the client to select the stateid to use in the
LAYOUTGET earlier, when we're searching for a usable layout segment.
This way we can do it all while holding the i_lock the first time, and
ensure that we serialize any LAYOUTGET call that uses a non-layout
stateid.
This also means a rework of how LAYOUTGET replies are handled, as we
must now get the latest stateid if we want to retransmit in response
to a retryable error.
Most of those errors boil down to the fact that the layout state has
changed in some fashion. Thus, what we really want to do is to re-search
for a layout when it fails with a retryable error, so that we can avoid
reissuing the RPC at all if possible.
While the LAYOUTGET RPC is async, the initiating thread always waits for
it to complete, so it's effectively synchronous anyway. Currently, when
we need to retry a LAYOUTGET because of an error, we drive that retry
via the rpc state machine.
This means that once the call has been submitted, it runs until it
completes. So, we must move the error handling for this RPC out of the
rpc_call_done operation and into the caller.
In order to handle errors like NFS4ERR_DELAY properly, we must also
pass a pointer to the sliding timeout, which is now moved to the stack
in pnfs_update_layout.
The complicating errors are -NFS4ERR_RECALLCONFLICT and
-NFS4ERR_LAYOUTTRYLATER, as those involve a timeout after which we give
up and return NULL back to the caller. So, there is some special
handling for those errors to ensure that the layers driving the retries
can handle that appropriately.
Signed-off-by: Jeff Layton <jeff.layton@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2016-05-17 23:28:47 +07:00
|
|
|
exception->timeout = 0;
|
2012-10-02 07:25:48 +07:00
|
|
|
spin_lock(&inode->i_lock);
|
2016-07-15 02:14:02 +07:00
|
|
|
lo = NFS_I(inode)->layout;
|
|
|
|
/* If the open stateid was bad, then recover it. */
|
|
|
|
if (!lo || test_bit(NFS_LAYOUT_INVALID_STID, &lo->plh_flags) ||
|
2017-10-05 00:49:12 +07:00
|
|
|
!nfs4_stateid_match_other(&lgp->args.stateid, &lo->plh_stateid)) {
|
2012-10-02 07:25:48 +07:00
|
|
|
spin_unlock(&inode->i_lock);
|
pnfs: rework LAYOUTGET retry handling
There are several problems in the way a stateid is selected for a
LAYOUTGET operation:
We pick a stateid to use in the RPC prepare op, but that makes
it difficult to serialize LAYOUTGETs that use the open stateid. That
serialization is done in pnfs_update_layout, which occurs well before
the rpc_prepare operation.
Between those two events, the i_lock is dropped and reacquired.
pnfs_update_layout can find that the list has lsegs in it and not do any
serialization, but then later pnfs_choose_layoutget_stateid ends up
choosing the open stateid.
This patch changes the client to select the stateid to use in the
LAYOUTGET earlier, when we're searching for a usable layout segment.
This way we can do it all while holding the i_lock the first time, and
ensure that we serialize any LAYOUTGET call that uses a non-layout
stateid.
This also means a rework of how LAYOUTGET replies are handled, as we
must now get the latest stateid if we want to retransmit in response
to a retryable error.
Most of those errors boil down to the fact that the layout state has
changed in some fashion. Thus, what we really want to do is to re-search
for a layout when it fails with a retryable error, so that we can avoid
reissuing the RPC at all if possible.
While the LAYOUTGET RPC is async, the initiating thread always waits for
it to complete, so it's effectively synchronous anyway. Currently, when
we need to retry a LAYOUTGET because of an error, we drive that retry
via the rpc state machine.
This means that once the call has been submitted, it runs until it
completes. So, we must move the error handling for this RPC out of the
rpc_call_done operation and into the caller.
In order to handle errors like NFS4ERR_DELAY properly, we must also
pass a pointer to the sliding timeout, which is now moved to the stack
in pnfs_update_layout.
The complicating errors are -NFS4ERR_RECALLCONFLICT and
-NFS4ERR_LAYOUTTRYLATER, as those involve a timeout after which we give
up and return NULL back to the caller. So, there is some special
handling for those errors to ensure that the layers driving the retries
can handle that appropriately.
Signed-off-by: Jeff Layton <jeff.layton@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2016-05-17 23:28:47 +07:00
|
|
|
exception->state = lgp->args.ctx->state;
|
2016-09-23 00:39:10 +07:00
|
|
|
exception->stateid = &lgp->args.stateid;
|
2015-09-21 00:30:30 +07:00
|
|
|
break;
|
|
|
|
}
|
2016-07-15 02:14:02 +07:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Mark the bad layout state as invalid, then retry
|
|
|
|
*/
|
2016-07-25 04:08:59 +07:00
|
|
|
pnfs_mark_layout_stateid_invalid(lo, &head);
|
2016-07-15 02:14:02 +07:00
|
|
|
spin_unlock(&inode->i_lock);
|
2017-04-29 21:10:17 +07:00
|
|
|
nfs_commit_inode(inode, 0);
|
2016-07-15 02:14:02 +07:00
|
|
|
pnfs_free_lseg_list(&head);
|
|
|
|
status = -EAGAIN;
|
|
|
|
goto out;
|
2010-10-20 11:18:03 +07:00
|
|
|
}
|
pnfs: rework LAYOUTGET retry handling
There are several problems in the way a stateid is selected for a
LAYOUTGET operation:
We pick a stateid to use in the RPC prepare op, but that makes
it difficult to serialize LAYOUTGETs that use the open stateid. That
serialization is done in pnfs_update_layout, which occurs well before
the rpc_prepare operation.
Between those two events, the i_lock is dropped and reacquired.
pnfs_update_layout can find that the list has lsegs in it and not do any
serialization, but then later pnfs_choose_layoutget_stateid ends up
choosing the open stateid.
This patch changes the client to select the stateid to use in the
LAYOUTGET earlier, when we're searching for a usable layout segment.
This way we can do it all while holding the i_lock the first time, and
ensure that we serialize any LAYOUTGET call that uses a non-layout
stateid.
This also means a rework of how LAYOUTGET replies are handled, as we
must now get the latest stateid if we want to retransmit in response
to a retryable error.
Most of those errors boil down to the fact that the layout state has
changed in some fashion. Thus, what we really want to do is to re-search
for a layout when it fails with a retryable error, so that we can avoid
reissuing the RPC at all if possible.
While the LAYOUTGET RPC is async, the initiating thread always waits for
it to complete, so it's effectively synchronous anyway. Currently, when
we need to retry a LAYOUTGET because of an error, we drive that retry
via the rpc state machine.
This means that once the call has been submitted, it runs until it
completes. So, we must move the error handling for this RPC out of the
rpc_call_done operation and into the caller.
In order to handle errors like NFS4ERR_DELAY properly, we must also
pass a pointer to the sliding timeout, which is now moved to the stack
in pnfs_update_layout.
The complicating errors are -NFS4ERR_RECALLCONFLICT and
-NFS4ERR_LAYOUTTRYLATER, as those involve a timeout after which we give
up and return NULL back to the caller. So, there is some special
handling for those errors to ensure that the layers driving the retries
can handle that appropriately.
Signed-off-by: Jeff Layton <jeff.layton@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2016-05-17 23:28:47 +07:00
|
|
|
|
2017-01-24 10:44:12 +07:00
|
|
|
nfs4_sequence_free_slot(&lgp->res.seq_res);
|
2016-07-15 05:46:24 +07:00
|
|
|
err = nfs4_handle_exception(server, nfs4err, exception);
|
|
|
|
if (!status) {
|
|
|
|
if (exception->retry)
|
|
|
|
status = -EAGAIN;
|
|
|
|
else
|
|
|
|
status = err;
|
|
|
|
}
|
2012-10-02 07:25:48 +07:00
|
|
|
out:
|
2010-10-20 11:18:03 +07:00
|
|
|
dprintk("<-- %s\n", __func__);
|
pnfs: rework LAYOUTGET retry handling
There are several problems in the way a stateid is selected for a
LAYOUTGET operation:
We pick a stateid to use in the RPC prepare op, but that makes
it difficult to serialize LAYOUTGETs that use the open stateid. That
serialization is done in pnfs_update_layout, which occurs well before
the rpc_prepare operation.
Between those two events, the i_lock is dropped and reacquired.
pnfs_update_layout can find that the list has lsegs in it and not do any
serialization, but then later pnfs_choose_layoutget_stateid ends up
choosing the open stateid.
This patch changes the client to select the stateid to use in the
LAYOUTGET earlier, when we're searching for a usable layout segment.
This way we can do it all while holding the i_lock the first time, and
ensure that we serialize any LAYOUTGET call that uses a non-layout
stateid.
This also means a rework of how LAYOUTGET replies are handled, as we
must now get the latest stateid if we want to retransmit in response
to a retryable error.
Most of those errors boil down to the fact that the layout state has
changed in some fashion. Thus, what we really want to do is to re-search
for a layout when it fails with a retryable error, so that we can avoid
reissuing the RPC at all if possible.
While the LAYOUTGET RPC is async, the initiating thread always waits for
it to complete, so it's effectively synchronous anyway. Currently, when
we need to retry a LAYOUTGET because of an error, we drive that retry
via the rpc state machine.
This means that once the call has been submitted, it runs until it
completes. So, we must move the error handling for this RPC out of the
rpc_call_done operation and into the caller.
In order to handle errors like NFS4ERR_DELAY properly, we must also
pass a pointer to the sliding timeout, which is now moved to the stack
in pnfs_update_layout.
The complicating errors are -NFS4ERR_RECALLCONFLICT and
-NFS4ERR_LAYOUTTRYLATER, as those involve a timeout after which we give
up and return NULL back to the caller. So, there is some special
handling for those errors to ensure that the layers driving the retries
can handle that appropriately.
Signed-off-by: Jeff Layton <jeff.layton@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2016-05-17 23:28:47 +07:00
|
|
|
return status;
|
2010-10-20 11:18:03 +07:00
|
|
|
}
|
|
|
|
|
2016-09-20 04:47:09 +07:00
|
|
|
size_t max_response_pages(struct nfs_server *server)
|
2012-08-02 15:47:10 +07:00
|
|
|
{
|
|
|
|
u32 max_resp_sz = server->nfs_client->cl_session->fc_attrs.max_resp_sz;
|
|
|
|
return nfs_page_array_len(0, max_resp_sz);
|
|
|
|
}
|
|
|
|
|
2010-10-20 11:18:03 +07:00
|
|
|
static void nfs4_layoutget_release(void *calldata)
|
|
|
|
{
|
|
|
|
struct nfs4_layoutget *lgp = calldata;
|
|
|
|
|
|
|
|
dprintk("--> %s\n", __func__);
|
2017-06-28 04:33:38 +07:00
|
|
|
nfs4_sequence_free_slot(&lgp->res.seq_res);
|
2018-05-31 04:16:20 +07:00
|
|
|
pnfs_layoutget_free(lgp);
|
2010-10-20 11:18:03 +07:00
|
|
|
dprintk("<-- %s\n", __func__);
|
|
|
|
}
|
|
|
|
|
|
|
|
static const struct rpc_call_ops nfs4_layoutget_call_ops = {
|
|
|
|
.rpc_call_prepare = nfs4_layoutget_prepare,
|
|
|
|
.rpc_call_done = nfs4_layoutget_done,
|
|
|
|
.rpc_release = nfs4_layoutget_release,
|
|
|
|
};
|
|
|
|
|
2012-09-18 04:12:15 +07:00
|
|
|
struct pnfs_layout_segment *
|
2016-09-20 04:47:09 +07:00
|
|
|
nfs4_proc_layoutget(struct nfs4_layoutget *lgp, long *timeout)
|
2010-10-20 11:18:03 +07:00
|
|
|
{
|
2013-02-26 09:27:33 +07:00
|
|
|
struct inode *inode = lgp->args.inode;
|
|
|
|
struct nfs_server *server = NFS_SERVER(inode);
|
2010-10-20 11:18:03 +07:00
|
|
|
struct rpc_task *task;
|
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LAYOUTGET],
|
|
|
|
.rpc_argp = &lgp->args,
|
|
|
|
.rpc_resp = &lgp->res,
|
2013-05-20 21:49:34 +07:00
|
|
|
.rpc_cred = lgp->cred,
|
2010-10-20 11:18:03 +07:00
|
|
|
};
|
|
|
|
struct rpc_task_setup task_setup_data = {
|
|
|
|
.rpc_client = server->client,
|
|
|
|
.rpc_message = &msg,
|
|
|
|
.callback_ops = &nfs4_layoutget_call_ops,
|
|
|
|
.callback_data = lgp,
|
|
|
|
.flags = RPC_TASK_ASYNC,
|
|
|
|
};
|
2012-09-18 04:12:15 +07:00
|
|
|
struct pnfs_layout_segment *lseg = NULL;
|
2016-06-18 03:48:18 +07:00
|
|
|
struct nfs4_exception exception = {
|
|
|
|
.inode = inode,
|
|
|
|
.timeout = *timeout,
|
|
|
|
};
|
2010-10-20 11:18:03 +07:00
|
|
|
int status = 0;
|
|
|
|
|
|
|
|
dprintk("--> %s\n", __func__);
|
|
|
|
|
2014-11-17 10:05:17 +07:00
|
|
|
/* nfs4_layoutget_release calls pnfs_put_layout_hdr */
|
|
|
|
pnfs_get_layout_hdr(NFS_I(inode)->layout);
|
|
|
|
|
2018-05-05 03:22:50 +07:00
|
|
|
nfs4_init_sequence(&lgp->args.seq_args, &lgp->res.seq_res, 0, 0);
|
2013-02-26 09:27:33 +07:00
|
|
|
|
2010-10-20 11:18:03 +07:00
|
|
|
task = rpc_run_task(&task_setup_data);
|
|
|
|
if (IS_ERR(task))
|
2012-09-18 04:12:15 +07:00
|
|
|
return ERR_CAST(task);
|
2017-01-12 03:01:43 +07:00
|
|
|
status = rpc_wait_for_completion_task(task);
|
pnfs: rework LAYOUTGET retry handling
There are several problems in the way a stateid is selected for a
LAYOUTGET operation:
We pick a stateid to use in the RPC prepare op, but that makes
it difficult to serialize LAYOUTGETs that use the open stateid. That
serialization is done in pnfs_update_layout, which occurs well before
the rpc_prepare operation.
Between those two events, the i_lock is dropped and reacquired.
pnfs_update_layout can find that the list has lsegs in it and not do any
serialization, but then later pnfs_choose_layoutget_stateid ends up
choosing the open stateid.
This patch changes the client to select the stateid to use in the
LAYOUTGET earlier, when we're searching for a usable layout segment.
This way we can do it all while holding the i_lock the first time, and
ensure that we serialize any LAYOUTGET call that uses a non-layout
stateid.
This also means a rework of how LAYOUTGET replies are handled, as we
must now get the latest stateid if we want to retransmit in response
to a retryable error.
Most of those errors boil down to the fact that the layout state has
changed in some fashion. Thus, what we really want to do is to re-search
for a layout when it fails with a retryable error, so that we can avoid
reissuing the RPC at all if possible.
While the LAYOUTGET RPC is async, the initiating thread always waits for
it to complete, so it's effectively synchronous anyway. Currently, when
we need to retry a LAYOUTGET because of an error, we drive that retry
via the rpc state machine.
This means that once the call has been submitted, it runs until it
completes. So, we must move the error handling for this RPC out of the
rpc_call_done operation and into the caller.
In order to handle errors like NFS4ERR_DELAY properly, we must also
pass a pointer to the sliding timeout, which is now moved to the stack
in pnfs_update_layout.
The complicating errors are -NFS4ERR_RECALLCONFLICT and
-NFS4ERR_LAYOUTTRYLATER, as those involve a timeout after which we give
up and return NULL back to the caller. So, there is some special
handling for those errors to ensure that the layers driving the retries
can handle that appropriately.
Signed-off-by: Jeff Layton <jeff.layton@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2016-05-17 23:28:47 +07:00
|
|
|
if (status == 0) {
|
|
|
|
status = nfs4_layoutget_handle_exception(task, lgp, &exception);
|
|
|
|
*timeout = exception.timeout;
|
|
|
|
}
|
|
|
|
|
2013-08-15 03:36:51 +07:00
|
|
|
trace_nfs4_layoutget(lgp->args.ctx,
|
|
|
|
&lgp->args.range,
|
|
|
|
&lgp->res.range,
|
Adding stateid information to tracepoints
Operations to which stateid information is added:
close, delegreturn, open, read, setattr, layoutget, layoutcommit, test_stateid,
write, lock, locku, lockt
Format is "stateid=<seqid>:<crc32 hash stateid.other>", also "openstateid=",
"layoutstateid=", and "lockstateid=" for open_file, layoutget, set_lock
tracepoints.
New function is added to internal.h, nfs_stateid_hash(), to compute the hash
trace_nfs4_setattr() is moved from nfs4_do_setattr() to _nfs4_do_setattr()
to get access to stateid.
trace_nfs4_setattr and trace_nfs4_delegreturn are changed from INODE_EVENT
to new event type, INODE_STATEID_EVENT which is same as INODE_EVENT but adds
stateid information
for locking tracepoints, moved trace_nfs4_set_lock() into _nfs4_do_setlk()
to get access to stateid information, and removed trace_nfs4_lock_reclaim(),
trace_nfs4_lock_expired() as they call into _nfs4_do_setlk() and both were
previously same LOCK_EVENT type.
Signed-off-by: Olga Kornievskaia <kolga@netapp.com>
Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
2015-11-25 01:29:41 +07:00
|
|
|
&lgp->res.stateid,
|
2013-08-15 03:36:51 +07:00
|
|
|
status);
|
pnfs: rework LAYOUTGET retry handling
There are several problems in the way a stateid is selected for a
LAYOUTGET operation:
We pick a stateid to use in the RPC prepare op, but that makes
it difficult to serialize LAYOUTGETs that use the open stateid. That
serialization is done in pnfs_update_layout, which occurs well before
the rpc_prepare operation.
Between those two events, the i_lock is dropped and reacquired.
pnfs_update_layout can find that the list has lsegs in it and not do any
serialization, but then later pnfs_choose_layoutget_stateid ends up
choosing the open stateid.
This patch changes the client to select the stateid to use in the
LAYOUTGET earlier, when we're searching for a usable layout segment.
This way we can do it all while holding the i_lock the first time, and
ensure that we serialize any LAYOUTGET call that uses a non-layout
stateid.
This also means a rework of how LAYOUTGET replies are handled, as we
must now get the latest stateid if we want to retransmit in response
to a retryable error.
Most of those errors boil down to the fact that the layout state has
changed in some fashion. Thus, what we really want to do is to re-search
for a layout when it fails with a retryable error, so that we can avoid
reissuing the RPC at all if possible.
While the LAYOUTGET RPC is async, the initiating thread always waits for
it to complete, so it's effectively synchronous anyway. Currently, when
we need to retry a LAYOUTGET because of an error, we drive that retry
via the rpc state machine.
This means that once the call has been submitted, it runs until it
completes. So, we must move the error handling for this RPC out of the
rpc_call_done operation and into the caller.
In order to handle errors like NFS4ERR_DELAY properly, we must also
pass a pointer to the sliding timeout, which is now moved to the stack
in pnfs_update_layout.
The complicating errors are -NFS4ERR_RECALLCONFLICT and
-NFS4ERR_LAYOUTTRYLATER, as those involve a timeout after which we give
up and return NULL back to the caller. So, there is some special
handling for those errors to ensure that the layers driving the retries
can handle that appropriately.
Signed-off-by: Jeff Layton <jeff.layton@primarydata.com>
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
2016-05-17 23:28:47 +07:00
|
|
|
|
2013-02-16 04:03:46 +07:00
|
|
|
/* if layoutp->len is 0, nfs4_layoutget_prepare called rpc_exit */
|
|
|
|
if (status == 0 && lgp->res.layoutp->len)
|
2012-09-18 04:12:15 +07:00
|
|
|
lseg = pnfs_layout_process(lgp);
|
2010-10-20 11:18:03 +07:00
|
|
|
rpc_put_task(task);
|
|
|
|
dprintk("<-- %s status=%d\n", __func__, status);
|
2012-09-18 04:12:15 +07:00
|
|
|
if (status)
|
|
|
|
return ERR_PTR(status);
|
|
|
|
return lseg;
|
2010-10-20 11:18:03 +07:00
|
|
|
}
|
|
|
|
|
2011-05-22 23:52:37 +07:00
|
|
|
static void
|
|
|
|
nfs4_layoutreturn_prepare(struct rpc_task *task, void *calldata)
|
|
|
|
{
|
|
|
|
struct nfs4_layoutreturn *lrp = calldata;
|
|
|
|
|
|
|
|
dprintk("--> %s\n", __func__);
|
2017-01-10 23:39:53 +07:00
|
|
|
nfs4_setup_sequence(lrp->clp,
|
2012-10-23 07:28:44 +07:00
|
|
|
&lrp->args.seq_args,
|
|
|
|
&lrp->res.seq_res,
|
|
|
|
task);
|
2011-05-22 23:52:37 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
static void nfs4_layoutreturn_done(struct rpc_task *task, void *calldata)
|
|
|
|
{
|
|
|
|
struct nfs4_layoutreturn *lrp = calldata;
|
|
|
|
struct nfs_server *server;
|
|
|
|
|
|
|
|
dprintk("--> %s\n", __func__);
|
|
|
|
|
2016-08-28 22:50:26 +07:00
|
|
|
if (!nfs41_sequence_process(task, &lrp->res.seq_res))
|
2011-05-22 23:52:37 +07:00
|
|
|
return;
|
|
|
|
|
|
|
|
server = NFS_SERVER(lrp->args.inode);
|
2013-12-05 00:09:45 +07:00
|
|
|
switch (task->tk_status) {
|
2017-11-07 03:28:08 +07:00
|
|
|
case -NFS4ERR_OLD_STATEID:
|
|
|
|
if (nfs4_refresh_layout_stateid(&lrp->args.stateid,
|
|
|
|
lrp->args.inode))
|
|
|
|
goto out_restart;
|
|
|
|
/* Fallthrough */
|
2013-12-05 00:09:45 +07:00
|
|
|
default:
|
|
|
|
task->tk_status = 0;
|
2017-11-07 03:28:08 +07:00
|
|
|
/* Fallthrough */
|
2013-12-05 00:09:45 +07:00
|
|
|
case 0:
|
|
|
|
break;
|
|
|
|
case -NFS4ERR_DELAY:
|
2014-09-18 13:09:27 +07:00
|
|
|
if (nfs4_async_handle_error(task, server, NULL, NULL) != -EAGAIN)
|
2013-12-05 00:09:45 +07:00
|
|
|
break;
|
2017-11-07 03:28:08 +07:00
|
|
|
goto out_restart;
|
2011-05-22 23:52:37 +07:00
|
|
|
}
|
|
|
|
dprintk("<-- %s\n", __func__);
|
2017-11-07 03:28:08 +07:00
|
|
|
return;
|
|
|
|
out_restart:
|
|
|
|
task->tk_status = 0;
|
|
|
|
nfs4_sequence_free_slot(&lrp->res.seq_res);
|
|
|
|
rpc_restart_call_prepare(task);
|
2011-05-22 23:52:37 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
static void nfs4_layoutreturn_release(void *calldata)
|
|
|
|
{
|
|
|
|
struct nfs4_layoutreturn *lrp = calldata;
|
2012-09-25 01:18:39 +07:00
|
|
|
struct pnfs_layout_hdr *lo = lrp->args.layout;
|
2011-05-22 23:52:37 +07:00
|
|
|
|
|
|
|
dprintk("--> %s\n", __func__);
|
2016-11-21 01:13:54 +07:00
|
|
|
pnfs_layoutreturn_free_lsegs(lo, &lrp->args.stateid, &lrp->args.range,
|
2016-10-13 06:50:54 +07:00
|
|
|
lrp->res.lrs_present ? &lrp->res.stateid : NULL);
|
2016-08-28 22:50:26 +07:00
|
|
|
nfs4_sequence_free_slot(&lrp->res.seq_res);
|
2016-09-23 22:38:08 +07:00
|
|
|
if (lrp->ld_private.ops && lrp->ld_private.ops->free)
|
|
|
|
lrp->ld_private.ops->free(&lrp->ld_private);
|
2016-12-08 00:29:26 +07:00
|
|
|
pnfs_put_layout_hdr(lrp->args.layout);
|
|
|
|
nfs_iput_and_deactive(lrp->inode);
|
2011-05-22 23:52:37 +07:00
|
|
|
kfree(calldata);
|
|
|
|
dprintk("<-- %s\n", __func__);
|
|
|
|
}
|
|
|
|
|
|
|
|
static const struct rpc_call_ops nfs4_layoutreturn_call_ops = {
|
|
|
|
.rpc_call_prepare = nfs4_layoutreturn_prepare,
|
|
|
|
.rpc_call_done = nfs4_layoutreturn_done,
|
|
|
|
.rpc_release = nfs4_layoutreturn_release,
|
|
|
|
};
|
|
|
|
|
2014-11-17 08:30:40 +07:00
|
|
|
/*
 * Start a LAYOUTRETURN call described by @lrp.
 *
 * @lrp:  call data; handed to the RPC task as callback_data
 * @sync: when false the task is flagged RPC_TASK_ASYNC and an active
 *        inode reference is taken first
 *
 * Returns -EAGAIN (after releasing @lrp) if the inode reference cannot
 * be taken in the asynchronous case, the rpc_run_task() error if the
 * task could not be started, the task status for a synchronous call,
 * and 0 for an asynchronous one.
 */
int nfs4_proc_layoutreturn(struct nfs4_layoutreturn *lrp, bool sync)
{
	struct nfs_server *server = NFS_SERVER(lrp->args.inode);
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LAYOUTRETURN],
		.rpc_argp = &lrp->args,
		.rpc_resp = &lrp->res,
		.rpc_cred = lrp->cred,
	};
	struct rpc_task_setup task_setup_data = {
		.rpc_client = server->client,
		.rpc_message = &msg,
		.callback_ops = &nfs4_layoutreturn_call_ops,
		.callback_data = lrp,
	};
	struct rpc_task *task;
	int status;

	/* May substitute the rpc client and credential chosen above. */
	nfs4_state_protect(server->nfs_client,
			   NFS_SP4_MACH_CRED_PNFS_CLEANUP,
			   &task_setup_data.rpc_client, &msg);

	dprintk("--> %s\n", __func__);

	if (!sync) {
		lrp->inode = nfs_igrab_and_active(lrp->args.inode);
		if (lrp->inode == NULL) {
			nfs4_layoutreturn_release(lrp);
			return -EAGAIN;
		}
		task_setup_data.flags |= RPC_TASK_ASYNC;
	}

	nfs4_init_sequence(&lrp->args.seq_args, &lrp->res.seq_res, 1, 0);

	task = rpc_run_task(&task_setup_data);
	if (IS_ERR(task))
		return PTR_ERR(task);

	/* Only a synchronous call reports the task's own status. */
	status = sync ? task->tk_status : 0;

	trace_nfs4_layoutreturn(lrp->args.inode, &lrp->args.stateid, status);
	dprintk("<-- %s status=%d\n", __func__, status);
	rpc_put_task(task);
	return status;
}
|
|
|
|
|
2010-10-20 11:18:03 +07:00
|
|
|
static int
|
2013-05-20 22:42:54 +07:00
|
|
|
_nfs4_proc_getdeviceinfo(struct nfs_server *server,
|
|
|
|
struct pnfs_device *pdev,
|
|
|
|
struct rpc_cred *cred)
|
2010-10-20 11:18:03 +07:00
|
|
|
{
|
|
|
|
struct nfs4_getdeviceinfo_args args = {
|
|
|
|
.pdev = pdev,
|
2015-03-10 01:01:25 +07:00
|
|
|
.notify_types = NOTIFY_DEVICEID4_CHANGE |
|
|
|
|
NOTIFY_DEVICEID4_DELETE,
|
2010-10-20 11:18:03 +07:00
|
|
|
};
|
|
|
|
struct nfs4_getdeviceinfo_res res = {
|
|
|
|
.pdev = pdev,
|
|
|
|
};
|
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_GETDEVICEINFO],
|
|
|
|
.rpc_argp = &args,
|
|
|
|
.rpc_resp = &res,
|
2013-05-20 22:42:54 +07:00
|
|
|
.rpc_cred = cred,
|
2010-10-20 11:18:03 +07:00
|
|
|
};
|
|
|
|
int status;
|
|
|
|
|
|
|
|
dprintk("--> %s\n", __func__);
|
2011-03-25 00:12:24 +07:00
|
|
|
status = nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
|
2015-03-10 01:01:25 +07:00
|
|
|
if (res.notification & ~args.notify_types)
|
|
|
|
dprintk("%s: unsupported notification\n", __func__);
|
2015-03-10 01:48:32 +07:00
|
|
|
if (res.notification != args.notify_types)
|
|
|
|
pdev->nocache = 1;
|
2015-03-10 01:01:25 +07:00
|
|
|
|
2010-10-20 11:18:03 +07:00
|
|
|
dprintk("<-- %s status=%d\n", __func__, status);
|
|
|
|
|
|
|
|
return status;
|
|
|
|
}
|
|
|
|
|
2013-05-20 22:42:54 +07:00
|
|
|
int nfs4_proc_getdeviceinfo(struct nfs_server *server,
|
|
|
|
struct pnfs_device *pdev,
|
|
|
|
struct rpc_cred *cred)
|
2010-10-20 11:18:03 +07:00
|
|
|
{
|
|
|
|
struct nfs4_exception exception = { };
|
|
|
|
int err;
|
|
|
|
|
|
|
|
do {
|
|
|
|
err = nfs4_handle_exception(server,
|
2013-05-20 22:42:54 +07:00
|
|
|
_nfs4_proc_getdeviceinfo(server, pdev, cred),
|
2010-10-20 11:18:03 +07:00
|
|
|
&exception);
|
|
|
|
} while (exception.retry);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
EXPORT_SYMBOL_GPL(nfs4_proc_getdeviceinfo);
|
|
|
|
|
2011-03-23 20:27:54 +07:00
|
|
|
static void nfs4_layoutcommit_prepare(struct rpc_task *task, void *calldata)
|
|
|
|
{
|
|
|
|
struct nfs4_layoutcommit_data *data = calldata;
|
|
|
|
struct nfs_server *server = NFS_SERVER(data->args.inode);
|
|
|
|
|
2017-01-10 23:39:53 +07:00
|
|
|
nfs4_setup_sequence(server->nfs_client,
|
2012-10-23 07:28:44 +07:00
|
|
|
&data->args.seq_args,
|
|
|
|
&data->res.seq_res,
|
|
|
|
task);
|
2011-03-23 20:27:54 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
|
|
|
nfs4_layoutcommit_done(struct rpc_task *task, void *calldata)
|
|
|
|
{
|
|
|
|
struct nfs4_layoutcommit_data *data = calldata;
|
|
|
|
struct nfs_server *server = NFS_SERVER(data->args.inode);
|
|
|
|
|
2012-10-23 07:07:20 +07:00
|
|
|
if (!nfs41_sequence_done(task, &data->res.seq_res))
|
2011-03-23 20:27:54 +07:00
|
|
|
return;
|
|
|
|
|
|
|
|
switch (task->tk_status) { /* Just ignore these failures */
|
2012-03-28 05:22:19 +07:00
|
|
|
case -NFS4ERR_DELEG_REVOKED: /* layout was recalled */
|
|
|
|
case -NFS4ERR_BADIOMODE: /* no IOMODE_RW layout for range */
|
|
|
|
case -NFS4ERR_BADLAYOUT: /* no layout */
|
|
|
|
case -NFS4ERR_GRACE: /* loca_recalim always false */
|
2011-03-23 20:27:54 +07:00
|
|
|
task->tk_status = 0;
|
2012-03-28 05:22:19 +07:00
|
|
|
case 0:
|
|
|
|
break;
|
|
|
|
default:
|
2014-09-18 13:09:27 +07:00
|
|
|
if (nfs4_async_handle_error(task, server, NULL, NULL) == -EAGAIN) {
|
2012-03-28 05:22:19 +07:00
|
|
|
rpc_restart_call_prepare(task);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
2011-03-23 20:27:54 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
static void nfs4_layoutcommit_release(void *calldata)
|
|
|
|
{
|
|
|
|
struct nfs4_layoutcommit_data *data = calldata;
|
|
|
|
|
2011-07-31 07:52:38 +07:00
|
|
|
pnfs_cleanup_layoutcommit(data);
|
2014-01-14 00:08:11 +07:00
|
|
|
nfs_post_op_update_inode_force_wcc(data->args.inode,
|
|
|
|
data->res.fattr);
|
2011-03-23 20:27:54 +07:00
|
|
|
put_rpccred(data->cred);
|
2015-02-06 04:50:30 +07:00
|
|
|
nfs_iput_and_deactive(data->inode);
|
2011-03-23 20:27:54 +07:00
|
|
|
kfree(data);
|
|
|
|
}
|
|
|
|
|
|
|
|
static const struct rpc_call_ops nfs4_layoutcommit_ops = {
|
|
|
|
.rpc_call_prepare = nfs4_layoutcommit_prepare,
|
|
|
|
.rpc_call_done = nfs4_layoutcommit_done,
|
|
|
|
.rpc_release = nfs4_layoutcommit_release,
|
|
|
|
};
|
|
|
|
|
|
|
|
int
|
2011-03-12 14:58:10 +07:00
|
|
|
nfs4_proc_layoutcommit(struct nfs4_layoutcommit_data *data, bool sync)
|
2011-03-23 20:27:54 +07:00
|
|
|
{
|
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LAYOUTCOMMIT],
|
|
|
|
.rpc_argp = &data->args,
|
|
|
|
.rpc_resp = &data->res,
|
|
|
|
.rpc_cred = data->cred,
|
|
|
|
};
|
|
|
|
struct rpc_task_setup task_setup_data = {
|
|
|
|
.task = &data->task,
|
|
|
|
.rpc_client = NFS_CLIENT(data->args.inode),
|
|
|
|
.rpc_message = &msg,
|
|
|
|
.callback_ops = &nfs4_layoutcommit_ops,
|
|
|
|
.callback_data = data,
|
|
|
|
};
|
|
|
|
struct rpc_task *task;
|
|
|
|
int status = 0;
|
|
|
|
|
2015-07-01 11:00:13 +07:00
|
|
|
dprintk("NFS: initiating layoutcommit call. sync %d "
|
|
|
|
"lbw: %llu inode %lu\n", sync,
|
2011-03-23 20:27:54 +07:00
|
|
|
data->args.lastbytewritten,
|
|
|
|
data->args.inode->i_ino);
|
|
|
|
|
2015-02-06 04:50:30 +07:00
|
|
|
if (!sync) {
|
|
|
|
data->inode = nfs_igrab_and_active(data->args.inode);
|
|
|
|
if (data->inode == NULL) {
|
|
|
|
nfs4_layoutcommit_release(data);
|
|
|
|
return -EAGAIN;
|
|
|
|
}
|
|
|
|
task_setup_data.flags = RPC_TASK_ASYNC;
|
|
|
|
}
|
2018-05-05 03:22:50 +07:00
|
|
|
nfs4_init_sequence(&data->args.seq_args, &data->res.seq_res, 1, 0);
|
2011-03-23 20:27:54 +07:00
|
|
|
task = rpc_run_task(&task_setup_data);
|
|
|
|
if (IS_ERR(task))
|
|
|
|
return PTR_ERR(task);
|
2015-02-06 04:50:30 +07:00
|
|
|
if (sync)
|
|
|
|
status = task->tk_status;
|
Adding stateid information to tracepoints
Operations to which stateid information is added:
close, delegreturn, open, read, setattr, layoutget, layoutcommit, test_stateid,
write, lock, locku, lockt
Format is "stateid=<seqid>:<crc32 hash stateid.other>", also "openstateid=",
"layoutstateid=", and "lockstateid=" for open_file, layoutget, set_lock
tracepoints.
New function is added to internal.h, nfs_stateid_hash(), to compute the hash
trace_nfs4_setattr() is moved from nfs4_do_setattr() to _nfs4_do_setattr()
to get access to stateid.
trace_nfs4_setattr and trace_nfs4_delegreturn are changed from INODE_EVENT
to new event type, INODE_STATEID_EVENT which is same as INODE_EVENT but adds
stateid information
for locking tracepoints, moved trace_nfs4_set_lock() into _nfs4_do_setlk()
to get access to stateid information, and removed trace_nfs4_lock_reclaim(),
trace_nfs4_lock_expired() as they call into _nfs4_do_setlk() and both were
previously same LOCK_EVENT type.
Signed-off-by: Olga Kornievskaia <kolga@netapp.com>
Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
2015-11-25 01:29:41 +07:00
|
|
|
trace_nfs4_layoutcommit(data->args.inode, &data->args.stateid, status);
|
2011-03-23 20:27:54 +07:00
|
|
|
dprintk("%s: status %d\n", __func__, status);
|
|
|
|
rpc_put_task(task);
|
|
|
|
return status;
|
|
|
|
}
|
2011-06-03 01:59:07 +07:00
|
|
|
|
2013-08-08 21:57:56 +07:00
|
|
|
/**
|
|
|
|
* Use the state managment nfs_client cl_rpcclient, which uses krb5i (if
|
|
|
|
* possible) as per RFC3530bis and RFC5661 Security Considerations sections
|
|
|
|
*/
|
2011-06-03 01:59:07 +07:00
|
|
|
static int
|
|
|
|
_nfs41_proc_secinfo_no_name(struct nfs_server *server, struct nfs_fh *fhandle,
|
2013-09-04 23:13:19 +07:00
|
|
|
struct nfs_fsinfo *info,
|
|
|
|
struct nfs4_secinfo_flavors *flavors, bool use_integrity)
|
2011-06-03 01:59:07 +07:00
|
|
|
{
|
|
|
|
struct nfs41_secinfo_no_name_args args = {
|
|
|
|
.style = SECINFO_STYLE_CURRENT_FH,
|
|
|
|
};
|
|
|
|
struct nfs4_secinfo_res res = {
|
|
|
|
.flavors = flavors,
|
|
|
|
};
|
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SECINFO_NO_NAME],
|
|
|
|
.rpc_argp = &args,
|
|
|
|
.rpc_resp = &res,
|
|
|
|
};
|
2013-09-04 23:13:19 +07:00
|
|
|
struct rpc_clnt *clnt = server->client;
|
2013-09-11 05:44:31 +07:00
|
|
|
struct rpc_cred *cred = NULL;
|
2013-09-04 23:13:19 +07:00
|
|
|
int status;
|
|
|
|
|
|
|
|
if (use_integrity) {
|
|
|
|
clnt = server->nfs_client->cl_rpcclient;
|
2013-09-11 05:44:31 +07:00
|
|
|
cred = nfs4_get_clid_cred(server->nfs_client);
|
|
|
|
msg.rpc_cred = cred;
|
2013-09-04 23:13:19 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
dprintk("--> %s\n", __func__);
|
|
|
|
status = nfs4_call_sync(clnt, server, &msg, &args.seq_args,
|
|
|
|
&res.seq_res, 0);
|
|
|
|
dprintk("<-- %s status=%d\n", __func__, status);
|
|
|
|
|
2013-09-11 05:44:31 +07:00
|
|
|
if (cred)
|
|
|
|
put_rpccred(cred);
|
2013-09-04 23:13:19 +07:00
|
|
|
|
|
|
|
return status;
|
2011-06-03 01:59:07 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
static int
|
|
|
|
nfs41_proc_secinfo_no_name(struct nfs_server *server, struct nfs_fh *fhandle,
|
|
|
|
struct nfs_fsinfo *info, struct nfs4_secinfo_flavors *flavors)
|
|
|
|
{
|
|
|
|
struct nfs4_exception exception = { };
|
|
|
|
int err;
|
|
|
|
do {
|
2013-09-04 23:13:19 +07:00
|
|
|
/* first try using integrity protection */
|
|
|
|
err = -NFS4ERR_WRONGSEC;
|
|
|
|
|
|
|
|
/* try to use integrity protection with machine cred */
|
|
|
|
if (_nfs4_is_integrity_protected(server->nfs_client))
|
|
|
|
err = _nfs41_proc_secinfo_no_name(server, fhandle, info,
|
|
|
|
flavors, true);
|
|
|
|
|
|
|
|
/*
|
|
|
|
* if unable to use integrity protection, or SECINFO with
|
|
|
|
* integrity protection returns NFS4ERR_WRONGSEC (which is
|
|
|
|
* disallowed by spec, but exists in deployed servers) use
|
|
|
|
* the current filesystem's rpc_client and the user cred.
|
|
|
|
*/
|
|
|
|
if (err == -NFS4ERR_WRONGSEC)
|
|
|
|
err = _nfs41_proc_secinfo_no_name(server, fhandle, info,
|
|
|
|
flavors, false);
|
|
|
|
|
2011-06-03 01:59:07 +07:00
|
|
|
switch (err) {
|
|
|
|
case 0:
|
|
|
|
case -NFS4ERR_WRONGSEC:
|
2014-01-14 04:54:45 +07:00
|
|
|
case -ENOTSUPP:
|
2012-03-28 05:13:02 +07:00
|
|
|
goto out;
|
2011-06-03 01:59:07 +07:00
|
|
|
default:
|
|
|
|
err = nfs4_handle_exception(server, err, &exception);
|
|
|
|
}
|
|
|
|
} while (exception.retry);
|
2012-03-28 05:13:02 +07:00
|
|
|
out:
|
2011-06-03 01:59:07 +07:00
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int
|
|
|
|
nfs41_find_root_sec(struct nfs_server *server, struct nfs_fh *fhandle,
|
|
|
|
struct nfs_fsinfo *info)
|
|
|
|
{
|
|
|
|
int err;
|
|
|
|
struct page *page;
|
2013-09-26 04:02:48 +07:00
|
|
|
rpc_authflavor_t flavor = RPC_AUTH_MAXFLAVOR;
|
2011-06-03 01:59:07 +07:00
|
|
|
struct nfs4_secinfo_flavors *flavors;
|
2013-09-25 00:58:02 +07:00
|
|
|
struct nfs4_secinfo4 *secinfo;
|
|
|
|
int i;
|
2011-06-03 01:59:07 +07:00
|
|
|
|
|
|
|
page = alloc_page(GFP_KERNEL);
|
|
|
|
if (!page) {
|
|
|
|
err = -ENOMEM;
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
|
|
|
|
flavors = page_address(page);
|
|
|
|
err = nfs41_proc_secinfo_no_name(server, fhandle, info, flavors);
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Fall back on "guess and check" method if
|
|
|
|
* the server doesn't support SECINFO_NO_NAME
|
|
|
|
*/
|
2014-01-14 04:54:45 +07:00
|
|
|
if (err == -NFS4ERR_WRONGSEC || err == -ENOTSUPP) {
|
2011-06-03 01:59:07 +07:00
|
|
|
err = nfs4_find_root_sec(server, fhandle, info);
|
|
|
|
goto out_freepage;
|
|
|
|
}
|
|
|
|
if (err)
|
|
|
|
goto out_freepage;
|
|
|
|
|
2013-09-25 00:58:02 +07:00
|
|
|
for (i = 0; i < flavors->num_flavors; i++) {
|
|
|
|
secinfo = &flavors->flavors[i];
|
|
|
|
|
|
|
|
switch (secinfo->flavor) {
|
|
|
|
case RPC_AUTH_NULL:
|
|
|
|
case RPC_AUTH_UNIX:
|
|
|
|
case RPC_AUTH_GSS:
|
|
|
|
flavor = rpcauth_get_pseudoflavor(secinfo->flavor,
|
|
|
|
&secinfo->flavor_info);
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
flavor = RPC_AUTH_MAXFLAVOR;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
2013-10-19 02:15:19 +07:00
|
|
|
if (!nfs_auth_info_match(&server->auth_info, flavor))
|
|
|
|
flavor = RPC_AUTH_MAXFLAVOR;
|
|
|
|
|
2013-09-25 00:58:02 +07:00
|
|
|
if (flavor != RPC_AUTH_MAXFLAVOR) {
|
|
|
|
err = nfs4_lookup_root_sec(server, fhandle,
|
|
|
|
info, flavor);
|
|
|
|
if (!err)
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (flavor == RPC_AUTH_MAXFLAVOR)
|
|
|
|
err = -EPERM;
|
2011-06-03 01:59:07 +07:00
|
|
|
|
|
|
|
out_freepage:
|
|
|
|
put_page(page);
|
|
|
|
if (err == -EACCES)
|
|
|
|
return -EPERM;
|
|
|
|
out:
|
|
|
|
return err;
|
|
|
|
}
|
2012-01-31 22:39:29 +07:00
|
|
|
|
2013-05-20 22:20:27 +07:00
|
|
|
static int _nfs41_test_stateid(struct nfs_server *server,
|
|
|
|
nfs4_stateid *stateid,
|
|
|
|
struct rpc_cred *cred)
|
2011-06-03 01:59:08 +07:00
|
|
|
{
|
|
|
|
int status;
|
|
|
|
struct nfs41_test_stateid_args args = {
|
2012-01-31 22:39:29 +07:00
|
|
|
.stateid = stateid,
|
2011-06-03 01:59:08 +07:00
|
|
|
};
|
|
|
|
struct nfs41_test_stateid_res res;
|
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_TEST_STATEID],
|
|
|
|
.rpc_argp = &args,
|
|
|
|
.rpc_resp = &res,
|
2013-05-20 22:20:27 +07:00
|
|
|
.rpc_cred = cred,
|
2011-06-03 01:59:08 +07:00
|
|
|
};
|
2013-08-14 03:37:36 +07:00
|
|
|
struct rpc_clnt *rpc_client = server->client;
|
|
|
|
|
|
|
|
nfs4_state_protect(server->nfs_client, NFS_SP4_MACH_CRED_STATEID,
|
|
|
|
&rpc_client, &msg);
|
2012-01-31 22:39:29 +07:00
|
|
|
|
2012-07-12 03:30:23 +07:00
|
|
|
dprintk("NFS call test_stateid %p\n", stateid);
|
2018-05-05 03:22:50 +07:00
|
|
|
nfs4_init_sequence(&args.seq_args, &res.seq_res, 0, 1);
|
2013-08-14 03:37:36 +07:00
|
|
|
status = nfs4_call_sync_sequence(rpc_client, server, &msg,
|
2012-10-30 06:02:20 +07:00
|
|
|
&args.seq_args, &res.seq_res);
|
2012-07-12 03:30:23 +07:00
|
|
|
if (status != NFS_OK) {
|
|
|
|
dprintk("NFS reply test_stateid: failed, %d\n", status);
|
NFS: Fix up TEST_STATEID and FREE_STATEID return code handling
The TEST_STATEID and FREE_STATEID operations can return
-NFS4ERR_BAD_STATEID, -NFS4ERR_OLD_STATEID, or -NFS4ERR_DEADSESSION.
nfs41_{test,free}_stateid() should not pass these errors to
nfs4_handle_exception() during state recovery, since that will
recursively kick off state recovery again, resulting in a deadlock.
In particular, when the TEST_STATEID operation returns NFS4_OK,
res.status can contain one of these errors. _nfs41_test_stateid()
replaces NFS4_OK with the value in res.status, which is then returned
to callers.
But res.status is not passed through nfs4_stat_to_errno(), and thus is
a positive NFS4ERR value. Currently callers are only interested in
!NFS4_OK, and nfs4_handle_exception() ignores positive values.
Thus the res.status values are currently ignored by
nfs4_handle_exception() and won't cause the deadlock above. Thanks to
this missing negative, it is only when these operations fail (which
is very rare) that a deadlock can occur.
Bryan agrees the original intent was to return res.status as a
negative NFS4ERR value to callers of nfs41_test_stateid().
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
2012-07-12 03:29:45 +07:00
|
|
|
return status;
|
2012-07-12 03:30:23 +07:00
|
|
|
}
|
|
|
|
dprintk("NFS reply test_stateid: succeeded, %d\n", -res.status);
|
NFS: Fix up TEST_STATEID and FREE_STATEID return code handling
The TEST_STATEID and FREE_STATEID operations can return
-NFS4ERR_BAD_STATEID, -NFS4ERR_OLD_STATEID, or -NFS4ERR_DEADSESSION.
nfs41_{test,free}_stateid() should not pass these errors to
nfs4_handle_exception() during state recovery, since that will
recursively kick off state recovery again, resulting in a deadlock.
In particular, when the TEST_STATEID operation returns NFS4_OK,
res.status can contain one of these errors. _nfs41_test_stateid()
replaces NFS4_OK with the value in res.status, which is then returned
to callers.
But res.status is not passed through nfs4_stat_to_errno(), and thus is
a positive NFS4ERR value. Currently callers are only interested in
!NFS4_OK, and nfs4_handle_exception() ignores positive values.
Thus the res.status values are currently ignored by
nfs4_handle_exception() and won't cause the deadlock above. Thanks to
this missing negative, it is only when these operations fail (which
is very rare) that a deadlock can occur.
Bryan agrees the original intent was to return res.status as a
negative NFS4ERR value to callers of nfs41_test_stateid().
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
2012-07-12 03:29:45 +07:00
|
|
|
return -res.status;
|
2011-06-03 01:59:08 +07:00
|
|
|
}
|
|
|
|
|
2016-09-23 00:38:56 +07:00
|
|
|
static void nfs4_handle_delay_or_session_error(struct nfs_server *server,
|
|
|
|
int err, struct nfs4_exception *exception)
|
|
|
|
{
|
|
|
|
exception->retry = 0;
|
|
|
|
switch(err) {
|
|
|
|
case -NFS4ERR_DELAY:
|
2016-09-23 00:39:19 +07:00
|
|
|
case -NFS4ERR_RETRY_UNCACHED_REP:
|
2016-09-23 00:38:56 +07:00
|
|
|
nfs4_handle_exception(server, err, exception);
|
|
|
|
break;
|
|
|
|
case -NFS4ERR_BADSESSION:
|
|
|
|
case -NFS4ERR_BADSLOT:
|
|
|
|
case -NFS4ERR_BAD_HIGH_SLOT:
|
|
|
|
case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION:
|
|
|
|
case -NFS4ERR_DEADSESSION:
|
|
|
|
nfs4_do_handle_exception(server, err, exception);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2012-07-12 03:30:23 +07:00
|
|
|
/**
|
|
|
|
* nfs41_test_stateid - perform a TEST_STATEID operation
|
|
|
|
*
|
|
|
|
* @server: server / transport on which to perform the operation
|
|
|
|
* @stateid: state ID to test
|
2013-05-20 22:20:27 +07:00
|
|
|
* @cred: credential
|
2012-07-12 03:30:23 +07:00
|
|
|
*
|
|
|
|
* Returns NFS_OK if the server recognizes that "stateid" is valid.
|
|
|
|
* Otherwise a negative NFS4ERR value is returned if the operation
|
|
|
|
* failed or the state ID is not currently valid.
|
|
|
|
*/
|
2013-05-20 22:20:27 +07:00
|
|
|
static int nfs41_test_stateid(struct nfs_server *server,
|
|
|
|
nfs4_stateid *stateid,
|
|
|
|
struct rpc_cred *cred)
|
2011-06-03 01:59:08 +07:00
|
|
|
{
|
|
|
|
struct nfs4_exception exception = { };
|
|
|
|
int err;
|
|
|
|
do {
|
2013-05-20 22:20:27 +07:00
|
|
|
err = _nfs41_test_stateid(server, stateid, cred);
|
2016-09-23 00:38:56 +07:00
|
|
|
nfs4_handle_delay_or_session_error(server, err, &exception);
|
2011-06-03 01:59:08 +07:00
|
|
|
} while (exception.retry);
|
|
|
|
return err;
|
|
|
|
}
|
2011-06-03 01:59:09 +07:00
|
|
|
|
2013-05-04 01:40:01 +07:00
|
|
|
struct nfs_free_stateid_data {
|
|
|
|
struct nfs_server *server;
|
|
|
|
struct nfs41_free_stateid_args args;
|
2011-06-03 01:59:09 +07:00
|
|
|
struct nfs41_free_stateid_res res;
|
2013-05-04 01:40:01 +07:00
|
|
|
};
|
|
|
|
|
|
|
|
static void nfs41_free_stateid_prepare(struct rpc_task *task, void *calldata)
|
|
|
|
{
|
|
|
|
struct nfs_free_stateid_data *data = calldata;
|
2017-01-10 23:39:53 +07:00
|
|
|
nfs4_setup_sequence(data->server->nfs_client,
|
2013-05-04 01:40:01 +07:00
|
|
|
&data->args.seq_args,
|
|
|
|
&data->res.seq_res,
|
|
|
|
task);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void nfs41_free_stateid_done(struct rpc_task *task, void *calldata)
|
|
|
|
{
|
|
|
|
struct nfs_free_stateid_data *data = calldata;
|
|
|
|
|
|
|
|
nfs41_sequence_done(task, &data->res.seq_res);
|
|
|
|
|
|
|
|
switch (task->tk_status) {
|
|
|
|
case -NFS4ERR_DELAY:
|
2014-09-18 13:09:27 +07:00
|
|
|
if (nfs4_async_handle_error(task, data->server, NULL, NULL) == -EAGAIN)
|
2013-05-04 01:40:01 +07:00
|
|
|
rpc_restart_call_prepare(task);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/* rpc_release callback for FREE_STATEID: frees the call data. */
static void nfs41_free_stateid_release(void *calldata)
{
	struct nfs_free_stateid_data *data = calldata;

	kfree(data);
}
|
|
|
|
|
2013-08-22 02:48:42 +07:00
|
|
|
static const struct rpc_call_ops nfs41_free_stateid_ops = {
|
2013-05-04 01:40:01 +07:00
|
|
|
.rpc_call_prepare = nfs41_free_stateid_prepare,
|
|
|
|
.rpc_call_done = nfs41_free_stateid_done,
|
|
|
|
.rpc_release = nfs41_free_stateid_release,
|
|
|
|
};
|
|
|
|
|
2018-05-16 00:03:39 +07:00
|
|
|
/**
|
|
|
|
* nfs41_free_stateid - perform a FREE_STATEID operation
|
|
|
|
*
|
|
|
|
* @server: server / transport on which to perform the operation
|
|
|
|
* @stateid: state ID to release
|
|
|
|
* @cred: credential
|
|
|
|
* @is_recovery: set to true if this call needs to be privileged
|
|
|
|
*
|
|
|
|
* Note: this function is always asynchronous.
|
|
|
|
*/
|
|
|
|
static int nfs41_free_stateid(struct nfs_server *server,
|
2016-09-23 00:39:04 +07:00
|
|
|
const nfs4_stateid *stateid,
|
2013-05-20 22:20:27 +07:00
|
|
|
struct rpc_cred *cred,
|
2013-05-04 01:40:01 +07:00
|
|
|
bool privileged)
|
|
|
|
{
|
2011-06-03 01:59:09 +07:00
|
|
|
struct rpc_message msg = {
|
|
|
|
.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_FREE_STATEID],
|
2013-05-20 22:20:27 +07:00
|
|
|
.rpc_cred = cred,
|
2011-06-03 01:59:09 +07:00
|
|
|
};
|
2013-05-04 01:40:01 +07:00
|
|
|
struct rpc_task_setup task_setup = {
|
|
|
|
.rpc_client = server->client,
|
|
|
|
.rpc_message = &msg,
|
|
|
|
.callback_ops = &nfs41_free_stateid_ops,
|
|
|
|
.flags = RPC_TASK_ASYNC,
|
|
|
|
};
|
|
|
|
struct nfs_free_stateid_data *data;
|
2018-05-16 00:03:39 +07:00
|
|
|
struct rpc_task *task;
|
2011-06-03 01:59:09 +07:00
|
|
|
|
2013-08-14 03:37:36 +07:00
|
|
|
nfs4_state_protect(server->nfs_client, NFS_SP4_MACH_CRED_STATEID,
|
|
|
|
&task_setup.rpc_client, &msg);
|
|
|
|
|
2012-07-12 03:30:23 +07:00
|
|
|
dprintk("NFS call free_stateid %p\n", stateid);
|
2013-05-04 01:40:01 +07:00
|
|
|
data = kmalloc(sizeof(*data), GFP_NOFS);
|
|
|
|
if (!data)
|
2018-05-16 00:03:39 +07:00
|
|
|
return -ENOMEM;
|
2013-05-04 01:40:01 +07:00
|
|
|
data->server = server;
|
|
|
|
nfs4_stateid_copy(&data->args.stateid, stateid);
|
|
|
|
|
|
|
|
task_setup.callback_data = data;
|
|
|
|
|
|
|
|
msg.rpc_argp = &data->args;
|
|
|
|
msg.rpc_resp = &data->res;
|
2018-05-05 03:22:50 +07:00
|
|
|
nfs4_init_sequence(&data->args.seq_args, &data->res.seq_res, 1, privileged);
|
2018-05-16 00:03:39 +07:00
|
|
|
task = rpc_run_task(&task_setup);
|
2013-05-04 01:40:01 +07:00
|
|
|
if (IS_ERR(task))
|
|
|
|
return PTR_ERR(task);
|
|
|
|
rpc_put_task(task);
|
2016-09-23 00:39:04 +07:00
|
|
|
return 0;
|
2011-06-03 01:59:09 +07:00
|
|
|
}
|
2012-03-05 06:13:56 +07:00
|
|
|
|
2014-05-01 17:28:47 +07:00
|
|
|
static void
|
|
|
|
nfs41_free_lock_state(struct nfs_server *server, struct nfs4_lock_state *lsp)
|
2013-05-04 03:22:55 +07:00
|
|
|
{
|
2013-05-20 22:20:27 +07:00
|
|
|
struct rpc_cred *cred = lsp->ls_state->owner->so_cred;
|
2013-05-04 03:22:55 +07:00
|
|
|
|
2016-09-23 00:39:04 +07:00
|
|
|
nfs41_free_stateid(server, &lsp->ls_stateid, cred, false);
|
2013-05-04 03:22:55 +07:00
|
|
|
nfs4_free_lock_state(server, lsp);
|
|
|
|
}
|
|
|
|
|
2012-03-05 06:13:56 +07:00
|
|
|
static bool nfs41_match_stateid(const nfs4_stateid *s1,
|
|
|
|
const nfs4_stateid *s2)
|
|
|
|
{
|
2016-05-17 04:42:43 +07:00
|
|
|
if (s1->type != s2->type)
|
|
|
|
return false;
|
|
|
|
|
2012-03-05 06:13:57 +07:00
|
|
|
if (memcmp(s1->other, s2->other, sizeof(s1->other)) != 0)
|
2012-03-05 06:13:56 +07:00
|
|
|
return false;
|
|
|
|
|
2012-03-05 06:13:57 +07:00
|
|
|
if (s1->seqid == s2->seqid)
|
2012-03-05 06:13:56 +07:00
|
|
|
return true;
|
|
|
|
|
2017-01-12 04:59:48 +07:00
|
|
|
return s1->seqid == 0 || s2->seqid == 0;
|
2012-03-05 06:13:56 +07:00
|
|
|
}
|
|
|
|
|
2009-04-01 20:21:53 +07:00
|
|
|
#endif /* CONFIG_NFS_V4_1 */
|
|
|
|
|
2012-03-05 06:13:56 +07:00
|
|
|
/* Compare two stateids by delegating to nfs4_stateid_match(). */
static bool nfs4_match_stateid(const nfs4_stateid *s1,
		const nfs4_stateid *s2)
{
	bool matched = nfs4_stateid_match(s1, s2);

	return matched;
}
|
|
|
|
|
|
|
|
|
2012-03-12 00:11:00 +07:00
|
|
|
static const struct nfs4_state_recovery_ops nfs40_reboot_recovery_ops = {
|
2008-12-24 03:21:43 +07:00
|
|
|
.owner_flag_bit = NFS_OWNER_RECLAIM_REBOOT,
|
2008-12-24 03:21:41 +07:00
|
|
|
.state_flag_bit = NFS_STATE_RECLAIM_REBOOT,
|
2005-04-17 05:20:36 +07:00
|
|
|
.recover_open = nfs4_open_reclaim,
|
|
|
|
.recover_lock = nfs4_lock_reclaim,
|
2009-04-01 20:22:47 +07:00
|
|
|
.establish_clid = nfs4_init_clientid,
|
2012-09-15 04:24:32 +07:00
|
|
|
.detect_trunking = nfs40_discover_server_trunking,
|
2005-04-17 05:20:36 +07:00
|
|
|
};
|
|
|
|
|
2009-04-01 20:22:47 +07:00
|
|
|
#if defined(CONFIG_NFS_V4_1)
|
2012-03-12 00:11:00 +07:00
|
|
|
static const struct nfs4_state_recovery_ops nfs41_reboot_recovery_ops = {
|
2009-04-01 20:22:47 +07:00
|
|
|
.owner_flag_bit = NFS_OWNER_RECLAIM_REBOOT,
|
|
|
|
.state_flag_bit = NFS_STATE_RECLAIM_REBOOT,
|
|
|
|
.recover_open = nfs4_open_reclaim,
|
|
|
|
.recover_lock = nfs4_lock_reclaim,
|
2009-12-05 03:52:24 +07:00
|
|
|
.establish_clid = nfs41_init_clientid,
|
2009-12-06 04:08:41 +07:00
|
|
|
.reclaim_complete = nfs41_proc_reclaim_complete,
|
2012-09-15 04:24:32 +07:00
|
|
|
.detect_trunking = nfs41_discover_server_trunking,
|
2009-04-01 20:22:47 +07:00
|
|
|
};
|
|
|
|
#endif /* CONFIG_NFS_V4_1 */
|
|
|
|
|
2012-03-12 00:11:00 +07:00
|
|
|
static const struct nfs4_state_recovery_ops nfs40_nograce_recovery_ops = {
|
2009-04-01 20:22:47 +07:00
|
|
|
.owner_flag_bit = NFS_OWNER_RECLAIM_NOGRACE,
|
|
|
|
.state_flag_bit = NFS_STATE_RECLAIM_NOGRACE,
|
2014-10-17 19:10:25 +07:00
|
|
|
.recover_open = nfs40_open_expired,
|
2009-04-01 20:22:47 +07:00
|
|
|
.recover_lock = nfs4_lock_expired,
|
|
|
|
.establish_clid = nfs4_init_clientid,
|
|
|
|
};
|
|
|
|
|
|
|
|
#if defined(CONFIG_NFS_V4_1)
|
2012-03-12 00:11:00 +07:00
|
|
|
static const struct nfs4_state_recovery_ops nfs41_nograce_recovery_ops = {
|
2008-12-24 03:21:43 +07:00
|
|
|
.owner_flag_bit = NFS_OWNER_RECLAIM_NOGRACE,
|
2008-12-24 03:21:41 +07:00
|
|
|
.state_flag_bit = NFS_STATE_RECLAIM_NOGRACE,
|
2011-06-03 01:59:10 +07:00
|
|
|
.recover_open = nfs41_open_expired,
|
|
|
|
.recover_lock = nfs41_lock_expired,
|
2009-12-05 03:52:24 +07:00
|
|
|
.establish_clid = nfs41_init_clientid,
|
2005-04-17 05:20:36 +07:00
|
|
|
};
|
2009-04-01 20:22:47 +07:00
|
|
|
#endif /* CONFIG_NFS_V4_1 */
|
2005-04-17 05:20:36 +07:00
|
|
|
|
2012-03-12 00:11:00 +07:00
|
|
|
static const struct nfs4_state_maintenance_ops nfs40_state_renewal_ops = {
|
2009-04-01 20:22:44 +07:00
|
|
|
.sched_state_renewal = nfs4_proc_async_renew,
|
2009-04-01 20:22:46 +07:00
|
|
|
.get_state_renewal_cred_locked = nfs4_get_renew_cred_locked,
|
2009-04-01 20:22:45 +07:00
|
|
|
.renew_lease = nfs4_proc_renew,
|
2009-04-01 20:22:44 +07:00
|
|
|
};
|
|
|
|
|
|
|
|
#if defined(CONFIG_NFS_V4_1)
|
2012-03-12 00:11:00 +07:00
|
|
|
static const struct nfs4_state_maintenance_ops nfs41_state_renewal_ops = {
|
2009-04-01 20:22:44 +07:00
|
|
|
.sched_state_renewal = nfs41_proc_async_sequence,
|
2009-04-01 20:22:46 +07:00
|
|
|
.get_state_renewal_cred_locked = nfs4_get_machine_cred_locked,
|
2009-04-01 20:22:45 +07:00
|
|
|
.renew_lease = nfs4_proc_sequence,
|
2009-04-01 20:22:44 +07:00
|
|
|
};
|
|
|
|
#endif
|
|
|
|
|
2013-10-18 01:12:39 +07:00
|
|
|
static const struct nfs4_mig_recovery_ops nfs40_mig_recovery_ops = {
|
2013-10-18 01:12:50 +07:00
|
|
|
.get_locations = _nfs40_proc_get_locations,
|
2013-10-18 01:13:30 +07:00
|
|
|
.fsid_present = _nfs40_proc_fsid_present,
|
2013-10-18 01:12:39 +07:00
|
|
|
};
|
|
|
|
|
|
|
|
#if defined(CONFIG_NFS_V4_1)
|
|
|
|
static const struct nfs4_mig_recovery_ops nfs41_mig_recovery_ops = {
|
2013-10-18 01:12:50 +07:00
|
|
|
.get_locations = _nfs41_proc_get_locations,
|
2013-10-18 01:13:30 +07:00
|
|
|
.fsid_present = _nfs41_proc_fsid_present,
|
2013-10-18 01:12:39 +07:00
|
|
|
};
|
|
|
|
#endif /* CONFIG_NFS_V4_1 */
|
|
|
|
|
2010-06-16 20:52:26 +07:00
|
|
|
static const struct nfs4_minor_version_ops nfs_v4_0_minor_ops = {
|
|
|
|
.minor_version = 0,
|
2013-03-16 03:11:57 +07:00
|
|
|
.init_caps = NFS_CAP_READDIRPLUS
|
|
|
|
| NFS_CAP_ATOMIC_OPEN
|
|
|
|
| NFS_CAP_POSIX_LOCK,
|
2013-08-09 23:49:11 +07:00
|
|
|
.init_client = nfs40_init_client,
|
|
|
|
.shutdown_client = nfs40_shutdown_client,
|
2012-03-05 06:13:56 +07:00
|
|
|
.match_stateid = nfs4_match_stateid,
|
2011-06-03 01:59:07 +07:00
|
|
|
.find_root_sec = nfs4_find_root_sec,
|
2013-05-04 03:22:55 +07:00
|
|
|
.free_lock_state = nfs4_release_lockowner,
|
2016-09-23 00:38:59 +07:00
|
|
|
.test_and_free_expired = nfs40_test_and_free_expired_stateid,
|
2015-01-24 07:19:25 +07:00
|
|
|
.alloc_seqid = nfs_alloc_seqid,
|
2013-08-09 23:48:27 +07:00
|
|
|
.call_sync_ops = &nfs40_call_sync_ops,
|
2010-06-16 20:52:27 +07:00
|
|
|
.reboot_recovery_ops = &nfs40_reboot_recovery_ops,
|
|
|
|
.nograce_recovery_ops = &nfs40_nograce_recovery_ops,
|
|
|
|
.state_renewal_ops = &nfs40_state_renewal_ops,
|
2013-10-18 01:12:39 +07:00
|
|
|
.mig_recovery_ops = &nfs40_mig_recovery_ops,
|
2010-06-16 20:52:26 +07:00
|
|
|
};
|
|
|
|
|
|
|
|
#if defined(CONFIG_NFS_V4_1)
|
2015-01-24 07:19:25 +07:00
|
|
|
static struct nfs_seqid *
|
|
|
|
nfs_alloc_no_seqid(struct nfs_seqid_counter *arg1, gfp_t arg2)
|
|
|
|
{
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
2010-06-16 20:52:26 +07:00
|
|
|
static const struct nfs4_minor_version_ops nfs_v4_1_minor_ops = {
|
|
|
|
.minor_version = 1,
|
2013-03-16 03:11:57 +07:00
|
|
|
.init_caps = NFS_CAP_READDIRPLUS
|
|
|
|
| NFS_CAP_ATOMIC_OPEN
|
2013-03-18 02:31:15 +07:00
|
|
|
| NFS_CAP_POSIX_LOCK
|
2013-03-16 03:44:28 +07:00
|
|
|
| NFS_CAP_STATEID_NFSV41
|
2016-10-05 02:26:41 +07:00
|
|
|
| NFS_CAP_ATOMIC_OPEN_V1
|
|
|
|
| NFS_CAP_LGOPEN,
|
2013-08-09 23:49:11 +07:00
|
|
|
.init_client = nfs41_init_client,
|
|
|
|
.shutdown_client = nfs41_shutdown_client,
|
2012-03-05 06:13:56 +07:00
|
|
|
.match_stateid = nfs41_match_stateid,
|
2011-06-03 01:59:07 +07:00
|
|
|
.find_root_sec = nfs41_find_root_sec,
|
2013-05-04 03:22:55 +07:00
|
|
|
.free_lock_state = nfs41_free_lock_state,
|
2016-09-23 00:38:59 +07:00
|
|
|
.test_and_free_expired = nfs41_test_and_free_expired_stateid,
|
2015-01-24 07:19:25 +07:00
|
|
|
.alloc_seqid = nfs_alloc_no_seqid,
|
2016-09-09 20:22:29 +07:00
|
|
|
.session_trunk = nfs4_test_session_trunk,
|
2013-08-09 23:48:27 +07:00
|
|
|
.call_sync_ops = &nfs41_call_sync_ops,
|
2010-06-16 20:52:27 +07:00
|
|
|
.reboot_recovery_ops = &nfs41_reboot_recovery_ops,
|
|
|
|
.nograce_recovery_ops = &nfs41_nograce_recovery_ops,
|
|
|
|
.state_renewal_ops = &nfs41_state_renewal_ops,
|
2013-10-18 01:12:39 +07:00
|
|
|
.mig_recovery_ops = &nfs41_mig_recovery_ops,
|
2010-06-16 20:52:26 +07:00
|
|
|
};
|
|
|
|
#endif
|
|
|
|
|
2013-05-22 23:50:38 +07:00
|
|
|
#if defined(CONFIG_NFS_V4_2)
|
|
|
|
static const struct nfs4_minor_version_ops nfs_v4_2_minor_ops = {
|
|
|
|
.minor_version = 2,
|
2013-06-20 00:41:43 +07:00
|
|
|
.init_caps = NFS_CAP_READDIRPLUS
|
|
|
|
| NFS_CAP_ATOMIC_OPEN
|
|
|
|
| NFS_CAP_POSIX_LOCK
|
|
|
|
| NFS_CAP_STATEID_NFSV41
|
2014-10-23 02:53:10 +07:00
|
|
|
| NFS_CAP_ATOMIC_OPEN_V1
|
2016-10-05 02:26:41 +07:00
|
|
|
| NFS_CAP_LGOPEN
|
2014-11-26 01:18:15 +07:00
|
|
|
| NFS_CAP_ALLOCATE
|
2013-05-22 03:53:03 +07:00
|
|
|
| NFS_CAP_COPY
|
2014-11-26 01:18:16 +07:00
|
|
|
| NFS_CAP_DEALLOCATE
|
2015-06-27 22:45:46 +07:00
|
|
|
| NFS_CAP_SEEK
|
2015-09-26 01:24:35 +07:00
|
|
|
| NFS_CAP_LAYOUTSTATS
|
|
|
|
| NFS_CAP_CLONE,
|
2013-08-09 23:49:11 +07:00
|
|
|
.init_client = nfs41_init_client,
|
|
|
|
.shutdown_client = nfs41_shutdown_client,
|
2013-05-22 23:50:38 +07:00
|
|
|
.match_stateid = nfs41_match_stateid,
|
|
|
|
.find_root_sec = nfs41_find_root_sec,
|
2013-06-20 00:41:43 +07:00
|
|
|
.free_lock_state = nfs41_free_lock_state,
|
2013-08-09 23:48:27 +07:00
|
|
|
.call_sync_ops = &nfs41_call_sync_ops,
|
2016-09-23 00:38:59 +07:00
|
|
|
.test_and_free_expired = nfs41_test_and_free_expired_stateid,
|
2015-01-24 07:19:25 +07:00
|
|
|
.alloc_seqid = nfs_alloc_no_seqid,
|
2016-09-09 20:22:29 +07:00
|
|
|
.session_trunk = nfs4_test_session_trunk,
|
2013-05-22 23:50:38 +07:00
|
|
|
.reboot_recovery_ops = &nfs41_reboot_recovery_ops,
|
|
|
|
.nograce_recovery_ops = &nfs41_nograce_recovery_ops,
|
|
|
|
.state_renewal_ops = &nfs41_state_renewal_ops,
|
NFS: Fix a NULL pointer dereference of migration recovery ops for v4.2 client
---Steps to Reproduce--
<nfs-server>
# cat /etc/exports
/nfs/referal *(rw,insecure,no_subtree_check,no_root_squash,crossmnt)
/nfs/old *(ro,insecure,subtree_check,root_squash,crossmnt)
<nfs-client>
# mount -t nfs nfs-server:/nfs/ /mnt/
# ll /mnt/*/
<nfs-server>
# cat /etc/exports
/nfs/referal *(rw,insecure,no_subtree_check,no_root_squash,crossmnt,refer=/nfs/old/@nfs-server)
/nfs/old *(ro,insecure,subtree_check,root_squash,crossmnt)
# service nfs restart
<nfs-client>
# ll /mnt/*/ --->>>>> oops here
[ 5123.102925] BUG: unable to handle kernel NULL pointer dereference at (null)
[ 5123.103363] IP: [<ffffffffa03ed38b>] nfs4_proc_get_locations+0x9b/0x120 [nfsv4]
[ 5123.103752] PGD 587b9067 PUD 3cbf5067 PMD 0
[ 5123.104131] Oops: 0000 [#1]
[ 5123.104529] Modules linked in: nfsv4(OE) nfs(OE) fscache(E) nfsd(OE) xfs libcrc32c iscsi_tcp libiscsi_tcp libiscsi scsi_transport_iscsi coretemp crct10dif_pclmul crc32_pclmul crc32c_intel ghash_clmulni_intel ppdev vmw_balloon parport_pc parport i2c_piix4 shpchp auth_rpcgss nfs_acl vmw_vmci lockd grace sunrpc vmwgfx drm_kms_helper ttm drm mptspi serio_raw scsi_transport_spi e1000 mptscsih mptbase ata_generic pata_acpi [last unloaded: nfsd]
[ 5123.105887] CPU: 0 PID: 15853 Comm: ::1-manager Tainted: G OE 4.2.0-rc6+ #214
[ 5123.106358] Hardware name: VMware, Inc. VMware Virtual Platform/440BX Desktop Reference Platform, BIOS 6.00 05/20/2014
[ 5123.106860] task: ffff88007620f300 ti: ffff88005877c000 task.ti: ffff88005877c000
[ 5123.107363] RIP: 0010:[<ffffffffa03ed38b>] [<ffffffffa03ed38b>] nfs4_proc_get_locations+0x9b/0x120 [nfsv4]
[ 5123.107909] RSP: 0018:ffff88005877fdb8 EFLAGS: 00010246
[ 5123.108435] RAX: ffff880053f3bc00 RBX: ffff88006ce6c908 RCX: ffff880053a0d240
[ 5123.108968] RDX: ffffea0000e6d940 RSI: ffff8800399a0000 RDI: ffff88006ce6c908
[ 5123.109503] RBP: ffff88005877fe28 R08: ffffffff81c708a0 R09: 0000000000000000
[ 5123.110045] R10: 00000000000001a2 R11: ffff88003ba7f5c8 R12: ffff880054c55800
[ 5123.110618] R13: 0000000000000000 R14: ffff880053a0d240 R15: ffff880053a0d240
[ 5123.111169] FS: 0000000000000000(0000) GS:ffffffff81c27000(0000) knlGS:0000000000000000
[ 5123.111726] CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033
[ 5123.112286] CR2: 0000000000000000 CR3: 0000000054cac000 CR4: 00000000001406f0
[ 5123.112888] Stack:
[ 5123.113458] ffffea0000e6d940 ffff8800399a0000 00000000000167d0 0000000000000000
[ 5123.114049] 0000000000000000 0000000000000000 0000000000000000 00000000a7ec82c6
[ 5123.114662] ffff88005877fe18 ffffea0000e6d940 ffff8800399a0000 ffff880054c55800
[ 5123.115264] Call Trace:
[ 5123.115868] [<ffffffffa03fb44b>] nfs4_try_migration+0xbb/0x220 [nfsv4]
[ 5123.116487] [<ffffffffa03fcb3b>] nfs4_run_state_manager+0x4ab/0x7b0 [nfsv4]
[ 5123.117104] [<ffffffffa03fc690>] ? nfs4_do_reclaim+0x510/0x510 [nfsv4]
[ 5123.117813] [<ffffffff810a4527>] kthread+0xd7/0xf0
[ 5123.118456] [<ffffffff810a4450>] ? kthread_worker_fn+0x160/0x160
[ 5123.119108] [<ffffffff816d9cdf>] ret_from_fork+0x3f/0x70
[ 5123.119723] [<ffffffff810a4450>] ? kthread_worker_fn+0x160/0x160
[ 5123.120329] Code: 4c 8b 6a 58 74 17 eb 52 48 8d 55 a8 89 c6 4c 89 e7 e8 4a b5 ff ff 8b 45 b0 85 c0 74 1c 4c 89 f9 48 8b 55 90 48 8b 75 98 48 89 df <41> ff 55 00 3d e8 d8 ff ff 41 89 c6 74 cf 48 8b 4d c8 65 48 33
[ 5123.121643] RIP [<ffffffffa03ed38b>] nfs4_proc_get_locations+0x9b/0x120 [nfsv4]
[ 5123.122308] RSP <ffff88005877fdb8>
[ 5123.122942] CR2: 0000000000000000
Fixes: ec011fe847 ("NFS: Introduce a vector of migration recovery ops")
Cc: stable@vger.kernel.org # v3.13+
Signed-off-by: Kinglong Mee <kinglongmee@gmail.com>
Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
2015-08-15 20:52:10 +07:00
|
|
|
.mig_recovery_ops = &nfs41_mig_recovery_ops,
|
2013-05-22 23:50:38 +07:00
|
|
|
};
|
|
|
|
#endif
|
|
|
|
|
2010-06-16 20:52:26 +07:00
|
|
|
const struct nfs4_minor_version_ops *nfs_v4_minor_ops[] = {
|
|
|
|
[0] = &nfs_v4_0_minor_ops,
|
|
|
|
#if defined(CONFIG_NFS_V4_1)
|
|
|
|
[1] = &nfs_v4_1_minor_ops,
|
|
|
|
#endif
|
2013-05-22 23:50:38 +07:00
|
|
|
#if defined(CONFIG_NFS_V4_2)
|
|
|
|
[2] = &nfs_v4_2_minor_ops,
|
|
|
|
#endif
|
2010-06-16 20:52:26 +07:00
|
|
|
};
|
|
|
|
|
2016-07-25 04:10:52 +07:00
|
|
|
/*
 * listxattr handler for NFSv4 inodes.
 *
 * Calls generic_listxattr() first and then nfs4_listxattr_nfs4_label() on
 * the dentry's inode.  When @list is non-NULL the second helper is handed
 * the buffer advanced by, and @size reduced by, the first helper's result;
 * when @list is NULL both helpers see the arguments unchanged.
 *
 * Returns the sum of both helpers' results, or the first negative value
 * returned by either of them.
 */
static ssize_t nfs4_listxattr(struct dentry *dentry, char *list, size_t size)
{
	ssize_t generic_len;
	ssize_t label_len;

	generic_len = generic_listxattr(dentry, list, size);
	if (generic_len < 0)
		return generic_len;

	/* Step over the generic helper's result so the label helper continues from there. */
	if (list != NULL) {
		list += generic_len;
		size -= generic_len;
	}

	label_len = nfs4_listxattr_nfs4_label(d_inode(dentry), list, size);

	return label_len < 0 ? label_len : generic_len + label_len;
}
|
|
|
|
|
2013-08-22 02:48:42 +07:00
|
|
|
static const struct inode_operations nfs4_dir_inode_operations = {
|
2012-07-17 03:39:12 +07:00
|
|
|
.create = nfs_create,
|
|
|
|
.lookup = nfs_lookup,
|
|
|
|
.atomic_open = nfs_atomic_open,
|
|
|
|
.link = nfs_link,
|
|
|
|
.unlink = nfs_unlink,
|
|
|
|
.symlink = nfs_symlink,
|
|
|
|
.mkdir = nfs_mkdir,
|
|
|
|
.rmdir = nfs_rmdir,
|
|
|
|
.mknod = nfs_mknod,
|
|
|
|
.rename = nfs_rename,
|
|
|
|
.permission = nfs_permission,
|
|
|
|
.getattr = nfs_getattr,
|
|
|
|
.setattr = nfs_setattr,
|
2015-12-02 20:44:41 +07:00
|
|
|
.listxattr = nfs4_listxattr,
|
2012-07-17 03:39:12 +07:00
|
|
|
};
|
|
|
|
|
2007-02-12 15:55:39 +07:00
|
|
|
static const struct inode_operations nfs4_file_inode_operations = {
|
2005-06-23 00:16:22 +07:00
|
|
|
.permission = nfs_permission,
|
|
|
|
.getattr = nfs_getattr,
|
|
|
|
.setattr = nfs_setattr,
|
2015-12-02 20:44:41 +07:00
|
|
|
.listxattr = nfs4_listxattr,
|
2005-06-23 00:16:22 +07:00
|
|
|
};
|
|
|
|
|
2006-08-23 07:06:11 +07:00
|
|
|
const struct nfs_rpc_ops nfs_v4_clientops = {
|
2005-04-17 05:20:36 +07:00
|
|
|
.version = 4, /* protocol version */
|
|
|
|
.dentry_ops = &nfs4_dentry_operations,
|
|
|
|
.dir_inode_ops = &nfs4_dir_inode_operations,
|
2005-06-23 00:16:22 +07:00
|
|
|
.file_inode_ops = &nfs4_file_inode_operations,
|
nfs: when attempting to open a directory, fall back on normal lookup (try #5)
commit d953126 changed how nfs_atomic_lookup handles an -EISDIR return
from an OPEN call. Prior to that patch, that caused the client to fall
back to doing a normal lookup. When that patch went in, the code began
returning that error to userspace. The d_revalidate codepath however
never had the corresponding change, so it was still possible to end up
with a NULL ctx->state pointer after that.
That patch caused a regression. When we attempt to open a directory that
does not have a cached dentry, that open now errors out with EISDIR. If
you attempt the same open with a cached dentry, it will succeed.
Fix this by reverting the change in nfs_atomic_lookup and allowing
attempts to open directories to fall back to a normal lookup
Also, add a NFSv4-specific f_ops->open routine that just returns
-ENOTDIR. This should never be called if things are working properly,
but if it ever is, then the dprintk may help in debugging.
To facilitate this, a new file_operations field is also added to the
nfs_rpc_ops struct.
Cc: stable@kernel.org
Signed-off-by: Jeff Layton <jlayton@redhat.com>
Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
2011-11-05 00:31:21 +07:00
|
|
|
.file_ops = &nfs4_file_operations,
|
2005-04-17 05:20:36 +07:00
|
|
|
.getroot = nfs4_proc_get_root,
|
2012-04-28 00:27:45 +07:00
|
|
|
.submount = nfs4_submount,
|
2012-07-31 03:05:18 +07:00
|
|
|
.try_mount = nfs4_try_mount,
|
2005-04-17 05:20:36 +07:00
|
|
|
.getattr = nfs4_proc_getattr,
|
|
|
|
.setattr = nfs4_proc_setattr,
|
|
|
|
.lookup = nfs4_proc_lookup,
|
2017-06-29 20:34:52 +07:00
|
|
|
.lookupp = nfs4_proc_lookupp,
|
2005-04-17 05:20:36 +07:00
|
|
|
.access = nfs4_proc_access,
|
|
|
|
.readlink = nfs4_proc_readlink,
|
|
|
|
.create = nfs4_proc_create,
|
|
|
|
.remove = nfs4_proc_remove,
|
|
|
|
.unlink_setup = nfs4_proc_unlink_setup,
|
2012-03-20 01:54:41 +07:00
|
|
|
.unlink_rpc_prepare = nfs4_proc_unlink_rpc_prepare,
|
2005-04-17 05:20:36 +07:00
|
|
|
.unlink_done = nfs4_proc_unlink_done,
|
2010-09-18 04:31:57 +07:00
|
|
|
.rename_setup = nfs4_proc_rename_setup,
|
2012-03-20 01:54:42 +07:00
|
|
|
.rename_rpc_prepare = nfs4_proc_rename_rpc_prepare,
|
2010-09-18 04:31:57 +07:00
|
|
|
.rename_done = nfs4_proc_rename_done,
|
2005-04-17 05:20:36 +07:00
|
|
|
.link = nfs4_proc_link,
|
|
|
|
.symlink = nfs4_proc_symlink,
|
|
|
|
.mkdir = nfs4_proc_mkdir,
|
2018-03-21 03:43:15 +07:00
|
|
|
.rmdir = nfs4_proc_rmdir,
|
2005-04-17 05:20:36 +07:00
|
|
|
.readdir = nfs4_proc_readdir,
|
|
|
|
.mknod = nfs4_proc_mknod,
|
|
|
|
.statfs = nfs4_proc_statfs,
|
|
|
|
.fsinfo = nfs4_proc_fsinfo,
|
|
|
|
.pathconf = nfs4_proc_pathconf,
|
2006-08-23 07:06:10 +07:00
|
|
|
.set_capabilities = nfs4_server_capabilities,
|
2005-04-17 05:20:36 +07:00
|
|
|
.decode_dirent = nfs4_decode_dirent,
|
2014-05-06 20:12:31 +07:00
|
|
|
.pgio_rpc_prepare = nfs4_proc_pgio_rpc_prepare,
|
2005-04-17 05:20:36 +07:00
|
|
|
.read_setup = nfs4_proc_read_setup,
|
2006-03-21 01:44:27 +07:00
|
|
|
.read_done = nfs4_read_done,
|
2005-04-17 05:20:36 +07:00
|
|
|
.write_setup = nfs4_proc_write_setup,
|
2006-03-21 01:44:27 +07:00
|
|
|
.write_done = nfs4_write_done,
|
2005-04-17 05:20:36 +07:00
|
|
|
.commit_setup = nfs4_proc_commit_setup,
|
2012-04-21 01:47:39 +07:00
|
|
|
.commit_rpc_prepare = nfs4_proc_commit_rpc_prepare,
|
2006-03-21 01:44:27 +07:00
|
|
|
.commit_done = nfs4_commit_done,
|
2005-04-17 05:20:36 +07:00
|
|
|
.lock = nfs4_proc_lock,
|
2005-06-23 00:16:23 +07:00
|
|
|
.clear_acl_cache = nfs4_zap_acl_attr,
|
2009-03-20 02:35:50 +07:00
|
|
|
.close_context = nfs4_close_context,
|
2010-09-17 21:56:51 +07:00
|
|
|
.open_context = nfs4_atomic_open,
|
2012-06-21 02:53:43 +07:00
|
|
|
.have_delegation = nfs4_have_delegation,
|
2012-06-21 02:53:46 +07:00
|
|
|
.alloc_client = nfs4_alloc_client,
|
2011-03-01 08:34:08 +07:00
|
|
|
.init_client = nfs4_init_client,
|
2012-06-21 02:53:45 +07:00
|
|
|
.free_client = nfs4_free_client,
|
2012-07-31 03:05:19 +07:00
|
|
|
.create_server = nfs4_create_server,
|
|
|
|
.clone_server = nfs_clone_server,
|
2005-04-17 05:20:36 +07:00
|
|
|
};
|
|
|
|
|
2010-12-09 18:35:25 +07:00
|
|
|
static const struct xattr_handler nfs4_xattr_nfs4_acl_handler = {
|
2015-12-02 20:44:36 +07:00
|
|
|
.name = XATTR_NAME_NFSV4_ACL,
|
2010-12-09 18:35:25 +07:00
|
|
|
.list = nfs4_xattr_list_nfs4_acl,
|
|
|
|
.get = nfs4_xattr_get_nfs4_acl,
|
|
|
|
.set = nfs4_xattr_set_nfs4_acl,
|
|
|
|
};
|
|
|
|
|
|
|
|
const struct xattr_handler *nfs4_xattr_handlers[] = {
|
|
|
|
&nfs4_xattr_nfs4_acl_handler,
|
2013-05-22 23:50:45 +07:00
|
|
|
#ifdef CONFIG_NFS_V4_SECURITY_LABEL
|
|
|
|
&nfs4_xattr_nfs4_label_handler,
|
|
|
|
#endif
|
2010-12-09 18:35:25 +07:00
|
|
|
NULL
|
|
|
|
};
|
|
|
|
|
2005-04-17 05:20:36 +07:00
|
|
|
/*
|
|
|
|
* Local variables:
|
|
|
|
* c-basic-offset: 8
|
|
|
|
* End:
|
|
|
|
*/
|