aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
author: Rick Macklem <rmacklem@FreeBSD.org> 2021-10-13 22:48:54 +0000
committer: Rick Macklem <rmacklem@FreeBSD.org> 2021-10-27 02:33:45 +0000
commit: da6c043ff3a2b75d7d1ce56ada0c2cc817f2afe0 (patch)
tree: d54bb17568ea5fb8a7d2d5cc08a4d1a12ca77084
parent: c3c880be15a40985268f018c7828f8b98dfa93be (diff)
download: src-da6c043ff3a2b75d7d1ce56ada0c2cc817f2afe0.tar.gz
src-da6c043ff3a2b75d7d1ce56ada0c2cc817f2afe0.zip
nfscl: Make nfscl_getlayout() acquire the correct pNFS layout
Without this patch, if a pNFS read layout has already been acquired for a file, writes would be redirected to the Metadata Server (MDS), because nfscl_getlayout() would not acquire a read/write layout for the file. This happened because there was no "mode" argument to nfscl_getlayout() to indicate whether reading or writing was being done. Since doing I/O through the Metadata Server is not encouraged for some pNFS servers, it is preferable to get a read/write layout for writes instead of redirecting the write to the MDS. This patch adds an access mode argument to nfscl_getlayout() and nfsrpc_getlayout(), so that nfscl_getlayout() knows to acquire a read/write layout for writing, even if a read layout has already been acquired. This patch only affects NFSv4.1/4.2 client behaviour when pNFS ("pnfs" mount option against a server that supports pNFS) is in use. This problem was detected during a recent NFSv4 interoperability testing event held by the IETF working group. (cherry picked from commit 24af0fcdfc4983fd3cef10f9d949aca79476c2c2)
-rw-r--r-- sys/fs/nfs/nfs_var.h 2
-rw-r--r-- sys/fs/nfsclient/nfs_clrpcops.c 14
-rw-r--r-- sys/fs/nfsclient/nfs_clstate.c 7
3 files changed, 12 insertions, 11 deletions
diff --git a/sys/fs/nfs/nfs_var.h b/sys/fs/nfs/nfs_var.h
index 846ab2503981..04946d88c26b 100644
--- a/sys/fs/nfs/nfs_var.h
+++ b/sys/fs/nfs/nfs_var.h
@@ -631,7 +631,7 @@ int nfscl_layout(struct nfsmount *, vnode_t, u_int8_t *, int, nfsv4stateid_t *,
int, int, struct nfsclflayouthead *, struct nfscllayout **, struct ucred *,
NFSPROC_T *);
struct nfscllayout *nfscl_getlayout(struct nfsclclient *, uint8_t *, int,
- uint64_t, struct nfsclflayout **, int *);
+ uint64_t, uint32_t, struct nfsclflayout **, int *);
void nfscl_dserr(uint32_t, uint32_t, struct nfscldevinfo *,
struct nfscllayout *, struct nfsclds *);
void nfscl_cancelreqs(struct nfsclds *);
diff --git a/sys/fs/nfsclient/nfs_clrpcops.c b/sys/fs/nfsclient/nfs_clrpcops.c
index dbbfdb3b2976..36ee7768686f 100644
--- a/sys/fs/nfsclient/nfs_clrpcops.c
+++ b/sys/fs/nfsclient/nfs_clrpcops.c
@@ -148,7 +148,7 @@ static int nfsrpc_locku(struct nfsrv_descript *, struct nfsmount *,
static int nfsrpc_setaclrpc(vnode_t, struct ucred *, NFSPROC_T *,
struct acl *, nfsv4stateid_t *, void *);
static int nfsrpc_getlayout(struct nfsmount *, vnode_t, struct nfsfh *, int,
- uint32_t *, nfsv4stateid_t *, uint64_t, struct nfscllayout **,
+ uint32_t, uint32_t *, nfsv4stateid_t *, uint64_t, struct nfscllayout **,
struct ucred *, NFSPROC_T *);
static int nfsrpc_fillsa(struct nfsmount *, struct sockaddr_in *,
struct sockaddr_in6 *, sa_family_t, int, int, struct nfsclds **,
@@ -5438,8 +5438,8 @@ nfsmout:
*/
static int
nfsrpc_getlayout(struct nfsmount *nmp, vnode_t vp, struct nfsfh *nfhp,
- int iomode, uint32_t *notifybitsp, nfsv4stateid_t *stateidp, uint64_t off,
- struct nfscllayout **lypp, struct ucred *cred, NFSPROC_T *p)
+ int iomode, uint32_t rw, uint32_t *notifybitsp, nfsv4stateid_t *stateidp,
+ uint64_t off, struct nfscllayout **lypp, struct ucred *cred, NFSPROC_T *p)
{
struct nfscllayout *lyp;
struct nfsclflayout *flp;
@@ -5459,7 +5459,7 @@ nfsrpc_getlayout(struct nfsmount *nmp, vnode_t vp, struct nfsfh *nfhp,
* flp == NULL.
*/
lyp = nfscl_getlayout(nmp->nm_clp, nfhp->nfh_fh, nfhp->nfh_len,
- off, &flp, &recalled);
+ off, rw, &flp, &recalled);
islocked = 0;
if (lyp == NULL || flp == NULL) {
if (recalled != 0)
@@ -5790,7 +5790,7 @@ nfscl_doiods(vnode_t vp, struct uio *uiop, int *iomode, int *must_commit,
/* Search for a layout for this file. */
off = uiop->uio_offset;
layp = nfscl_getlayout(nmp->nm_clp, np->n_fhp->nfh_fh,
- np->n_fhp->nfh_len, off, &rflp, &recalled);
+ np->n_fhp->nfh_len, off, rwaccess, &rflp, &recalled);
if (layp == NULL || rflp == NULL) {
if (recalled != 0) {
NFSFREECRED(newcred);
@@ -5808,7 +5808,7 @@ nfscl_doiods(vnode_t vp, struct uio *uiop, int *iomode, int *must_commit,
else
iolaymode = NFSLAYOUTIOMODE_READ;
error = nfsrpc_getlayout(nmp, vp, np->n_fhp, iolaymode,
- NULL, &stateid, off, &layp, newcred, p);
+ rwaccess, NULL, &stateid, off, &layp, newcred, p);
if (error != 0) {
NFSLOCKNODE(np);
np->n_flag |= NNOLAYOUT;
@@ -7494,7 +7494,7 @@ nfsrpc_getopenlayout(struct nfsmount *nmp, vnode_t vp, u_int8_t *nfhp,
* on it, iff flp != NULL or a lock (exclusive lock) on it iff
* flp == NULL.
*/
- lyp = nfscl_getlayout(nmp->nm_clp, newfhp, newfhlen, 0, &flp,
+ lyp = nfscl_getlayout(nmp->nm_clp, newfhp, newfhlen, 0, mode, &flp,
&recalled);
NFSCL_DEBUG(4, "nfsrpc_getopenlayout nfscl_getlayout lyp=%p\n", lyp);
if (lyp == NULL)
diff --git a/sys/fs/nfsclient/nfs_clstate.c b/sys/fs/nfsclient/nfs_clstate.c
index 276e94002d34..248725c668d7 100644
--- a/sys/fs/nfsclient/nfs_clstate.c
+++ b/sys/fs/nfsclient/nfs_clstate.c
@@ -5143,7 +5143,8 @@ nfscl_layout(struct nfsmount *nmp, vnode_t vp, u_int8_t *fhp, int fhlen,
*/
struct nfscllayout *
nfscl_getlayout(struct nfsclclient *clp, uint8_t *fhp, int fhlen,
- uint64_t off, struct nfsclflayout **retflpp, int *recalledp)
+ uint64_t off, uint32_t rwaccess, struct nfsclflayout **retflpp,
+ int *recalledp)
{
struct nfscllayout *lyp;
mount_t mp;
@@ -5159,8 +5160,8 @@ nfscl_getlayout(struct nfsclclient *clp, uint8_t *fhp, int fhlen,
TAILQ_REMOVE(&clp->nfsc_layout, lyp, nfsly_list);
TAILQ_INSERT_HEAD(&clp->nfsc_layout, lyp, nfsly_list);
lyp->nfsly_timestamp = NFSD_MONOSEC + 120;
- error = nfscl_findlayoutforio(lyp, off,
- NFSV4OPEN_ACCESSREAD, retflpp);
+ error = nfscl_findlayoutforio(lyp, off, rwaccess,
+ retflpp);
if (error == 0)
nfsv4_getref(&lyp->nfsly_lock, NULL,
NFSCLSTATEMUTEXPTR, mp);