Skip to content

Commit aeb6e6a

Browse files
committed
Merge tag 'nfs-for-5.20-1' of git://git.linux-nfs.org/projects/trondmy/linux-nfs
Pull NFS client updates from Trond Myklebust: "Highlights include: Stable fixes: - pNFS/flexfiles: Fix infinite looping when the RDMA connection errors out Bugfixes: - NFS: fix port value parsing - SUNRPC: Reinitialise the backchannel request buffers before reuse - SUNRPC: fix expiry of auth creds - NFSv4: Fix races in the legacy idmapper upcall - NFS: O_DIRECT fixes from Jeff Layton - NFSv4.1: Fix OP_SEQUENCE error handling - SUNRPC: Fix an RPC/RDMA performance regression - NFS: Fix case insensitive renames - NFSv4/pnfs: Fix a use-after-free bug in open - NFSv4.1: RECLAIM_COMPLETE must handle EACCES Features: - NFSv4.1: session trunking enhancements - NFSv4.2: READ_PLUS performance optimisations - NFS: relax the rules for rsize/wsize mount options - NFS: don't unhash dentry during unlink/rename - SUNRPC: Fail faster on bad verifier - NFS/SUNRPC: Various tracing improvements" * tag 'nfs-for-5.20-1' of git://git.linux-nfs.org/projects/trondmy/linux-nfs: (46 commits) NFS: Improve readpage/writepage tracing NFS: Improve O_DIRECT tracing NFS: Improve write error tracing NFS: don't unhash dentry during unlink/rename NFSv4/pnfs: Fix a use-after-free bug in open NFS: nfs_async_write_reschedule_io must not recurse into the writeback code SUNRPC: Don't reuse bvec on retransmission of the request SUNRPC: Reinitialise the backchannel request buffers before reuse NFSv4.1: RECLAIM_COMPLETE must handle EACCES NFSv4.1 probe offline transports for trunking on session creation SUNRPC create a function that probes only offline transports SUNRPC export xprt_iter_rewind function SUNRPC restructure rpc_clnt_setup_test_and_add_xprt NFSv4.1 remove xprt from xprt_switch if session trunking test fails SUNRPC create an rpc function that allows xprt removal from rpc_clnt SUNRPC enable back offline transports in trunking discovery SUNRPC create an iterator to list only OFFLINE xprts NFSv4.1 offline trunkable transports on DESTROY_SESSION SUNRPC add function to offline remove trunkable transports SUNRPC expose functions for offline remote xprt functionality ...
2 parents f414456 + 3fa5cbd commit aeb6e6a

37 files changed

+1032
-457
lines changed

fs/nfs/blocklayout/dev.c

Lines changed: 11 additions & 31 deletions
Original file line numberDiff line numberDiff line change
@@ -301,18 +301,14 @@ bl_validate_designator(struct pnfs_block_volume *v)
301301
}
302302
}
303303

304-
/*
305-
* Try to open the udev path for the WWN. At least on Debian the udev
306-
* by-id path will always point to the dm-multipath device if one exists.
307-
*/
308304
static struct block_device *
309-
bl_open_udev_path(struct pnfs_block_volume *v)
305+
bl_open_path(struct pnfs_block_volume *v, const char *prefix)
310306
{
311307
struct block_device *bdev;
312308
const char *devname;
313309

314-
devname = kasprintf(GFP_KERNEL, "/dev/disk/by-id/wwn-0x%*phN",
315-
v->scsi.designator_len, v->scsi.designator);
310+
devname = kasprintf(GFP_KERNEL, "/dev/disk/by-id/%s%*phN",
311+
prefix, v->scsi.designator_len, v->scsi.designator);
316312
if (!devname)
317313
return ERR_PTR(-ENOMEM);
318314

@@ -326,28 +322,6 @@ bl_open_udev_path(struct pnfs_block_volume *v)
326322
return bdev;
327323
}
328324

329-
/*
330-
* Try to open the RH/Fedora specific dm-mpath udev path for this WWN, as the
331-
* wwn- links will only point to the first discovered SCSI device there.
332-
*/
333-
static struct block_device *
334-
bl_open_dm_mpath_udev_path(struct pnfs_block_volume *v)
335-
{
336-
struct block_device *bdev;
337-
const char *devname;
338-
339-
devname = kasprintf(GFP_KERNEL,
340-
"/dev/disk/by-id/dm-uuid-mpath-%d%*phN",
341-
v->scsi.designator_type,
342-
v->scsi.designator_len, v->scsi.designator);
343-
if (!devname)
344-
return ERR_PTR(-ENOMEM);
345-
346-
bdev = blkdev_get_by_path(devname, FMODE_READ | FMODE_WRITE, NULL);
347-
kfree(devname);
348-
return bdev;
349-
}
350-
351325
static int
352326
bl_parse_scsi(struct nfs_server *server, struct pnfs_block_dev *d,
353327
struct pnfs_block_volume *volumes, int idx, gfp_t gfp_mask)
@@ -360,9 +334,15 @@ bl_parse_scsi(struct nfs_server *server, struct pnfs_block_dev *d,
360334
if (!bl_validate_designator(v))
361335
return -EINVAL;
362336

363-
bdev = bl_open_dm_mpath_udev_path(v);
337+
/*
338+
* Try to open the RH/Fedora specific dm-mpath udev path first, as the
339+
* wwn- links will only point to the first discovered SCSI device there.
340+
* On other distributions like Debian, the default SCSI by-id path will
341+
* point to the dm-multipath device if one exists.
342+
*/
343+
bdev = bl_open_path(v, "dm-uuid-mpath-0x");
364344
if (IS_ERR(bdev))
365-
bdev = bl_open_udev_path(v);
345+
bdev = bl_open_path(v, "wwn-0x");
366346
if (IS_ERR(bdev))
367347
return PTR_ERR(bdev);
368348
d->bdev = bdev;

fs/nfs/client.c

Lines changed: 7 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -708,9 +708,9 @@ static int nfs_init_server(struct nfs_server *server,
708708
}
709709

710710
if (ctx->rsize)
711-
server->rsize = nfs_block_size(ctx->rsize, NULL);
711+
server->rsize = nfs_io_size(ctx->rsize, clp->cl_proto);
712712
if (ctx->wsize)
713-
server->wsize = nfs_block_size(ctx->wsize, NULL);
713+
server->wsize = nfs_io_size(ctx->wsize, clp->cl_proto);
714714

715715
server->acregmin = ctx->acregmin * HZ;
716716
server->acregmax = ctx->acregmax * HZ;
@@ -755,18 +755,19 @@ static int nfs_init_server(struct nfs_server *server,
755755
static void nfs_server_set_fsinfo(struct nfs_server *server,
756756
struct nfs_fsinfo *fsinfo)
757757
{
758+
struct nfs_client *clp = server->nfs_client;
758759
unsigned long max_rpc_payload, raw_max_rpc_payload;
759760

760761
/* Work out a lot of parameters */
761762
if (server->rsize == 0)
762-
server->rsize = nfs_block_size(fsinfo->rtpref, NULL);
763+
server->rsize = nfs_io_size(fsinfo->rtpref, clp->cl_proto);
763764
if (server->wsize == 0)
764-
server->wsize = nfs_block_size(fsinfo->wtpref, NULL);
765+
server->wsize = nfs_io_size(fsinfo->wtpref, clp->cl_proto);
765766

766767
if (fsinfo->rtmax >= 512 && server->rsize > fsinfo->rtmax)
767-
server->rsize = nfs_block_size(fsinfo->rtmax, NULL);
768+
server->rsize = nfs_io_size(fsinfo->rtmax, clp->cl_proto);
768769
if (fsinfo->wtmax >= 512 && server->wsize > fsinfo->wtmax)
769-
server->wsize = nfs_block_size(fsinfo->wtmax, NULL);
770+
server->wsize = nfs_io_size(fsinfo->wtmax, clp->cl_proto);
770771

771772
raw_max_rpc_payload = rpc_max_payload(server->client);
772773
max_rpc_payload = nfs_block_size(raw_max_rpc_payload, NULL);

fs/nfs/dir.c

Lines changed: 60 additions & 20 deletions
Original file line numberDiff line numberDiff line change
@@ -1084,7 +1084,7 @@ static void nfs_do_filldir(struct nfs_readdir_descriptor *desc,
10841084
struct nfs_cache_array *array;
10851085
unsigned int i;
10861086

1087-
array = kmap(desc->page);
1087+
array = kmap_local_page(desc->page);
10881088
for (i = desc->cache_entry_index; i < array->size; i++) {
10891089
struct nfs_cache_array_entry *ent;
10901090

@@ -1110,7 +1110,7 @@ static void nfs_do_filldir(struct nfs_readdir_descriptor *desc,
11101110
if (array->page_is_eof)
11111111
desc->eof = !desc->eob;
11121112

1113-
kunmap(desc->page);
1113+
kunmap_local(array);
11141114
dfprintk(DIRCACHE, "NFS: nfs_do_filldir() filling ended @ cookie %llu\n",
11151115
(unsigned long long)desc->dir_cookie);
11161116
}
@@ -1739,6 +1739,10 @@ nfs_do_lookup_revalidate(struct inode *dir, struct dentry *dentry,
17391739
goto out_bad;
17401740
}
17411741

1742+
if ((flags & LOOKUP_RENAME_TARGET) && d_count(dentry) < 2 &&
1743+
nfs_server_capable(dir, NFS_CAP_CASE_INSENSITIVE))
1744+
goto out_bad;
1745+
17421746
if (nfs_verifier_is_delegated(dentry))
17431747
return nfs_lookup_revalidate_delegated(dir, dentry, inode);
17441748

@@ -1778,6 +1782,8 @@ __nfs_lookup_revalidate(struct dentry *dentry, unsigned int flags,
17781782
int ret;
17791783

17801784
if (flags & LOOKUP_RCU) {
1785+
if (dentry->d_fsdata == NFS_FSDATA_BLOCKED)
1786+
return -ECHILD;
17811787
parent = READ_ONCE(dentry->d_parent);
17821788
dir = d_inode_rcu(parent);
17831789
if (!dir)
@@ -1786,6 +1792,9 @@ __nfs_lookup_revalidate(struct dentry *dentry, unsigned int flags,
17861792
if (parent != READ_ONCE(dentry->d_parent))
17871793
return -ECHILD;
17881794
} else {
1795+
/* Wait for unlink to complete */
1796+
wait_var_event(&dentry->d_fsdata,
1797+
dentry->d_fsdata != NFS_FSDATA_BLOCKED);
17891798
parent = dget_parent(dentry);
17901799
ret = reval(d_inode(parent), dentry, flags);
17911800
dput(parent);
@@ -2454,7 +2463,6 @@ static int nfs_safe_remove(struct dentry *dentry)
24542463
int nfs_unlink(struct inode *dir, struct dentry *dentry)
24552464
{
24562465
int error;
2457-
int need_rehash = 0;
24582466

24592467
dfprintk(VFS, "NFS: unlink(%s/%lu, %pd)\n", dir->i_sb->s_id,
24602468
dir->i_ino, dentry);
@@ -2469,15 +2477,25 @@ int nfs_unlink(struct inode *dir, struct dentry *dentry)
24692477
error = nfs_sillyrename(dir, dentry);
24702478
goto out;
24712479
}
2472-
if (!d_unhashed(dentry)) {
2473-
__d_drop(dentry);
2474-
need_rehash = 1;
2475-
}
2480+
/* We must prevent any concurrent open until the unlink
2481+
* completes. ->d_revalidate will wait for ->d_fsdata
2482+
* to clear. We set it here to ensure no lookup succeeds until
2483+
* the unlink is complete on the server.
2484+
*/
2485+
error = -ETXTBSY;
2486+
if (WARN_ON(dentry->d_flags & DCACHE_NFSFS_RENAMED) ||
2487+
WARN_ON(dentry->d_fsdata == NFS_FSDATA_BLOCKED))
2488+
goto out;
2489+
if (dentry->d_fsdata)
2490+
/* old devname */
2491+
kfree(dentry->d_fsdata);
2492+
dentry->d_fsdata = NFS_FSDATA_BLOCKED;
2493+
24762494
spin_unlock(&dentry->d_lock);
24772495
error = nfs_safe_remove(dentry);
24782496
nfs_dentry_remove_handle_error(dir, dentry, error);
2479-
if (need_rehash)
2480-
d_rehash(dentry);
2497+
dentry->d_fsdata = NULL;
2498+
wake_up_var(&dentry->d_fsdata);
24812499
out:
24822500
trace_nfs_unlink_exit(dir, dentry, error);
24832501
return error;
@@ -2584,6 +2602,15 @@ nfs_link(struct dentry *old_dentry, struct inode *dir, struct dentry *dentry)
25842602
}
25852603
EXPORT_SYMBOL_GPL(nfs_link);
25862604

2605+
static void
2606+
nfs_unblock_rename(struct rpc_task *task, struct nfs_renamedata *data)
2607+
{
2608+
struct dentry *new_dentry = data->new_dentry;
2609+
2610+
new_dentry->d_fsdata = NULL;
2611+
wake_up_var(&new_dentry->d_fsdata);
2612+
}
2613+
25872614
/*
25882615
* RENAME
25892616
* FIXME: Some nfsds, like the Linux user space nfsd, may generate a
@@ -2614,8 +2641,9 @@ int nfs_rename(struct user_namespace *mnt_userns, struct inode *old_dir,
26142641
{
26152642
struct inode *old_inode = d_inode(old_dentry);
26162643
struct inode *new_inode = d_inode(new_dentry);
2617-
struct dentry *dentry = NULL, *rehash = NULL;
2644+
struct dentry *dentry = NULL;
26182645
struct rpc_task *task;
2646+
bool must_unblock = false;
26192647
int error = -EBUSY;
26202648

26212649
if (flags)
@@ -2633,18 +2661,27 @@ int nfs_rename(struct user_namespace *mnt_userns, struct inode *old_dir,
26332661
* the new target.
26342662
*/
26352663
if (new_inode && !S_ISDIR(new_inode->i_mode)) {
2636-
/*
2637-
* To prevent any new references to the target during the
2638-
* rename, we unhash the dentry in advance.
2664+
/* We must prevent any concurrent open until the unlink
2665+
* completes. ->d_revalidate will wait for ->d_fsdata
2666+
* to clear. We set it here to ensure no lookup succeeds until
2667+
* the unlink is complete on the server.
26392668
*/
2640-
if (!d_unhashed(new_dentry)) {
2641-
d_drop(new_dentry);
2642-
rehash = new_dentry;
2669+
error = -ETXTBSY;
2670+
if (WARN_ON(new_dentry->d_flags & DCACHE_NFSFS_RENAMED) ||
2671+
WARN_ON(new_dentry->d_fsdata == NFS_FSDATA_BLOCKED))
2672+
goto out;
2673+
if (new_dentry->d_fsdata) {
2674+
/* old devname */
2675+
kfree(new_dentry->d_fsdata);
2676+
new_dentry->d_fsdata = NULL;
26432677
}
26442678

2679+
spin_lock(&new_dentry->d_lock);
26452680
if (d_count(new_dentry) > 2) {
26462681
int err;
26472682

2683+
spin_unlock(&new_dentry->d_lock);
2684+
26482685
/* copy the target dentry's name */
26492686
dentry = d_alloc(new_dentry->d_parent,
26502687
&new_dentry->d_name);
@@ -2657,14 +2694,19 @@ int nfs_rename(struct user_namespace *mnt_userns, struct inode *old_dir,
26572694
goto out;
26582695

26592696
new_dentry = dentry;
2660-
rehash = NULL;
26612697
new_inode = NULL;
2698+
} else {
2699+
new_dentry->d_fsdata = NFS_FSDATA_BLOCKED;
2700+
must_unblock = true;
2701+
spin_unlock(&new_dentry->d_lock);
26622702
}
2703+
26632704
}
26642705

26652706
if (S_ISREG(old_inode->i_mode))
26662707
nfs_sync_inode(old_inode);
2667-
task = nfs_async_rename(old_dir, new_dir, old_dentry, new_dentry, NULL);
2708+
task = nfs_async_rename(old_dir, new_dir, old_dentry, new_dentry,
2709+
must_unblock ? nfs_unblock_rename : NULL);
26682710
if (IS_ERR(task)) {
26692711
error = PTR_ERR(task);
26702712
goto out;
@@ -2688,8 +2730,6 @@ int nfs_rename(struct user_namespace *mnt_userns, struct inode *old_dir,
26882730
spin_unlock(&old_inode->i_lock);
26892731
}
26902732
out:
2691-
if (rehash)
2692-
d_rehash(rehash);
26932733
trace_nfs_rename_exit(old_dir, old_dentry,
26942734
new_dir, new_dentry, error);
26952735
if (!error) {

0 commit comments

Comments
 (0)