From: Le Rouzic <aime.le-rouzic@bull.net>
To: nfsv4 <nfsv4@linux-nfs.org>
Cc: nfs@lists.sourceforge.net
Subject: Re: 2.6.23-rc9-CITI_NFS4_ALL-1 connectathon suite testdir error
Date: Thu, 18 Oct 2007 13:49:11 +0200 [thread overview]
Message-ID: <47174837.6090404@bull.net> (raw)
In-Reply-To: <1192575407.7554.40.camel@heimdal.trondhjem.org>
Hi,
Unfortunately not the case I was mentioning.
More on
-------------------------------------------------------------
Bug:
http://bugzilla.linux-nfs.org/show_bug.cgi?id=150

Cheers
Trond Myklebust a écrit :
>On Fri, 2007-10-12 at 16:12 +0200, Le Rouzic wrote:
> =
>
>>Hi,
>>
>>Running 2.6.23-rc9-CITI_NFS4_ALL-1 on two Intel X86_64 bi-ways machines as
>>client and server, get the following error with the runtest (-s) of the special
>>tests of the connectathon suite when running it with several other robustness
>>tests (fsx,iozone,fssbfss_stress) in the same time:
>>
>> Second check for lost reply on non-idempotent requests
>> testing 50 idempotencies in directory "testdir"
>> rmdir 1: Directory not empty
>> special tests failed
>>
>>
>>
>>-------------------------------------------------------------
>>Bug:
>> http://bugzilla.linux-nfs.org/show_bug.cgi?id=150
>>
>>Cheers
>>
>>
>
>I'm hoping that the attached patch will fix this problem. It basically
>ensures that lookup(), readdir(), and open() cannot race with the
>sillyrename code.
>
>Cheers
> Trond
> =
>
>
> ------------------------------------------------------------------------
>
> Sujet:
> No Subject
> Expéditeur:
> Trond Myklebust <Trond.Myklebust@netapp.com>
> Date:
> Mon, 15 Oct 2007 18:17:53 -0400
>
>
>lookup() and sillyrename() can race one another because the sillyrename()
>completion cannot take the parent directory's inode->i_mutex since the
>latter may be held by whoever is calling dput().
>
>We therefore have little option but to add extra locking to ensure that
>nfs_lookup() and nfs_atomic_open() do not race with the sillyrename
>completion.
>If somebody has looked up the sillyrenamed file in the meantime, we just
>transfer the sillydelete information to the new dentry.
>
>Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
>---
>
> fs/nfs/dir.c | 14 +++++-
> fs/nfs/inode.c | 3 +
> fs/nfs/nfs4proc.c | 6 +++
> fs/nfs/unlink.c | 114 ++++++++++++++++++++++++++++++++++++++++++------
> include/linux/nfs_fs.h | 8 +++
> 5 files changed, 127 insertions(+), 18 deletions(-)
>
>diff --git a/fs/nfs/dir.c b/fs/nfs/dir.c
>index 8ec7fbd..3533453 100644
>--- a/fs/nfs/dir.c
>+++ b/fs/nfs/dir.c
>@@ -562,6 +562,7 @@ static int nfs_readdir(struct file *filp, void *dirent=
, filldir_t filldir)
> nfs_fattr_init(&fattr);
> desc->entry =3D &my_entry;
> =
>+ nfs_block_sillyrename(dentry);
> while(!desc->entry->eof) {
> res =3D readdir_search_pagecache(desc);
> =
>@@ -592,6 +593,7 @@ static int nfs_readdir(struct file *filp, void *dirent=
, filldir_t filldir)
> break;
> }
> }
>+ nfs_unblock_sillyrename(dentry);
> unlock_kernel();
> if (res > 0)
> res =3D 0;
>@@ -866,6 +868,7 @@ struct dentry_operations nfs_dentry_operations =3D {
> static struct dentry *nfs_lookup(struct inode *dir, struct dentry * dentr=
y, struct nameidata *nd)
> {
> struct dentry *res;
>+ struct dentry *parent;
> struct inode *inode =3D NULL;
> int error;
> struct nfs_fh fhandle;
>@@ -894,26 +897,31 @@ static struct dentry *nfs_lookup(struct inode *dir, =
struct dentry * dentry, stru
> goto out_unlock;
> }
> =
>+ parent =3D dentry->d_parent;
>+ /* Protect against concurrent sillydeletes */
>+ nfs_block_sillyrename(parent);
> error =3D NFS_PROTO(dir)->lookup(dir, &dentry->d_name, &fhandle, &fattr);
> if (error =3D=3D -ENOENT)
> goto no_entry;
> if (error < 0) {
> res =3D ERR_PTR(error);
>- goto out_unlock;
>+ goto out_unblock_sillyrename;
> }
> inode =3D nfs_fhget(dentry->d_sb, &fhandle, &fattr);
> res =3D (struct dentry *)inode;
> if (IS_ERR(res))
>- goto out_unlock;
>+ goto out_unblock_sillyrename;
> =
> no_entry:
> res =3D d_materialise_unique(dentry, inode);
> if (res !=3D NULL) {
> if (IS_ERR(res))
>- goto out_unlock;
>+ goto out_unblock_sillyrename;
> dentry =3D res;
> }
> nfs_set_verifier(dentry, nfs_save_change_attribute(dir));
>+out_unblock_sillyrename:
>+ nfs_unblock_sillyrename(parent);
> out_unlock:
> unlock_kernel();
> out:
>diff --git a/fs/nfs/inode.c b/fs/nfs/inode.c
>index 035c769..facb065 100644
>--- a/fs/nfs/inode.c
>+++ b/fs/nfs/inode.c
>@@ -1165,6 +1165,9 @@ static void init_once(void * foo, struct kmem_cache =
* cachep, unsigned long flag
> INIT_RADIX_TREE(&nfsi->nfs_page_tree, GFP_ATOMIC);
> nfsi->ncommit =3D 0;
> nfsi->npages =3D 0;
>+ atomic_set(&nfsi->silly_count, 1);
>+ INIT_HLIST_HEAD(&nfsi->silly_list);
>+ init_waitqueue_head(&nfsi->waitqueue);
> nfs4_init_once(nfsi);
> }
> =
>diff --git a/fs/nfs/nfs4proc.c b/fs/nfs/nfs4proc.c
>index cb99fd9..2cb3b8b 100644
>--- a/fs/nfs/nfs4proc.c
>+++ b/fs/nfs/nfs4proc.c
>@@ -1372,6 +1372,7 @@ out_close:
> struct dentry *
> nfs4_atomic_open(struct inode *dir, struct dentry *dentry, struct nameida=
ta *nd)
> {
>+ struct dentry *parent;
> struct path path =3D {
> .mnt =3D nd->mnt,
> .dentry =3D dentry,
>@@ -1394,6 +1395,9 @@ nfs4_atomic_open(struct inode *dir, struct dentry *d=
entry, struct nameidata *nd)
> cred =3D rpcauth_lookupcred(NFS_CLIENT(dir)->cl_auth, 0);
> if (IS_ERR(cred))
> return (struct dentry *)cred;
>+ parent =3D dentry->d_parent;
>+ /* Protect against concurrent sillydeletes */
>+ nfs_block_sillyrename(parent);
> state =3D nfs4_do_open(dir, &path, nd->intent.open.flags, &attr, cred);
> put_rpccred(cred);
> if (IS_ERR(state)) {
>@@ -1401,12 +1405,14 @@ nfs4_atomic_open(struct inode *dir, struct dentry =
*dentry, struct nameidata *nd)
> d_add(dentry, NULL);
> nfs_set_verifier(dentry, nfs_save_change_attribute(dir));
> }
>+ nfs_unblock_sillyrename(parent);
> return (struct dentry *)state;
> }
> res =3D d_add_unique(dentry, igrab(state->inode));
> if (res !=3D NULL)
> path.dentry =3D res;
> nfs_set_verifier(path.dentry, nfs_save_change_attribute(dir));
>+ nfs_unblock_sillyrename(parent);
> nfs4_intent_set_file(nd, &path, state);
> return res;
> }
>diff --git a/fs/nfs/unlink.c b/fs/nfs/unlink.c
>index 1aed850..6ecd46c 100644
>--- a/fs/nfs/unlink.c
>+++ b/fs/nfs/unlink.c
>@@ -14,6 +14,7 @@
> =
> =
> struct nfs_unlinkdata {
>+ struct hlist_node list;
> struct nfs_removeargs args;
> struct nfs_removeres res;
> struct inode *dir;
>@@ -52,6 +53,20 @@ static int nfs_copy_dname(struct dentry *dentry, struct=
nfs_unlinkdata *data)
> return 0;
> }
> =
>+static void nfs_free_dname(struct nfs_unlinkdata *data)
>+{
>+ kfree(data->args.name.name);
>+ data->args.name.name =3D NULL;
>+ data->args.name.len =3D 0;
>+}
>+
>+static void nfs_dec_sillycount(struct inode *dir)
>+{
>+ struct nfs_inode *nfsi =3D NFS_I(dir);
>+ if (atomic_dec_return(&nfsi->silly_count) =3D=3D 1)
>+ wake_up(&nfsi->waitqueue);
>+}
>+
> /**
> * nfs_async_unlink_init - Initialize the RPC info
> * task: rpc_task of the sillydelete
>@@ -95,6 +110,8 @@ static void nfs_async_unlink_done(struct rpc_task *task=
, void *calldata)
> static void nfs_async_unlink_release(void *calldata)
> {
> struct nfs_unlinkdata *data =3D calldata;
>+
>+ nfs_dec_sillycount(data->dir);
> nfs_free_unlinkdata(data);
> }
> =
>@@ -104,33 +121,100 @@ static const struct rpc_call_ops nfs_unlink_ops =3D=
{
> .rpc_release =3D nfs_async_unlink_release,
> };
> =
>-static int nfs_call_unlink(struct dentry *dentry, struct nfs_unlinkdata *=
data)
>+static int nfs_do_call_unlink(struct dentry *parent, struct inode *dir, s=
truct nfs_unlinkdata *data)
> {
> struct rpc_task *task;
>+ struct dentry *alias;
>+
>+ alias =3D d_lookup(parent, &data->args.name);
>+ if (alias !=3D NULL) {
>+ int ret =3D 0;
>+ /*
>+ * Hey, we raced with lookup... See if we need to transfer
>+ * the sillyrename information to the aliased dentry.
>+ */
>+ nfs_free_dname(data);
>+ spin_lock(&alias->d_lock);
>+ if (!(alias->d_flags & DCACHE_NFSFS_RENAMED)) {
>+ alias->d_fsdata =3D data;
>+ alias->d_flags ^=3D DCACHE_NFSFS_RENAMED;
>+ ret =3D 1;
>+ }
>+ spin_unlock(&alias->d_lock);
>+ nfs_dec_sillycount(dir);
>+ dput(alias);
>+ return ret;
>+ }
>+ data->dir =3D igrab(dir);
>+ if (!data->dir) {
>+ nfs_dec_sillycount(dir);
>+ return 0;
>+ }
>+ data->args.fh =3D NFS_FH(dir);
>+ nfs_fattr_init(&data->res.dir_attr);
>+
>+ task =3D rpc_run_task(NFS_CLIENT(dir), RPC_TASK_ASYNC, &nfs_unlink_ops, =
data);
>+ if (!IS_ERR(task))
>+ rpc_put_task(task);
>+ return 1;
>+}
>+
>+static int nfs_call_unlink(struct dentry *dentry, struct nfs_unlinkdata *=
data)
>+{
> struct dentry *parent;
> struct inode *dir;
>+ int ret =3D 0;
> =
>- if (nfs_copy_dname(dentry, data) < 0)
>- goto out_free;
> =
> parent =3D dget_parent(dentry);
> if (parent =3D=3D NULL)
> goto out_free;
>- dir =3D igrab(parent->d_inode);
>+ dir =3D parent->d_inode;
>+ if (nfs_copy_dname(dentry, data) =3D=3D 0)
>+ goto out_dput;
>+ /* Non-exclusive lock protects against concurrent lookup() calls */
>+ spin_lock(&dir->i_lock);
>+ if (atomic_inc_not_zero(&NFS_I(dir)->silly_count) =3D=3D 0) {
>+ /* Deferred delete */
>+ hlist_add_head(&data->list, &NFS_I(dir)->silly_list);
>+ spin_unlock(&dir->i_lock);
>+ ret =3D 1;
>+ goto out_dput;
>+ }
>+ spin_unlock(&dir->i_lock);
>+ ret =3D nfs_do_call_unlink(parent, dir, data);
>+out_dput:
> dput(parent);
>- if (dir =3D=3D NULL)
>- goto out_free;
>+out_free:
>+ return ret;
>+}
> =
>- data->dir =3D dir;
>- data->args.fh =3D NFS_FH(dir);
>- nfs_fattr_init(&data->res.dir_attr);
>+void nfs_block_sillyrename(struct dentry *dentry)
>+{
>+ struct nfs_inode *nfsi =3D NFS_I(dentry->d_inode);
> =
>- task =3D rpc_run_task(NFS_CLIENT(dir), RPC_TASK_ASYNC, &nfs_unlink_ops, =
data);
>- if (!IS_ERR(task))
>- rpc_put_task(task);
>- return 1;
>-out_free:
>- return 0;
>+ wait_event(nfsi->waitqueue, atomic_cmpxchg(&nfsi->silly_count, 1, 0) =3D=
=3D 1);
>+}
>+
>+void nfs_unblock_sillyrename(struct dentry *dentry)
>+{
>+ struct inode *dir =3D dentry->d_inode;
>+ struct nfs_inode *nfsi =3D NFS_I(dir);
>+ struct nfs_unlinkdata *data;
>+
>+ atomic_inc(&nfsi->silly_count);
>+ spin_lock(&dir->i_lock);
>+ while (!hlist_empty(&nfsi->silly_list)) {
>+ if (!atomic_inc_not_zero(&nfsi->silly_count))
>+ break;
>+ data =3D hlist_entry(nfsi->silly_list.first, struct nfs_unlinkdata, lis=
t);
>+ hlist_del(&data->list);
>+ spin_unlock(&dir->i_lock);
>+ if (nfs_do_call_unlink(dentry, dir, data) =3D=3D 0)
>+ nfs_free_unlinkdata(data);
>+ spin_lock(&dir->i_lock);
>+ }
>+ spin_unlock(&dir->i_lock);
> }
> =
> /**
>diff --git a/include/linux/nfs_fs.h b/include/linux/nfs_fs.h
>index c5164c2..e82a6eb 100644
>--- a/include/linux/nfs_fs.h
>+++ b/include/linux/nfs_fs.h
>@@ -160,6 +160,12 @@ struct nfs_inode {
> /* Open contexts for shared mmap writes */
> struct list_head open_files;
> =
>+ /* Number of in-flight sillydelete RPC calls */
>+ atomic_t silly_count;
>+ /* List of deferred sillydelete requests */
>+ struct hlist_head silly_list;
>+ wait_queue_head_t waitqueue;
>+
> #ifdef CONFIG_NFS_V4
> struct nfs4_cached_acl *nfs4_acl;
> /* NFSv4 state */
>@@ -394,6 +400,8 @@ extern void nfs_release_automount_timer(void);
> */
> extern int nfs_async_unlink(struct inode *dir, struct dentry *dentry);
> extern void nfs_complete_unlink(struct dentry *dentry, struct inode *);
>+extern void nfs_block_sillyrename(struct dentry *dentry);
>+extern void nfs_unblock_sillyrename(struct dentry *dentry);
> =
> /*
> * linux/fs/nfs/write.c
> =
>
-- =
-----------------------------------------------------------------
Company : Bull, Architect of an Open World TM (www.bull.com)
Name : Aime Le Rouzic
Mail : Bull - BP 208 - 38432 Echirolles Cedex - France
E-Mail : aime.le-rouzic@bull.net
Phone : 33 (4) 76.29.75.51
Fax : 33 (4) 76.29.75.18
-----------------------------------------------------------------
next prev parent reply other threads:[~2007-10-18 11:49 UTC|newest]
Thread overview: 4+ messages / expand[flat|nested] mbox.gz Atom feed top
2007-10-12 14:12 2.6.23-rc9-CITI_NFS4_ALL-1 connectathon suite testdir error Le Rouzic
2007-10-16 22:56 ` Trond Myklebust
2007-10-18 11:49 ` Le Rouzic [this message]
2007-10-23 10:58 ` Le Rouzic
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=47174837.6090404@bull.net \
--to=aime.le-rouzic@bull.net \
--cc=nfs@lists.sourceforge.net \
--cc=nfsv4@linux-nfs.org \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox