From: Le Rouzic <aime.le-rouzic@bull.net>
To: nfsv4 <nfsv4@linux-nfs.org>
Cc: nfs@lists.sourceforge.net
Subject: Re: 2.6.23-rc9-CITI_NFS4_ALL-1 connectathon suite testdir error
Date: Tue, 23 Oct 2007 12:58:05 +0200 [thread overview]
Message-ID: <471DD3BD.2070906@bull.net> (raw)
In-Reply-To: <47174837.6090404@bull.net>
Hi,
It is fixed now thanks to a second patch delivered by Trond.
You will find this second patch at :
Bug: =
http://bugzilla.linux-nfs.org/show_bug.cgi?id=3D150 =
=
Regards
Le Rouzic a =E9crit :
>Hi,
>
>Unfortunately not the case I was mentioning.
>More on
>
>------------------------------------------------------------- =
>Bug: =
> http://bugzilla.linux-nfs.org/show_bug.cgi?id=3D150 =
> =
>
>
>Cheers
>
>
>
>Trond Myklebust a =E9crit :
>
> =
>
>>On Fri, 2007-10-12 at 16:12 +0200, Le Rouzic wrote:
>> =
>>
>> =
>>
>>>Hi,
>>>
>>>Running 2.6.23-rc9-CITI_NFS4_ALL-1 on two Intel X86_64 bi-ways machines =
as
>>>client and server, get the following error with the runtest (-s) of the =
special
>>>tests of the connectathon suite when running it with several other robus=
tness
>>>tests (fsx,iozone,fssbfss_stress) in the same time:
>>>
>>>Second check for lost reply on non-idempotent requests
>>>testing 50 idempotencies in directory "testdir"
>>>rmdir 1: Directory not empty
>>>special tests failed
>>>
>>>
>>>
>>>------------------------------------------------------------- =
>>>Bug: =
>>> http://bugzilla.linux-nfs.org/show_bug.cgi?id=3D150 =
>>> =
>>>Cheers
>>> =
>>>
>>> =
>>>
>>I'm hoping that the attached patch will fix this problem. It basically
>>ensures that lookup(), readdir(), and open() cannot race with the
>>sillyrename code.
>>
>>Cheers
>> Trond
>> =
>>
>>
>>------------------------------------------------------------------------
>>
>>Sujet:
>>No Subject
>>Exp=E9diteur:
>>Trond Myklebust <Trond.Myklebust@netapp.com>
>>Date:
>>Mon, 15 Oct 2007 18:17:53 -0400
>>
>>
>>lookup() and sillyrename() can race one another because the sillyrename()
>>completion cannot take the parent directory's inode->i_mutex since the
>>latter may be held by whoever is calling dput().
>>
>>We therefore have little option but to add extra locking to ensure that
>>nfs_lookup() and nfs_atomic_open() do not race with the sillyrename
>>completion.
>>If somebody has looked up the sillyrenamed file in the meantime, we just
>>transfer the sillydelete information to the new dentry.
>>
>>Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
>>---
>>
>>fs/nfs/dir.c | 14 +++++-
>>fs/nfs/inode.c | 3 +
>>fs/nfs/nfs4proc.c | 6 +++
>>fs/nfs/unlink.c | 114 ++++++++++++++++++++++++++++++++++++++++++-=
-----
>>include/linux/nfs_fs.h | 8 +++
>>5 files changed, 127 insertions(+), 18 deletions(-)
>>
>>diff --git a/fs/nfs/dir.c b/fs/nfs/dir.c
>>index 8ec7fbd..3533453 100644
>>--- a/fs/nfs/dir.c
>>+++ b/fs/nfs/dir.c
>>@@ -562,6 +562,7 @@ static int nfs_readdir(struct file *filp, void *diren=
t, filldir_t filldir)
>> nfs_fattr_init(&fattr);
>> desc->entry =3D &my_entry;
>>
>>+ nfs_block_sillyrename(dentry);
>> while(!desc->entry->eof) {
>> res =3D readdir_search_pagecache(desc);
>>
>>@@ -592,6 +593,7 @@ static int nfs_readdir(struct file *filp, void *diren=
t, filldir_t filldir)
>> break;
>> }
>> }
>>+ nfs_unblock_sillyrename(dentry);
>> unlock_kernel();
>> if (res > 0)
>> res =3D 0;
>>@@ -866,6 +868,7 @@ struct dentry_operations nfs_dentry_operations =3D {
>>static struct dentry *nfs_lookup(struct inode *dir, struct dentry * dentr=
y, struct nameidata *nd)
>>{
>> struct dentry *res;
>>+ struct dentry *parent;
>> struct inode *inode =3D NULL;
>> int error;
>> struct nfs_fh fhandle;
>>@@ -894,26 +897,31 @@ static struct dentry *nfs_lookup(struct inode *dir,=
struct dentry * dentry, stru
>> goto out_unlock;
>> }
>>
>>+ parent =3D dentry->d_parent;
>>+ /* Protect against concurrent sillydeletes */
>>+ nfs_block_sillyrename(parent);
>> error =3D NFS_PROTO(dir)->lookup(dir, &dentry->d_name, &fhandle, &fattr);
>> if (error =3D=3D -ENOENT)
>> goto no_entry;
>> if (error < 0) {
>> res =3D ERR_PTR(error);
>>- goto out_unlock;
>>+ goto out_unblock_sillyrename;
>> }
>> inode =3D nfs_fhget(dentry->d_sb, &fhandle, &fattr);
>> res =3D (struct dentry *)inode;
>> if (IS_ERR(res))
>>- goto out_unlock;
>>+ goto out_unblock_sillyrename;
>>
>>no_entry:
>> res =3D d_materialise_unique(dentry, inode);
>> if (res !=3D NULL) {
>> if (IS_ERR(res))
>>- goto out_unlock;
>>+ goto out_unblock_sillyrename;
>> dentry =3D res;
>> }
>> nfs_set_verifier(dentry, nfs_save_change_attribute(dir));
>>+out_unblock_sillyrename:
>>+ nfs_unblock_sillyrename(parent);
>>out_unlock:
>> unlock_kernel();
>>out:
>>diff --git a/fs/nfs/inode.c b/fs/nfs/inode.c
>>index 035c769..facb065 100644
>>--- a/fs/nfs/inode.c
>>+++ b/fs/nfs/inode.c
>>@@ -1165,6 +1165,9 @@ static void init_once(void * foo, struct kmem_cache=
* cachep, unsigned long flag
>> INIT_RADIX_TREE(&nfsi->nfs_page_tree, GFP_ATOMIC);
>> nfsi->ncommit =3D 0;
>> nfsi->npages =3D 0;
>>+ atomic_set(&nfsi->silly_count, 1);
>>+ INIT_HLIST_HEAD(&nfsi->silly_list);
>>+ init_waitqueue_head(&nfsi->waitqueue);
>> nfs4_init_once(nfsi);
>>}
>>
>>diff --git a/fs/nfs/nfs4proc.c b/fs/nfs/nfs4proc.c
>>index cb99fd9..2cb3b8b 100644
>>--- a/fs/nfs/nfs4proc.c
>>+++ b/fs/nfs/nfs4proc.c
>>@@ -1372,6 +1372,7 @@ out_close:
>>struct dentry *
>>nfs4_atomic_open(struct inode *dir, struct dentry *dentry, struct nameida=
ta *nd)
>>{
>>+ struct dentry *parent;
>> struct path path =3D {
>> .mnt =3D nd->mnt,
>> .dentry =3D dentry,
>>@@ -1394,6 +1395,9 @@ nfs4_atomic_open(struct inode *dir, struct dentry *=
dentry, struct nameidata *nd)
>> cred =3D rpcauth_lookupcred(NFS_CLIENT(dir)->cl_auth, 0);
>> if (IS_ERR(cred))
>> return (struct dentry *)cred;
>>+ parent =3D dentry->d_parent;
>>+ /* Protect against concurrent sillydeletes */
>>+ nfs_block_sillyrename(parent);
>> state =3D nfs4_do_open(dir, &path, nd->intent.open.flags, &attr, cred);
>> put_rpccred(cred);
>> if (IS_ERR(state)) {
>>@@ -1401,12 +1405,14 @@ nfs4_atomic_open(struct inode *dir, struct dentry=
*dentry, struct nameidata *nd)
>> d_add(dentry, NULL);
>> nfs_set_verifier(dentry, nfs_save_change_attribute(dir));
>> }
>>+ nfs_unblock_sillyrename(parent);
>> return (struct dentry *)state;
>> }
>> res =3D d_add_unique(dentry, igrab(state->inode));
>> if (res !=3D NULL)
>> path.dentry =3D res;
>> nfs_set_verifier(path.dentry, nfs_save_change_attribute(dir));
>>+ nfs_unblock_sillyrename(parent);
>> nfs4_intent_set_file(nd, &path, state);
>> return res;
>>}
>>diff --git a/fs/nfs/unlink.c b/fs/nfs/unlink.c
>>index 1aed850..6ecd46c 100644
>>--- a/fs/nfs/unlink.c
>>+++ b/fs/nfs/unlink.c
>>@@ -14,6 +14,7 @@
>>
>>
>>struct nfs_unlinkdata {
>>+ struct hlist_node list;
>> struct nfs_removeargs args;
>> struct nfs_removeres res;
>> struct inode *dir;
>>@@ -52,6 +53,20 @@ static int nfs_copy_dname(struct dentry *dentry, struc=
t nfs_unlinkdata *data)
>> return 0;
>>}
>>
>>+static void nfs_free_dname(struct nfs_unlinkdata *data)
>>+{
>>+ kfree(data->args.name.name);
>>+ data->args.name.name =3D NULL;
>>+ data->args.name.len =3D 0;
>>+}
>>+
>>+static void nfs_dec_sillycount(struct inode *dir)
>>+{
>>+ struct nfs_inode *nfsi =3D NFS_I(dir);
>>+ if (atomic_dec_return(&nfsi->silly_count) =3D=3D 1)
>>+ wake_up(&nfsi->waitqueue);
>>+}
>>+
>>/**
>> * nfs_async_unlink_init - Initialize the RPC info
>> * task: rpc_task of the sillydelete
>>@@ -95,6 +110,8 @@ static void nfs_async_unlink_done(struct rpc_task *tas=
k, void *calldata)
>>static void nfs_async_unlink_release(void *calldata)
>>{
>> struct nfs_unlinkdata *data =3D calldata;
>>+
>>+ nfs_dec_sillycount(data->dir);
>> nfs_free_unlinkdata(data);
>>}
>>
>>@@ -104,33 +121,100 @@ static const struct rpc_call_ops nfs_unlink_ops =
=3D {
>> .rpc_release =3D nfs_async_unlink_release,
>>};
>>
>>-static int nfs_call_unlink(struct dentry *dentry, struct nfs_unlinkdata =
*data)
>>+static int nfs_do_call_unlink(struct dentry *parent, struct inode *dir, =
struct nfs_unlinkdata *data)
>>{
>> struct rpc_task *task;
>>+ struct dentry *alias;
>>+
>>+ alias =3D d_lookup(parent, &data->args.name);
>>+ if (alias !=3D NULL) {
>>+ int ret =3D 0;
>>+ /*
>>+ * Hey, we raced with lookup... See if we need to transfer
>>+ * the sillyrename information to the aliased dentry.
>>+ */
>>+ nfs_free_dname(data);
>>+ spin_lock(&alias->d_lock);
>>+ if (!(alias->d_flags & DCACHE_NFSFS_RENAMED)) {
>>+ alias->d_fsdata =3D data;
>>+ alias->d_flags ^=3D DCACHE_NFSFS_RENAMED;
>>+ ret =3D 1;
>>+ }
>>+ spin_unlock(&alias->d_lock);
>>+ nfs_dec_sillycount(dir);
>>+ dput(alias);
>>+ return ret;
>>+ }
>>+ data->dir =3D igrab(dir);
>>+ if (!data->dir) {
>>+ nfs_dec_sillycount(dir);
>>+ return 0;
>>+ }
>>+ data->args.fh =3D NFS_FH(dir);
>>+ nfs_fattr_init(&data->res.dir_attr);
>>+
>>+ task =3D rpc_run_task(NFS_CLIENT(dir), RPC_TASK_ASYNC, &nfs_unlink_ops,=
data);
>>+ if (!IS_ERR(task))
>>+ rpc_put_task(task);
>>+ return 1;
>>+}
>>+
>>+static int nfs_call_unlink(struct dentry *dentry, struct nfs_unlinkdata =
*data)
>>+{
>> struct dentry *parent;
>> struct inode *dir;
>>+ int ret =3D 0;
>>
>>- if (nfs_copy_dname(dentry, data) < 0)
>>- goto out_free;
>>
>> parent =3D dget_parent(dentry);
>> if (parent =3D=3D NULL)
>> goto out_free;
>>- dir =3D igrab(parent->d_inode);
>>+ dir =3D parent->d_inode;
>>+ if (nfs_copy_dname(dentry, data) =3D=3D 0)
>>+ goto out_dput;
>>+ /* Non-exclusive lock protects against concurrent lookup() calls */
>>+ spin_lock(&dir->i_lock);
>>+ if (atomic_inc_not_zero(&NFS_I(dir)->silly_count) =3D=3D 0) {
>>+ /* Deferred delete */
>>+ hlist_add_head(&data->list, &NFS_I(dir)->silly_list);
>>+ spin_unlock(&dir->i_lock);
>>+ ret =3D 1;
>>+ goto out_dput;
>>+ }
>>+ spin_unlock(&dir->i_lock);
>>+ ret =3D nfs_do_call_unlink(parent, dir, data);
>>+out_dput:
>> dput(parent);
>>- if (dir =3D=3D NULL)
>>- goto out_free;
>>+out_free:
>>+ return ret;
>>+}
>>
>>- data->dir =3D dir;
>>- data->args.fh =3D NFS_FH(dir);
>>- nfs_fattr_init(&data->res.dir_attr);
>>+void nfs_block_sillyrename(struct dentry *dentry)
>>+{
>>+ struct nfs_inode *nfsi =3D NFS_I(dentry->d_inode);
>>
>>- task =3D rpc_run_task(NFS_CLIENT(dir), RPC_TASK_ASYNC, &nfs_unlink_ops,=
data);
>>- if (!IS_ERR(task))
>>- rpc_put_task(task);
>>- return 1;
>>-out_free:
>>- return 0;
>>+ wait_event(nfsi->waitqueue, atomic_cmpxchg(&nfsi->silly_count, 1, 0) =
=3D=3D 1);
>>+}
>>+
>>+void nfs_unblock_sillyrename(struct dentry *dentry)
>>+{
>>+ struct inode *dir =3D dentry->d_inode;
>>+ struct nfs_inode *nfsi =3D NFS_I(dir);
>>+ struct nfs_unlinkdata *data;
>>+
>>+ atomic_inc(&nfsi->silly_count);
>>+ spin_lock(&dir->i_lock);
>>+ while (!hlist_empty(&nfsi->silly_list)) {
>>+ if (!atomic_inc_not_zero(&nfsi->silly_count))
>>+ break;
>>+ data =3D hlist_entry(nfsi->silly_list.first, struct nfs_unlinkdata, li=
st);
>>+ hlist_del(&data->list);
>>+ spin_unlock(&dir->i_lock);
>>+ if (nfs_do_call_unlink(dentry, dir, data) =3D=3D 0)
>>+ nfs_free_unlinkdata(data);
>>+ spin_lock(&dir->i_lock);
>>+ }
>>+ spin_unlock(&dir->i_lock);
>>}
>>
>>/**
>>diff --git a/include/linux/nfs_fs.h b/include/linux/nfs_fs.h
>>index c5164c2..e82a6eb 100644
>>--- a/include/linux/nfs_fs.h
>>+++ b/include/linux/nfs_fs.h
>>@@ -160,6 +160,12 @@ struct nfs_inode {
>> /* Open contexts for shared mmap writes */
>> struct list_head open_files;
>>
>>+ /* Number of in-flight sillydelete RPC calls */
>>+ atomic_t silly_count;
>>+ /* List of deferred sillydelete requests */
>>+ struct hlist_head silly_list;
>>+ wait_queue_head_t waitqueue;
>>+
>>#ifdef CONFIG_NFS_V4
>> struct nfs4_cached_acl *nfs4_acl;
>> /* NFSv4 state */
>>@@ -394,6 +400,8 @@ extern void nfs_release_automount_timer(void);
>> */
>>extern int nfs_async_unlink(struct inode *dir, struct dentry *dentry);
>>extern void nfs_complete_unlink(struct dentry *dentry, struct inode *);
>>+extern void nfs_block_sillyrename(struct dentry *dentry);
>>+extern void nfs_unblock_sillyrename(struct dentry *dentry);
>>
>>/*
>> * linux/fs/nfs/write.c
>> =
>>
>> =
>>
>
>
> =
>
-- =
-----------------------------------------------------------------
Company : Bull, Architect of an Open World TM (www.bull.com)
Name : Aime Le Rouzic =
Mail : Bull - BP 208 - 38432 Echirolles Cedex - France
E-Mail : aime.le-rouzic@bull.net
Phone : 33 (4) 76.29.75.51
Fax : 33 (4) 76.29.75.18
----------------------------------------------------------------- =
prev parent reply other threads:[~2007-10-23 10:58 UTC|newest]
Thread overview: 4+ messages / expand[flat|nested] mbox.gz Atom feed top
2007-10-12 14:12 2.6.23-rc9-CITI_NFS4_ALL-1 connectathon suite testdir error Le Rouzic
2007-10-16 22:56 ` Trond Myklebust
2007-10-18 11:49 ` Le Rouzic
2007-10-23 10:58 ` Le Rouzic [this message]
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=471DD3BD.2070906@bull.net \
--to=aime.le-rouzic@bull.net \
--cc=nfs@lists.sourceforge.net \
--cc=nfsv4@linux-nfs.org \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox