From: Jeff Layton <jlayton@kernel.org>
To: Chuck Lever <cel@kernel.org>, linux-nfs@vger.kernel.org
Subject: Re: [PATCH RFC] NFSD: Move callback_wq into struct nfs4_client
Date: Tue, 02 Apr 2024 06:29:39 -0400 [thread overview]
Message-ID: <c9337d1e9e955e7235280d95fb56db07a9dd0dbb.camel@kernel.org> (raw)
In-Reply-To: <171200183231.5439.7855646322906072619.stgit@klimt.1015granger.net>
On Mon, 2024-04-01 at 16:05 -0400, Chuck Lever wrote:
> From: Chuck Lever <chuck.lever@oracle.com>
>
> Commit 883820366747 ("nfsd: update workqueue creation") made the
> callback_wq single-threaded, presumably to protect modifications of
> cl_cb_client. See documenting comment for nfsd4_process_cb_update().
>
> However, cl_cb_client is per-lease. There's no other reason that all
> callback operations need to be dispatched via a single thread. The
> single threading here means all client callbacks can be blocked by a
> problem with one client.
>
> Change the NFSv4 callback client so it serializes per-lease instead
> of serializing all NFSv4 callback operations on the server.
>
> Reported-by: Dai Ngo <dai.ngo@oracle.com>
> Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
> ---
> fs/nfsd/nfs4callback.c | 37 +++++++++++++------------------------
> fs/nfsd/nfs4state.c | 14 +++++++-------
> fs/nfsd/state.h | 4 ++--
> 3 files changed, 22 insertions(+), 33 deletions(-)
>
> This has seen some light testing with a single client, and has been
> pushed to the nfsd-testing branch of:
>
> https://git.kernel.org/pub/scm/linux/kernel/git/cel/linux.git
>
>
> diff --git a/fs/nfsd/nfs4callback.c b/fs/nfsd/nfs4callback.c
> index 87c9547989f6..cf87ace7a1b0 100644
> --- a/fs/nfsd/nfs4callback.c
> +++ b/fs/nfsd/nfs4callback.c
> @@ -978,19 +978,21 @@ static int max_cb_time(struct net *net)
> return max(((u32)nn->nfsd4_lease)/10, 1u) * HZ;
> }
>
> -static struct workqueue_struct *callback_wq;
> -
> static bool nfsd4_queue_cb(struct nfsd4_callback *cb)
> {
> - trace_nfsd_cb_queue(cb->cb_clp, cb);
> - return queue_delayed_work(callback_wq, &cb->cb_work, 0);
> + struct nfs4_client *clp = cb->cb_clp;
> +
> + trace_nfsd_cb_queue(clp, cb);
> + return queue_delayed_work(clp->cl_callback_wq, &cb->cb_work, 0);
> }
>
> static void nfsd4_queue_cb_delayed(struct nfsd4_callback *cb,
> unsigned long msecs)
> {
> - trace_nfsd_cb_queue(cb->cb_clp, cb);
> - queue_delayed_work(callback_wq, &cb->cb_work,
> + struct nfs4_client *clp = cb->cb_clp;
> +
> + trace_nfsd_cb_queue(clp, cb);
> + queue_delayed_work(clp->cl_callback_wq, &cb->cb_work,
> msecs_to_jiffies(msecs));
> }
>
> @@ -1161,7 +1163,7 @@ void nfsd4_probe_callback(struct nfs4_client *clp)
> void nfsd4_probe_callback_sync(struct nfs4_client *clp)
> {
> nfsd4_probe_callback(clp);
> - flush_workqueue(callback_wq);
> + flush_workqueue(clp->cl_callback_wq);
> }
>
> void nfsd4_change_callback(struct nfs4_client *clp, struct nfs4_cb_conn *conn)
> @@ -1380,19 +1382,6 @@ static const struct rpc_call_ops nfsd4_cb_ops = {
> .rpc_release = nfsd4_cb_release,
> };
>
> -int nfsd4_create_callback_queue(void)
> -{
> - callback_wq = alloc_ordered_workqueue("nfsd4_callbacks", 0);
> - if (!callback_wq)
> - return -ENOMEM;
> - return 0;
> -}
> -
> -void nfsd4_destroy_callback_queue(void)
> -{
> - destroy_workqueue(callback_wq);
> -}
> -
> /* must be called under the state lock */
> void nfsd4_shutdown_callback(struct nfs4_client *clp)
> {
> @@ -1406,7 +1395,7 @@ void nfsd4_shutdown_callback(struct nfs4_client *clp)
> * client, destroy the rpc client, and stop:
> */
> nfsd4_run_cb(&clp->cl_cb_null);
> - flush_workqueue(callback_wq);
> + flush_workqueue(clp->cl_callback_wq);
> nfsd41_cb_inflight_wait_complete(clp);
> }
>
> @@ -1428,9 +1417,9 @@ static struct nfsd4_conn * __nfsd4_find_backchannel(struct nfs4_client *clp)
>
> /*
> * Note there isn't a lot of locking in this code; instead we depend on
> - * the fact that it is run from the callback_wq, which won't run two
> - * work items at once. So, for example, callback_wq handles all access
> - * of cl_cb_client and all calls to rpc_create or rpc_shutdown_client.
> + * the fact that it is run from clp->cl_callback_wq, which won't run two
> + * work items at once. So, for example, clp->cl_callback_wq handles all
> + * access of cl_cb_client and all calls to rpc_create or rpc_shutdown_client.
> */
> static void nfsd4_process_cb_update(struct nfsd4_callback *cb)
> {
> diff --git a/fs/nfsd/nfs4state.c b/fs/nfsd/nfs4state.c
> index 2ece3092a4e3..19e15c093f0a 100644
> --- a/fs/nfsd/nfs4state.c
> +++ b/fs/nfsd/nfs4state.c
> @@ -2233,6 +2233,10 @@ static struct nfs4_client *alloc_client(struct xdr_netobj name,
> GFP_KERNEL);
> if (!clp->cl_ownerstr_hashtbl)
> goto err_no_hashtbl;
> + clp->cl_callback_wq = alloc_ordered_workqueue("nfsd4_callbacks", 0);
> + if (!clp->cl_callback_wq)
> + goto err_no_callback_wq;
> +
> for (i = 0; i < OWNER_HASH_SIZE; i++)
> INIT_LIST_HEAD(&clp->cl_ownerstr_hashtbl[i]);
> INIT_LIST_HEAD(&clp->cl_sessions);
> @@ -2255,6 +2259,8 @@ static struct nfs4_client *alloc_client(struct xdr_netobj name,
> spin_lock_init(&clp->cl_lock);
> rpc_init_wait_queue(&clp->cl_cb_waitq, "Backchannel slot table");
> return clp;
> +err_no_callback_wq:
> + kfree(clp->cl_ownerstr_hashtbl);
> err_no_hashtbl:
> kfree(clp->cl_name.data);
> err_no_name:
> @@ -2268,6 +2274,7 @@ static void __free_client(struct kref *k)
> struct nfs4_client *clp = container_of(c, struct nfs4_client, cl_nfsdfs);
>
> free_svc_cred(&clp->cl_cred);
> + destroy_workqueue(clp->cl_callback_wq);
> kfree(clp->cl_ownerstr_hashtbl);
> kfree(clp->cl_name.data);
> kfree(clp->cl_nii_domain.data);
> @@ -8644,12 +8651,6 @@ nfs4_state_start(void)
> if (ret)
> return ret;
>
> - ret = nfsd4_create_callback_queue();
> - if (ret) {
> - rhltable_destroy(&nfs4_file_rhltable);
> - return ret;
> - }
> -
> set_max_delegations();
> return 0;
> }
> @@ -8690,7 +8691,6 @@ nfs4_state_shutdown_net(struct net *net)
> void
> nfs4_state_shutdown(void)
> {
> - nfsd4_destroy_callback_queue();
> rhltable_destroy(&nfs4_file_rhltable);
> }
>
> diff --git a/fs/nfsd/state.h b/fs/nfsd/state.h
> index 0400441c87c1..f42d8d782c84 100644
> --- a/fs/nfsd/state.h
> +++ b/fs/nfsd/state.h
> @@ -408,6 +408,8 @@ struct nfs4_client {
> 1 << NFSD4_CLIENT_CB_KILL)
> #define NFSD4_CLIENT_CB_RECALL_ANY (6)
> unsigned long cl_flags;
> +
> + struct workqueue_struct *cl_callback_wq;
> const struct cred *cl_cb_cred;
> struct rpc_clnt *cl_cb_client;
> u32 cl_cb_ident;
> @@ -735,8 +737,6 @@ extern void nfsd4_change_callback(struct nfs4_client *clp, struct nfs4_cb_conn *
> extern void nfsd4_init_cb(struct nfsd4_callback *cb, struct nfs4_client *clp,
> const struct nfsd4_callback_ops *ops, enum nfsd4_cb_op op);
> extern bool nfsd4_run_cb(struct nfsd4_callback *cb);
> -extern int nfsd4_create_callback_queue(void);
> -extern void nfsd4_destroy_callback_queue(void);
> extern void nfsd4_shutdown_callback(struct nfs4_client *);
> extern void nfsd4_shutdown_copy(struct nfs4_client *clp);
> extern struct nfs4_client_reclaim *nfs4_client_to_reclaim(struct xdr_netobj name,
>
>
>
Looks good.
Reviewed-by: Jeff Layton <jlayton@kernel.org>
prev parent reply other threads:[~2024-04-02 10:29 UTC|newest]
Thread overview: 2+ messages / expand[flat|nested] mbox.gz Atom feed top
2024-04-01 20:05 [PATCH RFC] NFSD: Move callback_wq into struct nfs4_client Chuck Lever
2024-04-02 10:29 ` Jeff Layton [this message]
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=c9337d1e9e955e7235280d95fb56db07a9dd0dbb.camel@kernel.org \
--to=jlayton@kernel.org \
--cc=cel@kernel.org \
--cc=linux-nfs@vger.kernel.org \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox; see the mirroring instructions
for how to clone and mirror all data and code used for this inbox.