From: James Simmons <jsimmons@infradead.org>
To: Andreas Dilger <adilger@whamcloud.com>,
Oleg Drokin <green@whamcloud.com>, NeilBrown <neilb@suse.de>
Cc: Lustre Development List <lustre-devel@lists.lustre.org>
Subject: [lustre-devel] [PATCH 39/42] lustre: llite: revert: "llite: clear stale page's uptodate bit"
Date: Mon, 23 Jan 2023 18:00:52 -0500 [thread overview]
Message-ID: <1674514855-15399-40-git-send-email-jsimmons@infradead.org> (raw)
In-Reply-To: <1674514855-15399-1-git-send-email-jsimmons@infradead.org>
From: Bobi Jam <bobijam@whamcloud.com>
This reverts commit 23c4c1c09cfebccea37a88a27f122646168cbad4,
which caused a race between cl_page_own() and ll_releasepage()
and an assertion failure in cl_pagevec_put().
WC-bug-id: https://jira.whamcloud.com/browse/LU-16160
Lustre-commit: 84c9618190f9e3a52 ("LU-16160 revert: "llite: clear stale page's uptodate bit"")
Signed-off-by: Bobi Jam <bobijam@whamcloud.com>
Reviewed-on: https://review.whamcloud.com/c/fs/lustre-release/+/49541
Reviewed-by: Oleg Drokin <green@whamcloud.com>
Reviewed-by: Andreas Dilger <adilger@whamcloud.com>
Reviewed-by: Qian Yingjin <qian@ddn.com>
Signed-off-by: James Simmons <jsimmons@infradead.org>
---
fs/lustre/include/cl_object.h | 15 +---
fs/lustre/llite/rw.c | 10 +--
fs/lustre/llite/vvp_io.c | 124 +++-------------------------------
fs/lustre/llite/vvp_page.c | 5 --
fs/lustre/obdclass/cl_page.c | 37 +++-------
5 files changed, 19 insertions(+), 172 deletions(-)
diff --git a/fs/lustre/include/cl_object.h b/fs/lustre/include/cl_object.h
index 8be58ffb9f34..41ce0b02e00e 100644
--- a/fs/lustre/include/cl_object.h
+++ b/fs/lustre/include/cl_object.h
@@ -768,15 +768,7 @@ struct cl_page {
enum cl_page_type cp_type:CP_TYPE_BITS;
unsigned int cp_defer_uptodate:1,
cp_ra_updated:1,
- cp_ra_used:1,
- /* fault page read grab extra referece */
- cp_fault_ref:1,
- /**
- * if fault page got delete before returned to
- * filemap_fault(), defer the vmpage detach/put
- * until filemap_fault() has been handled.
- */
- cp_defer_detach:1;
+ cp_ra_used:1;
/* which slab kmem index this memory allocated from */
short int cp_kmem_index;
@@ -2401,11 +2393,6 @@ int cl_io_lru_reserve(const struct lu_env *env, struct cl_io *io,
int cl_io_read_ahead(const struct lu_env *env, struct cl_io *io,
pgoff_t start, struct cl_read_ahead *ra);
-static inline int cl_io_is_pagefault(const struct cl_io *io)
-{
- return io->ci_type == CIT_FAULT && !io->u.ci_fault.ft_mkwrite;
-}
-
/**
* True, if @io is an O_APPEND write(2).
*/
diff --git a/fs/lustre/llite/rw.c b/fs/lustre/llite/rw.c
index 0283af422712..2290b3112380 100644
--- a/fs/lustre/llite/rw.c
+++ b/fs/lustre/llite/rw.c
@@ -1947,15 +1947,7 @@ int ll_readpage(struct file *file, struct page *vmpage)
unlock_page(vmpage);
result = 0;
}
- if (cl_io_is_pagefault(io) && result == 0) {
- /**
- * page fault, retain the cl_page reference until
- * vvp_io_kernel_fault() release it.
- */
- page->cp_fault_ref = 1;
- } else {
- cl_page_put(env, page);
- }
+ cl_page_put(env, page);
} else {
unlock_page(vmpage);
result = PTR_ERR(page);
diff --git a/fs/lustre/llite/vvp_io.c b/fs/lustre/llite/vvp_io.c
index 317704172080..eacb35b500e5 100644
--- a/fs/lustre/llite/vvp_io.c
+++ b/fs/lustre/llite/vvp_io.c
@@ -1302,41 +1302,14 @@ static void vvp_io_rw_end(const struct lu_env *env,
trunc_sem_up_read(&lli->lli_trunc_sem);
}
-static void detach_and_deref_page(struct cl_page *clp, struct page *vmpage)
-{
- if (!clp->cp_defer_detach)
- return;
-
- /**
- * cl_page_delete0() took a vmpage reference, but not unlink the vmpage
- * from its cl_page.
- */
- clp->cp_defer_detach = 0;
- ClearPagePrivate(vmpage);
- vmpage->private = 0;
-
- put_page(vmpage);
- refcount_dec(&clp->cp_ref);
-}
-
-static int vvp_io_kernel_fault(const struct lu_env *env,
- struct vvp_fault_io *cfio)
+static int vvp_io_kernel_fault(struct vvp_fault_io *cfio)
{
struct vm_fault *vmf = cfio->ft_vmf;
- struct file *vmff = cfio->ft_vma->vm_file;
- struct address_space *mapping = vmff->f_mapping;
- struct inode *inode = mapping->host;
- struct page *vmpage = NULL;
- struct cl_page *clp = NULL;
- int rc = 0;
- ll_inode_size_lock(inode);
-retry:
cfio->ft_flags = filemap_fault(vmf);
cfio->ft_flags_valid = 1;
if (vmf->page) {
- /* success, vmpage is locked */
CDEBUG(D_PAGE,
"page %p map %p index %lu flags %lx count %u priv %0lx: got addr %p type NOPAGE\n",
vmf->page, vmf->page->mapping, vmf->page->index,
@@ -1348,105 +1321,24 @@ static int vvp_io_kernel_fault(const struct lu_env *env,
}
cfio->ft_vmpage = vmf->page;
-
- /**
- * ll_filemap_fault()->ll_readpage() could get an extra cl_page
- * reference. So we have to get the cl_page's to check its
- * cp_fault_ref and drop the reference later.
- */
- clp = cl_vmpage_page(vmf->page, NULL);
-
- goto unlock;
- }
-
- /* filemap_fault() fails, vmpage is not locked */
- if (!clp) {
- vmpage = find_get_page(mapping, vmf->pgoff);
- if (vmpage) {
- lock_page(vmpage);
- clp = cl_vmpage_page(vmpage, NULL);
- unlock_page(vmpage);
- }
+ return 0;
}
if (cfio->ft_flags & (VM_FAULT_SIGBUS | VM_FAULT_SIGSEGV)) {
- pgoff_t max_idx;
-
- /**
- * ll_filemap_fault()->ll_readpage() could fill vmpage
- * correctly, and unlock the vmpage, while memory pressure or
- * truncate could detach cl_page from vmpage, and kernel
- * filemap_fault() will wait_on_page_locked(vmpage) and find
- * out that the vmpage has been cleared its uptodate bit,
- * so it returns VM_FAULT_SIGBUS.
- *
- * In this case, we'd retry the filemap_fault()->ll_readpage()
- * to rebuild the cl_page and fill vmpage with uptodated data.
- */
- if (likely(vmpage)) {
- bool need_retry = false;
-
- if (clp) {
- if (clp->cp_defer_detach) {
- detach_and_deref_page(clp, vmpage);
- /**
- * check i_size to make sure it's not
- * over EOF, we don't want to call
- * filemap_fault() repeatedly since it
- * returns VM_FAULT_SIGBUS without even
- * trying if vmf->pgoff is over EOF.
- */
- max_idx = DIV_ROUND_UP(i_size_read(inode),
- PAGE_SIZE);
- if (vmf->pgoff < max_idx)
- need_retry = true;
- }
- if (clp->cp_fault_ref) {
- clp->cp_fault_ref = 0;
- /* ref not released in ll_readpage() */
- cl_page_put(env, clp);
- }
- if (need_retry)
- goto retry;
- }
- }
-
CDEBUG(D_PAGE, "got addr %p - SIGBUS\n", (void *)vmf->address);
- rc = -EFAULT;
- goto unlock;
+ return -EFAULT;
}
if (cfio->ft_flags & VM_FAULT_OOM) {
CDEBUG(D_PAGE, "got addr %p - OOM\n", (void *)vmf->address);
- rc = -ENOMEM;
- goto unlock;
+ return -ENOMEM;
}
- if (cfio->ft_flags & VM_FAULT_RETRY) {
- rc = -EAGAIN;
- goto unlock;
- }
+ if (cfio->ft_flags & VM_FAULT_RETRY)
+ return -EAGAIN;
CERROR("Unknown error in page fault %d!\n", cfio->ft_flags);
- rc = -EINVAL;
-unlock:
- ll_inode_size_unlock(inode);
- if (clp) {
- if (clp->cp_defer_detach && vmpage)
- detach_and_deref_page(clp, vmpage);
-
- /* additional cl_page ref has been taken in ll_readpage() */
- if (clp->cp_fault_ref) {
- clp->cp_fault_ref = 0;
- /* ref not released in ll_readpage() */
- cl_page_put(env, clp);
- }
- /* ref taken in this function */
- cl_page_put(env, clp);
- }
- if (vmpage)
- put_page(vmpage);
- return rc;
+ return -EINVAL;
}
static void mkwrite_commit_callback(const struct lu_env *env, struct cl_io *io,
@@ -1486,7 +1378,7 @@ static int vvp_io_fault_start(const struct lu_env *env,
LASSERT(cfio->ft_vmpage);
lock_page(cfio->ft_vmpage);
} else {
- result = vvp_io_kernel_fault(env, cfio);
+ result = vvp_io_kernel_fault(cfio);
if (result != 0)
return result;
}
diff --git a/fs/lustre/llite/vvp_page.c b/fs/lustre/llite/vvp_page.c
index 9e8c1588347f..f359596bc32d 100644
--- a/fs/lustre/llite/vvp_page.c
+++ b/fs/lustre/llite/vvp_page.c
@@ -104,11 +104,6 @@ static void vvp_page_completion_read(const struct lu_env *env,
ll_ra_count_put(ll_i2sbi(inode), 1);
if (ioret == 0) {
- /**
- * cp_defer_uptodate is used for readahead page, and the
- * vmpage Uptodate bit is deferred to set in ll_readpage/
- * ll_io_read_page.
- */
if (!cp->cp_defer_uptodate)
SetPageUptodate(vmpage);
} else if (cp->cp_defer_uptodate) {
diff --git a/fs/lustre/obdclass/cl_page.c b/fs/lustre/obdclass/cl_page.c
index 3bc1a9b0eb98..7011235a9b3c 100644
--- a/fs/lustre/obdclass/cl_page.c
+++ b/fs/lustre/obdclass/cl_page.c
@@ -725,35 +725,16 @@ static void __cl_page_delete(const struct lu_env *env, struct cl_page *cp)
LASSERT(PageLocked(vmpage));
LASSERT((struct cl_page *)vmpage->private == cp);
- /**
- * clear vmpage uptodate bit, since ll_read_ahead_pages()->
- * ll_read_ahead_page() could pick up this stale vmpage and
- * take it as uptodated.
- */
- ClearPageUptodate(vmpage);
- /**
- * vvp_io_kernel_fault()->ll_readpage() set cp_fault_ref
- * and need it to check cl_page to retry the page fault read.
+ /* Drop the reference count held in vvp_page_init */
+ refcount_dec(&cp->cp_ref);
+ ClearPagePrivate(vmpage);
+ vmpage->private = 0;
+
+ /*
+ * The reference from vmpage to cl_page is removed,
+ * but the reference back is still here. It is removed
+ * later in cl_page_free().
*/
- if (cp->cp_fault_ref) {
- cp->cp_defer_detach = 1;
- /**
- * get a vmpage reference, so that filemap_fault()
- * won't free it from pagecache.
- */
- get_page(vmpage);
- } else {
- /* Drop the reference count held in vvp_page_init */
- refcount_dec(&cp->cp_ref);
- ClearPagePrivate(vmpage);
- vmpage->private = 0;
-
- /*
- * The reference from vmpage to cl_page is removed,
- * but the reference back is still here. It is removed
- * later in cl_page_free().
- */
- }
}
}
--
2.27.0
_______________________________________________
lustre-devel mailing list
lustre-devel@lists.lustre.org
http://lists.lustre.org/listinfo.cgi/lustre-devel-lustre.org
next prev parent reply other threads:[~2023-01-23 23:39 UTC|newest]
Thread overview: 43+ messages / expand[flat|nested] mbox.gz Atom feed top
2023-01-23 23:00 [lustre-devel] [PATCH 00/42] lustre: sync to OpenSFS tree as of Jan 22 2023 James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 01/42] lustre: osc: pack osc_async_page better James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 02/42] lnet: lnet_peer_merge_data to understand large addr James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 03/42] lnet: router_discover - handle large addrs in ping James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 04/42] lnet: Drop LNet message if deadline exceeded James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 05/42] lnet: change lnet_find_best_lpni to handle large NIDs James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 06/42] lustre: ldebugfs: add histogram to stats counter James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 07/42] lustre: llite: wake_up after cl_object_kill James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 08/42] lustre: pcc: use two bits to indicate pcc type for attach James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 09/42] lustre: ldebugfs: make job_stats and rename_stats valid YAML James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 10/42] lustre: misc: fix stats snapshot_time to use wallclock James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 11/42] lustre: pools: force creation of a component without a pool James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 12/42] lustre: sec: reserve flag for fid2path for encrypted files James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 13/42] lustre: llite: update statx size/ctime for fallocate James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 14/42] lustre: ptlrpc: fiemap flexible array James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 15/42] lustre: ptlrpc: Add LCME_FL_PARITY to wirecheck James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 16/42] lnet: selftest: lst read-outside of allocation James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 17/42] lustre: misc: rename lprocfs_stats functions James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 18/42] lustre: osc: Fix possible null pointer James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 19/42] lustre: ptlrpc: NUL terminate long jobid strings James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 20/42] lustre: uapi: remove _GNU_SOURCE dependency in lustre_user.h James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 21/42] lnet: handles unregister/register events James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 22/42] lustre: update version to 2.15.53 James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 23/42] lustre: ptlrpc: don't panic during reconnection James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 24/42] lustre: move to kobj_type default_groups James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 25/42] lnet: increase transaction timeout James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 26/42] lnet: Allow IP specification James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 27/42] lustre: obdclass: fix T10PI prototypes James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 28/42] lustre: obdclass: prefer T10 checksum if the target supports it James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 29/42] lustre: llite: remove false outdated comment James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 30/42] lnet: socklnd: clarify error message on timeout James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 31/42] lustre: llite: replace selinux_is_enabled() James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 32/42] lustre: enc: S_ENCRYPTED flag on OST objects for enc files James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 33/42] lnet: asym route inconsistency warning James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 34/42] lnet: o2iblnd: reset hiw proportionally James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 35/42] lnet: libcfs: cfs_hash_for_each_empty optimization James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 36/42] lustre: llite: always enable remote subdir mount James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 37/42] lnet: selftest: migrate LNet selftest group handling to Netlink James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 38/42] lnet: use Netlink to support LNet ping commands James Simmons
2023-01-23 23:00 ` James Simmons [this message]
2023-01-23 23:00 ` [lustre-devel] [PATCH 40/42] lnet: validate data sent from user land properly James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 41/42] lnet: modify lnet_inetdev to work with large NIDS James Simmons
2023-01-23 23:00 ` [lustre-devel] [PATCH 42/42] lustre: ldlm: remove obsolete LDLM_FL_SERVER_LOCK James Simmons
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=1674514855-15399-40-git-send-email-jsimmons@infradead.org \
--to=jsimmons@infradead.org \
--cc=adilger@whamcloud.com \
--cc=green@whamcloud.com \
--cc=lustre-devel@lists.lustre.org \
--cc=neilb@suse.de \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for NNTP newsgroup(s).