From: Chao Yu <chao@kernel.org>
To: Yunlei He <heyunlei@huawei.com>,
jaegeuk@kernel.org, yuchao0@huawei.com,
linux-f2fs-devel@lists.sourceforge.net
Cc: ning.jia@huawei.com
Subject: Re: [PATCH v2] f2fs: avoid dead loop in function find_fsync_dnodes
Date: Mon, 11 Dec 2017 21:46:29 +0800 [thread overview]
Message-ID: <223a6c82-e8d8-9307-c53e-eaf588a6252f@kernel.org> (raw)
In-Reply-To: <1512966212-12595-1-git-send-email-heyunlei@huawei.com>
On 2017/12/11 12:23, Yunlei He wrote:
> Came across a dead loop in recovery like this:
>
> ......
> [ 24.680480s][pid:320,cpu0,init]find_fsync_dnodes: blkaddr =13597696
> [ 24.698394s][pid:320,cpu0,init]find_fsync_dnodes: blkaddr =13597697
> [ 24.724334s][pid:320,cpu0,init]find_fsync_dnodes: blkaddr =13597698
> [ 24.724334s][pid:320,cpu0,init]find_fsync_dnodes: blkaddr =13597698
> [ 24.724365s][pid:320,cpu0,init]find_fsync_dnodes: blkaddr =13597698
> [ 24.724365s][pid:320,cpu0,init]find_fsync_dnodes: blkaddr =13597698
> [ 24.724365s][pid:320,cpu0,init]find_fsync_dnodes: blkaddr =13597698
> [ 24.724395s][pid:320,cpu0,init]find_fsync_dnodes: blkaddr =13597698
> [ 24.724395s][pid:320,cpu0,init]find_fsync_dnodes: blkaddr =13597698
> [ 24.724395s][pid:320,cpu0,init]find_fsync_dnodes: blkaddr =13597698
> [ 24.724395s][pid:320,cpu0,init]find_fsync_dnodes: blkaddr =13597698
> [ 24.724426s][pid:320,cpu0,init]find_fsync_dnodes: blkaddr =13597698
> ......
>
> Mount process will block in dead loop and fsck can do nothing with this
> error, This patch abandon recovery if node chain is cyclical.
What about tagging page with PG_checked flag to indicate current meta page
has been traversed?
Thanks,
>
> Signed-off-by: Yunlei He <heyunlei@huawei.com>
> ---
> fs/f2fs/f2fs.h | 6 +++++
> fs/f2fs/recovery.c | 71 ++++++++++++++++++++++++++++++++++++++++++++++--------
> 2 files changed, 67 insertions(+), 10 deletions(-)
>
> diff --git a/fs/f2fs/f2fs.h b/fs/f2fs/f2fs.h
> index 82f1dc3..4649663 100644
> --- a/fs/f2fs/f2fs.h
> +++ b/fs/f2fs/f2fs.h
> @@ -289,6 +289,12 @@ struct fsync_inode_entry {
> block_t last_dentry; /* block address locating the last dentry */
> };
>
> +/* for the block of node chain, used only during recovery */
> +struct fsync_node_entry {
> + struct list_head list; /* list head */
> + block_t blkaddr; /* locating the node block in recovery chain */
> +};
> +
> #define nats_in_cursum(jnl) (le16_to_cpu((jnl)->n_nats))
> #define sits_in_cursum(jnl) (le16_to_cpu((jnl)->n_sits))
>
> diff --git a/fs/f2fs/recovery.c b/fs/f2fs/recovery.c
> index 7d63faf..9958abb 100644
> --- a/fs/f2fs/recovery.c
> +++ b/fs/f2fs/recovery.c
> @@ -46,6 +46,7 @@
> */
>
> static struct kmem_cache *fsync_entry_slab;
> +static struct kmem_cache *fsync_node_chain_slab;
>
> bool space_for_roll_forward(struct f2fs_sb_info *sbi)
> {
> @@ -220,14 +221,55 @@ static void recover_inode(struct inode *inode, struct page *page)
> ino_of_node(page), name);
> }
>
> +static void destroy_node_blocks(struct list_head *head)
> +{
> + struct fsync_node_entry *entry, *tmp;
> +
> + list_for_each_entry_safe(entry, tmp, head, list) {
> + list_del(&entry->list);
> + kmem_cache_free(fsync_node_chain_slab, entry);
> + }
> +}
> +
> +static bool blkaddr_already_in_list(struct list_head *head, block_t blkaddr)
> +{
> + struct fsync_node_entry *entry;
> +
> + list_for_each_entry(entry, head, list)
> + if (entry->blkaddr == blkaddr)
> + return true;
> +
> + return false;
> +}
> +
> +static void add_fsync_node(struct list_head *head, block_t blkaddr)
> +{
> + struct fsync_node_entry *entry;
> +
> + entry = f2fs_kmem_cache_alloc(fsync_node_chain_slab, GFP_F2FS_ZERO);
> + entry->blkaddr = blkaddr;
> + list_add_tail(&entry->list, head);
> +}
> +
> +static void destroy_fsync_dnodes(struct list_head *head)
> +{
> + struct fsync_inode_entry *entry, *tmp;
> +
> + list_for_each_entry_safe(entry, tmp, head, list)
> + del_fsync_inode(entry);
> +}
> +
> static int find_fsync_dnodes(struct f2fs_sb_info *sbi, struct list_head *head,
> bool check_only)
> {
> struct curseg_info *curseg;
> struct page *page = NULL;
> + struct list_head node_block_list;
> block_t blkaddr;
> int err = 0;
>
> + INIT_LIST_HEAD(&node_block_list);
> +
> /* get node pages in the current segment */
> curseg = CURSEG_I(sbi, CURSEG_WARM_NODE);
> blkaddr = NEXT_FREE_BLKADDR(sbi, curseg);
> @@ -239,7 +281,13 @@ static int find_fsync_dnodes(struct f2fs_sb_info *sbi, struct list_head *head,
> return 0;
>
> page = get_tmp_page(sbi, blkaddr);
> + if (unlikely(blkaddr_already_in_list(&node_block_list, blkaddr))) {
> + f2fs_msg(sbi->sb, KERN_ERR, "Abandon dead loop node block list");
> + destroy_fsync_dnodes(head);
> + break;
> + }
>
> + add_fsync_node(&node_block_list, blkaddr);
> if (!is_recoverable_dnode(page))
> break;
>
> @@ -284,18 +332,12 @@ static int find_fsync_dnodes(struct f2fs_sb_info *sbi, struct list_head *head,
>
> ra_meta_pages_cond(sbi, blkaddr);
> }
> +
> + destroy_node_blocks(&node_block_list);
> f2fs_put_page(page, 1);
> return err;
> }
>
> -static void destroy_fsync_dnodes(struct list_head *head)
> -{
> - struct fsync_inode_entry *entry, *tmp;
> -
> - list_for_each_entry_safe(entry, tmp, head, list)
> - del_fsync_inode(entry);
> -}
> -
> static int check_index_in_prev_nodes(struct f2fs_sb_info *sbi,
> block_t blkaddr, struct dnode_of_data *dn)
> {
> @@ -614,7 +656,14 @@ int recover_fsync_data(struct f2fs_sb_info *sbi, bool check_only)
> sizeof(struct fsync_inode_entry));
> if (!fsync_entry_slab) {
> err = -ENOMEM;
> - goto out;
> + goto free_inode_entry;
> + }
> +
> + fsync_node_chain_slab = f2fs_kmem_cache_create("f2fs_fsync_node_entry",
> + sizeof(struct fsync_node_entry));
> + if (!fsync_node_chain_slab) {
> + err = -ENOMEM;
> + goto free_node_entry;
> }
>
> INIT_LIST_HEAD(&inode_list);
> @@ -664,8 +713,10 @@ int recover_fsync_data(struct f2fs_sb_info *sbi, bool check_only)
> err = write_checkpoint(sbi, &cpc);
> }
>
> + kmem_cache_destroy(fsync_node_chain_slab);
> +free_node_entry:
> kmem_cache_destroy(fsync_entry_slab);
> -out:
> +free_inode_entry:
> #ifdef CONFIG_QUOTA
> /* Turn quotas off */
> if (quota_enabled)
>
------------------------------------------------------------------------------
Check out the vibrant tech community on one of the world's most
engaging tech sites, Slashdot.org! http://sdm.link/slashdot
prev parent reply other threads:[~2017-12-11 13:46 UTC|newest]
Thread overview: 2+ messages / expand[flat|nested] mbox.gz Atom feed top
2017-12-11 4:23 [PATCH v2] f2fs: avoid dead loop in function find_fsync_dnodes Yunlei He
2017-12-11 13:46 ` Chao Yu [this message]
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=223a6c82-e8d8-9307-c53e-eaf588a6252f@kernel.org \
--to=chao@kernel.org \
--cc=heyunlei@huawei.com \
--cc=jaegeuk@kernel.org \
--cc=linux-f2fs-devel@lists.sourceforge.net \
--cc=ning.jia@huawei.com \
--cc=yuchao0@huawei.com \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for NNTP newsgroup(s).