From: Chao Yu <chao@kernel.org>
To: Daniel Rosenberg <drosen@google.com>,
linux-f2fs-devel@lists.sourceforge.net
Cc: Jaegeuk Kim <jaegeuk@kernel.org>,
kernel-team@android.com, Daeho Jeong <daehojeong@google.com>
Subject: Re: [f2fs-dev] [PATCH v4 1/2] dump.f2fs: Add ability to dump folders
Date: Wed, 29 May 2024 14:39:52 +0800 [thread overview]
Message-ID: <aa383858-655d-4876-b3bc-52a04067b0d2@kernel.org> (raw)
In-Reply-To: <20240523224700.265251-1-drosen@google.com>
On 2024/5/24 6:46, Daniel Rosenberg wrote:
> This adds the ability to dump folders as well as files. Folders are
> dumped recursively. Additionally, dumped files/folders may be directed
> to a folder specified by -o [path] instead of ./lost_found. The -r flag
> will dump the entire fs from the root inode. -f or -y will skip the
> prompt before dumping, and -P will preserve the mode/owner info for the
> created file/folder.
>
> Signed-off-by: Daniel Rosenberg <drosen@google.com>
> Reviewed-by: Daeho Jeong <daehojeong@google.com>
> ---
> fsck/dump.c | 178 ++++++++++++++++++++++++++++++++++++++----------
> fsck/fsck.c | 4 +-
> fsck/fsck.h | 4 +-
> fsck/main.c | 29 +++++++-
> man/dump.f2fs.8 | 17 ++++-
> 5 files changed, 190 insertions(+), 42 deletions(-)
>
> diff --git a/fsck/dump.c b/fsck/dump.c
> index b2e990b..fa68456 100644
> --- a/fsck/dump.c
> +++ b/fsck/dump.c
> @@ -247,7 +247,26 @@ out:
> printf("\n");
> }
>
> -static void dump_data_blk(struct f2fs_sb_info *sbi, __u64 offset, u32 blkaddr)
> +static void dump_folder_contents(struct f2fs_sb_info *sbi, u8 *bitmap,
> + struct f2fs_dir_entry *dentry,
> + __u8 (*filenames)[F2FS_SLOT_LEN], int max)
> +{
> + int i;
> + int name_len;
> +
> + for (i = 0; i < max; i++) {
> + if (test_bit_le(i, bitmap) == 0)
> + continue;
> + name_len = le16_to_cpu(dentry[i].name_len);
> + if (name_len == 1 && filenames[i][0] == '.')
> + continue;
> + if (name_len == 2 && filenames[i][0] == '.' && filenames[i][1] == '.')
> + continue;
> + dump_node(sbi, le32_to_cpu(dentry[i].ino), 1, NULL, 0, 1);
> + }
> +}
> +
> +static void dump_data_blk(struct f2fs_sb_info *sbi, __u64 offset, u32 blkaddr, bool is_folder)
> {
> char buf[F2FS_BLKSIZE];
>
> @@ -288,12 +307,19 @@ static void dump_data_blk(struct f2fs_sb_info *sbi, __u64 offset, u32 blkaddr)
> ASSERT(ret >= 0);
> }
>
> - /* write blkaddr */
> - dev_write_dump(buf, offset, F2FS_BLKSIZE);
> + if (is_folder) {
> + struct f2fs_dentry_block *d = (struct f2fs_dentry_block *) buf;
> +
> + dump_folder_contents(sbi, d->dentry_bitmap, F2FS_DENTRY_BLOCK_DENTRIES(d),
> + F2FS_DENTRY_BLOCK_FILENAMES(d), NR_DENTRY_IN_BLOCK);
> + } else {
> + /* write blkaddr */
> + dev_write_dump(buf, offset, F2FS_BLKSIZE);
> + }
> }
>
> static void dump_node_blk(struct f2fs_sb_info *sbi, int ntype,
> - u32 nid, u32 addr_per_block, u64 *ofs)
> + u32 nid, u32 addr_per_block, u64 *ofs, int is_dir)
> {
> struct node_info ni;
> struct f2fs_node *node_blk;
> @@ -330,20 +356,20 @@ static void dump_node_blk(struct f2fs_sb_info *sbi, int ntype,
> switch (ntype) {
> case TYPE_DIRECT_NODE:
> dump_data_blk(sbi, *ofs * F2FS_BLKSIZE,
> - le32_to_cpu(node_blk->dn.addr[i]));
> + le32_to_cpu(node_blk->dn.addr[i]), is_dir);
> (*ofs)++;
> break;
> case TYPE_INDIRECT_NODE:
> dump_node_blk(sbi, TYPE_DIRECT_NODE,
> le32_to_cpu(node_blk->in.nid[i]),
> addr_per_block,
> - ofs);
> + ofs, is_dir);
> break;
> case TYPE_DOUBLE_INDIRECT_NODE:
> dump_node_blk(sbi, TYPE_INDIRECT_NODE,
> le32_to_cpu(node_blk->in.nid[i]),
> addr_per_block,
> - ofs);
> + ofs, is_dir);
> break;
> }
> }
> @@ -435,8 +461,9 @@ static int dump_inode_blk(struct f2fs_sb_info *sbi, u32 nid,
> u32 i = 0;
> u64 ofs = 0;
> u32 addr_per_block;
> + bool is_dir = S_ISDIR(le16_to_cpu(node_blk->i.i_mode));
>
> - if((node_blk->i.i_inline & F2FS_INLINE_DATA)) {
> + if ((node_blk->i.i_inline & F2FS_INLINE_DATA)) {
> DBG(3, "ino[0x%x] has inline data!\n", nid);
> /* recover from inline data */
> dev_write_dump(((unsigned char *)node_blk) + INLINE_DATA_OFFSET,
> @@ -444,13 +471,25 @@ static int dump_inode_blk(struct f2fs_sb_info *sbi, u32 nid,
> return -1;
> }
>
> + if ((node_blk->i.i_inline & F2FS_INLINE_DENTRY)) {
> + void *inline_dentry = inline_data_addr(node_blk);
> + struct f2fs_dentry_ptr d;
> +
> + make_dentry_ptr(&d, node_blk, inline_dentry, 2);
> +
> + DBG(3, "ino[0x%x] has inline dentries!\n", nid);
> + /* recover from inline dentry */
> + dump_folder_contents(sbi, d.bitmap, d.dentry, d.filename, d.max);
> + return -1;
> + }
> +
> c.show_file_map_max_offset = f2fs_max_file_offset(&node_blk->i);
> addr_per_block = ADDRS_PER_BLOCK(&node_blk->i);
>
> /* check data blocks in inode */
> for (i = 0; i < ADDRS_PER_INODE(&node_blk->i); i++, ofs++)
> dump_data_blk(sbi, ofs * F2FS_BLKSIZE, le32_to_cpu(
> - node_blk->i.i_addr[get_extra_isize(node_blk) + i]));
> + node_blk->i.i_addr[get_extra_isize(node_blk) + i]), is_dir);
>
> /* check node blocks in inode */
> for (i = 0; i < 5; i++) {
> @@ -458,17 +497,20 @@ static int dump_inode_blk(struct f2fs_sb_info *sbi, u32 nid,
> dump_node_blk(sbi, TYPE_DIRECT_NODE,
> le32_to_cpu(F2FS_INODE_I_NID(&node_blk->i, i)),
> addr_per_block,
> - &ofs);
> + &ofs,
> + is_dir);
> else if (i == 2 || i == 3)
> dump_node_blk(sbi, TYPE_INDIRECT_NODE,
> le32_to_cpu(F2FS_INODE_I_NID(&node_blk->i, i)),
> addr_per_block,
> - &ofs);
> + &ofs,
> + is_dir);
> else if (i == 4)
> dump_node_blk(sbi, TYPE_DOUBLE_INDIRECT_NODE,
> le32_to_cpu(F2FS_INODE_I_NID(&node_blk->i, i)),
> addr_per_block,
> - &ofs);
> + &ofs,
> + is_dir);
> else
> ASSERT(0);
> }
> @@ -479,8 +521,51 @@ static int dump_inode_blk(struct f2fs_sb_info *sbi, u32 nid,
> return 0;
> }
>
> -static int dump_file(struct f2fs_sb_info *sbi, struct node_info *ni,
> - struct f2fs_node *node_blk, int force)
> +static void dump_file(struct f2fs_sb_info *sbi, struct node_info *ni,
> + struct f2fs_node *node_blk, char *path)
> +{
> + struct f2fs_inode *inode = &node_blk->i;
> + int ret;
> +
> + c.dump_fd = open(path, O_TRUNC|O_CREAT|O_RDWR, 0666);
> + ASSERT(c.dump_fd >= 0);
> +
> + /* dump file's data */
> + dump_inode_blk(sbi, ni->ino, node_blk);
> +
> + /* adjust file size */
> + ret = ftruncate(c.dump_fd, le32_to_cpu(inode->i_size));
> + ASSERT(ret >= 0);
> +
> + close(c.dump_fd);
> +}
> +
> +static void dump_folder(struct f2fs_sb_info *sbi, struct node_info *ni,
> + struct f2fs_node *node_blk, char *path, int is_root)
> +{
> + if (!is_root) {
> +#if defined(__MINGW32__)
> + if (mkdir(path) < 0 && errno != EEXIST) {
> + MSG(0, "Failed to create directory %s\n", path);
> + return;
> + }
> +#else
> + if (mkdir(path, 0777) < 0 && errno != EEXIST) {
> + MSG(0, "Failed to create directory %s\n", path);
> + return;
> + }
> +#endif
> + ASSERT(chdir(path) == 0);
> + }
> + /* dump folder data */
> + dump_inode_blk(sbi, ni->ino, node_blk);
> + if (!is_root)
> + ASSERT(chdir("..") == 0);
> +}
> +
> +static int dump_filesystem(struct f2fs_sb_info *sbi, struct node_info *ni,
> + struct f2fs_node *node_blk, int force, char *base_path,
> + bool is_base, bool allow_folder)
> {
> struct f2fs_inode *inode = &node_blk->i;
> u32 imode = le16_to_cpu(inode->i_mode);
> @@ -489,6 +574,7 @@ static int dump_file(struct f2fs_sb_info *sbi, struct node_info *ni,
> char path[1024] = {0};
> char ans[255] = {0};
> int is_encrypted = file_is_encrypt(inode);
> + int is_root = sbi->root_ino_num == ni->nid;
> int ret;
>
> if (is_encrypted) {
> @@ -496,11 +582,15 @@ static int dump_file(struct f2fs_sb_info *sbi, struct node_info *ni,
> return -1;
> }
>
> - if ((!S_ISREG(imode) && !S_ISLNK(imode)) ||
> - namelen == 0 || namelen > F2FS_NAME_LEN) {
> - MSG(force, "Not a regular file or wrong name info\n\n");
> + if ((!S_ISREG(imode) && !S_ISLNK(imode) && !(S_ISDIR(imode) && allow_folder))) {
> + MSG(force, "Not a valid file type\n\n");
> + return -1;
> + }
> + if (!is_root && (namelen == 0 || namelen > F2FS_NAME_LEN)) {
> + MSG(force, "Wrong name info\n\n");
> return -1;
> }
> + base_path = base_path ?: "./lost_found";
> if (force)
> goto dump;
>
> @@ -508,31 +598,49 @@ static int dump_file(struct f2fs_sb_info *sbi, struct node_info *ni,
> if (c.show_file_map)
> return dump_inode_blk(sbi, ni->ino, node_blk);
>
> - printf("Do you want to dump this file into ./lost_found/? [Y/N] ");
> + printf("Do you want to dump this %s into %s/? [Y/N] ",
> + S_ISREG(imode) || S_ISLNK(imode) ? "file" : "folder",
> + base_path);
> ret = scanf("%s", ans);
> ASSERT(ret >= 0);
>
> if (!strcasecmp(ans, "y")) {
> dump:
> - ret = system("mkdir -p ./lost_found");
> - ASSERT(ret >= 0);
> -
> - /* make a file */
> - strncpy(name, (const char *)inode->i_name, namelen);
> - name[namelen] = 0;
> - sprintf(path, "./lost_found/%s", name);
> + if (is_base) {
> + ASSERT(getcwd(path, sizeof(path)) != NULL);
> +#if defined(__MINGW32__)
> + ret = mkdir(base_path);
> +#else
> + ret = mkdir(base_path, 0777);
> +#endif
>
> - c.dump_fd = open(path, O_TRUNC|O_CREAT|O_RDWR, 0666);
> - ASSERT(c.dump_fd >= 0);
> + ASSERT(ret == 0 || errno == EEXIST);
> + ASSERT(chdir(base_path) == 0);
> + }
>
> - /* dump file's data */
> - dump_inode_blk(sbi, ni->ino, node_blk);
> + /* make a file */
> + if (!is_root) {
> + strncpy(name, (const char *)inode->i_name, namelen);
> + name[namelen] = 0;
> + }
>
> - /* adjust file size */
> - ret = ftruncate(c.dump_fd, le32_to_cpu(inode->i_size));
> - ASSERT(ret >= 0);
> + if (S_ISREG(imode) || S_ISLNK(imode)) {
> + dump_file(sbi, ni, node_blk, name);
> + } else {
> + dump_folder(sbi, ni, node_blk, name, is_root);
> + }
>
> - close(c.dump_fd);
> +#if !defined(__MINGW32__)
> + /* fix up mode/owner */
> + if (c.preserve_perms) {
> + if (is_root)
> + strncpy(name, ".", 2);
> + ASSERT(chmod(name, imode) == 0);
> + ASSERT(chown(name, inode->i_uid, inode->i_gid) == 0);
> + }
> +#endif
> + if (is_base)
> + ASSERT(chdir(path) == 0);
> }
> return 0;
> }
> @@ -582,7 +690,7 @@ void dump_node_scan_disk(struct f2fs_sb_info *sbi, nid_t nid)
> free(node_blk);
> }
>
> -int dump_node(struct f2fs_sb_info *sbi, nid_t nid, int force)
> +int dump_node(struct f2fs_sb_info *sbi, nid_t nid, int force, char *base_path, int base, int allow_folder)
> {
> struct node_info ni;
> struct f2fs_node *node_blk;
> @@ -617,7 +725,7 @@ int dump_node(struct f2fs_sb_info *sbi, nid_t nid, int force)
> print_node_info(sbi, node_blk, force);
>
> if (ni.ino == ni.nid)
> - ret = dump_file(sbi, &ni, node_blk, force);
> + ret = dump_filesystem(sbi, &ni, node_blk, force, base_path, base, allow_folder);
> } else {
> print_node_info(sbi, node_blk, force);
> MSG(force, "Invalid (i)node block\n\n");
> diff --git a/fsck/fsck.c b/fsck/fsck.c
> index 5d345d0..7400dcf 100644
> --- a/fsck/fsck.c
> +++ b/fsck/fsck.c
> @@ -1651,7 +1651,7 @@ static void print_dentry(struct f2fs_sb_info *sbi, __u8 *name,
> d = d->next;
> }
> printf("/%s", new);
> - if (dump_node(sbi, le32_to_cpu(dentry[idx].ino), 0))
> + if (dump_node(sbi, le32_to_cpu(dentry[idx].ino), 0, NULL, 0, 0))
> printf("\33[2K\r");
> } else {
> for (i = 1; i < depth; i++)
> @@ -3632,7 +3632,7 @@ int fsck_verify(struct f2fs_sb_info *sbi)
> if (!strcasecmp(ans, "y")) {
> for (i = 0; i < fsck->nr_nat_entries; i++) {
> if (f2fs_test_bit(i, fsck->nat_area_bitmap))
> - dump_node(sbi, i, 1);
> + dump_node(sbi, i, 1, NULL, 1, 0);
> }
> }
> }
> diff --git a/fsck/fsck.h b/fsck/fsck.h
> index f5282e2..6cac926 100644
> --- a/fsck/fsck.h
> +++ b/fsck/fsck.h
> @@ -270,12 +270,14 @@ struct dump_option {
> int end_ssa;
> int32_t blk_addr;
> nid_t scan_nid;
> + int use_root_nid;
> + char *base_path;
> };
>
> extern void nat_dump(struct f2fs_sb_info *, nid_t, nid_t);
> extern void sit_dump(struct f2fs_sb_info *, unsigned int, unsigned int);
> extern void ssa_dump(struct f2fs_sb_info *, int, int);
> -extern int dump_node(struct f2fs_sb_info *, nid_t, int);
> +extern int dump_node(struct f2fs_sb_info *, nid_t, int, char *, int, int);
> extern int dump_info_from_blkaddr(struct f2fs_sb_info *, u32);
> extern unsigned int start_bidx_of_node(unsigned int, struct f2fs_node *);
> extern void dump_node_scan_disk(struct f2fs_sb_info *sbi, nid_t nid);
> diff --git a/fsck/main.c b/fsck/main.c
> index c4d0956..6edc902 100644
> --- a/fsck/main.c
> +++ b/fsck/main.c
> @@ -34,7 +34,7 @@ struct f2fs_fsck gfsck;
>
> INIT_FEATURE_TABLE;
>
> -#ifdef WITH_SLOAD
> +#if defined(WITH_SLOAD) || defined(WITH_DUMP)
> static char *absolute_path(const char *file)
> {
> char *ret;
> @@ -384,7 +384,7 @@ void f2fs_parse_options(int argc, char *argv[])
> }
> } else if (!strcmp("dump.f2fs", prog)) {
> #ifdef WITH_DUMP
> - const char *option_string = "d:i:I:n:Ms:Sa:b:V";
> + const char *option_string = "d:fi:I:n:Mo:Prs:Sa:b:Vy";
> static struct dump_option dump_opt = {
> .nid = 0, /* default root ino */
> .start_nat = -1,
> @@ -395,6 +395,8 @@ void f2fs_parse_options(int argc, char *argv[])
> .end_ssa = -1,
> .blk_addr = -1,
> .scan_nid = 0,
> + .use_root_nid = 0,
> + .base_path = NULL,
> };
>
> c.func = DUMP;
> @@ -456,6 +458,24 @@ void f2fs_parse_options(int argc, char *argv[])
> ret = sscanf(optarg, "%x",
> &dump_opt.blk_addr);
> break;
> + case 'y':
> + case 'f':
> + c.force = 1;
> + break;
> + case 'r':
> + dump_opt.use_root_nid = 1;
> + break;
> + case 'o':
> + dump_opt.base_path = absolute_path(optarg);
> + break;
> + case 'P':
> +#if defined(__MINGW32__)
> + MSG(0, "-P not supported for Windows\n");
> + err = EWRONG_OPT;
> +#else
> + c.preserve_perms = 1;
> +#endif
> + break;
> case 'V':
> show_version(prog);
> exit(0);
> @@ -914,6 +934,9 @@ static void do_dump(struct f2fs_sb_info *sbi)
> struct f2fs_checkpoint *ckpt = F2FS_CKPT(sbi);
> u32 flag = le32_to_cpu(ckpt->ckpt_flags);
>
> + if (opt->use_root_nid)
> + opt->nid = sbi->root_ino_num;
> +
> if (opt->end_nat == -1)
> opt->end_nat = NM_I(sbi)->max_nid;
> if (opt->end_sit == -1)
> @@ -929,7 +952,7 @@ static void do_dump(struct f2fs_sb_info *sbi)
> if (opt->blk_addr != -1)
> dump_info_from_blkaddr(sbi, opt->blk_addr);
> if (opt->nid)
> - dump_node(sbi, opt->nid, 0);
> + dump_node(sbi, opt->nid, c.force, opt->base_path, 1, 1);
> if (opt->scan_nid)
> dump_node_scan_disk(sbi, opt->scan_nid);
>
> diff --git a/man/dump.f2fs.8 b/man/dump.f2fs.8
> index 94bf5f3..60d6783 100644
> --- a/man/dump.f2fs.8
> +++ b/man/dump.f2fs.8
> @@ -44,7 +44,8 @@ is used to retrieve f2fs metadata (usually in a disk partition).
> \fIdevice\fP is the special file corresponding to the device (e.g.
> \fI/dev/sdXX\fP).
>
> -Currently, it can retrieve 1) a file given its inode number, 2) NAT
> +Currently, it can retrieve 1) a file or folder given its inode number
> +(folders are dumped recursively), 2) NAT
> entries into a file, 3) SIT entries into a file, 4) SSA entries into
> a file, 5) reverse information from the given block address.
> .PP
> @@ -56,6 +57,20 @@ is 0 on success and -1 on failure.
> .BI \-i " inode number"
> Specify an inode number to dump out.
> .TP
> +.BI \-r
> +Dump out from the root inode.
> +.TP
> +.BI \-f
> +Do not prompt before dumping
> +.TP
> +.BI \-y
> +Alias for \-f
> +.TP
> +.BI \-o " path"
> +Dump inodes to the given path
> +.BI \-P
> +Preserve mode/owner/group for dumped inode
> +.TP
dump_usage() needs to be updated as well to describe the new options.
It seems the f2fs mailing list was unresponsive earlier, so I am resending this.
Thanks,
> .BI \-I " inode number"
> Specify an inode number and scan full disk to dump out, include history inode block
> .TP
>
> base-commit: 5da4e5241503b385e4a7e75b1b2bb3367b38be96
_______________________________________________
Linux-f2fs-devel mailing list
Linux-f2fs-devel@lists.sourceforge.net
https://lists.sourceforge.net/lists/listinfo/linux-f2fs-devel
next prev parent reply other threads:[~2024-05-29 6:40 UTC|newest]
Thread overview: 8+ messages / expand[flat|nested] mbox.gz Atom feed top
2024-05-23 22:46 [f2fs-dev] [PATCH v4 1/2] dump.f2fs: Add ability to dump folders Daniel Rosenberg via Linux-f2fs-devel
2024-05-23 22:47 ` [f2fs-dev] [PATCH v4 2/2] dump.f2fs: Fix xattr dumping Daniel Rosenberg via Linux-f2fs-devel
2024-05-23 23:34 ` Daeho Jeong
2024-05-29 6:41 ` Chao Yu
2024-05-23 23:33 ` [f2fs-dev] [PATCH v4 1/2] dump.f2fs: Add ability to dump folders Daeho Jeong
2024-05-29 6:39 ` Chao Yu [this message]
2024-05-30 23:41 ` Jaegeuk Kim
2024-05-31 1:13 ` Chao Yu
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=aa383858-655d-4876-b3bc-52a04067b0d2@kernel.org \
--to=chao@kernel.org \
--cc=daehojeong@google.com \
--cc=drosen@google.com \
--cc=jaegeuk@kernel.org \
--cc=kernel-team@android.com \
--cc=linux-f2fs-devel@lists.sourceforge.net \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for NNTP newsgroup(s).