From: Li Zhang <zhanglikernel@gmail.com>
To: linux-btrfs@vger.kernel.org
Cc: Li Zhang <zhanglikernel@gmail.com>
Subject: [PATCH V2] Make btrfs_prepare_device parallel during mkfs.btrfs
Date: Sun, 28 Aug 2022 22:30:00 +0800 [thread overview]
Message-ID: <1661697000-18809-1-git-send-email-zhanglikernel@gmail.com> (raw)
[enhancement]
When a disk is formatted as btrfs, it calls
btrfs_prepare_device for each device, which takes too much time.
[implementation]
Put each btrfs_prepare_device into a thread,
wait for the first thread to complete to mkfs.btrfs,
and wait for other threads to complete before adding
other devices to the file system.
[test]
Using the btrfs-progs test case mkfs-tests, mkfs.btrfs works fine.
But I don't have an actual zoed device,
so I don't know how much time it saves, If you guys
have a way to test it, please let me know.
Signed-off-by: Li Zhang <zhanglikernel@gmail.com>
---
Issue: 496
V1:
* Put btrfs_prepare_device into threads and make them parallel
V2:
* Set the 4 variables used by btrfs_prepare_device as global variables.
* Use pthread_mutex to ensure error messages are not messed up.
* Correct the error message
* Wait for all threads to exit in a loop
mkfs/main.c | 132 +++++++++++++++++++++++++++++++++++++++++++-----------------
1 file changed, 95 insertions(+), 37 deletions(-)
diff --git a/mkfs/main.c b/mkfs/main.c
index ce096d3..b111f12 100644
--- a/mkfs/main.c
+++ b/mkfs/main.c
@@ -31,6 +31,7 @@
#include <uuid/uuid.h>
#include <ctype.h>
#include <blkid/blkid.h>
+#include <pthread.h>
#include "kernel-shared/ctree.h"
#include "kernel-shared/disk-io.h"
#include "kernel-shared/free-space-tree.h"
@@ -60,6 +61,20 @@ struct mkfs_allocation {
u64 system;
};
+static bool zero_end;
+static bool discard;
+static bool zoned;
+static int oflags;
+
+static pthread_mutex_t prepare_mutex;
+
+struct prepare_device_progress {
+ char *file;
+ u64 dev_block_count;
+ u64 block_count;
+ int ret;
+};
+
static int create_metadata_block_groups(struct btrfs_root *root, bool mixed,
struct mkfs_allocation *allocation)
{
@@ -969,6 +984,30 @@ fail:
return ret;
}
+static void *prepare_one_dev(void *ctx)
+{
+ struct prepare_device_progress *prepare_ctx = ctx;
+ int fd;
+
+ fd = open(prepare_ctx->file, oflags);
+ if (fd < 0) {
+ pthread_mutex_lock(&prepare_mutex);
+ error("unable to open %s: %m", prepare_ctx->file);
+ pthread_mutex_unlock(&prepare_mutex);
+ prepare_ctx->ret = fd;
+ return NULL;
+ }
+ prepare_ctx->ret = btrfs_prepare_device(fd,
+ prepare_ctx->file, &prepare_ctx->dev_block_count,
+ prepare_ctx->block_count,
+ (bconf.verbose ? PREP_DEVICE_VERBOSE : 0) |
+ (zero_end ? PREP_DEVICE_ZERO_END : 0) |
+ (discard ? PREP_DEVICE_DISCARD : 0) |
+ (zoned ? PREP_DEVICE_ZONED : 0));
+ close(fd);
+ return NULL;
+}
+
int BOX_MAIN(mkfs)(int argc, char **argv)
{
char *file;
@@ -984,7 +1023,7 @@ int BOX_MAIN(mkfs)(int argc, char **argv)
u32 nodesize = 0;
u32 sectorsize = 0;
u32 stripesize = 4096;
- bool zero_end = true;
+ zero_end = true;
int fd = -1;
int ret = 0;
int close_ret;
@@ -993,11 +1032,10 @@ int BOX_MAIN(mkfs)(int argc, char **argv)
bool nodesize_forced = false;
bool data_profile_opt = false;
bool metadata_profile_opt = false;
- bool discard = true;
+ discard = true;
bool ssd = false;
- bool zoned = false;
+ zoned = false;
bool force_overwrite = false;
- int oflags;
char *source_dir = NULL;
bool source_dir_set = false;
bool shrink_rootdir = false;
@@ -1006,6 +1044,8 @@ int BOX_MAIN(mkfs)(int argc, char **argv)
u64 shrink_size;
int dev_cnt = 0;
int saved_optind;
+ pthread_t *t_prepare = NULL;
+ struct prepare_device_progress *prepare_ctx = NULL;
char fs_uuid[BTRFS_UUID_UNPARSED_SIZE] = { 0 };
u64 features = BTRFS_MKFS_DEFAULT_FEATURES;
u64 runtime_features = BTRFS_MKFS_DEFAULT_RUNTIME_FEATURES;
@@ -1428,29 +1468,49 @@ int BOX_MAIN(mkfs)(int argc, char **argv)
goto error;
}
- dev_cnt--;
+ t_prepare = calloc(dev_cnt, sizeof(*t_prepare));
+ prepare_ctx = calloc(dev_cnt, sizeof(*prepare_ctx));
+
+ if (!t_prepare || !prepare_ctx) {
+ error("unable to alloc thread for preparing dev");
+ goto error;
+ }
+ pthread_mutex_init(&prepare_mutex, NULL);
+ zero_end = zero_end;
+ discard = discard;
+ zoned = zoned;
oflags = O_RDWR;
- if (zoned && zoned_model(file) == ZONED_HOST_MANAGED)
- oflags |= O_DIRECT;
+ for (i = 0; i < dev_cnt; i++) {
+ if (zoned && zoned_model(argv[optind + i - 1]) ==
+ ZONED_HOST_MANAGED) {
+ oflags |= O_DIRECT;
+ break;
+ }
+ }
+ for (i = 0; i < dev_cnt; i++) {
+ prepare_ctx[i].file = argv[optind + i - 1];
+ prepare_ctx[i].block_count = block_count;
+ prepare_ctx[i].dev_block_count = block_count;
+ ret = pthread_create(&t_prepare[i], NULL,
+ prepare_one_dev, &prepare_ctx[i]);
+ if (ret) {
+ error("create thread for prepare devices failed, errno:%d", ret);
+ goto error;
+ }
+ }
+ for (i = 0; i < dev_cnt; i++)
+ pthread_join(t_prepare[i], NULL);
+ ret = prepare_ctx[0].ret;
- /*
- * Open without O_EXCL so that the problem should not occur by the
- * following operation in kernel:
- * (btrfs_register_one_device() fails if O_EXCL is on)
- */
- fd = open(file, oflags);
- if (fd < 0) {
- error("unable to open %s: %m", file);
+ if (ret) {
+ error("unable prepare device:%s.\n", prepare_ctx[0].file);
goto error;
}
- ret = btrfs_prepare_device(fd, file, &dev_block_count, block_count,
- (zero_end ? PREP_DEVICE_ZERO_END : 0) |
- (discard ? PREP_DEVICE_DISCARD : 0) |
- (bconf.verbose ? PREP_DEVICE_VERBOSE : 0) |
- (zoned ? PREP_DEVICE_ZONED : 0));
- if (ret)
- goto error;
+
+ dev_cnt--;
+ fd = open(file, oflags);
+ dev_block_count = prepare_ctx[0].dev_block_count;
if (block_count && block_count > dev_block_count) {
error("%s is smaller than requested size, expected %llu, found %llu",
file, (unsigned long long)block_count,
@@ -1459,7 +1519,7 @@ int BOX_MAIN(mkfs)(int argc, char **argv)
}
/* To create the first block group and chunk 0 in make_btrfs */
- system_group_size = zoned ? zone_size(file) : BTRFS_MKFS_SYSTEM_GROUP_SIZE;
+ system_group_size = zoned ? zone_size(file) : BTRFS_MKFS_SYSTEM_GROUP_SIZE;
if (dev_block_count < system_group_size) {
error("device is too small to make filesystem, must be at least %llu",
(unsigned long long)system_group_size);
@@ -1558,14 +1618,10 @@ int BOX_MAIN(mkfs)(int argc, char **argv)
goto raid_groups;
while (dev_cnt-- > 0) {
+ int dev_index = argc - saved_optind - dev_cnt - 1;
file = argv[optind++];
- /*
- * open without O_EXCL so that the problem should not
- * occur by the following processing.
- * (btrfs_register_one_device() fails if O_EXCL is on)
- */
- fd = open(file, O_RDWR);
+ fd = open(file, oflags);
if (fd < 0) {
error("unable to open %s: %m", file);
goto error;
@@ -1578,13 +1634,11 @@ int BOX_MAIN(mkfs)(int argc, char **argv)
close(fd);
continue;
}
- ret = btrfs_prepare_device(fd, file, &dev_block_count,
- block_count,
- (bconf.verbose ? PREP_DEVICE_VERBOSE : 0) |
- (zero_end ? PREP_DEVICE_ZERO_END : 0) |
- (discard ? PREP_DEVICE_DISCARD : 0) |
- (zoned ? PREP_DEVICE_ZONED : 0));
- if (ret) {
+ dev_block_count = prepare_ctx[dev_index]
+ .dev_block_count;
+
+ if (prepare_ctx[dev_index].ret) {
+ error("unable prepare device:%s.\n", prepare_ctx[dev_index].file);
goto error;
}
@@ -1763,12 +1817,16 @@ out:
btrfs_close_all_devices();
free(label);
-
+ free(t_prepare);
+ free(prepare_ctx);
return !!ret;
+
error:
if (fd > 0)
close(fd);
+ free(t_prepare);
+ free(prepare_ctx);
free(label);
exit(1);
success:
--
1.8.3.1
next reply other threads:[~2022-08-28 14:30 UTC|newest]
Thread overview: 3+ messages / expand[flat|nested] mbox.gz Atom feed top
2022-08-28 14:30 Li Zhang [this message]
2022-08-29 21:55 ` [PATCH V2] Make btrfs_prepare_device parallel during mkfs.btrfs Qu Wenruo
2022-08-30 17:30 ` David Sterba
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=1661697000-18809-1-git-send-email-zhanglikernel@gmail.com \
--to=zhanglikernel@gmail.com \
--cc=linux-btrfs@vger.kernel.org \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is an external index of several public inboxes,
see mirroring instructions on how to clone and mirror
all data and code used by this external index.