From: Wengang Wang <wen.gang.wang@oracle.com>
To: linux-xfs@vger.kernel.org
Cc: wen.gang.wang@oracle.com
Subject: [PATCH 1/9] xfsprogs: introduce defrag command to spaceman
Date: Tue, 9 Jul 2024 12:10:20 -0700 [thread overview]
Message-ID: <20240709191028.2329-2-wen.gang.wang@oracle.com> (raw)
In-Reply-To: <20240709191028.2329-1-wen.gang.wang@oracle.com>
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit
Non-exclusive defragment
Here we are introducing the non-exclusive manner to defragment a file,
especially for huge files, without blocking IO to it long.
Non-exclusive defragmentation divides the whole file into small segments.
For each segment, we lock the file, defragment the segment and unlock the file.
Defragmenting the small segment doesn’t take long. File IO requests can get
served between defragmenting segments before blocked long. Also we put
(user adjustable) idle time between defragmenting two consecutive segments to
balance the defragmentation and file IOs.
The first patch in the set checks for valid target files
Valid target files to defrag must:
1. be accessible for read/write
2. be regular files
3. be in XFS filesystem
4. the containing XFS has reflink enabled. This is not checked
before starting defragmentation, but error would be reported
later.
Signed-off-by: Wengang Wang <wen.gang.wang@oracle.com>
---
spaceman/Makefile | 2 +-
spaceman/defrag.c | 198 ++++++++++++++++++++++++++++++++++++++++++++++
spaceman/init.c | 1 +
spaceman/space.h | 1 +
4 files changed, 201 insertions(+), 1 deletion(-)
create mode 100644 spaceman/defrag.c
diff --git a/spaceman/Makefile b/spaceman/Makefile
index 1f048d54..9c00b20a 100644
--- a/spaceman/Makefile
+++ b/spaceman/Makefile
@@ -7,7 +7,7 @@ include $(TOPDIR)/include/builddefs
LTCOMMAND = xfs_spaceman
HFILES = init.h space.h
-CFILES = info.c init.c file.c health.c prealloc.c trim.c
+CFILES = info.c init.c file.c health.c prealloc.c trim.c defrag.c
LSRCFILES = xfs_info.sh
LLDLIBS = $(LIBXCMD) $(LIBFROG)
diff --git a/spaceman/defrag.c b/spaceman/defrag.c
new file mode 100644
index 00000000..c9732984
--- /dev/null
+++ b/spaceman/defrag.c
@@ -0,0 +1,198 @@
+// SPDX-License-Identifier: GPL-2.0
+/*
+ * Copyright (c) 2024 Oracle.
+ * All Rights Reserved.
+ */
+
+#include "libxfs.h"
+#include <linux/fiemap.h>
+#include <linux/fsmap.h>
+#include "libfrog/fsgeom.h"
+#include "command.h"
+#include "init.h"
+#include "libfrog/paths.h"
+#include "space.h"
+#include "input.h"
+
+/* defrag segment size limit in units of 512 bytes */
+#define MIN_SEGMENT_SIZE_LIMIT 8192 /* 4MiB */
+#define DEFAULT_SEGMENT_SIZE_LIMIT 32768 /* 16MiB */
+static int g_segment_size_lmt = DEFAULT_SEGMENT_SIZE_LIMIT;
+
+/* size of the defrag target file */
+static off_t g_defrag_file_size = 0;
+
+/* stats for the target file extents before defrag */
+struct ext_stats {
+ long nr_ext_total;
+ long nr_ext_unwritten;
+ long nr_ext_shared;
+};
+static struct ext_stats g_ext_stats;
+
+/*
+ * check if the target is a valid file to defrag
+ * also store file size
+ * returns:
+ * true for yes and false for no
+ */
+static bool
+defrag_check_file(char *path)
+{
+ struct statfs statfs_s;
+ struct stat stat_s;
+
+ if (access(path, F_OK|W_OK) == -1) {
+ if (errno == ENOENT)
+ fprintf(stderr, "file \"%s\" doesn't exist\n", path);
+ else
+ fprintf(stderr, "no access to \"%s\", %s\n", path,
+ strerror(errno));
+ return false;
+ }
+
+ if (stat(path, &stat_s) == -1) {
+ fprintf(stderr, "failed to get file info on \"%s\": %s\n",
+ path, strerror(errno));
+ return false;
+ }
+
+ g_defrag_file_size = stat_s.st_size;
+
+ if (!S_ISREG(stat_s.st_mode)) {
+ fprintf(stderr, "\"%s\" is not a regular file\n", path);
+ return false;
+ }
+
+ if (statfs(path, &statfs_s) == -1) {
+ fprintf(stderr, "failed to get FS info on \"%s\": %s\n",
+ path, strerror(errno));
+ return false;
+ }
+
+ if (statfs_s.f_type != XFS_SUPER_MAGIC) {
+ fprintf(stderr, "\"%s\" is not a xfs file\n", path);
+ return false;
+ }
+
+ return true;
+}
+
+/*
+ * defragment a file
+ * return 0 if successfully done, 1 otherwise
+ */
+static int
+defrag_xfs_defrag(char *file_path) {
+ int max_clone_us = 0, max_unshare_us = 0, max_punch_us = 0;
+ long nr_seg_defrag = 0, nr_ext_defrag = 0;
+ int scratch_fd = -1, defrag_fd = -1;
+ char tmp_file_path[PATH_MAX+1];
+ char *defrag_dir;
+ struct fsxattr fsx;
+ int ret = 0;
+
+ fsx.fsx_nextents = 0;
+ memset(&g_ext_stats, 0, sizeof(g_ext_stats));
+
+ if (!defrag_check_file(file_path)) {
+ ret = 1;
+ goto out;
+ }
+
+ defrag_fd = open(file_path, O_RDWR);
+ if (defrag_fd == -1) {
+ fprintf(stderr, "Opening %s failed. %s\n", file_path,
+ strerror(errno));
+ ret = 1;
+ goto out;
+ }
+
+ defrag_dir = dirname(file_path);
+ snprintf(tmp_file_path, PATH_MAX, "%s/.xfsdefrag_%d", defrag_dir,
+ getpid());
+ tmp_file_path[PATH_MAX] = 0;
+ scratch_fd = open(tmp_file_path, O_CREAT|O_EXCL|O_RDWR, 0600);
+ if (scratch_fd == -1) {
+ fprintf(stderr, "Opening temporary file %s failed. %s\n",
+ tmp_file_path, strerror(errno));
+ ret = 1;
+ goto out;
+ }
+out:
+ if (scratch_fd != -1) {
+ close(scratch_fd);
+ unlink(tmp_file_path);
+ }
+ if (defrag_fd != -1) {
+ ioctl(defrag_fd, FS_IOC_FSGETXATTR, &fsx);
+ close(defrag_fd);
+ }
+
+ printf("Pre-defrag %ld extents detected, %ld are \"unwritten\","
+ "%ld are \"shared\"\n",
+ g_ext_stats.nr_ext_total, g_ext_stats.nr_ext_unwritten,
+ g_ext_stats.nr_ext_shared);
+ printf("Tried to defragment %ld extents in %ld segments\n",
+ nr_ext_defrag, nr_seg_defrag);
+ printf("Time stats(ms): max clone: %d, max unshare: %d,"
+ " max punch_hole: %d\n",
+ max_clone_us/1000, max_unshare_us/1000, max_punch_us/1000);
+ printf("Post-defrag %u extents detected\n", fsx.fsx_nextents);
+ return ret;
+}
+
+
+static void defrag_help(void)
+{
+ printf(_(
+"\n"
+"Defragemnt files on XFS where reflink is enabled. IOs to the target files \n"
+"can be served durning the defragmentations.\n"
+"\n"
+" -s segment_size -- specify the segment size in MiB, minmum value is 4 \n"
+" default is 16\n"));
+}
+
+static cmdinfo_t defrag_cmd;
+
+static int
+defrag_f(int argc, char **argv)
+{
+ int i;
+ int c;
+
+ while ((c = getopt(argc, argv, "s:")) != EOF) {
+ switch(c) {
+ case 's':
+ g_segment_size_lmt = atoi(optarg) * 1024 * 1024 / 512;
+ if (g_segment_size_lmt < MIN_SEGMENT_SIZE_LIMIT) {
+ g_segment_size_lmt = MIN_SEGMENT_SIZE_LIMIT;
+ printf("Using minimium segment size %d\n",
+ g_segment_size_lmt);
+ }
+ break;
+ default:
+ command_usage(&defrag_cmd);
+ return 1;
+ }
+ }
+
+ for (i = 0; i < filecount; i++)
+ defrag_xfs_defrag(filetable[i].name);
+ return 0;
+}
+void defrag_init(void)
+{
+ defrag_cmd.name = "defrag";
+ defrag_cmd.altname = "dfg";
+ defrag_cmd.cfunc = defrag_f;
+ defrag_cmd.argmin = 0;
+ defrag_cmd.argmax = 4;
+ defrag_cmd.args = "[-s segment_size]";
+ defrag_cmd.flags = CMD_FLAG_ONESHOT;
+ defrag_cmd.oneline = _("Defragment XFS files");
+ defrag_cmd.help = defrag_help;
+
+ add_command(&defrag_cmd);
+}
diff --git a/spaceman/init.c b/spaceman/init.c
index cf1ff3cb..396f965c 100644
--- a/spaceman/init.c
+++ b/spaceman/init.c
@@ -35,6 +35,7 @@ init_commands(void)
trim_init();
freesp_init();
health_init();
+ defrag_init();
}
static int
diff --git a/spaceman/space.h b/spaceman/space.h
index 723209ed..c288aeb9 100644
--- a/spaceman/space.h
+++ b/spaceman/space.h
@@ -26,6 +26,7 @@ extern void help_init(void);
extern void prealloc_init(void);
extern void quit_init(void);
extern void trim_init(void);
+extern void defrag_init(void);
#ifdef HAVE_GETFSMAP
extern void freesp_init(void);
#else
--
2.39.3 (Apple Git-146)
next prev parent reply other threads:[~2024-07-09 19:10 UTC|newest]
Thread overview: 60+ messages / expand[flat|nested] mbox.gz Atom feed top
2024-07-09 19:10 [PATCH 0/9] introduce defrag to xfs_spaceman Wengang Wang
2024-07-09 19:10 ` Wengang Wang [this message]
2024-07-09 21:18 ` [PATCH 1/9] xfsprogs: introduce defrag command to spaceman Darrick J. Wong
2024-07-11 21:54 ` Wengang Wang
2024-07-15 21:30 ` Wengang Wang
2024-07-15 22:44 ` Darrick J. Wong
2024-07-09 19:10 ` [PATCH 2/9] spaceman/defrag: pick up segments from target file Wengang Wang
2024-07-09 21:50 ` [PATCH 2/9] spaceman/defrag: pick up segments from target fileOM Darrick J. Wong
2024-07-11 22:37 ` Wengang Wang
2024-07-15 23:40 ` [PATCH 2/9] spaceman/defrag: pick up segments from target file Dave Chinner
2024-07-16 20:23 ` Wengang Wang
2024-07-17 4:11 ` Dave Chinner
2024-07-18 19:03 ` Wengang Wang
2024-07-19 4:59 ` Dave Chinner
2024-07-19 4:01 ` Christoph Hellwig
2024-07-24 19:22 ` Wengang Wang
2024-07-30 22:13 ` Dave Chinner
2024-07-09 19:10 ` [PATCH 3/9] spaceman/defrag: defrag segments Wengang Wang
2024-07-09 21:57 ` Darrick J. Wong
2024-07-11 22:49 ` Wengang Wang
2024-07-12 19:07 ` Wengang Wang
2024-07-15 22:42 ` Darrick J. Wong
2024-07-16 0:08 ` Dave Chinner
2024-07-18 18:06 ` Wengang Wang
2024-07-09 19:10 ` [PATCH 4/9] spaceman/defrag: ctrl-c handler Wengang Wang
2024-07-09 21:08 ` Darrick J. Wong
2024-07-11 22:58 ` Wengang Wang
2024-07-15 22:56 ` Darrick J. Wong
2024-07-16 16:21 ` Wengang Wang
2024-07-09 19:10 ` [PATCH 5/9] spaceman/defrag: exclude shared segments on low free space Wengang Wang
2024-07-09 21:05 ` Darrick J. Wong
2024-07-11 23:08 ` Wengang Wang
2024-07-15 22:58 ` Darrick J. Wong
2024-07-09 19:10 ` [PATCH 6/9] spaceman/defrag: workaround kernel xfs_reflink_try_clear_inode_flag() Wengang Wang
2024-07-09 20:51 ` Darrick J. Wong
2024-07-11 23:11 ` Wengang Wang
2024-07-16 0:25 ` Dave Chinner
2024-07-18 18:24 ` Wengang Wang
2024-07-31 22:25 ` Dave Chinner
2024-07-09 19:10 ` [PATCH 7/9] spaceman/defrag: sleeps between segments Wengang Wang
2024-07-09 20:46 ` Darrick J. Wong
2024-07-11 23:26 ` Wengang Wang
2024-07-11 23:30 ` Wengang Wang
2024-07-09 19:10 ` [PATCH 8/9] spaceman/defrag: readahead for better performance Wengang Wang
2024-07-09 20:27 ` Darrick J. Wong
2024-07-11 23:29 ` Wengang Wang
2024-07-16 0:56 ` Dave Chinner
2024-07-18 18:40 ` Wengang Wang
2024-07-31 3:10 ` Dave Chinner
2024-08-02 18:31 ` Wengang Wang
2024-07-09 19:10 ` [PATCH 9/9] spaceman/defrag: warn on extsize Wengang Wang
2024-07-09 20:21 ` Darrick J. Wong
2024-07-11 23:36 ` Wengang Wang
2024-07-16 0:29 ` Dave Chinner
2024-07-22 18:01 ` Wengang Wang
2024-07-30 22:43 ` Dave Chinner
2024-07-15 23:03 ` [PATCH 0/9] introduce defrag to xfs_spaceman Dave Chinner
2024-07-16 19:45 ` Wengang Wang
2024-07-31 2:51 ` Dave Chinner
2024-08-02 18:14 ` Wengang Wang
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=20240709191028.2329-2-wen.gang.wang@oracle.com \
--to=wen.gang.wang@oracle.com \
--cc=linux-xfs@vger.kernel.org \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox