public inbox for linux-mm@kvack.org
 help / color / mirror / Atom feed
From: "David Hildenbrand (Arm)" <david@kernel.org>
To: Li Wang <liwang@redhat.com>,
	akpm@linux-foundation.org, rppt@kernel.org, ljs@kernel.org,
	Liam.Howlett@oracle.com, vbabka@kernel.org, surenb@google.com,
	mhocko@suse.com, shuah@kernel.org
Cc: aubaker@redhat.com, linux-mm@kvack.org,
	linux-kselftest@vger.kernel.org, linux-kernel@vger.kernel.org,
	linux-fsdevel@vger.kernel.org
Subject: Re: [PATCH v3] selftests/mm: skip hugetlb_dio tests when DIO alignment is incompatible
Date: Mon, 30 Mar 2026 08:02:01 +0200	[thread overview]
Message-ID: <a5b7add7-0507-40c0-a324-81f243ffa261@kernel.org> (raw)
In-Reply-To: <20260330053915.75442-1-liwang@redhat.com>

On 3/30/26 07:39, Li Wang wrote:
> hugetlb_dio test uses sub-page offsets (pagesize / 2) to verify that
> hugepages used as DIO user buffers are correctly unpinned at completion.
> 
> However, on filesystems with a logical block size larger than half the
> page size (e.g., 4K-sector block devices), these unaligned DIO writes
> are rejected with -EINVAL, causing the test to fail unexpectedly.
> 
> Add get_dio_alignment() to query the filesystem's required DIO alignment
> via statx(STATX_DIOALIGN) and pass it to run_dio_using_hugetlb(). Skip
> individual test cases whose writesize/buf-offset is not a multiple of the
> alignment, so that aligned cases are still tested.
> 
> === Reproduce Steps ===
> 
>   # dd if=/dev/zero of=/tmp/test.img bs=1M count=512
>   # losetup --sector-size 4096 /dev/loop0 /tmp/test.img
>   # mkfs.xfs /dev/loop0
>   # mkdir -p /mnt/dio_test
>   # mount /dev/loop0 /mnt/dio_test
> 
>   // Modify test to open /mnt/dio_test and rebuild it:
>   -       fd = open("/tmp", O_TMPFILE | O_RDWR | O_DIRECT, 0664);
>   +       fd = open("/mnt/dio_test", O_TMPFILE | O_RDWR | O_DIRECT, 0664);
> 
>   # getconf PAGESIZE
>   4096
> 
>   # echo 100 >/proc/sys/vm/nr_hugepages
> 
>   # ./hugetlb_dio
>   TAP version 13
>   1..4
>   # No. Free pages before allocation : 100
>   # No. Free pages after munmap : 100
>   ok 1 free huge pages from 0-12288
>   Bail out! Error writing to file
>   : Invalid argument (22)
>   # Planned tests != run tests (4 != 1)
>   # Totals: pass:1 fail:0 xfail:0 xpass:0 skip:0 error:0
> 
> Signed-off-by: Li Wang <liwang@redhat.com>
> ---
> 
> Notes:
>     v3:
>     	- Adopt statx raw syscall to build on older glibc.
>     	- add buf offset alignment check as well
>     v2:
>     	- Pass dio_align as a parameter to run_dio_using_hugetlb()
>     	  instead of generally page_size/2 alignment check.
>     	- Add O_DIRECT flag back to the first open().
>     	- Add stx_dio_offset_align zero check.
> 
>  tools/testing/selftests/mm/hugetlb_dio.c | 62 +++++++++++++++++-------
>  1 file changed, 45 insertions(+), 17 deletions(-)
> 
> diff --git a/tools/testing/selftests/mm/hugetlb_dio.c b/tools/testing/selftests/mm/hugetlb_dio.c
> index 9ac62eb4c97d..b125092fc6c1 100644
> --- a/tools/testing/selftests/mm/hugetlb_dio.c
> +++ b/tools/testing/selftests/mm/hugetlb_dio.c
> @@ -17,10 +17,41 @@
>  #include <unistd.h>
>  #include <string.h>
>  #include <sys/mman.h>
> +#include <sys/syscall.h>
>  #include "vm_util.h"
>  #include "kselftest.h"
>  
> -void run_dio_using_hugetlb(unsigned int start_off, unsigned int end_off)
> +#define HP_DIO_TMPDIR "/tmp"
> +
> +#ifndef STATX_DIOALIGN
> +#define STATX_DIOALIGN		0x00002000U
> +#endif
> +
> +unsigned int get_dio_alignment(void)
> +{
> +	int fd, ret;
> +	struct statx stx;
> +	unsigned int dio_align = 1;
> +
> +	fd = open(HP_DIO_TMPDIR, O_TMPFILE | O_RDWR | O_DIRECT, 0664);
> +	if (fd < 0)
> +		ksft_exit_skip("Unable to allocate file: %s\n", strerror(errno));
> +
> +	ret = syscall(__NR_statx, fd, "", AT_EMPTY_PATH, STATX_DIOALIGN, &stx);
> +	if (ret < 0) {
> +		ksft_perror("statx() failed");
> +	} else if ((stx.stx_mask & STATX_DIOALIGN) &&
> +			stx.stx_dio_offset_align) {
> +		dio_align = stx.stx_dio_offset_align;
> +	}
> +
> +	close(fd);
> +
> +	return dio_align;
> +}
> +
> +void run_dio_using_hugetlb(unsigned int start_off, unsigned int end_off,
> +			unsigned int dio_align)
>  {
>  	int fd;
>  	char *buffer =  NULL;
> @@ -33,6 +64,12 @@ void run_dio_using_hugetlb(unsigned int start_off, unsigned int end_off)
>  	const int mmap_prot  = PROT_READ | PROT_WRITE;
>  
>  	writesize = end_off - start_off;
> +	if (start_off % dio_align != 0 || writesize % dio_align != 0) {
> +		ksft_test_result_skip("DIO alignment (%u) incompatible with "
> +				"buf offset %u and writesize %zu\n",
> +				dio_align, start_off, writesize);
> +		return;
> +	}
>  
>  	/* Get the default huge page size */
>  	h_pagesize = default_huge_page_size();
> @@ -40,7 +77,7 @@ void run_dio_using_hugetlb(unsigned int start_off, unsigned int end_off)
>  		ksft_exit_fail_msg("Unable to determine huge page size\n");
>  
>  	/* Open the file to DIO */

This comment is misleading: we are not opening "the" file, we are creating a new one.
See below; maybe we should clean that up.

> -	fd = open("/tmp", O_TMPFILE | O_RDWR | O_DIRECT, 0664);
> +	fd = open(HP_DIO_TMPDIR, O_TMPFILE | O_RDWR | O_DIRECT, 0664);
>  	if (fd < 0)
>  		ksft_exit_fail_perror("Error opening file\n");
>  
> @@ -89,37 +126,28 @@ void run_dio_using_hugetlb(unsigned int start_off, unsigned int end_off)
>  
>  int main(void)
>  {
> -	size_t pagesize = 0;
> -	int fd;
> +	size_t pagesize = psize();
> +	unsigned int dio_align = get_dio_alignment();

Both pagesize and dio_align could be const.

>  
>  	ksft_print_header();
>  
> -	/* Open the file to DIO */
> -	fd = open("/tmp", O_TMPFILE | O_RDWR | O_DIRECT, 0664);
> -	if (fd < 0)
> -		ksft_exit_skip("Unable to allocate file: %s\n", strerror(errno));
> -	close(fd);


Why can't we simply open the file once and pass the fd to run_dio_using_hugetlb()?

fd = open("/tmp", O_TMPFILE | O_RDWR | O_DIRECT, 0664);
if (fd < 0)
	ksft_exit_skip("Unable to allocate file: %s\n", strerror(errno));
dio_align = get_dio_alignment(fd);
if (dio_align <= 0)
	ksft_exit_skip("Unable to obtain DIO alignment: %s\n", strerror(errno));

...

run_dio_using_hugetlb(fd, 0, (pagesize * 3), dio_align);

> -
>  	/* Check if huge pages are free */
>  	if (!get_free_hugepages())
>  		ksft_exit_skip("No free hugepage, exiting\n");
>  
>  	ksft_set_plan(4);
>  
> -	/* Get base page size */
> -	pagesize  = psize();
> -
>  	/* start and end is aligned to pagesize */
> -	run_dio_using_hugetlb(0, (pagesize * 3));
> +	run_dio_using_hugetlb(0, (pagesize * 3), dio_align);
>  
>  	/* start is aligned but end is not aligned */
> -	run_dio_using_hugetlb(0, (pagesize * 3) - (pagesize / 2));
> +	run_dio_using_hugetlb(0, (pagesize * 3) - (pagesize / 2), dio_align);
>  
>  	/* start is unaligned and end is aligned */
> -	run_dio_using_hugetlb(pagesize / 2, (pagesize * 3));
> +	run_dio_using_hugetlb(pagesize / 2, (pagesize * 3), dio_align);
>  
>  	/* both start and end are unaligned */
> -	run_dio_using_hugetlb(pagesize / 2, (pagesize * 3) + (pagesize / 2));
> +	run_dio_using_hugetlb(pagesize / 2, (pagesize * 3) + (pagesize / 2), dio_align);
>  
>  	ksft_finished();
>  }


-- 
Cheers,

David


  reply	other threads:[~2026-03-30  6:02 UTC|newest]

Thread overview: 8+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2026-03-30  5:39 [PATCH v3] selftests/mm: skip hugetlb_dio tests when DIO alignment is incompatible Li Wang
2026-03-30  6:02 ` David Hildenbrand (Arm) [this message]
2026-03-30  7:23   ` Li Wang
2026-03-30 10:10     ` Li Wang
2026-03-30 10:43       ` David Hildenbrand (Arm)
2026-03-30 11:35         ` Li Wang
2026-03-30 11:57           ` Li Wang
2026-03-30  9:58 ` Li Wang

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=a5b7add7-0507-40c0-a324-81f243ffa261@kernel.org \
    --to=david@kernel.org \
    --cc=Liam.Howlett@oracle.com \
    --cc=akpm@linux-foundation.org \
    --cc=aubaker@redhat.com \
    --cc=linux-fsdevel@vger.kernel.org \
    --cc=linux-kernel@vger.kernel.org \
    --cc=linux-kselftest@vger.kernel.org \
    --cc=linux-mm@kvack.org \
    --cc=liwang@redhat.com \
    --cc=ljs@kernel.org \
    --cc=mhocko@suse.com \
    --cc=rppt@kernel.org \
    --cc=shuah@kernel.org \
    --cc=surenb@google.com \
    --cc=vbabka@kernel.org \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox