* [PATCH] selftests/mm: add folio_split() and filemap_get_entry() race test
@ 2026-03-13 11:40 Zi Yan
2026-03-14 22:27 ` Andrew Morton
2026-03-15 0:03 ` Zi Yan
0 siblings, 2 replies; 6+ messages in thread
From: Zi Yan @ 2026-03-13 11:40 UTC (permalink / raw)
To: Andrew Morton
Cc: David Hildenbrand, Lorenzo Stoakes, Zi Yan, Hugh Dickins,
Baolin Wang, Liam R. Howlett, Nico Pache, Ryan Roberts, Dev Jain,
Barry Song, Lance Yang, Matthew Wilcox, Bas van Dijk, Eero Kelly,
Andrew Battat, Adam Bratschi-Kaye, linux-mm, linux-kernel,
linux-fsdevel
The added folio_split_race_test is a modified C port of the race condition
test from [1]. The test creates shmem huge pages shared by both a parent
and a child processes, where the parent process punches holes in the shmem
to cause folio_split() in the kernel and the child process reads the shmem
in 16 threads to cause filemap_get_entry() in the kernel.
filemap_get_entry() reads the folio and xarray split by folio_split()
locklessly. The original test[2] is written in rust and uses memfd (shmem
backed). This C port uses shmem directly.
Note: the initial rust to C conversion is done by Cursor.
Link: https://lore.kernel.org/all/CAKNNEtw5_kZomhkugedKMPOG-sxs5Q5OLumWJdiWXv+C9Yct0w@mail.gmail.com/ [1]
Link: https://github.com/dfinity/thp-madv-remove-test [2]
Signed-off-by: Zi Yan <ziy@nvidia.com>
Cc: Bas van Dijk <bas@dfinity.org>
Cc: Adam Bratschi-Kaye <adam.bratschikaye@dfinity.org>
---
tools/testing/selftests/mm/Makefile | 1 +
.../selftests/mm/folio_split_race_test.c | 380 ++++++++++++++++++
tools/testing/selftests/mm/run_vmtests.sh | 2 +
3 files changed, 383 insertions(+)
create mode 100644 tools/testing/selftests/mm/folio_split_race_test.c
diff --git a/tools/testing/selftests/mm/Makefile b/tools/testing/selftests/mm/Makefile
index 90fcca53a561b..3316d8a3b7e82 100644
--- a/tools/testing/selftests/mm/Makefile
+++ b/tools/testing/selftests/mm/Makefile
@@ -105,6 +105,7 @@ TEST_GEN_FILES += droppable
TEST_GEN_FILES += guard-regions
TEST_GEN_FILES += merge
TEST_GEN_FILES += rmap
+TEST_GEN_FILES += folio_split_race_test
ifneq ($(ARCH),arm64)
TEST_GEN_FILES += soft-dirty
diff --git a/tools/testing/selftests/mm/folio_split_race_test.c b/tools/testing/selftests/mm/folio_split_race_test.c
new file mode 100644
index 0000000000000..cf5a5666bab77
--- /dev/null
+++ b/tools/testing/selftests/mm/folio_split_race_test.c
@@ -0,0 +1,380 @@
+// SPDX-License-Identifier: GPL-2.0
+/*
+ * The parent process creates a shmem and forks. The child creates a THP on the
+ * mapping, fills all pages with known patterns, and then continuously verifies
+ * non-punched pages. The parent punches holes via MADV_REMOVE on the shmem
+ * while the child reads.
+ *
+ * It tests the race condition between folio_split() and filemap_get_entry(),
+ * where the hole punches on shmem lead to folio_split() and reading the shmem
+ * lead to filemap_get_entry().
+ */
+
+#define _GNU_SOURCE
+#include <assert.h>
+#include <errno.h>
+#include <linux/mman.h>
+#include <pthread.h>
+#include <stdatomic.h>
+#include <stdbool.h>
+#include <stdint.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <sys/mman.h>
+#include <sys/stat.h>
+#include <sys/wait.h>
+#include <unistd.h>
+#include "vm_util.h"
+#include "kselftest.h"
+#include "thp_settings.h"
+
+uint64_t page_size;
+uint64_t pmd_pagesize;
+#define NR_PMD_PAGE 5
+#define FILE_SIZE (pmd_pagesize * NR_PMD_PAGE)
+#define TOTAL_PAGES (FILE_SIZE / page_size)
+
+/* Every N-th to N+M-th pages are punched; not aligned with huge page boundaries. */
+#define PUNCH_INTERVAL 50 /* N */
+#define PUNCH_SIZE_FACTOR 3 /* M */
+
+#define NUM_READER_THREADS 16
+#define FILL_BYTE 0xAF
+#define NUM_ITERATIONS 100
+
+#define CHILD_READY 1
+#define CHILD_FAILED 2
+/* Shared control block: MAP_SHARED anonymous so parent and child see same values. */
+struct SharedCtl {
+ atomic_uint_fast32_t ready;
+ atomic_uint_fast32_t stop;
+ atomic_size_t child_failures;
+ atomic_size_t child_verified;
+};
+
+static int get_errno(void)
+{
+ return errno;
+}
+
+static void fill_page(unsigned char *base, size_t page_idx)
+{
+ unsigned char *page_ptr = base + page_idx * page_size;
+ uint64_t idx = (uint64_t)page_idx;
+
+ memset(page_ptr, FILL_BYTE, page_size);
+ memcpy(page_ptr, &idx, sizeof(idx));
+}
+
+/* Returns true if valid, false if corrupted. */
+static bool check_page(unsigned char *base, size_t page_idx)
+{
+ unsigned char *page_ptr = base + page_idx * page_size;
+ uint64_t expected_idx = (uint64_t)page_idx;
+ uint64_t got_idx;
+
+ memcpy(&got_idx, page_ptr, 8);
+
+ if (got_idx != expected_idx) {
+ size_t off;
+ int all_zero = 1;
+
+ for (off = 0; off < page_size; off++) {
+ if (page_ptr[off] != 0) {
+ all_zero = 0;
+ break;
+ }
+ }
+ if (all_zero) {
+ ksft_print_msg(
+ "CORRUPTED: page %zu (huge page %zu) is ALL ZEROS\n",
+ page_idx,
+ (page_idx * page_size) / pmd_pagesize);
+ } else {
+ ksft_print_msg(
+ "CORRUPTED: page %zu (huge page %zu): expected idx %zu, got %lu\n",
+ page_idx, (page_idx * page_size) / pmd_pagesize,
+ page_idx, (unsigned long)got_idx);
+ }
+ return false;
+ }
+ return true;
+}
+
+struct reader_arg {
+ unsigned char *base;
+ struct SharedCtl *ctl;
+ int tid;
+ atomic_size_t *failures;
+ atomic_size_t *verified;
+};
+
+static void *reader_thread(void *arg)
+{
+ struct reader_arg *ra = (struct reader_arg *)arg;
+ unsigned char *base = ra->base;
+ struct SharedCtl *ctl = ra->ctl;
+ int tid = ra->tid;
+ atomic_size_t *failures = ra->failures;
+ atomic_size_t *verified = ra->verified;
+ size_t page_idx;
+
+ while (atomic_load_explicit(&ctl->stop, memory_order_acquire) == 0) {
+ for (page_idx = (size_t)tid; page_idx < TOTAL_PAGES;
+ page_idx += NUM_READER_THREADS) {
+ if (page_idx % PUNCH_INTERVAL >= 0 &&
+ page_idx % PUNCH_INTERVAL < PUNCH_SIZE_FACTOR)
+ continue;
+ if (check_page(base, page_idx))
+ atomic_fetch_add_explicit(verified, 1,
+ memory_order_relaxed);
+ else
+ atomic_fetch_add_explicit(failures, 1,
+ memory_order_relaxed);
+ }
+ if (atomic_load_explicit(failures, memory_order_relaxed) > 0)
+ break;
+ }
+
+ return NULL;
+}
+
+static void child_reader_loop(unsigned char *base, struct SharedCtl *ctl)
+{
+ pthread_t threads[NUM_READER_THREADS];
+ struct reader_arg args[NUM_READER_THREADS];
+ atomic_size_t failures = 0;
+ atomic_size_t verified = 0;
+ size_t page_idx;
+ size_t recheck = 0;
+ int i;
+
+ for (i = 0; i < NUM_READER_THREADS; i++) {
+ args[i].base = base;
+ args[i].ctl = ctl;
+ args[i].tid = i;
+ args[i].failures = &failures;
+ args[i].verified = &verified;
+ if (pthread_create(&threads[i], NULL, reader_thread,
+ &args[i]) != 0)
+ ksft_exit_fail_msg("pthread_create failed\n");
+ }
+
+ for (i = 0; i < NUM_READER_THREADS; i++)
+ pthread_join(threads[i], NULL);
+
+ /* Post-sleep recheck */
+ usleep(1000); /* 1 ms */
+
+ for (page_idx = 0; page_idx < TOTAL_PAGES; page_idx++) {
+ if (page_idx % PUNCH_INTERVAL >= 0 &&
+ page_idx % PUNCH_INTERVAL < PUNCH_SIZE_FACTOR)
+ continue;
+ if (!check_page(base, page_idx))
+ recheck++;
+ }
+ if (recheck)
+ ksft_print_msg("post-sleep failures: %zu\n", recheck);
+
+ atomic_store_explicit(&ctl->child_failures,
+ atomic_load_explicit(&failures,
+ memory_order_relaxed),
+ memory_order_release);
+ atomic_store_explicit(&ctl->child_verified,
+ atomic_load_explicit(&verified,
+ memory_order_relaxed),
+ memory_order_release);
+}
+
+/* Returns number of corrupted pages. */
+static size_t verify_pages(unsigned char *base, const bool *is_punched)
+{
+ size_t failures = 0;
+ size_t page_idx;
+ size_t non_punched = 0;
+
+ for (page_idx = 0; page_idx < TOTAL_PAGES; page_idx++) {
+ if (is_punched[page_idx])
+ continue;
+ if (!check_page(base, page_idx)) {
+ failures++;
+ if (failures >= 100)
+ return failures;
+ }
+ non_punched++;
+ }
+ if (failures)
+ ksft_print_msg(" %zu non-punched pages are corrupted!\n",
+ failures);
+ return failures;
+}
+
+/* Run a single iteration. Returns total number of corrupted pages. */
+static size_t run_iteration(void)
+{
+ struct SharedCtl *ctl;
+ pid_t pid;
+ unsigned char *parent_base;
+ bool *is_punched;
+ size_t i;
+ size_t child_failures, child_verified, parent_failures;
+ int status;
+ size_t n_punched = 0;
+
+ ctl = (struct SharedCtl *)mmap(NULL, sizeof(struct SharedCtl), PROT_READ | PROT_WRITE,
+ MAP_SHARED | MAP_ANONYMOUS, -1, 0);
+ if (ctl == MAP_FAILED)
+ ksft_exit_fail_msg("mmap ctl failed: %d\n", get_errno());
+
+ memset(ctl, 0, sizeof(struct SharedCtl));
+
+ parent_base = mmap(NULL, FILE_SIZE, PROT_READ | PROT_WRITE,
+ MAP_SHARED | MAP_ANONYMOUS, -1, 0);
+
+ if (parent_base == MAP_FAILED)
+ ksft_exit_fail_msg("mmap failed: %d\n", get_errno());
+
+ pid = fork();
+ if (pid < 0)
+ ksft_exit_fail_msg("fork failed: %d\n", get_errno());
+
+ if (pid == 0) {
+ /* ---- Child process ---- */
+ unsigned char *child_base = parent_base;
+
+ if (madvise(child_base, FILE_SIZE, MADV_HUGEPAGE) != 0)
+ ksft_exit_fail_msg("madvise(MADV_HUGEPAGE) failed: %d\n",
+ get_errno());
+
+ for (i = 0; i < TOTAL_PAGES; i++)
+ fill_page(child_base, i);
+
+ if (!check_huge_shmem(child_base, NR_PMD_PAGE, pmd_pagesize)) {
+ atomic_store_explicit(&ctl->ready, CHILD_FAILED, memory_order_release);
+ ksft_print_msg("No shmem THP is allocated\n");
+ _exit(0);
+ }
+
+ atomic_store_explicit(&ctl->ready, CHILD_READY, memory_order_release);
+ child_reader_loop(child_base, ctl);
+
+ munmap(child_base, FILE_SIZE);
+ _exit(0);
+ }
+
+ /* ---- Parent process ---- */
+ while (atomic_load_explicit(&ctl->ready, memory_order_acquire) == 0)
+ usleep(1000);
+
+ if (ctl->ready == CHILD_FAILED)
+ ksft_exit_fail_msg("Child process error\n");
+
+ is_punched = calloc(TOTAL_PAGES, sizeof(bool));
+ if (!is_punched)
+ ksft_exit_fail_msg("calloc is_punched failed\n");
+
+ for (i = 0; i < TOTAL_PAGES; i++) {
+ int j;
+
+ if (i % PUNCH_INTERVAL != 0)
+ continue;
+ if (madvise(parent_base + i * page_size,
+ PUNCH_SIZE_FACTOR * page_size, MADV_REMOVE) != 0) {
+ ksft_exit_fail_msg(
+ "madvise(MADV_REMOVE) failed on page %zu: %d\n",
+ i, get_errno());
+ }
+ for (j = 0; j < PUNCH_SIZE_FACTOR && i + j < TOTAL_PAGES; j++)
+ is_punched[i + j] = true;
+
+ i += PUNCH_SIZE_FACTOR;
+
+ n_punched += PUNCH_SIZE_FACTOR;
+ }
+
+ atomic_store_explicit(&ctl->stop, 1, memory_order_release);
+
+ if (waitpid(pid, &status, 0) != pid)
+ ksft_exit_fail_msg("waitpid failed\n");
+
+ child_failures = atomic_load_explicit(&ctl->child_failures,
+ memory_order_acquire);
+ child_verified = atomic_load_explicit(&ctl->child_verified,
+ memory_order_acquire);
+ if (child_failures)
+ ksft_print_msg("Child: %zu pages verified, %zu failures\n",
+ child_verified, child_failures);
+
+ parent_failures = verify_pages(parent_base, is_punched);
+ if (parent_failures)
+ ksft_print_msg("Parent verification failures: %zu\n",
+ parent_failures);
+
+ munmap(parent_base, FILE_SIZE);
+ munmap(ctl, sizeof(struct SharedCtl));
+ free(is_punched);
+
+ (void)n_punched;
+ return child_failures + parent_failures;
+}
+
+int main(void)
+{
+ size_t iter;
+ size_t failures;
+ struct thp_settings current_settings;
+ bool failed = false;
+
+ ksft_print_header();
+
+ if (!thp_is_enabled())
+ ksft_exit_skip("Transparent Hugepages not available\n");
+
+ if (geteuid() != 0) {
+ ksft_print_msg("Please run the benchmark as root\n");
+ ksft_finished();
+ }
+
+ thp_save_settings();
+ thp_read_settings(¤t_settings);
+ current_settings.shmem_enabled = SHMEM_ADVISE;
+ thp_write_settings(¤t_settings);
+
+ ksft_set_plan(1);
+
+ page_size = getpagesize();
+ pmd_pagesize = read_pmd_pagesize();
+
+ ksft_print_msg("folio split race test\n");
+ ksft_print_msg("=======================================================\n");
+ ksft_print_msg("Shmem size: %zu MiB\n", FILE_SIZE / 1024 / 1024);
+ ksft_print_msg("Total pages: %zu\n", TOTAL_PAGES);
+ ksft_print_msg("Child readers: %d\n", NUM_READER_THREADS);
+ ksft_print_msg("Punching every %dth to %dth page\n", PUNCH_INTERVAL,
+ PUNCH_INTERVAL + PUNCH_SIZE_FACTOR);
+ ksft_print_msg("Iterations: %d\n", NUM_ITERATIONS);
+
+ for (iter = 1; iter <= NUM_ITERATIONS; iter++) {
+ failures = run_iteration();
+ if (failures > 0) {
+ failed = true;
+ ksft_print_msg(
+ "FAILED on iteration %zu: %zu pages corrupted by cross-process MADV_REMOVE!\n",
+ iter, failures);
+ break;
+ }
+ }
+
+ thp_restore_settings();
+
+ if (failed) {
+ ksft_test_result_fail("Test failed\n");
+ ksft_exit_fail();
+ } else {
+ ksft_test_result_pass("All %d iterations passed\n", NUM_ITERATIONS);
+ ksft_exit_pass();
+ }
+
+ return 0;
+}
diff --git a/tools/testing/selftests/mm/run_vmtests.sh b/tools/testing/selftests/mm/run_vmtests.sh
index a0b4d8a52980b..f54ec9d0edb8b 100755
--- a/tools/testing/selftests/mm/run_vmtests.sh
+++ b/tools/testing/selftests/mm/run_vmtests.sh
@@ -555,6 +555,8 @@ if [ -n "${MOUNTED_XFS}" ]; then
rm -f ${XFS_IMG}
fi
+CATEGORY="thp" run_test ./folio_split_race_test
+
CATEGORY="migration" run_test ./migration
CATEGORY="mkdirty" run_test ./mkdirty
--
2.51.0
^ permalink raw reply [flat|nested] 6+ messages in thread* Re: [PATCH] selftests/mm: add folio_split() and filemap_get_entry() race test
2026-03-13 11:40 [PATCH] selftests/mm: add folio_split() and filemap_get_entry() race test Zi Yan
@ 2026-03-14 22:27 ` Andrew Morton
2026-03-14 23:44 ` Zi Yan
2026-03-15 0:03 ` Zi Yan
1 sibling, 1 reply; 6+ messages in thread
From: Andrew Morton @ 2026-03-14 22:27 UTC (permalink / raw)
To: Zi Yan
Cc: David Hildenbrand, Lorenzo Stoakes, Hugh Dickins, Baolin Wang,
Liam R. Howlett, Nico Pache, Ryan Roberts, Dev Jain, Barry Song,
Lance Yang, Matthew Wilcox, Bas van Dijk, Eero Kelly,
Andrew Battat, Adam Bratschi-Kaye, linux-mm, linux-kernel,
linux-fsdevel
On Fri, 13 Mar 2026 07:40:37 -0400 Zi Yan <ziy@nvidia.com> wrote:
> The added folio_split_race_test is a modified C port of the race condition
> test from [1]. The test creates shmem huge pages shared by both a parent
> and a child processes, where the parent process punches holes in the shmem
> to cause folio_split() in the kernel and the child process reads the shmem
> in 16 threads to cause filemap_get_entry() in the kernel.
> filemap_get_entry() reads the folio and xarray split by folio_split()
> locklessly. The original test[2] is written in rust and uses memfd (shmem
> backed). This C port uses shmem directly.
Cool.
> Note: the initial rust to C conversion is done by Cursor.
Hence the CaMeLcAsE "struct SharedCtl". Fair enough.
> Link: https://lore.kernel.org/all/CAKNNEtw5_kZomhkugedKMPOG-sxs5Q5OLumWJdiWXv+C9Yct0w@mail.gmail.com/ [1]
> Link: https://github.com/dfinity/thp-madv-remove-test [2]
I couldn't immediately find any licensing info there. Bas and Adam,
please advise? And sending your Signed-off-by's would be appropriate.
Thanks.
^ permalink raw reply [flat|nested] 6+ messages in thread
* Re: [PATCH] selftests/mm: add folio_split() and filemap_get_entry() race test
2026-03-14 22:27 ` Andrew Morton
@ 2026-03-14 23:44 ` Zi Yan
0 siblings, 0 replies; 6+ messages in thread
From: Zi Yan @ 2026-03-14 23:44 UTC (permalink / raw)
To: Andrew Morton
Cc: David Hildenbrand, Lorenzo Stoakes, Hugh Dickins, Baolin Wang,
Liam R. Howlett, Nico Pache, Ryan Roberts, Dev Jain, Barry Song,
Lance Yang, Matthew Wilcox, Bas van Dijk, Eero Kelly,
Andrew Battat, Adam Bratschi-Kaye, linux-mm, linux-kernel,
linux-fsdevel
On 14 Mar 2026, at 18:27, Andrew Morton wrote:
> On Fri, 13 Mar 2026 07:40:37 -0400 Zi Yan <ziy@nvidia.com> wrote:
>
>> The added folio_split_race_test is a modified C port of the race condition
>> test from [1]. The test creates shmem huge pages shared by both a parent
>> and a child processes, where the parent process punches holes in the shmem
>> to cause folio_split() in the kernel and the child process reads the shmem
>> in 16 threads to cause filemap_get_entry() in the kernel.
>> filemap_get_entry() reads the folio and xarray split by folio_split()
>> locklessly. The original test[2] is written in rust and uses memfd (shmem
>> backed). This C port uses shmem directly.
>
> Cool.
>
>> Note: the initial rust to C conversion is done by Cursor.
>
> Hence the CaMeLcAsE "struct SharedCtl". Fair enough.
Will change it to struct shared_ctl.
I also got some AI feedback[1] on this test program and will fix them
in a new version. I will send the new one late next week, so that I can
get feedback from human. :)
I will post the AI feedback inline in a separate email.
[1] https://sashiko.dev/#/patchset/20260313114037.3593642-1-ziy%40nvidia.com
>
>> Link: https://lore.kernel.org/all/CAKNNEtw5_kZomhkugedKMPOG-sxs5Q5OLumWJdiWXv+C9Yct0w@mail.gmail.com/ [1]
>> Link: https://github.com/dfinity/thp-madv-remove-test [2]
>
> I couldn't immediately find any licensing info there. Bas and Adam,
> please advise? And sending your Signed-off-by's would be appropriate.
>
> Thanks.
--
Best Regards,
Yan, Zi
^ permalink raw reply [flat|nested] 6+ messages in thread
* Re: [PATCH] selftests/mm: add folio_split() and filemap_get_entry() race test
2026-03-13 11:40 [PATCH] selftests/mm: add folio_split() and filemap_get_entry() race test Zi Yan
2026-03-14 22:27 ` Andrew Morton
@ 2026-03-15 0:03 ` Zi Yan
2026-03-17 7:31 ` [External Sender] " Adam Bratschi-Kaye
1 sibling, 1 reply; 6+ messages in thread
From: Zi Yan @ 2026-03-15 0:03 UTC (permalink / raw)
To: Andrew Morton
Cc: David Hildenbrand, Lorenzo Stoakes, Zi Yan, Hugh Dickins,
Baolin Wang, Liam R. Howlett, Nico Pache, Ryan Roberts, Dev Jain,
Barry Song, Lance Yang, Matthew Wilcox, Bas van Dijk, Eero Kelly,
Andrew Battat, Adam Bratschi-Kaye, linux-mm, linux-kernel,
linux-fsdevel
On 13 Mar 2026, at 7:40, Zi Yan wrote:
> The added folio_split_race_test is a modified C port of the race condition
> test from [1]. The test creates shmem huge pages shared by both a parent
> and a child processes, where the parent process punches holes in the shmem
> to cause folio_split() in the kernel and the child process reads the shmem
> in 16 threads to cause filemap_get_entry() in the kernel.
> filemap_get_entry() reads the folio and xarray split by folio_split()
> locklessly. The original test[2] is written in rust and uses memfd (shmem
> backed). This C port uses shmem directly.
>
> Note: the initial rust to C conversion is done by Cursor.
>
> Link: https://lore.kernel.org/all/CAKNNEtw5_kZomhkugedKMPOG-sxs5Q5OLumWJdiWXv+C9Yct0w@mail.gmail.com/ [1]
> Link: https://github.com/dfinity/thp-madv-remove-test [2]
> Signed-off-by: Zi Yan <ziy@nvidia.com>
> Cc: Bas van Dijk <bas@dfinity.org>
> Cc: Adam Bratschi-Kaye <adam.bratschikaye@dfinity.org>
> ---
> tools/testing/selftests/mm/Makefile | 1 +
> .../selftests/mm/folio_split_race_test.c | 380 ++++++++++++++++++
> tools/testing/selftests/mm/run_vmtests.sh | 2 +
> 3 files changed, 383 insertions(+)
> create mode 100644 tools/testing/selftests/mm/folio_split_race_test.c
I got some AI feedback from[1].
[1] https://sashiko.dev/#/patchset/20260313114037.3593642-1-ziy%40nvidia.com
<snip>
> diff --git a/tools/testing/selftests/mm/folio_split_race_test.c b/tools/testing/selftests/mm/folio_split_race_test.c
> new file mode 100644
> index 0000000000000..cf5a5666bab77
> --- /dev/null
> +++ b/tools/testing/selftests/mm/folio_split_race_test.c
<snip>
> +static void *reader_thread(void *arg)
> +{
> + struct reader_arg *ra = (struct reader_arg *)arg;
> + unsigned char *base = ra->base;
> + struct SharedCtl *ctl = ra->ctl;
> + int tid = ra->tid;
> + atomic_size_t *failures = ra->failures;
> + atomic_size_t *verified = ra->verified;
> + size_t page_idx;
> +
> + while (atomic_load_explicit(&ctl->stop, memory_order_acquire) == 0) {
If parent exits early without setting ctl->stop to 1, child will loop
forever.
I will add prctl(PR_SET_PDEATHSIG, SIGTERM) at the beginning of
child, so that child gets TERM when parent exits.
> + for (page_idx = (size_t)tid; page_idx < TOTAL_PAGES;
> + page_idx += NUM_READER_THREADS) {
> + if (page_idx % PUNCH_INTERVAL >= 0 &&
> + page_idx % PUNCH_INTERVAL < PUNCH_SIZE_FACTOR)
page_idx % PUNCH_INTERVAL >= 0 is a nop, since page_idx is unsigned.
I will leave it as is to show the range of page_idx % PUNCH_INTERVAL.
<snip>
> +/* Run a single iteration. Returns total number of corrupted pages. */
> +static size_t run_iteration(void)
> +{
> + struct SharedCtl *ctl;
> + pid_t pid;
> + unsigned char *parent_base;
> + bool *is_punched;
> + size_t i;
> + size_t child_failures, child_verified, parent_failures;
> + int status;
> + size_t n_punched = 0;
> +
<snip>
> +
> + /* ---- Parent process ---- */
> + while (atomic_load_explicit(&ctl->ready, memory_order_acquire) == 0)
> + usleep(1000);
If child exits/crashes without setting ctl->ready, parent can loop forever.
I will add waitpid(pid, &status, WNOHANG) == pid to check child status
and break if child is gone.
<snip>
> +
> + atomic_store_explicit(&ctl->stop, 1, memory_order_release);
> +
> + if (waitpid(pid, &status, 0) != pid)
> + ksft_exit_fail_msg("waitpid failed\n");
> +
> + child_failures = atomic_load_explicit(&ctl->child_failures,
> + memory_order_acquire);
If child exits abnormally without setting ctl->child_failures, we will
miss an issue.
I will inspect child exit status and fail the test if child exits abnormally.
<snip>
> +int main(void)
> +{
> + size_t iter;
> + size_t failures;
> + struct thp_settings current_settings;
> + bool failed = false;
> +
> + ksft_print_header();
> +
> + if (!thp_is_enabled())
> + ksft_exit_skip("Transparent Hugepages not available\n");
> +
> + if (geteuid() != 0) {
> + ksft_print_msg("Please run the benchmark as root\n");
> + ksft_finished();
> + }
ksft_finished() here leads to a PASS status.
Will use ksft_exit_skip() instead.
> +
> + thp_save_settings();
> + thp_read_settings(¤t_settings);
> + current_settings.shmem_enabled = SHMEM_ADVISE;
> + thp_write_settings(¤t_settings);
> +
> + ksft_set_plan(1);
> +
<snip>
> + for (iter = 1; iter <= NUM_ITERATIONS; iter++) {
> + failures = run_iteration();
run_iteration() has several ksft_exit_fail_msg() or if it crashes,
THP settings are not restored.
Will add signal handlers and atexit() to call thp_restore_settings().
> + if (failures > 0) {
> + failed = true;
> + ksft_print_msg(
> + "FAILED on iteration %zu: %zu pages corrupted by cross-process MADV_REMOVE!\n",
> + iter, failures);
> + break;
> + }
> + }
> +
> + thp_restore_settings();
> +
> + if (failed) {
> + ksft_test_result_fail("Test failed\n");
> + ksft_exit_fail();
> + } else {
> + ksft_test_result_pass("All %d iterations passed\n", NUM_ITERATIONS);
> + ksft_exit_pass();
> + }
> +
> + return 0;
> +}
--
Best Regards,
Yan, Zi
^ permalink raw reply [flat|nested] 6+ messages in thread* Re: [External Sender] Re: [PATCH] selftests/mm: add folio_split() and filemap_get_entry() race test
2026-03-15 0:03 ` Zi Yan
@ 2026-03-17 7:31 ` Adam Bratschi-Kaye
2026-03-17 9:43 ` Bas van Dijk
0 siblings, 1 reply; 6+ messages in thread
From: Adam Bratschi-Kaye @ 2026-03-17 7:31 UTC (permalink / raw)
To: Zi Yan
Cc: Andrew Morton, David Hildenbrand, Lorenzo Stoakes, Hugh Dickins,
Baolin Wang, Liam R. Howlett, Nico Pache, Ryan Roberts, Dev Jain,
Barry Song, Lance Yang, Matthew Wilcox, Bas van Dijk, Eero Kelly,
Andrew Battat, linux-mm, linux-kernel, linux-fsdevel
On 13 Mar 2026, at 7:40, Zi Yan wrote:
> The added folio_split_race_test is a modified C port of the race condition
> test from [1]. The test creates shmem huge pages shared by both a parent
> and a child processes, where the parent process punches holes in the shmem
> to cause folio_split() in the kernel and the child process reads the shmem
> in 16 threads to cause filemap_get_entry() in the kernel.
Note that the fork isn't actually necessary to reproduce the issue. I
had it working as
well with the reading and punching in the same process, but just with
two separate
mappings. Not that it makes much of a difference - just in case you
wanted to simplify
the test.
On 14 Mar 2026, at 18:27, Andrew Morton wrote:
> I couldn't immediately find any licensing info there. Bas and Adam,
> please advise?
GPL-2.0 license is fine by me.
> And sending your Signed-off-by's would be appropriate.
No problem:
Signed-off-by: Adam Bratschi-Kaye <adam.bratschikaye@dfinity.org>
Thanks,
Adam
^ permalink raw reply [flat|nested] 6+ messages in thread
* Re: [External Sender] Re: [PATCH] selftests/mm: add folio_split() and filemap_get_entry() race test
2026-03-17 7:31 ` [External Sender] " Adam Bratschi-Kaye
@ 2026-03-17 9:43 ` Bas van Dijk
0 siblings, 0 replies; 6+ messages in thread
From: Bas van Dijk @ 2026-03-17 9:43 UTC (permalink / raw)
To: Andrew Morton
Cc: Zi Yan, Adam Bratschi-Kaye, David Hildenbrand, Lorenzo Stoakes,
Hugh Dickins, Baolin Wang, Liam R. Howlett, Nico Pache,
Ryan Roberts, Dev Jain, Barry Song, Lance Yang, Matthew Wilcox,
Eero Kelly, Andrew Battat, linux-mm, linux-kernel, linux-fsdevel
No problem for me either.
Signed-off-by: Bas van Dijk <bas@dfinity.org>
I'll add a GPL-2.0 license to the repo.
On Tue, Mar 17, 2026 at 8:32 AM Adam Bratschi-Kaye
<adam.bratschikaye@dfinity.org> wrote:
>
> On 13 Mar 2026, at 7:40, Zi Yan wrote:
> > The added folio_split_race_test is a modified C port of the race condition
> > test from [1]. The test creates shmem huge pages shared by both a parent
> > and a child processes, where the parent process punches holes in the shmem
> > to cause folio_split() in the kernel and the child process reads the shmem
> > in 16 threads to cause filemap_get_entry() in the kernel.
>
> Note that the fork isn't actually necessary to reproduce the issue. I
> had it working as
> well with the reading and punching in the same process, but just with
> two separate
> mappings. Not that it makes much of a difference - just in case you
> wanted to simplify
> the test.
>
> On 14 Mar 2026, at 18:27, Andrew Morton wrote:
> > I couldn't immediately find any licensing info there. Bas and Adam,
> > please advise?
>
> GPL-2.0 license is fine by me.
>
> > And sending your Signed-off-by's would be appropriate.
>
> No problem:
>
> Signed-off-by: Adam Bratschi-Kaye <adam.bratschikaye@dfinity.org>
>
> Thanks,
> Adam
^ permalink raw reply [flat|nested] 6+ messages in thread
end of thread, other threads:[~2026-03-17 9:44 UTC | newest]
Thread overview: 6+ messages (download: mbox.gz / follow: Atom feed)
-- links below jump to the message on this page --
2026-03-13 11:40 [PATCH] selftests/mm: add folio_split() and filemap_get_entry() race test Zi Yan
2026-03-14 22:27 ` Andrew Morton
2026-03-14 23:44 ` Zi Yan
2026-03-15 0:03 ` Zi Yan
2026-03-17 7:31 ` [External Sender] " Adam Bratschi-Kaye
2026-03-17 9:43 ` Bas van Dijk
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox