[RFC 1/7] mm: add generic dual-bitmap consistency primitives

From: Sasha Levin

Date: Fri Apr 24 2026 - 10:01:57 EST


From: Sasha Levin <sashal@xxxxxxxxxx>

Add a header-only library implementing a pair-of-complementary-bitmaps
integrity primitive: maintain two bitmaps where primary[i] == !secondary[i]
for every bit i, and detect corruption by checking that invariant.

The motivation (silent metadata corruption that KASAN/KFENCE cannot see,
plus the functional-safety argument for wanting this in the kernel) is
described in the cover letter; this patch only introduces the building
block.

The primary bitmap uses 1 for "allocated" and 0 for "free"; the secondary
uses the opposite convention. dual_bitmap_set() and dual_bitmap_clear()
update both bitmaps and return the previous primary bit so callers can
distinguish a real state transition from a double-alloc or double-free.
dual_bitmap_validate() walks every word and returns the number of words
that fail the invariant.

Concurrency note: set and clear perform two independent atomic bit
operations against the primary and secondary bitmaps, so the invariant
is transiently violated between those two ops. A concurrent reader can
observe an inconsistent pair on a healthy kernel. The validation
helpers absorb this by retrying a small number of times with cpu_relax()
and, after the retries, issuing an smp_rmb() and re-reading. Real
corruption is persistent and survives the retries; transient races
resolve within a few cpu_relax() loops. This keeps the update path
lock-free at the cost of a bounded false-positive probability under
extreme write rates, which is acceptable for a fail-stop integrity
check.

Based-on-patch-by: Sanif Veeras <sveeras@xxxxxxxxxx>
Assisted-by: Claude:claude-opus-4-7 <noreply@xxxxxxxxxxxxx>
Signed-off-by: Sasha Levin <sashal@xxxxxxxxxx>
---
MAINTAINERS | 10 ++
include/linux/dual_bitmap.h | 216 ++++++++++++++++++++++++++++++++++++
2 files changed, 226 insertions(+)
create mode 100644 include/linux/dual_bitmap.h

diff --git a/MAINTAINERS b/MAINTAINERS
index d1cc0e12fe1f..81b1f44215b3 100644
--- a/MAINTAINERS
+++ b/MAINTAINERS
@@ -19972,6 +19972,16 @@ F: mm/page-writeback.c
F: mm/readahead.c
F: mm/truncate.c

+PAGE CONSISTENCY CHECKER
+M: Sasha Levin <sashal@xxxxxxxxxx>
+L: linux-mm@xxxxxxxxx
+S: Maintained
+F: Documentation/mm/page_consistency.rst
+F: include/linux/dual_bitmap.h
+F: include/linux/page_consistency.h
+F: mm/page_consistency.c
+F: mm/page_consistency_test.c
+
PAGE POOL
M: Jesper Dangaard Brouer <hawk@xxxxxxxxxx>
M: Ilias Apalodimas <ilias.apalodimas@xxxxxxxxxx>
diff --git a/include/linux/dual_bitmap.h b/include/linux/dual_bitmap.h
new file mode 100644
index 000000000000..136822267be1
--- /dev/null
+++ b/include/linux/dual_bitmap.h
@@ -0,0 +1,216 @@
+/* SPDX-License-Identifier: GPL-2.0 */
+/*
+ * Dual-bitmap consistency primitives
+ *
+ * Provides a generic library for maintaining dual bitmaps with the invariant
+ * that (primary == ~secondary). This pattern is useful for detecting
+ * single-bit memory corruption in bitmap-based data structures.
+ *
+ * Based on NVIDIA safety research.
+ */
+#ifndef _LINUX_DUAL_BITMAP_H
+#define _LINUX_DUAL_BITMAP_H
+
+#include <linux/types.h>
+#include <linux/bitops.h>
+#include <linux/bitmap.h>
+#include <linux/bug.h>
+#include <asm/barrier.h>
+#include <linux/processor.h>
+
+/* Number of retries for transient inconsistencies from concurrent updates */
+#define DUAL_BITMAP_RETRY_COUNT 3
+
+/* Bitmap indices */
+enum dual_bitmap_index {
+ DUAL_BITMAP_PRIMARY = 0, /* 0=free, 1=allocated */
+ DUAL_BITMAP_SECONDARY = 1, /* 0=allocated, 1=free (complement) */
+ DUAL_BITMAP_COUNT = 2
+};
+
+/**
+ * struct dual_bitmap - Dual bitmap structure
+ * @bitmap: Array of two bitmap pointers [PRIMARY, SECONDARY]
+ * @nbits: Number of bits in each bitmap
+ */
+struct dual_bitmap {
+ unsigned long *bitmap[DUAL_BITMAP_COUNT];
+ unsigned int nbits;
+};
+
+/**
+ * dual_bitmap_consistent_word - Check if a word pair maintains the invariant
+ * @primary: Primary bitmap word
+ * @secondary: Secondary bitmap word
+ *
+ * Returns true if primary == ~secondary
+ */
+static inline bool dual_bitmap_consistent_word(unsigned long primary,
+ unsigned long secondary)
+{
+ return primary == ~secondary;
+}
+
+/**
+ * dual_bitmap_set - Set bit in dual bitmap (mark as allocated)
+ * @db: Dual bitmap structure
+ * @bit: Bit position to set
+ *
+ * Sets bit in primary and clears corresponding bit in secondary.
+ * Returns the old value of the primary bit (true if was already set).
+ */
+static inline bool dual_bitmap_set(struct dual_bitmap *db, unsigned long bit)
+{
+ bool was_set;
+
+ if (WARN_ON_ONCE(bit >= db->nbits))
+ return false;
+
+ was_set = test_and_set_bit(bit, db->bitmap[DUAL_BITMAP_PRIMARY]);
+ test_and_clear_bit(bit, db->bitmap[DUAL_BITMAP_SECONDARY]);
+
+ return was_set;
+}
+
+/**
+ * dual_bitmap_clear - Clear bit in dual bitmap (mark as free)
+ * @db: Dual bitmap structure
+ * @bit: Bit position to clear
+ *
+ * Clears bit in primary and sets corresponding bit in secondary.
+ * Returns the old value of the primary bit (true if was set).
+ */
+static inline bool dual_bitmap_clear(struct dual_bitmap *db, unsigned long bit)
+{
+ bool was_set;
+
+ if (WARN_ON_ONCE(bit >= db->nbits))
+ return false;
+
+ was_set = test_and_clear_bit(bit, db->bitmap[DUAL_BITMAP_PRIMARY]);
+ test_and_set_bit(bit, db->bitmap[DUAL_BITMAP_SECONDARY]);
+
+ return was_set;
+}
+
+/**
+ * dual_bitmap_test - Test if bit is set in primary bitmap
+ * @db: Dual bitmap structure
+ * @bit: Bit position to test
+ *
+ * Returns true if bit is set in primary (allocated), false if clear (free).
+ */
+static inline bool dual_bitmap_test(const struct dual_bitmap *db,
+ unsigned long bit)
+{
+ if (WARN_ON_ONCE(bit >= db->nbits))
+ return false;
+
+ return test_bit(bit, db->bitmap[DUAL_BITMAP_PRIMARY]);
+}
+
+/**
+ * dual_bitmap_consistent - Check consistency of a single bit
+ * @db: Dual bitmap structure
+ * @bit: Bit position to check
+ *
+ * Returns true if the bit values are consistent (primary != secondary).
+ * Uses retry logic to handle transient inconsistencies from concurrent
+ * updates - real corruption persists while races resolve quickly.
+ */
+static inline bool dual_bitmap_consistent(const struct dual_bitmap *db,
+ unsigned long bit)
+{
+ int retries = DUAL_BITMAP_RETRY_COUNT;
+
+ if (WARN_ON_ONCE(bit >= db->nbits))
+ return false;
+
+ do {
+ bool primary = test_bit(bit, db->bitmap[DUAL_BITMAP_PRIMARY]);
+ bool secondary = test_bit(bit, db->bitmap[DUAL_BITMAP_SECONDARY]);
+
+ if (primary != secondary)
+ return true; /* Consistent */
+
+ /* Inconsistent - could be transient race, retry */
+ cpu_relax();
+ } while (--retries > 0);
+
+ /*
+ * Inconsistent after retries. Issue a read barrier and check
+ * one last time to rule out stale/reordered reads.
+ *
+ * Note: the two test_bit() calls are still non-atomic w.r.t.
+ * each other, so a concurrent set/clear between them can cause
+ * a transient false positive. This is acceptable because real
+ * corruption is persistent and will be caught on the next check.
+ */
+ smp_rmb();
+ return test_bit(bit, db->bitmap[DUAL_BITMAP_PRIMARY]) !=
+ test_bit(bit, db->bitmap[DUAL_BITMAP_SECONDARY]);
+}
+
+/**
+ * dual_bitmap_validate - Validate entire dual bitmap
+ * @db: Dual bitmap structure
+ *
+ * Checks that the invariant (primary == ~secondary) holds for all words.
+ * Uses retry logic to handle transient inconsistencies from concurrent
+ * updates - real corruption persists while races resolve quickly.
+ * Returns the number of inconsistent words found (0 = all consistent).
+ *
+ * Note: this is a cold-path diagnostic function kept inline for
+ * header-only library simplicity. It should not be called in hot paths.
+ */
+static inline unsigned long dual_bitmap_validate(const struct dual_bitmap *db)
+{
+ unsigned int words = BITS_TO_LONGS(db->nbits);
+ unsigned long violations = 0;
+ unsigned int i;
+
+ for (i = 0; i < words; i++) {
+ unsigned long primary, secondary;
+ int retries = DUAL_BITMAP_RETRY_COUNT;
+
+ do {
+ primary = READ_ONCE(db->bitmap[DUAL_BITMAP_PRIMARY][i]);
+ secondary = READ_ONCE(db->bitmap[DUAL_BITMAP_SECONDARY][i]);
+
+ if (dual_bitmap_consistent_word(primary, secondary))
+ break; /* Consistent, move to next word */
+
+ cpu_relax();
+ } while (--retries > 0);
+
+ if (retries == 0) {
+ /*
+ * Inconsistent after retries. Issue a read
+ * barrier and re-read to rule out stale/reordered
+ * memory views before declaring corruption.
+ */
+ smp_rmb();
+ primary = READ_ONCE(db->bitmap[DUAL_BITMAP_PRIMARY][i]);
+ secondary = READ_ONCE(db->bitmap[DUAL_BITMAP_SECONDARY][i]);
+ if (!dual_bitmap_consistent_word(primary, secondary))
+ violations++;
+ }
+ }
+
+ return violations;
+}
+
+/**
+ * dual_bitmap_init - Initialize dual bitmap to empty state
+ * @db: Dual bitmap structure
+ *
+ * Sets primary to all zeros (nothing allocated) and secondary to all ones.
+ * The bitmaps must already be allocated before calling this.
+ */
+static inline void dual_bitmap_init(struct dual_bitmap *db)
+{
+ bitmap_zero(db->bitmap[DUAL_BITMAP_PRIMARY], db->nbits);
+ bitmap_fill(db->bitmap[DUAL_BITMAP_SECONDARY], db->nbits);
+}
+
+#endif /* _LINUX_DUAL_BITMAP_H */
--
2.53.0