[PATCH] arm64: Add 5-level page table support for 4K pages with 52-bit VA

Xiaolei Wang xiaolei.wang at windriver.com
Mon May 18 20:17:06 PDT 2026


From: Xiaolei wang <xiaolei.wang at windriver.com>

makedumpfile fails with "PAGE SIZE 0x1000 and VA Bits 52 not supported"
on ARM64 systems configured with CONFIG_ARM64_VA_BITS_52=y and 4KB page
size. This combination requires 5-level page tables, which makedumpfile
does not currently support.

Add support for 5-level page tables on ARM64 by:
- Adding the P4D page table level definitions and helpers
- Updating pud_t to contain p4d_t (reflecting the correct hierarchy)
- Extending calculate_plat_config() to recognize 4K + 52-bit VA as
  pgtable_level=5, and 16K + 52-bit VA as pgtable_level=4
- Adding p4d_offset() to handle the additional translation level
- Updating vaddr_to_paddr_arm64() to walk through PGD->P4D->PUD->PMD->PTE
- Using vabits_actual instead of va_bits in calculate_plat_config() and
  PTRS_PER_PGD to correctly handle the case where the kernel is compiled
  with VA_BITS=52 but the hardware only supports 48-bit VA (runtime
  fallback to 4-level)

The pgtable_level assignments follow arch/arm64/Kconfig:
- 4K  + 52-bit VA → 5-level (the only 5-level configuration)
- 16K + 52-bit VA → 4-level
- 4K  + 48-bit VA → 4-level
- 16K + 48-bit VA → 4-level

Fixes: https://github.com/makedumpfile/makedumpfile/issues/18
Signed-off-by: Xiaolei Wang <xiaolei.wang at windriver.com>
---
 arch/arm64.c | 89 +++++++++++++++++++++++++++++++++++++++++++---------
 1 file changed, 74 insertions(+), 15 deletions(-)

diff --git a/arch/arm64.c b/arch/arm64.c
index 1072178..f3f33e4 100644
--- a/arch/arm64.c
+++ b/arch/arm64.c
@@ -29,6 +29,10 @@ typedef struct {
 
 typedef struct {
 	pgd_t pgd;
+} p4d_t;
+
+typedef struct {
+	p4d_t p4d;
 } pud_t;
 
 typedef struct {
@@ -42,6 +46,7 @@ typedef struct {
 #define __pte(x)	((pte_t) { (x) } )
 #define __pmd(x)	((pmd_t) { (x) } )
 #define __pud(x)	((pud_t) { (x) } )
+#define __p4d(x)	((p4d_t) { (x) } )
 #define __pgd(x)	((pgd_t) { (x) } )
 
 static int lpa_52_bit_support_available;
@@ -62,7 +67,8 @@ static unsigned long kimage_voffset;
 #define PAGE_OFFSET_48		((0xffffffffffffffffUL) << 48)
 
 #define pgd_val(x)		((x).pgd)
-#define pud_val(x)		(pgd_val((x).pgd))
+#define p4d_val(x)		(pgd_val((x).pgd))
+#define pud_val(x)		(p4d_val((x).p4d))
 #define pmd_val(x)		(pud_val((x).pud))
 #define pte_val(x)		((x).pte)
 
@@ -75,6 +81,7 @@ static unsigned long kimage_voffset;
 typedef unsigned long pteval_t;
 typedef unsigned long pmdval_t;
 typedef unsigned long pudval_t;
+typedef unsigned long p4dval_t;
 typedef unsigned long pgdval_t;
 
 #define PAGE_SHIFT	PAGESHIFT()
@@ -101,6 +108,14 @@ typedef unsigned long pgdval_t;
 #define PUD_MASK		(~(PUD_SIZE-1))
 #define PTRS_PER_PUD		PTRS_PER_PTE
 
+/*
+ * P4D_SHIFT determines the size a level 0 page table entry can map.
+ */
+#define P4D_SHIFT		ARM64_HW_PGTABLE_LEVEL_SHIFT(0)
+#define P4D_SIZE		(_AC(1, UL) << P4D_SHIFT)
+#define P4D_MASK		(~(P4D_SIZE-1))
+#define PTRS_PER_P4D		PTRS_PER_PTE
+
 /*
  * PGDIR_SHIFT determines the size a top-level page table entry can map
  * (depending on the configuration, this level can be 0, 1 or 2).
@@ -108,7 +123,7 @@ typedef unsigned long pgdval_t;
 #define PGDIR_SHIFT		ARM64_HW_PGTABLE_LEVEL_SHIFT(4 - (pgtable_level))
 #define PGDIR_SIZE		(_AC(1, UL) << PGDIR_SHIFT)
 #define PGDIR_MASK		(~(PGDIR_SIZE-1))
-#define PTRS_PER_PGD		(1 << ((va_bits) - PGDIR_SHIFT))
+#define PTRS_PER_PGD		(1 << ((vabits_actual) - PGDIR_SHIFT))
 
 /*
  * Section address mask and size definitions.
@@ -178,6 +193,22 @@ pgd_pte(pgd_t pgd)
 #define __pgd_to_phys(pgd)		__pte_to_phys(pgd_pte(pgd))
 #define pgd_offset(pgd, vaddr)		((pgd_t *)(pgd) + pgd_index(vaddr))
 
+/* P4D */
+#define p4d_index(vaddr)		(((vaddr) >> P4D_SHIFT) & (PTRS_PER_P4D - 1))
+
+static inline pte_t p4d_pte(p4d_t p4d)
+{
+	return __pte(p4d_val(p4d));
+}
+
+#define __p4d_to_phys(p4d)		__pte_to_phys(p4d_pte(p4d))
+
+static inline unsigned long
+p4d_page_paddr(p4d_t p4d)
+{
+	return __p4d_to_phys(p4d);
+}
+
 static inline pte_t pud_pte(pud_t pud)
 {
 	return __pte(pud_val(pud));
@@ -237,13 +268,22 @@ __pa(unsigned long vaddr)
 		return (vaddr - kimage_voffset);
 }
 
+static p4d_t *
+p4d_offset(pgd_t *pgda, pgd_t *pgdv, unsigned long vaddr)
+{
+	if (pgtable_level > 4)
+		return (p4d_t *)(pgd_page_paddr(*pgdv) + p4d_index(vaddr) * sizeof(p4d_t));
+	else
+		return (p4d_t *)(pgda);
+}
+
 static pud_t *
-pud_offset(pgd_t *pgda, pgd_t *pgdv, unsigned long vaddr)
+pud_offset(p4d_t *p4da, p4d_t *p4dv, unsigned long vaddr)
 {
 	if (pgtable_level > 3)
-		return (pud_t *)(pgd_page_paddr(*pgdv) + pud_index(vaddr) * sizeof(pud_t));
+		return (pud_t *)(p4d_page_paddr(*p4dv) + pud_index(vaddr) * sizeof(pud_t));
 	else
-		return (pud_t *)(pgda);
+		return (pud_t *)(p4da);
 }
 
 static pmd_t *
@@ -257,20 +297,32 @@ pmd_offset(pud_t *puda, pud_t *pudv, unsigned long vaddr)
 
 static int calculate_plat_config(void)
 {
-	/* derive pgtable_level as per arch/arm64/Kconfig */
-	if ((PAGESIZE() == SZ_16K && va_bits == 36) ||
-			(PAGESIZE() == SZ_64K && va_bits == 42)) {
+	/*
+	 * Derive pgtable_level as per arch/arm64/Kconfig.
+	 * Use vabits_actual (runtime VA size) rather than va_bits (compile-time)
+	 * because the kernel may reduce the VA space at boot if the hardware
+	 * does not support 52-bit VA (LVA). In that case va_bits=52 but
+	 * vabits_actual=48, and the page tables are 4-level, not 5-level.
+	 */
+	int va = vabits_actual;
+
+	if ((PAGESIZE() == SZ_16K && va == 36) ||
+			(PAGESIZE() == SZ_64K && va == 42)) {
 		pgtable_level = 2;
-	} else if ((PAGESIZE() == SZ_64K && va_bits == 48) ||
-			(PAGESIZE() == SZ_64K && va_bits == 52) ||
-			(PAGESIZE() == SZ_4K && va_bits == 39) ||
-			(PAGESIZE() == SZ_16K && va_bits == 47)) {
+	} else if ((PAGESIZE() == SZ_64K && va == 48) ||
+			(PAGESIZE() == SZ_64K && va == 52) ||
+			(PAGESIZE() == SZ_4K && va == 39) ||
+			(PAGESIZE() == SZ_16K && va == 47)) {
 		pgtable_level = 3;
-	} else if ((PAGESIZE() != SZ_64K && va_bits == 48)) {
+	} else if ((PAGESIZE() == SZ_4K && va == 48) ||
+			(PAGESIZE() == SZ_16K && va == 48) ||
+			(PAGESIZE() == SZ_16K && va == 52)) {
 		pgtable_level = 4;
+	} else if (PAGESIZE() == SZ_4K && va == 52) {
+		pgtable_level = 5;
 	} else {
 		ERRMSG("PAGE SIZE %#lx and VA Bits %d not supported\n",
-				PAGESIZE(), va_bits);
+				PAGESIZE(), va);
 		return FALSE;
 	}
 	DEBUG_MSG("pgtable_level: %d\n", pgtable_level);
@@ -548,6 +600,7 @@ vaddr_to_paddr_arm64(unsigned long vaddr)
 	unsigned long long paddr = NOT_PADDR;
 	unsigned long long swapper_phys;
 	pgd_t	*pgda, pgdv;
+	p4d_t	*p4da, p4dv;
 	pud_t	*puda, pudv;
 	pmd_t	*pmda, pmdv;
 	pte_t 	*ptea, ptev;
@@ -565,7 +618,13 @@ vaddr_to_paddr_arm64(unsigned long vaddr)
 		return NOT_PADDR;
 	}
 
-	puda = pud_offset(pgda, &pgdv, vaddr);
+	p4da = p4d_offset(pgda, &pgdv, vaddr);
+	if (!readmem(PADDR, (unsigned long long)p4da, &p4dv, sizeof(p4dv))) {
+		ERRMSG("Can't read p4d\n");
+		return NOT_PADDR;
+	}
+
+	puda = pud_offset(p4da, &p4dv, vaddr);
 	if (!readmem(PADDR, (unsigned long long)puda, &pudv, sizeof(pudv))) {
 		ERRMSG("Can't read pud\n");
 		return NOT_PADDR;
-- 
2.43.0




More information about the kexec mailing list