[PATCH] makedumpfile: ppc64: get vmalloc start address from vmcoreinfo

HAGIO KAZUHITO(萩尾 一仁) k-hagio-ab at nec.com
Tue Feb 27 20:51:28 PST 2024


Hi Aditya,

Thanks for the patch.

On 2024/02/24 4:03, Aditya Gupta wrote:
> Below error was noticed when running makedumpfile on linux-next kernel
> crash (linux-next tag next-20240121):
> 
>      ...
>      Checking for memory holes : [100.0 %] | readpage_elf: Attempt to read non-existent page at 0xc000000000000.
>      [ 17.551718] kdump.sh[404]: readmem: type_addr: 0, addr:c00c000000000000, size:16384
>      [ 17.551793] kdump.sh[404]: __exclude_unnecessary_pages: Can't read the buffer of struct page.
>      [ 17.551864] kdump.sh[404]: create_2nd_bitmap: Can't exclude unnecessary pages.
>      [ 17.562632] kdump.sh[404]: The kernel version is not supported.
>      [ 17.562708] kdump.sh[404]: The makedumpfile operation may be incomplete.
>      [ 17.562773] kdump.sh[404]: makedumpfile Failed.
>      [ 17.564335] kdump[406]: saving vmcore failed, _exitcode:1
> 
> Above error was due to 'vmap_area_list' and 'vmlist' symbols missing
> from the vmcore.
> 
> 'vmap_area_list' was removed in the linux kernel with below commit:
> 
>      commit 378eb24a0658dd922b29524e0ce35c6c43f56cba
>           mm/vmalloc: remove vmap_area_list
> 
> The same commit also introduced 'VMALLOC_START' in vmcoreinfo to get the
> base address of the vmalloc area, instead of depending on 'vmap_area_list'.
> 
> Hence if 'VMALLOC_START' symbol is there in vmcoreinfo:
>    1. Set vmalloc_start based on 'VMALLOC_START'
>    2. Don't error if vmap_area_list/vmlist are not defined
> 
> Reported-by: Sachin Sant <sachinp at linux.ibm.com>
> Signed-off-by: Aditya Gupta <adityag at linux.ibm.com>
> ---
>   arch/ppc64.c   | 19 +++++++++++++------
>   makedumpfile.c |  3 ++-
>   makedumpfile.h |  6 +++---
>   3 files changed, 18 insertions(+), 10 deletions(-)
> 
> diff --git a/arch/ppc64.c b/arch/ppc64.c
> index 96c357cb0335..bb62e2cd199a 100644
> --- a/arch/ppc64.c
> +++ b/arch/ppc64.c
> @@ -568,7 +568,9 @@ get_machdep_info_ppc64(void)
>   	/*
>   	 * Get vmalloc_start value from either vmap_area_list or vmlist.
>   	 */
> -	if ((SYMBOL(vmap_area_list) != NOT_FOUND_SYMBOL)
> +	if (NUMBER(vmalloc_start) != NOT_FOUND_SYMBOL) {

I will change this NOT_FOUND_SYMBOL to NOT_FOUND_NUMBER when applying;
otherwise makedumpfile will fail for a dumpfile from a kernel without the
corresponding kernel patch, correct?

Apart from that, the patch looks good to me.  I will apply it, with the
kernel version added to the commit log, after the kernel patch gets merged.

Thanks,
Kazu


> +		vmalloc_start = NUMBER(vmalloc_start);
> +	} else if ((SYMBOL(vmap_area_list) != NOT_FOUND_SYMBOL)
>   	    && (OFFSET(vmap_area.va_start) != NOT_FOUND_STRUCTURE)
>   	    && (OFFSET(vmap_area.list) != NOT_FOUND_STRUCTURE)) {
>   		if (!readmem(VADDR, SYMBOL(vmap_area_list) + OFFSET(list_head.next),
> @@ -684,11 +686,16 @@ vaddr_to_paddr_ppc64(unsigned long vaddr)
>   	if ((SYMBOL(vmap_area_list) == NOT_FOUND_SYMBOL)
>   	    || (OFFSET(vmap_area.va_start) == NOT_FOUND_STRUCTURE)
>   	    || (OFFSET(vmap_area.list) == NOT_FOUND_STRUCTURE)) {
> -		if ((SYMBOL(vmlist) == NOT_FOUND_SYMBOL)
> -		    || (OFFSET(vm_struct.addr) == NOT_FOUND_STRUCTURE)) {
> -			ERRMSG("Can't get info for vmalloc translation.\n");
> -			return NOT_PADDR;
> -		}
> +		/*
> +		 * Don't depend on vmap_area_list/vmlist if vmalloc_start is set in
> +		 * vmcoreinfo, in that case proceed without error
> +		 */
> +		if (NUMBER(vmalloc_start) == NOT_FOUND_NUMBER)
> +			if ((SYMBOL(vmlist) == NOT_FOUND_SYMBOL)
> +				|| (OFFSET(vm_struct.addr) == NOT_FOUND_STRUCTURE)) {
> +				ERRMSG("Can't get info for vmalloc translation.\n");
> +				return NOT_PADDR;
> +			}
>   	}
>   
>   	return ppc64_vtop_level4(vaddr);
> diff --git a/makedumpfile.c b/makedumpfile.c
> index b004b93fecb7..b6c63fad15f3 100644
> --- a/makedumpfile.c
> +++ b/makedumpfile.c
> @@ -2978,6 +2978,8 @@ read_vmcoreinfo(void)
>   	READ_NUMBER("PAGE_OFFLINE_MAPCOUNT_VALUE", PAGE_OFFLINE_MAPCOUNT_VALUE);
>   	READ_NUMBER("phys_base", phys_base);
>   	READ_NUMBER("KERNEL_IMAGE_SIZE", KERNEL_IMAGE_SIZE);
> +
> +	READ_NUMBER_UNSIGNED("VMALLOC_START", vmalloc_start);
>   #ifdef __aarch64__
>   	READ_NUMBER("VA_BITS", VA_BITS);
>   	READ_NUMBER("TCR_EL1_T1SZ", TCR_EL1_T1SZ);
> @@ -2989,7 +2991,6 @@ read_vmcoreinfo(void)
>   	READ_NUMBER("VA_BITS", va_bits);
>   	READ_NUMBER_UNSIGNED("phys_ram_base", phys_ram_base);
>   	READ_NUMBER_UNSIGNED("PAGE_OFFSET", page_offset);
> -	READ_NUMBER_UNSIGNED("VMALLOC_START", vmalloc_start);
>   	READ_NUMBER_UNSIGNED("VMALLOC_END", vmalloc_end);
>   	READ_NUMBER_UNSIGNED("VMEMMAP_START", vmemmap_start);
>   	READ_NUMBER_UNSIGNED("VMEMMAP_END", vmemmap_end);
> diff --git a/makedumpfile.h b/makedumpfile.h
> index 59c83e1d9df3..4021c5af2a34 100644
> --- a/makedumpfile.h
> +++ b/makedumpfile.h
> @@ -541,8 +541,6 @@ do { \
>    * The value of dependence on machine
>    */
>   #define PAGE_OFFSET		(info->page_offset)
> -#define VMALLOC_START		(info->vmalloc_start)
> -#define VMALLOC_END		(info->vmalloc_end)
>   #define VMEMMAP_START		(info->vmemmap_start)
>   #define VMEMMAP_END		(info->vmemmap_end)
>   #define PMASK			(0x7ffffffffffff000UL)
> @@ -2262,6 +2260,9 @@ struct number_table {
>   	long    HUGETLB_PAGE_DTOR;
>   	long	phys_base;
>   	long	KERNEL_IMAGE_SIZE;
> +
> +	unsigned long vmalloc_start;
> +
>   #ifdef __aarch64__
>   	long 	VA_BITS;
>   	long	TCR_EL1_T1SZ;
> @@ -2272,7 +2273,6 @@ struct number_table {
>   	long va_bits;
>   	unsigned long phys_ram_base;
>   	unsigned long page_offset;
> -	unsigned long vmalloc_start;
>   	unsigned long vmalloc_end;
>   	unsigned long vmemmap_start;
>   	unsigned long vmemmap_end;


More information about the kexec mailing list