[PATCH] makedumpfile: ppc64: get vmalloc start address from vmcoreinfo

Aditya Gupta adityag at linux.ibm.com
Wed Feb 28 01:36:12 PST 2024


Hi Kazu,

On Wed, Feb 28, 2024 at 04:51:28AM +0000, HAGIO KAZUHITO(萩尾 一仁) wrote:
> Hi Aditya,
> 
> thanks for the patch.
> 
> On 2024/02/24 4:03, Aditya Gupta wrote:
> > Below error was noticed when running makedumpfile on linux-next kernel
> > crash (linux-next tag next-20240121):
> > 
> >      ...
> >      Checking for memory holes : [100.0 %] | readpage_elf: Attempt to read non-existent page at 0xc000000000000.
> >      [ 17.551718] kdump.sh[404]: readmem: type_addr: 0, addr:c00c000000000000, size:16384
> >      [ 17.551793] kdump.sh[404]: __exclude_unnecessary_pages: Can't read the buffer of struct page.
> >      [ 17.551864] kdump.sh[404]: create_2nd_bitmap: Can't exclude unnecessary pages.
> >      [ 17.562632] kdump.sh[404]: The kernel version is not supported.
> >      [ 17.562708] kdump.sh[404]: The makedumpfile operation may be incomplete.
> >      [ 17.562773] kdump.sh[404]: makedumpfile Failed.
> >      [ 17.564335] kdump[406]: saving vmcore failed, _exitcode:1
> > 
> > Above error was due to 'vmap_area_list' and 'vmlist' symbols missing
> > from the vmcore.
> > 
> > 'vmap_area_list' was removed in the linux kernel with below commit:
> > 
> >      commit 378eb24a0658dd922b29524e0ce35c6c43f56cba
> >           mm/vmalloc: remove vmap_area_list
> > 
> > Subsequently the commit also introduced 'VMALLOC_START' in vmcoreinfo to
> > get base address of vmalloc area, instead of depending on 'vmap_area_list'
> > 
> > Hence if 'VMALLOC_START' symbol is there in vmcoreinfo:
> >    1. Set vmalloc_start based on 'VMALLOC_START'
> >    2. Don't error if vmap_area_list/vmlist are not defined
> > 
> > Reported-by: Sachin Sant <sachinp at linux.ibm.com>
> > Signed-off-by: Aditya Gupta <adityag at linux.ibm.com>
> > ---
> >   arch/ppc64.c   | 19 +++++++++++++------
> >   makedumpfile.c |  3 ++-
> >   makedumpfile.h |  6 +++---
> >   3 files changed, 18 insertions(+), 10 deletions(-)
> > 
> > diff --git a/arch/ppc64.c b/arch/ppc64.c
> > index 96c357cb0335..bb62e2cd199a 100644
> > --- a/arch/ppc64.c
> > +++ b/arch/ppc64.c
> > @@ -568,7 +568,9 @@ get_machdep_info_ppc64(void)
> >   	/*
> >   	 * Get vmalloc_start value from either vmap_area_list or vmlist.
> >   	 */
> > -	if ((SYMBOL(vmap_area_list) != NOT_FOUND_SYMBOL)
> > +	if (NUMBER(vmalloc_start) != NOT_FOUND_SYMBOL) {
> 
> I will fix this NOT_FOUND_SYMBOL to NOT_FOUND_NUMBER when applying, 
> otherwise makedumpfile will fail for a dumpfile without the 
> corresponding kernel patch, correct?
> 
> The patch looks good to me except for it.  I will apply this with the 
> kernel version in the commit log after the kernel patch gets merged.

Sure, thanks Kazu. I just ran it on an older version, it succeeds
collecting dump on 6.5.0 kernel somehow, though I agree with your
suggestion, it should have been NOT_FOUND_NUMBER. I will be more careful
about these things later.

Thanks,
Aditya Gupta

> 
> Thanks,
> Kazu
> 
> 
> > +		vmalloc_start = NUMBER(vmalloc_start);
> > +	} else if ((SYMBOL(vmap_area_list) != NOT_FOUND_SYMBOL)
> >   	    && (OFFSET(vmap_area.va_start) != NOT_FOUND_STRUCTURE)
> >   	    && (OFFSET(vmap_area.list) != NOT_FOUND_STRUCTURE)) {
> >   		if (!readmem(VADDR, SYMBOL(vmap_area_list) + OFFSET(list_head.next),
> > @@ -684,11 +686,16 @@ vaddr_to_paddr_ppc64(unsigned long vaddr)
> >   	if ((SYMBOL(vmap_area_list) == NOT_FOUND_SYMBOL)
> >   	    || (OFFSET(vmap_area.va_start) == NOT_FOUND_STRUCTURE)
> >   	    || (OFFSET(vmap_area.list) == NOT_FOUND_STRUCTURE)) {
> > -		if ((SYMBOL(vmlist) == NOT_FOUND_SYMBOL)
> > -		    || (OFFSET(vm_struct.addr) == NOT_FOUND_STRUCTURE)) {
> > -			ERRMSG("Can't get info for vmalloc translation.\n");
> > -			return NOT_PADDR;
> > -		}
> > +		/*
> > +		 * Don't depend on vmap_area_list/vmlist if vmalloc_start is set in
> > +		 * vmcoreinfo, in that case proceed without error
> > +		 */
> > +		if (NUMBER(vmalloc_start) == NOT_FOUND_NUMBER)
> > +			if ((SYMBOL(vmlist) == NOT_FOUND_SYMBOL)
> > +				|| (OFFSET(vm_struct.addr) == NOT_FOUND_STRUCTURE)) {
> > +				ERRMSG("Can't get info for vmalloc translation.\n");
> > +				return NOT_PADDR;
> > +			}
> >   	}
> >   
> >   	return ppc64_vtop_level4(vaddr);
> > diff --git a/makedumpfile.c b/makedumpfile.c
> > index b004b93fecb7..b6c63fad15f3 100644
> > --- a/makedumpfile.c
> > +++ b/makedumpfile.c
> > @@ -2978,6 +2978,8 @@ read_vmcoreinfo(void)
> >   	READ_NUMBER("PAGE_OFFLINE_MAPCOUNT_VALUE", PAGE_OFFLINE_MAPCOUNT_VALUE);
> >   	READ_NUMBER("phys_base", phys_base);
> >   	READ_NUMBER("KERNEL_IMAGE_SIZE", KERNEL_IMAGE_SIZE);
> > +
> > +	READ_NUMBER_UNSIGNED("VMALLOC_START", vmalloc_start);
> >   #ifdef __aarch64__
> >   	READ_NUMBER("VA_BITS", VA_BITS);
> >   	READ_NUMBER("TCR_EL1_T1SZ", TCR_EL1_T1SZ);
> > @@ -2989,7 +2991,6 @@ read_vmcoreinfo(void)
> >   	READ_NUMBER("VA_BITS", va_bits);
> >   	READ_NUMBER_UNSIGNED("phys_ram_base", phys_ram_base);
> >   	READ_NUMBER_UNSIGNED("PAGE_OFFSET", page_offset);
> > -	READ_NUMBER_UNSIGNED("VMALLOC_START", vmalloc_start);
> >   	READ_NUMBER_UNSIGNED("VMALLOC_END", vmalloc_end);
> >   	READ_NUMBER_UNSIGNED("VMEMMAP_START", vmemmap_start);
> >   	READ_NUMBER_UNSIGNED("VMEMMAP_END", vmemmap_end);
> > diff --git a/makedumpfile.h b/makedumpfile.h
> > index 59c83e1d9df3..4021c5af2a34 100644
> > --- a/makedumpfile.h
> > +++ b/makedumpfile.h
> > @@ -541,8 +541,6 @@ do { \
> >    * The value of dependence on machine
> >    */
> >   #define PAGE_OFFSET		(info->page_offset)
> > -#define VMALLOC_START		(info->vmalloc_start)
> > -#define VMALLOC_END		(info->vmalloc_end)
> >   #define VMEMMAP_START		(info->vmemmap_start)
> >   #define VMEMMAP_END		(info->vmemmap_end)
> >   #define PMASK			(0x7ffffffffffff000UL)
> > @@ -2262,6 +2260,9 @@ struct number_table {
> >   	long    HUGETLB_PAGE_DTOR;
> >   	long	phys_base;
> >   	long	KERNEL_IMAGE_SIZE;
> > +
> > +	unsigned long vmalloc_start;
> > +
> >   #ifdef __aarch64__
> >   	long 	VA_BITS;
> >   	long	TCR_EL1_T1SZ;
> > @@ -2272,7 +2273,6 @@ struct number_table {
> >   	long va_bits;
> >   	unsigned long phys_ram_base;
> >   	unsigned long page_offset;
> > -	unsigned long vmalloc_start;
> >   	unsigned long vmalloc_end;
> >   	unsigned long vmemmap_start;
> >   	unsigned long vmemmap_end;



More information about the kexec mailing list