Re: [PATCH] x86_64/mm: check and print vmemmap allocationcontinuous
From: Andrew Morton
Date:  Tue Apr 15 2008 - 02:54:54 EST
On Sat, 12 Apr 2008 01:19:24 -0700 Yinghai Lu <yhlu.kernel.send@xxxxxxxxx> wrote:
> 
> So for big system with a lot memory, don't print out too much, and easy found
> out if it is continuous
> 
> on 256G 8 sockets system will get
>  [ffffe20000000000-ffffe20002bfffff] PMD -> [ffff810001400000-ffff810003ffffff] on node 0
> [ffffe2001c700000-ffffe2001c7fffff] potential offnode page_structs
>  [ffffe20002c00000-ffffe2001c7fffff] PMD -> [ffff81000c000000-ffff8100255fffff] on node 0
> [ffffe20038700000-ffffe200387fffff] potential offnode page_structs
>  [ffffe2001c800000-ffffe200387fffff] PMD -> [ffff810820200000-ffff81083c1fffff] on node 1
>  [ffffe20040000000-ffffe2007fffffff] PUD ->ffff811027a00000 on node 2
>  [ffffe20038800000-ffffe2003fffffff] PMD -> [ffff811020200000-ffff8110279fffff] on node 2
> [ffffe20054700000-ffffe200547fffff] potential offnode page_structs
>  [ffffe20040000000-ffffe200547fffff] PMD -> [ffff811027c00000-ffff81103c3fffff] on node 2
> [ffffe20070700000-ffffe200707fffff] potential offnode page_structs
>  [ffffe20054800000-ffffe200707fffff] PMD -> [ffff811820200000-ffff81183c1fffff] on node 3
>  [ffffe20080000000-ffffe200bfffffff] PUD ->ffff81202fa00000 on node 4
>  [ffffe20070800000-ffffe2007fffffff] PMD -> [ffff812020200000-ffff81202f9fffff] on node 4
> [ffffe2008c700000-ffffe2008c7fffff] potential offnode page_structs
>  [ffffe20080000000-ffffe2008c7fffff] PMD -> [ffff81202fc00000-ffff81203c3fffff] on node 4
> [ffffe200a8700000-ffffe200a87fffff] potential offnode page_structs
>  [ffffe2008c800000-ffffe200a87fffff] PMD -> [ffff812820200000-ffff81283c1fffff] on node 5
>  [ffffe200c0000000-ffffe200ffffffff] PUD ->ffff813037a00000 on node 6
>  [ffffe200a8800000-ffffe200bfffffff] PMD -> [ffff813020200000-ffff8130379fffff] on node 6
> [ffffe200c4700000-ffffe200c47fffff] potential offnode page_structs
>  [ffffe200c0000000-ffffe200c47fffff] PMD -> [ffff813037c00000-ffff81303c3fffff] on node 6
>  [ffffe200c4800000-ffffe200e07fffff] PMD -> [ffff813820200000-ffff81383c1fffff] on node 7
> 
> instead of a long print out...
> 
I'll consider this an x86 patch, for the x86 tree.
> 
> Index: linux-2.6/arch/x86/mm/init_64.c
> ===================================================================
> --- linux-2.6.orig/arch/x86/mm/init_64.c
> +++ linux-2.6/arch/x86/mm/init_64.c
> @@ -931,6 +931,10 @@ const char *arch_vma_name(struct vm_area
>  /*
>   * Initialise the sparsemem vmemmap using huge-pages at the PMD level.
>   */
> +static long __meminitdata addr_start, addr_end;
> +static void __meminitdata *p_start, *p_end;
> +static int __meminitdata node_start;
> +
>  int __meminit
>  vmemmap_populate(struct page *start_page, unsigned long size, int node)
>  {
> @@ -965,12 +969,32 @@ vmemmap_populate(struct page *start_page
>  							PAGE_KERNEL_LARGE);
>  			set_pmd(pmd, __pmd(pte_val(entry)));
>  
> -			printk(KERN_DEBUG " [%lx-%lx] PMD ->%p on node %d\n",
> -				addr, addr + PMD_SIZE - 1, p, node);
> +			/* check if we got continous */
"continuous".
In fact I'd phrase it "Check to see if we have contiguous blocks".
> +			if (p_end != p || node_start != node) {
> +				if (p_start)
> +					printk(KERN_DEBUG " [%lx-%lx] PMD -> [%p-%p] on node %d\n",
> +						addr_start, addr_end-1, p_start, p_end-1, node_start);
> +				addr_start = addr;
> +				node_start = node;
> +				p_start = p;
> +			}
> +			addr_end = addr + PMD_SIZE;
> +			p_end = p + PMD_SIZE;
>  		} else {
>  			vmemmap_verify((pte_t *)pmd, node, addr, next);
>  		}
>  	}
>  	return 0;
>  }
> +
> +void __meminit vmemmap_populate_print_last(void)
This definition
> +{
> +	if (p_start) {
> +		printk(KERN_DEBUG " [%lx-%lx] PMD -> [%p-%p] on node %d\n",
> +			addr_start, addr_end-1, p_start, p_end-1, node_start);
> +		p_start = NULL;
> +		p_end = NULL;
> +		node_start = 0;
> +	}
> +}
>  #endif
> Index: linux-2.6/mm/sparse.c
> ===================================================================
> --- linux-2.6.orig/mm/sparse.c
> +++ linux-2.6/mm/sparse.c
> @@ -285,6 +285,9 @@ struct page __init *sparse_early_mem_map
>  	return NULL;
>  }
>  
> +void __attribute__((weak)) __meminit vmemmap_populate_print_last(void)
And this definition
should match each other.  The way to do that is to put a declaration in a
header file which is included by both .c files, please.
> +{
> +}
>  /*
>   * Allocate the accumulated non-linear sections, allocate a mem_map
>   * for each and record the physical to section mapping.
> @@ -337,6 +340,8 @@ void __init sparse_init(void)
>  								usemap);
>  	}
>  
> +	vmemmap_populate_print_last();
> +
>  	free_bootmem(__pa(usemap_map), size);
>  }
--
To unsubscribe from this list: send the line "unsubscribe linux-kernel" in
the body of a message to majordomo@xxxxxxxxxxxxxxx
More majordomo info at  http://vger.kernel.org/majordomo-info.html
Please read the FAQ at  http://www.tux.org/lkml/