Memory region boundaries don't necessarily fit on zone boundaries. So we need
to maintain a zone-level mapping of the absolute memory region boundaries.

"Node Memory Regions" will be used to capture the absolute region boundaries.
Add "Zone Memory Regions" to track the subsets of the absolute memory regions
that fall within the zone boundaries.

Eg:

	|<---------------------Node---------------------->|
	 _________________________________________________
	|    Node mem reg 0     |     Node mem reg 1      |
	|_______________________|_________________________|

	 _________________________________________________
	|   ZONE_DMA    |           ZONE_NORMAL           |
	|_______________|_________________________________|


In the above figure,

ZONE_DMA has only 1 zone memory region (say, Zone mem reg 0) which is a subset
of Node mem reg 0.

ZONE_NORMAL has 2 zone memory regions (say, Zone mem reg 0 and Zone mem reg 1)
which are subsets of Node mem reg 0 and Node mem reg 1 respectively.

Signed-off-by: Srivatsa S. Bhat <srivatsa.bhat@xxxxxxxxxxxxxxxxxx>
---

 include/linux/mmzone.h |    9 +++++++++
 mm/page_alloc.c        |   42 +++++++++++++++++++++++++++++++++++++++++-
 2 files changed, 50 insertions(+), 1 deletion(-)

diff --git a/include/linux/mmzone.h b/include/linux/mmzone.h
index bb7c3ef..9f923aa 100644
--- a/include/linux/mmzone.h
+++ b/include/linux/mmzone.h
@@ -339,6 +339,12 @@ struct node_mem_region {
 	struct pglist_data *pgdat;
 };
 
+struct zone_mem_region {
+	unsigned long start_pfn;
+	unsigned long spanned_pages;
+	unsigned long present_pages;
+};
+
 struct zone {
 	/* Fields commonly accessed by the page allocator */
 
@@ -403,6 +409,9 @@ struct zone {
 #endif
 	struct free_area free_area[MAX_ORDER];
 
+	struct zone_mem_region zone_mem_region[MAX_NR_REGIONS];
+	int nr_zone_regions;
+
 #ifndef CONFIG_SPARSEMEM
 	/*
 	 * Flags for a pageblock_nr_pages block. See pageblock-flags.h.
diff --git a/mm/page_alloc.c b/mm/page_alloc.c
index 709e3c1..c00f72d 100644
--- a/mm/page_alloc.c
+++ b/mm/page_alloc.c
@@ -4594,6 +4594,46 @@ void init_node_memory_regions(struct pglist_data *pgdat)
 	}
 }
 
+void init_zone_memory_regions(struct pglist_data *pgdat)
+{
+	unsigned long start_pfn, end_pfn, absent;
+	int i, j, idx, nid = pgdat->node_id;
+	struct node_mem_region *region;
+	struct zone *z;
+
+	for (i = 0; i < pgdat->nr_zones; i++) {
+		z = &pgdat->node_zones[i];
+		idx = 0;
+
+		for (j = 0; j < pgdat->nr_node_regions; j++) {
+			region = &pgdat->node_regions[j];
+			start_pfn = max(z->zone_start_pfn, region->start_pfn);
+			end_pfn = min(z->zone_start_pfn + z->spanned_pages,
+				      region->start_pfn + region->spanned_pages);
+
+			if (start_pfn >= end_pfn)
+				continue;
+
+			z->zone_mem_region[idx].start_pfn = start_pfn;
+			z->zone_mem_region[idx].spanned_pages = end_pfn - start_pfn;
+
+			absent = __absent_pages_in_range(nid, start_pfn,
+							 end_pfn);
+			z->zone_mem_region[idx].present_pages =
+						end_pfn - start_pfn - absent;
+			idx++;
+		}
+
+		z->nr_zone_regions = idx;
+	}
+}
+
+void init_memory_regions(struct pglist_data *pgdat)
+{
+	init_node_memory_regions(pgdat);
+	init_zone_memory_regions(pgdat);
+}
+
 void __paginginit free_area_init_node(int nid, unsigned long *zones_size,
 		unsigned long node_start_pfn, unsigned long *zholes_size)
 {
@@ -4615,7 +4655,7 @@ void __paginginit free_area_init_node(int nid, unsigned long *zones_size,
 #endif
 
 	free_area_init_core(pgdat, zones_size, zholes_size);
-	init_node_memory_regions(pgdat);
+	init_memory_regions(pgdat);
 }
 
 #ifdef CONFIG_HAVE_MEMBLOCK_NODE_MAP

--
To unsubscribe, send a message with 'unsubscribe linux-mm' in
the body to majordomo@xxxxxxxxx. For more info on Linux MM,
see: http://www.linux-mm.org/ .
Don't email: <a href=mailto:"dont@xxxxxxxxx"> email@xxxxxxxxx </a>