Hi Mike, On 2019/4/14 20:13, Mike Rapoport wrote: > Hi, > > On Tue, Apr 09, 2019 at 06:28:18PM +0800, Chen Zhou wrote: >> After commit (arm64: kdump: support reserving crashkernel above 4G), >> there may be two crash kernel regions, one is below 4G, the other is >> above 4G. >> >> Crash dump kernel reads more than one crash kernel regions via a dtb >> property under node /chosen, >> linux,usable-memory-range = <BASE1 SIZE1 [BASE2 SIZE2]> > > Somehow I've missed that previously, but how is this supposed to work on > EFI systems? Whatever the way in which the systems work, there is FDT pointer(__fdt_pointer) in arm64 kernel and file /sys/firmware/fdt will be created in late_initcall. Kexec-tools read and update file /sys/firmware/fdt in EFI systems to support kdump to boot capture kernel. For supporting more than one crash kernel regions, kexec-tools make changes accordingly. Details are in below: http://lists.infradead.org/pipermail/kexec/2019-April/022792.html Thanks, Chen Zhou > >> Signed-off-by: Chen Zhou <chenzhou10@xxxxxxxxxx> >> --- >> arch/arm64/mm/init.c | 66 ++++++++++++++++++++++++++++++++++++++++-------- >> include/linux/memblock.h | 6 +++++ >> mm/memblock.c | 7 ++--- >> 3 files changed, 66 insertions(+), 13 deletions(-) >> >> diff --git a/arch/arm64/mm/init.c b/arch/arm64/mm/init.c >> index 3bebddf..0f18665 100644 >> --- a/arch/arm64/mm/init.c >> +++ b/arch/arm64/mm/init.c >> @@ -65,6 +65,11 @@ phys_addr_t arm64_dma_phys_limit __ro_after_init; >> >> #ifdef CONFIG_KEXEC_CORE >> >> +/* at most two crash kernel regions, low_region and high_region */ >> +#define CRASH_MAX_USABLE_RANGES 2 >> +#define LOW_REGION_IDX 0 >> +#define HIGH_REGION_IDX 1 >> + >> /* >> * reserve_crashkernel() - reserves memory for crash kernel >> * >> @@ -297,8 +302,8 @@ static int __init early_init_dt_scan_usablemem(unsigned long node, >> const char *uname, int depth, void *data) >> { >> struct memblock_region *usablemem = data; >> - const __be32 *reg; >> - int len; >> + const __be32 *reg, *endp; >> + int len, nr = 0; >> >> if (depth != 1 || strcmp(uname, "chosen") != 0) >> return 0; >> @@ -307,22 +312,63 @@ static int __init early_init_dt_scan_usablemem(unsigned long node, >> if (!reg || (len < (dt_root_addr_cells + dt_root_size_cells))) >> return 1; >> >> - usablemem->base = dt_mem_next_cell(dt_root_addr_cells, ®); >> - usablemem->size = dt_mem_next_cell(dt_root_size_cells, ®); >> + endp = reg + (len / sizeof(__be32)); >> + while ((endp - reg) >= (dt_root_addr_cells + dt_root_size_cells)) { >> + usablemem[nr].base = dt_mem_next_cell(dt_root_addr_cells, ®); >> + usablemem[nr].size = dt_mem_next_cell(dt_root_size_cells, ®); >> + >> + if (++nr >= CRASH_MAX_USABLE_RANGES) >> + break; >> + } >> >> return 1; >> } >> >> static void __init fdt_enforce_memory_region(void) >> { >> - struct memblock_region reg = { >> - .size = 0, >> - }; >> + int i, cnt = 0; >> + struct memblock_region regs[CRASH_MAX_USABLE_RANGES]; >> + >> + memset(regs, 0, sizeof(regs)); >> + of_scan_flat_dt(early_init_dt_scan_usablemem, regs); >> + >> + for (i = 0; i < CRASH_MAX_USABLE_RANGES; i++) >> + if (regs[i].size) >> + cnt++; >> + else >> + break; >> + >> + if (cnt - 1 == LOW_REGION_IDX) >> + memblock_cap_memory_range(regs[LOW_REGION_IDX].base, >> + regs[LOW_REGION_IDX].size); >> + else if (cnt - 1 == HIGH_REGION_IDX) { >> + /* >> + * Two crash kernel regions, cap the memory range >> + * [regs[LOW_REGION_IDX].base, regs[HIGH_REGION_IDX].end] >> + * and then remove the memory range in the middle. >> + */ >> + int start_rgn, end_rgn, i, ret; >> + phys_addr_t mid_base, mid_size; >> + >> + mid_base = regs[LOW_REGION_IDX].base + regs[LOW_REGION_IDX].size; >> + mid_size = regs[HIGH_REGION_IDX].base - mid_base; >> + ret = memblock_isolate_range(&memblock.memory, mid_base, >> + mid_size, &start_rgn, &end_rgn); >> >> - of_scan_flat_dt(early_init_dt_scan_usablemem, ®); >> + if (ret) >> + return; >> >> - if (reg.size) >> - memblock_cap_memory_range(reg.base, reg.size); >> + memblock_cap_memory_range(regs[LOW_REGION_IDX].base, >> + regs[HIGH_REGION_IDX].base - >> + regs[LOW_REGION_IDX].base + >> + regs[HIGH_REGION_IDX].size); >> + for (i = end_rgn - 1; i >= start_rgn; i--) { >> + if (!memblock_is_nomap(&memblock.memory.regions[i])) >> + memblock_remove_region(&memblock.memory, i); >> + } >> + memblock_remove_range(&memblock.reserved, mid_base, >> + mid_base + mid_size); >> + } >> } >> >> void __init arm64_memblock_init(void) >> diff --git a/include/linux/memblock.h b/include/linux/memblock.h >> index 294d5d8..787d252 100644 >> --- a/include/linux/memblock.h >> +++ b/include/linux/memblock.h >> @@ -110,9 +110,15 @@ void memblock_discard(void); >> >> phys_addr_t memblock_find_in_range(phys_addr_t start, phys_addr_t end, >> phys_addr_t size, phys_addr_t align); >> +void memblock_remove_region(struct memblock_type *type, unsigned long r); >> void memblock_allow_resize(void); >> int memblock_add_node(phys_addr_t base, phys_addr_t size, int nid); >> int memblock_add(phys_addr_t base, phys_addr_t size); >> +int memblock_isolate_range(struct memblock_type *type, >> + phys_addr_t base, phys_addr_t size, >> + int *start_rgn, int *end_rgn); >> +int memblock_remove_range(struct memblock_type *type, >> + phys_addr_t base, phys_addr_t size); >> int memblock_remove(phys_addr_t base, phys_addr_t size); >> int memblock_free(phys_addr_t base, phys_addr_t size); >> int memblock_reserve(phys_addr_t base, phys_addr_t size); >> diff --git a/mm/memblock.c b/mm/memblock.c >> index e7665cf..1846e2d 100644 >> --- a/mm/memblock.c >> +++ b/mm/memblock.c >> @@ -357,7 +357,8 @@ phys_addr_t __init_memblock memblock_find_in_range(phys_addr_t start, >> return ret; >> } >> >> -static void __init_memblock memblock_remove_region(struct memblock_type *type, unsigned long r) >> +void __init_memblock memblock_remove_region(struct memblock_type *type, >> + unsigned long r) >> { >> type->total_size -= type->regions[r].size; >> memmove(&type->regions[r], &type->regions[r + 1], >> @@ -724,7 +725,7 @@ int __init_memblock memblock_add(phys_addr_t base, phys_addr_t size) >> * Return: >> * 0 on success, -errno on failure. >> */ >> -static int __init_memblock memblock_isolate_range(struct memblock_type *type, >> +int __init_memblock memblock_isolate_range(struct memblock_type *type, >> phys_addr_t base, phys_addr_t size, >> int *start_rgn, int *end_rgn) >> { >> @@ -784,7 +785,7 @@ static int __init_memblock memblock_isolate_range(struct memblock_type *type, >> return 0; >> } >> >> -static int __init_memblock memblock_remove_range(struct memblock_type *type, >> +int __init_memblock memblock_remove_range(struct memblock_type *type, >> phys_addr_t base, phys_addr_t size) >> { >> int start_rgn, end_rgn; >> -- >> 2.7.4 >> >