On Mon, Apr 15, 2019 at 10:27:30AM +0800, Chen Zhou wrote:
> Hi Mike,
> 
> On 2019/4/14 20:13, Mike Rapoport wrote:
> > Hi,
> > 
> > On Tue, Apr 09, 2019 at 06:28:18PM +0800, Chen Zhou wrote:
> >> After commit (arm64: kdump: support reserving crashkernel above 4G),
> >> there may be two crash kernel regions, one is below 4G, the other is
> >> above 4G.
> >>
> >> Crash dump kernel reads more than one crash kernel regions via a dtb
> >> property under node /chosen,
> >> linux,usable-memory-range = <BASE1 SIZE1 [BASE2 SIZE2]>
> > 
> > Somehow I've missed that previously, but how is this supposed to work on
> > EFI systems?
> 
> Whatever the way in which the systems work, there is FDT 
> pointer(__fdt_pointer)
> in arm64 kernel and file /sys/firmware/fdt will be created in late_initcall.
> 
> Kexec-tools read and update file /sys/firmware/fdt in EFI systems to support 
> kdump to
> boot capture kernel.
> 
> For supporting more than one crash kernel regions, kexec-tools make changes 
> accordingly.
> Details are in below:
> http://lists.infradead.org/pipermail/kexec/2019-April/022792.html
 
Thanks for the clarification!

> Thanks,
> Chen Zhou
> 
> >  
> >> Signed-off-by: Chen Zhou <chenzho...@huawei.com>
> >> ---
> >>  arch/arm64/mm/init.c     | 66 
> >> ++++++++++++++++++++++++++++++++++++++++--------
> >>  include/linux/memblock.h |  6 +++++
> >>  mm/memblock.c            |  7 ++---
> >>  3 files changed, 66 insertions(+), 13 deletions(-)
> >>
> >> diff --git a/arch/arm64/mm/init.c b/arch/arm64/mm/init.c
> >> index 3bebddf..0f18665 100644
> >> --- a/arch/arm64/mm/init.c
> >> +++ b/arch/arm64/mm/init.c
> >> @@ -65,6 +65,11 @@ phys_addr_t arm64_dma_phys_limit __ro_after_init;
> >>  
> >>  #ifdef CONFIG_KEXEC_CORE
> >>  
> >> +/* at most two crash kernel regions, low_region and high_region */
> >> +#define CRASH_MAX_USABLE_RANGES   2
> >> +#define LOW_REGION_IDX                    0
> >> +#define HIGH_REGION_IDX                   1
> >> +
> >>  /*
> >>   * reserve_crashkernel() - reserves memory for crash kernel
> >>   *
> >> @@ -297,8 +302,8 @@ static int __init 
> >> early_init_dt_scan_usablemem(unsigned long node,
> >>            const char *uname, int depth, void *data)
> >>  {
> >>    struct memblock_region *usablemem = data;
> >> -  const __be32 *reg;
> >> -  int len;
> >> +  const __be32 *reg, *endp;
> >> +  int len, nr = 0;
> >>  
> >>    if (depth != 1 || strcmp(uname, "chosen") != 0)
> >>            return 0;
> >> @@ -307,22 +312,63 @@ static int __init 
> >> early_init_dt_scan_usablemem(unsigned long node,
> >>    if (!reg || (len < (dt_root_addr_cells + dt_root_size_cells)))
> >>            return 1;
> >>  
> >> -  usablemem->base = dt_mem_next_cell(dt_root_addr_cells, &reg);
> >> -  usablemem->size = dt_mem_next_cell(dt_root_size_cells, &reg);
> >> +  endp = reg + (len / sizeof(__be32));
> >> +  while ((endp - reg) >= (dt_root_addr_cells + dt_root_size_cells)) {
> >> +          usablemem[nr].base = dt_mem_next_cell(dt_root_addr_cells, &reg);
> >> +          usablemem[nr].size = dt_mem_next_cell(dt_root_size_cells, &reg);
> >> +
> >> +          if (++nr >= CRASH_MAX_USABLE_RANGES)
> >> +                  break;
> >> +  }
> >>  
> >>    return 1;
> >>  }
> >>  
> >>  static void __init fdt_enforce_memory_region(void)
> >>  {
> >> -  struct memblock_region reg = {
> >> -          .size = 0,
> >> -  };
> >> +  int i, cnt = 0;
> >> +  struct memblock_region regs[CRASH_MAX_USABLE_RANGES];
> >> +
> >> +  memset(regs, 0, sizeof(regs));
> >> +  of_scan_flat_dt(early_init_dt_scan_usablemem, regs);
> >> +
> >> +  for (i = 0; i < CRASH_MAX_USABLE_RANGES; i++)
> >> +          if (regs[i].size)
> >> +                  cnt++;
> >> +          else
> >> +                  break;
> >> +
> >> +  if (cnt - 1 == LOW_REGION_IDX)
> >> +          memblock_cap_memory_range(regs[LOW_REGION_IDX].base,
> >> +                          regs[LOW_REGION_IDX].size);
> >> +  else if (cnt - 1 == HIGH_REGION_IDX) {
> >> +          /*
> >> +           * Two crash kernel regions, cap the memory range
> >> +           * [regs[LOW_REGION_IDX].base, regs[HIGH_REGION_IDX].end]
> >> +           * and then remove the memory range in the middle.
> >> +           */
> >> +          int start_rgn, end_rgn, i, ret;
> >> +          phys_addr_t mid_base, mid_size;
> >> +
> >> +          mid_base = regs[LOW_REGION_IDX].base + 
> >> regs[LOW_REGION_IDX].size;
> >> +          mid_size = regs[HIGH_REGION_IDX].base - mid_base;
> >> +          ret = memblock_isolate_range(&memblock.memory, mid_base,
> >> +                          mid_size, &start_rgn, &end_rgn);
> >>  
> >> -  of_scan_flat_dt(early_init_dt_scan_usablemem, &reg);
> >> +          if (ret)
> >> +                  return;
> >>  
> >> -  if (reg.size)
> >> -          memblock_cap_memory_range(reg.base, reg.size);
> >> +          memblock_cap_memory_range(regs[LOW_REGION_IDX].base,
> >> +                          regs[HIGH_REGION_IDX].base -
> >> +                          regs[LOW_REGION_IDX].base +
> >> +                          regs[HIGH_REGION_IDX].size);
> >> +          for (i = end_rgn - 1; i >= start_rgn; i--) {
> >> +                  if (!memblock_is_nomap(&memblock.memory.regions[i]))
> >> +                          memblock_remove_region(&memblock.memory, i);
> >> +          }
> >> +          memblock_remove_range(&memblock.reserved, mid_base,
> >> +                          mid_base + mid_size);
> >> +  }
> >>  }
> >>  
> >>  void __init arm64_memblock_init(void)
> >> diff --git a/include/linux/memblock.h b/include/linux/memblock.h
> >> index 294d5d8..787d252 100644
> >> --- a/include/linux/memblock.h
> >> +++ b/include/linux/memblock.h
> >> @@ -110,9 +110,15 @@ void memblock_discard(void);
> >>  
> >>  phys_addr_t memblock_find_in_range(phys_addr_t start, phys_addr_t end,
> >>                               phys_addr_t size, phys_addr_t align);
> >> +void memblock_remove_region(struct memblock_type *type, unsigned long r);
> >>  void memblock_allow_resize(void);
> >>  int memblock_add_node(phys_addr_t base, phys_addr_t size, int nid);
> >>  int memblock_add(phys_addr_t base, phys_addr_t size);
> >> +int memblock_isolate_range(struct memblock_type *type,
> >> +                                  phys_addr_t base, phys_addr_t size,
> >> +                                  int *start_rgn, int *end_rgn);
> >> +int memblock_remove_range(struct memblock_type *type,
> >> +                                  phys_addr_t base, phys_addr_t size);
> >>  int memblock_remove(phys_addr_t base, phys_addr_t size);
> >>  int memblock_free(phys_addr_t base, phys_addr_t size);
> >>  int memblock_reserve(phys_addr_t base, phys_addr_t size);
> >> diff --git a/mm/memblock.c b/mm/memblock.c
> >> index e7665cf..1846e2d 100644
> >> --- a/mm/memblock.c
> >> +++ b/mm/memblock.c
> >> @@ -357,7 +357,8 @@ phys_addr_t __init_memblock 
> >> memblock_find_in_range(phys_addr_t start,
> >>    return ret;
> >>  }
> >>  
> >> -static void __init_memblock memblock_remove_region(struct memblock_type 
> >> *type, unsigned long r)
> >> +void __init_memblock memblock_remove_region(struct memblock_type *type,
> >> +                                  unsigned long r)
> >>  {
> >>    type->total_size -= type->regions[r].size;
> >>    memmove(&type->regions[r], &type->regions[r + 1],
> >> @@ -724,7 +725,7 @@ int __init_memblock memblock_add(phys_addr_t base, 
> >> phys_addr_t size)
> >>   * Return:
> >>   * 0 on success, -errno on failure.
> >>   */
> >> -static int __init_memblock memblock_isolate_range(struct memblock_type 
> >> *type,
> >> +int __init_memblock memblock_isolate_range(struct memblock_type *type,
> >>                                    phys_addr_t base, phys_addr_t size,
> >>                                    int *start_rgn, int *end_rgn)
> >>  {
> >> @@ -784,7 +785,7 @@ static int __init_memblock 
> >> memblock_isolate_range(struct memblock_type *type,
> >>    return 0;
> >>  }
> >>  
> >> -static int __init_memblock memblock_remove_range(struct memblock_type 
> >> *type,
> >> +int __init_memblock memblock_remove_range(struct memblock_type *type,
> >>                                      phys_addr_t base, phys_addr_t size)
> >>  {
> >>    int start_rgn, end_rgn;
> >> -- 
> >> 2.7.4
> >>
> > 
> 

-- 
Sincerely yours,
Mike.

Reply via email to