提交 5510db9c 编写于 作者: T Tejun Heo 提交者: H. Peter Anvin

x86-32, numa: Reorganize calculate_numa_remap_page()

Separate the outer node walking loop and per-node logic from
calculate_numa_remap_pages().  The outer loop is collapsed into
initmem_init() and the per-node logic is moved into a new function -
init_alloc_remap().

The new function name is confusing with the existing
init_remap_allocator() and the behavior is the function isn't very
clean either at this point, but this is to prepare for further
cleanups and it will become prettier.

This function doesn't introduce any behavior change.
Signed-off-by: NTejun Heo <tj@kernel.org>
Link: http://lkml.kernel.org/r/1301955840-7246-5-git-send-email-tj@kernel.orgAcked-by: NYinghai Lu <yinghai@kernel.org>
Cc: David Rientjes <rientjes@google.com>
Signed-off-by: NH. Peter Anvin <hpa@zytor.com>
上级 5b8443b2
...@@ -264,24 +264,21 @@ void resume_map_numa_kva(pgd_t *pgd_base) ...@@ -264,24 +264,21 @@ void resume_map_numa_kva(pgd_t *pgd_base)
} }
#endif #endif
static __init unsigned long calculate_numa_remap_pages(void) static __init unsigned long init_alloc_remap(int nid, unsigned long offset)
{ {
int nid; unsigned long size;
unsigned long size, reserve_pages = 0;
for_each_online_node(nid) {
u64 node_kva; u64 node_kva;
/* /*
* The acpi/srat node info can show hot-add memroy zones * The acpi/srat node info can show hot-add memroy zones where
* where memory could be added but not currently present. * memory could be added but not currently present.
*/ */
printk(KERN_DEBUG "node %d pfn: [%lx - %lx]\n", printk(KERN_DEBUG "node %d pfn: [%lx - %lx]\n",
nid, node_start_pfn[nid], node_end_pfn[nid]); nid, node_start_pfn[nid], node_end_pfn[nid]);
if (node_start_pfn[nid] > max_pfn) if (node_start_pfn[nid] > max_pfn)
continue; return 0;
if (!node_end_pfn[nid]) if (!node_end_pfn[nid])
continue; return 0;
if (node_end_pfn[nid] > max_pfn) if (node_end_pfn[nid] > max_pfn)
node_end_pfn[nid] = max_pfn; node_end_pfn[nid] = max_pfn;
...@@ -295,17 +292,15 @@ static __init unsigned long calculate_numa_remap_pages(void) ...@@ -295,17 +292,15 @@ static __init unsigned long calculate_numa_remap_pages(void)
size = size * PTRS_PER_PTE; size = size * PTRS_PER_PTE;
node_kva = memblock_find_in_range(node_start_pfn[nid] << PAGE_SHIFT, node_kva = memblock_find_in_range(node_start_pfn[nid] << PAGE_SHIFT,
((u64)node_end_pfn[nid])<<PAGE_SHIFT, (u64)node_end_pfn[nid] << PAGE_SHIFT,
((u64)size)<<PAGE_SHIFT, (u64)size << PAGE_SHIFT,
LARGE_PAGE_BYTES); LARGE_PAGE_BYTES);
if (node_kva == MEMBLOCK_ERROR) if (node_kva == MEMBLOCK_ERROR)
panic("Can not get kva ram\n"); panic("Can not get kva ram\n");
node_remap_size[nid] = size; node_remap_size[nid] = size;
node_remap_offset[nid] = reserve_pages; node_remap_offset[nid] = offset;
reserve_pages += size; printk(KERN_DEBUG "Reserving %ld pages of KVA for lmem_map of node %d at %llx\n",
printk(KERN_DEBUG "Reserving %ld pages of KVA for lmem_map of"
" node %d at %llx\n",
size, nid, node_kva >> PAGE_SHIFT); size, nid, node_kva >> PAGE_SHIFT);
/* /*
...@@ -313,21 +308,20 @@ static __init unsigned long calculate_numa_remap_pages(void) ...@@ -313,21 +308,20 @@ static __init unsigned long calculate_numa_remap_pages(void)
* with less memory later. * with less memory later.
* layout will be: KVA address , KVA RAM * layout will be: KVA address , KVA RAM
* *
* we are supposed to only record the one less then max_low_pfn * we are supposed to only record the one less then
* but we could have some hole in high memory, and it will only * max_low_pfn but we could have some hole in high memory,
* check page_is_ram(pfn) && !page_is_reserved_early(pfn) to decide * and it will only check page_is_ram(pfn) &&
* to use it as free. * !page_is_reserved_early(pfn) to decide to use it as free.
* So memblock_x86_reserve_range here, hope we don't run out of that array * So memblock_x86_reserve_range here, hope we don't run out
* of that array
*/ */
memblock_x86_reserve_range(node_kva, memblock_x86_reserve_range(node_kva,
node_kva + (((u64)size)<<PAGE_SHIFT), node_kva + ((u64)size << PAGE_SHIFT),
"KVA RAM"); "KVA RAM");
node_remap_start_pfn[nid] = node_kva >> PAGE_SHIFT; node_remap_start_pfn[nid] = node_kva >> PAGE_SHIFT;
}
printk(KERN_INFO "Reserving total of %lx pages for numa KVA remap\n", return size;
reserve_pages);
return reserve_pages;
} }
static void init_remap_allocator(int nid) static void init_remap_allocator(int nid)
...@@ -346,6 +340,7 @@ static void init_remap_allocator(int nid) ...@@ -346,6 +340,7 @@ static void init_remap_allocator(int nid)
void __init initmem_init(void) void __init initmem_init(void)
{ {
unsigned long reserve_pages = 0;
int nid; int nid;
/* /*
...@@ -359,7 +354,11 @@ void __init initmem_init(void) ...@@ -359,7 +354,11 @@ void __init initmem_init(void)
get_memcfg_numa(); get_memcfg_numa();
numa_init_array(); numa_init_array();
kva_pages = roundup(calculate_numa_remap_pages(), PTRS_PER_PTE); for_each_online_node(nid)
reserve_pages += init_alloc_remap(nid, reserve_pages);
kva_pages = roundup(reserve_pages, PTRS_PER_PTE);
printk(KERN_INFO "Reserving total of %lx pages for numa KVA remap\n",
reserve_pages);
kva_start_pfn = memblock_find_in_range(min_low_pfn << PAGE_SHIFT, kva_start_pfn = memblock_find_in_range(min_low_pfn << PAGE_SHIFT,
max_low_pfn << PAGE_SHIFT, max_low_pfn << PAGE_SHIFT,
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册