mm/hotplug: correctly setup fallback zonelists when creating new pgdat
When hotadd_new_pgdat() is called to create new pgdat for a new node, a fallback zonelist should be created for the new node. There's code to try to achieve that in hotadd_new_pgdat() as below: /* * The node we allocated has no zone fallback lists. For avoiding * to access not-initialized zonelist, build here. */ mutex_lock(&zonelists_mutex); build_all_zonelists(pgdat, NULL); mutex_unlock(&zonelists_mutex); But it doesn't work as expected. When hotadd_new_pgdat() is called, the new node is still in offline state because node_set_online(nid) hasn't been called yet. And build_all_zonelists() only builds zonelists for online nodes as: for_each_online_node(nid) { pg_data_t *pgdat = NODE_DATA(nid); build_zonelists(pgdat); build_zonelist_cache(pgdat); } Though we hope to create zonelist for the new pgdat, but it doesn't. So add a new parameter "pgdat" the build_all_zonelists() to build pgdat for the new pgdat too. Signed-off-by: Jiang Liu <liuj97@gmail.com> Signed-off-by: Xishi Qiu <qiuxishi@huawei.com> Cc: Mel Gorman <mgorman@suse.de> Cc: Michal Hocko <mhocko@suse.cz> Cc: Minchan Kim <minchan@kernel.org> Cc: Rusty Russell <rusty@rustcorp.com.au> Cc: Yinghai Lu <yinghai@kernel.org> Cc: Tony Luck <tony.luck@intel.com> Cc: KAMEZAWA Hiroyuki <kamezawa.hiroyu@jp.fujitsu.com> Cc: KOSAKI Motohiro <kosaki.motohiro@jp.fujitsu.com> Cc: David Rientjes <rientjes@google.com> Cc: Keping Chen <chenkeping@huawei.com> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
This commit is contained in:
parent
da92c47d06
commit
9adb62a5df
@ -721,7 +721,7 @@ typedef struct pglist_data {
|
|||||||
#include <linux/memory_hotplug.h>
|
#include <linux/memory_hotplug.h>
|
||||||
|
|
||||||
extern struct mutex zonelists_mutex;
|
extern struct mutex zonelists_mutex;
|
||||||
void build_all_zonelists(void *data);
|
void build_all_zonelists(pg_data_t *pgdat, struct zone *zone);
|
||||||
void wakeup_kswapd(struct zone *zone, int order, enum zone_type classzone_idx);
|
void wakeup_kswapd(struct zone *zone, int order, enum zone_type classzone_idx);
|
||||||
bool zone_watermark_ok(struct zone *z, int order, unsigned long mark,
|
bool zone_watermark_ok(struct zone *z, int order, unsigned long mark,
|
||||||
int classzone_idx, int alloc_flags);
|
int classzone_idx, int alloc_flags);
|
||||||
|
@ -506,7 +506,7 @@ asmlinkage void __init start_kernel(void)
|
|||||||
setup_per_cpu_areas();
|
setup_per_cpu_areas();
|
||||||
smp_prepare_boot_cpu(); /* arch-specific boot-cpu hooks */
|
smp_prepare_boot_cpu(); /* arch-specific boot-cpu hooks */
|
||||||
|
|
||||||
build_all_zonelists(NULL);
|
build_all_zonelists(NULL, NULL);
|
||||||
page_alloc_init();
|
page_alloc_init();
|
||||||
|
|
||||||
printk(KERN_NOTICE "Kernel command line: %s\n", boot_command_line);
|
printk(KERN_NOTICE "Kernel command line: %s\n", boot_command_line);
|
||||||
|
@ -416,7 +416,7 @@ int __cpuinit cpu_up(unsigned int cpu)
|
|||||||
|
|
||||||
if (pgdat->node_zonelists->_zonerefs->zone == NULL) {
|
if (pgdat->node_zonelists->_zonerefs->zone == NULL) {
|
||||||
mutex_lock(&zonelists_mutex);
|
mutex_lock(&zonelists_mutex);
|
||||||
build_all_zonelists(NULL);
|
build_all_zonelists(NULL, NULL);
|
||||||
mutex_unlock(&zonelists_mutex);
|
mutex_unlock(&zonelists_mutex);
|
||||||
}
|
}
|
||||||
#endif
|
#endif
|
||||||
|
@ -513,7 +513,7 @@ int __ref online_pages(unsigned long pfn, unsigned long nr_pages)
|
|||||||
zone->present_pages += onlined_pages;
|
zone->present_pages += onlined_pages;
|
||||||
zone->zone_pgdat->node_present_pages += onlined_pages;
|
zone->zone_pgdat->node_present_pages += onlined_pages;
|
||||||
if (need_zonelists_rebuild)
|
if (need_zonelists_rebuild)
|
||||||
build_all_zonelists(zone);
|
build_all_zonelists(NULL, zone);
|
||||||
else
|
else
|
||||||
zone_pcp_update(zone);
|
zone_pcp_update(zone);
|
||||||
|
|
||||||
@ -562,7 +562,7 @@ static pg_data_t __ref *hotadd_new_pgdat(int nid, u64 start)
|
|||||||
* to access not-initialized zonelist, build here.
|
* to access not-initialized zonelist, build here.
|
||||||
*/
|
*/
|
||||||
mutex_lock(&zonelists_mutex);
|
mutex_lock(&zonelists_mutex);
|
||||||
build_all_zonelists(NULL);
|
build_all_zonelists(pgdat, NULL);
|
||||||
mutex_unlock(&zonelists_mutex);
|
mutex_unlock(&zonelists_mutex);
|
||||||
|
|
||||||
return pgdat;
|
return pgdat;
|
||||||
|
@ -3032,7 +3032,7 @@ int numa_zonelist_order_handler(ctl_table *table, int write,
|
|||||||
user_zonelist_order = oldval;
|
user_zonelist_order = oldval;
|
||||||
} else if (oldval != user_zonelist_order) {
|
} else if (oldval != user_zonelist_order) {
|
||||||
mutex_lock(&zonelists_mutex);
|
mutex_lock(&zonelists_mutex);
|
||||||
build_all_zonelists(NULL);
|
build_all_zonelists(NULL, NULL);
|
||||||
mutex_unlock(&zonelists_mutex);
|
mutex_unlock(&zonelists_mutex);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
@ -3415,10 +3415,17 @@ static __init_refok int __build_all_zonelists(void *data)
|
|||||||
{
|
{
|
||||||
int nid;
|
int nid;
|
||||||
int cpu;
|
int cpu;
|
||||||
|
pg_data_t *self = data;
|
||||||
|
|
||||||
#ifdef CONFIG_NUMA
|
#ifdef CONFIG_NUMA
|
||||||
memset(node_load, 0, sizeof(node_load));
|
memset(node_load, 0, sizeof(node_load));
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
|
if (self && !node_online(self->node_id)) {
|
||||||
|
build_zonelists(self);
|
||||||
|
build_zonelist_cache(self);
|
||||||
|
}
|
||||||
|
|
||||||
for_each_online_node(nid) {
|
for_each_online_node(nid) {
|
||||||
pg_data_t *pgdat = NODE_DATA(nid);
|
pg_data_t *pgdat = NODE_DATA(nid);
|
||||||
|
|
||||||
@ -3463,7 +3470,7 @@ static __init_refok int __build_all_zonelists(void *data)
|
|||||||
* Called with zonelists_mutex held always
|
* Called with zonelists_mutex held always
|
||||||
* unless system_state == SYSTEM_BOOTING.
|
* unless system_state == SYSTEM_BOOTING.
|
||||||
*/
|
*/
|
||||||
void __ref build_all_zonelists(void *data)
|
void __ref build_all_zonelists(pg_data_t *pgdat, struct zone *zone)
|
||||||
{
|
{
|
||||||
set_zonelist_order();
|
set_zonelist_order();
|
||||||
|
|
||||||
@ -3475,10 +3482,10 @@ void __ref build_all_zonelists(void *data)
|
|||||||
/* we have to stop all cpus to guarantee there is no user
|
/* we have to stop all cpus to guarantee there is no user
|
||||||
of zonelist */
|
of zonelist */
|
||||||
#ifdef CONFIG_MEMORY_HOTPLUG
|
#ifdef CONFIG_MEMORY_HOTPLUG
|
||||||
if (data)
|
if (zone)
|
||||||
setup_zone_pageset((struct zone *)data);
|
setup_zone_pageset(zone);
|
||||||
#endif
|
#endif
|
||||||
stop_machine(__build_all_zonelists, NULL, NULL);
|
stop_machine(__build_all_zonelists, pgdat, NULL);
|
||||||
/* cpuset refresh routine should be here */
|
/* cpuset refresh routine should be here */
|
||||||
}
|
}
|
||||||
vm_total_pages = nr_free_pagecache_pages();
|
vm_total_pages = nr_free_pagecache_pages();
|
||||||
|
Loading…
Reference in New Issue
Block a user