Skip to content

Commit

Permalink
drivers/base/node: consolidate node device subsystem initialization i…
Browse files Browse the repository at this point in the history
…n node_dev_init()

...  and call node_dev_init() after memory_dev_init() from driver_init(),
so before any of the existing arch/subsys calls.  All online nodes should
be known at that point: early during boot, arch code determines node and
zone ranges and sets the relevant nodes online; usually this happens in
setup_arch().

This is in line with memory_dev_init(), which initializes the memory
device subsystem and creates all memory block devices.

Similar to memory_dev_init(), panic() if anything goes wrong, we don't
want to continue with such basic initialization errors.

The important part is that node_dev_init() gets called after
memory_dev_init() and after cpu_dev_init(), but before any of the relevant
archs call register_cpu() to register the new cpu device under the node
device.  The latter should be the case for the current users of
topology_init().

Link: https://lkml.kernel.org/r/20220203105212.30385-1-david@redhat.com
Signed-off-by: David Hildenbrand <david@redhat.com>
Reviewed-by: Oscar Salvador <osalvador@suse.de>
Tested-by: Anatoly Pugachev <matorola@gmail.com> (sparc64)
Cc: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Cc: Michal Hocko <mhocko@suse.com>
Cc: Oscar Salvador <osalvador@suse.de>
Cc: Mike Rapoport <rppt@kernel.org>
Cc: Catalin Marinas <catalin.marinas@arm.com>
Cc: Will Deacon <will@kernel.org>
Cc: Thomas Bogendoerfer <tsbogend@alpha.franken.de>
Cc: Michael Ellerman <mpe@ellerman.id.au>
Cc: Benjamin Herrenschmidt <benh@kernel.crashing.org>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Paul Walmsley <paul.walmsley@sifive.com>
Cc: Palmer Dabbelt <palmer@dabbelt.com>
Cc: Albert Ou <aou@eecs.berkeley.edu>
Cc: Heiko Carstens <hca@linux.ibm.com>
Cc: Vasily Gorbik <gor@linux.ibm.com>
Cc: Yoshinori Sato <ysato@users.sourceforge.jp>
Cc: Rich Felker <dalias@libc.org>
Cc: "David S. Miller" <davem@davemloft.net>
Cc: Thomas Gleixner <tglx@linutronix.de>
Cc: Ingo Molnar <mingo@redhat.com>
Cc: Borislav Petkov <bp@alien8.de>
Cc: Dave Hansen <dave.hansen@linux.intel.com>
Cc: "Rafael J. Wysocki" <rafael@kernel.org>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
  • Loading branch information
davidhildenbrand authored and torvalds committed Mar 22, 2022
1 parent 7ea0d2d commit 2848a28
Show file tree
Hide file tree
Showing 12 changed files with 22 additions and 80 deletions.
3 changes: 0 additions & 3 deletions arch/arm64/kernel/setup.c
Original file line number Diff line number Diff line change
Expand Up @@ -406,9 +406,6 @@ static int __init topology_init(void)
{
int i;

for_each_online_node(i)
register_one_node(i);

for_each_possible_cpu(i) {
struct cpu *cpu = &per_cpu(cpu_data.cpu, i);
cpu->hotpluggable = cpu_can_disable(i);
Expand Down
10 changes: 0 additions & 10 deletions arch/ia64/kernel/topology.c
Original file line number Diff line number Diff line change
Expand Up @@ -70,16 +70,6 @@ static int __init topology_init(void)
{
int i, err = 0;

#ifdef CONFIG_NUMA
/*
* MCD - Do we want to register all ONLINE nodes, or all POSSIBLE nodes?
*/
for_each_online_node(i) {
if ((err = register_one_node(i)))
goto out;
}
#endif

sysfs_cpus = kcalloc(NR_CPUS, sizeof(struct ia64_cpu), GFP_KERNEL);
if (!sysfs_cpus)
panic("kzalloc in topology_init failed - NR_CPUS too big?");
Expand Down
5 changes: 0 additions & 5 deletions arch/mips/kernel/topology.c
Original file line number Diff line number Diff line change
Expand Up @@ -12,11 +12,6 @@ static int __init topology_init(void)
{
int i, ret;

#ifdef CONFIG_NUMA
for_each_online_node(i)
register_one_node(i);
#endif /* CONFIG_NUMA */

for_each_present_cpu(i) {
struct cpu *c = &per_cpu(cpu_devices, i);

Expand Down
17 changes: 0 additions & 17 deletions arch/powerpc/kernel/sysfs.c
Original file line number Diff line number Diff line change
Expand Up @@ -1110,14 +1110,6 @@ EXPORT_SYMBOL_GPL(cpu_remove_dev_attr_group);
/* NUMA stuff */

#ifdef CONFIG_NUMA
static void __init register_nodes(void)
{
int i;

for (i = 0; i < MAX_NUMNODES; i++)
register_one_node(i);
}

int sysfs_add_device_to_node(struct device *dev, int nid)
{
struct node *node = node_devices[nid];
Expand All @@ -1132,13 +1124,6 @@ void sysfs_remove_device_from_node(struct device *dev, int nid)
sysfs_remove_link(&node->dev.kobj, kobject_name(&dev->kobj));
}
EXPORT_SYMBOL_GPL(sysfs_remove_device_from_node);

#else
static void __init register_nodes(void)
{
return;
}

#endif

/* Only valid if CPU is present. */
Expand All @@ -1155,8 +1140,6 @@ static int __init topology_init(void)
{
int cpu, r;

register_nodes();

for_each_possible_cpu(cpu) {
struct cpu *c = &per_cpu(cpu_devices, cpu);

Expand Down
3 changes: 0 additions & 3 deletions arch/riscv/kernel/setup.c
Original file line number Diff line number Diff line change
Expand Up @@ -301,9 +301,6 @@ static int __init topology_init(void)
{
int i, ret;

for_each_online_node(i)
register_one_node(i);

for_each_possible_cpu(i) {
struct cpu *cpu = &per_cpu(cpu_devices, i);

Expand Down
7 changes: 0 additions & 7 deletions arch/s390/kernel/numa.c
Original file line number Diff line number Diff line change
Expand Up @@ -33,10 +33,3 @@ void __init numa_setup(void)
NODE_DATA(0)->node_spanned_pages = memblock_end_of_DRAM() >> PAGE_SHIFT;
NODE_DATA(0)->node_id = 0;
}

static int __init numa_init_late(void)
{
register_one_node(0);
return 0;
}
arch_initcall(numa_init_late);
5 changes: 0 additions & 5 deletions arch/sh/kernel/topology.c
Original file line number Diff line number Diff line change
Expand Up @@ -46,11 +46,6 @@ static int __init topology_init(void)
{
int i, ret;

#ifdef CONFIG_NUMA
for_each_online_node(i)
register_one_node(i);
#endif

for_each_present_cpu(i) {
struct cpu *c = &per_cpu(cpu_devices, i);

Expand Down
12 changes: 0 additions & 12 deletions arch/sparc/kernel/sysfs.c
Original file line number Diff line number Diff line change
Expand Up @@ -244,22 +244,10 @@ static void __init check_mmu_stats(void)
mmu_stats_supported = 1;
}

static void register_nodes(void)
{
#ifdef CONFIG_NUMA
int i;

for (i = 0; i < MAX_NUMNODES; i++)
register_one_node(i);
#endif
}

static int __init topology_init(void)
{
int cpu, ret;

register_nodes();

check_mmu_stats();

for_each_possible_cpu(cpu) {
Expand Down
5 changes: 0 additions & 5 deletions arch/x86/kernel/topology.c
Original file line number Diff line number Diff line change
Expand Up @@ -154,11 +154,6 @@ static int __init topology_init(void)
{
int i;

#ifdef CONFIG_NUMA
for_each_online_node(i)
register_one_node(i);
#endif

for_each_present_cpu(i)
arch_register_cpu(i);

Expand Down
1 change: 1 addition & 0 deletions drivers/base/init.c
Original file line number Diff line number Diff line change
Expand Up @@ -35,5 +35,6 @@ void __init driver_init(void)
auxiliary_bus_init();
cpu_dev_init();
memory_dev_init();
node_dev_init();
container_dev_init();
}
30 changes: 17 additions & 13 deletions drivers/base/node.c
Original file line number Diff line number Diff line change
Expand Up @@ -1065,26 +1065,30 @@ static const struct attribute_group *cpu_root_attr_groups[] = {
};

#define NODE_CALLBACK_PRI 2 /* lower than SLAB */
static int __init register_node_type(void)
void __init node_dev_init(void)
{
int ret;
static struct notifier_block node_memory_callback_nb = {
.notifier_call = node_memory_callback,
.priority = NODE_CALLBACK_PRI,
};
int ret, i;

BUILD_BUG_ON(ARRAY_SIZE(node_state_attr) != NR_NODE_STATES);
BUILD_BUG_ON(ARRAY_SIZE(node_state_attrs)-1 != NR_NODE_STATES);

ret = subsys_system_register(&node_subsys, cpu_root_attr_groups);
if (!ret) {
static struct notifier_block node_memory_callback_nb = {
.notifier_call = node_memory_callback,
.priority = NODE_CALLBACK_PRI,
};
register_hotmemory_notifier(&node_memory_callback_nb);
}
if (ret)
panic("%s() failed to register subsystem: %d\n", __func__, ret);

register_hotmemory_notifier(&node_memory_callback_nb);

/*
* Note: we're not going to unregister the node class if we fail
* to register the node state class attribute files.
* Create all node devices, which will properly link the node
* to applicable memory block devices and already created cpu devices.
*/
return ret;
for_each_online_node(i) {
ret = register_one_node(i);
if (ret)
panic("%s() failed to add node: %d\n", __func__, ret);
}
}
postcore_initcall(register_node_type);
4 changes: 4 additions & 0 deletions include/linux/node.h
Original file line number Diff line number Diff line change
Expand Up @@ -112,6 +112,7 @@ static inline void link_mem_sections(int nid, unsigned long start_pfn,

extern void unregister_node(struct node *node);
#ifdef CONFIG_NUMA
extern void node_dev_init(void);
/* Core of the node registration - only memory hotplug should use this */
extern int __register_one_node(int nid);

Expand Down Expand Up @@ -149,6 +150,9 @@ extern void register_hugetlbfs_with_node(node_registration_func_t doregister,
node_registration_func_t unregister);
#endif
#else
static inline void node_dev_init(void)
{
}
static inline int __register_one_node(int nid)
{
return 0;
Expand Down

0 comments on commit 2848a28

Please sign in to comment.