[PATCHv4 1/3] powerpc, cpu: partially unbind the mapping between cpu logical id and its seq in dt
Pingfan Liu
kernelfans at gmail.com
Tue Mar 13 19:02:50 PDT 2018
On Tue, Mar 13, 2018 at 10:58 AM, Benjamin Herrenschmidt
<benh at kernel.crashing.org> wrote:
> On Mon, 2018-03-12 at 12:43 +0800, Pingfan Liu wrote:
>> For kexec -p, the boot cpu can be not the cpu0, this causes the problem
>> to alloc paca[]. In theory, there is no requirement to assign cpu's logical
>> id as its present seq by device tree. But we have something like
>> cpu_first_thread_sibling(), which makes assumption on the mapping inside
>> a core. Hence partially changing the mapping, i.e. unbind the mapping of
>> core while keep the mapping inside a core. After this patch, boot-cpu
>> will always be mapped into the range [0,threads_per_core).
>
> I'm ok with the idea but not fan of the implementation:
>
>> Signed-off-by: Pingfan Liu <kernelfans at gmail.com>
>> ---
>> arch/powerpc/include/asm/smp.h | 1 +
>> arch/powerpc/kernel/prom.c | 25 ++++++++++++++-----------
>> arch/powerpc/kernel/setup-common.c | 21 +++++++++++++++++++++
>> 3 files changed, 36 insertions(+), 11 deletions(-)
>>
>> diff --git a/arch/powerpc/include/asm/smp.h b/arch/powerpc/include/asm/smp.h
>> index fac963e..1299100 100644
>> --- a/arch/powerpc/include/asm/smp.h
>> +++ b/arch/powerpc/include/asm/smp.h
>> @@ -30,6 +30,7 @@
>> #include <asm/percpu.h>
>>
>> extern int boot_cpuid;
>> +extern int boot_cpuhwid;
>> extern int spinning_secondaries;
>>
>> extern void cpu_die(void);
>> diff --git a/arch/powerpc/kernel/prom.c b/arch/powerpc/kernel/prom.c
>> index da67606..d0ebb25 100644
>> --- a/arch/powerpc/kernel/prom.c
>> +++ b/arch/powerpc/kernel/prom.c
>> @@ -315,8 +315,7 @@ static int __init early_init_dt_scan_cpus(unsigned long node,
>> const __be32 *intserv;
>> int i, nthreads;
>> int len;
>> - int found = -1;
>> - int found_thread = 0;
>> + bool found = false;
>>
>> /* We are scanning "cpu" nodes only */
>> if (type == NULL || strcmp(type, "cpu") != 0)
>> @@ -341,8 +340,11 @@ static int __init early_init_dt_scan_cpus(unsigned long node,
>> if (fdt_version(initial_boot_params) >= 2) {
>> if (be32_to_cpu(intserv[i]) ==
>> fdt_boot_cpuid_phys(initial_boot_params)) {
>> - found = boot_cpu_count;
>> - found_thread = i;
>> + /* always map the boot-cpu logical id into the
>> + * the range of [0, thread_per_core)
>> + */
>> + boot_cpuid = i;
>> + found = true;
>> }
>
> Call it boot_thread_id
>
But I think boot_cpuid has the meaning of global index, while the
thread_id has the meaning of index in a core.
>> } else {
>> /*
>> @@ -351,8 +353,10 @@ static int __init early_init_dt_scan_cpus(unsigned long node,
>> * off secondary threads.
>> */
>> if (of_get_flat_dt_prop(node,
>> - "linux,boot-cpu", NULL) != NULL)
>> - found = boot_cpu_count;
>> + "linux,boot-cpu", NULL) != NULL) {
>> + boot_cpuid = i;
>> + found = true;
>> + }
>> }
>> #ifdef CONFIG_SMP
>> /* logical cpu id is always 0 on UP kernels */
>> @@ -361,13 +365,12 @@ static int __init early_init_dt_scan_cpus(unsigned long node,
>> }
>>
>> /* Not the boot CPU */
>> - if (found < 0)
>> + if (!found)
>> return 0;
>>
>> - DBG("boot cpu: logical %d physical %d\n", found,
>> - be32_to_cpu(intserv[found_thread]));
>> - boot_cpuid = found;
>> - set_hard_smp_processor_id(found, be32_to_cpu(intserv[found_thread]));
>> + boot_cpuhwid = be32_to_cpu(intserv[boot_cpuid]);
>> + DBG("boot cpu: logical %d physical %d\n", boot_cpuid, boot_cpuhwid);
>> + set_hard_smp_processor_id(boot_cpuid, boot_cpuhwid);
>>
>> /*
>> * PAPR defines "logical" PVR values for cpus that
>> diff --git a/arch/powerpc/kernel/setup-common.c b/arch/powerpc/kernel/setup-common.c
>> index 66f7cc6..1a67344 100644
>> --- a/arch/powerpc/kernel/setup-common.c
>> +++ b/arch/powerpc/kernel/setup-common.c
>> @@ -86,6 +86,7 @@ struct machdep_calls *machine_id;
>> EXPORT_SYMBOL(machine_id);
>>
>> int boot_cpuid = -1;
>> +int boot_cpuhwid = -1;
>> EXPORT_SYMBOL_GPL(boot_cpuid);
>>
>> /*
>> @@ -459,11 +460,17 @@ static void __init cpu_init_thread_core_maps(int tpc)
>> void __init smp_setup_cpu_maps(void)
>> {
>> struct device_node *dn;
>> + struct device_node *boot_dn = NULL;
>> + bool handling_bootdn = true;
>> int cpu = 0;
>> int nthreads = 1;
>>
>> DBG("smp_setup_cpu_maps()\n");
>>
>> +again:
>> + /* E.g. kexec will not boot from the 1st core. So firstly loop to find out
>> + * the dn of boot-cpu, and map them onto [0, nthreads)
>> + */
>> for_each_node_by_type(dn, "cpu") {
>> const __be32 *intserv;
>> __be32 cpu_be;
>> @@ -488,6 +495,16 @@ void __init smp_setup_cpu_maps(void)
>>
>> nthreads = len / sizeof(int);
>>
>> + if (handling_bootdn) {
>> + if (boot_cpuid < nthreads &&
>> + be32_to_cpu(intserv[boot_cpuid]) == boot_cpuhwid) {
>> + boot_dn = dn;
>> + }
>> + if (boot_dn == NULL)
>> + continue;
>> + } else if (dn == boot_dn)
>> + continue;
>> +
>> for (j = 0; j < nthreads && cpu < nr_cpu_ids; j++) {
>> bool avail;
>>
>> @@ -509,6 +526,10 @@ void __init smp_setup_cpu_maps(void)
>> of_node_put(dn);
>> break;
>> }
>> + if (handling_bootdn) {
>> + handling_bootdn = false;
>> + goto again;
>> + }
>> }
>
> You don't need that "again" loop and "handling_bootdn" weird boolean.
>
> Instead, start with cpu = 1 instead of cpu = 0, and rename it to
> "next_cpu".
>
> Then, before the thread loop, check if we are on the same core
> as boot_cpuhwid:
>
> if (same_core_as_boot_cpu(intserv)) {
> cpu = 0;
> } else if (next_cpu < nr_cpus_ids) {
> cpu = next_cpu++;
> } else {
> of_node_put(dn);
> break;
> }
>
OK.
Thanks for your review.
Regards,
Pingfan
More information about the kexec
mailing list