On 22-01-16, 12:49, Shilpasri G Bhat wrote:
> cpu_to_chip_id() does a DT walk to find the chip id, taking a
> contended device tree lock in the process. This adds unnecessary
> overhead in a hot path. So instead of calling cpu_to_chip_id() every
> time, cache the chip ids for all cores in the array 'core_to_chip_map'
> and use it in the hot path.
> 
> Reported-by: Anton Blanchard <an...@samba.org>
> Signed-off-by: Shilpasri G Bhat <shilpa.b...@linux.vnet.ibm.com>
> Reviewed-by: Gautham R. Shenoy <e...@linux.vnet.ibm.com>
> ---
> No changes from v5.
> 
> Changes from v4:
> - Taken care of Shreyas's comments to add a core_to_chip_map array to
>   store the chip id.
> 
>  drivers/cpufreq/powernv-cpufreq.c | 24 +++++++++++++++++++++---
>  1 file changed, 21 insertions(+), 3 deletions(-)
> 
> diff --git a/drivers/cpufreq/powernv-cpufreq.c 
> b/drivers/cpufreq/powernv-cpufreq.c
> index 140c75f..6f186dc 100644
> --- a/drivers/cpufreq/powernv-cpufreq.c
> +++ b/drivers/cpufreq/powernv-cpufreq.c
> @@ -43,6 +43,7 @@
>  
>  static struct cpufreq_frequency_table powernv_freqs[POWERNV_MAX_PSTATES+1];
>  static bool rebooting, throttled, occ_reset;
> +static unsigned int *core_to_chip_map;
>  
>  static struct chip {
>       unsigned int id;
> @@ -313,13 +314,14 @@ static inline unsigned int get_nominal_index(void)
>  static void powernv_cpufreq_throttle_check(void *data)
>  {
>       unsigned int cpu = smp_processor_id();
> +     unsigned int chip_id = core_to_chip_map[cpu_core_index_of_thread(cpu)];
>       unsigned long pmsr;
>       int pmsr_pmax, i;
>  
>       pmsr = get_pmspr(SPRN_PMSR);
>  
>       for (i = 0; i < nr_chips; i++)
> -             if (chips[i].id == cpu_to_chip_id(cpu))
> +             if (chips[i].id == chip_id)
>                       break;
>  
>       /* Check for Pmax Capping */
> @@ -559,19 +561,29 @@ static int init_chip_info(void)
>       unsigned int chip[256];
>       unsigned int cpu, i;
>       unsigned int prev_chip_id = UINT_MAX;
> +     cpumask_t cpu_mask;
> +     int ret = -ENOMEM;
>  
> -     for_each_possible_cpu(cpu) {
> +     cpumask_copy(&cpu_mask, cpu_possible_mask);

Shouldn't this copy be done after the allocation check below, so that
we don't do the copy when the allocation fails?

> +     core_to_chip_map = kcalloc(cpu_nr_cores(), sizeof(unsigned int),
> +                                GFP_KERNEL);
> +     if (!core_to_chip_map)
> +             goto out;
> +
> +     for_each_cpu(cpu, &cpu_mask) {
>               unsigned int id = cpu_to_chip_id(cpu);
>  
>               if (prev_chip_id != id) {
>                       prev_chip_id = id;
>                       chip[nr_chips++] = id;
>               }
> +             core_to_chip_map[cpu_core_index_of_thread(cpu)] = id;
> +             cpumask_andnot(&cpu_mask, &cpu_mask, cpu_sibling_mask(cpu));
>       }
>  
>       chips = kmalloc_array(nr_chips, sizeof(struct chip), GFP_KERNEL);
>       if (!chips)
> -             return -ENOMEM;
> +             goto free_chip_map;
>  
>       for (i = 0; i < nr_chips; i++) {
>               chips[i].id = chip[i];
> @@ -582,6 +594,10 @@ static int init_chip_info(void)
>       }
>  
>       return 0;
> +free_chip_map:
> +     kfree(core_to_chip_map);
> +out:
> +     return ret;
>  }
>  
>  static int __init powernv_cpufreq_init(void)
> @@ -615,6 +631,8 @@ static void __exit powernv_cpufreq_exit(void)
>       unregister_reboot_notifier(&powernv_cpufreq_reboot_nb);
>       opal_message_notifier_unregister(OPAL_MSG_OCC,
>                                        &powernv_cpufreq_opal_nb);
> +     kfree(chips);

Yeah, this is an important fix, but it shouldn't be part of this
patch, should it?

> +     kfree(core_to_chip_map);
>       cpufreq_unregister_driver(&powernv_cpufreq_driver);
>  }
>  module_exit(powernv_cpufreq_exit);
> -- 
> 1.9.3

-- 
viresh

Reply via email to