Re: [PATCH v6 2/5] cpufreq: powernv: Remove cpu_to_chip_id() from hot-path
From: Viresh Kumar
Date: Mon Jan 25 2016 - 00:54:03 EST
On 22-01-16, 12:49, Shilpasri G Bhat wrote:
> cpu_to_chip_id() does a DT walk through to find out the chip id by
> taking a contended device tree lock. This adds an unnecessary overhead
> in a hot path. So instead of calling cpu_to_chip_id() everytime cache
> the chip ids for all cores in the array 'core_to_chip_map' and use it
> in the hotpath.
>
> Reported-by: Anton Blanchard <anton@xxxxxxxxx>
> Signed-off-by: Shilpasri G Bhat <shilpa.bhat@xxxxxxxxxxxxxxxxxx>
> Reviewed-by: Gautham R. Shenoy <ego@xxxxxxxxxxxxxxxxxx>
> ---
> No changes from v5.
>
> Changes from v4:
> - Taken care of Shreyas's comments to add a core_to_chip_map array to
> store the chip id.
>
> drivers/cpufreq/powernv-cpufreq.c | 24 +++++++++++++++++++++---
> 1 file changed, 21 insertions(+), 3 deletions(-)
>
> diff --git a/drivers/cpufreq/powernv-cpufreq.c b/drivers/cpufreq/powernv-cpufreq.c
> index 140c75f..6f186dc 100644
> --- a/drivers/cpufreq/powernv-cpufreq.c
> +++ b/drivers/cpufreq/powernv-cpufreq.c
> @@ -43,6 +43,7 @@
>
> static struct cpufreq_frequency_table powernv_freqs[POWERNV_MAX_PSTATES+1];
> static bool rebooting, throttled, occ_reset;
> +static unsigned int *core_to_chip_map;
>
> static struct chip {
> unsigned int id;
> @@ -313,13 +314,14 @@ static inline unsigned int get_nominal_index(void)
> static void powernv_cpufreq_throttle_check(void *data)
> {
> unsigned int cpu = smp_processor_id();
> + unsigned int chip_id = core_to_chip_map[cpu_core_index_of_thread(cpu)];
> unsigned long pmsr;
> int pmsr_pmax, i;
>
> pmsr = get_pmspr(SPRN_PMSR);
>
> for (i = 0; i < nr_chips; i++)
> - if (chips[i].id == cpu_to_chip_id(cpu))
> + if (chips[i].id == chip_id)
> break;
>
> /* Check for Pmax Capping */
> @@ -559,19 +561,29 @@ static int init_chip_info(void)
> unsigned int chip[256];
> unsigned int cpu, i;
> unsigned int prev_chip_id = UINT_MAX;
> + cpumask_t cpu_mask;
> + int ret = -ENOMEM;
>
> - for_each_possible_cpu(cpu) {
> + cpumask_copy(&cpu_mask, cpu_possible_mask);
Shouldn't this copy be done after the following allocation check, so
that we don't do the copy needlessly when the allocation fails?
> + core_to_chip_map = kcalloc(cpu_nr_cores(), sizeof(unsigned int),
> + GFP_KERNEL);
> + if (!core_to_chip_map)
> + goto out;
> +
> + for_each_cpu(cpu, &cpu_mask) {
> unsigned int id = cpu_to_chip_id(cpu);
>
> if (prev_chip_id != id) {
> prev_chip_id = id;
> chip[nr_chips++] = id;
> }
> + core_to_chip_map[cpu_core_index_of_thread(cpu)] = id;
> + cpumask_andnot(&cpu_mask, &cpu_mask, cpu_sibling_mask(cpu));
> }
>
> chips = kmalloc_array(nr_chips, sizeof(struct chip), GFP_KERNEL);
> if (!chips)
> - return -ENOMEM;
> + goto free_chip_map;
>
> for (i = 0; i < nr_chips; i++) {
> chips[i].id = chip[i];
> @@ -582,6 +594,10 @@ static int init_chip_info(void)
> }
>
> return 0;
> +free_chip_map:
> + kfree(core_to_chip_map);
> +out:
> + return ret;
> }
>
> static int __init powernv_cpufreq_init(void)
> @@ -615,6 +631,8 @@ static void __exit powernv_cpufreq_exit(void)
> unregister_reboot_notifier(&powernv_cpufreq_reboot_nb);
> opal_message_notifier_unregister(OPAL_MSG_OCC,
> &powernv_cpufreq_opal_nb);
> + kfree(chips);
Yeah, this is an important fix, but it shouldn't be part of this
patch, should it?
> + kfree(core_to_chip_map);
> cpufreq_unregister_driver(&powernv_cpufreq_driver);
> }
> module_exit(powernv_cpufreq_exit);
> --
> 1.9.3
--
viresh