On Tue, Feb 07, 2017 at 02:40:36AM -0600, Suravee Suthikulpanit wrote:
> From: Suravee Suthikulpanit <suravee.suthikulpa...@amd.com>
> 
> Add multi-IOMMU support for perf by exposing an AMD IOMMU PMU
> for each IOMMU found in the system via:
> 
>   /bus/event_source/devices/amd_iommu_x
> 
> where x is the IOMMU index. This allows users to specify
> different events to be programmed onto performance counters
> of each IOMMU.
> 
> Cc: Peter Zijlstra <pet...@infradead.org>
> Cc: Borislav Petkov <b...@alien8.de>
> Signed-off-by: Suravee Suthikulpanit <suravee.suthikulpa...@amd.com>
> ---

...

> @@ -414,46 +417,46 @@ static __init void amd_iommu_pc_exit(void)
>  };
>  
>  static __init int
> -_init_perf_amd_iommu(struct perf_amd_iommu *perf_iommu, char *name)
> +init_one_perf_amd_iommu(struct perf_amd_iommu *perf_iommu, unsigned int idx)

It's a static function - just call it "init_one_iommu".

>  {
>       int ret;
>  
>       raw_spin_lock_init(&perf_iommu->lock);
>  
> -     /* Init cpumask attributes to only core 0 */
> -     cpumask_set_cpu(0, &iommu_cpumask);
> -
> -     perf_iommu->max_banks    = amd_iommu_pc_get_max_banks(0);
> -     perf_iommu->max_counters = amd_iommu_pc_get_max_counters(0);
> +     perf_iommu->iommu        = get_amd_iommu(idx);

This function can return NULL - you need to handle that here otherwise
it will blow up later.

> +     perf_iommu->max_banks    = amd_iommu_pc_get_max_banks(idx);
> +     perf_iommu->max_counters = amd_iommu_pc_get_max_counters(idx);
>       if (!perf_iommu->max_banks || !perf_iommu->max_counters)
>               return -EINVAL;
>  
> +     snprintf(perf_iommu->name, PERF_AMD_IOMMU_NAME_SIZE, "amd_iommu_%u", 
> idx);
> +
> +     perf_iommu->pmu.event_init  = perf_iommu_event_init;
> +     perf_iommu->pmu.add         = perf_iommu_add;
> +     perf_iommu->pmu.del         = perf_iommu_del;
> +     perf_iommu->pmu.start       = perf_iommu_start;
> +     perf_iommu->pmu.stop        = perf_iommu_stop;
> +     perf_iommu->pmu.read        = perf_iommu_read;
> +     perf_iommu->pmu.task_ctx_nr = perf_invalid_context;
>       perf_iommu->pmu.attr_groups = amd_iommu_attr_groups;

So you can define a static struct pmu in the driver and do struct
assignment directly instead of writing them one-by-one.

        perf_iommu->pmu = pmu;

> -     ret = perf_pmu_register(&perf_iommu->pmu, name, -1);
> +
> +     ret = perf_pmu_register(&perf_iommu->pmu, perf_iommu->name, -1);
>       if (ret)
>               pr_err("Error initializing AMD IOMMU perf counters.\n");
>       else
> -             pr_info("perf: amd_iommu: Detected. (%d banks, %d 
> counters/bank)\n",
> -                     amd_iommu_pc_get_max_banks(0),
> -                     amd_iommu_pc_get_max_counters(0));
> +     pr_info("Detected AMD IOMMU #%d (%d banks, %d counters/bank)\n",
> +             idx, amd_iommu_pc_get_max_banks(idx),

perf_iommu->max_banks

> +             amd_iommu_pc_get_max_counters(idx));

perf_iommu->max_counters

You already read them above.

>       return ret;
>  }
>  
> -static struct perf_amd_iommu __perf_iommu = {
> -     .pmu = {
> -             .task_ctx_nr    = perf_invalid_context,
> -             .event_init     = perf_iommu_event_init,
> -             .add            = perf_iommu_add,
> -             .del            = perf_iommu_del,
> -             .start          = perf_iommu_start,
> -             .stop           = perf_iommu_stop,
> -             .read           = perf_iommu_read,
> -     },
> -};
> -
>  static __init int amd_iommu_pc_init(void)
>  {
>       int ret;
> +     unsigned int i;
> +
> +     /* Init cpumask attributes to only core 0 */
> +     cpumask_set_cpu(0, &iommu_cpumask);

This belongs at the end of the function, once everything has been
initialized successfully.

>       /* Make sure the IOMMU PC resource is available */
>       if (!amd_iommu_pc_supported())


> @@ -463,7 +466,24 @@ static __init int amd_iommu_pc_init(void)
>       if (ret)
>               return ret;
>  
> -     ret = _init_perf_amd_iommu(&__perf_iommu, "amd_iommu");
> +     for (i = 0 ; i < amd_iommu_get_num_iommus(); i++) {
> +             struct perf_amd_iommu *pi;
> +
> +             pi = kzalloc(sizeof(struct perf_amd_iommu), GFP_KERNEL);
> +             if (!pi) {
> +                     ret = -ENOMEM;
> +                     break;
> +             }
> +
> +             ret = init_one_perf_amd_iommu(pi, i);
> +             if (ret) {
> +                     kfree(pi);
> +                     break;

What happens with the iommus that have been initialized successfully
before this one fails? They remain in use?

I think we need at least a warning saying here:

        pr_warning("Error initializing IOMMU %d ...")

so that we at least know why some are missing.

-- 
Regards/Gruss,
    Boris.

Good mailing practices for 400: avoid top-posting and trim the reply.

Reply via email to