Hi Eric,

> -----Original Message-----
> From: Eric Auger <eric.au...@redhat.com>
> Sent: Wednesday, November 13, 2024 5:12 PM
> To: Shameerali Kolothum Thodi
> <shameerali.kolothum.th...@huawei.com>; qemu-...@nongnu.org;
> qemu-devel@nongnu.org
> Cc: peter.mayd...@linaro.org; j...@nvidia.com; nicol...@nvidia.com;
> ddut...@redhat.com; Linuxarm <linux...@huawei.com>; Wangzhou (B)
> <wangzh...@hisilicon.com>; jiangkunkun <jiangkun...@huawei.com>;
> Jonathan Cameron <jonathan.came...@huawei.com>;
> zhangfei....@linaro.org
> Subject: Re: [RFC PATCH 2/5] hw/arm/smmuv3: Add initial support for
> SMMUv3 Nested device
> 
> Hi Shameer,
> On 11/8/24 13:52, Shameer Kolothum wrote:
> > Based on SMMUv3 as a parent device, add a user-creatable smmuv3-
> nested
> > device. Subsequent patches will add support to specify a PCI bus for
> > this device.
> >
> > Currently only supported for "virt", so hook up the sybus mem & irq
> > for that  as well.
> >
> > No FDT support is added for now.
> >
> > Signed-off-by: Shameer Kolothum
> <shameerali.kolothum.th...@huawei.com>
> > ---
> >  hw/arm/smmuv3.c         | 34 ++++++++++++++++++++++++++++++++++
> >  hw/arm/virt.c           | 31 +++++++++++++++++++++++++++++--
> >  hw/core/sysbus-fdt.c    |  1 +
> >  include/hw/arm/smmuv3.h | 15 +++++++++++++++
> >  include/hw/arm/virt.h   |  6 ++++++
> >  5 files changed, 85 insertions(+), 2 deletions(-)
> >
> > diff --git a/hw/arm/smmuv3.c b/hw/arm/smmuv3.c index
> > 2101031a8f..0033eb8125 100644
> > --- a/hw/arm/smmuv3.c
> > +++ b/hw/arm/smmuv3.c
> > @@ -2201,6 +2201,19 @@ static void smmu_realize(DeviceState *d, Error
> **errp)
> >      smmu_init_irq(s, dev);
> >  }
> >
> > +static void smmu_nested_realize(DeviceState *d, Error **errp) {
> > +    SMMUv3NestedState *s_nested = ARM_SMMUV3_NESTED(d);
> nit: s/s_nested/ns or just s?
> > +    SMMUv3NestedClass *c =
> ARM_SMMUV3_NESTED_GET_CLASS(s_nested);
> > +    Error *local_err = NULL;
> > +
> > +    c->parent_realize(d, &local_err);
> I think it is safe to use errp directly here.

Ok.

> > +    if (local_err) {
> > +        error_propagate(errp, local_err);
> > +        return;
> > +    }
> > +}
> > +
> >  static const VMStateDescription vmstate_smmuv3_queue = {
> >      .name = "smmuv3_queue",
> >      .version_id = 1,
> > @@ -2299,6 +2312,18 @@ static void smmuv3_class_init(ObjectClass
> *klass, void *data)
> >      device_class_set_props(dc, smmuv3_properties);  }
> >
> > +static void smmuv3_nested_class_init(ObjectClass *klass, void *data)
> > +{
> > +    DeviceClass *dc = DEVICE_CLASS(klass);
> > +    SMMUv3NestedClass *c = ARM_SMMUV3_NESTED_CLASS(klass);
> > +
> > +    dc->vmsd = &vmstate_smmuv3;
> > +    device_class_set_parent_realize(dc, smmu_nested_realize,
> > +                                    &c->parent_realize);
> > +    dc->user_creatable = true;
> > +    dc->hotpluggable = false;
> > +}
> > +
> >  static int smmuv3_notify_flag_changed(IOMMUMemoryRegion *iommu,
> >                                        IOMMUNotifierFlag old,
> >                                        IOMMUNotifierFlag new, @@
> > -2337,6 +2362,14 @@ static void
> smmuv3_iommu_memory_region_class_init(ObjectClass *klass,
> >      imrc->notify_flag_changed = smmuv3_notify_flag_changed;  }
> >
> > +static const TypeInfo smmuv3_nested_type_info = {
> > +    .name          = TYPE_ARM_SMMUV3_NESTED,
> > +    .parent        = TYPE_ARM_SMMUV3,
> > +    .instance_size = sizeof(SMMUv3NestedState),
> > +    .class_size    = sizeof(SMMUv3NestedClass),
> > +    .class_init    = smmuv3_nested_class_init,
> > +};
> > +
> >  static const TypeInfo smmuv3_type_info = {
> >      .name          = TYPE_ARM_SMMUV3,
> >      .parent        = TYPE_ARM_SMMU,
> > @@ -2355,6 +2388,7 @@ static const TypeInfo
> > smmuv3_iommu_memory_region_info = {  static void
> > smmuv3_register_types(void)  {
> >      type_register(&smmuv3_type_info);
> > +    type_register(&smmuv3_nested_type_info);
> >      type_register(&smmuv3_iommu_memory_region_info);
> >  }
> >
> > diff --git a/hw/arm/virt.c b/hw/arm/virt.c index
> > 780bcff77c..38075f9ab2 100644
> > --- a/hw/arm/virt.c
> > +++ b/hw/arm/virt.c
> > @@ -181,6 +181,7 @@ static const MemMapEntry base_memmap[] = {
> >      [VIRT_PVTIME] =             { 0x090a0000, 0x00010000 },
> >      [VIRT_SECURE_GPIO] =        { 0x090b0000, 0x00001000 },
> >      [VIRT_MMIO] =               { 0x0a000000, 0x00000200 },
> > +    [VIRT_SMMU_NESTED] =        { 0x0b000000, 0x01000000 },
> I agree with Mostafa that the _NESTED terminology may not be the best
> choice.

Yes. Agree.

> The motivation behind that multi-instance attempt, as introduced in
> https://lore.kernel.org/all/ZEcT%2F7erkhHDaNvD@Asurada-Nvidia/
> was:
> - SMMUs with different feature bits
> - support of VCMDQ HW extension for SMMU CMDQ
> - need for separate S1 invalidation paths
> 
> If I understand correctly this is mostly wanted for VCMDQ handling? if this
> is correct we may indicate that somehow in the terminology.
> 

Not just for VCMDQ, but it benefits when we have multiple physical SMMUv3
instances as well.

> If I understand correctly VCMDQ terminology is NVidia specific while ECMDQ
> is the baseline (?).

Yes, VCMDQ is NVIDIA specific. And ECMDQ is ARM SMMUv3, but don’t think we
can associate ECMDQ with a virtual SMMUv3.

> >      /* ...repeating for a total of NUM_VIRTIO_TRANSPORTS, each of that
> size */
> >      [VIRT_PLATFORM_BUS] =       { 0x0c000000, 0x02000000 },
> >      [VIRT_SECURE_MEM] =         { 0x0e000000, 0x01000000 },
> > @@ -226,6 +227,7 @@ static const int a15irqmap[] = {
> >      [VIRT_GIC_V2M] = 48, /* ...to 48 + NUM_GICV2M_SPIS - 1 */
> >      [VIRT_SMMU] = 74,    /* ...to 74 + NUM_SMMU_IRQS - 1 */
> >      [VIRT_PLATFORM_BUS] = 112, /* ...to 112 + PLATFORM_BUS_NUM_IRQS
> > -1 */
> > +    [VIRT_SMMU_NESTED] = 200,
> What is the max IRQs expected to be consumed. Wother to comment for
> next interrupt user.

Depends on how many we plan to support max  and each requires minimum 4. I will
update with a  comment here.

> >  };
> >
> >  static void create_randomness(MachineState *ms, const char *node) @@
> > -2883,10 +2885,34 @@ static void
> virt_machine_device_plug_cb(HotplugHandler *hotplug_dev,
> >                                          DeviceState *dev, Error
> > **errp)  {
> >      VirtMachineState *vms = VIRT_MACHINE(hotplug_dev);
> > +    MachineClass *mc = MACHINE_GET_CLASS(vms);
> >
> > -    if (vms->platform_bus_dev) {
> > -        MachineClass *mc = MACHINE_GET_CLASS(vms);
> > +    /* For smmuv3-nested devices we need to set the mem & irq */
> > +    if (device_is_dynamic_sysbus(mc, dev) &&
> > +        object_dynamic_cast(OBJECT(dev), TYPE_ARM_SMMUV3_NESTED)) {
> why did you choose not using the PLATFORM BUS infra which does that
> kind of binding automatically (also it provisions for dedicated MMIOs and
> IRQs). At least you would need to justify in the commit msg I think

Because I was not  sure how to do this binding otherwise. I couldn't find
any such precedence  for a  dynamic platform bus dev binding 
MMIOs/IRQs(May be I didn't look hard). I mentioned it in cover letter.

Could you please give me some pointers/example for this? I will also
take another look.

> > +        hwaddr base = vms->memmap[VIRT_SMMU_NESTED].base;
> > +        int irq =  vms->irqmap[VIRT_SMMU_NESTED];
> > +
> > +        if (vms->smmu_nested_count >= MAX_SMMU_NESTED) {
> > +            error_setg(errp, "smmuv3-nested max count reached!");
> > +            return;
> > +        }
> > +
> > +        base += (vms->smmu_nested_count * SMMU_IO_LEN);
> > +        irq += (vms->smmu_nested_count * NUM_SMMU_IRQS);
> >
> > +        sysbus_mmio_map(SYS_BUS_DEVICE(dev), 0, base);
> > +        for (int i = 0; i < 4; i++) {
> > +            sysbus_connect_irq(SYS_BUS_DEVICE(dev), i,
> > +                               qdev_get_gpio_in(vms->gic, irq + i));
> > +        }
> > +        if (vms->iommu != VIRT_IOMMU_SMMUV3_NESTED) {
> > +            vms->iommu = VIRT_IOMMU_SMMUV3_NESTED;
> > +        }
> > +        vms->smmu_nested_count++;
> this kind of check would definitively not integrated in the platform bus but
> this could be introduced generically in the framework though or special
> cased after the platform_bus_link_device

Ok. So I assume there is a better way to link the MMIOs/IRQs as you mentioned 
above and we can add another helper to track this count as well.

> > +    }
> > +
> > +    if (vms->platform_bus_dev) {
> >          if (device_is_dynamic_sysbus(mc, dev)) {
> >              platform_bus_link_device(PLATFORM_BUS_DEVICE(vms-
> >platform_bus_dev),
> >                                       SYS_BUS_DEVICE(dev)); @@ -3067,6
> > +3093,7 @@ static void virt_machine_class_init(ObjectClass *oc, void
> *data)
> >      machine_class_allow_dynamic_sysbus_dev(mc,
> TYPE_VFIO_AMD_XGBE);
> >      machine_class_allow_dynamic_sysbus_dev(mc, TYPE_RAMFB_DEVICE);
> >      machine_class_allow_dynamic_sysbus_dev(mc,
> TYPE_VFIO_PLATFORM);
> > +    machine_class_allow_dynamic_sysbus_dev(mc,
> > + TYPE_ARM_SMMUV3_NESTED);
> >  #ifdef CONFIG_TPM
> >      machine_class_allow_dynamic_sysbus_dev(mc,
> TYPE_TPM_TIS_SYSBUS);
> > #endif diff --git a/hw/core/sysbus-fdt.c b/hw/core/sysbus-fdt.c index
> > eebcd28f9a..0f0d0b3e58 100644
> > --- a/hw/core/sysbus-fdt.c
> > +++ b/hw/core/sysbus-fdt.c
> > @@ -489,6 +489,7 @@ static const BindingEntry bindings[] = {  #ifdef
> > CONFIG_LINUX
> >      TYPE_BINDING(TYPE_VFIO_CALXEDA_XGMAC,
> add_calxeda_midway_xgmac_fdt_node),
> >      TYPE_BINDING(TYPE_VFIO_AMD_XGBE, add_amd_xgbe_fdt_node),
> > +    TYPE_BINDING("arm-smmuv3-nested", no_fdt_node),
> >      VFIO_PLATFORM_BINDING("amd,xgbe-seattle-v1a",
> > add_amd_xgbe_fdt_node),  #endif  #ifdef CONFIG_TPM diff --git
> > a/include/hw/arm/smmuv3.h b/include/hw/arm/smmuv3.h index
> > d183a62766..87e628be7a 100644
> > --- a/include/hw/arm/smmuv3.h
> > +++ b/include/hw/arm/smmuv3.h
> > @@ -84,6 +84,21 @@ struct SMMUv3Class {
> >  #define TYPE_ARM_SMMUV3   "arm-smmuv3"
> >  OBJECT_DECLARE_TYPE(SMMUv3State, SMMUv3Class, ARM_SMMUV3)
> >
> > +#define TYPE_ARM_SMMUV3_NESTED   "arm-smmuv3-nested"
> > +OBJECT_DECLARE_TYPE(SMMUv3NestedState, SMMUv3NestedClass,
> > +ARM_SMMUV3_NESTED)
> > +
> > +struct SMMUv3NestedState {
> > +    SMMUv3State smmuv3_state;
> > +};
> > +
> > +struct SMMUv3NestedClass {
> > +    /*< private >*/
> > +    SMMUv3Class smmuv3_class;
> > +    /*< public >*/
> > +
> > +    DeviceRealize parent_realize;
> > +};
> > +
> >  #define STAGE1_SUPPORTED(s)      FIELD_EX32(s->idr[0], IDR0, S1P)
> >  #define STAGE2_SUPPORTED(s)      FIELD_EX32(s->idr[0], IDR0, S2P)
> >
> > diff --git a/include/hw/arm/virt.h b/include/hw/arm/virt.h index
> > 46f48fe561..50e47a4ef3 100644
> > --- a/include/hw/arm/virt.h
> > +++ b/include/hw/arm/virt.h
> > @@ -50,6 +50,9 @@
> >  /* MMIO region size for SMMUv3 */
> >  #define SMMU_IO_LEN 0x20000
> >
> > +/* Max supported nested SMMUv3 */
> > +#define MAX_SMMU_NESTED 128
> Ouch, that many?!

😊. I just came up with the max we can support the allocated MMIO space.
We do have systems at present which has 8 physical SMMUv3s at the moment.
Probably 16/32 would be a better number I guess.

Thanks,
Shameer

Reply via email to