On Thu, Apr 14, 2022 at 12:33 AM Eugenio Pérez <epere...@redhat.com> wrote:
>
> We can configure an ASID per group, but we still use ASID 0 for every vdpa
> device. Multiple ASID support for CVQ will be introduced in the next
> patches.
>
> Signed-off-by: Eugenio Pérez <epere...@redhat.com>
> ---
>  include/hw/virtio/vhost.h |  4 ++
>  hw/net/vhost_net.c        |  5 +++
>  hw/virtio/vhost-vdpa.c    | 95 ++++++++++++++++++++++++++++++++-------
>  net/vhost-vdpa.c          |  4 +-
>  hw/virtio/trace-events    |  9 ++--
>  5 files changed, 94 insertions(+), 23 deletions(-)
>
> diff --git a/include/hw/virtio/vhost.h b/include/hw/virtio/vhost.h
> index 034868fa9e..640cf82168 100644
> --- a/include/hw/virtio/vhost.h
> +++ b/include/hw/virtio/vhost.h
> @@ -76,8 +76,12 @@ struct vhost_dev {
>      int vq_index;
>      /* one past the last vq index for the virtio device (not vhost) */
>      int vq_index_end;
> +    /* one past the last vq index of this virtqueue group */
> +    int vq_group_index_end;
>      /* if non-zero, minimum required value for max_queues */
>      int num_queues;
> +    /* address space id */

Instead of taking shortcuts like this, I think we need an abstraction
similar to what the kernel did. That is to say, introduce structures
like:

struct vhost_vdpa_dev_group;
struct vhost_vdpa_as;

Then have pointers to those structures, like:

struct vhost_vdpa {
        ...
        struct vhost_vdpa_dev_group *group;
};

struct vhost_vdpa_dev_group {
        ...
        uint32_t id;
        struct vhost_vdpa_as *as;
};

struct vhost_vdpa_as {
        uint32_t id;
        MemoryListener listener;
};

We can read the group topology during initialization and allocate the
structures accordingly. If the CVQ has its own group:

1) we know we will have 2 ASes, otherwise 1 AS
2) allocate that many ASes and attach each group to the corresponding AS

Then we know that:

1) map/unmap and the listener are done per AS instead of per group or per
vdpa device
2) AS attach/detach is done per group

And it would simplify future extensions when we want to advertise the
ASes/groups to guests.
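
For instance, a minimal sketch of the init path (reusing the structures
above; the helper name, its parameters, and the assumption that the CVQ
group is the last one are all made up just to illustrate the allocation
and attach logic):

#include <stdint.h>
#include <stdlib.h>

typedef struct MemoryListener MemoryListener; /* opaque here; the real one is QEMU's */

struct vhost_vdpa_as {
    uint32_t id;
    MemoryListener *listener; /* map/unmap and the listener live here, per AS */
};

struct vhost_vdpa_dev_group {
    uint32_t id;
    struct vhost_vdpa_as *as; /* the AS this group is currently attached to */
};

/*
 * Read the group topology at initialization: allocate 2 ASes when the CVQ
 * has its own group, otherwise 1, then attach each group to its AS. A real
 * version would issue VHOST_VDPA_SET_GROUP_ASID per group at attach time.
 */
static int vhost_vdpa_alloc_as(struct vhost_vdpa_dev_group *groups,
                               unsigned ngroups, bool cvq_own_group)
{
    unsigned nas = cvq_own_group ? 2 : 1;
    struct vhost_vdpa_as *as = calloc(nas, sizeof(*as));

    if (!as) {
        return -1;
    }
    for (unsigned i = 0; i < nas; i++) {
        as[i].id = i; /* AS 0 for the data vqs, AS 1 for the CVQ if present */
    }
    for (unsigned i = 0; i < ngroups; i++) {
        /* attach: data groups to AS 0, the (last) CVQ group to AS 1 */
        bool is_cvq_group = cvq_own_group && i == ngroups - 1;
        groups[i].as = &as[is_cvq_group ? 1 : 0];
    }
    return 0;
}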

To simplify the review, we can introduce the above concepts before the
ASID uAPIs and assume a 1 group / 1 AS model as a start.

Thanks

> +    uint32_t address_space_id;
>      /* Must be a vq group different than any other vhost dev */
>      bool independent_vq_group;
>      uint64_t features;
> diff --git a/hw/net/vhost_net.c b/hw/net/vhost_net.c
> index 10480e19e5..a34df739a7 100644
> --- a/hw/net/vhost_net.c
> +++ b/hw/net/vhost_net.c
> @@ -344,15 +344,20 @@ int vhost_net_start(VirtIODevice *dev, NetClientState *ncs,
>
>      for (i = 0; i < nvhosts; i++) {
>          bool cvq_idx = i >= data_queue_pairs;
> +        uint32_t vq_group_end;
>
>          if (!cvq_idx) {
>              peer = qemu_get_peer(ncs, i);
> +            vq_group_end = 2 * data_queue_pairs;
>          } else { /* Control Virtqueue */
>              peer = qemu_get_peer(ncs, n->max_queue_pairs);
> +            vq_group_end = 2 * data_queue_pairs + 1;
>          }
>
>          net = get_vhost_net(peer);
> +        net->dev.address_space_id = !!cvq_idx;
>          net->dev.independent_vq_group = !!cvq_idx;
> +        net->dev.vq_group_index_end = vq_group_end;
>          vhost_net_set_vq_index(net, i * 2, index_end);
>
>          /* Suppress the masking guest notifiers on vhost user
> diff --git a/hw/virtio/vhost-vdpa.c b/hw/virtio/vhost-vdpa.c
> index 4096555242..5ed211287c 100644
> --- a/hw/virtio/vhost-vdpa.c
> +++ b/hw/virtio/vhost-vdpa.c
> @@ -79,6 +79,9 @@ static int vhost_vdpa_dma_map(struct vhost_vdpa *v, hwaddr iova, hwaddr size,
>      int ret = 0;
>
>      msg.type = v->msg_type;
> +    if (v->dev->backend_cap & BIT_ULL(VHOST_BACKEND_F_IOTLB_ASID)) {
> +        msg.asid = v->dev->address_space_id;
> +    }
>      msg.iotlb.iova = iova;
>      msg.iotlb.size = size;
>      msg.iotlb.uaddr = (uint64_t)(uintptr_t)vaddr;
> @@ -90,8 +93,9 @@ static int vhost_vdpa_dma_map(struct vhost_vdpa *v, hwaddr iova, hwaddr size,
>          return 0;
>      }
>
> -    trace_vhost_vdpa_dma_map(v, fd, msg.type, msg.iotlb.iova, msg.iotlb.size,
> -                            msg.iotlb.uaddr, msg.iotlb.perm, msg.iotlb.type);
> +    trace_vhost_vdpa_dma_map(v, fd, msg.type, msg.asid, msg.iotlb.iova,
> +                             msg.iotlb.size, msg.iotlb.uaddr, msg.iotlb.perm,
> +                             msg.iotlb.type);
>
>      if (write(fd, &msg, sizeof(msg)) != sizeof(msg)) {
>          error_report("failed to write, fd=%d, errno=%d (%s)",
> @@ -109,6 +113,9 @@ static int vhost_vdpa_dma_unmap(struct vhost_vdpa *v, hwaddr iova,
>      int fd = v->device_fd;
>      int ret = 0;
>
> +    if (v->dev->backend_cap & BIT_ULL(VHOST_BACKEND_F_IOTLB_ASID)) {
> +        msg.asid = v->dev->address_space_id;
> +    }
>      msg.type = v->msg_type;
>      msg.iotlb.iova = iova;
>      msg.iotlb.size = size;
> @@ -119,7 +126,7 @@ static int vhost_vdpa_dma_unmap(struct vhost_vdpa *v, hwaddr iova,
>          return 0;
>      }
>
> -    trace_vhost_vdpa_dma_unmap(v, fd, msg.type, msg.iotlb.iova,
> +    trace_vhost_vdpa_dma_unmap(v, fd, msg.type, msg.asid, msg.iotlb.iova,
>                                 msg.iotlb.size, msg.iotlb.type);
>
>      if (write(fd, &msg, sizeof(msg)) != sizeof(msg)) {
> @@ -134,6 +141,7 @@ static int vhost_vdpa_dma_unmap(struct vhost_vdpa *v, hwaddr iova,
>  static void vhost_vdpa_listener_commit(MemoryListener *listener)
>  {
>      struct vhost_vdpa *v = container_of(listener, struct vhost_vdpa, listener);
> +    struct vhost_dev *dev = v->dev;
>      struct vhost_msg_v2 msg = {};
>      int fd = v->device_fd;
>      size_t num = v->iotlb_updates->len;
> @@ -142,9 +150,14 @@ static void vhost_vdpa_listener_commit(MemoryListener *listener)
>          return;
>      }
>
> +    if (dev->backend_cap & (0x1ULL << VHOST_BACKEND_F_IOTLB_ASID)) {
> +        msg.asid = v->dev->address_space_id;
> +    }
> +
>      msg.type = v->msg_type;
>      msg.iotlb.type = VHOST_IOTLB_BATCH_BEGIN;
> -    trace_vhost_vdpa_listener_begin_batch(v, fd, msg.type, msg.iotlb.type);
> +    trace_vhost_vdpa_listener_begin_batch(v, fd, msg.type, msg.asid,
> +                                          msg.iotlb.type);
>      if (write(fd, &msg, sizeof(msg)) != sizeof(msg)) {
>          error_report("failed to write BEGIN_BATCH, fd=%d, errno=%d (%s)",
>                       fd, errno, strerror(errno));
> @@ -162,7 +175,8 @@ static void vhost_vdpa_listener_commit(MemoryListener *listener)
>      }
>
>      msg.iotlb.type = VHOST_IOTLB_BATCH_END;
> -    trace_vhost_vdpa_listener_commit(v, fd, msg.type, msg.iotlb.type);
> +    trace_vhost_vdpa_listener_commit(v, fd, msg.type, msg.asid,
> +                                     msg.iotlb.type);
>      if (write(fd, &msg, sizeof(msg)) != sizeof(msg)) {
>          error_report("failed to write, fd=%d, errno=%d (%s)",
>                       fd, errno, strerror(errno));
> @@ -1171,10 +1185,48 @@ call_err:
>      return false;
>  }
>
> +static int vhost_vdpa_set_vq_group_address_space_id(struct vhost_dev *dev,
> +                                                struct vhost_vring_state *asid)
> +{
> +    trace_vhost_vdpa_set_vq_group_address_space_id(dev, asid->index, asid->num);
> +    return vhost_vdpa_call(dev, VHOST_VDPA_SET_GROUP_ASID, asid);
> +}
> +
> +static int vhost_vdpa_set_address_space_id(struct vhost_dev *dev)
> +{
> +    struct vhost_vring_state vq_group = {
> +        .index = dev->vq_index,
> +    };
> +    struct vhost_vring_state asid;
> +    int ret;
> +
> +    if (!dev->address_space_id) {
> +        return 0;
> +    }
> +
> +    ret = vhost_vdpa_get_vring_group(dev, &vq_group);
> +    if (unlikely(ret)) {
> +        error_report("Can't read vq group, errno=%d (%s)", ret,
> +                     g_strerror(-ret));
> +        return ret;
> +    }
> +
> +    asid.index = vq_group.num;
> +    asid.num = dev->address_space_id;
> +    ret = vhost_vdpa_set_vq_group_address_space_id(dev, &asid);
> +    if (unlikely(ret)) {
> +        error_report("Can't set vq group %u asid %u, errno=%d (%s)",
> +            asid.index, asid.num, ret, g_strerror(-ret));
> +    }
> +    return ret;
> +}
> +
>  static int vhost_vdpa_dev_start(struct vhost_dev *dev, bool started)
>  {
>      struct vhost_vdpa *v = dev->opaque;
> -    bool ok;
> +    bool vq_group_end, ok;
> +    int r = 0;
> +
>      trace_vhost_vdpa_dev_start(dev, started);
>
>      if (started) {
> @@ -1183,6 +1235,10 @@ static int vhost_vdpa_dev_start(struct vhost_dev *dev, bool started)
>              !vhost_dev_is_independent_group(dev)) {
>              return -1;
>          }
> +        r = vhost_vdpa_set_address_space_id(dev);
> +        if (unlikely(r)) {
> +            return r;
> +        }
>          ok = vhost_vdpa_svqs_start(dev);
>          if (unlikely(!ok)) {
>              return -1;
> @@ -1196,21 +1252,26 @@ static int vhost_vdpa_dev_start(struct vhost_dev *dev, bool started)
>          vhost_vdpa_host_notifiers_uninit(dev, dev->nvqs);
>      }
>
> -    if (dev->vq_index + dev->nvqs != dev->vq_index_end) {
> -        return 0;
> +    vq_group_end = dev->vq_index + dev->nvqs == dev->vq_group_index_end;
> +    if (vq_group_end && started) {
> +        memory_listener_register(&v->listener, &address_space_memory);
>      }
>
> -    if (started) {
> -        memory_listener_register(&v->listener, &address_space_memory);
> -        return vhost_vdpa_add_status(dev, VIRTIO_CONFIG_S_DRIVER_OK);
> -    } else {
> -        vhost_vdpa_reset_device(dev);
> -        vhost_vdpa_add_status(dev, VIRTIO_CONFIG_S_ACKNOWLEDGE |
> -                                   VIRTIO_CONFIG_S_DRIVER);
> -        memory_listener_unregister(&v->listener);
> +    if (dev->vq_index + dev->nvqs == dev->vq_index_end) {
> +        if (started) {
> +            r = vhost_vdpa_add_status(dev, VIRTIO_CONFIG_S_DRIVER_OK);
> +        } else {
> +            vhost_vdpa_reset_device(dev);
> +            vhost_vdpa_add_status(dev, VIRTIO_CONFIG_S_ACKNOWLEDGE |
> +                                       VIRTIO_CONFIG_S_DRIVER);
> +        }
> +    }
>
> -        return 0;
> +    if (vq_group_end && !started) {
> +        memory_listener_unregister(&v->listener);
>      }
> +
> +    return r;
>  }
>
>  static int vhost_vdpa_set_log_base(struct vhost_dev *dev, uint64_t base,
> diff --git a/net/vhost-vdpa.c b/net/vhost-vdpa.c
> index 15c3e4f703..a6f803ea4e 100644
> --- a/net/vhost-vdpa.c
> +++ b/net/vhost-vdpa.c
> @@ -473,8 +473,8 @@ int net_init_vhost_vdpa(const Netdev *netdev, const char *name,
>
>      if (has_cvq) {
>          nc = net_vhost_vdpa_init(peer, TYPE_VHOST_VDPA, name,
> -                                 vdpa_device_fd, i, 1, false, opts->x_svq,
> -                                 iova_tree);
> +                                 vdpa_device_fd, i, 1,
> +                                 false, opts->x_svq, iova_tree);
>          if (!nc)
>              goto err;
>      }
> diff --git a/hw/virtio/trace-events b/hw/virtio/trace-events
> index e6fdc03514..2858deac60 100644
> --- a/hw/virtio/trace-events
> +++ b/hw/virtio/trace-events
> @@ -23,10 +23,10 @@ vhost_user_postcopy_waker_found(uint64_t client_addr) "0x%"PRIx64
>  vhost_user_postcopy_waker_nomatch(const char *rb, uint64_t rb_offset) "%s + 0x%"PRIx64
>
>  # vhost-vdpa.c
> -vhost_vdpa_dma_map(void *vdpa, int fd, uint32_t msg_type, uint64_t iova, uint64_t size, uint64_t uaddr, uint8_t perm, uint8_t type) "vdpa:%p fd: %d msg_type: %"PRIu32" iova: 0x%"PRIx64" size: 0x%"PRIx64" uaddr: 0x%"PRIx64" perm: 0x%"PRIx8" type: %"PRIu8
> -vhost_vdpa_dma_unmap(void *vdpa, int fd, uint32_t msg_type, uint64_t iova, uint64_t size, uint8_t type) "vdpa:%p fd: %d msg_type: %"PRIu32" iova: 0x%"PRIx64" size: 0x%"PRIx64" type: %"PRIu8
> -vhost_vdpa_listener_begin_batch(void *v, int fd, uint32_t msg_type, uint8_t type)  "vdpa:%p fd: %d msg_type: %"PRIu32" type: %"PRIu8
> -vhost_vdpa_listener_commit(void *v, int fd, uint32_t msg_type, uint8_t type)  "vdpa:%p fd: %d msg_type: %"PRIu32" type: %"PRIu8
> +vhost_vdpa_dma_map(void *vdpa, int fd, uint32_t msg_type, uint32_t asid, uint64_t iova, uint64_t size, uint64_t uaddr, uint8_t perm, uint8_t type) "vdpa:%p fd: %d msg_type: %"PRIu32" asid: %"PRIu32" iova: 0x%"PRIx64" size: 0x%"PRIx64" uaddr: 0x%"PRIx64" perm: 0x%"PRIx8" type: %"PRIu8
> +vhost_vdpa_dma_unmap(void *vdpa, int fd, uint32_t msg_type, uint32_t asid, uint64_t iova, uint64_t size, uint8_t type) "vdpa:%p fd: %d msg_type: %"PRIu32" asid: %"PRIu32" iova: 0x%"PRIx64" size: 0x%"PRIx64" type: %"PRIu8
> +vhost_vdpa_listener_begin_batch(void *v, int fd, uint32_t msg_type, uint32_t asid, uint8_t type)  "vdpa:%p fd: %d msg_type: %"PRIu32" asid: %"PRIu32" type: %"PRIu8
> +vhost_vdpa_listener_commit(void *v, int fd, uint32_t msg_type, uint32_t asid, uint8_t type)  "vdpa:%p fd: %d msg_type: %"PRIu32" asid: %"PRIu32" type: %"PRIu8
>  vhost_vdpa_listener_region_add(void *vdpa, uint64_t iova, uint64_t llend, void *vaddr, bool readonly) "vdpa: %p iova 0x%"PRIx64" llend 0x%"PRIx64" vaddr: %p read-only: %d"
>  vhost_vdpa_listener_region_del(void *vdpa, uint64_t iova, uint64_t llend) "vdpa: %p iova 0x%"PRIx64" llend 0x%"PRIx64
>  vhost_vdpa_add_status(void *dev, uint8_t status) "dev: %p status: 0x%"PRIx8
> @@ -44,6 +44,7 @@ vhost_vdpa_dump_config(void *dev, const char *line) "dev: %p %s"
>  vhost_vdpa_set_config(void *dev, uint32_t offset, uint32_t size, uint32_t flags) "dev: %p offset: %"PRIu32" size: %"PRIu32" flags: 0x%"PRIx32
>  vhost_vdpa_get_config(void *dev, void *config, uint32_t config_len) "dev: %p config: %p config_len: %"PRIu32
>  vhost_vdpa_get_vring_group(void *dev, unsigned int index, unsigned int num) "dev: %p index: %u num: %u"
> +vhost_vdpa_set_vq_group_address_space_id(void *dev, unsigned int index, unsigned int num) "dev: %p index: %u num: %u"
>  vhost_vdpa_dev_start(void *dev, bool started) "dev: %p started: %d"
>  vhost_vdpa_set_log_base(void *dev, uint64_t base, unsigned long long size, int refcnt, int fd, void *log) "dev: %p base: 0x%"PRIx64" size: %llu refcnt: %d fd: %d log: %p"
>  vhost_vdpa_set_vring_addr(void *dev, unsigned int index, unsigned int flags, uint64_t desc_user_addr, uint64_t used_user_addr, uint64_t avail_user_addr, uint64_t log_guest_addr) "dev: %p index: %u flags: 0x%x desc_user_addr: 0x%"PRIx64" used_user_addr: 0x%"PRIx64" avail_user_addr: 0x%"PRIx64" log_guest_addr: 0x%"PRIx64
> --
> 2.27.0
>

