On Thu, Apr 14, 2022 at 11:10 AM Jason Wang <jasow...@redhat.com> wrote: > > On Thu, Apr 14, 2022 at 12:33 AM Eugenio Pérez <epere...@redhat.com> wrote: > > > > We can configure ASID per group, but we still use asid 0 for every vdpa > > device. Multiple asid support for cvq will be introduced in next > > patches > > > > Signed-off-by: Eugenio Pérez <epere...@redhat.com> > > --- > > include/hw/virtio/vhost.h | 4 ++ > > hw/net/vhost_net.c | 5 +++ > > hw/virtio/vhost-vdpa.c | 95 ++++++++++++++++++++++++++++++++------- > > net/vhost-vdpa.c | 4 +- > > hw/virtio/trace-events | 9 ++-- > > 5 files changed, 94 insertions(+), 23 deletions(-) > > > > diff --git a/include/hw/virtio/vhost.h b/include/hw/virtio/vhost.h > > index 034868fa9e..640cf82168 100644 > > --- a/include/hw/virtio/vhost.h > > +++ b/include/hw/virtio/vhost.h > > @@ -76,8 +76,12 @@ struct vhost_dev { > > int vq_index; > > /* one past the last vq index for the virtio device (not vhost) */ > > int vq_index_end; > > + /* one past the last vq index of this virtqueue group */ > > + int vq_group_index_end; > > /* if non-zero, minimum required value for max_queues */ > > int num_queues; > > + /* address space id */ > > Instead of doing shortcuts like this, I think we need to have > abstraction as what kernel did. That is to say, introduce structures > like: > > struct vhost_vdpa_dev_group; > struct vhost_vdpa_as; > > Then having pointers to those structures like > > struct vhost_vdpa { > ... > struct vhost_vdpa_dev_group *group; > }; > > struct vhost_vdpa_group { > ... > uint32_t id; > struct vhost_vdpa_as; > }; > > struct vhost_vdpa_as { > uint32_t id; > MemoryListener listener; > }; > > We can read the group topology during initialization and allocate the > structure accordingly. If the CVQ has its own group: > > 1) We know we will have 2 AS otherwise 1 AS > 2) allocate #AS and attach the group to the corresponding AS > > Then we know the > > 1) map/unmap and listener is done per as instead of per group or vdpa. > 2) AS attach/detach is done per group > > And it would simplify the future extension when we want to advertise > the as/groups to guests. > > To simplify the reviewing, we can introduce the above concept before > the ASID uAPIs and assume a 1 group 1 as a model as a start. >
I think it's doable, let me refactor the code that way and I'll come back with the results. Thanks! > Thanks > > > + uint32_t address_space_id; > > /* Must be a vq group different than any other vhost dev */ > > bool independent_vq_group; > > uint64_t features; > > diff --git a/hw/net/vhost_net.c b/hw/net/vhost_net.c > > index 10480e19e5..a34df739a7 100644 > > --- a/hw/net/vhost_net.c > > +++ b/hw/net/vhost_net.c > > @@ -344,15 +344,20 @@ int vhost_net_start(VirtIODevice *dev, NetClientState > > *ncs, > > > > for (i = 0; i < nvhosts; i++) { > > bool cvq_idx = i >= data_queue_pairs; > > + uint32_t vq_group_end; > > > > if (!cvq_idx) { > > peer = qemu_get_peer(ncs, i); > > + vq_group_end = 2 * data_queue_pairs; > > } else { /* Control Virtqueue */ > > peer = qemu_get_peer(ncs, n->max_queue_pairs); > > + vq_group_end = 2 * data_queue_pairs + 1; > > } > > > > net = get_vhost_net(peer); > > + net->dev.address_space_id = !!cvq_idx; > > net->dev.independent_vq_group = !!cvq_idx; > > + net->dev.vq_group_index_end = vq_group_end; > > vhost_net_set_vq_index(net, i * 2, index_end); > > > > /* Suppress the masking guest notifiers on vhost user > > diff --git a/hw/virtio/vhost-vdpa.c b/hw/virtio/vhost-vdpa.c > > index 4096555242..5ed211287c 100644 > > --- a/hw/virtio/vhost-vdpa.c > > +++ b/hw/virtio/vhost-vdpa.c > > @@ -79,6 +79,9 @@ static int vhost_vdpa_dma_map(struct vhost_vdpa *v, > > hwaddr iova, hwaddr size, > > int ret = 0; > > > > msg.type = v->msg_type; > > + if (v->dev->backend_cap & BIT_ULL(VHOST_BACKEND_F_IOTLB_ASID)) { > > + msg.asid = v->dev->address_space_id; > > + } > > msg.iotlb.iova = iova; > > msg.iotlb.size = size; > > msg.iotlb.uaddr = (uint64_t)(uintptr_t)vaddr; > > @@ -90,8 +93,9 @@ static int vhost_vdpa_dma_map(struct vhost_vdpa *v, > > hwaddr iova, hwaddr size, > > return 0; > > } > > > > - trace_vhost_vdpa_dma_map(v, fd, msg.type, msg.iotlb.iova, > > msg.iotlb.size, > > - msg.iotlb.uaddr, msg.iotlb.perm, > > msg.iotlb.type); > > + trace_vhost_vdpa_dma_map(v, fd, msg.type, msg.asid, msg.iotlb.iova, > > + msg.iotlb.size, msg.iotlb.uaddr, > > msg.iotlb.perm, > > + msg.iotlb.type); > > > > if (write(fd, &msg, sizeof(msg)) != sizeof(msg)) { > > error_report("failed to write, fd=%d, errno=%d (%s)", > > @@ -109,6 +113,9 @@ static int vhost_vdpa_dma_unmap(struct vhost_vdpa *v, > > hwaddr iova, > > int fd = v->device_fd; > > int ret = 0; > > > > + if (v->dev->backend_cap & BIT_ULL(VHOST_BACKEND_F_IOTLB_ASID)) { > > + msg.asid = v->dev->address_space_id; > > + } > > msg.type = v->msg_type; > > msg.iotlb.iova = iova; > > msg.iotlb.size = size; > > @@ -119,7 +126,7 @@ static int vhost_vdpa_dma_unmap(struct vhost_vdpa *v, > > hwaddr iova, > > return 0; > > } > > > > - trace_vhost_vdpa_dma_unmap(v, fd, msg.type, msg.iotlb.iova, > > + trace_vhost_vdpa_dma_unmap(v, fd, msg.type, msg.asid, msg.iotlb.iova, > > msg.iotlb.size, msg.iotlb.type); > > > > if (write(fd, &msg, sizeof(msg)) != sizeof(msg)) { > > @@ -134,6 +141,7 @@ static int vhost_vdpa_dma_unmap(struct vhost_vdpa *v, > > hwaddr iova, > > static void vhost_vdpa_listener_commit(MemoryListener *listener) > > { > > struct vhost_vdpa *v = container_of(listener, struct vhost_vdpa, > > listener); > > + struct vhost_dev *dev = v->dev; > > struct vhost_msg_v2 msg = {}; > > int fd = v->device_fd; > > size_t num = v->iotlb_updates->len; > > @@ -142,9 +150,14 @@ static void vhost_vdpa_listener_commit(MemoryListener > > *listener) > > return; > > } > > > > + if (dev->backend_cap & (0x1ULL << VHOST_BACKEND_F_IOTLB_ASID)) { > > + msg.asid = v->dev->address_space_id; > > + } > > + > > msg.type = v->msg_type; > > msg.iotlb.type = VHOST_IOTLB_BATCH_BEGIN; > > - trace_vhost_vdpa_listener_begin_batch(v, fd, msg.type, msg.iotlb.type); > > + trace_vhost_vdpa_listener_begin_batch(v, fd, msg.type, msg.asid, > > + msg.iotlb.type); > > if (write(fd, &msg, sizeof(msg)) != sizeof(msg)) { > > error_report("failed to write BEGIN_BATCH, fd=%d, errno=%d (%s)", > > fd, errno, strerror(errno)); > > @@ -162,7 +175,8 @@ static void vhost_vdpa_listener_commit(MemoryListener > > *listener) > > } > > > > msg.iotlb.type = VHOST_IOTLB_BATCH_END; > > - trace_vhost_vdpa_listener_commit(v, fd, msg.type, msg.iotlb.type); > > + trace_vhost_vdpa_listener_commit(v, fd, msg.type, msg.asid, > > + msg.iotlb.type); > > if (write(fd, &msg, sizeof(msg)) != sizeof(msg)) { > > error_report("failed to write, fd=%d, errno=%d (%s)", > > fd, errno, strerror(errno)); > > @@ -1171,10 +1185,48 @@ call_err: > > return false; > > } > > > > +static int vhost_vdpa_set_vq_group_address_space_id(struct vhost_dev *dev, > > + struct vhost_vring_state > > *asid) > > +{ > > + trace_vhost_vdpa_set_vq_group_address_space_id(dev, asid->index, > > asid->num); > > + return vhost_vdpa_call(dev, VHOST_VDPA_SET_GROUP_ASID, asid); > > +} > > + > > +static int vhost_vdpa_set_address_space_id(struct vhost_dev *dev) > > +{ > > + struct vhost_vring_state vq_group = { > > + .index = dev->vq_index, > > + }; > > + struct vhost_vring_state asid; > > + int ret; > > + > > + if (!dev->address_space_id) { > > + return 0; > > + } > > + > > + ret = vhost_vdpa_get_vring_group(dev, &vq_group); > > + if (unlikely(ret)) { > > + error_report("Can't read vq group, errno=%d (%s)", ret, > > + g_strerror(-ret)); > > + return ret; > > + } > > + > > + asid.index = vq_group.num; > > + asid.num = dev->address_space_id; > > + ret = vhost_vdpa_set_vq_group_address_space_id(dev, &asid); > > + if (unlikely(ret)) { > > + error_report("Can't set vq group %u asid %u, errno=%d (%s)", > > + asid.index, asid.num, ret, g_strerror(-ret)); > > + } > > + return ret; > > +} > > + > > static int vhost_vdpa_dev_start(struct vhost_dev *dev, bool started) > > { > > struct vhost_vdpa *v = dev->opaque; > > - bool ok; > > + bool vq_group_end, ok; > > + int r = 0; > > + > > trace_vhost_vdpa_dev_start(dev, started); > > > > if (started) { > > @@ -1183,6 +1235,10 @@ static int vhost_vdpa_dev_start(struct vhost_dev > > *dev, bool started) > > !vhost_dev_is_independent_group(dev)) { > > return -1; > > } > > + r = vhost_vdpa_set_address_space_id(dev); > > + if (unlikely(r)) { > > + return r; > > + } > > ok = vhost_vdpa_svqs_start(dev); > > if (unlikely(!ok)) { > > return -1; > > @@ -1196,21 +1252,26 @@ static int vhost_vdpa_dev_start(struct vhost_dev > > *dev, bool started) > > vhost_vdpa_host_notifiers_uninit(dev, dev->nvqs); > > } > > > > - if (dev->vq_index + dev->nvqs != dev->vq_index_end) { > > - return 0; > > + vq_group_end = dev->vq_index + dev->nvqs == dev->vq_group_index_end; > > + if (vq_group_end && started) { > > + memory_listener_register(&v->listener, &address_space_memory); > > } > > > > - if (started) { > > - memory_listener_register(&v->listener, &address_space_memory); > > - return vhost_vdpa_add_status(dev, VIRTIO_CONFIG_S_DRIVER_OK); > > - } else { > > - vhost_vdpa_reset_device(dev); > > - vhost_vdpa_add_status(dev, VIRTIO_CONFIG_S_ACKNOWLEDGE | > > - VIRTIO_CONFIG_S_DRIVER); > > - memory_listener_unregister(&v->listener); > > + if (dev->vq_index + dev->nvqs == dev->vq_index_end) { > > + if (started) { > > + r = vhost_vdpa_add_status(dev, VIRTIO_CONFIG_S_DRIVER_OK); > > + } else { > > + vhost_vdpa_reset_device(dev); > > + vhost_vdpa_add_status(dev, VIRTIO_CONFIG_S_ACKNOWLEDGE | > > + VIRTIO_CONFIG_S_DRIVER); > > + } > > + } > > > > - return 0; > > + if (vq_group_end && !started) { > > + memory_listener_unregister(&v->listener); > > } > > + > > + return r; > > } > > > > static int vhost_vdpa_set_log_base(struct vhost_dev *dev, uint64_t base, > > diff --git a/net/vhost-vdpa.c b/net/vhost-vdpa.c > > index 15c3e4f703..a6f803ea4e 100644 > > --- a/net/vhost-vdpa.c > > +++ b/net/vhost-vdpa.c > > @@ -473,8 +473,8 @@ int net_init_vhost_vdpa(const Netdev *netdev, const > > char *name, > > > > if (has_cvq) { > > nc = net_vhost_vdpa_init(peer, TYPE_VHOST_VDPA, name, > > - vdpa_device_fd, i, 1, false, opts->x_svq, > > - iova_tree); > > + vdpa_device_fd, i, 1, > > + false, opts->x_svq, iova_tree); > > if (!nc) > > goto err; > > } > > diff --git a/hw/virtio/trace-events b/hw/virtio/trace-events > > index e6fdc03514..2858deac60 100644 > > --- a/hw/virtio/trace-events > > +++ b/hw/virtio/trace-events > > @@ -23,10 +23,10 @@ vhost_user_postcopy_waker_found(uint64_t client_addr) > > "0x%"PRIx64 > > vhost_user_postcopy_waker_nomatch(const char *rb, uint64_t rb_offset) "%s > > + 0x%"PRIx64 > > > > # vhost-vdpa.c > > -vhost_vdpa_dma_map(void *vdpa, int fd, uint32_t msg_type, uint64_t iova, > > uint64_t size, uint64_t uaddr, uint8_t perm, uint8_t type) "vdpa:%p fd: %d > > msg_type: %"PRIu32" iova: 0x%"PRIx64" size: 0x%"PRIx64" uaddr: 0x%"PRIx64" > > perm: 0x%"PRIx8" type: %"PRIu8 > > -vhost_vdpa_dma_unmap(void *vdpa, int fd, uint32_t msg_type, uint64_t iova, > > uint64_t size, uint8_t type) "vdpa:%p fd: %d msg_type: %"PRIu32" iova: > > 0x%"PRIx64" size: 0x%"PRIx64" type: %"PRIu8 > > -vhost_vdpa_listener_begin_batch(void *v, int fd, uint32_t msg_type, > > uint8_t type) "vdpa:%p fd: %d msg_type: %"PRIu32" type: %"PRIu8 > > -vhost_vdpa_listener_commit(void *v, int fd, uint32_t msg_type, uint8_t > > type) "vdpa:%p fd: %d msg_type: %"PRIu32" type: %"PRIu8 > > +vhost_vdpa_dma_map(void *vdpa, int fd, uint32_t msg_type, uint32_t asid, > > uint64_t iova, uint64_t size, uint64_t uaddr, uint8_t perm, uint8_t type) > > "vdpa:%p fd: %d msg_type: %"PRIu32" asid: %"PRIu32" iova: 0x%"PRIx64" size: > > 0x%"PRIx64" uaddr: 0x%"PRIx64" perm: 0x%"PRIx8" type: %"PRIu8 > > +vhost_vdpa_dma_unmap(void *vdpa, int fd, uint32_t msg_type, uint32_t asid, > > uint64_t iova, uint64_t size, uint8_t type) "vdpa:%p fd: %d msg_type: > > %"PRIu32" asid: %"PRIu32" iova: 0x%"PRIx64" size: 0x%"PRIx64" type: %"PRIu8 > > +vhost_vdpa_listener_begin_batch(void *v, int fd, uint32_t msg_type, > > uint32_t asid, uint8_t type) "vdpa:%p fd: %d msg_type: %"PRIu32" asid: > > %"PRIu32" type: %"PRIu8 > > +vhost_vdpa_listener_commit(void *v, int fd, uint32_t msg_type, uint32_t > > asid, uint8_t type) "vdpa:%p fd: %d msg_type: %"PRIu32" asid: %"PRIu32" > > type: %"PRIu8 > > vhost_vdpa_listener_region_add(void *vdpa, uint64_t iova, uint64_t llend, > > void *vaddr, bool readonly) "vdpa: %p iova 0x%"PRIx64" llend 0x%"PRIx64" > > vaddr: %p read-only: %d" > > vhost_vdpa_listener_region_del(void *vdpa, uint64_t iova, uint64_t llend) > > "vdpa: %p iova 0x%"PRIx64" llend 0x%"PRIx64 > > vhost_vdpa_add_status(void *dev, uint8_t status) "dev: %p status: 0x%"PRIx8 > > @@ -44,6 +44,7 @@ vhost_vdpa_dump_config(void *dev, const char *line) "dev: > > %p %s" > > vhost_vdpa_set_config(void *dev, uint32_t offset, uint32_t size, uint32_t > > flags) "dev: %p offset: %"PRIu32" size: %"PRIu32" flags: 0x%"PRIx32 > > vhost_vdpa_get_config(void *dev, void *config, uint32_t config_len) "dev: > > %p config: %p config_len: %"PRIu32 > > vhost_vdpa_get_vring_group(void *dev, unsigned int index, unsigned int > > num) "dev: %p index: %u num: %u" > > +vhost_vdpa_set_vq_group_address_space_id(void *dev, unsigned int index, > > unsigned int num) "dev: %p index: %u num: %u" > > vhost_vdpa_dev_start(void *dev, bool started) "dev: %p started: %d" > > vhost_vdpa_set_log_base(void *dev, uint64_t base, unsigned long long size, > > int refcnt, int fd, void *log) "dev: %p base: 0x%"PRIx64" size: %llu > > refcnt: %d fd: %d log: %p" > > vhost_vdpa_set_vring_addr(void *dev, unsigned int index, unsigned int > > flags, uint64_t desc_user_addr, uint64_t used_user_addr, uint64_t > > avail_user_addr, uint64_t log_guest_addr) "dev: %p index: %u flags: 0x%x > > desc_user_addr: 0x%"PRIx64" used_user_addr: 0x%"PRIx64" avail_user_addr: > > 0x%"PRIx64" log_guest_addr: 0x%"PRIx64 > > -- > > 2.27.0 > > >