On 1/29/20 11:09 AM, Matan Azrad wrote:
> The HW virtq object represents an emulated context for a VIRTIO_NET
> virtqueue which was created and managed by a VIRTIO_NET driver as
> defined in VIRTIO Specification.
> 
> Add support to prepare and release all the basic HW resources needed
> for the user virtqs emulation according to the rte_vhost configurations.
> 
> This patch prepares the basic configurations needed by DevX commands to
> create a virtq.
> 
> Add new file mlx5_vdpa_virtq.c to manage virtq operations.
> 
> Signed-off-by: Matan Azrad <ma...@mellanox.com>
> Acked-by: Viacheslav Ovsiienko <viachesl...@mellanox.com>
> ---
>  drivers/vdpa/mlx5/Makefile          |   1 +
>  drivers/vdpa/mlx5/meson.build       |   1 +
>  drivers/vdpa/mlx5/mlx5_vdpa.c       |   1 +
>  drivers/vdpa/mlx5/mlx5_vdpa.h       |  36 ++++++
>  drivers/vdpa/mlx5/mlx5_vdpa_virtq.c | 212 ++++++++++++++++++++++++++++++++++++
>  5 files changed, 251 insertions(+)
>  create mode 100644 drivers/vdpa/mlx5/mlx5_vdpa_virtq.c
> 
> diff --git a/drivers/vdpa/mlx5/Makefile b/drivers/vdpa/mlx5/Makefile
> index 7f13756..353e262 100644
> --- a/drivers/vdpa/mlx5/Makefile
> +++ b/drivers/vdpa/mlx5/Makefile
> @@ -10,6 +10,7 @@ LIB = librte_pmd_mlx5_vdpa.a
>  SRCS-$(CONFIG_RTE_LIBRTE_MLX5_VDPA_PMD) += mlx5_vdpa.c
>  SRCS-$(CONFIG_RTE_LIBRTE_MLX5_VDPA_PMD) += mlx5_vdpa_mem.c
>  SRCS-$(CONFIG_RTE_LIBRTE_MLX5_VDPA_PMD) += mlx5_vdpa_event.c
> +SRCS-$(CONFIG_RTE_LIBRTE_MLX5_VDPA_PMD) += mlx5_vdpa_virtq.c
>  
>  # Basic CFLAGS.
>  CFLAGS += -O3
> diff --git a/drivers/vdpa/mlx5/meson.build b/drivers/vdpa/mlx5/meson.build
> index c609f7c..e017f95 100644
> --- a/drivers/vdpa/mlx5/meson.build
> +++ b/drivers/vdpa/mlx5/meson.build
> @@ -14,6 +14,7 @@ sources = files(
>       'mlx5_vdpa.c',
>       'mlx5_vdpa_mem.c',
>       'mlx5_vdpa_event.c',
> +     'mlx5_vdpa_virtq.c',
>  )
>  cflags_options = [
>       '-std=c11',
> diff --git a/drivers/vdpa/mlx5/mlx5_vdpa.c b/drivers/vdpa/mlx5/mlx5_vdpa.c
> index c67f93d..4d30b35 100644
> --- a/drivers/vdpa/mlx5/mlx5_vdpa.c
> +++ b/drivers/vdpa/mlx5/mlx5_vdpa.c
> @@ -229,6 +229,7 @@
>               goto error;
>       }
>       SLIST_INIT(&priv->mr_list);
> +     SLIST_INIT(&priv->virtq_list);
>       pthread_mutex_lock(&priv_list_lock);
>       TAILQ_INSERT_TAIL(&priv_list, priv, next);
>       pthread_mutex_unlock(&priv_list_lock);
> diff --git a/drivers/vdpa/mlx5/mlx5_vdpa.h b/drivers/vdpa/mlx5/mlx5_vdpa.h
> index 30030b7..a7e2185 100644
> --- a/drivers/vdpa/mlx5/mlx5_vdpa.h
> +++ b/drivers/vdpa/mlx5/mlx5_vdpa.h
> @@ -53,6 +53,19 @@ struct mlx5_vdpa_query_mr {
>       int is_indirect;
>  };
>  
> +struct mlx5_vdpa_virtq {
> +     SLIST_ENTRY(mlx5_vdpa_virtq) next;
> +     uint16_t index;
> +     uint16_t vq_size;
> +     struct mlx5_devx_obj *virtq;
> +     struct mlx5_vdpa_event_qp eqp;
> +     struct {
> +             struct mlx5dv_devx_umem *obj;
> +             void *buf;
> +             uint32_t size;
> +     } umems[3];
> +};
> +
>  struct mlx5_vdpa_priv {
>       TAILQ_ENTRY(mlx5_vdpa_priv) next;
>       int id; /* vDPA device id. */
> @@ -69,6 +82,10 @@ struct mlx5_vdpa_priv {
>       struct mlx5dv_devx_event_channel *eventc;
>       struct mlx5dv_devx_uar *uar;
>       struct rte_intr_handle intr_handle;
> +     struct mlx5_devx_obj *td;
> +     struct mlx5_devx_obj *tis;
> +     uint16_t nr_virtqs;
> +     SLIST_HEAD(virtq_list, mlx5_vdpa_virtq) virtq_list;
>       SLIST_HEAD(mr_list, mlx5_vdpa_query_mr) mr_list;
>  };
>  
> @@ -146,4 +163,23 @@ int mlx5_vdpa_event_qp_create(struct mlx5_vdpa_priv *priv, uint16_t desc_n,
>   */
>  void mlx5_vdpa_cqe_event_unset(struct mlx5_vdpa_priv *priv);
>  
> +/**
> + * Release a virtq and all its related resources.
> + *
> + * @param[in] priv
> + *   The vdpa driver private structure.
> + */
> +void mlx5_vdpa_virtqs_release(struct mlx5_vdpa_priv *priv);
> +
> +/**
> + * Create all the HW virtqs resources and all their related resources.
> + *
> + * @param[in] priv
> + *   The vdpa driver private structure.
> + *
> + * @return
> + *   0 on success, a negative errno value otherwise and rte_errno is set.
> + */
> +int mlx5_vdpa_virtqs_prepare(struct mlx5_vdpa_priv *priv);
> +
>  #endif /* RTE_PMD_MLX5_VDPA_H_ */
> diff --git a/drivers/vdpa/mlx5/mlx5_vdpa_virtq.c b/drivers/vdpa/mlx5/mlx5_vdpa_virtq.c
> new file mode 100644
> index 0000000..781bccf
> --- /dev/null
> +++ b/drivers/vdpa/mlx5/mlx5_vdpa_virtq.c
> @@ -0,0 +1,212 @@
> +/* SPDX-License-Identifier: BSD-3-Clause
> + * Copyright 2019 Mellanox Technologies, Ltd
> + */
> +#include <string.h>
> +
> +#include <rte_malloc.h>
> +#include <rte_errno.h>
> +
> +#include <mlx5_common.h>
> +
> +#include "mlx5_vdpa_utils.h"
> +#include "mlx5_vdpa.h"
> +
> +
> +static int
> +mlx5_vdpa_virtq_unset(struct mlx5_vdpa_virtq *virtq)
> +{
> +     int i;
> +
> +     if (virtq->virtq) {
> +             claim_zero(mlx5_devx_cmd_destroy(virtq->virtq));
> +             virtq->virtq = NULL;
> +     }
> +     for (i = 0; i < 3; ++i) {
> +             if (virtq->umems[i].obj)
> +                     claim_zero(mlx5_glue->devx_umem_dereg
> +                                                      (virtq->umems[i].obj));
> +             if (virtq->umems[i].buf)
> +                     rte_free(virtq->umems[i].buf);
> +     }
> +     memset(&virtq->umems, 0, sizeof(virtq->umems));
> +     if (virtq->eqp.fw_qp)
> +             mlx5_vdpa_event_qp_destroy(&virtq->eqp);
> +     return 0;
> +}
> +
> +void
> +mlx5_vdpa_virtqs_release(struct mlx5_vdpa_priv *priv)
> +{
> +     struct mlx5_vdpa_virtq *entry;
> +     struct mlx5_vdpa_virtq *next;
> +
> +     entry = SLIST_FIRST(&priv->virtq_list);
> +     while (entry) {
> +             next = SLIST_NEXT(entry, next);
> +             mlx5_vdpa_virtq_unset(entry);
> +             SLIST_REMOVE(&priv->virtq_list, entry, mlx5_vdpa_virtq, next);
> +             rte_free(entry);
> +             entry = next;
> +     }
> +     SLIST_INIT(&priv->virtq_list);
> +     if (priv->tis) {
> +             claim_zero(mlx5_devx_cmd_destroy(priv->tis));
> +             priv->tis = NULL;
> +     }
> +     if (priv->td) {
> +             claim_zero(mlx5_devx_cmd_destroy(priv->td));
> +             priv->td = NULL;
> +     }
> +}
> +
> +static uint64_t
> +mlx5_vdpa_hva_to_gpa(struct rte_vhost_memory *mem, uint64_t hva)
> +{
> +     struct rte_vhost_mem_region *reg;
> +     uint32_t i;
> +     uint64_t gpa = 0;
> +
> +     for (i = 0; i < mem->nregions; i++) {
> +             reg = &mem->regions[i];
> +             if (hva >= reg->host_user_addr &&
> +                 hva < reg->host_user_addr + reg->size) {
> +                     gpa = hva - reg->host_user_addr + reg->guest_phys_addr;
> +                     break;
> +             }
> +     }
> +     return gpa;
> +}

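I think you may need a third parameter for the size to map, so that the
whole range [hva, hva + size) can be checked to lie within a single
memory region rather than only its first byte.
Otherwise, you would be vulnerable to CVE-2018-1059.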

> +
> +static int
> +mlx5_vdpa_virtq_setup(struct mlx5_vdpa_priv *priv,
> +                   struct mlx5_vdpa_virtq *virtq, int index)
> +{
> +     struct rte_vhost_vring vq;
> +     struct mlx5_devx_virtq_attr attr = {0};
> +     uint64_t gpa;
> +     int ret;
> +     int i;
> +     uint16_t last_avail_idx;
> +     uint16_t last_used_idx;
> +
> +     ret = rte_vhost_get_vhost_vring(priv->vid, index, &vq);
> +     if (ret)
> +             return -1;
> +     virtq->index = index;
> +     virtq->vq_size = vq.size;
> +     /*
> +      * No need event QPs creation when the guest in poll mode or when the
> +      * capability allows it.
> +      */
> +     attr.event_mode = vq.callfd != -1 || !(priv->caps.event_mode & (1 <<
> +                                            MLX5_VIRTQ_EVENT_MODE_NO_MSIX)) ?
> +                                                   MLX5_VIRTQ_EVENT_MODE_QP :
> +                                               MLX5_VIRTQ_EVENT_MODE_NO_MSIX;
> +     if (attr.event_mode == MLX5_VIRTQ_EVENT_MODE_QP) {
> +             ret = mlx5_vdpa_event_qp_create(priv, vq.size, vq.callfd,
> +                                             &virtq->eqp);
> +             if (ret) {
> +                     DRV_LOG(ERR, "Failed to create event QPs for virtq %d.",
> +                             index);
> +                     return -1;
> +             }
> +             attr.qp_id = virtq->eqp.fw_qp->id;
> +     } else {
> +             DRV_LOG(INFO, "Virtq %d is, for sure, working by poll mode, no"
> +                     " need event QPs and event mechanism.", index);
> +     }
> +     /* Setup 3 UMEMs for each virtq. */
> +     for (i = 0; i < 3; ++i) {
> +             virtq->umems[i].size = priv->caps.umems[i].a * vq.size +
> +                                                       priv->caps.umems[i].b;
> +             virtq->umems[i].buf = rte_zmalloc(__func__,
> +                                               virtq->umems[i].size, 4096);
> +             if (!virtq->umems[i].buf) {
> +                     DRV_LOG(ERR, "Cannot allocate umem %d memory for virtq"
> +                             " %u.", i, index);
> +                     goto error;
> +             }
> +             virtq->umems[i].obj = mlx5_glue->devx_umem_reg(priv->ctx,
> +                                                     virtq->umems[i].buf,
> +                                                     virtq->umems[i].size,
> +                                                     IBV_ACCESS_LOCAL_WRITE);
> +             if (!virtq->umems[i].obj) {
> +                     DRV_LOG(ERR, "Failed to register umem %d for virtq %u.",
> +                             i, index);
> +                     goto error;
> +             }
> +             attr.umems[i].id = virtq->umems[i].obj->umem_id;
> +             attr.umems[i].offset = 0;
> +             attr.umems[i].size = virtq->umems[i].size;
> +     }
> +     gpa = mlx5_vdpa_hva_to_gpa(priv->vmem, (uint64_t)(uintptr_t)vq.desc);
> +     if (!gpa) {
> +             DRV_LOG(ERR, "Fail to get GPA for descriptor ring.");
> +             goto error;
> +     }
> +     attr.desc_addr = gpa;
> +     gpa = mlx5_vdpa_hva_to_gpa(priv->vmem, (uint64_t)(uintptr_t)vq.used);
> +     if (!gpa) {
> +             DRV_LOG(ERR, "Fail to get GPA for used ring.");
> +             goto error;
> +     }
> +     attr.used_addr = gpa;
> +     gpa = mlx5_vdpa_hva_to_gpa(priv->vmem, (uint64_t)(uintptr_t)vq.avail);
> +     if (!gpa) {
> +             DRV_LOG(ERR, "Fail to get GPA for available ring.");
> +             goto error;
> +     }
> +     attr.available_addr = gpa;
> +     rte_vhost_get_vring_base(priv->vid, index, &last_avail_idx,
> +                              &last_used_idx);
> +     DRV_LOG(INFO, "vid %d: Init last_avail_idx=%d, last_used_idx=%d for "
> +             "virtq %d.", priv->vid, last_avail_idx, last_used_idx, index);
> +     attr.hw_available_index = last_avail_idx;
> +     attr.hw_used_index = last_used_idx;
> +     attr.q_size = vq.size;
> +     attr.mkey = priv->gpa_mkey_index;
> +     attr.tis_id = priv->tis->id;
> +     attr.queue_index = index;
> +     virtq->virtq = mlx5_devx_cmd_create_virtq(priv->ctx, &attr);
> +     if (!virtq->virtq)
> +             goto error;
> +     return 0;
> +error:
> +     mlx5_vdpa_virtq_unset(virtq);
> +     return -1;
> +}
> +
> +int
> +mlx5_vdpa_virtqs_prepare(struct mlx5_vdpa_priv *priv)
> +{
> +     struct mlx5_devx_tis_attr tis_attr = {0};
> +     struct mlx5_vdpa_virtq *virtq;
> +     uint32_t i;
> +     uint16_t nr_vring = rte_vhost_get_vring_num(priv->vid);
> +
> +     priv->td = mlx5_devx_cmd_create_td(priv->ctx);
> +     if (!priv->td) {
> +             DRV_LOG(ERR, "Failed to create transport domain.");
> +             return -rte_errno;
> +     }
> +     tis_attr.transport_domain = priv->td->id;
> +     priv->tis = mlx5_devx_cmd_create_tis(priv->ctx, &tis_attr);
> +     if (!priv->tis) {
> +             DRV_LOG(ERR, "Failed to create TIS.");
> +             goto error;
> +     }
> +     for (i = 0; i < nr_vring; i++) {
> +             virtq = rte_zmalloc(__func__, sizeof(*virtq), 0);
> +             if (!virtq || mlx5_vdpa_virtq_setup(priv, virtq, i)) {
> +                     if (virtq)
> +                             rte_free(virtq);
> +                     goto error;
> +             }
> +             SLIST_INSERT_HEAD(&priv->virtq_list, virtq, next);
> +     }
> +     priv->nr_virtqs = nr_vring;
> +     return 0;
> +error:
> +     mlx5_vdpa_virtqs_release(priv);
> +     return -1;
> +}
> 

Reply via email to