> Subject: [PATCH 1/1] net/mana: add 32 bit short doorbell
> 
> Add 32 bit short doorbell support. Ring short doorbell when running in 32 bit
> applicactions.
> 
> Cc: sta...@dpdk.org
> 
> Signed-off-by: Wei Hu <w...@microsoft.com>
> ---
>  drivers/net/mana/gdma.c | 95
> +++++++++++++++++++++++++++++++++++++++++
>  drivers/net/mana/mana.h | 25 +++++++++++
>  drivers/net/mana/rx.c   | 52 ++++++++++++++++++++++
>  drivers/net/mana/tx.c   | 28 ++++++++++++
>  4 files changed, 200 insertions(+)
> 
> diff --git a/drivers/net/mana/gdma.c b/drivers/net/mana/gdma.c index
> 65685fe236..d1da025d1b 100644
> --- a/drivers/net/mana/gdma.c
> +++ b/drivers/net/mana/gdma.c
> @@ -166,6 +166,97 @@ gdma_post_work_request(struct
> mana_gdma_queue *queue,
>       return 0;
>  }
> 
> +#ifdef RTE_ARCH_32
> +union gdma_short_doorbell_entry {
> +     uint32_t     as_uint32;
> +
> +     struct {
> +             uint32_t tail_ptr_incr  : 16; /* Number of CQEs */
> +             uint32_t id             : 12;
> +             uint32_t reserved       : 3;
> +             uint32_t arm            : 1;
> +     } cq;
> +
> +     struct {
> +             uint32_t tail_ptr_incr  : 16; /* In number of bytes */
> +             uint32_t id             : 12;
> +             uint32_t reserved       : 4;
> +     } rq;
> +
> +     struct {
> +             uint32_t tail_ptr_incr  : 16; /* In number of bytes */
> +             uint32_t id             : 12;
> +             uint32_t reserved       : 4;
> +     } sq;
> +
> +     struct {
> +             uint32_t tail_ptr_incr  : 16; /* Number of EQEs */
> +             uint32_t id             : 12;
> +             uint32_t reserved       : 3;
> +             uint32_t arm            : 1;
> +     } eq;
> +}; /* HW DATA */
> +
> +enum {
> +     DOORBELL_SHORT_OFFSET_SQ = 0x10,
> +     DOORBELL_SHORT_OFFSET_RQ = 0x410,
> +     DOORBELL_SHORT_OFFSET_CQ = 0x810,
> +     DOORBELL_SHORT_OFFSET_EQ = 0xFF0,
> +};
> +
> +/*
> + * Write to hardware doorbell to notify new activity.
> + */
> +int
> +mana_ring_short_doorbell(void *db_page, enum gdma_queue_types
> queue_type,
> +                      uint32_t queue_id, uint32_t tail_incr, uint8_t arm) {
> +     uint8_t *addr = db_page;
> +     union gdma_short_doorbell_entry e = {};
> +
> +     if ((queue_id & ~GDMA_SHORT_DB_QID_MASK) ||
> +         (tail_incr & ~GDMA_SHORT_DB_INC_MASK)) {
> +             DP_LOG(ERR, "%s: queue_id %u or "
> +                    "tail_incr %u overflowed, queue type %d",
> +                    __func__, queue_id, tail_incr, queue_type);
> +             return -EINVAL;
> +     }
> +
> +     switch (queue_type) {
> +     case GDMA_QUEUE_SEND:
> +             e.sq.id = queue_id;
> +             e.sq.tail_ptr_incr = tail_incr;
> +             addr += DOORBELL_SHORT_OFFSET_SQ;
> +             break;
> +
> +     case GDMA_QUEUE_RECEIVE:
> +             e.rq.id = queue_id;
> +             e.rq.tail_ptr_incr = tail_incr;
> +             addr += DOORBELL_SHORT_OFFSET_RQ;
> +             break;
> +
> +     case GDMA_QUEUE_COMPLETION:
> +             e.cq.id = queue_id;
> +             e.cq.tail_ptr_incr = tail_incr;
> +             e.cq.arm = arm;
> +             addr += DOORBELL_SHORT_OFFSET_CQ;
> +             break;
> +
> +     default:
> +             DP_LOG(ERR, "Unsupported queue type %d", queue_type);
> +             return -1;
> +     }
> +
> +     /* Ensure all writes are done before ringing doorbell */
> +     rte_wmb();
> +
> +     DP_LOG(DEBUG, "db_page %p addr %p queue_id %u type %u tail %u
> arm %u",
> +            db_page, addr, queue_id, queue_type, tail_incr, arm);
> +
> +     rte_write32(e.as_uint32, addr);
> +     return 0;
> +}
> +#else
>  union gdma_doorbell_entry {
>       uint64_t     as_uint64;
> 
> @@ -248,6 +339,7 @@ mana_ring_doorbell(void *db_page, enum
> gdma_queue_types queue_type,
>       rte_write64(e.as_uint64, addr);
>       return 0;
>  }
> +#endif
> 
>  /*
>   * Poll completion queue for completions.
> @@ -287,6 +379,9 @@ gdma_poll_completion_queue(struct
> mana_gdma_queue *cq,
>               num_comp++;
> 
>               cq->head++;
> +#ifdef RTE_ARCH_32
> +             cq->head_incr_to_short_db++;
> +#endif
> 
>               DP_LOG(DEBUG, "comp new 0x%x old 0x%x cqe 0x%x wq %u
> sq %u head %u",
>                      new_owner_bits, old_owner_bits, cqe_owner_bits, diff --
> git a/drivers/net/mana/mana.h b/drivers/net/mana/mana.h index
> 5801491d75..848d87c096 100644
> --- a/drivers/net/mana/mana.h
> +++ b/drivers/net/mana/mana.h
> @@ -50,6 +50,19 @@ struct mana_shared_data {  #define
> MAX_TX_WQE_SIZE 512  #define MAX_RX_WQE_SIZE 256
> 
> +/* For 32 bit only */
> +#ifdef RTE_ARCH_32
> +#define      GDMA_SHORT_DB_INC_MASK 0xffff
> +#define      GDMA_SHORT_DB_QID_MASK 0xfff
> +
> +#define GDMA_SHORT_DB_MAX_WQE        (0x10000 /
> GDMA_WQE_ALIGNMENT_UNIT_SIZE)
> +
> +#define TX_WQE_SHORT_DB_THRESHOLD \
> +     (GDMA_SHORT_DB_MAX_WQE - (2 * MAX_TX_WQE_SIZE)) #define
> +RX_WQE_SHORT_DB_THRESHOLD \

GDMA_SHORT_DB_MAX_WQE is in BU, MAX_TX_WQE_SIZE is in bytes.

Doing math on two different units...

And why using "2*", using "1*" is good enough?




> +     (GDMA_SHORT_DB_MAX_WQE - (2 * MAX_RX_WQE_SIZE)) #endif
> +
>  /* Values from the GDMA specification document, WQE format description */
> #define INLINE_OOB_SMALL_SIZE_IN_BYTES 8  #define
> INLINE_OOB_LARGE_SIZE_IN_BYTES 24 @@ -375,6 +388,9 @@ struct
> mana_gdma_queue {
>       uint32_t id;
>       uint32_t head;
>       uint32_t tail;
> +#ifdef RTE_ARCH_32
> +     uint32_t head_incr_to_short_db;
> +#endif
>  };
> 
>  #define MANA_MR_BTREE_PER_QUEUE_N    64
> @@ -425,6 +441,9 @@ struct mana_rxq {
>        */
>       uint32_t desc_ring_head, desc_ring_tail;
> 
> +     /* For storing wqe increment count btw each short doorbell ring */
> +     uint32_t wqe_cnt_to_short_db;
> +
>       struct mana_gdma_queue gdma_rq;
>       struct mana_gdma_queue gdma_cq;
>       struct gdma_comp *gdma_comp_buf;
> @@ -455,8 +474,14 @@ extern int mana_logtype_init;
> 
>  #define PMD_INIT_FUNC_TRACE() PMD_INIT_LOG(DEBUG, " >>")
> 
> +#ifdef RTE_ARCH_32
> +int mana_ring_short_doorbell(void *db_page, enum gdma_queue_types
> queue_type,
> +                          uint32_t queue_id, uint32_t tail_incr,
> +                          uint8_t arm);
> +#else
>  int mana_ring_doorbell(void *db_page, enum gdma_queue_types
> queue_type,
>                      uint32_t queue_id, uint32_t tail, uint8_t arm);
> +#endif
>  int mana_rq_ring_doorbell(struct mana_rxq *rxq);
> 
>  int gdma_post_work_request(struct mana_gdma_queue *queue, diff --git
> a/drivers/net/mana/rx.c b/drivers/net/mana/rx.c index
> 14d9085801..303d129e5b 100644
> --- a/drivers/net/mana/rx.c
> +++ b/drivers/net/mana/rx.c
> @@ -39,10 +39,23 @@ mana_rq_ring_doorbell(struct mana_rxq *rxq)
>       /* Hardware Spec specifies that software client should set 0 for
>        * wqe_cnt for Receive Queues.
>        */
> +#ifdef RTE_ARCH_32
> +     if (rxq->wqe_cnt_to_short_db) {
> +             ret = mana_ring_short_doorbell(db_page,
> GDMA_QUEUE_RECEIVE,
> +                              rxq->gdma_rq.id,
> +                              rxq->wqe_cnt_to_short_db *
> +
>       GDMA_WQE_ALIGNMENT_UNIT_SIZE,
> +                              0);
> +     } else {

Is it possible that rxq->wqe_cnt_to_short_db might be 0 from the caller? The 
caller shouldn't ring the doorbell if there is nothing to ring.





> +             /* No need to ring, just return */
> +             ret = 0;
> +     }
> +#else
>       ret = mana_ring_doorbell(db_page, GDMA_QUEUE_RECEIVE,
>                        rxq->gdma_rq.id,
>                        rxq->gdma_rq.head *
> GDMA_WQE_ALIGNMENT_UNIT_SIZE,
>                        0);
> +#endif
> 
>       if (ret)
>               DP_LOG(ERR, "failed to ring RX doorbell ret %d", ret); @@ -
> 97,6 +110,7 @@ mana_alloc_and_post_rx_wqe(struct mana_rxq *rxq)
>               /* update queue for tracking pending packets */
>               desc->pkt = mbuf;
>               desc->wqe_size_in_bu = wqe_size_in_bu;
> +             rxq->wqe_cnt_to_short_db += wqe_size_in_bu;
>               rxq->desc_ring_head = (rxq->desc_ring_head + 1) % rxq-
> >num_desc;
>       } else {
>               DP_LOG(DEBUG, "failed to post recv ret %d", ret); @@ -
> 115,12 +129,22 @@ mana_alloc_and_post_rx_wqes(struct mana_rxq *rxq)
>       int ret;
>       uint32_t i;
> 
> +#ifdef RTE_ARCH_32
> +     rxq->wqe_cnt_to_short_db = 0;
> +#endif
>       for (i = 0; i < rxq->num_desc; i++) {
>               ret = mana_alloc_and_post_rx_wqe(rxq);
>               if (ret) {
>                       DP_LOG(ERR, "failed to post RX ret = %d", ret);
>                       return ret;
>               }
> +
> +#ifdef RTE_ARCH_32
> +             if (rxq->wqe_cnt_to_short_db >
> RX_WQE_SHORT_DB_THRESHOLD) {
> +                     mana_rq_ring_doorbell(rxq);
> +                     rxq->wqe_cnt_to_short_db = 0;
> +             }
> +#endif
>       }
> 
>       mana_rq_ring_doorbell(rxq);
> @@ -349,6 +373,9 @@ mana_start_rx_queues(struct rte_eth_dev *dev)
> 
>               /* CQ head starts with count */
>               rxq->gdma_cq.head = rxq->gdma_cq.count;
> +#ifdef RTE_ARCH_32
> +             rxq->gdma_cq.head_incr_to_short_db = 0; #endif
> 
>               DRV_LOG(INFO, "rxq cq id %u buf %p count %u size %u",
>                       rxq->gdma_cq.id, rxq->gdma_cq.buffer, @@ -397,6
> +424,10 @@ mana_rx_burst(void *dpdk_rxq, struct rte_mbuf **pkts,
> uint16_t pkts_n)
>       uint32_t i;
>       int polled = 0;
> 
> +#ifdef RTE_ARCH_32
> +     rxq->wqe_cnt_to_short_db = 0;
> +#endif
> +
>  repoll:
>       /* Polling on new completions if we have no backlog */
>       if (rxq->comp_buf_idx == rxq->comp_buf_len) { @@ -505,6 +536,16
> @@ mana_rx_burst(void *dpdk_rxq, struct rte_mbuf **pkts, uint16_t
> pkts_n)
>               wqe_posted++;
>               if (pkt_received == pkts_n)
>                       break;
> +
> +#ifdef RTE_ARCH_32
> +             /* Ring short doorbell if approaching the wqe increment
> +              * limit.
> +              */
> +             if (rxq->wqe_cnt_to_short_db >
> RX_WQE_SHORT_DB_THRESHOLD) {
> +                     mana_rq_ring_doorbell(rxq);
> +                     rxq->wqe_cnt_to_short_db = 0;
> +             }
> +#endif
>       }
> 
>       rxq->backlog_idx = pkt_idx;
> @@ -529,6 +570,16 @@ static int
>  mana_arm_cq(struct mana_rxq *rxq, uint8_t arm)  {
>       struct mana_priv *priv = rxq->priv;
> +#ifdef RTE_ARCH_32
> +     uint16_t cqe_incr = (uint16_t)rxq->gdma_cq.head_incr_to_short_db;

How do you make sure head_incr_to_short_db doesn't overflow?


Thanks,

Long

Reply via email to