Hi Tom, > From: Tom Rix <t...@redhat.com> > On 9/28/20 5:29 PM, Nicolas Chautru wrote: > > Adding capability and functions to support MSI interrupts, call backs > > and inforing. > > > > Signed-off-by: Nicolas Chautru <nicolas.chau...@intel.com> > > Acked-by: Liu Tianjiao <tianjiao....@intel.com> > > --- > > drivers/baseband/acc100/rte_acc100_pmd.c | 288 > > ++++++++++++++++++++++++++++++- > > drivers/baseband/acc100/rte_acc100_pmd.h | 15 ++ > > 2 files changed, 300 insertions(+), 3 deletions(-) > > > > diff --git a/drivers/baseband/acc100/rte_acc100_pmd.c > > b/drivers/baseband/acc100/rte_acc100_pmd.c > > index 7d4c3df..b6d9e7c 100644 > > --- a/drivers/baseband/acc100/rte_acc100_pmd.c > > +++ b/drivers/baseband/acc100/rte_acc100_pmd.c > > @@ -339,6 +339,213 @@ > > free_base_addresses(base_addrs, i); > > } > > > > +/* > > + * Find queue_id of a device queue based on details from the Info Ring. > > + * If a queue isn't found UINT16_MAX is returned. > > + */ > > +static inline uint16_t > > +get_queue_id_from_ring_info(struct rte_bbdev_data *data, > > + const union acc100_info_ring_data ring_data) { > > + uint16_t queue_id; > > + > > + for (queue_id = 0; queue_id < data->num_queues; ++queue_id) { > > + struct acc100_queue *acc100_q = > > + data->queues[queue_id].queue_private; > > + if (acc100_q != NULL && acc100_q->aq_id == ring_data.aq_id > && > > + acc100_q->qgrp_id == ring_data.qg_id && > > + acc100_q->vf_id == ring_data.vf_id) > > + return queue_id; > > If num_queues is large, this linear search will be slow. > > Consider changing the search algorithm.
This is not in the time-critical part of the code. > > > + } > > + > > + return UINT16_MAX; > the interrupt handlers that use this function do not a great job of handling > this error. If that error actually happened, there is not much else that can be done except report the unexpected data. > > +} > > + > > +/* Checks PF Info Ring to find the interrupt cause and handles it > > +accordingly */ static inline void acc100_check_ir(struct > > +acc100_device *acc100_dev) { > > + volatile union acc100_info_ring_data *ring_data; > > + uint16_t info_ring_head = acc100_dev->info_ring_head; > > + if (acc100_dev->info_ring == NULL) > > + return; > > + > > + ring_data = acc100_dev->info_ring + (acc100_dev->info_ring_head & > > + ACC100_INFO_RING_MASK); > > + > > + while (ring_data->valid) { > > + if ((ring_data->int_nb < > ACC100_PF_INT_DMA_DL_DESC_IRQ) || ( > > + ring_data->int_nb > > > + ACC100_PF_INT_DMA_DL5G_DESC_IRQ)) > > + rte_bbdev_log(WARNING, "InfoRing: ITR:%d > Info:0x%x", > > + ring_data->int_nb, ring_data- > >detailed_info); > > + /* Initialize Info Ring entry and move forward */ > > + ring_data->val = 0; > > + info_ring_head++; > > + ring_data = acc100_dev->info_ring + > > + (info_ring_head & > ACC100_INFO_RING_MASK); > These three statements are common for the ring handling, consider a macro > or inline function. 
ok > > + } > > +} > > + > > +/* Checks PF Info Ring to find the interrupt cause and handles it > > +accordingly */ static inline void acc100_pf_interrupt_handler(struct > > +rte_bbdev *dev) { > > + struct acc100_device *acc100_dev = dev->data->dev_private; > > + volatile union acc100_info_ring_data *ring_data; > > + struct acc100_deq_intr_details deq_intr_det; > > + > > + ring_data = acc100_dev->info_ring + (acc100_dev->info_ring_head & > > + ACC100_INFO_RING_MASK); > > + > > + while (ring_data->valid) { > > + > > + rte_bbdev_log_debug( > > + "ACC100 PF Interrupt received, Info Ring > data: 0x%x", > > + ring_data->val); > > + > > + switch (ring_data->int_nb) { > > + case ACC100_PF_INT_DMA_DL_DESC_IRQ: > > + case ACC100_PF_INT_DMA_UL_DESC_IRQ: > > + case ACC100_PF_INT_DMA_UL5G_DESC_IRQ: > > + case ACC100_PF_INT_DMA_DL5G_DESC_IRQ: > > + deq_intr_det.queue_id = > get_queue_id_from_ring_info( > > + dev->data, *ring_data); > > + if (deq_intr_det.queue_id == UINT16_MAX) { > > + rte_bbdev_log(ERR, > > + "Couldn't find queue: aq_id: > %u, qg_id: %u, vf_id: %u", > > + ring_data->aq_id, > > + ring_data->qg_id, > > + ring_data->vf_id); > > + return; > > + } > > + rte_bbdev_pmd_callback_process(dev, > > + RTE_BBDEV_EVENT_DEQUEUE, > &deq_intr_det); > > + break; > > + default: > > + rte_bbdev_pmd_callback_process(dev, > > + RTE_BBDEV_EVENT_ERROR, NULL); > > + break; > > + } > > + > > + /* Initialize Info Ring entry and move forward */ > > + ring_data->val = 0; > > + ++acc100_dev->info_ring_head; > > + ring_data = acc100_dev->info_ring + > > + (acc100_dev->info_ring_head & > > + ACC100_INFO_RING_MASK); > > + } > > +} > > + > > +/* Checks VF Info Ring to find the interrupt cause and handles it > > +accordingly */ static inline void acc100_vf_interrupt_handler(struct > > +rte_bbdev *dev) > very similar to pf case, consider combining. 
> > +{ > > + struct acc100_device *acc100_dev = dev->data->dev_private; > > + volatile union acc100_info_ring_data *ring_data; > > + struct acc100_deq_intr_details deq_intr_det; > > + > > + ring_data = acc100_dev->info_ring + (acc100_dev->info_ring_head & > > + ACC100_INFO_RING_MASK); > > + > > + while (ring_data->valid) { > > + > > + rte_bbdev_log_debug( > > + "ACC100 VF Interrupt received, Info Ring > data: 0x%x", > > + ring_data->val); > > + > > + switch (ring_data->int_nb) { > > + case ACC100_VF_INT_DMA_DL_DESC_IRQ: > > + case ACC100_VF_INT_DMA_UL_DESC_IRQ: > > + case ACC100_VF_INT_DMA_UL5G_DESC_IRQ: > > + case ACC100_VF_INT_DMA_DL5G_DESC_IRQ: > > + /* VFs are not aware of their vf_id - it's set to 0 in > > + * queue structures. > > + */ > > + ring_data->vf_id = 0; > > + deq_intr_det.queue_id = > get_queue_id_from_ring_info( > > + dev->data, *ring_data); > > + if (deq_intr_det.queue_id == UINT16_MAX) { > > + rte_bbdev_log(ERR, > > + "Couldn't find queue: aq_id: > %u, qg_id: %u", > > + ring_data->aq_id, > > + ring_data->qg_id); > > + return; > > + } > > + rte_bbdev_pmd_callback_process(dev, > > + RTE_BBDEV_EVENT_DEQUEUE, > &deq_intr_det); > > + break; > > + default: > > + rte_bbdev_pmd_callback_process(dev, > > + RTE_BBDEV_EVENT_ERROR, NULL); > > + break; > > + } > > + > > + /* Initialize Info Ring entry and move forward */ > > + ring_data->valid = 0; > > + ++acc100_dev->info_ring_head; > > + ring_data = acc100_dev->info_ring + (acc100_dev- > >info_ring_head > > + & ACC100_INFO_RING_MASK); > > + } > > +} > > + > > +/* Interrupt handler triggered by ACC100 dev for handling specific > > +interrupt */ static void acc100_dev_interrupt_handler(void *cb_arg) { > > + struct rte_bbdev *dev = cb_arg; > > + struct acc100_device *acc100_dev = dev->data->dev_private; > > + > > + /* Read info ring */ > > + if (acc100_dev->pf_device) > > + acc100_pf_interrupt_handler(dev); > > combined like .. > > acc100_interrupt_handler(dev, is_pf) unsure it will help readability. 
Much of the code would still be distinct. > > > + else > > + acc100_vf_interrupt_handler(dev); > > +} > > + > > +/* Allocate and setup inforing */ > > +static int > > +allocate_inforing(struct rte_bbdev *dev) > > consider renaming > > allocate_info_ring ok > > > +{ > > + struct acc100_device *d = dev->data->dev_private; > > + const struct acc100_registry_addr *reg_addr; > > + rte_iova_t info_ring_phys; > > + uint32_t phys_low, phys_high; > > + > > + if (d->info_ring != NULL) > > + return 0; /* Already configured */ > > + > > + /* Choose correct registry addresses for the device type */ > > + if (d->pf_device) > > + reg_addr = &pf_reg_addr; > > + else > > + reg_addr = &vf_reg_addr; > > + /* Allocate InfoRing */ > > + d->info_ring = rte_zmalloc_socket("Info Ring", > > + ACC100_INFO_RING_NUM_ENTRIES * > > + sizeof(*d->info_ring), RTE_CACHE_LINE_SIZE, > > + dev->data->socket_id); > > + if (d->info_ring == NULL) { > > + rte_bbdev_log(ERR, > > + "Failed to allocate Info Ring for %s:%u", > > + dev->device->driver->name, > > + dev->data->dev_id); > The callers do not check that this fails. Arguably the error would be self-contained if that did fail, but it doesn't hurt to add the check. Ok. 
> > + return -ENOMEM; > > + } > > + info_ring_phys = rte_malloc_virt2iova(d->info_ring); > > + > > + /* Setup Info Ring */ > > + phys_high = (uint32_t)(info_ring_phys >> 32); > > + phys_low = (uint32_t)(info_ring_phys); > > + acc100_reg_write(d, reg_addr->info_ring_hi, phys_high); > > + acc100_reg_write(d, reg_addr->info_ring_lo, phys_low); > > + acc100_reg_write(d, reg_addr->info_ring_en, > ACC100_REG_IRQ_EN_ALL); > > + d->info_ring_head = (acc100_reg_read(d, reg_addr->info_ring_ptr) & > > + 0xFFF) / sizeof(union acc100_info_ring_data); > > + return 0; > > +} > > + > > + > > /* Allocate 64MB memory used for all software rings */ static int > > acc100_setup_queues(struct rte_bbdev *dev, uint16_t num_queues, int > > socket_id) @@ -426,6 +633,7 @@ > > acc100_reg_write(d, reg_addr->tail_ptrs_dl4g_hi, phys_high); > > acc100_reg_write(d, reg_addr->tail_ptrs_dl4g_lo, phys_low); > > > > + allocate_inforing(dev); > need to check here > > d->harq_layout = rte_zmalloc_socket("HARQ Layout", > > ACC100_HARQ_LAYOUT * sizeof(*d->harq_layout), > > RTE_CACHE_LINE_SIZE, dev->data->socket_id); @@ - > 437,13 +645,53 @@ > > return 0; > > } > > > > +static int > > +acc100_intr_enable(struct rte_bbdev *dev) { > > + int ret; > > + struct acc100_device *d = dev->data->dev_private; > > + > > + /* Only MSI are currently supported */ > > + if (dev->intr_handle->type == RTE_INTR_HANDLE_VFIO_MSI || > > + dev->intr_handle->type == RTE_INTR_HANDLE_UIO) > { > > + > > + allocate_inforing(dev); > need to check here > > + > > + ret = rte_intr_enable(dev->intr_handle); > > + if (ret < 0) { > > + rte_bbdev_log(ERR, > > + "Couldn't enable interrupts for > device: %s", > > + dev->data->name); > > + rte_free(d->info_ring); > > + return ret; > > + } > > + ret = rte_intr_callback_register(dev->intr_handle, > > + acc100_dev_interrupt_handler, dev); > > + if (ret < 0) { > > + rte_bbdev_log(ERR, > > + "Couldn't register interrupt callback > for device: %s", > > + dev->data->name); > > + 
rte_free(d->info_ring); > does intr need to be disabled here ? Well, I don't see a lot of consistency with other drivers; sometimes these calls are not even checked for failure. I would rather defer any change to a future patch if required, as this is the same code already used in other bbdev drivers (if it is changed, I would rather all of them were changed the same way). > > + return ret; > > + } > > + > > + return 0; > > + } > > + > > + rte_bbdev_log(ERR, "ACC100 (%s) supports only VFIO MSI > interrupts", > > + dev->data->name); > > + return -ENOTSUP; > > +} > > + > > /* Free 64MB memory used for software rings */ static int > > acc100_dev_close(struct rte_bbdev *dev) { > > struct acc100_device *d = dev->data->dev_private; > > + acc100_check_ir(d); > > if (d->sw_rings_base != NULL) { > > rte_free(d->tail_ptrs); > > + rte_free(d->info_ring); > > rte_free(d->sw_rings_base); > > d->sw_rings_base = NULL; > > } > > @@ -643,6 +891,7 @@ > > RTE_BBDEV_TURBO_CRC_TYPE_24B > | > > > RTE_BBDEV_TURBO_HALF_ITERATION_EVEN | > > > RTE_BBDEV_TURBO_EARLY_TERMINATION | > > + > RTE_BBDEV_TURBO_DEC_INTERRUPTS | > > > RTE_BBDEV_TURBO_NEG_LLR_1_BIT_IN | > > RTE_BBDEV_TURBO_MAP_DEC | > > > RTE_BBDEV_TURBO_DEC_TB_CRC_24B_KEEP | @@ -663,6 +912,7 > @@ > > > RTE_BBDEV_TURBO_CRC_24B_ATTACH | > > > RTE_BBDEV_TURBO_RV_INDEX_BYPASS | > > RTE_BBDEV_TURBO_RATE_MATCH | > > + > RTE_BBDEV_TURBO_ENC_INTERRUPTS | > > > RTE_BBDEV_TURBO_ENC_SCATTER_GATHER, > > .num_buffers_src = > > > RTE_BBDEV_TURBO_MAX_CODE_BLOCKS, @@ -676,7 +926,8 @@ > > .capability_flags = > > RTE_BBDEV_LDPC_RATE_MATCH | > > > RTE_BBDEV_LDPC_CRC_24B_ATTACH | > > - > RTE_BBDEV_LDPC_INTERLEAVER_BYPASS, > > + > RTE_BBDEV_LDPC_INTERLEAVER_BYPASS | > > + > RTE_BBDEV_LDPC_ENC_INTERRUPTS, > > .num_buffers_src = > > > RTE_BBDEV_LDPC_MAX_CODE_BLOCKS, > > .num_buffers_dst = > > @@ -701,7 +952,8 @@ > > RTE_BBDEV_LDPC_DECODE_BYPASS | > > RTE_BBDEV_LDPC_DEC_SCATTER_GATHER | > > > RTE_BBDEV_LDPC_HARQ_6BIT_COMPRESSION | > > - RTE_BBDEV_LDPC_LLR_COMPRESSION, > > + 
RTE_BBDEV_LDPC_LLR_COMPRESSION | > > + RTE_BBDEV_LDPC_DEC_INTERRUPTS, > > .llr_size = 8, > > .llr_decimals = 1, > > .num_buffers_src = > > @@ -751,14 +1003,39 @@ > > #else > > dev_info->harq_buffer_size = 0; > > #endif > > + acc100_check_ir(d); > > +} > > + > > +static int > > +acc100_queue_intr_enable(struct rte_bbdev *dev, uint16_t queue_id) { > > + struct acc100_queue *q = dev->data- > >queues[queue_id].queue_private; > > + > > + if (dev->intr_handle->type != RTE_INTR_HANDLE_VFIO_MSI && > > + dev->intr_handle->type != RTE_INTR_HANDLE_UIO) > > + return -ENOTSUP; > > + > > + q->irq_enable = 1; > > + return 0; > > +} > > + > > +static int > > +acc100_queue_intr_disable(struct rte_bbdev *dev, uint16_t queue_id) { > > + struct acc100_queue *q = dev->data- > >queues[queue_id].queue_private; > > + q->irq_enable = 0; > A -ENOTSUP above, should need similar check here. How can this fail when we purely disable? > > + return 0; > > } > > > > static const struct rte_bbdev_ops acc100_bbdev_ops = { > > .setup_queues = acc100_setup_queues, > > + .intr_enable = acc100_intr_enable, > > .close = acc100_dev_close, > > .info_get = acc100_dev_info_get, > > .queue_setup = acc100_queue_setup, > > .queue_release = acc100_queue_release, > > + .queue_intr_enable = acc100_queue_intr_enable, > > + .queue_intr_disable = acc100_queue_intr_disable > > }; > > > > /* ACC100 PCI PF address map */ > > @@ -3018,8 +3295,10 @@ > > ? (1 << RTE_BBDEV_DATA_ERROR) : 0); > > op->status |= ((rsp.dma_err) ? (1 << RTE_BBDEV_DRV_ERROR) : 0); > > op->status |= ((rsp.fcw_err) ? 
(1 << RTE_BBDEV_DRV_ERROR) : 0); > > - if (op->status != 0) > > + if (op->status != 0) { > > q_data->queue_stats.dequeue_err_count++; > > + acc100_check_ir(q->d); > > + } > > > > /* CRC invalid if error exists */ > > if (!op->status) > > @@ -3076,6 +3355,9 @@ > > op->status |= 1 << RTE_BBDEV_SYNDROME_ERROR; > > op->ldpc_dec.iter_count = (uint8_t) rsp.iter_cnt; > > > > + if (op->status & (1 << RTE_BBDEV_DRV_ERROR)) > > + acc100_check_ir(q->d); > > + > > /* Check if this is the last desc in batch (Atomic Queue) */ > > if (desc->req.last_desc_in_batch) { > > (*aq_dequeued)++; > > diff --git a/drivers/baseband/acc100/rte_acc100_pmd.h > > b/drivers/baseband/acc100/rte_acc100_pmd.h > > index 78686c1..8980fa5 100644 > > --- a/drivers/baseband/acc100/rte_acc100_pmd.h > > +++ b/drivers/baseband/acc100/rte_acc100_pmd.h > > @@ -559,7 +559,14 @@ struct acc100_device { > > /* Virtual address of the info memory routed to the this function > under > > * operation, whether it is PF or VF. > > */ > > + union acc100_info_ring_data *info_ring; > > Need a comment that this array needs a sentinel ? I can clarify the expected HW behaviour a bit. Thanks > > Tom > > > + > > union acc100_harq_layout_data *harq_layout; > > + /* Virtual Info Ring head */ > > + uint16_t info_ring_head; > > + /* Number of bytes available for each queue in device, depending > on > > + * how many queues are enabled with configure() > > + */ > > uint32_t sw_ring_size; > > uint32_t ddr_size; /* Size in kB */ > > uint32_t *tail_ptrs; /* Base address of response tail pointer buffer > > */ @@ -575,4 +582,12 @@ struct acc100_device { > > bool configured; /**< True if this ACC100 device is configured */ > > }; > > > > +/** > > + * Structure with details about RTE_BBDEV_EVENT_DEQUEUE event. It's > > +passed to > > + * the callback function. > > + */ > > +struct acc100_deq_intr_details { > > + uint16_t queue_id; > > +}; > > + > > #endif /* _RTE_ACC100_PMD_H_ */