On 9/30/20 12:45 PM, Chautru, Nicolas wrote: > Hi Tom, > >> From: Tom Rix <t...@redhat.com> >> On 9/28/20 5:29 PM, Nicolas Chautru wrote: >>> Adding capability and functions to support MSI interrupts, call backs >>> and inforing. >>> >>> Signed-off-by: Nicolas Chautru <nicolas.chau...@intel.com> >>> Acked-by: Liu Tianjiao <tianjiao....@intel.com> >>> --- >>> drivers/baseband/acc100/rte_acc100_pmd.c | 288 >>> ++++++++++++++++++++++++++++++- >>> drivers/baseband/acc100/rte_acc100_pmd.h | 15 ++ >>> 2 files changed, 300 insertions(+), 3 deletions(-) >>> >>> diff --git a/drivers/baseband/acc100/rte_acc100_pmd.c >>> b/drivers/baseband/acc100/rte_acc100_pmd.c >>> index 7d4c3df..b6d9e7c 100644 >>> --- a/drivers/baseband/acc100/rte_acc100_pmd.c >>> +++ b/drivers/baseband/acc100/rte_acc100_pmd.c >>> @@ -339,6 +339,213 @@ >>> free_base_addresses(base_addrs, i); >>> } >>> >>> +/* >>> + * Find queue_id of a device queue based on details from the Info Ring. >>> + * If a queue isn't found UINT16_MAX is returned. >>> + */ >>> +static inline uint16_t >>> +get_queue_id_from_ring_info(struct rte_bbdev_data *data, >>> + const union acc100_info_ring_data ring_data) { >>> + uint16_t queue_id; >>> + >>> + for (queue_id = 0; queue_id < data->num_queues; ++queue_id) { >>> + struct acc100_queue *acc100_q = >>> + data->queues[queue_id].queue_private; >>> + if (acc100_q != NULL && acc100_q->aq_id == ring_data.aq_id >> && >>> + acc100_q->qgrp_id == ring_data.qg_id && >>> + acc100_q->vf_id == ring_data.vf_id) >>> + return queue_id; >> If num_queues is large, this linear search will be slow. >> >> Consider changing the search algorithm. > This is not in the time-critical part of the code ok > > >>> + } >>> + >>> + return UINT16_MAX; >> the interrupt handlers that use this function do not do a great job of handling >> this error. > if that error actually happened then there is not much else that can be done > except reporting the unexpected data.
ok > >>> +} >>> + >>> +/* Checks PF Info Ring to find the interrupt cause and handles it >>> +accordingly */ static inline void acc100_check_ir(struct >>> +acc100_device *acc100_dev) { >>> + volatile union acc100_info_ring_data *ring_data; >>> + uint16_t info_ring_head = acc100_dev->info_ring_head; >>> + if (acc100_dev->info_ring == NULL) >>> + return; >>> + >>> + ring_data = acc100_dev->info_ring + (acc100_dev->info_ring_head & >>> + ACC100_INFO_RING_MASK); >>> + >>> + while (ring_data->valid) { >>> + if ((ring_data->int_nb < >> ACC100_PF_INT_DMA_DL_DESC_IRQ) || ( >>> + ring_data->int_nb > >>> + ACC100_PF_INT_DMA_DL5G_DESC_IRQ)) >>> + rte_bbdev_log(WARNING, "InfoRing: ITR:%d >> Info:0x%x", >>> + ring_data->int_nb, ring_data- >>> detailed_info); >>> + /* Initialize Info Ring entry and move forward */ >>> + ring_data->val = 0; >>> + info_ring_head++; >>> + ring_data = acc100_dev->info_ring + >>> + (info_ring_head & >> ACC100_INFO_RING_MASK); >> These three statements are common for the ring handling, consider a macro >> or inline function. 
> ok > >>> + } >>> +} >>> + >>> +/* Checks PF Info Ring to find the interrupt cause and handles it >>> +accordingly */ static inline void acc100_pf_interrupt_handler(struct >>> +rte_bbdev *dev) { >>> + struct acc100_device *acc100_dev = dev->data->dev_private; >>> + volatile union acc100_info_ring_data *ring_data; >>> + struct acc100_deq_intr_details deq_intr_det; >>> + >>> + ring_data = acc100_dev->info_ring + (acc100_dev->info_ring_head & >>> + ACC100_INFO_RING_MASK); >>> + >>> + while (ring_data->valid) { >>> + >>> + rte_bbdev_log_debug( >>> + "ACC100 PF Interrupt received, Info Ring >> data: 0x%x", >>> + ring_data->val); >>> + >>> + switch (ring_data->int_nb) { >>> + case ACC100_PF_INT_DMA_DL_DESC_IRQ: >>> + case ACC100_PF_INT_DMA_UL_DESC_IRQ: >>> + case ACC100_PF_INT_DMA_UL5G_DESC_IRQ: >>> + case ACC100_PF_INT_DMA_DL5G_DESC_IRQ: >>> + deq_intr_det.queue_id = >> get_queue_id_from_ring_info( >>> + dev->data, *ring_data); >>> + if (deq_intr_det.queue_id == UINT16_MAX) { >>> + rte_bbdev_log(ERR, >>> + "Couldn't find queue: aq_id: >> %u, qg_id: %u, vf_id: %u", >>> + ring_data->aq_id, >>> + ring_data->qg_id, >>> + ring_data->vf_id); >>> + return; >>> + } >>> + rte_bbdev_pmd_callback_process(dev, >>> + RTE_BBDEV_EVENT_DEQUEUE, >> &deq_intr_det); >>> + break; >>> + default: >>> + rte_bbdev_pmd_callback_process(dev, >>> + RTE_BBDEV_EVENT_ERROR, NULL); >>> + break; >>> + } >>> + >>> + /* Initialize Info Ring entry and move forward */ >>> + ring_data->val = 0; >>> + ++acc100_dev->info_ring_head; >>> + ring_data = acc100_dev->info_ring + >>> + (acc100_dev->info_ring_head & >>> + ACC100_INFO_RING_MASK); >>> + } >>> +} >>> + >>> +/* Checks VF Info Ring to find the interrupt cause and handles it >>> +accordingly */ static inline void acc100_vf_interrupt_handler(struct >>> +rte_bbdev *dev) >> very similar to pf case, consider combining. 
>>> +{ >>> + struct acc100_device *acc100_dev = dev->data->dev_private; >>> + volatile union acc100_info_ring_data *ring_data; >>> + struct acc100_deq_intr_details deq_intr_det; >>> + >>> + ring_data = acc100_dev->info_ring + (acc100_dev->info_ring_head & >>> + ACC100_INFO_RING_MASK); >>> + >>> + while (ring_data->valid) { >>> + >>> + rte_bbdev_log_debug( >>> + "ACC100 VF Interrupt received, Info Ring >> data: 0x%x", >>> + ring_data->val); >>> + >>> + switch (ring_data->int_nb) { >>> + case ACC100_VF_INT_DMA_DL_DESC_IRQ: >>> + case ACC100_VF_INT_DMA_UL_DESC_IRQ: >>> + case ACC100_VF_INT_DMA_UL5G_DESC_IRQ: >>> + case ACC100_VF_INT_DMA_DL5G_DESC_IRQ: >>> + /* VFs are not aware of their vf_id - it's set to 0 in >>> + * queue structures. >>> + */ >>> + ring_data->vf_id = 0; >>> + deq_intr_det.queue_id = >> get_queue_id_from_ring_info( >>> + dev->data, *ring_data); >>> + if (deq_intr_det.queue_id == UINT16_MAX) { >>> + rte_bbdev_log(ERR, >>> + "Couldn't find queue: aq_id: >> %u, qg_id: %u", >>> + ring_data->aq_id, >>> + ring_data->qg_id); >>> + return; >>> + } >>> + rte_bbdev_pmd_callback_process(dev, >>> + RTE_BBDEV_EVENT_DEQUEUE, >> &deq_intr_det); >>> + break; >>> + default: >>> + rte_bbdev_pmd_callback_process(dev, >>> + RTE_BBDEV_EVENT_ERROR, NULL); >>> + break; >>> + } >>> + >>> + /* Initialize Info Ring entry and move forward */ >>> + ring_data->valid = 0; >>> + ++acc100_dev->info_ring_head; >>> + ring_data = acc100_dev->info_ring + (acc100_dev- >>> info_ring_head >>> + & ACC100_INFO_RING_MASK); >>> + } >>> +} >>> + >>> +/* Interrupt handler triggered by ACC100 dev for handling specific >>> +interrupt */ static void acc100_dev_interrupt_handler(void *cb_arg) { >>> + struct rte_bbdev *dev = cb_arg; >>> + struct acc100_device *acc100_dev = dev->data->dev_private; >>> + >>> + /* Read info ring */ >>> + if (acc100_dev->pf_device) >>> + acc100_pf_interrupt_handler(dev); >> combined like .. >> >> acc100_interrupt_handler(dev, is_pf) > unsure it will help readability. 
Much of the code would still be distinct ok > >>> + else >>> + acc100_vf_interrupt_handler(dev); >>> +} >>> + >>> +/* Allocate and setup inforing */ >>> +static int >>> +allocate_inforing(struct rte_bbdev *dev) >> consider renaming >> >> allocate_info_ring > ok > >>> +{ >>> + struct acc100_device *d = dev->data->dev_private; >>> + const struct acc100_registry_addr *reg_addr; >>> + rte_iova_t info_ring_phys; >>> + uint32_t phys_low, phys_high; >>> + >>> + if (d->info_ring != NULL) >>> + return 0; /* Already configured */ >>> + >>> + /* Choose correct registry addresses for the device type */ >>> + if (d->pf_device) >>> + reg_addr = &pf_reg_addr; >>> + else >>> + reg_addr = &vf_reg_addr; >>> + /* Allocate InfoRing */ >>> + d->info_ring = rte_zmalloc_socket("Info Ring", >>> + ACC100_INFO_RING_NUM_ENTRIES * >>> + sizeof(*d->info_ring), RTE_CACHE_LINE_SIZE, >>> + dev->data->socket_id); >>> + if (d->info_ring == NULL) { >>> + rte_bbdev_log(ERR, >>> + "Failed to allocate Info Ring for %s:%u", >>> + dev->device->driver->name, >>> + dev->data->dev_id); >> The callers do not check that this fails. > arguably the error would be self contained if that did fail. But doesn't hurt > to add, ok. 
> >>> + return -ENOMEM; >>> + } >>> + info_ring_phys = rte_malloc_virt2iova(d->info_ring); >>> + >>> + /* Setup Info Ring */ >>> + phys_high = (uint32_t)(info_ring_phys >> 32); >>> + phys_low = (uint32_t)(info_ring_phys); >>> + acc100_reg_write(d, reg_addr->info_ring_hi, phys_high); >>> + acc100_reg_write(d, reg_addr->info_ring_lo, phys_low); >>> + acc100_reg_write(d, reg_addr->info_ring_en, >> ACC100_REG_IRQ_EN_ALL); >>> + d->info_ring_head = (acc100_reg_read(d, reg_addr->info_ring_ptr) & >>> + 0xFFF) / sizeof(union acc100_info_ring_data); >>> + return 0; >>> +} >>> + >>> + >>> /* Allocate 64MB memory used for all software rings */ static int >>> acc100_setup_queues(struct rte_bbdev *dev, uint16_t num_queues, int >>> socket_id) @@ -426,6 +633,7 @@ >>> acc100_reg_write(d, reg_addr->tail_ptrs_dl4g_hi, phys_high); >>> acc100_reg_write(d, reg_addr->tail_ptrs_dl4g_lo, phys_low); >>> >>> + allocate_inforing(dev); >> need to check here >>> d->harq_layout = rte_zmalloc_socket("HARQ Layout", >>> ACC100_HARQ_LAYOUT * sizeof(*d->harq_layout), >>> RTE_CACHE_LINE_SIZE, dev->data->socket_id); @@ - >> 437,13 +645,53 @@ >>> return 0; >>> } >>> >>> +static int >>> +acc100_intr_enable(struct rte_bbdev *dev) { >>> + int ret; >>> + struct acc100_device *d = dev->data->dev_private; >>> + >>> + /* Only MSI are currently supported */ >>> + if (dev->intr_handle->type == RTE_INTR_HANDLE_VFIO_MSI || >>> + dev->intr_handle->type == RTE_INTR_HANDLE_UIO) >> { >>> + >>> + allocate_inforing(dev); >> need to check here >>> + >>> + ret = rte_intr_enable(dev->intr_handle); >>> + if (ret < 0) { >>> + rte_bbdev_log(ERR, >>> + "Couldn't enable interrupts for >> device: %s", >>> + dev->data->name); >>> + rte_free(d->info_ring); >>> + return ret; >>> + } >>> + ret = rte_intr_callback_register(dev->intr_handle, >>> + acc100_dev_interrupt_handler, dev); >>> + if (ret < 0) { >>> + rte_bbdev_log(ERR, >>> + "Couldn't register interrupt callback >> for device: %s", >>> + dev->data->name); >>> + 
rte_free(d->info_ring); >> does intr need to be disabled here ? > Well I don't see a lot of consistency with other drivers. Sometimes these are > not even checked for failure. > I would rather defer changing this to a future patch, if required, as this > is the same code already used in other bbdev drivers (if changed, I would rather > all were changed the same way).
ok. > >>> + return ret; >>> + } >>> + >>> + return 0; >>> + } >>> + >>> + rte_bbdev_log(ERR, "ACC100 (%s) supports only VFIO MSI >> interrupts", >>> + dev->data->name); >>> + return -ENOTSUP; >>> +} >>> + >>> /* Free 64MB memory used for software rings */ static int >>> acc100_dev_close(struct rte_bbdev *dev) { >>> struct acc100_device *d = dev->data->dev_private; >>> + acc100_check_ir(d); >>> if (d->sw_rings_base != NULL) { >>> rte_free(d->tail_ptrs); >>> + rte_free(d->info_ring); >>> rte_free(d->sw_rings_base); >>> d->sw_rings_base = NULL; >>> } >>> @@ -643,6 +891,7 @@ >>> RTE_BBDEV_TURBO_CRC_TYPE_24B >> | >> RTE_BBDEV_TURBO_HALF_ITERATION_EVEN | >> RTE_BBDEV_TURBO_EARLY_TERMINATION | >>> + >> RTE_BBDEV_TURBO_DEC_INTERRUPTS | >> RTE_BBDEV_TURBO_NEG_LLR_1_BIT_IN | >>> RTE_BBDEV_TURBO_MAP_DEC | >>> >> RTE_BBDEV_TURBO_DEC_TB_CRC_24B_KEEP | @@ -663,6 +912,7 >> @@ >> RTE_BBDEV_TURBO_CRC_24B_ATTACH | >> RTE_BBDEV_TURBO_RV_INDEX_BYPASS | >>> RTE_BBDEV_TURBO_RATE_MATCH | >>> + >> RTE_BBDEV_TURBO_ENC_INTERRUPTS | >> RTE_BBDEV_TURBO_ENC_SCATTER_GATHER, >>> .num_buffers_src = >>> >> RTE_BBDEV_TURBO_MAX_CODE_BLOCKS, @@ -676,7 +926,8 @@ >>> .capability_flags = >>> RTE_BBDEV_LDPC_RATE_MATCH | >>> >> RTE_BBDEV_LDPC_CRC_24B_ATTACH | >>> - >> RTE_BBDEV_LDPC_INTERLEAVER_BYPASS, >>> + >> RTE_BBDEV_LDPC_INTERLEAVER_BYPASS | >>> + >> RTE_BBDEV_LDPC_ENC_INTERRUPTS, >>> .num_buffers_src = >>> >> RTE_BBDEV_LDPC_MAX_CODE_BLOCKS, >>> .num_buffers_dst = >>> @@ -701,7 +952,8 @@ >>> RTE_BBDEV_LDPC_DECODE_BYPASS | >>> RTE_BBDEV_LDPC_DEC_SCATTER_GATHER | >>> >> RTE_BBDEV_LDPC_HARQ_6BIT_COMPRESSION | >>> - RTE_BBDEV_LDPC_LLR_COMPRESSION, >>> + RTE_BBDEV_LDPC_LLR_COMPRESSION | >>> + RTE_BBDEV_LDPC_DEC_INTERRUPTS, >>> .llr_size = 8, >>> .llr_decimals = 1, >>> .num_buffers_src = >>> @@ -751,14 +1003,39 @@ >>> #else >>> dev_info->harq_buffer_size = 0; >>> #endif >>> + acc100_check_ir(d); >>> +} >>> + >>> +static int >>> +acc100_queue_intr_enable(struct rte_bbdev *dev, uint16_t queue_id) { >>> + 
struct acc100_queue *q = dev->data- >>> queues[queue_id].queue_private; >>> + >>> + if (dev->intr_handle->type != RTE_INTR_HANDLE_VFIO_MSI && >>> + dev->intr_handle->type != RTE_INTR_HANDLE_UIO) >>> + return -ENOTSUP; >>> + >>> + q->irq_enable = 1; >>> + return 0; >>> +} >>> + >>> +static int >>> +acc100_queue_intr_disable(struct rte_bbdev *dev, uint16_t queue_id) { >>> + struct acc100_queue *q = dev->data- >>> queues[queue_id].queue_private; >>> + q->irq_enable = 0; >> There is an -ENOTSUP check above; a similar check is needed here. > How can this fail when we purely disable? It is for API consistency: if the enable fails but the disable succeeds, that is not consistent. Tom > >>> + return 0; >>> } >>> >>> static const struct rte_bbdev_ops acc100_bbdev_ops = { >>> .setup_queues = acc100_setup_queues, >>> + .intr_enable = acc100_intr_enable, >>> .close = acc100_dev_close, >>> .info_get = acc100_dev_info_get, >>> .queue_setup = acc100_queue_setup, >>> .queue_release = acc100_queue_release, >>> + .queue_intr_enable = acc100_queue_intr_enable, >>> + .queue_intr_disable = acc100_queue_intr_disable >>> }; >>> >>> /* ACC100 PCI PF address map */ >>> @@ -3018,8 +3295,10 @@ >>> ? (1 << RTE_BBDEV_DATA_ERROR) : 0); >>> op->status |= ((rsp.dma_err) ? (1 << RTE_BBDEV_DRV_ERROR) : 0); >>> op->status |= ((rsp.fcw_err) ? 
(1 << RTE_BBDEV_DRV_ERROR) : 0); >>> - if (op->status != 0) >>> + if (op->status != 0) { >>> q_data->queue_stats.dequeue_err_count++; >>> + acc100_check_ir(q->d); >>> + } >>> >>> /* CRC invalid if error exists */ >>> if (!op->status) >>> @@ -3076,6 +3355,9 @@ >>> op->status |= 1 << RTE_BBDEV_SYNDROME_ERROR; >>> op->ldpc_dec.iter_count = (uint8_t) rsp.iter_cnt; >>> >>> + if (op->status & (1 << RTE_BBDEV_DRV_ERROR)) >>> + acc100_check_ir(q->d); >>> + >>> /* Check if this is the last desc in batch (Atomic Queue) */ >>> if (desc->req.last_desc_in_batch) { >>> (*aq_dequeued)++; >>> diff --git a/drivers/baseband/acc100/rte_acc100_pmd.h >>> b/drivers/baseband/acc100/rte_acc100_pmd.h >>> index 78686c1..8980fa5 100644 >>> --- a/drivers/baseband/acc100/rte_acc100_pmd.h >>> +++ b/drivers/baseband/acc100/rte_acc100_pmd.h >>> @@ -559,7 +559,14 @@ struct acc100_device { >>> /* Virtual address of the info memory routed to the this function >> under >>> * operation, whether it is PF or VF. >>> */ >>> + union acc100_info_ring_data *info_ring; >> Need a comment that this array needs a sentinel ? > Can clarify a bit expected HW behaviour > > Thanks > >> Tom >> >>> + >>> union acc100_harq_layout_data *harq_layout; >>> + /* Virtual Info Ring head */ >>> + uint16_t info_ring_head; >>> + /* Number of bytes available for each queue in device, depending >> on >>> + * how many queues are enabled with configure() >>> + */ >>> uint32_t sw_ring_size; >>> uint32_t ddr_size; /* Size in kB */ >>> uint32_t *tail_ptrs; /* Base address of response tail pointer buffer >>> */ @@ -575,4 +582,12 @@ struct acc100_device { >>> bool configured; /**< True if this ACC100 device is configured */ >>> }; >>> >>> +/** >>> + * Structure with details about RTE_BBDEV_EVENT_DEQUEUE event. It's >>> +passed to >>> + * the callback function. >>> + */ >>> +struct acc100_deq_intr_details { >>> + uint16_t queue_id; >>> +}; >>> + >>> #endif /* _RTE_ACC100_PMD_H_ */