Hi Tom, > From: Tom Rix <t...@redhat.com> > On 9/30/20 12:45 PM, Chautru, Nicolas wrote: > > Hi Tom, > > > >> From: Tom Rix <t...@redhat.com> > >> On 9/28/20 5:29 PM, Nicolas Chautru wrote: > >>> Adding capability and functions to support MSI interrupts, call > >>> backs and inforing. > >>> > >>> Signed-off-by: Nicolas Chautru <nicolas.chau...@intel.com> > >>> Acked-by: Liu Tianjiao <tianjiao....@intel.com> > >>> --- > >>> drivers/baseband/acc100/rte_acc100_pmd.c | 288 > >>> ++++++++++++++++++++++++++++++- > >>> drivers/baseband/acc100/rte_acc100_pmd.h | 15 ++ > >>> 2 files changed, 300 insertions(+), 3 deletions(-) > >>> > >>> diff --git a/drivers/baseband/acc100/rte_acc100_pmd.c > >>> b/drivers/baseband/acc100/rte_acc100_pmd.c > >>> index 7d4c3df..b6d9e7c 100644 > >>> --- a/drivers/baseband/acc100/rte_acc100_pmd.c > >>> +++ b/drivers/baseband/acc100/rte_acc100_pmd.c > >>> @@ -339,6 +339,213 @@ > >>> free_base_addresses(base_addrs, i); } > >>> > >>> +/* > >>> + * Find queue_id of a device queue based on details from the Info Ring. > >>> + * If a queue isn't found UINT16_MAX is returned. > >>> + */ > >>> +static inline uint16_t > >>> +get_queue_id_from_ring_info(struct rte_bbdev_data *data, > >>> + const union acc100_info_ring_data ring_data) { > >>> + uint16_t queue_id; > >>> + > >>> + for (queue_id = 0; queue_id < data->num_queues; ++queue_id) { > >>> + struct acc100_queue *acc100_q = > >>> + data->queues[queue_id].queue_private; > >>> + if (acc100_q != NULL && acc100_q->aq_id == ring_data.aq_id > >> && > >>> + acc100_q->qgrp_id == ring_data.qg_id && > >>> + acc100_q->vf_id == ring_data.vf_id) > >>> + return queue_id; > >> If num_queues is large, this linear search will be slow. > >> > >> Consider changing the search algorithm. > > This is not in the time critical part of the code > ok > > > > > >>> + } > >>> + > >>> + return UINT16_MAX; > >> the interrupt handlers that use this function do not a great job of > >> handling this error. > > if that error actualy happened then there is not much else that can be > done except reporting the unexpected data. > ok > > > >>> +} > >>> + > >>> +/* Checks PF Info Ring to find the interrupt cause and handles it > >>> +accordingly */ static inline void acc100_check_ir(struct > >>> +acc100_device *acc100_dev) { > >>> + volatile union acc100_info_ring_data *ring_data; > >>> + uint16_t info_ring_head = acc100_dev->info_ring_head; > >>> + if (acc100_dev->info_ring == NULL) > >>> + return; > >>> + > >>> + ring_data = acc100_dev->info_ring + (acc100_dev->info_ring_head & > >>> + ACC100_INFO_RING_MASK); > >>> + > >>> + while (ring_data->valid) { > >>> + if ((ring_data->int_nb < > >> ACC100_PF_INT_DMA_DL_DESC_IRQ) || ( > >>> + ring_data->int_nb > > >>> + ACC100_PF_INT_DMA_DL5G_DESC_IRQ)) > >>> + rte_bbdev_log(WARNING, "InfoRing: ITR:%d > >> Info:0x%x", > >>> + ring_data->int_nb, ring_data- > >>> detailed_info); > >>> + /* Initialize Info Ring entry and move forward */ > >>> + ring_data->val = 0; > >>> + info_ring_head++; > >>> + ring_data = acc100_dev->info_ring + > >>> + (info_ring_head & > >> ACC100_INFO_RING_MASK); > >> These three statements are common for the ring handling, consider a > >> macro or inline function. > > ok > > > >>> + } > >>> +} > >>> + > >>> +/* Checks PF Info Ring to find the interrupt cause and handles it > >>> +accordingly */ static inline void > >>> +acc100_pf_interrupt_handler(struct > >>> +rte_bbdev *dev) { > >>> + struct acc100_device *acc100_dev = dev->data->dev_private; > >>> + volatile union acc100_info_ring_data *ring_data; > >>> + struct acc100_deq_intr_details deq_intr_det; > >>> + > >>> + ring_data = acc100_dev->info_ring + (acc100_dev->info_ring_head & > >>> + ACC100_INFO_RING_MASK); > >>> + > >>> + while (ring_data->valid) { > >>> + > >>> + rte_bbdev_log_debug( > >>> + "ACC100 PF Interrupt received, Info Ring > >> data: 0x%x", > >>> + ring_data->val); > >>> + > >>> + switch (ring_data->int_nb) { > >>> + case ACC100_PF_INT_DMA_DL_DESC_IRQ: > >>> + case ACC100_PF_INT_DMA_UL_DESC_IRQ: > >>> + case ACC100_PF_INT_DMA_UL5G_DESC_IRQ: > >>> + case ACC100_PF_INT_DMA_DL5G_DESC_IRQ: > >>> + deq_intr_det.queue_id = > >> get_queue_id_from_ring_info( > >>> + dev->data, *ring_data); > >>> + if (deq_intr_det.queue_id == UINT16_MAX) { > >>> + rte_bbdev_log(ERR, > >>> + "Couldn't find queue: aq_id: > >> %u, qg_id: %u, vf_id: %u", > >>> + ring_data->aq_id, > >>> + ring_data->qg_id, > >>> + ring_data->vf_id); > >>> + return; > >>> + } > >>> + rte_bbdev_pmd_callback_process(dev, > >>> + RTE_BBDEV_EVENT_DEQUEUE, > >> &deq_intr_det); > >>> + break; > >>> + default: > >>> + rte_bbdev_pmd_callback_process(dev, > >>> + RTE_BBDEV_EVENT_ERROR, NULL); > >>> + break; > >>> + } > >>> + > >>> + /* Initialize Info Ring entry and move forward */ > >>> + ring_data->val = 0; > >>> + ++acc100_dev->info_ring_head; > >>> + ring_data = acc100_dev->info_ring + > >>> + (acc100_dev->info_ring_head & > >>> + ACC100_INFO_RING_MASK); > >>> + } > >>> +} > >>> + > >>> +/* Checks VF Info Ring to find the interrupt cause and handles it > >>> +accordingly */ static inline void > >>> +acc100_vf_interrupt_handler(struct > >>> +rte_bbdev *dev) > >> very similar to pf case, consider combining. > >>> +{ > >>> + struct acc100_device *acc100_dev = dev->data->dev_private; > >>> + volatile union acc100_info_ring_data *ring_data; > >>> + struct acc100_deq_intr_details deq_intr_det; > >>> + > >>> + ring_data = acc100_dev->info_ring + (acc100_dev->info_ring_head & > >>> + ACC100_INFO_RING_MASK); > >>> + > >>> + while (ring_data->valid) { > >>> + > >>> + rte_bbdev_log_debug( > >>> + "ACC100 VF Interrupt received, Info Ring > >> data: 0x%x", > >>> + ring_data->val); > >>> + > >>> + switch (ring_data->int_nb) { > >>> + case ACC100_VF_INT_DMA_DL_DESC_IRQ: > >>> + case ACC100_VF_INT_DMA_UL_DESC_IRQ: > >>> + case ACC100_VF_INT_DMA_UL5G_DESC_IRQ: > >>> + case ACC100_VF_INT_DMA_DL5G_DESC_IRQ: > >>> + /* VFs are not aware of their vf_id - it's set to 0 in > >>> + * queue structures. > >>> + */ > >>> + ring_data->vf_id = 0; > >>> + deq_intr_det.queue_id = > >> get_queue_id_from_ring_info( > >>> + dev->data, *ring_data); > >>> + if (deq_intr_det.queue_id == UINT16_MAX) { > >>> + rte_bbdev_log(ERR, > >>> + "Couldn't find queue: aq_id: > >> %u, qg_id: %u", > >>> + ring_data->aq_id, > >>> + ring_data->qg_id); > >>> + return; > >>> + } > >>> + rte_bbdev_pmd_callback_process(dev, > >>> + RTE_BBDEV_EVENT_DEQUEUE, > >> &deq_intr_det); > >>> + break; > >>> + default: > >>> + rte_bbdev_pmd_callback_process(dev, > >>> + RTE_BBDEV_EVENT_ERROR, NULL); > >>> + break; > >>> + } > >>> + > >>> + /* Initialize Info Ring entry and move forward */ > >>> + ring_data->valid = 0; > >>> + ++acc100_dev->info_ring_head; > >>> + ring_data = acc100_dev->info_ring + (acc100_dev- > >>> info_ring_head > >>> + & ACC100_INFO_RING_MASK); > >>> + } > >>> +} > >>> + > >>> +/* Interrupt handler triggered by ACC100 dev for handling specific > >>> +interrupt */ static void acc100_dev_interrupt_handler(void *cb_arg) { > >>> + struct rte_bbdev *dev = cb_arg; > >>> + struct acc100_device *acc100_dev = dev->data->dev_private; > >>> + > >>> + /* Read info ring */ > >>> + if (acc100_dev->pf_device) > >>> + acc100_pf_interrupt_handler(dev); > >> combined like .. > >> > >> acc100_interrupt_handler(dev, is_pf) > > unsure it will help readability. Much of the code would still be > > distinct > ok > > > >>> + else > >>> + acc100_vf_interrupt_handler(dev); } > >>> + > >>> +/* Allocate and setup inforing */ > >>> +static int > >>> +allocate_inforing(struct rte_bbdev *dev) > >> consider renaming > >> > >> allocate_info_ring > > ok > > > >>> +{ > >>> + struct acc100_device *d = dev->data->dev_private; > >>> + const struct acc100_registry_addr *reg_addr; > >>> + rte_iova_t info_ring_phys; > >>> + uint32_t phys_low, phys_high; > >>> + > >>> + if (d->info_ring != NULL) > >>> + return 0; /* Already configured */ > >>> + > >>> + /* Choose correct registry addresses for the device type */ > >>> + if (d->pf_device) > >>> + reg_addr = &pf_reg_addr; > >>> + else > >>> + reg_addr = &vf_reg_addr; > >>> + /* Allocate InfoRing */ > >>> + d->info_ring = rte_zmalloc_socket("Info Ring", > >>> + ACC100_INFO_RING_NUM_ENTRIES * > >>> + sizeof(*d->info_ring), RTE_CACHE_LINE_SIZE, > >>> + dev->data->socket_id); > >>> + if (d->info_ring == NULL) { > >>> + rte_bbdev_log(ERR, > >>> + "Failed to allocate Info Ring for %s:%u", > >>> + dev->device->driver->name, > >>> + dev->data->dev_id); > >> The callers do not check that this fails. > > arguably the error would be self contained if that did fail. But doesn't > > hurt > to add, ok. > > > >>> + return -ENOMEM; > >>> + } > >>> + info_ring_phys = rte_malloc_virt2iova(d->info_ring); > >>> + > >>> + /* Setup Info Ring */ > >>> + phys_high = (uint32_t)(info_ring_phys >> 32); > >>> + phys_low = (uint32_t)(info_ring_phys); > >>> + acc100_reg_write(d, reg_addr->info_ring_hi, phys_high); > >>> + acc100_reg_write(d, reg_addr->info_ring_lo, phys_low); > >>> + acc100_reg_write(d, reg_addr->info_ring_en, > >> ACC100_REG_IRQ_EN_ALL); > >>> + d->info_ring_head = (acc100_reg_read(d, reg_addr->info_ring_ptr) & > >>> + 0xFFF) / sizeof(union acc100_info_ring_data); > >>> + return 0; > >>> +} > >>> + > >>> + > >>> /* Allocate 64MB memory used for all software rings */ static int > >>> acc100_setup_queues(struct rte_bbdev *dev, uint16_t num_queues, int > >>> socket_id) @@ -426,6 +633,7 @@ > >>> acc100_reg_write(d, reg_addr->tail_ptrs_dl4g_hi, phys_high); > >>> acc100_reg_write(d, reg_addr->tail_ptrs_dl4g_lo, phys_low); > >>> > >>> + allocate_inforing(dev); > >> need to check here > >>> d->harq_layout = rte_zmalloc_socket("HARQ Layout", > >>> ACC100_HARQ_LAYOUT * sizeof(*d->harq_layout), > >>> RTE_CACHE_LINE_SIZE, dev->data->socket_id); @@ - > >> 437,13 +645,53 @@ > >>> return 0; > >>> } > >>> > >>> +static int > >>> +acc100_intr_enable(struct rte_bbdev *dev) { > >>> + int ret; > >>> + struct acc100_device *d = dev->data->dev_private; > >>> + > >>> + /* Only MSI are currently supported */ > >>> + if (dev->intr_handle->type == RTE_INTR_HANDLE_VFIO_MSI || > >>> + dev->intr_handle->type == RTE_INTR_HANDLE_UIO) > >> { > >>> + > >>> + allocate_inforing(dev); > >> need to check here > >>> + > >>> + ret = rte_intr_enable(dev->intr_handle); > >>> + if (ret < 0) { > >>> + rte_bbdev_log(ERR, > >>> + "Couldn't enable interrupts for > >> device: %s", > >>> + dev->data->name); > >>> + rte_free(d->info_ring); > >>> + return ret; > >>> + } > >>> + ret = rte_intr_callback_register(dev->intr_handle, > >>> + acc100_dev_interrupt_handler, dev); > >>> + if (ret < 0) { > >>> + rte_bbdev_log(ERR, > >>> + "Couldn't register interrupt callback > >> for device: %s", > >>> + dev->data->name); > >>> + rte_free(d->info_ring); > >> does intr need to be disabled here ? > > Well I don't see a lot of consistency with other drivers. Sometimes these > are not even check for failure. > > I would rather defer changing through other future patch if required as this > is same code on other bbdev drivers already used (if changed I would rather > all changed the same way). > > ok. > > > > > >>> + return ret; > >>> + } > >>> + > >>> + return 0; > >>> + } > >>> + > >>> + rte_bbdev_log(ERR, "ACC100 (%s) supports only VFIO MSI > >> interrupts", > >>> + dev->data->name); > >>> + return -ENOTSUP; > >>> +} > >>> + > >>> /* Free 64MB memory used for software rings */ static int > >>> acc100_dev_close(struct rte_bbdev *dev) { > >>> struct acc100_device *d = dev->data->dev_private; > >>> + acc100_check_ir(d); > >>> if (d->sw_rings_base != NULL) { > >>> rte_free(d->tail_ptrs); > >>> + rte_free(d->info_ring); > >>> rte_free(d->sw_rings_base); > >>> d->sw_rings_base = NULL; > >>> } > >>> @@ -643,6 +891,7 @@ > >>> RTE_BBDEV_TURBO_CRC_TYPE_24B > >> | > >> RTE_BBDEV_TURBO_HALF_ITERATION_EVEN | > >> RTE_BBDEV_TURBO_EARLY_TERMINATION | > >>> + > >> RTE_BBDEV_TURBO_DEC_INTERRUPTS | > >> RTE_BBDEV_TURBO_NEG_LLR_1_BIT_IN | > >>> RTE_BBDEV_TURBO_MAP_DEC | > >>> > >> RTE_BBDEV_TURBO_DEC_TB_CRC_24B_KEEP | @@ -663,6 +912,7 > @@ > >> RTE_BBDEV_TURBO_CRC_24B_ATTACH | > >> RTE_BBDEV_TURBO_RV_INDEX_BYPASS | > >>> RTE_BBDEV_TURBO_RATE_MATCH | > >>> + > >> RTE_BBDEV_TURBO_ENC_INTERRUPTS | > >> RTE_BBDEV_TURBO_ENC_SCATTER_GATHER, > >>> .num_buffers_src = > >>> > >> RTE_BBDEV_TURBO_MAX_CODE_BLOCKS, @@ -676,7 +926,8 @@ > >>> .capability_flags = > >>> RTE_BBDEV_LDPC_RATE_MATCH | > >>> > >> RTE_BBDEV_LDPC_CRC_24B_ATTACH | > >>> - > >> RTE_BBDEV_LDPC_INTERLEAVER_BYPASS, > >>> + > >> RTE_BBDEV_LDPC_INTERLEAVER_BYPASS | > >>> + > >> RTE_BBDEV_LDPC_ENC_INTERRUPTS, > >>> .num_buffers_src = > >>> > >> RTE_BBDEV_LDPC_MAX_CODE_BLOCKS, > >>> .num_buffers_dst = > >>> @@ -701,7 +952,8 @@ > >>> RTE_BBDEV_LDPC_DECODE_BYPASS | > >>> RTE_BBDEV_LDPC_DEC_SCATTER_GATHER | > >>> > >> RTE_BBDEV_LDPC_HARQ_6BIT_COMPRESSION | > >>> - RTE_BBDEV_LDPC_LLR_COMPRESSION, > >>> + RTE_BBDEV_LDPC_LLR_COMPRESSION | > >>> + RTE_BBDEV_LDPC_DEC_INTERRUPTS, > >>> .llr_size = 8, > >>> .llr_decimals = 1, > >>> .num_buffers_src = > >>> @@ -751,14 +1003,39 @@ > >>> #else > >>> dev_info->harq_buffer_size = 0; > >>> #endif > >>> + acc100_check_ir(d); > >>> +} > >>> + > >>> +static int > >>> +acc100_queue_intr_enable(struct rte_bbdev *dev, uint16_t queue_id) > { > >>> + struct acc100_queue *q = dev->data- > >>> queues[queue_id].queue_private; > >>> + > >>> + if (dev->intr_handle->type != RTE_INTR_HANDLE_VFIO_MSI && > >>> + dev->intr_handle->type != RTE_INTR_HANDLE_UIO) > >>> + return -ENOTSUP; > >>> + > >>> + q->irq_enable = 1; > >>> + return 0; > >>> +} > >>> + > >>> +static int > >>> +acc100_queue_intr_disable(struct rte_bbdev *dev, uint16_t queue_id) > { > >>> + struct acc100_queue *q = dev->data- > >>> queues[queue_id].queue_private; > >>> + q->irq_enable = 0; > >> A -ENOTSUP above, should need similar check here. > > How can this fail when we purely disable? > > It is for api consistency. > > the enable fails > > the disable succeeds > > that is not consistent. >
OK can do. Thanks > Tom > > > > >>> + return 0; > >>> } > >>> > >>> static const struct rte_bbdev_ops acc100_bbdev_ops = { > >>> .setup_queues = acc100_setup_queues, > >>> + .intr_enable = acc100_intr_enable, > >>> .close = acc100_dev_close, > >>> .info_get = acc100_dev_info_get, > >>> .queue_setup = acc100_queue_setup, > >>> .queue_release = acc100_queue_release, > >>> + .queue_intr_enable = acc100_queue_intr_enable, > >>> + .queue_intr_disable = acc100_queue_intr_disable > >>> }; > >>> > >>> /* ACC100 PCI PF address map */ > >>> @@ -3018,8 +3295,10 @@ > >>> ? (1 << RTE_BBDEV_DATA_ERROR) : 0); > >>> op->status |= ((rsp.dma_err) ? (1 << RTE_BBDEV_DRV_ERROR) : 0); > >>> op->status |= ((rsp.fcw_err) ? (1 << RTE_BBDEV_DRV_ERROR) : 0); > >>> - if (op->status != 0) > >>> + if (op->status != 0) { > >>> q_data->queue_stats.dequeue_err_count++; > >>> + acc100_check_ir(q->d); > >>> + } > >>> > >>> /* CRC invalid if error exists */ > >>> if (!op->status) > >>> @@ -3076,6 +3355,9 @@ > >>> op->status |= 1 << RTE_BBDEV_SYNDROME_ERROR; > >>> op->ldpc_dec.iter_count = (uint8_t) rsp.iter_cnt; > >>> > >>> + if (op->status & (1 << RTE_BBDEV_DRV_ERROR)) > >>> + acc100_check_ir(q->d); > >>> + > >>> /* Check if this is the last desc in batch (Atomic Queue) */ > >>> if (desc->req.last_desc_in_batch) { > >>> (*aq_dequeued)++; > >>> diff --git a/drivers/baseband/acc100/rte_acc100_pmd.h > >>> b/drivers/baseband/acc100/rte_acc100_pmd.h > >>> index 78686c1..8980fa5 100644 > >>> --- a/drivers/baseband/acc100/rte_acc100_pmd.h > >>> +++ b/drivers/baseband/acc100/rte_acc100_pmd.h > >>> @@ -559,7 +559,14 @@ struct acc100_device { > >>> /* Virtual address of the info memory routed to the this function > >> under > >>> * operation, whether it is PF or VF. > >>> */ > >>> + union acc100_info_ring_data *info_ring; > >> Need a comment that this array needs a sentinel ? > > Can clarify a bit expected HW behaviour > > > > Thanks > > > >> Tom > >> > >>> + > >>> union acc100_harq_layout_data *harq_layout; > >>> + /* Virtual Info Ring head */ > >>> + uint16_t info_ring_head; > >>> + /* Number of bytes available for each queue in device, depending > >> on > >>> + * how many queues are enabled with configure() > >>> + */ > >>> uint32_t sw_ring_size; > >>> uint32_t ddr_size; /* Size in kB */ > >>> uint32_t *tail_ptrs; /* Base address of response tail pointer > >>> buffer */ @@ -575,4 +582,12 @@ struct acc100_device { > >>> bool configured; /**< True if this ACC100 device is configured */ > >>> }; > >>> > >>> +/** > >>> + * Structure with details about RTE_BBDEV_EVENT_DEQUEUE event. > It's > >>> +passed to > >>> + * the callback function. > >>> + */ > >>> +struct acc100_deq_intr_details { > >>> + uint16_t queue_id; > >>> +}; > >>> + > >>> #endif /* _RTE_ACC100_PMD_H_ */