[dpdk-dev] [PATCH v9 08/10] baseband/acc100: add interrupt support to PMD
Tom Rix
trix at redhat.com
Thu Oct 1 18:05:18 CEST 2020
On 9/30/20 12:45 PM, Chautru, Nicolas wrote:
> Hi Tom,
>
>> From: Tom Rix <trix at redhat.com>
>> On 9/28/20 5:29 PM, Nicolas Chautru wrote:
>>> Adding capability and functions to support MSI interrupts, call backs
>>> and inforing.
>>>
>>> Signed-off-by: Nicolas Chautru <nicolas.chautru at intel.com>
>>> Acked-by: Liu Tianjiao <Tianjiao.liu at intel.com>
>>> ---
>>> drivers/baseband/acc100/rte_acc100_pmd.c | 288
>>> ++++++++++++++++++++++++++++++-
>>> drivers/baseband/acc100/rte_acc100_pmd.h | 15 ++
>>> 2 files changed, 300 insertions(+), 3 deletions(-)
>>>
>>> diff --git a/drivers/baseband/acc100/rte_acc100_pmd.c
>>> b/drivers/baseband/acc100/rte_acc100_pmd.c
>>> index 7d4c3df..b6d9e7c 100644
>>> --- a/drivers/baseband/acc100/rte_acc100_pmd.c
>>> +++ b/drivers/baseband/acc100/rte_acc100_pmd.c
>>> @@ -339,6 +339,213 @@
>>> free_base_addresses(base_addrs, i);
>>> }
>>>
>>> +/*
>>> + * Find queue_id of a device queue based on details from the Info Ring.
>>> + * If a queue isn't found UINT16_MAX is returned.
>>> + */
>>> +static inline uint16_t
>>> +get_queue_id_from_ring_info(struct rte_bbdev_data *data,
>>> + const union acc100_info_ring_data ring_data) {
>>> + uint16_t queue_id;
>>> +
>>> + for (queue_id = 0; queue_id < data->num_queues; ++queue_id) {
>>> + struct acc100_queue *acc100_q =
>>> + data->queues[queue_id].queue_private;
>>> + if (acc100_q != NULL && acc100_q->aq_id == ring_data.aq_id
>> &&
>>> + acc100_q->qgrp_id == ring_data.qg_id &&
>>> + acc100_q->vf_id == ring_data.vf_id)
>>> + return queue_id;
>> If num_queues is large, this linear search will be slow.
>>
>> Consider changing the search algorithm.
> This is not in the time critical part of the code
ok
>
>
>>> + }
>>> +
>>> + return UINT16_MAX;
>> The interrupt handlers that use this function do not do a great job of
>> handling this error.
> If that error actually happened, then there is not much else that can be done except reporting the unexpected data.
ok
>
>>> +}
>>> +
>>> +/* Checks PF Info Ring to find the interrupt cause and handles it
>>> +accordingly */ static inline void acc100_check_ir(struct
>>> +acc100_device *acc100_dev) {
>>> + volatile union acc100_info_ring_data *ring_data;
>>> + uint16_t info_ring_head = acc100_dev->info_ring_head;
>>> + if (acc100_dev->info_ring == NULL)
>>> + return;
>>> +
>>> + ring_data = acc100_dev->info_ring + (acc100_dev->info_ring_head &
>>> + ACC100_INFO_RING_MASK);
>>> +
>>> + while (ring_data->valid) {
>>> + if ((ring_data->int_nb <
>> ACC100_PF_INT_DMA_DL_DESC_IRQ) || (
>>> + ring_data->int_nb >
>>> + ACC100_PF_INT_DMA_DL5G_DESC_IRQ))
>>> + rte_bbdev_log(WARNING, "InfoRing: ITR:%d
>> Info:0x%x",
>>> + ring_data->int_nb, ring_data-
>>> detailed_info);
>>> + /* Initialize Info Ring entry and move forward */
>>> + ring_data->val = 0;
>>> + info_ring_head++;
>>> + ring_data = acc100_dev->info_ring +
>>> + (info_ring_head &
>> ACC100_INFO_RING_MASK);
>> These three statements are common for the ring handling, consider a macro
>> or inline function.
> ok
>
>>> + }
>>> +}
>>> +
>>> +/* Checks PF Info Ring to find the interrupt cause and handles it
>>> +accordingly */ static inline void acc100_pf_interrupt_handler(struct
>>> +rte_bbdev *dev) {
>>> + struct acc100_device *acc100_dev = dev->data->dev_private;
>>> + volatile union acc100_info_ring_data *ring_data;
>>> + struct acc100_deq_intr_details deq_intr_det;
>>> +
>>> + ring_data = acc100_dev->info_ring + (acc100_dev->info_ring_head &
>>> + ACC100_INFO_RING_MASK);
>>> +
>>> + while (ring_data->valid) {
>>> +
>>> + rte_bbdev_log_debug(
>>> + "ACC100 PF Interrupt received, Info Ring
>> data: 0x%x",
>>> + ring_data->val);
>>> +
>>> + switch (ring_data->int_nb) {
>>> + case ACC100_PF_INT_DMA_DL_DESC_IRQ:
>>> + case ACC100_PF_INT_DMA_UL_DESC_IRQ:
>>> + case ACC100_PF_INT_DMA_UL5G_DESC_IRQ:
>>> + case ACC100_PF_INT_DMA_DL5G_DESC_IRQ:
>>> + deq_intr_det.queue_id =
>> get_queue_id_from_ring_info(
>>> + dev->data, *ring_data);
>>> + if (deq_intr_det.queue_id == UINT16_MAX) {
>>> + rte_bbdev_log(ERR,
>>> + "Couldn't find queue: aq_id:
>> %u, qg_id: %u, vf_id: %u",
>>> + ring_data->aq_id,
>>> + ring_data->qg_id,
>>> + ring_data->vf_id);
>>> + return;
>>> + }
>>> + rte_bbdev_pmd_callback_process(dev,
>>> + RTE_BBDEV_EVENT_DEQUEUE,
>> &deq_intr_det);
>>> + break;
>>> + default:
>>> + rte_bbdev_pmd_callback_process(dev,
>>> + RTE_BBDEV_EVENT_ERROR, NULL);
>>> + break;
>>> + }
>>> +
>>> + /* Initialize Info Ring entry and move forward */
>>> + ring_data->val = 0;
>>> + ++acc100_dev->info_ring_head;
>>> + ring_data = acc100_dev->info_ring +
>>> + (acc100_dev->info_ring_head &
>>> + ACC100_INFO_RING_MASK);
>>> + }
>>> +}
>>> +
>>> +/* Checks VF Info Ring to find the interrupt cause and handles it
>>> +accordingly */ static inline void acc100_vf_interrupt_handler(struct
>>> +rte_bbdev *dev)
>> very similar to pf case, consider combining.
>>> +{
>>> + struct acc100_device *acc100_dev = dev->data->dev_private;
>>> + volatile union acc100_info_ring_data *ring_data;
>>> + struct acc100_deq_intr_details deq_intr_det;
>>> +
>>> + ring_data = acc100_dev->info_ring + (acc100_dev->info_ring_head &
>>> + ACC100_INFO_RING_MASK);
>>> +
>>> + while (ring_data->valid) {
>>> +
>>> + rte_bbdev_log_debug(
>>> + "ACC100 VF Interrupt received, Info Ring
>> data: 0x%x",
>>> + ring_data->val);
>>> +
>>> + switch (ring_data->int_nb) {
>>> + case ACC100_VF_INT_DMA_DL_DESC_IRQ:
>>> + case ACC100_VF_INT_DMA_UL_DESC_IRQ:
>>> + case ACC100_VF_INT_DMA_UL5G_DESC_IRQ:
>>> + case ACC100_VF_INT_DMA_DL5G_DESC_IRQ:
>>> + /* VFs are not aware of their vf_id - it's set to 0 in
>>> + * queue structures.
>>> + */
>>> + ring_data->vf_id = 0;
>>> + deq_intr_det.queue_id =
>> get_queue_id_from_ring_info(
>>> + dev->data, *ring_data);
>>> + if (deq_intr_det.queue_id == UINT16_MAX) {
>>> + rte_bbdev_log(ERR,
>>> + "Couldn't find queue: aq_id:
>> %u, qg_id: %u",
>>> + ring_data->aq_id,
>>> + ring_data->qg_id);
>>> + return;
>>> + }
>>> + rte_bbdev_pmd_callback_process(dev,
>>> + RTE_BBDEV_EVENT_DEQUEUE,
>> &deq_intr_det);
>>> + break;
>>> + default:
>>> + rte_bbdev_pmd_callback_process(dev,
>>> + RTE_BBDEV_EVENT_ERROR, NULL);
>>> + break;
>>> + }
>>> +
>>> + /* Initialize Info Ring entry and move forward */
>>> + ring_data->valid = 0;
>>> + ++acc100_dev->info_ring_head;
>>> + ring_data = acc100_dev->info_ring + (acc100_dev-
>>> info_ring_head
>>> + & ACC100_INFO_RING_MASK);
>>> + }
>>> +}
>>> +
>>> +/* Interrupt handler triggered by ACC100 dev for handling specific
>>> +interrupt */ static void acc100_dev_interrupt_handler(void *cb_arg) {
>>> + struct rte_bbdev *dev = cb_arg;
>>> + struct acc100_device *acc100_dev = dev->data->dev_private;
>>> +
>>> + /* Read info ring */
>>> + if (acc100_dev->pf_device)
>>> + acc100_pf_interrupt_handler(dev);
>> combined like ..
>>
>> acc100_interrupt_handler(dev, is_pf)
> unsure it will help readability. Much of the code would still be distinct
ok
>
>>> + else
>>> + acc100_vf_interrupt_handler(dev);
>>> +}
>>> +
>>> +/* Allocate and setup inforing */
>>> +static int
>>> +allocate_inforing(struct rte_bbdev *dev)
>> consider renaming
>>
>> allocate_info_ring
> ok
>
>>> +{
>>> + struct acc100_device *d = dev->data->dev_private;
>>> + const struct acc100_registry_addr *reg_addr;
>>> + rte_iova_t info_ring_phys;
>>> + uint32_t phys_low, phys_high;
>>> +
>>> + if (d->info_ring != NULL)
>>> + return 0; /* Already configured */
>>> +
>>> + /* Choose correct registry addresses for the device type */
>>> + if (d->pf_device)
>>> + reg_addr = &pf_reg_addr;
>>> + else
>>> + reg_addr = &vf_reg_addr;
>>> + /* Allocate InfoRing */
>>> + d->info_ring = rte_zmalloc_socket("Info Ring",
>>> + ACC100_INFO_RING_NUM_ENTRIES *
>>> + sizeof(*d->info_ring), RTE_CACHE_LINE_SIZE,
>>> + dev->data->socket_id);
>>> + if (d->info_ring == NULL) {
>>> + rte_bbdev_log(ERR,
>>> + "Failed to allocate Info Ring for %s:%u",
>>> + dev->device->driver->name,
>>> + dev->data->dev_id);
>> The callers do not check whether this fails.
> arguably the error would be self contained if that did fail. But doesn't hurt to add, ok.
>
>>> + return -ENOMEM;
>>> + }
>>> + info_ring_phys = rte_malloc_virt2iova(d->info_ring);
>>> +
>>> + /* Setup Info Ring */
>>> + phys_high = (uint32_t)(info_ring_phys >> 32);
>>> + phys_low = (uint32_t)(info_ring_phys);
>>> + acc100_reg_write(d, reg_addr->info_ring_hi, phys_high);
>>> + acc100_reg_write(d, reg_addr->info_ring_lo, phys_low);
>>> + acc100_reg_write(d, reg_addr->info_ring_en,
>> ACC100_REG_IRQ_EN_ALL);
>>> + d->info_ring_head = (acc100_reg_read(d, reg_addr->info_ring_ptr) &
>>> + 0xFFF) / sizeof(union acc100_info_ring_data);
>>> + return 0;
>>> +}
>>> +
>>> +
>>> /* Allocate 64MB memory used for all software rings */ static int
>>> acc100_setup_queues(struct rte_bbdev *dev, uint16_t num_queues, int
>>> socket_id) @@ -426,6 +633,7 @@
>>> acc100_reg_write(d, reg_addr->tail_ptrs_dl4g_hi, phys_high);
>>> acc100_reg_write(d, reg_addr->tail_ptrs_dl4g_lo, phys_low);
>>>
>>> + allocate_inforing(dev);
>> need to check here
>>> d->harq_layout = rte_zmalloc_socket("HARQ Layout",
>>> ACC100_HARQ_LAYOUT * sizeof(*d->harq_layout),
>>> RTE_CACHE_LINE_SIZE, dev->data->socket_id); @@ -
>> 437,13 +645,53 @@
>>> return 0;
>>> }
>>>
>>> +static int
>>> +acc100_intr_enable(struct rte_bbdev *dev) {
>>> + int ret;
>>> + struct acc100_device *d = dev->data->dev_private;
>>> +
>>> + /* Only MSI are currently supported */
>>> + if (dev->intr_handle->type == RTE_INTR_HANDLE_VFIO_MSI ||
>>> + dev->intr_handle->type == RTE_INTR_HANDLE_UIO)
>> {
>>> +
>>> + allocate_inforing(dev);
>> need to check here
>>> +
>>> + ret = rte_intr_enable(dev->intr_handle);
>>> + if (ret < 0) {
>>> + rte_bbdev_log(ERR,
>>> + "Couldn't enable interrupts for
>> device: %s",
>>> + dev->data->name);
>>> + rte_free(d->info_ring);
>>> + return ret;
>>> + }
>>> + ret = rte_intr_callback_register(dev->intr_handle,
>>> + acc100_dev_interrupt_handler, dev);
>>> + if (ret < 0) {
>>> + rte_bbdev_log(ERR,
>>> + "Couldn't register interrupt callback
>> for device: %s",
>>> + dev->data->name);
>>> + rte_free(d->info_ring);
>> does intr need to be disabled here ?
> Well, I don't see a lot of consistency with other drivers. Sometimes these are not even checked for failure.
> I would rather defer this change to a future patch if required, as this same code is already used in other bbdev drivers (if changed, I would rather they were all changed the same way).
ok.
>
>>> + return ret;
>>> + }
>>> +
>>> + return 0;
>>> + }
>>> +
>>> + rte_bbdev_log(ERR, "ACC100 (%s) supports only VFIO MSI
>> interrupts",
>>> + dev->data->name);
>>> + return -ENOTSUP;
>>> +}
>>> +
>>> /* Free 64MB memory used for software rings */ static int
>>> acc100_dev_close(struct rte_bbdev *dev) {
>>> struct acc100_device *d = dev->data->dev_private;
>>> + acc100_check_ir(d);
>>> if (d->sw_rings_base != NULL) {
>>> rte_free(d->tail_ptrs);
>>> + rte_free(d->info_ring);
>>> rte_free(d->sw_rings_base);
>>> d->sw_rings_base = NULL;
>>> }
>>> @@ -643,6 +891,7 @@
>>> RTE_BBDEV_TURBO_CRC_TYPE_24B
>> |
>> RTE_BBDEV_TURBO_HALF_ITERATION_EVEN |
>> RTE_BBDEV_TURBO_EARLY_TERMINATION |
>>> +
>> RTE_BBDEV_TURBO_DEC_INTERRUPTS |
>> RTE_BBDEV_TURBO_NEG_LLR_1_BIT_IN |
>>> RTE_BBDEV_TURBO_MAP_DEC |
>>>
>> RTE_BBDEV_TURBO_DEC_TB_CRC_24B_KEEP | @@ -663,6 +912,7
>> @@
>> RTE_BBDEV_TURBO_CRC_24B_ATTACH |
>> RTE_BBDEV_TURBO_RV_INDEX_BYPASS |
>>> RTE_BBDEV_TURBO_RATE_MATCH |
>>> +
>> RTE_BBDEV_TURBO_ENC_INTERRUPTS |
>> RTE_BBDEV_TURBO_ENC_SCATTER_GATHER,
>>> .num_buffers_src =
>>>
>> RTE_BBDEV_TURBO_MAX_CODE_BLOCKS, @@ -676,7 +926,8 @@
>>> .capability_flags =
>>> RTE_BBDEV_LDPC_RATE_MATCH |
>>>
>> RTE_BBDEV_LDPC_CRC_24B_ATTACH |
>>> -
>> RTE_BBDEV_LDPC_INTERLEAVER_BYPASS,
>>> +
>> RTE_BBDEV_LDPC_INTERLEAVER_BYPASS |
>>> +
>> RTE_BBDEV_LDPC_ENC_INTERRUPTS,
>>> .num_buffers_src =
>>>
>> RTE_BBDEV_LDPC_MAX_CODE_BLOCKS,
>>> .num_buffers_dst =
>>> @@ -701,7 +952,8 @@
>>> RTE_BBDEV_LDPC_DECODE_BYPASS |
>>> RTE_BBDEV_LDPC_DEC_SCATTER_GATHER |
>>>
>> RTE_BBDEV_LDPC_HARQ_6BIT_COMPRESSION |
>>> - RTE_BBDEV_LDPC_LLR_COMPRESSION,
>>> + RTE_BBDEV_LDPC_LLR_COMPRESSION |
>>> + RTE_BBDEV_LDPC_DEC_INTERRUPTS,
>>> .llr_size = 8,
>>> .llr_decimals = 1,
>>> .num_buffers_src =
>>> @@ -751,14 +1003,39 @@
>>> #else
>>> dev_info->harq_buffer_size = 0;
>>> #endif
>>> + acc100_check_ir(d);
>>> +}
>>> +
>>> +static int
>>> +acc100_queue_intr_enable(struct rte_bbdev *dev, uint16_t queue_id) {
>>> + struct acc100_queue *q = dev->data-
>>> queues[queue_id].queue_private;
>>> +
>>> + if (dev->intr_handle->type != RTE_INTR_HANDLE_VFIO_MSI &&
>>> + dev->intr_handle->type != RTE_INTR_HANDLE_UIO)
>>> + return -ENOTSUP;
>>> +
>>> + q->irq_enable = 1;
>>> + return 0;
>>> +}
>>> +
>>> +static int
>>> +acc100_queue_intr_disable(struct rte_bbdev *dev, uint16_t queue_id) {
>>> + struct acc100_queue *q = dev->data-
>>> queues[queue_id].queue_private;
>>> + q->irq_enable = 0;
>> The enable function above can return -ENOTSUP; a similar check is needed here.
> How can this fail when we purely disable?
It is for API consistency.
If the enable fails
but the disable succeeds,
that is not consistent.
Tom
>
>>> + return 0;
>>> }
>>>
>>> static const struct rte_bbdev_ops acc100_bbdev_ops = {
>>> .setup_queues = acc100_setup_queues,
>>> + .intr_enable = acc100_intr_enable,
>>> .close = acc100_dev_close,
>>> .info_get = acc100_dev_info_get,
>>> .queue_setup = acc100_queue_setup,
>>> .queue_release = acc100_queue_release,
>>> + .queue_intr_enable = acc100_queue_intr_enable,
>>> + .queue_intr_disable = acc100_queue_intr_disable
>>> };
>>>
>>> /* ACC100 PCI PF address map */
>>> @@ -3018,8 +3295,10 @@
>>> ? (1 << RTE_BBDEV_DATA_ERROR) : 0);
>>> op->status |= ((rsp.dma_err) ? (1 << RTE_BBDEV_DRV_ERROR) : 0);
>>> op->status |= ((rsp.fcw_err) ? (1 << RTE_BBDEV_DRV_ERROR) : 0);
>>> - if (op->status != 0)
>>> + if (op->status != 0) {
>>> q_data->queue_stats.dequeue_err_count++;
>>> + acc100_check_ir(q->d);
>>> + }
>>>
>>> /* CRC invalid if error exists */
>>> if (!op->status)
>>> @@ -3076,6 +3355,9 @@
>>> op->status |= 1 << RTE_BBDEV_SYNDROME_ERROR;
>>> op->ldpc_dec.iter_count = (uint8_t) rsp.iter_cnt;
>>>
>>> + if (op->status & (1 << RTE_BBDEV_DRV_ERROR))
>>> + acc100_check_ir(q->d);
>>> +
>>> /* Check if this is the last desc in batch (Atomic Queue) */
>>> if (desc->req.last_desc_in_batch) {
>>> (*aq_dequeued)++;
>>> diff --git a/drivers/baseband/acc100/rte_acc100_pmd.h
>>> b/drivers/baseband/acc100/rte_acc100_pmd.h
>>> index 78686c1..8980fa5 100644
>>> --- a/drivers/baseband/acc100/rte_acc100_pmd.h
>>> +++ b/drivers/baseband/acc100/rte_acc100_pmd.h
>>> @@ -559,7 +559,14 @@ struct acc100_device {
>>> /* Virtual address of the info memory routed to the this function
>> under
>>> * operation, whether it is PF or VF.
>>> */
>>> + union acc100_info_ring_data *info_ring;
>> Need a comment that this array needs a sentinel ?
> I can clarify the expected HW behaviour a bit.
>
> Thanks
>
>> Tom
>>
>>> +
>>> union acc100_harq_layout_data *harq_layout;
>>> + /* Virtual Info Ring head */
>>> + uint16_t info_ring_head;
>>> + /* Number of bytes available for each queue in device, depending
>> on
>>> + * how many queues are enabled with configure()
>>> + */
>>> uint32_t sw_ring_size;
>>> uint32_t ddr_size; /* Size in kB */
>>> uint32_t *tail_ptrs; /* Base address of response tail pointer buffer
>>> */ @@ -575,4 +582,12 @@ struct acc100_device {
>>> bool configured; /**< True if this ACC100 device is configured */
>>> };
>>>
>>> +/**
>>> + * Structure with details about RTE_BBDEV_EVENT_DEQUEUE event. It's
>>> +passed to
>>> + * the callback function.
>>> + */
>>> +struct acc100_deq_intr_details {
>>> + uint16_t queue_id;
>>> +};
>>> +
>>> #endif /* _RTE_ACC100_PMD_H_ */
More information about the dev
mailing list