[dpdk-dev] [PATCH v9 08/10] baseband/acc100: add interrupt support to PMD

Tom Rix trix at redhat.com
Thu Oct 1 18:05:18 CEST 2020


On 9/30/20 12:45 PM, Chautru, Nicolas wrote:
> Hi Tom, 
>
>> From: Tom Rix <trix at redhat.com>
>> On 9/28/20 5:29 PM, Nicolas Chautru wrote:
>>> Adding capability and functions to support MSI interrupts, callbacks
>>> and the Info Ring.
>>>
>>> Signed-off-by: Nicolas Chautru <nicolas.chautru at intel.com>
>>> Acked-by: Liu Tianjiao <Tianjiao.liu at intel.com>
>>> ---
>>>  drivers/baseband/acc100/rte_acc100_pmd.c | 288
>>> ++++++++++++++++++++++++++++++-
>>> drivers/baseband/acc100/rte_acc100_pmd.h |  15 ++
>>>  2 files changed, 300 insertions(+), 3 deletions(-)
>>>
>>> diff --git a/drivers/baseband/acc100/rte_acc100_pmd.c
>>> b/drivers/baseband/acc100/rte_acc100_pmd.c
>>> index 7d4c3df..b6d9e7c 100644
>>> --- a/drivers/baseband/acc100/rte_acc100_pmd.c
>>> +++ b/drivers/baseband/acc100/rte_acc100_pmd.c
>>> @@ -339,6 +339,213 @@
>>>  	free_base_addresses(base_addrs, i);
>>>  }
>>>
>>> +/*
>>> + * Find queue_id of a device queue based on details from the Info Ring.
>>> + * If a queue isn't found UINT16_MAX is returned.
>>> + */
>>> +static inline uint16_t
>>> +get_queue_id_from_ring_info(struct rte_bbdev_data *data,
>>> +		const union acc100_info_ring_data ring_data) {
>>> +	uint16_t queue_id;
>>> +
>>> +	for (queue_id = 0; queue_id < data->num_queues; ++queue_id) {
>>> +		struct acc100_queue *acc100_q =
>>> +				data->queues[queue_id].queue_private;
>>> +		if (acc100_q != NULL && acc100_q->aq_id == ring_data.aq_id
>> &&
>>> +				acc100_q->qgrp_id == ring_data.qg_id &&
>>> +				acc100_q->vf_id == ring_data.vf_id)
>>> +			return queue_id;
>> If num_queues is large, this linear search will be slow.
>>
>> Consider changing the search algorithm.
> This is not in the time critical part of the code
ok
>
>
>>> +	}
>>> +
>>> +	return UINT16_MAX;
>> The interrupt handlers that use this function do not do a great job of
>> handling this error.
> If that error actually happened, then there is not much else that can be done except reporting the unexpected data.
ok
>
>>> +}
>>> +
>>> +/* Checks PF Info Ring to find the interrupt cause and handles it
>>> +accordingly */ static inline void acc100_check_ir(struct
>>> +acc100_device *acc100_dev) {
>>> +	volatile union acc100_info_ring_data *ring_data;
>>> +	uint16_t info_ring_head = acc100_dev->info_ring_head;
>>> +	if (acc100_dev->info_ring == NULL)
>>> +		return;
>>> +
>>> +	ring_data = acc100_dev->info_ring + (acc100_dev->info_ring_head &
>>> +			ACC100_INFO_RING_MASK);
>>> +
>>> +	while (ring_data->valid) {
>>> +		if ((ring_data->int_nb <
>> ACC100_PF_INT_DMA_DL_DESC_IRQ) || (
>>> +				ring_data->int_nb >
>>> +				ACC100_PF_INT_DMA_DL5G_DESC_IRQ))
>>> +			rte_bbdev_log(WARNING, "InfoRing: ITR:%d
>> Info:0x%x",
>>> +				ring_data->int_nb, ring_data-
>>> detailed_info);
>>> +		/* Initialize Info Ring entry and move forward */
>>> +		ring_data->val = 0;
>>> +		info_ring_head++;
>>> +		ring_data = acc100_dev->info_ring +
>>> +				(info_ring_head &
>> ACC100_INFO_RING_MASK);
>> These three statements are common for the ring handling, consider a macro
>> or inline function.
> ok
>
>>> +	}
>>> +}
>>> +
>>> +/* Checks PF Info Ring to find the interrupt cause and handles it
>>> +accordingly */ static inline void acc100_pf_interrupt_handler(struct
>>> +rte_bbdev *dev) {
>>> +	struct acc100_device *acc100_dev = dev->data->dev_private;
>>> +	volatile union acc100_info_ring_data *ring_data;
>>> +	struct acc100_deq_intr_details deq_intr_det;
>>> +
>>> +	ring_data = acc100_dev->info_ring + (acc100_dev->info_ring_head &
>>> +			ACC100_INFO_RING_MASK);
>>> +
>>> +	while (ring_data->valid) {
>>> +
>>> +		rte_bbdev_log_debug(
>>> +				"ACC100 PF Interrupt received, Info Ring
>> data: 0x%x",
>>> +				ring_data->val);
>>> +
>>> +		switch (ring_data->int_nb) {
>>> +		case ACC100_PF_INT_DMA_DL_DESC_IRQ:
>>> +		case ACC100_PF_INT_DMA_UL_DESC_IRQ:
>>> +		case ACC100_PF_INT_DMA_UL5G_DESC_IRQ:
>>> +		case ACC100_PF_INT_DMA_DL5G_DESC_IRQ:
>>> +			deq_intr_det.queue_id =
>> get_queue_id_from_ring_info(
>>> +					dev->data, *ring_data);
>>> +			if (deq_intr_det.queue_id == UINT16_MAX) {
>>> +				rte_bbdev_log(ERR,
>>> +						"Couldn't find queue: aq_id:
>> %u, qg_id: %u, vf_id: %u",
>>> +						ring_data->aq_id,
>>> +						ring_data->qg_id,
>>> +						ring_data->vf_id);
>>> +				return;
>>> +			}
>>> +			rte_bbdev_pmd_callback_process(dev,
>>> +					RTE_BBDEV_EVENT_DEQUEUE,
>> &deq_intr_det);
>>> +			break;
>>> +		default:
>>> +			rte_bbdev_pmd_callback_process(dev,
>>> +					RTE_BBDEV_EVENT_ERROR, NULL);
>>> +			break;
>>> +		}
>>> +
>>> +		/* Initialize Info Ring entry and move forward */
>>> +		ring_data->val = 0;
>>> +		++acc100_dev->info_ring_head;
>>> +		ring_data = acc100_dev->info_ring +
>>> +				(acc100_dev->info_ring_head &
>>> +				ACC100_INFO_RING_MASK);
>>> +	}
>>> +}
>>> +
>>> +/* Checks VF Info Ring to find the interrupt cause and handles it
>>> +accordingly */ static inline void acc100_vf_interrupt_handler(struct
>>> +rte_bbdev *dev)
>> very similar to pf case, consider combining.
>>> +{
>>> +	struct acc100_device *acc100_dev = dev->data->dev_private;
>>> +	volatile union acc100_info_ring_data *ring_data;
>>> +	struct acc100_deq_intr_details deq_intr_det;
>>> +
>>> +	ring_data = acc100_dev->info_ring + (acc100_dev->info_ring_head &
>>> +			ACC100_INFO_RING_MASK);
>>> +
>>> +	while (ring_data->valid) {
>>> +
>>> +		rte_bbdev_log_debug(
>>> +				"ACC100 VF Interrupt received, Info Ring
>> data: 0x%x",
>>> +				ring_data->val);
>>> +
>>> +		switch (ring_data->int_nb) {
>>> +		case ACC100_VF_INT_DMA_DL_DESC_IRQ:
>>> +		case ACC100_VF_INT_DMA_UL_DESC_IRQ:
>>> +		case ACC100_VF_INT_DMA_UL5G_DESC_IRQ:
>>> +		case ACC100_VF_INT_DMA_DL5G_DESC_IRQ:
>>> +			/* VFs are not aware of their vf_id - it's set to 0 in
>>> +			 * queue structures.
>>> +			 */
>>> +			ring_data->vf_id = 0;
>>> +			deq_intr_det.queue_id =
>> get_queue_id_from_ring_info(
>>> +					dev->data, *ring_data);
>>> +			if (deq_intr_det.queue_id == UINT16_MAX) {
>>> +				rte_bbdev_log(ERR,
>>> +						"Couldn't find queue: aq_id:
>> %u, qg_id: %u",
>>> +						ring_data->aq_id,
>>> +						ring_data->qg_id);
>>> +				return;
>>> +			}
>>> +			rte_bbdev_pmd_callback_process(dev,
>>> +					RTE_BBDEV_EVENT_DEQUEUE,
>> &deq_intr_det);
>>> +			break;
>>> +		default:
>>> +			rte_bbdev_pmd_callback_process(dev,
>>> +					RTE_BBDEV_EVENT_ERROR, NULL);
>>> +			break;
>>> +		}
>>> +
>>> +		/* Initialize Info Ring entry and move forward */
>>> +		ring_data->valid = 0;
>>> +		++acc100_dev->info_ring_head;
>>> +		ring_data = acc100_dev->info_ring + (acc100_dev-
>>> info_ring_head
>>> +				& ACC100_INFO_RING_MASK);
>>> +	}
>>> +}
>>> +
>>> +/* Interrupt handler triggered by ACC100 dev for handling specific
>>> +interrupt */ static void acc100_dev_interrupt_handler(void *cb_arg) {
>>> +	struct rte_bbdev *dev = cb_arg;
>>> +	struct acc100_device *acc100_dev = dev->data->dev_private;
>>> +
>>> +	/* Read info ring */
>>> +	if (acc100_dev->pf_device)
>>> +		acc100_pf_interrupt_handler(dev);
>> combined like ..
>>
>> acc100_interrupt_handler(dev, is_pf)
> unsure it will help readability. Much of the code would still be distinct
ok
>
>>> +	else
>>> +		acc100_vf_interrupt_handler(dev);
>>> +}
>>> +
>>> +/* Allocate and setup inforing */
>>> +static int
>>> +allocate_inforing(struct rte_bbdev *dev)
>> consider renaming
>>
>> allocate_info_ring
> ok
>
>>> +{
>>> +	struct acc100_device *d = dev->data->dev_private;
>>> +	const struct acc100_registry_addr *reg_addr;
>>> +	rte_iova_t info_ring_phys;
>>> +	uint32_t phys_low, phys_high;
>>> +
>>> +	if (d->info_ring != NULL)
>>> +		return 0; /* Already configured */
>>> +
>>> +	/* Choose correct registry addresses for the device type */
>>> +	if (d->pf_device)
>>> +		reg_addr = &pf_reg_addr;
>>> +	else
>>> +		reg_addr = &vf_reg_addr;
>>> +	/* Allocate InfoRing */
>>> +	d->info_ring = rte_zmalloc_socket("Info Ring",
>>> +			ACC100_INFO_RING_NUM_ENTRIES *
>>> +			sizeof(*d->info_ring), RTE_CACHE_LINE_SIZE,
>>> +			dev->data->socket_id);
>>> +	if (d->info_ring == NULL) {
>>> +		rte_bbdev_log(ERR,
>>> +				"Failed to allocate Info Ring for %s:%u",
>>> +				dev->device->driver->name,
>>> +				dev->data->dev_id);
>> The callers do not check whether this fails.
> Arguably the error would be self-contained if that did fail, but it doesn't hurt to add the check, ok.
>
>>> +		return -ENOMEM;
>>> +	}
>>> +	info_ring_phys = rte_malloc_virt2iova(d->info_ring);
>>> +
>>> +	/* Setup Info Ring */
>>> +	phys_high = (uint32_t)(info_ring_phys >> 32);
>>> +	phys_low  = (uint32_t)(info_ring_phys);
>>> +	acc100_reg_write(d, reg_addr->info_ring_hi, phys_high);
>>> +	acc100_reg_write(d, reg_addr->info_ring_lo, phys_low);
>>> +	acc100_reg_write(d, reg_addr->info_ring_en,
>> ACC100_REG_IRQ_EN_ALL);
>>> +	d->info_ring_head = (acc100_reg_read(d, reg_addr->info_ring_ptr) &
>>> +			0xFFF) / sizeof(union acc100_info_ring_data);
>>> +	return 0;
>>> +}
>>> +
>>> +
>>>  /* Allocate 64MB memory used for all software rings */  static int
>>> acc100_setup_queues(struct rte_bbdev *dev, uint16_t num_queues, int
>>> socket_id) @@ -426,6 +633,7 @@
>>>  	acc100_reg_write(d, reg_addr->tail_ptrs_dl4g_hi, phys_high);
>>>  	acc100_reg_write(d, reg_addr->tail_ptrs_dl4g_lo, phys_low);
>>>
>>> +	allocate_inforing(dev);
>> need to check here
>>>  	d->harq_layout = rte_zmalloc_socket("HARQ Layout",
>>>  			ACC100_HARQ_LAYOUT * sizeof(*d->harq_layout),
>>>  			RTE_CACHE_LINE_SIZE, dev->data->socket_id); @@ -
>> 437,13 +645,53 @@
>>>  	return 0;
>>>  }
>>>
>>> +static int
>>> +acc100_intr_enable(struct rte_bbdev *dev) {
>>> +	int ret;
>>> +	struct acc100_device *d = dev->data->dev_private;
>>> +
>>> +	/* Only MSI are currently supported */
>>> +	if (dev->intr_handle->type == RTE_INTR_HANDLE_VFIO_MSI ||
>>> +			dev->intr_handle->type == RTE_INTR_HANDLE_UIO)
>> {
>>> +
>>> +		allocate_inforing(dev);
>> need to check here
>>> +
>>> +		ret = rte_intr_enable(dev->intr_handle);
>>> +		if (ret < 0) {
>>> +			rte_bbdev_log(ERR,
>>> +					"Couldn't enable interrupts for
>> device: %s",
>>> +					dev->data->name);
>>> +			rte_free(d->info_ring);
>>> +			return ret;
>>> +		}
>>> +		ret = rte_intr_callback_register(dev->intr_handle,
>>> +				acc100_dev_interrupt_handler, dev);
>>> +		if (ret < 0) {
>>> +			rte_bbdev_log(ERR,
>>> +					"Couldn't register interrupt callback
>> for device: %s",
>>> +					dev->data->name);
>>> +			rte_free(d->info_ring);
>> does intr need to be disabled here ?
> Well, I don't see a lot of consistency with other drivers. Sometimes these are not even checked for failure.
> I would rather defer changing this to a future patch if required, as this is the same code already used in other bbdev drivers (if changed, I would rather they all be changed the same way).

ok.


>
>>> +			return ret;
>>> +		}
>>> +
>>> +		return 0;
>>> +	}
>>> +
>>> +	rte_bbdev_log(ERR, "ACC100 (%s) supports only VFIO MSI
>> interrupts",
>>> +			dev->data->name);
>>> +	return -ENOTSUP;
>>> +}
>>> +
>>>  /* Free 64MB memory used for software rings */  static int
>>> acc100_dev_close(struct rte_bbdev *dev)  {
>>>  	struct acc100_device *d = dev->data->dev_private;
>>> +	acc100_check_ir(d);
>>>  	if (d->sw_rings_base != NULL) {
>>>  		rte_free(d->tail_ptrs);
>>> +		rte_free(d->info_ring);
>>>  		rte_free(d->sw_rings_base);
>>>  		d->sw_rings_base = NULL;
>>>  	}
>>> @@ -643,6 +891,7 @@
>>>  					RTE_BBDEV_TURBO_CRC_TYPE_24B
>> |
>> 	RTE_BBDEV_TURBO_HALF_ITERATION_EVEN |
>> 	RTE_BBDEV_TURBO_EARLY_TERMINATION |
>>> +
>> 	RTE_BBDEV_TURBO_DEC_INTERRUPTS |
>> 	RTE_BBDEV_TURBO_NEG_LLR_1_BIT_IN |
>>>  					RTE_BBDEV_TURBO_MAP_DEC |
>>>
>> 	RTE_BBDEV_TURBO_DEC_TB_CRC_24B_KEEP | @@ -663,6 +912,7
>> @@
>> 	RTE_BBDEV_TURBO_CRC_24B_ATTACH |
>> 	RTE_BBDEV_TURBO_RV_INDEX_BYPASS |
>>>  					RTE_BBDEV_TURBO_RATE_MATCH |
>>> +
>> 	RTE_BBDEV_TURBO_ENC_INTERRUPTS |
>> 	RTE_BBDEV_TURBO_ENC_SCATTER_GATHER,
>>>  				.num_buffers_src =
>>>
>> 	RTE_BBDEV_TURBO_MAX_CODE_BLOCKS, @@ -676,7 +926,8 @@
>>>  				.capability_flags =
>>>  					RTE_BBDEV_LDPC_RATE_MATCH |
>>>
>> 	RTE_BBDEV_LDPC_CRC_24B_ATTACH |
>>> -
>> 	RTE_BBDEV_LDPC_INTERLEAVER_BYPASS,
>>> +
>> 	RTE_BBDEV_LDPC_INTERLEAVER_BYPASS |
>>> +
>> 	RTE_BBDEV_LDPC_ENC_INTERRUPTS,
>>>  				.num_buffers_src =
>>>
>> 	RTE_BBDEV_LDPC_MAX_CODE_BLOCKS,
>>>  				.num_buffers_dst =
>>> @@ -701,7 +952,8 @@
>>>  				RTE_BBDEV_LDPC_DECODE_BYPASS |
>>>  				RTE_BBDEV_LDPC_DEC_SCATTER_GATHER |
>>>
>> 	RTE_BBDEV_LDPC_HARQ_6BIT_COMPRESSION |
>>> -				RTE_BBDEV_LDPC_LLR_COMPRESSION,
>>> +				RTE_BBDEV_LDPC_LLR_COMPRESSION |
>>> +				RTE_BBDEV_LDPC_DEC_INTERRUPTS,
>>>  			.llr_size = 8,
>>>  			.llr_decimals = 1,
>>>  			.num_buffers_src =
>>> @@ -751,14 +1003,39 @@
>>>  #else
>>>  	dev_info->harq_buffer_size = 0;
>>>  #endif
>>> +	acc100_check_ir(d);
>>> +}
>>> +
>>> +static int
>>> +acc100_queue_intr_enable(struct rte_bbdev *dev, uint16_t queue_id) {
>>> +	struct acc100_queue *q = dev->data-
>>> queues[queue_id].queue_private;
>>> +
>>> +	if (dev->intr_handle->type != RTE_INTR_HANDLE_VFIO_MSI &&
>>> +			dev->intr_handle->type != RTE_INTR_HANDLE_UIO)
>>> +		return -ENOTSUP;
>>> +
>>> +	q->irq_enable = 1;
>>> +	return 0;
>>> +}
>>> +
>>> +static int
>>> +acc100_queue_intr_disable(struct rte_bbdev *dev, uint16_t queue_id) {
>>> +	struct acc100_queue *q = dev->data-
>>> queues[queue_id].queue_private;
>>> +	q->irq_enable = 0;
>> There is an -ENOTSUP check in the enable path above; a similar check is needed here.
> How can this fail when we purely disable?

It is for api consistency.

the enable fails

the disable succeeds

that is not consistent.

Tom

>
>>> +	return 0;
>>>  }
>>>
>>>  static const struct rte_bbdev_ops acc100_bbdev_ops = {
>>>  	.setup_queues = acc100_setup_queues,
>>> +	.intr_enable = acc100_intr_enable,
>>>  	.close = acc100_dev_close,
>>>  	.info_get = acc100_dev_info_get,
>>>  	.queue_setup = acc100_queue_setup,
>>>  	.queue_release = acc100_queue_release,
>>> +	.queue_intr_enable = acc100_queue_intr_enable,
>>> +	.queue_intr_disable = acc100_queue_intr_disable
>>>  };
>>>
>>>  /* ACC100 PCI PF address map */
>>> @@ -3018,8 +3295,10 @@
>>>  			? (1 << RTE_BBDEV_DATA_ERROR) : 0);
>>>  	op->status |= ((rsp.dma_err) ? (1 << RTE_BBDEV_DRV_ERROR) : 0);
>>>  	op->status |= ((rsp.fcw_err) ? (1 << RTE_BBDEV_DRV_ERROR) : 0);
>>> -	if (op->status != 0)
>>> +	if (op->status != 0) {
>>>  		q_data->queue_stats.dequeue_err_count++;
>>> +		acc100_check_ir(q->d);
>>> +	}
>>>
>>>  	/* CRC invalid if error exists */
>>>  	if (!op->status)
>>> @@ -3076,6 +3355,9 @@
>>>  		op->status |= 1 << RTE_BBDEV_SYNDROME_ERROR;
>>>  	op->ldpc_dec.iter_count = (uint8_t) rsp.iter_cnt;
>>>
>>> +	if (op->status & (1 << RTE_BBDEV_DRV_ERROR))
>>> +		acc100_check_ir(q->d);
>>> +
>>>  	/* Check if this is the last desc in batch (Atomic Queue) */
>>>  	if (desc->req.last_desc_in_batch) {
>>>  		(*aq_dequeued)++;
>>> diff --git a/drivers/baseband/acc100/rte_acc100_pmd.h
>>> b/drivers/baseband/acc100/rte_acc100_pmd.h
>>> index 78686c1..8980fa5 100644
>>> --- a/drivers/baseband/acc100/rte_acc100_pmd.h
>>> +++ b/drivers/baseband/acc100/rte_acc100_pmd.h
>>> @@ -559,7 +559,14 @@ struct acc100_device {
>>>  	/* Virtual address of the info memory routed to the this function
>> under
>>>  	 * operation, whether it is PF or VF.
>>>  	 */
>>> +	union acc100_info_ring_data *info_ring;
>> Need a comment that this array needs a sentinel ?
> I can clarify the expected HW behaviour a bit.
>
> Thanks
>
>> Tom
>>
>>> +
>>>  	union acc100_harq_layout_data *harq_layout;
>>> +	/* Virtual Info Ring head */
>>> +	uint16_t info_ring_head;
>>> +	/* Number of bytes available for each queue in device, depending
>> on
>>> +	 * how many queues are enabled with configure()
>>> +	 */
>>>  	uint32_t sw_ring_size;
>>>  	uint32_t ddr_size; /* Size in kB */
>>>  	uint32_t *tail_ptrs; /* Base address of response tail pointer buffer
>>> */ @@ -575,4 +582,12 @@ struct acc100_device {
>>>  	bool configured; /**< True if this ACC100 device is configured */
>>> };
>>>
>>> +/**
>>> + * Structure with details about RTE_BBDEV_EVENT_DEQUEUE event. It's
>>> +passed to
>>> + * the callback function.
>>> + */
>>> +struct acc100_deq_intr_details {
>>> +	uint16_t queue_id;
>>> +};
>>> +
>>>  #endif /* _RTE_ACC100_PMD_H_ */



More information about the dev mailing list