[PATCH 10/14] net/xsc: optimize Rx path
Renyong Wan
wanry at yunsilicon.com
Fri Aug 29 10:24:28 CEST 2025
CQEs are not cache-line aligned, which can cause cache conflicts when
polling Rx CQs under high-PPS load.
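This patch reads the CQ producer index and compares it with the consumer
index before processing packets: the burst returns immediately when the
two are equal, and is otherwise limited to the number of CQEs between
them, reducing cache conflicts. The added MMIO read overhead is minor
compared to the latency caused by cache conflicts, so observed
small-packet performance improves. The check is enabled only on PFs
(cq_pi is left NULL on VFs), and the Rx CQ is now sized at twice wqe_s.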
Signed-off-by: Rong Qian <qianr at yunsilicon.com>
Signed-off-by: Renyong Wan <wanry at yunsilicon.com>
---
drivers/net/xsc/xsc_defs.h | 2 ++
drivers/net/xsc/xsc_rx.c | 18 ++++++++++++++++--
drivers/net/xsc/xsc_rx.h | 1 +
drivers/net/xsc/xsc_vfio.c | 2 +-
4 files changed, 20 insertions(+), 3 deletions(-)
diff --git a/drivers/net/xsc/xsc_defs.h b/drivers/net/xsc/xsc_defs.h
index 4b95a0521d..73941901e7 100644
--- a/drivers/net/xsc/xsc_defs.h
+++ b/drivers/net/xsc/xsc_defs.h
@@ -46,10 +46,12 @@
#define XSC_PF_TX_DB_ADDR 0x4802000
#define XSC_PF_RX_DB_ADDR 0x4804000
#define XSC_PF_CQ_DB_ADDR 0x2120000
+#define XSC_PF_CQ_PID_START_ADDR 0x2080000
#define XSC_VF_RX_DB_ADDR 0x8d4
#define XSC_VF_TX_DB_ADDR 0x8d0
#define XSC_VF_CQ_DB_ADDR 0x8c4
+#define XSC_VF_CQ_PID_START_ADDR 0x60000
#define XSC_HIF_CMDQM_VECTOR_ID_MEM_ADDR 0x1034000
diff --git a/drivers/net/xsc/xsc_rx.c b/drivers/net/xsc/xsc_rx.c
index 332ceb9606..5f8003a1f6 100644
--- a/drivers/net/xsc/xsc_rx.c
+++ b/drivers/net/xsc/xsc_rx.c
@@ -83,6 +83,16 @@ xsc_rx_burst(void *dpdk_rxq, struct rte_mbuf **pkts, uint16_t pkts_n)
int cqe_msg_len = 0;
volatile struct xsc_cqe_u64 *cqe_u64 = NULL;
struct rte_mbuf *rep;
+ uint16_t cq_pi;
+ uint16_t cqe_pkts_n = 0;
+
+ if (rxq->cq_pi != NULL) {
+ cq_pi = (*(volatile uint32_t *)(rxq->cq_pi)) & 0xFFFF;
+ if (cq_pi == rxq->cq_ci)
+ return 0;
+ cqe_pkts_n = (uint16_t)((cq_pi - rxq->cq_ci) & 0xFFFF);
+ pkts_n = pkts_n < cqe_pkts_n ? pkts_n : cqe_pkts_n;
+ }
while (pkts_n) {
uint32_t idx = rq_ci & wqe_m;
@@ -463,12 +473,16 @@ xsc_rss_qp_create(struct xsc_ethdev_priv *priv, int port_id)
}
rxq_data->wqes = rxq_data->rq_pas->addr;
- if (!xsc_dev_is_vf(xdev))
+ if (!xsc_dev_is_vf(xdev)) {
rxq_data->rq_db = (uint32_t *)((uint8_t *)xdev->bar_addr +
XSC_PF_RX_DB_ADDR);
- else
+ rxq_data->cq_pi = (uint32_t *)((uint8_t *)xdev->bar_addr +
+ XSC_PF_CQ_PID_START_ADDR + rxq_data->cqn * 4);
+ } else {
rxq_data->rq_db = (uint32_t *)((uint8_t *)xdev->bar_addr +
XSC_VF_RX_DB_ADDR);
+ rxq_data->cq_pi = NULL;
+ }
rxq_data->qpn = rqn_base + i;
xsc_dev_modify_qp_status(xdev, rxq_data->qpn, 1, XSC_CMD_OP_RTR2RTS_QP);
diff --git a/drivers/net/xsc/xsc_rx.h b/drivers/net/xsc/xsc_rx.h
index 90fbb89197..59cbbb5141 100644
--- a/drivers/net/xsc/xsc_rx.h
+++ b/drivers/net/xsc/xsc_rx.h
@@ -31,6 +31,7 @@ struct __rte_cache_aligned xsc_rxq_data {
uint16_t rsv0:4;
volatile uint32_t *rq_db;
volatile uint32_t *cq_db;
+ volatile uint32_t *cq_pi;
uint32_t rq_ci;
uint32_t rq_pi;
uint16_t cq_ci;
diff --git a/drivers/net/xsc/xsc_vfio.c b/drivers/net/xsc/xsc_vfio.c
index 1650a3ab2b..c233728c5f 100644
--- a/drivers/net/xsc/xsc_vfio.c
+++ b/drivers/net/xsc/xsc_vfio.c
@@ -562,7 +562,7 @@ xsc_vfio_rx_cq_create(struct xsc_dev *xdev, struct xsc_rx_cq_params *cq_params,
PMD_DRV_LOG(WARNING, "Port %u rxq %u: cq numa_node=%u, device numa_node=%u",
port_id, idx, cq_params->socket_id, numa_node);
- cqe_n = cq_params->wqe_s;
+ cqe_n = cq_params->wqe_s * 2;
log_cq_sz = rte_log2_u32(cqe_n);
cqe_total_sz = cqe_n * sizeof(struct xsc_cqe);
pa_num = (cqe_total_sz + XSC_PAGE_SIZE - 1) / XSC_PAGE_SIZE;
--
2.25.1
More information about the dev
mailing list