1e31f123dSWei Hu (Xavier) /* SPDX-License-Identifier: BSD-3-Clause 2e31f123dSWei Hu (Xavier) * Copyright(c) 2020 Hisilicon Limited. 3e31f123dSWei Hu (Xavier) */ 4e31f123dSWei Hu (Xavier) 5e31f123dSWei Hu (Xavier) #include <rte_io.h> 6df96fd0dSBruce Richardson #include <ethdev_driver.h> 7e31f123dSWei Hu (Xavier) 8e31f123dSWei Hu (Xavier) #include "hns3_ethdev.h" 9e31f123dSWei Hu (Xavier) #include "hns3_rxtx.h" 10e31f123dSWei Hu (Xavier) #include "hns3_rxtx_vec.h" 11e31f123dSWei Hu (Xavier) 12e31f123dSWei Hu (Xavier) #if defined RTE_ARCH_ARM64 13e31f123dSWei Hu (Xavier) #include "hns3_rxtx_vec_neon.h" 14e31f123dSWei Hu (Xavier) #endif 15e31f123dSWei Hu (Xavier) 16e31f123dSWei Hu (Xavier) int 17e31f123dSWei Hu (Xavier) hns3_tx_check_vec_support(struct rte_eth_dev *dev) 18e31f123dSWei Hu (Xavier) { 19e31f123dSWei Hu (Xavier) struct rte_eth_txmode *txmode = &dev->data->dev_conf.txmode; 20e31f123dSWei Hu (Xavier) 21*38b539d9SMin Hu (Connor) struct hns3_hw *hw = HNS3_DEV_PRIVATE_TO_HW(dev->data->dev_private); 22*38b539d9SMin Hu (Connor) if (hns3_dev_ptp_supported(hw)) 23*38b539d9SMin Hu (Connor) return -ENOTSUP; 24*38b539d9SMin Hu (Connor) 25e31f123dSWei Hu (Xavier) /* Only support DEV_TX_OFFLOAD_MBUF_FAST_FREE */ 26e31f123dSWei Hu (Xavier) if (txmode->offloads != DEV_TX_OFFLOAD_MBUF_FAST_FREE) 27e31f123dSWei Hu (Xavier) return -ENOTSUP; 28e31f123dSWei Hu (Xavier) 29e31f123dSWei Hu (Xavier) return 0; 30e31f123dSWei Hu (Xavier) } 31e31f123dSWei Hu (Xavier) 32e31f123dSWei Hu (Xavier) uint16_t 33e31f123dSWei Hu (Xavier) hns3_xmit_pkts_vec(void *tx_queue, struct rte_mbuf **tx_pkts, uint16_t nb_pkts) 34e31f123dSWei Hu (Xavier) { 35e31f123dSWei Hu (Xavier) struct hns3_tx_queue *txq = (struct hns3_tx_queue *)tx_queue; 36e31f123dSWei Hu (Xavier) uint16_t nb_tx = 0; 37e31f123dSWei Hu (Xavier) 38e31f123dSWei Hu (Xavier) while (nb_pkts) { 39e31f123dSWei Hu (Xavier) uint16_t ret, new_burst; 40e31f123dSWei Hu (Xavier) 41e31f123dSWei Hu (Xavier) new_burst = RTE_MIN(nb_pkts, txq->tx_rs_thresh); 42e31f123dSWei Hu (Xavier) ret = hns3_xmit_fixed_burst_vec(tx_queue, &tx_pkts[nb_tx], 43e31f123dSWei Hu (Xavier) new_burst); 44e31f123dSWei Hu (Xavier) nb_tx += ret; 45e31f123dSWei Hu (Xavier) nb_pkts -= ret; 46e31f123dSWei Hu (Xavier) if (ret < new_burst) 47e31f123dSWei Hu (Xavier) break; 48e31f123dSWei Hu (Xavier) } 49e31f123dSWei Hu (Xavier) 50e31f123dSWei Hu (Xavier) return nb_tx; 51e31f123dSWei Hu (Xavier) } 52a3d4f4d2SWei Hu (Xavier) 53a3d4f4d2SWei Hu (Xavier) static inline void 54a3d4f4d2SWei Hu (Xavier) hns3_rxq_rearm_mbuf(struct hns3_rx_queue *rxq) 55a3d4f4d2SWei Hu (Xavier) { 56a3d4f4d2SWei Hu (Xavier) #define REARM_LOOP_STEP_NUM 4 57a3d4f4d2SWei Hu (Xavier) struct hns3_entry *rxep = &rxq->sw_ring[rxq->rx_rearm_start]; 58a3d4f4d2SWei Hu (Xavier) struct hns3_desc *rxdp = rxq->rx_ring + rxq->rx_rearm_start; 59a3d4f4d2SWei Hu (Xavier) uint64_t dma_addr; 60a3d4f4d2SWei Hu (Xavier) int i; 61a3d4f4d2SWei Hu (Xavier) 62a3d4f4d2SWei Hu (Xavier) if (unlikely(rte_mempool_get_bulk(rxq->mb_pool, (void *)rxep, 63a3d4f4d2SWei Hu (Xavier) HNS3_DEFAULT_RXQ_REARM_THRESH) < 0)) { 64a3d4f4d2SWei Hu (Xavier) rte_eth_devices[rxq->port_id].data->rx_mbuf_alloc_failed++; 65a3d4f4d2SWei Hu (Xavier) return; 66a3d4f4d2SWei Hu (Xavier) } 67a3d4f4d2SWei Hu (Xavier) 68a3d4f4d2SWei Hu (Xavier) for (i = 0; i < HNS3_DEFAULT_RXQ_REARM_THRESH; i += REARM_LOOP_STEP_NUM, 69a3d4f4d2SWei Hu (Xavier) rxep += REARM_LOOP_STEP_NUM, rxdp += REARM_LOOP_STEP_NUM) { 70a3d4f4d2SWei Hu (Xavier) if (likely(i < 71a3d4f4d2SWei Hu (Xavier) HNS3_DEFAULT_RXQ_REARM_THRESH - REARM_LOOP_STEP_NUM)) { 72a3d4f4d2SWei Hu (Xavier) rte_prefetch_non_temporal(rxep[4].mbuf); 73a3d4f4d2SWei Hu (Xavier) rte_prefetch_non_temporal(rxep[5].mbuf); 74a3d4f4d2SWei Hu (Xavier) rte_prefetch_non_temporal(rxep[6].mbuf); 75a3d4f4d2SWei Hu (Xavier) rte_prefetch_non_temporal(rxep[7].mbuf); 76a3d4f4d2SWei Hu (Xavier) } 77a3d4f4d2SWei Hu (Xavier) 78a3d4f4d2SWei Hu (Xavier) dma_addr = rte_mbuf_data_iova_default(rxep[0].mbuf); 79a3d4f4d2SWei Hu (Xavier) rxdp[0].addr = rte_cpu_to_le_64(dma_addr); 80a3d4f4d2SWei Hu (Xavier) rxdp[0].rx.bd_base_info = 0; 81a3d4f4d2SWei Hu (Xavier) 82a3d4f4d2SWei Hu (Xavier) dma_addr = rte_mbuf_data_iova_default(rxep[1].mbuf); 83a3d4f4d2SWei Hu (Xavier) rxdp[1].addr = rte_cpu_to_le_64(dma_addr); 84a3d4f4d2SWei Hu (Xavier) rxdp[1].rx.bd_base_info = 0; 85a3d4f4d2SWei Hu (Xavier) 86a3d4f4d2SWei Hu (Xavier) dma_addr = rte_mbuf_data_iova_default(rxep[2].mbuf); 87a3d4f4d2SWei Hu (Xavier) rxdp[2].addr = rte_cpu_to_le_64(dma_addr); 88a3d4f4d2SWei Hu (Xavier) rxdp[2].rx.bd_base_info = 0; 89a3d4f4d2SWei Hu (Xavier) 90a3d4f4d2SWei Hu (Xavier) dma_addr = rte_mbuf_data_iova_default(rxep[3].mbuf); 91a3d4f4d2SWei Hu (Xavier) rxdp[3].addr = rte_cpu_to_le_64(dma_addr); 92a3d4f4d2SWei Hu (Xavier) rxdp[3].rx.bd_base_info = 0; 93a3d4f4d2SWei Hu (Xavier) } 94a3d4f4d2SWei Hu (Xavier) 95a3d4f4d2SWei Hu (Xavier) rxq->rx_rearm_start += HNS3_DEFAULT_RXQ_REARM_THRESH; 96a3d4f4d2SWei Hu (Xavier) if (rxq->rx_rearm_start >= rxq->nb_rx_desc) 97a3d4f4d2SWei Hu (Xavier) rxq->rx_rearm_start = 0; 98a3d4f4d2SWei Hu (Xavier) 99a3d4f4d2SWei Hu (Xavier) rxq->rx_rearm_nb -= HNS3_DEFAULT_RXQ_REARM_THRESH; 100a3d4f4d2SWei Hu (Xavier) 101a3d4f4d2SWei Hu (Xavier) hns3_write_reg_opt(rxq->io_head_reg, HNS3_DEFAULT_RXQ_REARM_THRESH); 102a3d4f4d2SWei Hu (Xavier) } 103a3d4f4d2SWei Hu (Xavier) 104a3d4f4d2SWei Hu (Xavier) uint16_t 105a3d4f4d2SWei Hu (Xavier) hns3_recv_pkts_vec(void *__restrict rx_queue, 106a3d4f4d2SWei Hu (Xavier) struct rte_mbuf **__restrict rx_pkts, 107a3d4f4d2SWei Hu (Xavier) uint16_t nb_pkts) 108a3d4f4d2SWei Hu (Xavier) { 109a3d4f4d2SWei Hu (Xavier) struct hns3_rx_queue *rxq = rx_queue; 110a3d4f4d2SWei Hu (Xavier) struct hns3_desc *rxdp = &rxq->rx_ring[rxq->next_to_use]; 111a3d4f4d2SWei Hu (Xavier) uint64_t bd_err_mask; /* bit mask indicate whick pkts is error */ 112a3d4f4d2SWei Hu (Xavier) uint16_t nb_rx; 113a3d4f4d2SWei Hu (Xavier) 114a3d4f4d2SWei Hu (Xavier) nb_pkts = RTE_MIN(nb_pkts, HNS3_DEFAULT_RX_BURST); 115a3d4f4d2SWei Hu (Xavier) nb_pkts = RTE_ALIGN_FLOOR(nb_pkts, HNS3_DEFAULT_DESCS_PER_LOOP); 116a3d4f4d2SWei Hu (Xavier) 117a3d4f4d2SWei Hu (Xavier) rte_prefetch_non_temporal(rxdp); 118a3d4f4d2SWei Hu (Xavier) 119a3d4f4d2SWei Hu (Xavier) if (rxq->rx_rearm_nb > HNS3_DEFAULT_RXQ_REARM_THRESH) 120a3d4f4d2SWei Hu (Xavier) hns3_rxq_rearm_mbuf(rxq); 121a3d4f4d2SWei Hu (Xavier) 122a3d4f4d2SWei Hu (Xavier) if (unlikely(!(rxdp->rx.bd_base_info & 123a3d4f4d2SWei Hu (Xavier) rte_cpu_to_le_32(1u << HNS3_RXD_VLD_B)))) 124a3d4f4d2SWei Hu (Xavier) return 0; 125a3d4f4d2SWei Hu (Xavier) 126a3d4f4d2SWei Hu (Xavier) rte_prefetch0(rxq->sw_ring[rxq->next_to_use + 0].mbuf); 127a3d4f4d2SWei Hu (Xavier) rte_prefetch0(rxq->sw_ring[rxq->next_to_use + 1].mbuf); 128a3d4f4d2SWei Hu (Xavier) rte_prefetch0(rxq->sw_ring[rxq->next_to_use + 2].mbuf); 129a3d4f4d2SWei Hu (Xavier) rte_prefetch0(rxq->sw_ring[rxq->next_to_use + 3].mbuf); 130a3d4f4d2SWei Hu (Xavier) 131a3d4f4d2SWei Hu (Xavier) bd_err_mask = 0; 132a3d4f4d2SWei Hu (Xavier) nb_rx = hns3_recv_burst_vec(rxq, rx_pkts, nb_pkts, &bd_err_mask); 133a3d4f4d2SWei Hu (Xavier) if (unlikely(bd_err_mask)) 134a3d4f4d2SWei Hu (Xavier) nb_rx = hns3_rx_reassemble_pkts(rx_pkts, nb_rx, bd_err_mask); 135a3d4f4d2SWei Hu (Xavier) 136a3d4f4d2SWei Hu (Xavier) return nb_rx; 137a3d4f4d2SWei Hu (Xavier) } 138a3d4f4d2SWei Hu (Xavier) 139a3d4f4d2SWei Hu (Xavier) static void 140a3d4f4d2SWei Hu (Xavier) hns3_rxq_vec_setup_rearm_data(struct hns3_rx_queue *rxq) 141a3d4f4d2SWei Hu (Xavier) { 142a3d4f4d2SWei Hu (Xavier) uintptr_t p; 143a3d4f4d2SWei Hu (Xavier) struct rte_mbuf mb_def = { .buf_addr = 0 }; /* zeroed mbuf */ 144a3d4f4d2SWei Hu (Xavier) 145a3d4f4d2SWei Hu (Xavier) mb_def.nb_segs = 1; 146a3d4f4d2SWei Hu (Xavier) mb_def.data_off = RTE_PKTMBUF_HEADROOM; 147a3d4f4d2SWei Hu (Xavier) mb_def.port = rxq->port_id; 148a3d4f4d2SWei Hu (Xavier) rte_mbuf_refcnt_set(&mb_def, 1); 149a3d4f4d2SWei Hu (Xavier) 150a3d4f4d2SWei Hu (Xavier) /* prevent compiler reordering: rearm_data covers previous fields */ 151a3d4f4d2SWei Hu (Xavier) rte_compiler_barrier(); 152a3d4f4d2SWei Hu (Xavier) p = (uintptr_t)&mb_def.rearm_data; 153a3d4f4d2SWei Hu (Xavier) rxq->mbuf_initializer = *(uint64_t *)p; 154a3d4f4d2SWei Hu (Xavier) } 155a3d4f4d2SWei Hu (Xavier) 156a3d4f4d2SWei Hu (Xavier) void 157a3d4f4d2SWei Hu (Xavier) hns3_rxq_vec_setup(struct hns3_rx_queue *rxq) 158a3d4f4d2SWei Hu (Xavier) { 159a3d4f4d2SWei Hu (Xavier) struct hns3_entry *sw_ring = &rxq->sw_ring[rxq->nb_rx_desc]; 160a3d4f4d2SWei Hu (Xavier) unsigned int i; 161a3d4f4d2SWei Hu (Xavier) 162a3d4f4d2SWei Hu (Xavier) memset(&rxq->rx_ring[rxq->nb_rx_desc], 0, 163a3d4f4d2SWei Hu (Xavier) sizeof(struct hns3_desc) * HNS3_DEFAULT_RX_BURST); 164a3d4f4d2SWei Hu (Xavier) 165a3d4f4d2SWei Hu (Xavier) memset(&rxq->fake_mbuf, 0, sizeof(rxq->fake_mbuf)); 166a3d4f4d2SWei Hu (Xavier) for (i = 0; i < HNS3_DEFAULT_RX_BURST; i++) 167a3d4f4d2SWei Hu (Xavier) sw_ring[i].mbuf = &rxq->fake_mbuf; 168a3d4f4d2SWei Hu (Xavier) 169a3d4f4d2SWei Hu (Xavier) hns3_rxq_vec_setup_rearm_data(rxq); 170a3d4f4d2SWei Hu (Xavier) 171a3d4f4d2SWei Hu (Xavier) memset(rxq->offset_table, 0, sizeof(rxq->offset_table)); 172a3d4f4d2SWei Hu (Xavier) } 173a3d4f4d2SWei Hu (Xavier) 174a3d4f4d2SWei Hu (Xavier) static int 175a3d4f4d2SWei Hu (Xavier) hns3_rxq_vec_check(struct hns3_rx_queue *rxq, void *arg) 176a3d4f4d2SWei Hu (Xavier) { 177a3d4f4d2SWei Hu (Xavier) uint32_t min_vec_bds = HNS3_DEFAULT_RXQ_REARM_THRESH + 178a3d4f4d2SWei Hu (Xavier) HNS3_DEFAULT_RX_BURST; 179a3d4f4d2SWei Hu (Xavier) 180a3d4f4d2SWei Hu (Xavier) if (rxq->nb_rx_desc < min_vec_bds) 181a3d4f4d2SWei Hu (Xavier) return -ENOTSUP; 182a3d4f4d2SWei Hu (Xavier) 183a3d4f4d2SWei Hu (Xavier) if (rxq->nb_rx_desc % HNS3_DEFAULT_RXQ_REARM_THRESH) 184a3d4f4d2SWei Hu (Xavier) return -ENOTSUP; 185a3d4f4d2SWei Hu (Xavier) 186a3d4f4d2SWei Hu (Xavier) RTE_SET_USED(arg); 187a3d4f4d2SWei Hu (Xavier) return 0; 188a3d4f4d2SWei Hu (Xavier) } 189a3d4f4d2SWei Hu (Xavier) 190a3d4f4d2SWei Hu (Xavier) int 191a3d4f4d2SWei Hu (Xavier) hns3_rx_check_vec_support(struct rte_eth_dev *dev) 192a3d4f4d2SWei Hu (Xavier) { 193a3d4f4d2SWei Hu (Xavier) struct rte_fdir_conf *fconf = &dev->data->dev_conf.fdir_conf; 194a3d4f4d2SWei Hu (Xavier) struct rte_eth_rxmode *rxmode = &dev->data->dev_conf.rxmode; 195a3d4f4d2SWei Hu (Xavier) uint64_t offloads_mask = DEV_RX_OFFLOAD_TCP_LRO | 196a3d4f4d2SWei Hu (Xavier) DEV_RX_OFFLOAD_VLAN; 197a3d4f4d2SWei Hu (Xavier) 198*38b539d9SMin Hu (Connor) struct hns3_hw *hw = HNS3_DEV_PRIVATE_TO_HW(dev->data->dev_private); 199*38b539d9SMin Hu (Connor) if (hns3_dev_ptp_supported(hw)) 200*38b539d9SMin Hu (Connor) return -ENOTSUP; 201*38b539d9SMin Hu (Connor) 202a3d4f4d2SWei Hu (Xavier) if (dev->data->scattered_rx) 203a3d4f4d2SWei Hu (Xavier) return -ENOTSUP; 204a3d4f4d2SWei Hu (Xavier) 205a3d4f4d2SWei Hu (Xavier) if (fconf->mode != RTE_FDIR_MODE_NONE) 206a3d4f4d2SWei Hu (Xavier) return -ENOTSUP; 207a3d4f4d2SWei Hu (Xavier) 208a3d4f4d2SWei Hu (Xavier) if (rxmode->offloads & offloads_mask) 209a3d4f4d2SWei Hu (Xavier) return -ENOTSUP; 210a3d4f4d2SWei Hu (Xavier) 211a3d4f4d2SWei Hu (Xavier) if (hns3_rxq_iterate(dev, hns3_rxq_vec_check, NULL) != 0) 212a3d4f4d2SWei Hu (Xavier) return -ENOTSUP; 213a3d4f4d2SWei Hu (Xavier) 214a3d4f4d2SWei Hu (Xavier) return 0; 215a3d4f4d2SWei Hu (Xavier) } 216