12e22920bSAdrien Mazarguil /*- 22e22920bSAdrien Mazarguil * BSD LICENSE 32e22920bSAdrien Mazarguil * 42e22920bSAdrien Mazarguil * Copyright 2015 6WIND S.A. 52e22920bSAdrien Mazarguil * Copyright 2015 Mellanox. 62e22920bSAdrien Mazarguil * 72e22920bSAdrien Mazarguil * Redistribution and use in source and binary forms, with or without 82e22920bSAdrien Mazarguil * modification, are permitted provided that the following conditions 92e22920bSAdrien Mazarguil * are met: 102e22920bSAdrien Mazarguil * 112e22920bSAdrien Mazarguil * * Redistributions of source code must retain the above copyright 122e22920bSAdrien Mazarguil * notice, this list of conditions and the following disclaimer. 132e22920bSAdrien Mazarguil * * Redistributions in binary form must reproduce the above copyright 142e22920bSAdrien Mazarguil * notice, this list of conditions and the following disclaimer in 152e22920bSAdrien Mazarguil * the documentation and/or other materials provided with the 162e22920bSAdrien Mazarguil * distribution. 172e22920bSAdrien Mazarguil * * Neither the name of 6WIND S.A. nor the names of its 182e22920bSAdrien Mazarguil * contributors may be used to endorse or promote products derived 192e22920bSAdrien Mazarguil * from this software without specific prior written permission. 202e22920bSAdrien Mazarguil * 212e22920bSAdrien Mazarguil * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 222e22920bSAdrien Mazarguil * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 232e22920bSAdrien Mazarguil * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 242e22920bSAdrien Mazarguil * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT 252e22920bSAdrien Mazarguil * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 262e22920bSAdrien Mazarguil * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT 272e22920bSAdrien Mazarguil * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 282e22920bSAdrien Mazarguil * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 292e22920bSAdrien Mazarguil * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 302e22920bSAdrien Mazarguil * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 312e22920bSAdrien Mazarguil * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 322e22920bSAdrien Mazarguil */ 332e22920bSAdrien Mazarguil 342e22920bSAdrien Mazarguil #include <assert.h> 352e22920bSAdrien Mazarguil #include <stdint.h> 362e22920bSAdrien Mazarguil #include <string.h> 372e22920bSAdrien Mazarguil #include <stdlib.h> 382e22920bSAdrien Mazarguil 392e22920bSAdrien Mazarguil /* Verbs header. */ 402e22920bSAdrien Mazarguil /* ISO C doesn't support unnamed structs/unions, disabling -pedantic. */ 412e22920bSAdrien Mazarguil #ifdef PEDANTIC 42fc5b160fSBruce Richardson #pragma GCC diagnostic ignored "-Wpedantic" 432e22920bSAdrien Mazarguil #endif 442e22920bSAdrien Mazarguil #include <infiniband/verbs.h> 456218063bSNélio Laranjeiro #include <infiniband/mlx5_hw.h> 466218063bSNélio Laranjeiro #include <infiniband/arch.h> 472e22920bSAdrien Mazarguil #ifdef PEDANTIC 48fc5b160fSBruce Richardson #pragma GCC diagnostic error "-Wpedantic" 492e22920bSAdrien Mazarguil #endif 502e22920bSAdrien Mazarguil 512e22920bSAdrien Mazarguil /* DPDK headers don't like -pedantic. */ 522e22920bSAdrien Mazarguil #ifdef PEDANTIC 53fc5b160fSBruce Richardson #pragma GCC diagnostic ignored "-Wpedantic" 542e22920bSAdrien Mazarguil #endif 552e22920bSAdrien Mazarguil #include <rte_mbuf.h> 562e22920bSAdrien Mazarguil #include <rte_mempool.h> 572e22920bSAdrien Mazarguil #include <rte_prefetch.h> 582e22920bSAdrien Mazarguil #include <rte_common.h> 592e22920bSAdrien Mazarguil #include <rte_branch_prediction.h> 606218063bSNélio Laranjeiro #include <rte_ether.h> 612e22920bSAdrien Mazarguil #ifdef PEDANTIC 62fc5b160fSBruce Richardson #pragma GCC diagnostic error "-Wpedantic" 632e22920bSAdrien Mazarguil #endif 642e22920bSAdrien Mazarguil 652e22920bSAdrien Mazarguil #include "mlx5.h" 662e22920bSAdrien Mazarguil #include "mlx5_utils.h" 672e22920bSAdrien Mazarguil #include "mlx5_rxtx.h" 68f3db9489SYaacov Hazan #include "mlx5_autoconf.h" 692e22920bSAdrien Mazarguil #include "mlx5_defs.h" 706218063bSNélio Laranjeiro #include "mlx5_prm.h" 716218063bSNélio Laranjeiro 7299c12dccSNélio Laranjeiro #ifndef NDEBUG 7399c12dccSNélio Laranjeiro 7499c12dccSNélio Laranjeiro /** 7599c12dccSNélio Laranjeiro * Verify or set magic value in CQE. 7699c12dccSNélio Laranjeiro * 7799c12dccSNélio Laranjeiro * @param cqe 7899c12dccSNélio Laranjeiro * Pointer to CQE. 7999c12dccSNélio Laranjeiro * 8099c12dccSNélio Laranjeiro * @return 8199c12dccSNélio Laranjeiro * 0 the first time. 8299c12dccSNélio Laranjeiro */ 8399c12dccSNélio Laranjeiro static inline int 8497267b8eSNelio Laranjeiro check_cqe_seen(volatile struct mlx5_cqe *cqe) 8599c12dccSNélio Laranjeiro { 8699c12dccSNélio Laranjeiro static const uint8_t magic[] = "seen"; 87ea3bc3b1SNélio Laranjeiro volatile uint8_t (*buf)[sizeof(cqe->rsvd0)] = &cqe->rsvd0; 8899c12dccSNélio Laranjeiro int ret = 1; 8999c12dccSNélio Laranjeiro unsigned int i; 9099c12dccSNélio Laranjeiro 9199c12dccSNélio Laranjeiro for (i = 0; i < sizeof(magic) && i < sizeof(*buf); ++i) 9299c12dccSNélio Laranjeiro if (!ret || (*buf)[i] != magic[i]) { 9399c12dccSNélio Laranjeiro ret = 0; 9499c12dccSNélio Laranjeiro (*buf)[i] = magic[i]; 9599c12dccSNélio Laranjeiro } 9699c12dccSNélio Laranjeiro return ret; 9799c12dccSNélio Laranjeiro } 9899c12dccSNélio Laranjeiro 9999c12dccSNélio Laranjeiro #endif /* NDEBUG */ 1006218063bSNélio Laranjeiro 1016218063bSNélio Laranjeiro static inline int 10297267b8eSNelio Laranjeiro check_cqe(volatile struct mlx5_cqe *cqe, 10399c12dccSNélio Laranjeiro unsigned int cqes_n, const uint16_t ci) 10499c12dccSNélio Laranjeiro __attribute__((always_inline)); 1056218063bSNélio Laranjeiro 10699c12dccSNélio Laranjeiro /** 10799c12dccSNélio Laranjeiro * Check whether CQE is valid. 10899c12dccSNélio Laranjeiro * 10999c12dccSNélio Laranjeiro * @param cqe 11099c12dccSNélio Laranjeiro * Pointer to CQE. 11199c12dccSNélio Laranjeiro * @param cqes_n 11299c12dccSNélio Laranjeiro * Size of completion queue. 11399c12dccSNélio Laranjeiro * @param ci 11499c12dccSNélio Laranjeiro * Consumer index. 11599c12dccSNélio Laranjeiro * 11699c12dccSNélio Laranjeiro * @return 11799c12dccSNélio Laranjeiro * 0 on success, 1 on failure. 11899c12dccSNélio Laranjeiro */ 11999c12dccSNélio Laranjeiro static inline int 12097267b8eSNelio Laranjeiro check_cqe(volatile struct mlx5_cqe *cqe, 12199c12dccSNélio Laranjeiro unsigned int cqes_n, const uint16_t ci) 1226218063bSNélio Laranjeiro { 12399c12dccSNélio Laranjeiro uint16_t idx = ci & cqes_n; 12499c12dccSNélio Laranjeiro uint8_t op_own = cqe->op_own; 12599c12dccSNélio Laranjeiro uint8_t op_owner = MLX5_CQE_OWNER(op_own); 12699c12dccSNélio Laranjeiro uint8_t op_code = MLX5_CQE_OPCODE(op_own); 1276218063bSNélio Laranjeiro 12899c12dccSNélio Laranjeiro if (unlikely((op_owner != (!!(idx))) || (op_code == MLX5_CQE_INVALID))) 12999c12dccSNélio Laranjeiro return 1; /* No CQE. */ 13099c12dccSNélio Laranjeiro #ifndef NDEBUG 13199c12dccSNélio Laranjeiro if ((op_code == MLX5_CQE_RESP_ERR) || 13299c12dccSNélio Laranjeiro (op_code == MLX5_CQE_REQ_ERR)) { 13399c12dccSNélio Laranjeiro volatile struct mlx5_err_cqe *err_cqe = (volatile void *)cqe; 13499c12dccSNélio Laranjeiro uint8_t syndrome = err_cqe->syndrome; 13599c12dccSNélio Laranjeiro 13699c12dccSNélio Laranjeiro if ((syndrome == MLX5_CQE_SYNDROME_LOCAL_LENGTH_ERR) || 13799c12dccSNélio Laranjeiro (syndrome == MLX5_CQE_SYNDROME_REMOTE_ABORTED_ERR)) 13899c12dccSNélio Laranjeiro return 0; 13997267b8eSNelio Laranjeiro if (!check_cqe_seen(cqe)) 14099c12dccSNélio Laranjeiro ERROR("unexpected CQE error %u (0x%02x)" 14199c12dccSNélio Laranjeiro " syndrome 0x%02x", 14299c12dccSNélio Laranjeiro op_code, op_code, syndrome); 14399c12dccSNélio Laranjeiro return 1; 14499c12dccSNélio Laranjeiro } else if ((op_code != MLX5_CQE_RESP_SEND) && 14599c12dccSNélio Laranjeiro (op_code != MLX5_CQE_REQ)) { 14697267b8eSNelio Laranjeiro if (!check_cqe_seen(cqe)) 14799c12dccSNélio Laranjeiro ERROR("unexpected CQE opcode %u (0x%02x)", 14899c12dccSNélio Laranjeiro op_code, op_code); 14999c12dccSNélio Laranjeiro return 1; 1506218063bSNélio Laranjeiro } 15199c12dccSNélio Laranjeiro #endif /* NDEBUG */ 15299c12dccSNélio Laranjeiro return 0; 1536218063bSNélio Laranjeiro } 1542e22920bSAdrien Mazarguil 155fdcb0f53SNélio Laranjeiro /** 156fdcb0f53SNélio Laranjeiro * Return the address of the WQE. 157fdcb0f53SNélio Laranjeiro * 158fdcb0f53SNélio Laranjeiro * @param txq 159fdcb0f53SNélio Laranjeiro * Pointer to TX queue structure. 160fdcb0f53SNélio Laranjeiro * @param wqe_ci 161fdcb0f53SNélio Laranjeiro * WQE consumer index. 162fdcb0f53SNélio Laranjeiro * 163fdcb0f53SNélio Laranjeiro * @return 164fdcb0f53SNélio Laranjeiro * WQE address. 165fdcb0f53SNélio Laranjeiro */ 166fdcb0f53SNélio Laranjeiro static inline uintptr_t * 167fdcb0f53SNélio Laranjeiro tx_mlx5_wqe(struct txq *txq, uint16_t ci) 168fdcb0f53SNélio Laranjeiro { 169fdcb0f53SNélio Laranjeiro ci &= ((1 << txq->wqe_n) - 1); 170fdcb0f53SNélio Laranjeiro return (uintptr_t *)((uintptr_t)txq->wqes + ci * MLX5_WQE_SIZE); 171fdcb0f53SNélio Laranjeiro } 172fdcb0f53SNélio Laranjeiro 173a6ca35aaSNélio Laranjeiro static inline void 174a6ca35aaSNélio Laranjeiro txq_complete(struct txq *txq) __attribute__((always_inline)); 175a6ca35aaSNélio Laranjeiro 1762e22920bSAdrien Mazarguil /** 1772e22920bSAdrien Mazarguil * Manage TX completions. 1782e22920bSAdrien Mazarguil * 1792e22920bSAdrien Mazarguil * When sending a burst, mlx5_tx_burst() posts several WRs. 1802e22920bSAdrien Mazarguil * 1812e22920bSAdrien Mazarguil * @param txq 1822e22920bSAdrien Mazarguil * Pointer to TX queue structure. 1832e22920bSAdrien Mazarguil */ 184a6ca35aaSNélio Laranjeiro static inline void 1852e22920bSAdrien Mazarguil txq_complete(struct txq *txq) 1862e22920bSAdrien Mazarguil { 187b4b12e55SNélio Laranjeiro const unsigned int elts_n = 1 << txq->elts_n; 188e2f116eeSNélio Laranjeiro const unsigned int cqe_n = 1 << txq->cqe_n; 18999c12dccSNélio Laranjeiro const unsigned int cqe_cnt = cqe_n - 1; 1901d88ba17SNélio Laranjeiro uint16_t elts_free = txq->elts_tail; 1911d88ba17SNélio Laranjeiro uint16_t elts_tail; 1921d88ba17SNélio Laranjeiro uint16_t cq_ci = txq->cq_ci; 19397267b8eSNelio Laranjeiro volatile struct mlx5_cqe *cqe = NULL; 194fdcb0f53SNélio Laranjeiro volatile struct mlx5_wqe_ctrl *ctrl; 1952e22920bSAdrien Mazarguil 19699c12dccSNélio Laranjeiro do { 19797267b8eSNelio Laranjeiro volatile struct mlx5_cqe *tmp; 1981d88ba17SNélio Laranjeiro 19997267b8eSNelio Laranjeiro tmp = &(*txq->cqes)[cq_ci & cqe_cnt]; 20097267b8eSNelio Laranjeiro if (check_cqe(tmp, cqe_n, cq_ci)) 2011d88ba17SNélio Laranjeiro break; 202c305090bSAdrien Mazarguil cqe = tmp; 20399c12dccSNélio Laranjeiro #ifndef NDEBUG 20499c12dccSNélio Laranjeiro if (MLX5_CQE_FORMAT(cqe->op_own) == MLX5_COMPRESSED) { 20597267b8eSNelio Laranjeiro if (!check_cqe_seen(cqe)) 20699c12dccSNélio Laranjeiro ERROR("unexpected compressed CQE, TX stopped"); 20799c12dccSNélio Laranjeiro return; 2082e22920bSAdrien Mazarguil } 20999c12dccSNélio Laranjeiro if ((MLX5_CQE_OPCODE(cqe->op_own) == MLX5_CQE_RESP_ERR) || 21099c12dccSNélio Laranjeiro (MLX5_CQE_OPCODE(cqe->op_own) == MLX5_CQE_REQ_ERR)) { 21197267b8eSNelio Laranjeiro if (!check_cqe_seen(cqe)) 21299c12dccSNélio Laranjeiro ERROR("unexpected error CQE, TX stopped"); 21399c12dccSNélio Laranjeiro return; 21499c12dccSNélio Laranjeiro } 21599c12dccSNélio Laranjeiro #endif /* NDEBUG */ 21699c12dccSNélio Laranjeiro ++cq_ci; 21799c12dccSNélio Laranjeiro } while (1); 218c305090bSAdrien Mazarguil if (unlikely(cqe == NULL)) 2191d88ba17SNélio Laranjeiro return; 220fdcb0f53SNélio Laranjeiro ctrl = (volatile struct mlx5_wqe_ctrl *) 221fdcb0f53SNélio Laranjeiro tx_mlx5_wqe(txq, ntohs(cqe->wqe_counter)); 222fdcb0f53SNélio Laranjeiro elts_tail = ctrl->ctrl3; 223a821d09dSNélio Laranjeiro assert(elts_tail < (1 << txq->wqe_n)); 2241d88ba17SNélio Laranjeiro /* Free buffers. */ 225c305090bSAdrien Mazarguil while (elts_free != elts_tail) { 2261d88ba17SNélio Laranjeiro struct rte_mbuf *elt = (*txq->elts)[elts_free]; 227a859e8a9SNelio Laranjeiro unsigned int elts_free_next = 2281d88ba17SNélio Laranjeiro (elts_free + 1) & (elts_n - 1); 2291d88ba17SNélio Laranjeiro struct rte_mbuf *elt_next = (*txq->elts)[elts_free_next]; 230a859e8a9SNelio Laranjeiro 231b185e63fSAdrien Mazarguil #ifndef NDEBUG 232b185e63fSAdrien Mazarguil /* Poisoning. */ 2331d88ba17SNélio Laranjeiro memset(&(*txq->elts)[elts_free], 2341d88ba17SNélio Laranjeiro 0x66, 2351d88ba17SNélio Laranjeiro sizeof((*txq->elts)[elts_free])); 236b185e63fSAdrien Mazarguil #endif 2371d88ba17SNélio Laranjeiro RTE_MBUF_PREFETCH_TO_FREE(elt_next); 2381d88ba17SNélio Laranjeiro /* Only one segment needs to be freed. */ 2391d88ba17SNélio Laranjeiro rte_pktmbuf_free_seg(elt); 240a859e8a9SNelio Laranjeiro elts_free = elts_free_next; 241c305090bSAdrien Mazarguil } 2421d88ba17SNélio Laranjeiro txq->cq_ci = cq_ci; 2432e22920bSAdrien Mazarguil txq->elts_tail = elts_tail; 2441d88ba17SNélio Laranjeiro /* Update the consumer index. */ 2451d88ba17SNélio Laranjeiro rte_wmb(); 2461d88ba17SNélio Laranjeiro *txq->cq_db = htonl(cq_ci); 2472e22920bSAdrien Mazarguil } 2482e22920bSAdrien Mazarguil 2492e22920bSAdrien Mazarguil /** 2508340392eSAdrien Mazarguil * Get Memory Pool (MP) from mbuf. If mbuf is indirect, the pool from which 2518340392eSAdrien Mazarguil * the cloned mbuf is allocated is returned instead. 2528340392eSAdrien Mazarguil * 2538340392eSAdrien Mazarguil * @param buf 2548340392eSAdrien Mazarguil * Pointer to mbuf. 2558340392eSAdrien Mazarguil * 2568340392eSAdrien Mazarguil * @return 2578340392eSAdrien Mazarguil * Memory pool where data is located for given mbuf. 2588340392eSAdrien Mazarguil */ 2598340392eSAdrien Mazarguil static struct rte_mempool * 2608340392eSAdrien Mazarguil txq_mb2mp(struct rte_mbuf *buf) 2618340392eSAdrien Mazarguil { 2628340392eSAdrien Mazarguil if (unlikely(RTE_MBUF_INDIRECT(buf))) 2638340392eSAdrien Mazarguil return rte_mbuf_from_indirect(buf)->pool; 2648340392eSAdrien Mazarguil return buf->pool; 2658340392eSAdrien Mazarguil } 2668340392eSAdrien Mazarguil 267491770faSNélio Laranjeiro static inline uint32_t 268491770faSNélio Laranjeiro txq_mp2mr(struct txq *txq, struct rte_mempool *mp) 269491770faSNélio Laranjeiro __attribute__((always_inline)); 270491770faSNélio Laranjeiro 2718340392eSAdrien Mazarguil /** 2722e22920bSAdrien Mazarguil * Get Memory Region (MR) <-> Memory Pool (MP) association from txq->mp2mr[]. 2732e22920bSAdrien Mazarguil * Add MP to txq->mp2mr[] if it's not registered yet. If mp2mr[] is full, 2742e22920bSAdrien Mazarguil * remove an entry first. 2752e22920bSAdrien Mazarguil * 2762e22920bSAdrien Mazarguil * @param txq 2772e22920bSAdrien Mazarguil * Pointer to TX queue structure. 2782e22920bSAdrien Mazarguil * @param[in] mp 2792e22920bSAdrien Mazarguil * Memory Pool for which a Memory Region lkey must be returned. 2802e22920bSAdrien Mazarguil * 2812e22920bSAdrien Mazarguil * @return 2822e22920bSAdrien Mazarguil * mr->lkey on success, (uint32_t)-1 on failure. 2832e22920bSAdrien Mazarguil */ 284491770faSNélio Laranjeiro static inline uint32_t 285d1d914ebSOlivier Matz txq_mp2mr(struct txq *txq, struct rte_mempool *mp) 2862e22920bSAdrien Mazarguil { 2872e22920bSAdrien Mazarguil unsigned int i; 288491770faSNélio Laranjeiro uint32_t lkey = (uint32_t)-1; 2892e22920bSAdrien Mazarguil 2902e22920bSAdrien Mazarguil for (i = 0; (i != RTE_DIM(txq->mp2mr)); ++i) { 2912e22920bSAdrien Mazarguil if (unlikely(txq->mp2mr[i].mp == NULL)) { 2922e22920bSAdrien Mazarguil /* Unknown MP, add a new MR for it. */ 2932e22920bSAdrien Mazarguil break; 2942e22920bSAdrien Mazarguil } 2952e22920bSAdrien Mazarguil if (txq->mp2mr[i].mp == mp) { 2962e22920bSAdrien Mazarguil assert(txq->mp2mr[i].lkey != (uint32_t)-1); 2971d88ba17SNélio Laranjeiro assert(htonl(txq->mp2mr[i].mr->lkey) == 2981d88ba17SNélio Laranjeiro txq->mp2mr[i].lkey); 299491770faSNélio Laranjeiro lkey = txq->mp2mr[i].lkey; 300491770faSNélio Laranjeiro break; 3012e22920bSAdrien Mazarguil } 3022e22920bSAdrien Mazarguil } 303491770faSNélio Laranjeiro if (unlikely(lkey == (uint32_t)-1)) 304491770faSNélio Laranjeiro lkey = txq_mp2mr_reg(txq, mp, i); 305491770faSNélio Laranjeiro return lkey; 3060a3b350dSOlga Shern } 3070a3b350dSOlga Shern 308e192ef80SYaacov Hazan /** 3091d88ba17SNélio Laranjeiro * Ring TX queue doorbell. 3101d88ba17SNélio Laranjeiro * 3111d88ba17SNélio Laranjeiro * @param txq 3121d88ba17SNélio Laranjeiro * Pointer to TX queue structure. 3131d88ba17SNélio Laranjeiro */ 3141d88ba17SNélio Laranjeiro static inline void 3151d88ba17SNélio Laranjeiro mlx5_tx_dbrec(struct txq *txq) 3161d88ba17SNélio Laranjeiro { 3171d88ba17SNélio Laranjeiro uint8_t *dst = (uint8_t *)((uintptr_t)txq->bf_reg + txq->bf_offset); 3181d88ba17SNélio Laranjeiro uint32_t data[4] = { 3191d88ba17SNélio Laranjeiro htonl((txq->wqe_ci << 8) | MLX5_OPCODE_SEND), 3201d88ba17SNélio Laranjeiro htonl(txq->qp_num_8s), 3211d88ba17SNélio Laranjeiro 0, 3221d88ba17SNélio Laranjeiro 0, 3231d88ba17SNélio Laranjeiro }; 3241d88ba17SNélio Laranjeiro rte_wmb(); 3251d88ba17SNélio Laranjeiro *txq->qp_db = htonl(txq->wqe_ci); 3261d88ba17SNélio Laranjeiro /* Ensure ordering between DB record and BF copy. */ 3271d88ba17SNélio Laranjeiro rte_wmb(); 328609a0767SElad Persiko memcpy(dst, (uint8_t *)data, 16); 329d5793daeSNélio Laranjeiro txq->bf_offset ^= (1 << txq->bf_buf_size); 3301d88ba17SNélio Laranjeiro } 331e192ef80SYaacov Hazan 3321d88ba17SNélio Laranjeiro /** 3331d88ba17SNélio Laranjeiro * Prefetch a CQE. 3341d88ba17SNélio Laranjeiro * 3351d88ba17SNélio Laranjeiro * @param txq 3361d88ba17SNélio Laranjeiro * Pointer to TX queue structure. 3371d88ba17SNélio Laranjeiro * @param cqe_ci 3381d88ba17SNélio Laranjeiro * CQE consumer index. 3391d88ba17SNélio Laranjeiro */ 3401d88ba17SNélio Laranjeiro static inline void 3411d88ba17SNélio Laranjeiro tx_prefetch_cqe(struct txq *txq, uint16_t ci) 3421d88ba17SNélio Laranjeiro { 343e2f116eeSNélio Laranjeiro volatile struct mlx5_cqe *cqe; 3441d88ba17SNélio Laranjeiro 345e2f116eeSNélio Laranjeiro cqe = &(*txq->cqes)[ci & ((1 << txq->cqe_n) - 1)]; 3461d88ba17SNélio Laranjeiro rte_prefetch0(cqe); 347e192ef80SYaacov Hazan } 348e192ef80SYaacov Hazan 3492e22920bSAdrien Mazarguil /** 3502e22920bSAdrien Mazarguil * DPDK callback for TX. 3512e22920bSAdrien Mazarguil * 3522e22920bSAdrien Mazarguil * @param dpdk_txq 3532e22920bSAdrien Mazarguil * Generic pointer to TX queue structure. 3542e22920bSAdrien Mazarguil * @param[in] pkts 3552e22920bSAdrien Mazarguil * Packets to transmit. 3562e22920bSAdrien Mazarguil * @param pkts_n 3572e22920bSAdrien Mazarguil * Number of packets in array. 3582e22920bSAdrien Mazarguil * 3592e22920bSAdrien Mazarguil * @return 3602e22920bSAdrien Mazarguil * Number of packets successfully transmitted (<= pkts_n). 3612e22920bSAdrien Mazarguil */ 3622e22920bSAdrien Mazarguil uint16_t 3632e22920bSAdrien Mazarguil mlx5_tx_burst(void *dpdk_txq, struct rte_mbuf **pkts, uint16_t pkts_n) 3642e22920bSAdrien Mazarguil { 3652e22920bSAdrien Mazarguil struct txq *txq = (struct txq *)dpdk_txq; 3661d88ba17SNélio Laranjeiro uint16_t elts_head = txq->elts_head; 367b4b12e55SNélio Laranjeiro const unsigned int elts_n = 1 << txq->elts_n; 368c3d62cc9SAdrien Mazarguil unsigned int i = 0; 369a5bf6af9SAdrien Mazarguil unsigned int j = 0; 3702e22920bSAdrien Mazarguil unsigned int max; 371c305090bSAdrien Mazarguil unsigned int comp; 372*9a7fa9f7SNélio Laranjeiro volatile struct mlx5_wqe_v *wqe = NULL; 3736579c27cSNélio Laranjeiro unsigned int segs_n = 0; 3746579c27cSNélio Laranjeiro struct rte_mbuf *buf = NULL; 3756579c27cSNélio Laranjeiro uint8_t *raw; 3762e22920bSAdrien Mazarguil 3771d88ba17SNélio Laranjeiro if (unlikely(!pkts_n)) 3781d88ba17SNélio Laranjeiro return 0; 3795e1d11ecSNelio Laranjeiro /* Prefetch first packet cacheline. */ 3801d88ba17SNélio Laranjeiro tx_prefetch_cqe(txq, txq->cq_ci); 3811d88ba17SNélio Laranjeiro tx_prefetch_cqe(txq, txq->cq_ci + 1); 382c3d62cc9SAdrien Mazarguil rte_prefetch0(*pkts); 3831d88ba17SNélio Laranjeiro /* Start processing. */ 3842e22920bSAdrien Mazarguil txq_complete(txq); 3854f52bbfbSNelio Laranjeiro max = (elts_n - (elts_head - txq->elts_tail)); 3862e22920bSAdrien Mazarguil if (max > elts_n) 3872e22920bSAdrien Mazarguil max -= elts_n; 388c3d62cc9SAdrien Mazarguil do { 389*9a7fa9f7SNélio Laranjeiro volatile rte_v128u32_t *dseg = NULL; 390573f54afSNélio Laranjeiro uint32_t length; 3918688b2f8SNélio Laranjeiro unsigned int ds = 0; 3926579c27cSNélio Laranjeiro uintptr_t addr; 393*9a7fa9f7SNélio Laranjeiro uint64_t naddr; 394b8fe952eSNélio Laranjeiro uint16_t pkt_inline_sz = MLX5_WQE_DWORD_SIZE; 395b8fe952eSNélio Laranjeiro uint8_t ehdr[2]; 396*9a7fa9f7SNélio Laranjeiro uint8_t cs_flags = 0; 3976579c27cSNélio Laranjeiro #ifdef MLX5_PMD_SOFT_COUNTERS 3986579c27cSNélio Laranjeiro uint32_t total_length = 0; 3996579c27cSNélio Laranjeiro #endif 4002e22920bSAdrien Mazarguil 4016579c27cSNélio Laranjeiro /* first_seg */ 4026579c27cSNélio Laranjeiro buf = *(pkts++); 4036579c27cSNélio Laranjeiro segs_n = buf->nb_segs; 404c3d62cc9SAdrien Mazarguil /* 405c3d62cc9SAdrien Mazarguil * Make sure there is enough room to store this packet and 406c3d62cc9SAdrien Mazarguil * that one ring entry remains unused. 407c3d62cc9SAdrien Mazarguil */ 408a5bf6af9SAdrien Mazarguil assert(segs_n); 409a5bf6af9SAdrien Mazarguil if (max < segs_n + 1) 410c3d62cc9SAdrien Mazarguil break; 411a5bf6af9SAdrien Mazarguil max -= segs_n; 4126579c27cSNélio Laranjeiro --segs_n; 4136579c27cSNélio Laranjeiro if (!segs_n) 414c3d62cc9SAdrien Mazarguil --pkts_n; 415*9a7fa9f7SNélio Laranjeiro wqe = (volatile struct mlx5_wqe_v *) 416fdcb0f53SNélio Laranjeiro tx_mlx5_wqe(txq, txq->wqe_ci); 417fdcb0f53SNélio Laranjeiro rte_prefetch0(tx_mlx5_wqe(txq, txq->wqe_ci + 1)); 4186579c27cSNélio Laranjeiro if (pkts_n > 1) 419c3d62cc9SAdrien Mazarguil rte_prefetch0(*pkts); 4206579c27cSNélio Laranjeiro addr = rte_pktmbuf_mtod(buf, uintptr_t); 4212e22920bSAdrien Mazarguil length = DATA_LEN(buf); 422b8fe952eSNélio Laranjeiro ehdr[0] = ((uint8_t *)addr)[0]; 423b8fe952eSNélio Laranjeiro ehdr[1] = ((uint8_t *)addr)[1]; 4246579c27cSNélio Laranjeiro #ifdef MLX5_PMD_SOFT_COUNTERS 4256579c27cSNélio Laranjeiro total_length = length; 4266579c27cSNélio Laranjeiro #endif 4276579c27cSNélio Laranjeiro assert(length >= MLX5_WQE_DWORD_SIZE); 4282e22920bSAdrien Mazarguil /* Update element. */ 4291d88ba17SNélio Laranjeiro (*txq->elts)[elts_head] = buf; 4306579c27cSNélio Laranjeiro elts_head = (elts_head + 1) & (elts_n - 1); 4315e1d11ecSNelio Laranjeiro /* Prefetch next buffer data. */ 4326579c27cSNélio Laranjeiro if (pkts_n > 1) { 4336579c27cSNélio Laranjeiro volatile void *pkt_addr; 4346579c27cSNélio Laranjeiro 4356579c27cSNélio Laranjeiro pkt_addr = rte_pktmbuf_mtod(*pkts, volatile void *); 4366579c27cSNélio Laranjeiro rte_prefetch0(pkt_addr); 4376579c27cSNélio Laranjeiro } 4381d88ba17SNélio Laranjeiro /* Should we enable HW CKSUM offload */ 4391d88ba17SNélio Laranjeiro if (buf->ol_flags & 4401d88ba17SNélio Laranjeiro (PKT_TX_IP_CKSUM | PKT_TX_TCP_CKSUM | PKT_TX_UDP_CKSUM)) { 441*9a7fa9f7SNélio Laranjeiro cs_flags = MLX5_ETH_WQE_L3_CSUM | MLX5_ETH_WQE_L4_CSUM; 4421d88ba17SNélio Laranjeiro } 443b8fe952eSNélio Laranjeiro raw = ((uint8_t *)(uintptr_t)wqe) + 2 * MLX5_WQE_DWORD_SIZE; 444b8fe952eSNélio Laranjeiro /* 445b8fe952eSNélio Laranjeiro * Start by copying the Ethernet header minus the first two 446b8fe952eSNélio Laranjeiro * bytes which will be appended at the end of the Ethernet 447b8fe952eSNélio Laranjeiro * segment. 448b8fe952eSNélio Laranjeiro */ 449b8fe952eSNélio Laranjeiro memcpy((uint8_t *)raw, ((uint8_t *)addr) + 2, 16); 4506579c27cSNélio Laranjeiro length -= MLX5_WQE_DWORD_SIZE; 4516579c27cSNélio Laranjeiro addr += MLX5_WQE_DWORD_SIZE; 4526579c27cSNélio Laranjeiro /* Replace the Ethernet type by the VLAN if necessary. */ 4536579c27cSNélio Laranjeiro if (buf->ol_flags & PKT_TX_VLAN_PKT) { 4546579c27cSNélio Laranjeiro uint32_t vlan = htonl(0x81000000 | buf->vlan_tci); 4556579c27cSNélio Laranjeiro 456b8fe952eSNélio Laranjeiro memcpy((uint8_t *)(raw + MLX5_WQE_DWORD_SIZE - 2 - 4576579c27cSNélio Laranjeiro sizeof(vlan)), 4586579c27cSNélio Laranjeiro &vlan, sizeof(vlan)); 4596579c27cSNélio Laranjeiro addr -= sizeof(vlan); 4606579c27cSNélio Laranjeiro length += sizeof(vlan); 4616579c27cSNélio Laranjeiro } 4626579c27cSNélio Laranjeiro /* Inline if enough room. */ 4636579c27cSNélio Laranjeiro if (txq->max_inline != 0) { 464fdcb0f53SNélio Laranjeiro uintptr_t end = (uintptr_t) 465fdcb0f53SNélio Laranjeiro (((uintptr_t)txq->wqes) + 466fdcb0f53SNélio Laranjeiro (1 << txq->wqe_n) * MLX5_WQE_SIZE); 4676579c27cSNélio Laranjeiro uint16_t max_inline = 4686579c27cSNélio Laranjeiro txq->max_inline * RTE_CACHE_LINE_SIZE; 4696579c27cSNélio Laranjeiro uint16_t room; 4706579c27cSNélio Laranjeiro 471b8fe952eSNélio Laranjeiro /* 472b8fe952eSNélio Laranjeiro * raw starts two bytes before the boundary to 473b8fe952eSNélio Laranjeiro * continue the above copy of packet data. 474b8fe952eSNélio Laranjeiro */ 475b8fe952eSNélio Laranjeiro raw += MLX5_WQE_DWORD_SIZE - 2; 4766579c27cSNélio Laranjeiro room = end - (uintptr_t)raw; 4776579c27cSNélio Laranjeiro if (room > max_inline) { 4786579c27cSNélio Laranjeiro uintptr_t addr_end = (addr + max_inline) & 4796579c27cSNélio Laranjeiro ~(RTE_CACHE_LINE_SIZE - 1); 4806579c27cSNélio Laranjeiro uint16_t copy_b = ((addr_end - addr) > length) ? 4816579c27cSNélio Laranjeiro length : 4826579c27cSNélio Laranjeiro (addr_end - addr); 4836579c27cSNélio Laranjeiro 4846579c27cSNélio Laranjeiro rte_memcpy((void *)raw, (void *)addr, copy_b); 4856579c27cSNélio Laranjeiro addr += copy_b; 4866579c27cSNélio Laranjeiro length -= copy_b; 4876579c27cSNélio Laranjeiro pkt_inline_sz += copy_b; 4886579c27cSNélio Laranjeiro /* Sanity check. */ 4896579c27cSNélio Laranjeiro assert(addr <= addr_end); 4906579c27cSNélio Laranjeiro } 4916579c27cSNélio Laranjeiro /* 4926579c27cSNélio Laranjeiro * 2 DWORDs consumed by the WQE header + 1 DSEG + 4936579c27cSNélio Laranjeiro * the size of the inline part of the packet. 4946579c27cSNélio Laranjeiro */ 4956579c27cSNélio Laranjeiro ds = 2 + MLX5_WQE_DS(pkt_inline_sz - 2); 4966579c27cSNélio Laranjeiro if (length > 0) { 497*9a7fa9f7SNélio Laranjeiro dseg = (volatile rte_v128u32_t *) 4986579c27cSNélio Laranjeiro ((uintptr_t)wqe + 4996579c27cSNélio Laranjeiro (ds * MLX5_WQE_DWORD_SIZE)); 5006579c27cSNélio Laranjeiro if ((uintptr_t)dseg >= end) 501*9a7fa9f7SNélio Laranjeiro dseg = (volatile rte_v128u32_t *) 502fdcb0f53SNélio Laranjeiro txq->wqes; 5036579c27cSNélio Laranjeiro goto use_dseg; 5046579c27cSNélio Laranjeiro } else if (!segs_n) { 5056579c27cSNélio Laranjeiro goto next_pkt; 5066579c27cSNélio Laranjeiro } else { 5076579c27cSNélio Laranjeiro goto next_seg; 5086579c27cSNélio Laranjeiro } 5096579c27cSNélio Laranjeiro } else { 5106579c27cSNélio Laranjeiro /* 5116579c27cSNélio Laranjeiro * No inline has been done in the packet, only the 5126579c27cSNélio Laranjeiro * Ethernet Header as been stored. 5136579c27cSNélio Laranjeiro */ 514*9a7fa9f7SNélio Laranjeiro dseg = (volatile rte_v128u32_t *) 5156579c27cSNélio Laranjeiro ((uintptr_t)wqe + (3 * MLX5_WQE_DWORD_SIZE)); 5166579c27cSNélio Laranjeiro ds = 3; 5176579c27cSNélio Laranjeiro use_dseg: 5186579c27cSNélio Laranjeiro /* Add the remaining packet as a simple ds. */ 519*9a7fa9f7SNélio Laranjeiro naddr = htonll(addr); 520*9a7fa9f7SNélio Laranjeiro *dseg = (rte_v128u32_t){ 521*9a7fa9f7SNélio Laranjeiro htonl(length), 522*9a7fa9f7SNélio Laranjeiro txq_mp2mr(txq, txq_mb2mp(buf)), 523*9a7fa9f7SNélio Laranjeiro naddr, 524*9a7fa9f7SNélio Laranjeiro naddr >> 32, 5256579c27cSNélio Laranjeiro }; 5266579c27cSNélio Laranjeiro ++ds; 5276579c27cSNélio Laranjeiro if (!segs_n) 5286579c27cSNélio Laranjeiro goto next_pkt; 5296579c27cSNélio Laranjeiro } 5306579c27cSNélio Laranjeiro next_seg: 5316579c27cSNélio Laranjeiro assert(buf); 5326579c27cSNélio Laranjeiro assert(ds); 5336579c27cSNélio Laranjeiro assert(wqe); 534a5bf6af9SAdrien Mazarguil /* 535a5bf6af9SAdrien Mazarguil * Spill on next WQE when the current one does not have 536a5bf6af9SAdrien Mazarguil * enough room left. Size of WQE must a be a multiple 537a5bf6af9SAdrien Mazarguil * of data segment size. 538a5bf6af9SAdrien Mazarguil */ 5398688b2f8SNélio Laranjeiro assert(!(MLX5_WQE_SIZE % MLX5_WQE_DWORD_SIZE)); 5406579c27cSNélio Laranjeiro if (!(ds % (MLX5_WQE_SIZE / MLX5_WQE_DWORD_SIZE))) { 5416579c27cSNélio Laranjeiro unsigned int n = (txq->wqe_ci + ((ds + 3) / 4)) & 5426579c27cSNélio Laranjeiro ((1 << txq->wqe_n) - 1); 5436579c27cSNélio Laranjeiro 544*9a7fa9f7SNélio Laranjeiro dseg = (volatile rte_v128u32_t *) 545fdcb0f53SNélio Laranjeiro tx_mlx5_wqe(txq, n); 546fdcb0f53SNélio Laranjeiro rte_prefetch0(tx_mlx5_wqe(txq, n + 1)); 5476579c27cSNélio Laranjeiro } else { 548a5bf6af9SAdrien Mazarguil ++dseg; 5496579c27cSNélio Laranjeiro } 550a5bf6af9SAdrien Mazarguil ++ds; 551a5bf6af9SAdrien Mazarguil buf = buf->next; 552a5bf6af9SAdrien Mazarguil assert(buf); 5536579c27cSNélio Laranjeiro length = DATA_LEN(buf); 554a5bf6af9SAdrien Mazarguil #ifdef MLX5_PMD_SOFT_COUNTERS 5556579c27cSNélio Laranjeiro total_length += length; 556a5bf6af9SAdrien Mazarguil #endif 5576579c27cSNélio Laranjeiro /* Store segment information. */ 558*9a7fa9f7SNélio Laranjeiro naddr = htonll(rte_pktmbuf_mtod(buf, uintptr_t)); 559*9a7fa9f7SNélio Laranjeiro *dseg = (rte_v128u32_t){ 560*9a7fa9f7SNélio Laranjeiro htonl(length), 561*9a7fa9f7SNélio Laranjeiro txq_mp2mr(txq, txq_mb2mp(buf)), 562*9a7fa9f7SNélio Laranjeiro naddr, 563*9a7fa9f7SNélio Laranjeiro naddr >> 32, 5646579c27cSNélio Laranjeiro }; 5656579c27cSNélio Laranjeiro (*txq->elts)[elts_head] = buf; 5666579c27cSNélio Laranjeiro elts_head = (elts_head + 1) & (elts_n - 1); 567a5bf6af9SAdrien Mazarguil ++j; 5686579c27cSNélio Laranjeiro --segs_n; 5696579c27cSNélio Laranjeiro if (segs_n) 5706579c27cSNélio Laranjeiro goto next_seg; 5716579c27cSNélio Laranjeiro else 5726579c27cSNélio Laranjeiro --pkts_n; 5736579c27cSNélio Laranjeiro next_pkt: 5746579c27cSNélio Laranjeiro ++i; 575b8fe952eSNélio Laranjeiro /* Initialize known and common part of the WQE structure. */ 576*9a7fa9f7SNélio Laranjeiro wqe->ctrl = (rte_v128u32_t){ 577*9a7fa9f7SNélio Laranjeiro htonl((txq->wqe_ci << 8) | MLX5_OPCODE_SEND), 578*9a7fa9f7SNélio Laranjeiro htonl(txq->qp_num_8s | ds), 579*9a7fa9f7SNélio Laranjeiro 0, 580*9a7fa9f7SNélio Laranjeiro 0, 581*9a7fa9f7SNélio Laranjeiro }; 582*9a7fa9f7SNélio Laranjeiro wqe->eseg = (rte_v128u32_t){ 583*9a7fa9f7SNélio Laranjeiro 0, 584*9a7fa9f7SNélio Laranjeiro cs_flags, 585*9a7fa9f7SNélio Laranjeiro 0, 586*9a7fa9f7SNélio Laranjeiro (ehdr[1] << 24) | (ehdr[0] << 16) | 587*9a7fa9f7SNélio Laranjeiro htons(pkt_inline_sz), 588*9a7fa9f7SNélio Laranjeiro }; 5896579c27cSNélio Laranjeiro txq->wqe_ci += (ds + 3) / 4; 59087011737SAdrien Mazarguil #ifdef MLX5_PMD_SOFT_COUNTERS 591573f54afSNélio Laranjeiro /* Increment sent bytes counter. */ 5926579c27cSNélio Laranjeiro txq->stats.obytes += total_length; 59387011737SAdrien Mazarguil #endif 594c3d62cc9SAdrien Mazarguil } while (pkts_n); 5952e22920bSAdrien Mazarguil /* Take a shortcut if nothing must be sent. */ 5962e22920bSAdrien Mazarguil if (unlikely(i == 0)) 5972e22920bSAdrien Mazarguil return 0; 598c305090bSAdrien Mazarguil /* Check whether completion threshold has been reached. */ 599a5bf6af9SAdrien Mazarguil comp = txq->elts_comp + i + j; 600c305090bSAdrien Mazarguil if (comp >= MLX5_TX_COMP_THRESH) { 601*9a7fa9f7SNélio Laranjeiro volatile struct mlx5_wqe_ctrl *w = 602*9a7fa9f7SNélio Laranjeiro (volatile struct mlx5_wqe_ctrl *)wqe; 603*9a7fa9f7SNélio Laranjeiro 604c305090bSAdrien Mazarguil /* Request completion on last WQE. */ 605*9a7fa9f7SNélio Laranjeiro w->ctrl2 = htonl(8); 606c305090bSAdrien Mazarguil /* Save elts_head in unused "immediate" field of WQE. */ 607*9a7fa9f7SNélio Laranjeiro w->ctrl3 = elts_head; 608c305090bSAdrien Mazarguil txq->elts_comp = 0; 609c305090bSAdrien Mazarguil } else { 610c305090bSAdrien Mazarguil txq->elts_comp = comp; 611c305090bSAdrien Mazarguil } 61287011737SAdrien Mazarguil #ifdef MLX5_PMD_SOFT_COUNTERS 61387011737SAdrien Mazarguil /* Increment sent packets counter. */ 61487011737SAdrien Mazarguil txq->stats.opackets += i; 61587011737SAdrien Mazarguil #endif 6162e22920bSAdrien Mazarguil /* Ring QP doorbell. */ 6171d88ba17SNélio Laranjeiro mlx5_tx_dbrec(txq); 6182e22920bSAdrien Mazarguil txq->elts_head = elts_head; 6192e22920bSAdrien Mazarguil return i; 6202e22920bSAdrien Mazarguil } 6212e22920bSAdrien Mazarguil 6222e22920bSAdrien Mazarguil /** 623230189d9SNélio Laranjeiro * Open a MPW session. 624230189d9SNélio Laranjeiro * 625230189d9SNélio Laranjeiro * @param txq 626230189d9SNélio Laranjeiro * Pointer to TX queue structure. 627230189d9SNélio Laranjeiro * @param mpw 628230189d9SNélio Laranjeiro * Pointer to MPW session structure. 629230189d9SNélio Laranjeiro * @param length 630230189d9SNélio Laranjeiro * Packet length. 631230189d9SNélio Laranjeiro */ 632230189d9SNélio Laranjeiro static inline void 633230189d9SNélio Laranjeiro mlx5_mpw_new(struct txq *txq, struct mlx5_mpw *mpw, uint32_t length) 634230189d9SNélio Laranjeiro { 635a821d09dSNélio Laranjeiro uint16_t idx = txq->wqe_ci & ((1 << txq->wqe_n) - 1); 636230189d9SNélio Laranjeiro volatile struct mlx5_wqe_data_seg (*dseg)[MLX5_MPW_DSEG_MAX] = 637230189d9SNélio Laranjeiro (volatile struct mlx5_wqe_data_seg (*)[]) 638fdcb0f53SNélio Laranjeiro tx_mlx5_wqe(txq, idx + 1); 639230189d9SNélio Laranjeiro 640230189d9SNélio Laranjeiro mpw->state = MLX5_MPW_STATE_OPENED; 641230189d9SNélio Laranjeiro mpw->pkts_n = 0; 642230189d9SNélio Laranjeiro mpw->len = length; 643230189d9SNélio Laranjeiro mpw->total_len = 0; 644fdcb0f53SNélio Laranjeiro mpw->wqe = (volatile struct mlx5_wqe *)tx_mlx5_wqe(txq, idx); 6458688b2f8SNélio Laranjeiro mpw->wqe->eseg.mss = htons(length); 6468688b2f8SNélio Laranjeiro mpw->wqe->eseg.inline_hdr_sz = 0; 6478688b2f8SNélio Laranjeiro mpw->wqe->eseg.rsvd0 = 0; 6488688b2f8SNélio Laranjeiro mpw->wqe->eseg.rsvd1 = 0; 6498688b2f8SNélio Laranjeiro mpw->wqe->eseg.rsvd2 = 0; 6508688b2f8SNélio Laranjeiro mpw->wqe->ctrl[0] = htonl((MLX5_OPC_MOD_MPW << 24) | 651c904ae25SNélio Laranjeiro (txq->wqe_ci << 8) | MLX5_OPCODE_TSO); 6528688b2f8SNélio Laranjeiro mpw->wqe->ctrl[2] = 0; 6538688b2f8SNélio Laranjeiro mpw->wqe->ctrl[3] = 0; 6548688b2f8SNélio Laranjeiro mpw->data.dseg[0] = (volatile struct mlx5_wqe_data_seg *) 6558688b2f8SNélio Laranjeiro (((uintptr_t)mpw->wqe) + (2 * MLX5_WQE_DWORD_SIZE)); 6568688b2f8SNélio Laranjeiro mpw->data.dseg[1] = (volatile struct mlx5_wqe_data_seg *) 6578688b2f8SNélio Laranjeiro (((uintptr_t)mpw->wqe) + (3 * MLX5_WQE_DWORD_SIZE)); 658230189d9SNélio Laranjeiro mpw->data.dseg[2] = &(*dseg)[0]; 659230189d9SNélio Laranjeiro mpw->data.dseg[3] = &(*dseg)[1]; 660230189d9SNélio Laranjeiro mpw->data.dseg[4] = &(*dseg)[2]; 661230189d9SNélio Laranjeiro } 662230189d9SNélio Laranjeiro 663230189d9SNélio Laranjeiro /** 664230189d9SNélio Laranjeiro * Close a MPW session. 665230189d9SNélio Laranjeiro * 666230189d9SNélio Laranjeiro * @param txq 667230189d9SNélio Laranjeiro * Pointer to TX queue structure. 668230189d9SNélio Laranjeiro * @param mpw 669230189d9SNélio Laranjeiro * Pointer to MPW session structure. 670230189d9SNélio Laranjeiro */ 671230189d9SNélio Laranjeiro static inline void 672230189d9SNélio Laranjeiro mlx5_mpw_close(struct txq *txq, struct mlx5_mpw *mpw) 673230189d9SNélio Laranjeiro { 674230189d9SNélio Laranjeiro unsigned int num = mpw->pkts_n; 675230189d9SNélio Laranjeiro 676230189d9SNélio Laranjeiro /* 677230189d9SNélio Laranjeiro * Store size in multiple of 16 bytes. Control and Ethernet segments 678230189d9SNélio Laranjeiro * count as 2. 679230189d9SNélio Laranjeiro */ 6808688b2f8SNélio Laranjeiro mpw->wqe->ctrl[1] = htonl(txq->qp_num_8s | (2 + num)); 681230189d9SNélio Laranjeiro mpw->state = MLX5_MPW_STATE_CLOSED; 682230189d9SNélio Laranjeiro if (num < 3) 683230189d9SNélio Laranjeiro ++txq->wqe_ci; 684230189d9SNélio Laranjeiro else 685230189d9SNélio Laranjeiro txq->wqe_ci += 2; 686fdcb0f53SNélio Laranjeiro rte_prefetch0(tx_mlx5_wqe(txq, txq->wqe_ci)); 687fdcb0f53SNélio Laranjeiro rte_prefetch0(tx_mlx5_wqe(txq, txq->wqe_ci + 1)); 688230189d9SNélio Laranjeiro } 689230189d9SNélio Laranjeiro 690230189d9SNélio Laranjeiro /** 691230189d9SNélio Laranjeiro * DPDK callback for TX with MPW support. 692230189d9SNélio Laranjeiro * 693230189d9SNélio Laranjeiro * @param dpdk_txq 694230189d9SNélio Laranjeiro * Generic pointer to TX queue structure. 695230189d9SNélio Laranjeiro * @param[in] pkts 696230189d9SNélio Laranjeiro * Packets to transmit. 697230189d9SNélio Laranjeiro * @param pkts_n 698230189d9SNélio Laranjeiro * Number of packets in array. 699230189d9SNélio Laranjeiro * 700230189d9SNélio Laranjeiro * @return 701230189d9SNélio Laranjeiro * Number of packets successfully transmitted (<= pkts_n). 702230189d9SNélio Laranjeiro */ 703230189d9SNélio Laranjeiro uint16_t 704230189d9SNélio Laranjeiro mlx5_tx_burst_mpw(void *dpdk_txq, struct rte_mbuf **pkts, uint16_t pkts_n) 705230189d9SNélio Laranjeiro { 706230189d9SNélio Laranjeiro struct txq *txq = (struct txq *)dpdk_txq; 707230189d9SNélio Laranjeiro uint16_t elts_head = txq->elts_head; 708b4b12e55SNélio Laranjeiro const unsigned int elts_n = 1 << txq->elts_n; 709c3d62cc9SAdrien Mazarguil unsigned int i = 0; 710a5bf6af9SAdrien Mazarguil unsigned int j = 0; 711230189d9SNélio Laranjeiro unsigned int max; 712230189d9SNélio Laranjeiro unsigned int comp; 713230189d9SNélio Laranjeiro struct mlx5_mpw mpw = { 714230189d9SNélio Laranjeiro .state = MLX5_MPW_STATE_CLOSED, 715230189d9SNélio Laranjeiro }; 716230189d9SNélio Laranjeiro 717c3d62cc9SAdrien Mazarguil if (unlikely(!pkts_n)) 718c3d62cc9SAdrien Mazarguil return 0; 719230189d9SNélio Laranjeiro /* Prefetch first packet cacheline. */ 720230189d9SNélio Laranjeiro tx_prefetch_cqe(txq, txq->cq_ci); 721fdcb0f53SNélio Laranjeiro rte_prefetch0(tx_mlx5_wqe(txq, txq->wqe_ci)); 722fdcb0f53SNélio Laranjeiro rte_prefetch0(tx_mlx5_wqe(txq, txq->wqe_ci + 1)); 723230189d9SNélio Laranjeiro /* Start processing. */ 724230189d9SNélio Laranjeiro txq_complete(txq); 725230189d9SNélio Laranjeiro max = (elts_n - (elts_head - txq->elts_tail)); 726230189d9SNélio Laranjeiro if (max > elts_n) 727230189d9SNélio Laranjeiro max -= elts_n; 728c3d62cc9SAdrien Mazarguil do { 729a5bf6af9SAdrien Mazarguil struct rte_mbuf *buf = *(pkts++); 730c3d62cc9SAdrien Mazarguil unsigned int elts_head_next; 731230189d9SNélio Laranjeiro uint32_t length; 732a5bf6af9SAdrien Mazarguil unsigned int segs_n = buf->nb_segs; 733230189d9SNélio Laranjeiro uint32_t cs_flags = 0; 734230189d9SNélio Laranjeiro 735c3d62cc9SAdrien Mazarguil /* 736c3d62cc9SAdrien Mazarguil * Make sure there is enough room to store this packet and 737c3d62cc9SAdrien Mazarguil * that one ring entry remains unused. 738c3d62cc9SAdrien Mazarguil */ 739a5bf6af9SAdrien Mazarguil assert(segs_n); 740a5bf6af9SAdrien Mazarguil if (max < segs_n + 1) 741c3d62cc9SAdrien Mazarguil break; 742a5bf6af9SAdrien Mazarguil /* Do not bother with large packets MPW cannot handle. */ 743a5bf6af9SAdrien Mazarguil if (segs_n > MLX5_MPW_DSEG_MAX) 744a5bf6af9SAdrien Mazarguil break; 745a5bf6af9SAdrien Mazarguil max -= segs_n; 746c3d62cc9SAdrien Mazarguil --pkts_n; 747230189d9SNélio Laranjeiro /* Should we enable HW CKSUM offload */ 748230189d9SNélio Laranjeiro if (buf->ol_flags & 749230189d9SNélio Laranjeiro (PKT_TX_IP_CKSUM | PKT_TX_TCP_CKSUM | PKT_TX_UDP_CKSUM)) 750230189d9SNélio Laranjeiro cs_flags = MLX5_ETH_WQE_L3_CSUM | MLX5_ETH_WQE_L4_CSUM; 751a5bf6af9SAdrien Mazarguil /* Retrieve packet information. */ 752a5bf6af9SAdrien Mazarguil length = PKT_LEN(buf); 753a5bf6af9SAdrien Mazarguil assert(length); 754230189d9SNélio Laranjeiro /* Start new session if packet differs. */ 755230189d9SNélio Laranjeiro if ((mpw.state == MLX5_MPW_STATE_OPENED) && 756230189d9SNélio Laranjeiro ((mpw.len != length) || 757a5bf6af9SAdrien Mazarguil (segs_n != 1) || 7588688b2f8SNélio Laranjeiro (mpw.wqe->eseg.cs_flags != cs_flags))) 759230189d9SNélio Laranjeiro mlx5_mpw_close(txq, &mpw); 760230189d9SNélio Laranjeiro if (mpw.state == MLX5_MPW_STATE_CLOSED) { 761230189d9SNélio Laranjeiro mlx5_mpw_new(txq, &mpw, length); 7628688b2f8SNélio Laranjeiro mpw.wqe->eseg.cs_flags = cs_flags; 763230189d9SNélio Laranjeiro } 764a5bf6af9SAdrien Mazarguil /* Multi-segment packets must be alone in their MPW. */ 765a5bf6af9SAdrien Mazarguil assert((segs_n == 1) || (mpw.pkts_n == 0)); 766a5bf6af9SAdrien Mazarguil #if defined(MLX5_PMD_SOFT_COUNTERS) || !defined(NDEBUG) 767a5bf6af9SAdrien Mazarguil length = 0; 768a5bf6af9SAdrien Mazarguil #endif 769a5bf6af9SAdrien Mazarguil do { 770a5bf6af9SAdrien Mazarguil volatile struct mlx5_wqe_data_seg *dseg; 771a5bf6af9SAdrien Mazarguil uintptr_t addr; 772a5bf6af9SAdrien Mazarguil 773a5bf6af9SAdrien Mazarguil elts_head_next = (elts_head + 1) & (elts_n - 1); 774a5bf6af9SAdrien Mazarguil assert(buf); 775a5bf6af9SAdrien Mazarguil (*txq->elts)[elts_head] = buf; 776230189d9SNélio Laranjeiro dseg = mpw.data.dseg[mpw.pkts_n]; 777a5bf6af9SAdrien Mazarguil addr = rte_pktmbuf_mtod(buf, uintptr_t); 778230189d9SNélio Laranjeiro *dseg = (struct mlx5_wqe_data_seg){ 779a5bf6af9SAdrien Mazarguil .byte_count = htonl(DATA_LEN(buf)), 780230189d9SNélio Laranjeiro .lkey = txq_mp2mr(txq, txq_mb2mp(buf)), 781230189d9SNélio Laranjeiro .addr = htonll(addr), 782230189d9SNélio Laranjeiro }; 783a5bf6af9SAdrien Mazarguil elts_head = elts_head_next; 784a5bf6af9SAdrien Mazarguil #if defined(MLX5_PMD_SOFT_COUNTERS) || !defined(NDEBUG) 785a5bf6af9SAdrien Mazarguil length += DATA_LEN(buf); 786a5bf6af9SAdrien Mazarguil #endif 787a5bf6af9SAdrien Mazarguil buf = buf->next; 788230189d9SNélio Laranjeiro ++mpw.pkts_n; 789a5bf6af9SAdrien Mazarguil ++j; 790a5bf6af9SAdrien Mazarguil } while (--segs_n); 791a5bf6af9SAdrien Mazarguil assert(length == mpw.len); 792230189d9SNélio Laranjeiro if (mpw.pkts_n == MLX5_MPW_DSEG_MAX) 793230189d9SNélio Laranjeiro mlx5_mpw_close(txq, &mpw); 794230189d9SNélio Laranjeiro elts_head = elts_head_next; 795230189d9SNélio Laranjeiro #ifdef MLX5_PMD_SOFT_COUNTERS 796230189d9SNélio Laranjeiro /* Increment sent bytes counter. */ 797230189d9SNélio Laranjeiro txq->stats.obytes += length; 798230189d9SNélio Laranjeiro #endif 799c3d62cc9SAdrien Mazarguil ++i; 800c3d62cc9SAdrien Mazarguil } while (pkts_n); 801230189d9SNélio Laranjeiro /* Take a shortcut if nothing must be sent. */ 802230189d9SNélio Laranjeiro if (unlikely(i == 0)) 803230189d9SNélio Laranjeiro return 0; 804230189d9SNélio Laranjeiro /* Check whether completion threshold has been reached. */ 805a5bf6af9SAdrien Mazarguil /* "j" includes both packets and segments. */ 806a5bf6af9SAdrien Mazarguil comp = txq->elts_comp + j; 807230189d9SNélio Laranjeiro if (comp >= MLX5_TX_COMP_THRESH) { 8088688b2f8SNélio Laranjeiro volatile struct mlx5_wqe *wqe = mpw.wqe; 809230189d9SNélio Laranjeiro 810230189d9SNélio Laranjeiro /* Request completion on last WQE. */ 8118688b2f8SNélio Laranjeiro wqe->ctrl[2] = htonl(8); 812230189d9SNélio Laranjeiro /* Save elts_head in unused "immediate" field of WQE. */ 8138688b2f8SNélio Laranjeiro wqe->ctrl[3] = elts_head; 814230189d9SNélio Laranjeiro txq->elts_comp = 0; 815230189d9SNélio Laranjeiro } else { 816230189d9SNélio Laranjeiro txq->elts_comp = comp; 817230189d9SNélio Laranjeiro } 818230189d9SNélio Laranjeiro #ifdef MLX5_PMD_SOFT_COUNTERS 819230189d9SNélio Laranjeiro /* Increment sent packets counter. */ 820230189d9SNélio Laranjeiro txq->stats.opackets += i; 821230189d9SNélio Laranjeiro #endif 822230189d9SNélio Laranjeiro /* Ring QP doorbell. */ 823230189d9SNélio Laranjeiro if (mpw.state == MLX5_MPW_STATE_OPENED) 824230189d9SNélio Laranjeiro mlx5_mpw_close(txq, &mpw); 825230189d9SNélio Laranjeiro mlx5_tx_dbrec(txq); 826230189d9SNélio Laranjeiro txq->elts_head = elts_head; 827230189d9SNélio Laranjeiro return i; 828230189d9SNélio Laranjeiro } 829230189d9SNélio Laranjeiro 830230189d9SNélio Laranjeiro /** 831230189d9SNélio Laranjeiro * Open a MPW inline session. 832230189d9SNélio Laranjeiro * 833230189d9SNélio Laranjeiro * @param txq 834230189d9SNélio Laranjeiro * Pointer to TX queue structure. 835230189d9SNélio Laranjeiro * @param mpw 836230189d9SNélio Laranjeiro * Pointer to MPW session structure. 837230189d9SNélio Laranjeiro * @param length 838230189d9SNélio Laranjeiro * Packet length. 839230189d9SNélio Laranjeiro */ 840230189d9SNélio Laranjeiro static inline void 841230189d9SNélio Laranjeiro mlx5_mpw_inline_new(struct txq *txq, struct mlx5_mpw *mpw, uint32_t length) 842230189d9SNélio Laranjeiro { 843a821d09dSNélio Laranjeiro uint16_t idx = txq->wqe_ci & ((1 << txq->wqe_n) - 1); 8448688b2f8SNélio Laranjeiro struct mlx5_wqe_inl_small *inl; 845230189d9SNélio Laranjeiro 846230189d9SNélio Laranjeiro mpw->state = MLX5_MPW_INL_STATE_OPENED; 847230189d9SNélio Laranjeiro mpw->pkts_n = 0; 848230189d9SNélio Laranjeiro mpw->len = length; 849230189d9SNélio Laranjeiro mpw->total_len = 0; 850fdcb0f53SNélio Laranjeiro mpw->wqe = (volatile struct mlx5_wqe *)tx_mlx5_wqe(txq, idx); 8518688b2f8SNélio Laranjeiro mpw->wqe->ctrl[0] = htonl((MLX5_OPC_MOD_MPW << 24) | 852230189d9SNélio Laranjeiro (txq->wqe_ci << 8) | 853c904ae25SNélio Laranjeiro MLX5_OPCODE_TSO); 8548688b2f8SNélio Laranjeiro mpw->wqe->ctrl[2] = 0; 8558688b2f8SNélio Laranjeiro mpw->wqe->ctrl[3] = 0; 8568688b2f8SNélio Laranjeiro mpw->wqe->eseg.mss = htons(length); 8578688b2f8SNélio Laranjeiro mpw->wqe->eseg.inline_hdr_sz = 0; 8588688b2f8SNélio Laranjeiro mpw->wqe->eseg.cs_flags = 0; 8598688b2f8SNélio Laranjeiro mpw->wqe->eseg.rsvd0 = 0; 8608688b2f8SNélio Laranjeiro mpw->wqe->eseg.rsvd1 = 0; 8618688b2f8SNélio Laranjeiro mpw->wqe->eseg.rsvd2 = 0; 8628688b2f8SNélio Laranjeiro inl = (struct mlx5_wqe_inl_small *) 8638688b2f8SNélio Laranjeiro (((uintptr_t)mpw->wqe) + 2 * MLX5_WQE_DWORD_SIZE); 8648688b2f8SNélio Laranjeiro mpw->data.raw = (uint8_t *)&inl->raw; 865230189d9SNélio Laranjeiro } 866230189d9SNélio Laranjeiro 867230189d9SNélio Laranjeiro /** 868230189d9SNélio Laranjeiro * Close a MPW inline session. 869230189d9SNélio Laranjeiro * 870230189d9SNélio Laranjeiro * @param txq 871230189d9SNélio Laranjeiro * Pointer to TX queue structure. 872230189d9SNélio Laranjeiro * @param mpw 873230189d9SNélio Laranjeiro * Pointer to MPW session structure. 874230189d9SNélio Laranjeiro */ 875230189d9SNélio Laranjeiro static inline void 876230189d9SNélio Laranjeiro mlx5_mpw_inline_close(struct txq *txq, struct mlx5_mpw *mpw) 877230189d9SNélio Laranjeiro { 878230189d9SNélio Laranjeiro unsigned int size; 8798688b2f8SNélio Laranjeiro struct mlx5_wqe_inl_small *inl = (struct mlx5_wqe_inl_small *) 8808688b2f8SNélio Laranjeiro (((uintptr_t)mpw->wqe) + (2 * MLX5_WQE_DWORD_SIZE)); 881230189d9SNélio Laranjeiro 8828688b2f8SNélio Laranjeiro size = MLX5_WQE_SIZE - MLX5_MWQE64_INL_DATA + mpw->total_len; 883230189d9SNélio Laranjeiro /* 884230189d9SNélio Laranjeiro * Store size in multiple of 16 bytes. Control and Ethernet segments 885230189d9SNélio Laranjeiro * count as 2. 886230189d9SNélio Laranjeiro */ 8878688b2f8SNélio Laranjeiro mpw->wqe->ctrl[1] = htonl(txq->qp_num_8s | MLX5_WQE_DS(size)); 888230189d9SNélio Laranjeiro mpw->state = MLX5_MPW_STATE_CLOSED; 8898688b2f8SNélio Laranjeiro inl->byte_cnt = htonl(mpw->total_len | MLX5_INLINE_SEG); 8908688b2f8SNélio Laranjeiro txq->wqe_ci += (size + (MLX5_WQE_SIZE - 1)) / MLX5_WQE_SIZE; 891230189d9SNélio Laranjeiro } 892230189d9SNélio Laranjeiro 893230189d9SNélio Laranjeiro /** 894230189d9SNélio Laranjeiro * DPDK callback for TX with MPW inline support. 895230189d9SNélio Laranjeiro * 896230189d9SNélio Laranjeiro * @param dpdk_txq 897230189d9SNélio Laranjeiro * Generic pointer to TX queue structure. 898230189d9SNélio Laranjeiro * @param[in] pkts 899230189d9SNélio Laranjeiro * Packets to transmit. 900230189d9SNélio Laranjeiro * @param pkts_n 901230189d9SNélio Laranjeiro * Number of packets in array. 902230189d9SNélio Laranjeiro * 903230189d9SNélio Laranjeiro * @return 904230189d9SNélio Laranjeiro * Number of packets successfully transmitted (<= pkts_n). 905230189d9SNélio Laranjeiro */ 906230189d9SNélio Laranjeiro uint16_t 907230189d9SNélio Laranjeiro mlx5_tx_burst_mpw_inline(void *dpdk_txq, struct rte_mbuf **pkts, 908230189d9SNélio Laranjeiro uint16_t pkts_n) 909230189d9SNélio Laranjeiro { 910230189d9SNélio Laranjeiro struct txq *txq = (struct txq *)dpdk_txq; 911230189d9SNélio Laranjeiro uint16_t elts_head = txq->elts_head; 912b4b12e55SNélio Laranjeiro const unsigned int elts_n = 1 << txq->elts_n; 913c3d62cc9SAdrien Mazarguil unsigned int i = 0; 914a5bf6af9SAdrien Mazarguil unsigned int j = 0; 915230189d9SNélio Laranjeiro unsigned int max; 916230189d9SNélio Laranjeiro unsigned int comp; 9170e8679fcSNélio Laranjeiro unsigned int inline_room = txq->max_inline * RTE_CACHE_LINE_SIZE; 918230189d9SNélio Laranjeiro struct mlx5_mpw mpw = { 919230189d9SNélio Laranjeiro .state = MLX5_MPW_STATE_CLOSED, 920230189d9SNélio Laranjeiro }; 921230189d9SNélio Laranjeiro 922c3d62cc9SAdrien Mazarguil if (unlikely(!pkts_n)) 923c3d62cc9SAdrien Mazarguil return 0; 924230189d9SNélio Laranjeiro /* Prefetch first packet cacheline. */ 925230189d9SNélio Laranjeiro tx_prefetch_cqe(txq, txq->cq_ci); 926fdcb0f53SNélio Laranjeiro rte_prefetch0(tx_mlx5_wqe(txq, txq->wqe_ci)); 927fdcb0f53SNélio Laranjeiro rte_prefetch0(tx_mlx5_wqe(txq, txq->wqe_ci + 1)); 928230189d9SNélio Laranjeiro /* Start processing. */ 929230189d9SNélio Laranjeiro txq_complete(txq); 930230189d9SNélio Laranjeiro max = (elts_n - (elts_head - txq->elts_tail)); 931230189d9SNélio Laranjeiro if (max > elts_n) 932230189d9SNélio Laranjeiro max -= elts_n; 933c3d62cc9SAdrien Mazarguil do { 934a5bf6af9SAdrien Mazarguil struct rte_mbuf *buf = *(pkts++); 935c3d62cc9SAdrien Mazarguil unsigned int elts_head_next; 936230189d9SNélio Laranjeiro uintptr_t addr; 937230189d9SNélio Laranjeiro uint32_t length; 938a5bf6af9SAdrien Mazarguil unsigned int segs_n = buf->nb_segs; 939230189d9SNélio Laranjeiro uint32_t cs_flags = 0; 940230189d9SNélio Laranjeiro 941c3d62cc9SAdrien Mazarguil /* 942c3d62cc9SAdrien Mazarguil * Make sure there is enough room to store this packet and 943c3d62cc9SAdrien Mazarguil * that one ring entry remains unused. 944c3d62cc9SAdrien Mazarguil */ 945a5bf6af9SAdrien Mazarguil assert(segs_n); 946a5bf6af9SAdrien Mazarguil if (max < segs_n + 1) 947c3d62cc9SAdrien Mazarguil break; 948a5bf6af9SAdrien Mazarguil /* Do not bother with large packets MPW cannot handle. */ 949a5bf6af9SAdrien Mazarguil if (segs_n > MLX5_MPW_DSEG_MAX) 950a5bf6af9SAdrien Mazarguil break; 951a5bf6af9SAdrien Mazarguil max -= segs_n; 952c3d62cc9SAdrien Mazarguil --pkts_n; 953230189d9SNélio Laranjeiro /* Should we enable HW CKSUM offload */ 954230189d9SNélio Laranjeiro if (buf->ol_flags & 955230189d9SNélio Laranjeiro (PKT_TX_IP_CKSUM | PKT_TX_TCP_CKSUM | PKT_TX_UDP_CKSUM)) 956230189d9SNélio Laranjeiro cs_flags = MLX5_ETH_WQE_L3_CSUM | MLX5_ETH_WQE_L4_CSUM; 957a5bf6af9SAdrien Mazarguil /* Retrieve packet information. */ 958a5bf6af9SAdrien Mazarguil length = PKT_LEN(buf); 959230189d9SNélio Laranjeiro /* Start new session if packet differs. */ 960230189d9SNélio Laranjeiro if (mpw.state == MLX5_MPW_STATE_OPENED) { 961230189d9SNélio Laranjeiro if ((mpw.len != length) || 962a5bf6af9SAdrien Mazarguil (segs_n != 1) || 9638688b2f8SNélio Laranjeiro (mpw.wqe->eseg.cs_flags != cs_flags)) 964230189d9SNélio Laranjeiro mlx5_mpw_close(txq, &mpw); 965230189d9SNélio Laranjeiro } else if (mpw.state == MLX5_MPW_INL_STATE_OPENED) { 966230189d9SNélio Laranjeiro if ((mpw.len != length) || 967a5bf6af9SAdrien Mazarguil (segs_n != 1) || 968230189d9SNélio Laranjeiro (length > inline_room) || 9698688b2f8SNélio Laranjeiro (mpw.wqe->eseg.cs_flags != cs_flags)) { 970230189d9SNélio Laranjeiro mlx5_mpw_inline_close(txq, &mpw); 9710e8679fcSNélio Laranjeiro inline_room = 9720e8679fcSNélio Laranjeiro txq->max_inline * RTE_CACHE_LINE_SIZE; 973230189d9SNélio Laranjeiro } 974230189d9SNélio Laranjeiro } 975230189d9SNélio Laranjeiro if (mpw.state == MLX5_MPW_STATE_CLOSED) { 976a5bf6af9SAdrien Mazarguil if ((segs_n != 1) || 977a5bf6af9SAdrien Mazarguil (length > inline_room)) { 978230189d9SNélio Laranjeiro mlx5_mpw_new(txq, &mpw, length); 9798688b2f8SNélio Laranjeiro mpw.wqe->eseg.cs_flags = cs_flags; 980230189d9SNélio Laranjeiro } else { 981230189d9SNélio Laranjeiro mlx5_mpw_inline_new(txq, &mpw, length); 9828688b2f8SNélio Laranjeiro mpw.wqe->eseg.cs_flags = cs_flags; 983230189d9SNélio Laranjeiro } 984230189d9SNélio Laranjeiro } 985a5bf6af9SAdrien Mazarguil /* Multi-segment packets must be alone in their MPW. */ 986a5bf6af9SAdrien Mazarguil assert((segs_n == 1) || (mpw.pkts_n == 0)); 987230189d9SNélio Laranjeiro if (mpw.state == MLX5_MPW_STATE_OPENED) { 9880e8679fcSNélio Laranjeiro assert(inline_room == 9890e8679fcSNélio Laranjeiro txq->max_inline * RTE_CACHE_LINE_SIZE); 990a5bf6af9SAdrien Mazarguil #if defined(MLX5_PMD_SOFT_COUNTERS) || !defined(NDEBUG) 991a5bf6af9SAdrien Mazarguil length = 0; 992a5bf6af9SAdrien Mazarguil #endif 993a5bf6af9SAdrien Mazarguil do { 994230189d9SNélio Laranjeiro volatile struct mlx5_wqe_data_seg *dseg; 995230189d9SNélio Laranjeiro 996a5bf6af9SAdrien Mazarguil elts_head_next = 997a5bf6af9SAdrien Mazarguil (elts_head + 1) & (elts_n - 1); 998a5bf6af9SAdrien Mazarguil assert(buf); 999a5bf6af9SAdrien Mazarguil (*txq->elts)[elts_head] = buf; 1000230189d9SNélio Laranjeiro dseg = mpw.data.dseg[mpw.pkts_n]; 1001a5bf6af9SAdrien Mazarguil addr = rte_pktmbuf_mtod(buf, uintptr_t); 1002230189d9SNélio Laranjeiro *dseg = (struct mlx5_wqe_data_seg){ 1003a5bf6af9SAdrien Mazarguil .byte_count = htonl(DATA_LEN(buf)), 1004230189d9SNélio Laranjeiro .lkey = txq_mp2mr(txq, txq_mb2mp(buf)), 1005230189d9SNélio Laranjeiro .addr = htonll(addr), 1006230189d9SNélio Laranjeiro }; 1007a5bf6af9SAdrien Mazarguil elts_head = elts_head_next; 1008a5bf6af9SAdrien Mazarguil #if defined(MLX5_PMD_SOFT_COUNTERS) || !defined(NDEBUG) 1009a5bf6af9SAdrien Mazarguil length += DATA_LEN(buf); 1010a5bf6af9SAdrien Mazarguil #endif 1011a5bf6af9SAdrien Mazarguil buf = buf->next; 1012230189d9SNélio Laranjeiro ++mpw.pkts_n; 1013a5bf6af9SAdrien Mazarguil ++j; 1014a5bf6af9SAdrien Mazarguil } while (--segs_n); 1015a5bf6af9SAdrien Mazarguil assert(length == mpw.len); 1016230189d9SNélio Laranjeiro if (mpw.pkts_n == MLX5_MPW_DSEG_MAX) 1017230189d9SNélio Laranjeiro mlx5_mpw_close(txq, &mpw); 1018230189d9SNélio Laranjeiro } else { 1019230189d9SNélio Laranjeiro unsigned int max; 1020230189d9SNélio Laranjeiro 1021230189d9SNélio Laranjeiro assert(mpw.state == MLX5_MPW_INL_STATE_OPENED); 1022230189d9SNélio Laranjeiro assert(length <= inline_room); 1023a5bf6af9SAdrien Mazarguil assert(length == DATA_LEN(buf)); 1024a5bf6af9SAdrien Mazarguil elts_head_next = (elts_head + 1) & (elts_n - 1); 1025a5bf6af9SAdrien Mazarguil addr = rte_pktmbuf_mtod(buf, uintptr_t); 1026a5bf6af9SAdrien Mazarguil (*txq->elts)[elts_head] = buf; 1027230189d9SNélio Laranjeiro /* Maximum number of bytes before wrapping. */ 1028fdcb0f53SNélio Laranjeiro max = ((((uintptr_t)(txq->wqes)) + 1029fdcb0f53SNélio Laranjeiro (1 << txq->wqe_n) * 1030fdcb0f53SNélio Laranjeiro MLX5_WQE_SIZE) - 1031230189d9SNélio Laranjeiro (uintptr_t)mpw.data.raw); 1032230189d9SNélio Laranjeiro if (length > max) { 1033230189d9SNélio Laranjeiro rte_memcpy((void *)(uintptr_t)mpw.data.raw, 1034230189d9SNélio Laranjeiro (void *)addr, 1035230189d9SNélio Laranjeiro max); 1036fdcb0f53SNélio Laranjeiro mpw.data.raw = (volatile void *)txq->wqes; 1037230189d9SNélio Laranjeiro rte_memcpy((void *)(uintptr_t)mpw.data.raw, 1038230189d9SNélio Laranjeiro (void *)(addr + max), 1039230189d9SNélio Laranjeiro length - max); 1040230189d9SNélio Laranjeiro mpw.data.raw += length - max; 1041230189d9SNélio Laranjeiro } else { 1042230189d9SNélio Laranjeiro rte_memcpy((void *)(uintptr_t)mpw.data.raw, 1043230189d9SNélio Laranjeiro (void *)addr, 1044230189d9SNélio Laranjeiro length); 1045230189d9SNélio Laranjeiro mpw.data.raw += length; 1046230189d9SNélio Laranjeiro } 1047230189d9SNélio Laranjeiro if ((uintptr_t)mpw.data.raw == 1048fdcb0f53SNélio Laranjeiro (uintptr_t)tx_mlx5_wqe(txq, 1 << txq->wqe_n)) 1049fdcb0f53SNélio Laranjeiro mpw.data.raw = (volatile void *)txq->wqes; 1050230189d9SNélio Laranjeiro ++mpw.pkts_n; 1051a5bf6af9SAdrien Mazarguil ++j; 1052230189d9SNélio Laranjeiro if (mpw.pkts_n == MLX5_MPW_DSEG_MAX) { 1053230189d9SNélio Laranjeiro mlx5_mpw_inline_close(txq, &mpw); 10540e8679fcSNélio Laranjeiro inline_room = 10550e8679fcSNélio Laranjeiro txq->max_inline * RTE_CACHE_LINE_SIZE; 1056230189d9SNélio Laranjeiro } else { 1057230189d9SNélio Laranjeiro inline_room -= length; 1058230189d9SNélio Laranjeiro } 1059230189d9SNélio Laranjeiro } 1060230189d9SNélio Laranjeiro mpw.total_len += length; 1061230189d9SNélio Laranjeiro elts_head = elts_head_next; 1062230189d9SNélio Laranjeiro #ifdef MLX5_PMD_SOFT_COUNTERS 1063230189d9SNélio Laranjeiro /* Increment sent bytes counter. */ 1064230189d9SNélio Laranjeiro txq->stats.obytes += length; 1065230189d9SNélio Laranjeiro #endif 1066c3d62cc9SAdrien Mazarguil ++i; 1067c3d62cc9SAdrien Mazarguil } while (pkts_n); 1068230189d9SNélio Laranjeiro /* Take a shortcut if nothing must be sent. */ 1069230189d9SNélio Laranjeiro if (unlikely(i == 0)) 1070230189d9SNélio Laranjeiro return 0; 1071230189d9SNélio Laranjeiro /* Check whether completion threshold has been reached. */ 1072a5bf6af9SAdrien Mazarguil /* "j" includes both packets and segments. */ 1073a5bf6af9SAdrien Mazarguil comp = txq->elts_comp + j; 1074230189d9SNélio Laranjeiro if (comp >= MLX5_TX_COMP_THRESH) { 10758688b2f8SNélio Laranjeiro volatile struct mlx5_wqe *wqe = mpw.wqe; 1076230189d9SNélio Laranjeiro 1077230189d9SNélio Laranjeiro /* Request completion on last WQE. */ 10788688b2f8SNélio Laranjeiro wqe->ctrl[2] = htonl(8); 1079230189d9SNélio Laranjeiro /* Save elts_head in unused "immediate" field of WQE. */ 10808688b2f8SNélio Laranjeiro wqe->ctrl[3] = elts_head; 1081230189d9SNélio Laranjeiro txq->elts_comp = 0; 1082230189d9SNélio Laranjeiro } else { 1083230189d9SNélio Laranjeiro txq->elts_comp = comp; 1084230189d9SNélio Laranjeiro } 1085230189d9SNélio Laranjeiro #ifdef MLX5_PMD_SOFT_COUNTERS 1086230189d9SNélio Laranjeiro /* Increment sent packets counter. */ 1087230189d9SNélio Laranjeiro txq->stats.opackets += i; 1088230189d9SNélio Laranjeiro #endif 1089230189d9SNélio Laranjeiro /* Ring QP doorbell. */ 1090230189d9SNélio Laranjeiro if (mpw.state == MLX5_MPW_INL_STATE_OPENED) 1091230189d9SNélio Laranjeiro mlx5_mpw_inline_close(txq, &mpw); 1092230189d9SNélio Laranjeiro else if (mpw.state == MLX5_MPW_STATE_OPENED) 1093230189d9SNélio Laranjeiro mlx5_mpw_close(txq, &mpw); 1094230189d9SNélio Laranjeiro mlx5_tx_dbrec(txq); 1095230189d9SNélio Laranjeiro txq->elts_head = elts_head; 1096230189d9SNélio Laranjeiro return i; 1097230189d9SNélio Laranjeiro } 1098230189d9SNélio Laranjeiro 1099230189d9SNélio Laranjeiro /** 110067fa62bcSAdrien Mazarguil * Translate RX completion flags to packet type. 110167fa62bcSAdrien Mazarguil * 11026218063bSNélio Laranjeiro * @param[in] cqe 11036218063bSNélio Laranjeiro * Pointer to CQE. 110467fa62bcSAdrien Mazarguil * 110578a38edfSJianfeng Tan * @note: fix mlx5_dev_supported_ptypes_get() if any change here. 110678a38edfSJianfeng Tan * 110767fa62bcSAdrien Mazarguil * @return 110867fa62bcSAdrien Mazarguil * Packet type for struct rte_mbuf. 110967fa62bcSAdrien Mazarguil */ 111067fa62bcSAdrien Mazarguil static inline uint32_t 111197267b8eSNelio Laranjeiro rxq_cq_to_pkt_type(volatile struct mlx5_cqe *cqe) 111267fa62bcSAdrien Mazarguil { 111367fa62bcSAdrien Mazarguil uint32_t pkt_type; 11146218063bSNélio Laranjeiro uint8_t flags = cqe->l4_hdr_type_etc; 111567fa62bcSAdrien Mazarguil 111697267b8eSNelio Laranjeiro if (cqe->pkt_info & MLX5_CQE_RX_TUNNEL_PACKET) 111767fa62bcSAdrien Mazarguil pkt_type = 111867fa62bcSAdrien Mazarguil TRANSPOSE(flags, 1119350f4c48SNelio Laranjeiro MLX5_CQE_RX_OUTER_IPV4_PACKET, 112067fa62bcSAdrien Mazarguil RTE_PTYPE_L3_IPV4) | 112167fa62bcSAdrien Mazarguil TRANSPOSE(flags, 1122350f4c48SNelio Laranjeiro MLX5_CQE_RX_OUTER_IPV6_PACKET, 112367fa62bcSAdrien Mazarguil RTE_PTYPE_L3_IPV6) | 112467fa62bcSAdrien Mazarguil TRANSPOSE(flags, 1125350f4c48SNelio Laranjeiro MLX5_CQE_RX_IPV4_PACKET, 112667fa62bcSAdrien Mazarguil RTE_PTYPE_INNER_L3_IPV4) | 112767fa62bcSAdrien Mazarguil TRANSPOSE(flags, 1128350f4c48SNelio Laranjeiro MLX5_CQE_RX_IPV6_PACKET, 112967fa62bcSAdrien Mazarguil RTE_PTYPE_INNER_L3_IPV6); 113067fa62bcSAdrien Mazarguil else 113167fa62bcSAdrien Mazarguil pkt_type = 113267fa62bcSAdrien Mazarguil TRANSPOSE(flags, 11336218063bSNélio Laranjeiro MLX5_CQE_L3_HDR_TYPE_IPV6, 11346218063bSNélio Laranjeiro RTE_PTYPE_L3_IPV6) | 113567fa62bcSAdrien Mazarguil TRANSPOSE(flags, 11366218063bSNélio Laranjeiro MLX5_CQE_L3_HDR_TYPE_IPV4, 11376218063bSNélio Laranjeiro RTE_PTYPE_L3_IPV4); 113867fa62bcSAdrien Mazarguil return pkt_type; 113967fa62bcSAdrien Mazarguil } 114067fa62bcSAdrien Mazarguil 114167fa62bcSAdrien Mazarguil /** 114299c12dccSNélio Laranjeiro * Get size of the next packet for a given CQE. For compressed CQEs, the 114399c12dccSNélio Laranjeiro * consumer index is updated only once all packets of the current one have 114499c12dccSNélio Laranjeiro * been processed. 114599c12dccSNélio Laranjeiro * 114699c12dccSNélio Laranjeiro * @param rxq 114799c12dccSNélio Laranjeiro * Pointer to RX queue. 114899c12dccSNélio Laranjeiro * @param cqe 114999c12dccSNélio Laranjeiro * CQE to process. 1150ecf60761SNélio Laranjeiro * @param[out] rss_hash 1151ecf60761SNélio Laranjeiro * Packet RSS Hash result. 115299c12dccSNélio Laranjeiro * 115399c12dccSNélio Laranjeiro * @return 115499c12dccSNélio Laranjeiro * Packet size in bytes (0 if there is none), -1 in case of completion 115599c12dccSNélio Laranjeiro * with error. 115699c12dccSNélio Laranjeiro */ 115799c12dccSNélio Laranjeiro static inline int 115897267b8eSNelio Laranjeiro mlx5_rx_poll_len(struct rxq *rxq, volatile struct mlx5_cqe *cqe, 1159ecf60761SNélio Laranjeiro uint16_t cqe_cnt, uint32_t *rss_hash) 116099c12dccSNélio Laranjeiro { 116199c12dccSNélio Laranjeiro struct rxq_zip *zip = &rxq->zip; 116299c12dccSNélio Laranjeiro uint16_t cqe_n = cqe_cnt + 1; 116399c12dccSNélio Laranjeiro int len = 0; 116499c12dccSNélio Laranjeiro 116599c12dccSNélio Laranjeiro /* Process compressed data in the CQE and mini arrays. */ 116699c12dccSNélio Laranjeiro if (zip->ai) { 116799c12dccSNélio Laranjeiro volatile struct mlx5_mini_cqe8 (*mc)[8] = 116899c12dccSNélio Laranjeiro (volatile struct mlx5_mini_cqe8 (*)[8]) 116997267b8eSNelio Laranjeiro (uintptr_t)(&(*rxq->cqes)[zip->ca & cqe_cnt]); 117099c12dccSNélio Laranjeiro 117199c12dccSNélio Laranjeiro len = ntohl((*mc)[zip->ai & 7].byte_cnt); 1172ecf60761SNélio Laranjeiro *rss_hash = ntohl((*mc)[zip->ai & 7].rx_hash_result); 117399c12dccSNélio Laranjeiro if ((++zip->ai & 7) == 0) { 117499c12dccSNélio Laranjeiro /* 117599c12dccSNélio Laranjeiro * Increment consumer index to skip the number of 117699c12dccSNélio Laranjeiro * CQEs consumed. Hardware leaves holes in the CQ 117799c12dccSNélio Laranjeiro * ring for software use. 117899c12dccSNélio Laranjeiro */ 117999c12dccSNélio Laranjeiro zip->ca = zip->na; 118099c12dccSNélio Laranjeiro zip->na += 8; 118199c12dccSNélio Laranjeiro } 118299c12dccSNélio Laranjeiro if (unlikely(rxq->zip.ai == rxq->zip.cqe_cnt)) { 1183b5750af6SNélio Laranjeiro uint16_t idx = rxq->cq_ci + 1; 118499c12dccSNélio Laranjeiro uint16_t end = zip->cq_ci; 118599c12dccSNélio Laranjeiro 118699c12dccSNélio Laranjeiro while (idx != end) { 118797267b8eSNelio Laranjeiro (*rxq->cqes)[idx & cqe_cnt].op_own = 118899c12dccSNélio Laranjeiro MLX5_CQE_INVALIDATE; 118999c12dccSNélio Laranjeiro ++idx; 119099c12dccSNélio Laranjeiro } 119199c12dccSNélio Laranjeiro rxq->cq_ci = zip->cq_ci; 119299c12dccSNélio Laranjeiro zip->ai = 0; 119399c12dccSNélio Laranjeiro } 119499c12dccSNélio Laranjeiro /* No compressed data, get next CQE and verify if it is compressed. */ 119599c12dccSNélio Laranjeiro } else { 119699c12dccSNélio Laranjeiro int ret; 119799c12dccSNélio Laranjeiro int8_t op_own; 119899c12dccSNélio Laranjeiro 119997267b8eSNelio Laranjeiro ret = check_cqe(cqe, cqe_n, rxq->cq_ci); 120099c12dccSNélio Laranjeiro if (unlikely(ret == 1)) 120199c12dccSNélio Laranjeiro return 0; 120299c12dccSNélio Laranjeiro ++rxq->cq_ci; 120399c12dccSNélio Laranjeiro op_own = cqe->op_own; 120499c12dccSNélio Laranjeiro if (MLX5_CQE_FORMAT(op_own) == MLX5_COMPRESSED) { 120599c12dccSNélio Laranjeiro volatile struct mlx5_mini_cqe8 (*mc)[8] = 120699c12dccSNélio Laranjeiro (volatile struct mlx5_mini_cqe8 (*)[8]) 120799c12dccSNélio Laranjeiro (uintptr_t)(&(*rxq->cqes)[rxq->cq_ci & 120897267b8eSNelio Laranjeiro cqe_cnt]); 120999c12dccSNélio Laranjeiro 121099c12dccSNélio Laranjeiro /* Fix endianness. */ 121199c12dccSNélio Laranjeiro zip->cqe_cnt = ntohl(cqe->byte_cnt); 121299c12dccSNélio Laranjeiro /* 121399c12dccSNélio Laranjeiro * Current mini array position is the one returned by 121499c12dccSNélio Laranjeiro * check_cqe64(). 121599c12dccSNélio Laranjeiro * 121699c12dccSNélio Laranjeiro * If completion comprises several mini arrays, as a 121799c12dccSNélio Laranjeiro * special case the second one is located 7 CQEs after 121899c12dccSNélio Laranjeiro * the initial CQE instead of 8 for subsequent ones. 121999c12dccSNélio Laranjeiro */ 122099c12dccSNélio Laranjeiro zip->ca = rxq->cq_ci & cqe_cnt; 122199c12dccSNélio Laranjeiro zip->na = zip->ca + 7; 122299c12dccSNélio Laranjeiro /* Compute the next non compressed CQE. */ 122399c12dccSNélio Laranjeiro --rxq->cq_ci; 122499c12dccSNélio Laranjeiro zip->cq_ci = rxq->cq_ci + zip->cqe_cnt; 122599c12dccSNélio Laranjeiro /* Get packet size to return. */ 122699c12dccSNélio Laranjeiro len = ntohl((*mc)[0].byte_cnt); 1227ecf60761SNélio Laranjeiro *rss_hash = ntohl((*mc)[0].rx_hash_result); 122899c12dccSNélio Laranjeiro zip->ai = 1; 122999c12dccSNélio Laranjeiro } else { 123099c12dccSNélio Laranjeiro len = ntohl(cqe->byte_cnt); 1231ecf60761SNélio Laranjeiro *rss_hash = ntohl(cqe->rx_hash_res); 123299c12dccSNélio Laranjeiro } 123399c12dccSNélio Laranjeiro /* Error while receiving packet. */ 123499c12dccSNélio Laranjeiro if (unlikely(MLX5_CQE_OPCODE(op_own) == MLX5_CQE_RESP_ERR)) 123599c12dccSNélio Laranjeiro return -1; 123699c12dccSNélio Laranjeiro } 123799c12dccSNélio Laranjeiro return len; 123899c12dccSNélio Laranjeiro } 123999c12dccSNélio Laranjeiro 124099c12dccSNélio Laranjeiro /** 124167fa62bcSAdrien Mazarguil * Translate RX completion flags to offload flags. 124267fa62bcSAdrien Mazarguil * 124367fa62bcSAdrien Mazarguil * @param[in] rxq 124467fa62bcSAdrien Mazarguil * Pointer to RX queue structure. 12456218063bSNélio Laranjeiro * @param[in] cqe 12466218063bSNélio Laranjeiro * Pointer to CQE. 124767fa62bcSAdrien Mazarguil * 124867fa62bcSAdrien Mazarguil * @return 124967fa62bcSAdrien Mazarguil * Offload flags (ol_flags) for struct rte_mbuf. 125067fa62bcSAdrien Mazarguil */ 125167fa62bcSAdrien Mazarguil static inline uint32_t 125297267b8eSNelio Laranjeiro rxq_cq_to_ol_flags(struct rxq *rxq, volatile struct mlx5_cqe *cqe) 125367fa62bcSAdrien Mazarguil { 125467fa62bcSAdrien Mazarguil uint32_t ol_flags = 0; 12556218063bSNélio Laranjeiro uint8_t l3_hdr = (cqe->l4_hdr_type_etc) & MLX5_CQE_L3_HDR_TYPE_MASK; 12566218063bSNélio Laranjeiro uint8_t l4_hdr = (cqe->l4_hdr_type_etc) & MLX5_CQE_L4_HDR_TYPE_MASK; 125767fa62bcSAdrien Mazarguil 12586218063bSNélio Laranjeiro if ((l3_hdr == MLX5_CQE_L3_HDR_TYPE_IPV4) || 12596218063bSNélio Laranjeiro (l3_hdr == MLX5_CQE_L3_HDR_TYPE_IPV6)) 126083e9d9a3SNelio Laranjeiro ol_flags |= TRANSPOSE(cqe->hds_ip_ext, 126183e9d9a3SNelio Laranjeiro MLX5_CQE_L3_OK, 126283e9d9a3SNelio Laranjeiro PKT_RX_IP_CKSUM_GOOD); 12636218063bSNélio Laranjeiro if ((l4_hdr == MLX5_CQE_L4_HDR_TYPE_TCP) || 12646218063bSNélio Laranjeiro (l4_hdr == MLX5_CQE_L4_HDR_TYPE_TCP_EMP_ACK) || 12656218063bSNélio Laranjeiro (l4_hdr == MLX5_CQE_L4_HDR_TYPE_TCP_ACK) || 12666218063bSNélio Laranjeiro (l4_hdr == MLX5_CQE_L4_HDR_TYPE_UDP)) 126783e9d9a3SNelio Laranjeiro ol_flags |= TRANSPOSE(cqe->hds_ip_ext, 126883e9d9a3SNelio Laranjeiro MLX5_CQE_L4_OK, 126983e9d9a3SNelio Laranjeiro PKT_RX_L4_CKSUM_GOOD); 127097267b8eSNelio Laranjeiro if ((cqe->pkt_info & MLX5_CQE_RX_TUNNEL_PACKET) && (rxq->csum_l2tun)) 127167fa62bcSAdrien Mazarguil ol_flags |= 127283e9d9a3SNelio Laranjeiro TRANSPOSE(cqe->l4_hdr_type_etc, 1273350f4c48SNelio Laranjeiro MLX5_CQE_RX_OUTER_IP_CSUM_OK, 127483e9d9a3SNelio Laranjeiro PKT_RX_IP_CKSUM_GOOD) | 127583e9d9a3SNelio Laranjeiro TRANSPOSE(cqe->l4_hdr_type_etc, 1276350f4c48SNelio Laranjeiro MLX5_CQE_RX_OUTER_TCP_UDP_CSUM_OK, 127783e9d9a3SNelio Laranjeiro PKT_RX_L4_CKSUM_GOOD); 127867fa62bcSAdrien Mazarguil return ol_flags; 127967fa62bcSAdrien Mazarguil } 128067fa62bcSAdrien Mazarguil 128167fa62bcSAdrien Mazarguil /** 12822e22920bSAdrien Mazarguil * DPDK callback for RX. 12832e22920bSAdrien Mazarguil * 12842e22920bSAdrien Mazarguil * @param dpdk_rxq 12852e22920bSAdrien Mazarguil * Generic pointer to RX queue structure. 12862e22920bSAdrien Mazarguil * @param[out] pkts 12872e22920bSAdrien Mazarguil * Array to store received packets. 12882e22920bSAdrien Mazarguil * @param pkts_n 12892e22920bSAdrien Mazarguil * Maximum number of packets in array. 12902e22920bSAdrien Mazarguil * 12912e22920bSAdrien Mazarguil * @return 12922e22920bSAdrien Mazarguil * Number of packets successfully received (<= pkts_n). 12932e22920bSAdrien Mazarguil */ 12942e22920bSAdrien Mazarguil uint16_t 12952e22920bSAdrien Mazarguil mlx5_rx_burst(void *dpdk_rxq, struct rte_mbuf **pkts, uint16_t pkts_n) 12962e22920bSAdrien Mazarguil { 12976218063bSNélio Laranjeiro struct rxq *rxq = dpdk_rxq; 1298b4b12e55SNélio Laranjeiro const unsigned int wqe_cnt = (1 << rxq->elts_n) - 1; 1299e2f116eeSNélio Laranjeiro const unsigned int cqe_cnt = (1 << rxq->cqe_n) - 1; 13009964b965SNélio Laranjeiro const unsigned int sges_n = rxq->sges_n; 13019964b965SNélio Laranjeiro struct rte_mbuf *pkt = NULL; 13029964b965SNélio Laranjeiro struct rte_mbuf *seg = NULL; 130397267b8eSNelio Laranjeiro volatile struct mlx5_cqe *cqe = 130497267b8eSNelio Laranjeiro &(*rxq->cqes)[rxq->cq_ci & cqe_cnt]; 13059964b965SNélio Laranjeiro unsigned int i = 0; 13069964b965SNélio Laranjeiro unsigned int rq_ci = rxq->rq_ci << sges_n; 1307ecf60761SNélio Laranjeiro int len; /* keep its value across iterations. */ 13082e22920bSAdrien Mazarguil 13099964b965SNélio Laranjeiro while (pkts_n) { 13109964b965SNélio Laranjeiro unsigned int idx = rq_ci & wqe_cnt; 13119964b965SNélio Laranjeiro volatile struct mlx5_wqe_data_seg *wqe = &(*rxq->wqes)[idx]; 13129964b965SNélio Laranjeiro struct rte_mbuf *rep = (*rxq->elts)[idx]; 1313ecf60761SNélio Laranjeiro uint32_t rss_hash_res = 0; 13149964b965SNélio Laranjeiro 13159964b965SNélio Laranjeiro if (pkt) 13169964b965SNélio Laranjeiro NEXT(seg) = rep; 13179964b965SNélio Laranjeiro seg = rep; 13189964b965SNélio Laranjeiro rte_prefetch0(seg); 13196218063bSNélio Laranjeiro rte_prefetch0(cqe); 13209964b965SNélio Laranjeiro rte_prefetch0(wqe); 1321fbfd9955SOlivier Matz rep = rte_mbuf_raw_alloc(rxq->mp); 13222e22920bSAdrien Mazarguil if (unlikely(rep == NULL)) { 132315a756b6SSagi Grimberg ++rxq->stats.rx_nombuf; 132415a756b6SSagi Grimberg if (!pkt) { 132515a756b6SSagi Grimberg /* 132615a756b6SSagi Grimberg * no buffers before we even started, 132715a756b6SSagi Grimberg * bail out silently. 132815a756b6SSagi Grimberg */ 132915a756b6SSagi Grimberg break; 133015a756b6SSagi Grimberg } 1331a1bdb71aSNélio Laranjeiro while (pkt != seg) { 1332a1bdb71aSNélio Laranjeiro assert(pkt != (*rxq->elts)[idx]); 1333fe5fe382SNélio Laranjeiro rep = NEXT(pkt); 13349964b965SNélio Laranjeiro rte_mbuf_refcnt_set(pkt, 0); 13359964b965SNélio Laranjeiro __rte_mbuf_raw_free(pkt); 1336fe5fe382SNélio Laranjeiro pkt = rep; 13379964b965SNélio Laranjeiro } 13386218063bSNélio Laranjeiro break; 13392e22920bSAdrien Mazarguil } 13409964b965SNélio Laranjeiro if (!pkt) { 134197267b8eSNelio Laranjeiro cqe = &(*rxq->cqes)[rxq->cq_ci & cqe_cnt]; 1342ecf60761SNélio Laranjeiro len = mlx5_rx_poll_len(rxq, cqe, cqe_cnt, 1343ecf60761SNélio Laranjeiro &rss_hash_res); 1344ecf60761SNélio Laranjeiro if (!len) { 13456218063bSNélio Laranjeiro rte_mbuf_refcnt_set(rep, 0); 13466218063bSNélio Laranjeiro __rte_mbuf_raw_free(rep); 13476218063bSNélio Laranjeiro break; 13486218063bSNélio Laranjeiro } 134999c12dccSNélio Laranjeiro if (unlikely(len == -1)) { 135099c12dccSNélio Laranjeiro /* RX error, packet is likely too large. */ 135199c12dccSNélio Laranjeiro rte_mbuf_refcnt_set(rep, 0); 135299c12dccSNélio Laranjeiro __rte_mbuf_raw_free(rep); 135399c12dccSNélio Laranjeiro ++rxq->stats.idropped; 135499c12dccSNélio Laranjeiro goto skip; 135599c12dccSNélio Laranjeiro } 13569964b965SNélio Laranjeiro pkt = seg; 13579964b965SNélio Laranjeiro assert(len >= (rxq->crc_present << 2)); 13589964b965SNélio Laranjeiro /* Update packet information. */ 13590ac64846SMaxime Leroy pkt->packet_type = 0; 13600ac64846SMaxime Leroy pkt->ol_flags = 0; 136136ba0c00SNélio Laranjeiro if (rss_hash_res && rxq->rss_hash) { 1362ecf60761SNélio Laranjeiro pkt->hash.rss = rss_hash_res; 1363ecf60761SNélio Laranjeiro pkt->ol_flags = PKT_RX_RSS_HASH; 1364ecf60761SNélio Laranjeiro } 1365ea3bc3b1SNélio Laranjeiro if (rxq->mark && 1366ea3bc3b1SNélio Laranjeiro ((cqe->sop_drop_qpn != 1367ea3bc3b1SNélio Laranjeiro htonl(MLX5_FLOW_MARK_INVALID)) || 1368ea3bc3b1SNélio Laranjeiro (cqe->sop_drop_qpn != 1369ea3bc3b1SNélio Laranjeiro htonl(MLX5_FLOW_MARK_DEFAULT)))) { 1370ea3bc3b1SNélio Laranjeiro pkt->hash.fdir.hi = 1371ea3bc3b1SNélio Laranjeiro mlx5_flow_mark_get(cqe->sop_drop_qpn); 1372ea3bc3b1SNélio Laranjeiro pkt->ol_flags &= ~PKT_RX_RSS_HASH; 1373ea3bc3b1SNélio Laranjeiro pkt->ol_flags |= PKT_RX_FDIR | PKT_RX_FDIR_ID; 1374ea3bc3b1SNélio Laranjeiro } 13756218063bSNélio Laranjeiro if (rxq->csum | rxq->csum_l2tun | rxq->vlan_strip | 13766218063bSNélio Laranjeiro rxq->crc_present) { 13776218063bSNélio Laranjeiro if (rxq->csum) { 13789964b965SNélio Laranjeiro pkt->packet_type = 13799964b965SNélio Laranjeiro rxq_cq_to_pkt_type(cqe); 1380ecf60761SNélio Laranjeiro pkt->ol_flags |= 13819964b965SNélio Laranjeiro rxq_cq_to_ol_flags(rxq, cqe); 13826218063bSNélio Laranjeiro } 13839964b965SNélio Laranjeiro if (cqe->l4_hdr_type_etc & 13849964b965SNélio Laranjeiro MLX5_CQE_VLAN_STRIPPED) { 13856218063bSNélio Laranjeiro pkt->ol_flags |= PKT_RX_VLAN_PKT | 1386b37b528dSOlivier Matz PKT_RX_VLAN_STRIPPED; 13876218063bSNélio Laranjeiro pkt->vlan_tci = ntohs(cqe->vlan_info); 1388f3db9489SYaacov Hazan } 13896218063bSNélio Laranjeiro if (rxq->crc_present) 13906218063bSNélio Laranjeiro len -= ETHER_CRC_LEN; 1391081f7eaeSNelio Laranjeiro } 13926218063bSNélio Laranjeiro PKT_LEN(pkt) = len; 13939964b965SNélio Laranjeiro } 13949964b965SNélio Laranjeiro DATA_LEN(rep) = DATA_LEN(seg); 13959964b965SNélio Laranjeiro PKT_LEN(rep) = PKT_LEN(seg); 13969964b965SNélio Laranjeiro SET_DATA_OFF(rep, DATA_OFF(seg)); 13979964b965SNélio Laranjeiro NB_SEGS(rep) = NB_SEGS(seg); 13989964b965SNélio Laranjeiro PORT(rep) = PORT(seg); 13999964b965SNélio Laranjeiro NEXT(rep) = NULL; 14009964b965SNélio Laranjeiro (*rxq->elts)[idx] = rep; 14019964b965SNélio Laranjeiro /* 14029964b965SNélio Laranjeiro * Fill NIC descriptor with the new buffer. The lkey and size 14039964b965SNélio Laranjeiro * of the buffers are already known, only the buffer address 14049964b965SNélio Laranjeiro * changes. 14059964b965SNélio Laranjeiro */ 14069964b965SNélio Laranjeiro wqe->addr = htonll(rte_pktmbuf_mtod(rep, uintptr_t)); 14079964b965SNélio Laranjeiro if (len > DATA_LEN(seg)) { 14089964b965SNélio Laranjeiro len -= DATA_LEN(seg); 14099964b965SNélio Laranjeiro ++NB_SEGS(pkt); 14109964b965SNélio Laranjeiro ++rq_ci; 14119964b965SNélio Laranjeiro continue; 14129964b965SNélio Laranjeiro } 14139964b965SNélio Laranjeiro DATA_LEN(seg) = len; 141487011737SAdrien Mazarguil #ifdef MLX5_PMD_SOFT_COUNTERS 141587011737SAdrien Mazarguil /* Increment bytes counter. */ 14169964b965SNélio Laranjeiro rxq->stats.ibytes += PKT_LEN(pkt); 141787011737SAdrien Mazarguil #endif 14186218063bSNélio Laranjeiro /* Return packet. */ 14196218063bSNélio Laranjeiro *(pkts++) = pkt; 14209964b965SNélio Laranjeiro pkt = NULL; 14219964b965SNélio Laranjeiro --pkts_n; 14229964b965SNélio Laranjeiro ++i; 142399c12dccSNélio Laranjeiro skip: 14249964b965SNélio Laranjeiro /* Align consumer index to the next stride. */ 14259964b965SNélio Laranjeiro rq_ci >>= sges_n; 14266218063bSNélio Laranjeiro ++rq_ci; 14279964b965SNélio Laranjeiro rq_ci <<= sges_n; 14282e22920bSAdrien Mazarguil } 14299964b965SNélio Laranjeiro if (unlikely((i == 0) && ((rq_ci >> sges_n) == rxq->rq_ci))) 14302e22920bSAdrien Mazarguil return 0; 14316218063bSNélio Laranjeiro /* Update the consumer index. */ 14329964b965SNélio Laranjeiro rxq->rq_ci = rq_ci >> sges_n; 14336218063bSNélio Laranjeiro rte_wmb(); 14346218063bSNélio Laranjeiro *rxq->cq_db = htonl(rxq->cq_ci); 14356218063bSNélio Laranjeiro rte_wmb(); 14366218063bSNélio Laranjeiro *rxq->rq_db = htonl(rxq->rq_ci); 143787011737SAdrien Mazarguil #ifdef MLX5_PMD_SOFT_COUNTERS 143887011737SAdrien Mazarguil /* Increment packets counter. */ 14399964b965SNélio Laranjeiro rxq->stats.ipackets += i; 144087011737SAdrien Mazarguil #endif 14419964b965SNélio Laranjeiro return i; 14422e22920bSAdrien Mazarguil } 14432e22920bSAdrien Mazarguil 14442e22920bSAdrien Mazarguil /** 14452e22920bSAdrien Mazarguil * Dummy DPDK callback for TX. 14462e22920bSAdrien Mazarguil * 14472e22920bSAdrien Mazarguil * This function is used to temporarily replace the real callback during 14482e22920bSAdrien Mazarguil * unsafe control operations on the queue, or in case of error. 14492e22920bSAdrien Mazarguil * 14502e22920bSAdrien Mazarguil * @param dpdk_txq 14512e22920bSAdrien Mazarguil * Generic pointer to TX queue structure. 14522e22920bSAdrien Mazarguil * @param[in] pkts 14532e22920bSAdrien Mazarguil * Packets to transmit. 14542e22920bSAdrien Mazarguil * @param pkts_n 14552e22920bSAdrien Mazarguil * Number of packets in array. 14562e22920bSAdrien Mazarguil * 14572e22920bSAdrien Mazarguil * @return 14582e22920bSAdrien Mazarguil * Number of packets successfully transmitted (<= pkts_n). 14592e22920bSAdrien Mazarguil */ 14602e22920bSAdrien Mazarguil uint16_t 14612e22920bSAdrien Mazarguil removed_tx_burst(void *dpdk_txq, struct rte_mbuf **pkts, uint16_t pkts_n) 14622e22920bSAdrien Mazarguil { 14632e22920bSAdrien Mazarguil (void)dpdk_txq; 14642e22920bSAdrien Mazarguil (void)pkts; 14652e22920bSAdrien Mazarguil (void)pkts_n; 14662e22920bSAdrien Mazarguil return 0; 14672e22920bSAdrien Mazarguil } 14682e22920bSAdrien Mazarguil 14692e22920bSAdrien Mazarguil /** 14702e22920bSAdrien Mazarguil * Dummy DPDK callback for RX. 14712e22920bSAdrien Mazarguil * 14722e22920bSAdrien Mazarguil * This function is used to temporarily replace the real callback during 14732e22920bSAdrien Mazarguil * unsafe control operations on the queue, or in case of error. 14742e22920bSAdrien Mazarguil * 14752e22920bSAdrien Mazarguil * @param dpdk_rxq 14762e22920bSAdrien Mazarguil * Generic pointer to RX queue structure. 14772e22920bSAdrien Mazarguil * @param[out] pkts 14782e22920bSAdrien Mazarguil * Array to store received packets. 14792e22920bSAdrien Mazarguil * @param pkts_n 14802e22920bSAdrien Mazarguil * Maximum number of packets in array. 14812e22920bSAdrien Mazarguil * 14822e22920bSAdrien Mazarguil * @return 14832e22920bSAdrien Mazarguil * Number of packets successfully received (<= pkts_n). 14842e22920bSAdrien Mazarguil */ 14852e22920bSAdrien Mazarguil uint16_t 14862e22920bSAdrien Mazarguil removed_rx_burst(void *dpdk_rxq, struct rte_mbuf **pkts, uint16_t pkts_n) 14872e22920bSAdrien Mazarguil { 14882e22920bSAdrien Mazarguil (void)dpdk_rxq; 14892e22920bSAdrien Mazarguil (void)pkts; 14902e22920bSAdrien Mazarguil (void)pkts_n; 14912e22920bSAdrien Mazarguil return 0; 14922e22920bSAdrien Mazarguil } 1493