18fd92a66SOlivier Matz /* SPDX-License-Identifier: BSD-3-Clause 2771fa900SAdrien Mazarguil * Copyright 2015 6WIND S.A. 35feecc57SShahaf Shuler * Copyright 2015 Mellanox Technologies, Ltd 4771fa900SAdrien Mazarguil */ 5771fa900SAdrien Mazarguil 6771fa900SAdrien Mazarguil #include <stddef.h> 7771fa900SAdrien Mazarguil #include <unistd.h> 8771fa900SAdrien Mazarguil #include <string.h> 9771fa900SAdrien Mazarguil #include <assert.h> 1059b91becSAdrien Mazarguil #include <dlfcn.h> 11771fa900SAdrien Mazarguil #include <stdint.h> 12771fa900SAdrien Mazarguil #include <stdlib.h> 13e72dd09bSNélio Laranjeiro #include <errno.h> 14771fa900SAdrien Mazarguil #include <net/if.h> 154a984153SXueming Li #include <sys/mman.h> 1626c08b97SAdrien Mazarguil #include <linux/netlink.h> 17ccdcba53SNélio Laranjeiro #include <linux/rtnetlink.h> 18771fa900SAdrien Mazarguil 19771fa900SAdrien Mazarguil /* Verbs header. */ 20771fa900SAdrien Mazarguil /* ISO C doesn't support unnamed structs/unions, disabling -pedantic. */ 21771fa900SAdrien Mazarguil #ifdef PEDANTIC 22fc5b160fSBruce Richardson #pragma GCC diagnostic ignored "-Wpedantic" 23771fa900SAdrien Mazarguil #endif 24771fa900SAdrien Mazarguil #include <infiniband/verbs.h> 25771fa900SAdrien Mazarguil #ifdef PEDANTIC 26fc5b160fSBruce Richardson #pragma GCC diagnostic error "-Wpedantic" 27771fa900SAdrien Mazarguil #endif 28771fa900SAdrien Mazarguil 29771fa900SAdrien Mazarguil #include <rte_malloc.h> 30ffc905f3SFerruh Yigit #include <rte_ethdev_driver.h> 31fdf91e0fSJan Blunck #include <rte_ethdev_pci.h> 32771fa900SAdrien Mazarguil #include <rte_pci.h> 33c752998bSGaetan Rivet #include <rte_bus_pci.h> 34771fa900SAdrien Mazarguil #include <rte_common.h> 3559b91becSAdrien Mazarguil #include <rte_config.h> 364a984153SXueming Li #include <rte_eal_memconfig.h> 37e72dd09bSNélio Laranjeiro #include <rte_kvargs.h> 38e89c15b6SAdrien Mazarguil #include <rte_rwlock.h> 39e89c15b6SAdrien Mazarguil #include <rte_spinlock.h> 40f38c5457SAdrien Mazarguil #include <rte_string_fns.h> 41771fa900SAdrien Mazarguil 42771fa900SAdrien Mazarguil #include "mlx5.h" 43771fa900SAdrien Mazarguil #include "mlx5_utils.h" 442e22920bSAdrien Mazarguil #include "mlx5_rxtx.h" 45771fa900SAdrien Mazarguil #include "mlx5_autoconf.h" 4613d57bd5SAdrien Mazarguil #include "mlx5_defs.h" 470e83b8e5SNelio Laranjeiro #include "mlx5_glue.h" 48974f1e7eSYongseok Koh #include "mlx5_mr.h" 4984c406e7SOri Kam #include "mlx5_flow.h" 50771fa900SAdrien Mazarguil 5199c12dccSNélio Laranjeiro /* Device parameter to enable RX completion queue compression. */ 5299c12dccSNélio Laranjeiro #define MLX5_RXQ_CQE_COMP_EN "rxq_cqe_comp_en" 5399c12dccSNélio Laranjeiro 54bc91e8dbSYongseok Koh /* Device parameter to enable RX completion entry padding to 128B. */ 55bc91e8dbSYongseok Koh #define MLX5_RXQ_CQE_PAD_EN "rxq_cqe_pad_en" 56bc91e8dbSYongseok Koh 5778c7a16dSYongseok Koh /* Device parameter to enable padding Rx packet to cacheline size. */ 5878c7a16dSYongseok Koh #define MLX5_RXQ_PKT_PAD_EN "rxq_pkt_pad_en" 5978c7a16dSYongseok Koh 607d6bf6b8SYongseok Koh /* Device parameter to enable Multi-Packet Rx queue. */ 617d6bf6b8SYongseok Koh #define MLX5_RX_MPRQ_EN "mprq_en" 627d6bf6b8SYongseok Koh 637d6bf6b8SYongseok Koh /* Device parameter to configure log 2 of the number of strides for MPRQ. */ 647d6bf6b8SYongseok Koh #define MLX5_RX_MPRQ_LOG_STRIDE_NUM "mprq_log_stride_num" 657d6bf6b8SYongseok Koh 667d6bf6b8SYongseok Koh /* Device parameter to limit the size of memcpy'd packet for MPRQ. */ 677d6bf6b8SYongseok Koh #define MLX5_RX_MPRQ_MAX_MEMCPY_LEN "mprq_max_memcpy_len" 687d6bf6b8SYongseok Koh 697d6bf6b8SYongseok Koh /* Device parameter to set the minimum number of Rx queues to enable MPRQ. */ 707d6bf6b8SYongseok Koh #define MLX5_RXQS_MIN_MPRQ "rxqs_min_mprq" 717d6bf6b8SYongseok Koh 722a66cf37SYaacov Hazan /* Device parameter to configure inline send. */ 732a66cf37SYaacov Hazan #define MLX5_TXQ_INLINE "txq_inline" 742a66cf37SYaacov Hazan 752a66cf37SYaacov Hazan /* 762a66cf37SYaacov Hazan * Device parameter to configure the number of TX queues threshold for 772a66cf37SYaacov Hazan * enabling inline send. 782a66cf37SYaacov Hazan */ 792a66cf37SYaacov Hazan #define MLX5_TXQS_MIN_INLINE "txqs_min_inline" 802a66cf37SYaacov Hazan 8109d8b416SYongseok Koh /* 8209d8b416SYongseok Koh * Device parameter to configure the number of TX queues threshold for 8309d8b416SYongseok Koh * enabling vectorized Tx. 8409d8b416SYongseok Koh */ 8509d8b416SYongseok Koh #define MLX5_TXQS_MAX_VEC "txqs_max_vec" 8609d8b416SYongseok Koh 87230189d9SNélio Laranjeiro /* Device parameter to enable multi-packet send WQEs. */ 88230189d9SNélio Laranjeiro #define MLX5_TXQ_MPW_EN "txq_mpw_en" 89230189d9SNélio Laranjeiro 906ce84bd8SYongseok Koh /* Device parameter to include 2 dsegs in the title WQEBB. */ 916ce84bd8SYongseok Koh #define MLX5_TXQ_MPW_HDR_DSEG_EN "txq_mpw_hdr_dseg_en" 926ce84bd8SYongseok Koh 936ce84bd8SYongseok Koh /* Device parameter to limit the size of inlining packet. */ 946ce84bd8SYongseok Koh #define MLX5_TXQ_MAX_INLINE_LEN "txq_max_inline_len" 956ce84bd8SYongseok Koh 965644d5b9SNelio Laranjeiro /* Device parameter to enable hardware Tx vector. */ 975644d5b9SNelio Laranjeiro #define MLX5_TX_VEC_EN "tx_vec_en" 985644d5b9SNelio Laranjeiro 995644d5b9SNelio Laranjeiro /* Device parameter to enable hardware Rx vector. */ 1005644d5b9SNelio Laranjeiro #define MLX5_RX_VEC_EN "rx_vec_en" 1015644d5b9SNelio Laranjeiro 10278a54648SXueming Li /* Allow L3 VXLAN flow creation. */ 10378a54648SXueming Li #define MLX5_L3_VXLAN_EN "l3_vxlan_en" 10478a54648SXueming Li 10551e72d38SOri Kam /* Activate DV flow steering. */ 10651e72d38SOri Kam #define MLX5_DV_FLOW_EN "dv_flow_en" 10751e72d38SOri Kam 108db209cc3SNélio Laranjeiro /* Activate Netlink support in VF mode. */ 109db209cc3SNélio Laranjeiro #define MLX5_VF_NL_EN "vf_nl_en" 110db209cc3SNélio Laranjeiro 1116de569f5SAdrien Mazarguil /* Select port representors to instantiate. */ 1126de569f5SAdrien Mazarguil #define MLX5_REPRESENTOR "representor" 1136de569f5SAdrien Mazarguil 11443e9d979SShachar Beiser #ifndef HAVE_IBV_MLX5_MOD_MPW 11543e9d979SShachar Beiser #define MLX5DV_CONTEXT_FLAGS_MPW_ALLOWED (1 << 2) 11643e9d979SShachar Beiser #define MLX5DV_CONTEXT_FLAGS_ENHANCED_MPW (1 << 3) 11743e9d979SShachar Beiser #endif 11843e9d979SShachar Beiser 119523f5a74SYongseok Koh #ifndef HAVE_IBV_MLX5_MOD_CQE_128B_COMP 120523f5a74SYongseok Koh #define MLX5DV_CONTEXT_FLAGS_CQE_128B_COMP (1 << 4) 121523f5a74SYongseok Koh #endif 122523f5a74SYongseok Koh 123974f1e7eSYongseok Koh static const char *MZ_MLX5_PMD_SHARED_DATA = "mlx5_pmd_shared_data"; 124974f1e7eSYongseok Koh 125974f1e7eSYongseok Koh /* Shared memory between primary and secondary processes. */ 126974f1e7eSYongseok Koh struct mlx5_shared_data *mlx5_shared_data; 127974f1e7eSYongseok Koh 128974f1e7eSYongseok Koh /* Spinlock for mlx5_shared_data allocation. */ 129974f1e7eSYongseok Koh static rte_spinlock_t mlx5_shared_data_lock = RTE_SPINLOCK_INITIALIZER; 130974f1e7eSYongseok Koh 131a170a30dSNélio Laranjeiro /** Driver-specific log messages type. */ 132a170a30dSNélio Laranjeiro int mlx5_logtype; 133a170a30dSNélio Laranjeiro 134771fa900SAdrien Mazarguil /** 135974f1e7eSYongseok Koh * Prepare shared data between primary and secondary process. 136974f1e7eSYongseok Koh */ 137974f1e7eSYongseok Koh static void 138974f1e7eSYongseok Koh mlx5_prepare_shared_data(void) 139974f1e7eSYongseok Koh { 140974f1e7eSYongseok Koh const struct rte_memzone *mz; 141974f1e7eSYongseok Koh 142974f1e7eSYongseok Koh rte_spinlock_lock(&mlx5_shared_data_lock); 143974f1e7eSYongseok Koh if (mlx5_shared_data == NULL) { 144974f1e7eSYongseok Koh if (rte_eal_process_type() == RTE_PROC_PRIMARY) { 145974f1e7eSYongseok Koh /* Allocate shared memory. */ 146974f1e7eSYongseok Koh mz = rte_memzone_reserve(MZ_MLX5_PMD_SHARED_DATA, 147974f1e7eSYongseok Koh sizeof(*mlx5_shared_data), 148974f1e7eSYongseok Koh SOCKET_ID_ANY, 0); 149974f1e7eSYongseok Koh } else { 150974f1e7eSYongseok Koh /* Lookup allocated shared memory. */ 151974f1e7eSYongseok Koh mz = rte_memzone_lookup(MZ_MLX5_PMD_SHARED_DATA); 152974f1e7eSYongseok Koh } 153974f1e7eSYongseok Koh if (mz == NULL) 154974f1e7eSYongseok Koh rte_panic("Cannot allocate mlx5 shared data\n"); 155974f1e7eSYongseok Koh mlx5_shared_data = mz->addr; 156974f1e7eSYongseok Koh /* Initialize shared data. */ 157974f1e7eSYongseok Koh if (rte_eal_process_type() == RTE_PROC_PRIMARY) { 158974f1e7eSYongseok Koh LIST_INIT(&mlx5_shared_data->mem_event_cb_list); 159974f1e7eSYongseok Koh rte_rwlock_init(&mlx5_shared_data->mem_event_rwlock); 160974f1e7eSYongseok Koh } 16144b1d513SDavid Marchand rte_mem_event_callback_register("MLX5_MEM_EVENT_CB", 16244b1d513SDavid Marchand mlx5_mr_mem_event_cb, NULL); 163974f1e7eSYongseok Koh } 164974f1e7eSYongseok Koh rte_spinlock_unlock(&mlx5_shared_data_lock); 165974f1e7eSYongseok Koh } 166974f1e7eSYongseok Koh 167974f1e7eSYongseok Koh /** 1684d803a72SOlga Shern * Retrieve integer value from environment variable. 1694d803a72SOlga Shern * 1704d803a72SOlga Shern * @param[in] name 1714d803a72SOlga Shern * Environment variable name. 1724d803a72SOlga Shern * 1734d803a72SOlga Shern * @return 1744d803a72SOlga Shern * Integer value, 0 if the variable is not set. 1754d803a72SOlga Shern */ 1764d803a72SOlga Shern int 1774d803a72SOlga Shern mlx5_getenv_int(const char *name) 1784d803a72SOlga Shern { 1794d803a72SOlga Shern const char *val = getenv(name); 1804d803a72SOlga Shern 1814d803a72SOlga Shern if (val == NULL) 1824d803a72SOlga Shern return 0; 1834d803a72SOlga Shern return atoi(val); 1844d803a72SOlga Shern } 1854d803a72SOlga Shern 1864d803a72SOlga Shern /** 1871e3a39f7SXueming Li * Verbs callback to allocate a memory. This function should allocate the space 1881e3a39f7SXueming Li * according to the size provided residing inside a huge page. 1891e3a39f7SXueming Li * Please note that all allocation must respect the alignment from libmlx5 1901e3a39f7SXueming Li * (i.e. currently sysconf(_SC_PAGESIZE)). 1911e3a39f7SXueming Li * 1921e3a39f7SXueming Li * @param[in] size 1931e3a39f7SXueming Li * The size in bytes of the memory to allocate. 1941e3a39f7SXueming Li * @param[in] data 1951e3a39f7SXueming Li * A pointer to the callback data. 1961e3a39f7SXueming Li * 1971e3a39f7SXueming Li * @return 198a6d83b6aSNélio Laranjeiro * Allocated buffer, NULL otherwise and rte_errno is set. 1991e3a39f7SXueming Li */ 2001e3a39f7SXueming Li static void * 2011e3a39f7SXueming Li mlx5_alloc_verbs_buf(size_t size, void *data) 2021e3a39f7SXueming Li { 2031e3a39f7SXueming Li struct priv *priv = data; 2041e3a39f7SXueming Li void *ret; 2051e3a39f7SXueming Li size_t alignment = sysconf(_SC_PAGESIZE); 206d10b09dbSOlivier Matz unsigned int socket = SOCKET_ID_ANY; 2071e3a39f7SXueming Li 208d10b09dbSOlivier Matz if (priv->verbs_alloc_ctx.type == MLX5_VERBS_ALLOC_TYPE_TX_QUEUE) { 209d10b09dbSOlivier Matz const struct mlx5_txq_ctrl *ctrl = priv->verbs_alloc_ctx.obj; 210d10b09dbSOlivier Matz 211d10b09dbSOlivier Matz socket = ctrl->socket; 212d10b09dbSOlivier Matz } else if (priv->verbs_alloc_ctx.type == 213d10b09dbSOlivier Matz MLX5_VERBS_ALLOC_TYPE_RX_QUEUE) { 214d10b09dbSOlivier Matz const struct mlx5_rxq_ctrl *ctrl = priv->verbs_alloc_ctx.obj; 215d10b09dbSOlivier Matz 216d10b09dbSOlivier Matz socket = ctrl->socket; 217d10b09dbSOlivier Matz } 2181e3a39f7SXueming Li assert(data != NULL); 219d10b09dbSOlivier Matz ret = rte_malloc_socket(__func__, size, alignment, socket); 220a6d83b6aSNélio Laranjeiro if (!ret && size) 221a6d83b6aSNélio Laranjeiro rte_errno = ENOMEM; 2221e3a39f7SXueming Li return ret; 2231e3a39f7SXueming Li } 2241e3a39f7SXueming Li 2251e3a39f7SXueming Li /** 2261e3a39f7SXueming Li * Verbs callback to free a memory. 2271e3a39f7SXueming Li * 2281e3a39f7SXueming Li * @param[in] ptr 2291e3a39f7SXueming Li * A pointer to the memory to free. 2301e3a39f7SXueming Li * @param[in] data 2311e3a39f7SXueming Li * A pointer to the callback data. 2321e3a39f7SXueming Li */ 2331e3a39f7SXueming Li static void 2341e3a39f7SXueming Li mlx5_free_verbs_buf(void *ptr, void *data __rte_unused) 2351e3a39f7SXueming Li { 2361e3a39f7SXueming Li assert(data != NULL); 2371e3a39f7SXueming Li rte_free(ptr); 2381e3a39f7SXueming Li } 2391e3a39f7SXueming Li 2401e3a39f7SXueming Li /** 241771fa900SAdrien Mazarguil * DPDK callback to close the device. 242771fa900SAdrien Mazarguil * 243771fa900SAdrien Mazarguil * Destroy all queues and objects, free memory. 244771fa900SAdrien Mazarguil * 245771fa900SAdrien Mazarguil * @param dev 246771fa900SAdrien Mazarguil * Pointer to Ethernet device structure. 247771fa900SAdrien Mazarguil */ 248771fa900SAdrien Mazarguil static void 249771fa900SAdrien Mazarguil mlx5_dev_close(struct rte_eth_dev *dev) 250771fa900SAdrien Mazarguil { 25101d79216SNélio Laranjeiro struct priv *priv = dev->data->dev_private; 2522e22920bSAdrien Mazarguil unsigned int i; 2536af6b973SNélio Laranjeiro int ret; 254771fa900SAdrien Mazarguil 255a170a30dSNélio Laranjeiro DRV_LOG(DEBUG, "port %u closing device \"%s\"", 2560f99970bSNélio Laranjeiro dev->data->port_id, 257771fa900SAdrien Mazarguil ((priv->ctx != NULL) ? priv->ctx->device->name : "")); 258ecc1c29dSAdrien Mazarguil /* In case mlx5_dev_stop() has not been called. */ 259af4f09f2SNélio Laranjeiro mlx5_dev_interrupt_handler_uninstall(dev); 260af4f09f2SNélio Laranjeiro mlx5_traffic_disable(dev); 261af689f1fSNelio Laranjeiro mlx5_flow_flush(dev, NULL); 2622e22920bSAdrien Mazarguil /* Prevent crashes when queues are still in use. */ 2632e22920bSAdrien Mazarguil dev->rx_pkt_burst = removed_rx_burst; 2642e22920bSAdrien Mazarguil dev->tx_pkt_burst = removed_tx_burst; 2652e22920bSAdrien Mazarguil if (priv->rxqs != NULL) { 2662e22920bSAdrien Mazarguil /* XXX race condition if mlx5_rx_burst() is still running. */ 2672e22920bSAdrien Mazarguil usleep(1000); 268a1366b1aSNélio Laranjeiro for (i = 0; (i != priv->rxqs_n); ++i) 269af4f09f2SNélio Laranjeiro mlx5_rxq_release(dev, i); 2702e22920bSAdrien Mazarguil priv->rxqs_n = 0; 2712e22920bSAdrien Mazarguil priv->rxqs = NULL; 2722e22920bSAdrien Mazarguil } 2732e22920bSAdrien Mazarguil if (priv->txqs != NULL) { 2742e22920bSAdrien Mazarguil /* XXX race condition if mlx5_tx_burst() is still running. */ 2752e22920bSAdrien Mazarguil usleep(1000); 2766e78005aSNélio Laranjeiro for (i = 0; (i != priv->txqs_n); ++i) 277af4f09f2SNélio Laranjeiro mlx5_txq_release(dev, i); 2782e22920bSAdrien Mazarguil priv->txqs_n = 0; 2792e22920bSAdrien Mazarguil priv->txqs = NULL; 2802e22920bSAdrien Mazarguil } 2817d6bf6b8SYongseok Koh mlx5_mprq_free_mp(dev); 282974f1e7eSYongseok Koh mlx5_mr_release(dev); 283771fa900SAdrien Mazarguil if (priv->pd != NULL) { 284771fa900SAdrien Mazarguil assert(priv->ctx != NULL); 2850e83b8e5SNelio Laranjeiro claim_zero(mlx5_glue->dealloc_pd(priv->pd)); 2860e83b8e5SNelio Laranjeiro claim_zero(mlx5_glue->close_device(priv->ctx)); 287771fa900SAdrien Mazarguil } else 288771fa900SAdrien Mazarguil assert(priv->ctx == NULL); 28929c1d8bbSNélio Laranjeiro if (priv->rss_conf.rss_key != NULL) 29029c1d8bbSNélio Laranjeiro rte_free(priv->rss_conf.rss_key); 291634efbc2SNelio Laranjeiro if (priv->reta_idx != NULL) 292634efbc2SNelio Laranjeiro rte_free(priv->reta_idx); 2938c5bca92SXueming Li if (priv->primary_socket) 294af4f09f2SNélio Laranjeiro mlx5_socket_uninit(dev); 295ccdcba53SNélio Laranjeiro if (priv->config.vf) 296ccdcba53SNélio Laranjeiro mlx5_nl_mac_addr_flush(dev); 29726c08b97SAdrien Mazarguil if (priv->nl_socket_route >= 0) 29826c08b97SAdrien Mazarguil close(priv->nl_socket_route); 29926c08b97SAdrien Mazarguil if (priv->nl_socket_rdma >= 0) 30026c08b97SAdrien Mazarguil close(priv->nl_socket_rdma); 301d53180afSMoti Haimovsky if (priv->tcf_context) 302d53180afSMoti Haimovsky mlx5_flow_tcf_context_destroy(priv->tcf_context); 303af4f09f2SNélio Laranjeiro ret = mlx5_hrxq_ibv_verify(dev); 304f5479b68SNélio Laranjeiro if (ret) 305a170a30dSNélio Laranjeiro DRV_LOG(WARNING, "port %u some hash Rx queue still remain", 3060f99970bSNélio Laranjeiro dev->data->port_id); 307af4f09f2SNélio Laranjeiro ret = mlx5_ind_table_ibv_verify(dev); 3084c7a0f5fSNélio Laranjeiro if (ret) 309a170a30dSNélio Laranjeiro DRV_LOG(WARNING, "port %u some indirection table still remain", 3100f99970bSNélio Laranjeiro dev->data->port_id); 311af4f09f2SNélio Laranjeiro ret = mlx5_rxq_ibv_verify(dev); 31209cb5b58SNélio Laranjeiro if (ret) 313a170a30dSNélio Laranjeiro DRV_LOG(WARNING, "port %u some Verbs Rx queue still remain", 3140f99970bSNélio Laranjeiro dev->data->port_id); 315af4f09f2SNélio Laranjeiro ret = mlx5_rxq_verify(dev); 316a1366b1aSNélio Laranjeiro if (ret) 317a170a30dSNélio Laranjeiro DRV_LOG(WARNING, "port %u some Rx queues still remain", 3180f99970bSNélio Laranjeiro dev->data->port_id); 319af4f09f2SNélio Laranjeiro ret = mlx5_txq_ibv_verify(dev); 320faf2667fSNélio Laranjeiro if (ret) 321a170a30dSNélio Laranjeiro DRV_LOG(WARNING, "port %u some Verbs Tx queue still remain", 3220f99970bSNélio Laranjeiro dev->data->port_id); 323af4f09f2SNélio Laranjeiro ret = mlx5_txq_verify(dev); 3246e78005aSNélio Laranjeiro if (ret) 325a170a30dSNélio Laranjeiro DRV_LOG(WARNING, "port %u some Tx queues still remain", 3260f99970bSNélio Laranjeiro dev->data->port_id); 327af4f09f2SNélio Laranjeiro ret = mlx5_flow_verify(dev); 3286af6b973SNélio Laranjeiro if (ret) 329a170a30dSNélio Laranjeiro DRV_LOG(WARNING, "port %u some flows still remain", 330a170a30dSNélio Laranjeiro dev->data->port_id); 3312b730263SAdrien Mazarguil if (priv->domain_id != RTE_ETH_DEV_SWITCH_DOMAIN_ID_INVALID) { 3322b730263SAdrien Mazarguil unsigned int c = 0; 3332b730263SAdrien Mazarguil unsigned int i = mlx5_dev_to_port_id(dev->device, NULL, 0); 3342b730263SAdrien Mazarguil uint16_t port_id[i]; 3352b730263SAdrien Mazarguil 3362b730263SAdrien Mazarguil i = RTE_MIN(mlx5_dev_to_port_id(dev->device, port_id, i), i); 3372b730263SAdrien Mazarguil while (i--) { 3382b730263SAdrien Mazarguil struct priv *opriv = 3392b730263SAdrien Mazarguil rte_eth_devices[port_id[i]].data->dev_private; 3402b730263SAdrien Mazarguil 3412b730263SAdrien Mazarguil if (!opriv || 3422b730263SAdrien Mazarguil opriv->domain_id != priv->domain_id || 3432b730263SAdrien Mazarguil &rte_eth_devices[port_id[i]] == dev) 3442b730263SAdrien Mazarguil continue; 3452b730263SAdrien Mazarguil ++c; 3462b730263SAdrien Mazarguil } 3472b730263SAdrien Mazarguil if (!c) 3482b730263SAdrien Mazarguil claim_zero(rte_eth_switch_domain_free(priv->domain_id)); 3492b730263SAdrien Mazarguil } 350771fa900SAdrien Mazarguil memset(priv, 0, sizeof(*priv)); 3512b730263SAdrien Mazarguil priv->domain_id = RTE_ETH_DEV_SWITCH_DOMAIN_ID_INVALID; 35242603bbdSOphir Munk /* 35342603bbdSOphir Munk * Reset mac_addrs to NULL such that it is not freed as part of 35442603bbdSOphir Munk * rte_eth_dev_release_port(). mac_addrs is part of dev_private so 35542603bbdSOphir Munk * it is freed when dev_private is freed. 35642603bbdSOphir Munk */ 35742603bbdSOphir Munk dev->data->mac_addrs = NULL; 358771fa900SAdrien Mazarguil } 359771fa900SAdrien Mazarguil 3600887aa7fSNélio Laranjeiro const struct eth_dev_ops mlx5_dev_ops = { 361e60fbd5bSAdrien Mazarguil .dev_configure = mlx5_dev_configure, 362e60fbd5bSAdrien Mazarguil .dev_start = mlx5_dev_start, 363e60fbd5bSAdrien Mazarguil .dev_stop = mlx5_dev_stop, 36462072098SOr Ami .dev_set_link_down = mlx5_set_link_down, 36562072098SOr Ami .dev_set_link_up = mlx5_set_link_up, 366771fa900SAdrien Mazarguil .dev_close = mlx5_dev_close, 3671bdbe1afSAdrien Mazarguil .promiscuous_enable = mlx5_promiscuous_enable, 3681bdbe1afSAdrien Mazarguil .promiscuous_disable = mlx5_promiscuous_disable, 3691bdbe1afSAdrien Mazarguil .allmulticast_enable = mlx5_allmulticast_enable, 3701bdbe1afSAdrien Mazarguil .allmulticast_disable = mlx5_allmulticast_disable, 371cb8faed7SAdrien Mazarguil .link_update = mlx5_link_update, 37287011737SAdrien Mazarguil .stats_get = mlx5_stats_get, 37387011737SAdrien Mazarguil .stats_reset = mlx5_stats_reset, 374a4193ae3SShahaf Shuler .xstats_get = mlx5_xstats_get, 375a4193ae3SShahaf Shuler .xstats_reset = mlx5_xstats_reset, 376a4193ae3SShahaf Shuler .xstats_get_names = mlx5_xstats_get_names, 377e60fbd5bSAdrien Mazarguil .dev_infos_get = mlx5_dev_infos_get, 37878a38edfSJianfeng Tan .dev_supported_ptypes_get = mlx5_dev_supported_ptypes_get, 379e9086978SAdrien Mazarguil .vlan_filter_set = mlx5_vlan_filter_set, 3802e22920bSAdrien Mazarguil .rx_queue_setup = mlx5_rx_queue_setup, 3812e22920bSAdrien Mazarguil .tx_queue_setup = mlx5_tx_queue_setup, 3822e22920bSAdrien Mazarguil .rx_queue_release = mlx5_rx_queue_release, 3832e22920bSAdrien Mazarguil .tx_queue_release = mlx5_tx_queue_release, 38402d75430SAdrien Mazarguil .flow_ctrl_get = mlx5_dev_get_flow_ctrl, 38502d75430SAdrien Mazarguil .flow_ctrl_set = mlx5_dev_set_flow_ctrl, 3863318aef7SAdrien Mazarguil .mac_addr_remove = mlx5_mac_addr_remove, 3873318aef7SAdrien Mazarguil .mac_addr_add = mlx5_mac_addr_add, 38886977fccSDavid Marchand .mac_addr_set = mlx5_mac_addr_set, 389e0586a8dSNélio Laranjeiro .set_mc_addr_list = mlx5_set_mc_addr_list, 390cf37ca95SAdrien Mazarguil .mtu_set = mlx5_dev_set_mtu, 391f3db9489SYaacov Hazan .vlan_strip_queue_set = mlx5_vlan_strip_queue_set, 392f3db9489SYaacov Hazan .vlan_offload_set = mlx5_vlan_offload_set, 393634efbc2SNelio Laranjeiro .reta_update = mlx5_dev_rss_reta_update, 394634efbc2SNelio Laranjeiro .reta_query = mlx5_dev_rss_reta_query, 3952f97422eSNelio Laranjeiro .rss_hash_update = mlx5_rss_hash_update, 3962f97422eSNelio Laranjeiro .rss_hash_conf_get = mlx5_rss_hash_conf_get, 39776f5c99eSYaacov Hazan .filter_ctrl = mlx5_dev_filter_ctrl, 3988788fec1SOlivier Matz .rx_descriptor_status = mlx5_rx_descriptor_status, 3998788fec1SOlivier Matz .tx_descriptor_status = mlx5_tx_descriptor_status, 40026f04883STom Barbette .rx_queue_count = mlx5_rx_queue_count, 4013c7d44afSShahaf Shuler .rx_queue_intr_enable = mlx5_rx_intr_enable, 4023c7d44afSShahaf Shuler .rx_queue_intr_disable = mlx5_rx_intr_disable, 403d3e0f392SMatan Azrad .is_removed = mlx5_is_removed, 404771fa900SAdrien Mazarguil }; 405771fa900SAdrien Mazarguil 40687ec44ceSXueming Li static const struct eth_dev_ops mlx5_dev_sec_ops = { 40787ec44ceSXueming Li .stats_get = mlx5_stats_get, 40887ec44ceSXueming Li .stats_reset = mlx5_stats_reset, 40987ec44ceSXueming Li .xstats_get = mlx5_xstats_get, 41087ec44ceSXueming Li .xstats_reset = mlx5_xstats_reset, 41187ec44ceSXueming Li .xstats_get_names = mlx5_xstats_get_names, 41287ec44ceSXueming Li .dev_infos_get = mlx5_dev_infos_get, 41387ec44ceSXueming Li .rx_descriptor_status = mlx5_rx_descriptor_status, 41487ec44ceSXueming Li .tx_descriptor_status = mlx5_tx_descriptor_status, 41587ec44ceSXueming Li }; 41687ec44ceSXueming Li 4170887aa7fSNélio Laranjeiro /* Available operators in flow isolated mode. */ 4180887aa7fSNélio Laranjeiro const struct eth_dev_ops mlx5_dev_ops_isolate = { 4190887aa7fSNélio Laranjeiro .dev_configure = mlx5_dev_configure, 4200887aa7fSNélio Laranjeiro .dev_start = mlx5_dev_start, 4210887aa7fSNélio Laranjeiro .dev_stop = mlx5_dev_stop, 4220887aa7fSNélio Laranjeiro .dev_set_link_down = mlx5_set_link_down, 4230887aa7fSNélio Laranjeiro .dev_set_link_up = mlx5_set_link_up, 4240887aa7fSNélio Laranjeiro .dev_close = mlx5_dev_close, 42524b068adSYongseok Koh .promiscuous_enable = mlx5_promiscuous_enable, 42624b068adSYongseok Koh .promiscuous_disable = mlx5_promiscuous_disable, 4272547ee74SYongseok Koh .allmulticast_enable = mlx5_allmulticast_enable, 4282547ee74SYongseok Koh .allmulticast_disable = mlx5_allmulticast_disable, 4290887aa7fSNélio Laranjeiro .link_update = mlx5_link_update, 4300887aa7fSNélio Laranjeiro .stats_get = mlx5_stats_get, 4310887aa7fSNélio Laranjeiro .stats_reset = mlx5_stats_reset, 4320887aa7fSNélio Laranjeiro .xstats_get = mlx5_xstats_get, 4330887aa7fSNélio Laranjeiro .xstats_reset = mlx5_xstats_reset, 4340887aa7fSNélio Laranjeiro .xstats_get_names = mlx5_xstats_get_names, 4350887aa7fSNélio Laranjeiro .dev_infos_get = mlx5_dev_infos_get, 4360887aa7fSNélio Laranjeiro .dev_supported_ptypes_get = mlx5_dev_supported_ptypes_get, 4370887aa7fSNélio Laranjeiro .vlan_filter_set = mlx5_vlan_filter_set, 4380887aa7fSNélio Laranjeiro .rx_queue_setup = mlx5_rx_queue_setup, 4390887aa7fSNélio Laranjeiro .tx_queue_setup = mlx5_tx_queue_setup, 4400887aa7fSNélio Laranjeiro .rx_queue_release = mlx5_rx_queue_release, 4410887aa7fSNélio Laranjeiro .tx_queue_release = mlx5_tx_queue_release, 4420887aa7fSNélio Laranjeiro .flow_ctrl_get = mlx5_dev_get_flow_ctrl, 4430887aa7fSNélio Laranjeiro .flow_ctrl_set = mlx5_dev_set_flow_ctrl, 4440887aa7fSNélio Laranjeiro .mac_addr_remove = mlx5_mac_addr_remove, 4450887aa7fSNélio Laranjeiro .mac_addr_add = mlx5_mac_addr_add, 4460887aa7fSNélio Laranjeiro .mac_addr_set = mlx5_mac_addr_set, 447e0586a8dSNélio Laranjeiro .set_mc_addr_list = mlx5_set_mc_addr_list, 4480887aa7fSNélio Laranjeiro .mtu_set = mlx5_dev_set_mtu, 4490887aa7fSNélio Laranjeiro .vlan_strip_queue_set = mlx5_vlan_strip_queue_set, 4500887aa7fSNélio Laranjeiro .vlan_offload_set = mlx5_vlan_offload_set, 4510887aa7fSNélio Laranjeiro .filter_ctrl = mlx5_dev_filter_ctrl, 4520887aa7fSNélio Laranjeiro .rx_descriptor_status = mlx5_rx_descriptor_status, 4530887aa7fSNélio Laranjeiro .tx_descriptor_status = mlx5_tx_descriptor_status, 4540887aa7fSNélio Laranjeiro .rx_queue_intr_enable = mlx5_rx_intr_enable, 4550887aa7fSNélio Laranjeiro .rx_queue_intr_disable = mlx5_rx_intr_disable, 456d3e0f392SMatan Azrad .is_removed = mlx5_is_removed, 4570887aa7fSNélio Laranjeiro }; 4580887aa7fSNélio Laranjeiro 459e72dd09bSNélio Laranjeiro /** 460e72dd09bSNélio Laranjeiro * Verify and store value for device argument. 461e72dd09bSNélio Laranjeiro * 462e72dd09bSNélio Laranjeiro * @param[in] key 463e72dd09bSNélio Laranjeiro * Key argument to verify. 464e72dd09bSNélio Laranjeiro * @param[in] val 465e72dd09bSNélio Laranjeiro * Value associated with key. 466e72dd09bSNélio Laranjeiro * @param opaque 467e72dd09bSNélio Laranjeiro * User data. 468e72dd09bSNélio Laranjeiro * 469e72dd09bSNélio Laranjeiro * @return 470a6d83b6aSNélio Laranjeiro * 0 on success, a negative errno value otherwise and rte_errno is set. 471e72dd09bSNélio Laranjeiro */ 472e72dd09bSNélio Laranjeiro static int 473e72dd09bSNélio Laranjeiro mlx5_args_check(const char *key, const char *val, void *opaque) 474e72dd09bSNélio Laranjeiro { 4757fe24446SShahaf Shuler struct mlx5_dev_config *config = opaque; 47699c12dccSNélio Laranjeiro unsigned long tmp; 477e72dd09bSNélio Laranjeiro 4786de569f5SAdrien Mazarguil /* No-op, port representors are processed in mlx5_dev_spawn(). */ 4796de569f5SAdrien Mazarguil if (!strcmp(MLX5_REPRESENTOR, key)) 4806de569f5SAdrien Mazarguil return 0; 48199c12dccSNélio Laranjeiro errno = 0; 48299c12dccSNélio Laranjeiro tmp = strtoul(val, NULL, 0); 48399c12dccSNélio Laranjeiro if (errno) { 484a6d83b6aSNélio Laranjeiro rte_errno = errno; 485a170a30dSNélio Laranjeiro DRV_LOG(WARNING, "%s: \"%s\" is not a valid integer", key, val); 486a6d83b6aSNélio Laranjeiro return -rte_errno; 48799c12dccSNélio Laranjeiro } 48899c12dccSNélio Laranjeiro if (strcmp(MLX5_RXQ_CQE_COMP_EN, key) == 0) { 4897fe24446SShahaf Shuler config->cqe_comp = !!tmp; 490bc91e8dbSYongseok Koh } else if (strcmp(MLX5_RXQ_CQE_PAD_EN, key) == 0) { 491bc91e8dbSYongseok Koh config->cqe_pad = !!tmp; 49278c7a16dSYongseok Koh } else if (strcmp(MLX5_RXQ_PKT_PAD_EN, key) == 0) { 49378c7a16dSYongseok Koh config->hw_padding = !!tmp; 4947d6bf6b8SYongseok Koh } else if (strcmp(MLX5_RX_MPRQ_EN, key) == 0) { 4957d6bf6b8SYongseok Koh config->mprq.enabled = !!tmp; 4967d6bf6b8SYongseok Koh } else if (strcmp(MLX5_RX_MPRQ_LOG_STRIDE_NUM, key) == 0) { 4977d6bf6b8SYongseok Koh config->mprq.stride_num_n = tmp; 4987d6bf6b8SYongseok Koh } else if (strcmp(MLX5_RX_MPRQ_MAX_MEMCPY_LEN, key) == 0) { 4997d6bf6b8SYongseok Koh config->mprq.max_memcpy_len = tmp; 5007d6bf6b8SYongseok Koh } else if (strcmp(MLX5_RXQS_MIN_MPRQ, key) == 0) { 5017d6bf6b8SYongseok Koh config->mprq.min_rxqs_num = tmp; 5022a66cf37SYaacov Hazan } else if (strcmp(MLX5_TXQ_INLINE, key) == 0) { 5037fe24446SShahaf Shuler config->txq_inline = tmp; 5042a66cf37SYaacov Hazan } else if (strcmp(MLX5_TXQS_MIN_INLINE, key) == 0) { 5057fe24446SShahaf Shuler config->txqs_inline = tmp; 50609d8b416SYongseok Koh } else if (strcmp(MLX5_TXQS_MAX_VEC, key) == 0) { 50709d8b416SYongseok Koh config->txqs_vec = tmp; 508230189d9SNélio Laranjeiro } else if (strcmp(MLX5_TXQ_MPW_EN, key) == 0) { 509f9de8718SShahaf Shuler config->mps = !!tmp; 5106ce84bd8SYongseok Koh } else if (strcmp(MLX5_TXQ_MPW_HDR_DSEG_EN, key) == 0) { 5117fe24446SShahaf Shuler config->mpw_hdr_dseg = !!tmp; 5126ce84bd8SYongseok Koh } else if (strcmp(MLX5_TXQ_MAX_INLINE_LEN, key) == 0) { 5137fe24446SShahaf Shuler config->inline_max_packet_sz = tmp; 5145644d5b9SNelio Laranjeiro } else if (strcmp(MLX5_TX_VEC_EN, key) == 0) { 5157fe24446SShahaf Shuler config->tx_vec_en = !!tmp; 5165644d5b9SNelio Laranjeiro } else if (strcmp(MLX5_RX_VEC_EN, key) == 0) { 5177fe24446SShahaf Shuler config->rx_vec_en = !!tmp; 51878a54648SXueming Li } else if (strcmp(MLX5_L3_VXLAN_EN, key) == 0) { 51978a54648SXueming Li config->l3_vxlan_en = !!tmp; 520db209cc3SNélio Laranjeiro } else if (strcmp(MLX5_VF_NL_EN, key) == 0) { 521db209cc3SNélio Laranjeiro config->vf_nl_en = !!tmp; 52251e72d38SOri Kam } else if (strcmp(MLX5_DV_FLOW_EN, key) == 0) { 52351e72d38SOri Kam config->dv_flow_en = !!tmp; 52499c12dccSNélio Laranjeiro } else { 525a170a30dSNélio Laranjeiro DRV_LOG(WARNING, "%s: unknown parameter", key); 526a6d83b6aSNélio Laranjeiro rte_errno = EINVAL; 527a6d83b6aSNélio Laranjeiro return -rte_errno; 528e72dd09bSNélio Laranjeiro } 52999c12dccSNélio Laranjeiro return 0; 53099c12dccSNélio Laranjeiro } 531e72dd09bSNélio Laranjeiro 532e72dd09bSNélio Laranjeiro /** 533e72dd09bSNélio Laranjeiro * Parse device parameters. 534e72dd09bSNélio Laranjeiro * 5357fe24446SShahaf Shuler * @param config 5367fe24446SShahaf Shuler * Pointer to device configuration structure. 537e72dd09bSNélio Laranjeiro * @param devargs 538e72dd09bSNélio Laranjeiro * Device arguments structure. 539e72dd09bSNélio Laranjeiro * 540e72dd09bSNélio Laranjeiro * @return 541a6d83b6aSNélio Laranjeiro * 0 on success, a negative errno value otherwise and rte_errno is set. 542e72dd09bSNélio Laranjeiro */ 543e72dd09bSNélio Laranjeiro static int 5447fe24446SShahaf Shuler mlx5_args(struct mlx5_dev_config *config, struct rte_devargs *devargs) 545e72dd09bSNélio Laranjeiro { 546e72dd09bSNélio Laranjeiro const char **params = (const char *[]){ 54799c12dccSNélio Laranjeiro MLX5_RXQ_CQE_COMP_EN, 548bc91e8dbSYongseok Koh MLX5_RXQ_CQE_PAD_EN, 54978c7a16dSYongseok Koh MLX5_RXQ_PKT_PAD_EN, 5507d6bf6b8SYongseok Koh MLX5_RX_MPRQ_EN, 5517d6bf6b8SYongseok Koh MLX5_RX_MPRQ_LOG_STRIDE_NUM, 5527d6bf6b8SYongseok Koh MLX5_RX_MPRQ_MAX_MEMCPY_LEN, 5537d6bf6b8SYongseok Koh MLX5_RXQS_MIN_MPRQ, 5542a66cf37SYaacov Hazan MLX5_TXQ_INLINE, 5552a66cf37SYaacov Hazan MLX5_TXQS_MIN_INLINE, 55609d8b416SYongseok Koh MLX5_TXQS_MAX_VEC, 557230189d9SNélio Laranjeiro MLX5_TXQ_MPW_EN, 5586ce84bd8SYongseok Koh MLX5_TXQ_MPW_HDR_DSEG_EN, 5596ce84bd8SYongseok Koh MLX5_TXQ_MAX_INLINE_LEN, 5605644d5b9SNelio Laranjeiro MLX5_TX_VEC_EN, 5615644d5b9SNelio Laranjeiro MLX5_RX_VEC_EN, 56278a54648SXueming Li MLX5_L3_VXLAN_EN, 563db209cc3SNélio Laranjeiro MLX5_VF_NL_EN, 56451e72d38SOri Kam MLX5_DV_FLOW_EN, 5656de569f5SAdrien Mazarguil MLX5_REPRESENTOR, 566e72dd09bSNélio Laranjeiro NULL, 567e72dd09bSNélio Laranjeiro }; 568e72dd09bSNélio Laranjeiro struct rte_kvargs *kvlist; 569e72dd09bSNélio Laranjeiro int ret = 0; 570e72dd09bSNélio Laranjeiro int i; 571e72dd09bSNélio Laranjeiro 572e72dd09bSNélio Laranjeiro if (devargs == NULL) 573e72dd09bSNélio Laranjeiro return 0; 574e72dd09bSNélio Laranjeiro /* Following UGLY cast is done to pass checkpatch. */ 575e72dd09bSNélio Laranjeiro kvlist = rte_kvargs_parse(devargs->args, params); 576e72dd09bSNélio Laranjeiro if (kvlist == NULL) 577e72dd09bSNélio Laranjeiro return 0; 578e72dd09bSNélio Laranjeiro /* Process parameters. */ 579e72dd09bSNélio Laranjeiro for (i = 0; (params[i] != NULL); ++i) { 580e72dd09bSNélio Laranjeiro if (rte_kvargs_count(kvlist, params[i])) { 581e72dd09bSNélio Laranjeiro ret = rte_kvargs_process(kvlist, params[i], 5827fe24446SShahaf Shuler mlx5_args_check, config); 583a6d83b6aSNélio Laranjeiro if (ret) { 584a6d83b6aSNélio Laranjeiro rte_errno = EINVAL; 585a67323e4SShahaf Shuler rte_kvargs_free(kvlist); 586a6d83b6aSNélio Laranjeiro return -rte_errno; 587e72dd09bSNélio Laranjeiro } 588e72dd09bSNélio Laranjeiro } 589a67323e4SShahaf Shuler } 590e72dd09bSNélio Laranjeiro rte_kvargs_free(kvlist); 591e72dd09bSNélio Laranjeiro return 0; 592e72dd09bSNélio Laranjeiro } 593e72dd09bSNélio Laranjeiro 594fdf91e0fSJan Blunck static struct rte_pci_driver mlx5_driver; 595771fa900SAdrien Mazarguil 5964a984153SXueming Li /* 5974a984153SXueming Li * Reserved UAR address space for TXQ UAR(hw doorbell) mapping, process 5984a984153SXueming Li * local resource used by both primary and secondary to avoid duplicate 5994a984153SXueming Li * reservation. 6004a984153SXueming Li * The space has to be available on both primary and secondary process, 6014a984153SXueming Li * TXQ UAR maps to this area using fixed mmap w/o double check. 6024a984153SXueming Li */ 6034a984153SXueming Li static void *uar_base; 6044a984153SXueming Li 6058594a202SAnatoly Burakov static int 6065282bb1cSAnatoly Burakov find_lower_va_bound(const struct rte_memseg_list *msl, 60766cc45e2SAnatoly Burakov const struct rte_memseg *ms, void *arg) 6088594a202SAnatoly Burakov { 6098594a202SAnatoly Burakov void **addr = arg; 6108594a202SAnatoly Burakov 6115282bb1cSAnatoly Burakov if (msl->external) 6125282bb1cSAnatoly Burakov return 0; 6138594a202SAnatoly Burakov if (*addr == NULL) 6148594a202SAnatoly Burakov *addr = ms->addr; 6158594a202SAnatoly Burakov else 6168594a202SAnatoly Burakov *addr = RTE_MIN(*addr, ms->addr); 6178594a202SAnatoly Burakov 6188594a202SAnatoly Burakov return 0; 6198594a202SAnatoly Burakov } 6208594a202SAnatoly Burakov 6214a984153SXueming Li /** 6224a984153SXueming Li * Reserve UAR address space for primary process. 6234a984153SXueming Li * 624af4f09f2SNélio Laranjeiro * @param[in] dev 625af4f09f2SNélio Laranjeiro * Pointer to Ethernet device. 6264a984153SXueming Li * 6274a984153SXueming Li * @return 628a6d83b6aSNélio Laranjeiro * 0 on success, a negative errno value otherwise and rte_errno is set. 6294a984153SXueming Li */ 6304a984153SXueming Li static int 631af4f09f2SNélio Laranjeiro mlx5_uar_init_primary(struct rte_eth_dev *dev) 6324a984153SXueming Li { 633af4f09f2SNélio Laranjeiro struct priv *priv = dev->data->dev_private; 6344a984153SXueming Li void *addr = (void *)0; 6354a984153SXueming Li 6364a984153SXueming Li if (uar_base) { /* UAR address space mapped. */ 6374a984153SXueming Li priv->uar_base = uar_base; 6384a984153SXueming Li return 0; 6394a984153SXueming Li } 6404a984153SXueming Li /* find out lower bound of hugepage segments */ 6418594a202SAnatoly Burakov rte_memseg_walk(find_lower_va_bound, &addr); 6428594a202SAnatoly Burakov 6434a984153SXueming Li /* keep distance to hugepages to minimize potential conflicts. */ 6446bf10ab6SMoti Haimovsky addr = RTE_PTR_SUB(addr, (uintptr_t)(MLX5_UAR_OFFSET + MLX5_UAR_SIZE)); 6454a984153SXueming Li /* anonymous mmap, no real memory consumption. */ 6464a984153SXueming Li addr = mmap(addr, MLX5_UAR_SIZE, 6474a984153SXueming Li PROT_NONE, MAP_PRIVATE | MAP_ANONYMOUS, -1, 0); 6484a984153SXueming Li if (addr == MAP_FAILED) { 649a170a30dSNélio Laranjeiro DRV_LOG(ERR, 650a170a30dSNélio Laranjeiro "port %u failed to reserve UAR address space, please" 6510f99970bSNélio Laranjeiro " adjust MLX5_UAR_SIZE or try --base-virtaddr", 6520f99970bSNélio Laranjeiro dev->data->port_id); 653a6d83b6aSNélio Laranjeiro rte_errno = ENOMEM; 654a6d83b6aSNélio Laranjeiro return -rte_errno; 6554a984153SXueming Li } 6564a984153SXueming Li /* Accept either same addr or a new addr returned from mmap if target 6574a984153SXueming Li * range occupied. 6584a984153SXueming Li */ 659a170a30dSNélio Laranjeiro DRV_LOG(INFO, "port %u reserved UAR address space: %p", 660a170a30dSNélio Laranjeiro dev->data->port_id, addr); 6614a984153SXueming Li priv->uar_base = addr; /* for primary and secondary UAR re-mmap. */ 6624a984153SXueming Li uar_base = addr; /* process local, don't reserve again. */ 6634a984153SXueming Li return 0; 6644a984153SXueming Li } 6654a984153SXueming Li 6664a984153SXueming Li /** 6674a984153SXueming Li * Reserve UAR address space for secondary process, align with 6684a984153SXueming Li * primary process. 6694a984153SXueming Li * 670af4f09f2SNélio Laranjeiro * @param[in] dev 671af4f09f2SNélio Laranjeiro * Pointer to Ethernet device. 6724a984153SXueming Li * 6734a984153SXueming Li * @return 674a6d83b6aSNélio Laranjeiro * 0 on success, a negative errno value otherwise and rte_errno is set. 6754a984153SXueming Li */ 6764a984153SXueming Li static int 677af4f09f2SNélio Laranjeiro mlx5_uar_init_secondary(struct rte_eth_dev *dev) 6784a984153SXueming Li { 679af4f09f2SNélio Laranjeiro struct priv *priv = dev->data->dev_private; 6804a984153SXueming Li void *addr; 6814a984153SXueming Li 6824a984153SXueming Li assert(priv->uar_base); 6834a984153SXueming Li if (uar_base) { /* already reserved. */ 6844a984153SXueming Li assert(uar_base == priv->uar_base); 6854a984153SXueming Li return 0; 6864a984153SXueming Li } 6874a984153SXueming Li /* anonymous mmap, no real memory consumption. */ 6884a984153SXueming Li addr = mmap(priv->uar_base, MLX5_UAR_SIZE, 6894a984153SXueming Li PROT_NONE, MAP_PRIVATE | MAP_ANONYMOUS, -1, 0); 6904a984153SXueming Li if (addr == MAP_FAILED) { 691a170a30dSNélio Laranjeiro DRV_LOG(ERR, "port %u UAR mmap failed: %p size: %llu", 6920f99970bSNélio Laranjeiro dev->data->port_id, priv->uar_base, MLX5_UAR_SIZE); 693a6d83b6aSNélio Laranjeiro rte_errno = ENXIO; 694a6d83b6aSNélio Laranjeiro return -rte_errno; 6954a984153SXueming Li } 6964a984153SXueming Li if (priv->uar_base != addr) { 697a170a30dSNélio Laranjeiro DRV_LOG(ERR, 698a170a30dSNélio Laranjeiro "port %u UAR address %p size %llu occupied, please" 699a170a30dSNélio Laranjeiro " adjust MLX5_UAR_OFFSET or try EAL parameter" 700a170a30dSNélio Laranjeiro " --base-virtaddr", 7010f99970bSNélio Laranjeiro dev->data->port_id, priv->uar_base, MLX5_UAR_SIZE); 702a6d83b6aSNélio Laranjeiro rte_errno = ENXIO; 703a6d83b6aSNélio Laranjeiro return -rte_errno; 7044a984153SXueming Li } 7054a984153SXueming Li uar_base = addr; /* process local, don't reserve again */ 706a170a30dSNélio Laranjeiro DRV_LOG(INFO, "port %u reserved UAR address space: %p", 707a170a30dSNélio Laranjeiro dev->data->port_id, addr); 7084a984153SXueming Li return 0; 7094a984153SXueming Li } 7104a984153SXueming Li 711771fa900SAdrien Mazarguil /** 712f38c5457SAdrien Mazarguil * Spawn an Ethernet device from Verbs information. 713771fa900SAdrien Mazarguil * 714f38c5457SAdrien Mazarguil * @param dpdk_dev 715f38c5457SAdrien Mazarguil * Backing DPDK device. 716f38c5457SAdrien Mazarguil * @param ibv_dev 717f38c5457SAdrien Mazarguil * Verbs device. 718f87bfa8eSYongseok Koh * @param config 719f87bfa8eSYongseok Koh * Device configuration parameters. 7202b730263SAdrien Mazarguil * @param[in] switch_info 7212b730263SAdrien Mazarguil * Switch properties of Ethernet device. 722771fa900SAdrien Mazarguil * 723771fa900SAdrien Mazarguil * @return 724f38c5457SAdrien Mazarguil * A valid Ethernet device object on success, NULL otherwise and rte_errno 725206254b7SOphir Munk * is set. The following errors are defined: 7266de569f5SAdrien Mazarguil * 7276de569f5SAdrien Mazarguil * EBUSY: device is not supposed to be spawned. 728206254b7SOphir Munk * EEXIST: device is already spawned 729771fa900SAdrien Mazarguil */ 730f38c5457SAdrien Mazarguil static struct rte_eth_dev * 731f38c5457SAdrien Mazarguil mlx5_dev_spawn(struct rte_device *dpdk_dev, 732f38c5457SAdrien Mazarguil struct ibv_device *ibv_dev, 733f87bfa8eSYongseok Koh struct mlx5_dev_config config, 7342b730263SAdrien Mazarguil const struct mlx5_switch_info *switch_info) 735771fa900SAdrien Mazarguil { 736f5bf91deSMoti Haimovsky struct ibv_context *ctx = NULL; 7373ff4b086SAdrien Mazarguil struct ibv_device_attr_ex attr; 73868128934SAdrien Mazarguil struct ibv_port_attr port_attr; 7399083982cSAdrien Mazarguil struct ibv_pd *pd = NULL; 7406057a10bSAdrien Mazarguil struct mlx5dv_context dv_attr = { .comp_mask = 0 }; 7419083982cSAdrien Mazarguil struct rte_eth_dev *eth_dev = NULL; 7429083982cSAdrien Mazarguil struct priv *priv = NULL; 743771fa900SAdrien Mazarguil int err = 0; 74478c7a16dSYongseok Koh unsigned int hw_padding = 0; 745e192ef80SYaacov Hazan unsigned int mps; 746523f5a74SYongseok Koh unsigned int cqe_comp; 747bc91e8dbSYongseok Koh unsigned int cqe_pad = 0; 748772d3435SXueming Li unsigned int tunnel_en = 0; 7491f106da2SMatan Azrad unsigned int mpls_en = 0; 7505f8ba81cSXueming Li unsigned int swp = 0; 7517d6bf6b8SYongseok Koh unsigned int mprq = 0; 7527d6bf6b8SYongseok Koh unsigned int mprq_min_stride_size_n = 0; 7537d6bf6b8SYongseok Koh unsigned int mprq_max_stride_size_n = 0; 7547d6bf6b8SYongseok Koh unsigned int mprq_min_stride_num_n = 0; 7557d6bf6b8SYongseok Koh unsigned int mprq_max_stride_num_n = 0; 75668128934SAdrien Mazarguil struct ether_addr mac; 75768128934SAdrien Mazarguil char name[RTE_ETH_NAME_MAX_LEN]; 7582b730263SAdrien Mazarguil int own_domain_id = 0; 759206254b7SOphir Munk uint16_t port_id; 7602b730263SAdrien Mazarguil unsigned int i; 761771fa900SAdrien Mazarguil 7626de569f5SAdrien Mazarguil /* Determine if this port representor is supposed to be spawned. */ 7636de569f5SAdrien Mazarguil if (switch_info->representor && dpdk_dev->devargs) { 7646de569f5SAdrien Mazarguil struct rte_eth_devargs eth_da; 7656de569f5SAdrien Mazarguil 7666de569f5SAdrien Mazarguil err = rte_eth_devargs_parse(dpdk_dev->devargs->args, ð_da); 7676de569f5SAdrien Mazarguil if (err) { 7686de569f5SAdrien Mazarguil rte_errno = -err; 7696de569f5SAdrien Mazarguil DRV_LOG(ERR, "failed to process device arguments: %s", 7706de569f5SAdrien Mazarguil strerror(rte_errno)); 7716de569f5SAdrien Mazarguil return NULL; 7726de569f5SAdrien Mazarguil } 7736de569f5SAdrien Mazarguil for (i = 0; i < eth_da.nb_representor_ports; ++i) 7746de569f5SAdrien Mazarguil if (eth_da.representor_ports[i] == 7756de569f5SAdrien Mazarguil (uint16_t)switch_info->port_name) 7766de569f5SAdrien Mazarguil break; 7776de569f5SAdrien Mazarguil if (i == eth_da.nb_representor_ports) { 7786de569f5SAdrien Mazarguil rte_errno = EBUSY; 7796de569f5SAdrien Mazarguil return NULL; 7806de569f5SAdrien Mazarguil } 7816de569f5SAdrien Mazarguil } 782206254b7SOphir Munk /* Build device name. */ 783206254b7SOphir Munk if (!switch_info->representor) 784206254b7SOphir Munk rte_strlcpy(name, dpdk_dev->name, sizeof(name)); 785206254b7SOphir Munk else 786206254b7SOphir Munk snprintf(name, sizeof(name), "%s_representor_%u", 787206254b7SOphir Munk dpdk_dev->name, switch_info->port_name); 788206254b7SOphir Munk /* check if the device is already spawned */ 789206254b7SOphir Munk if (rte_eth_dev_get_port_by_name(name, &port_id) == 0) { 790206254b7SOphir Munk rte_errno = EEXIST; 791206254b7SOphir Munk return NULL; 792206254b7SOphir Munk } 793974f1e7eSYongseok Koh /* Prepare shared data between primary and secondary process. */ 794974f1e7eSYongseok Koh mlx5_prepare_shared_data(); 795f38c5457SAdrien Mazarguil errno = 0; 796f5bf91deSMoti Haimovsky ctx = mlx5_glue->dv_open_device(ibv_dev); 797f5bf91deSMoti Haimovsky if (ctx) { 798f5bf91deSMoti Haimovsky config.devx = 1; 799f5bf91deSMoti Haimovsky DRV_LOG(DEBUG, "DEVX is supported"); 800f5bf91deSMoti Haimovsky } else { 801f38c5457SAdrien Mazarguil ctx = mlx5_glue->open_device(ibv_dev); 802f38c5457SAdrien Mazarguil if (!ctx) { 803f38c5457SAdrien Mazarguil rte_errno = errno ? errno : ENODEV; 804f38c5457SAdrien Mazarguil return NULL; 805771fa900SAdrien Mazarguil } 806f5bf91deSMoti Haimovsky } 8075f8ba81cSXueming Li #ifdef HAVE_IBV_MLX5_MOD_SWP 8086057a10bSAdrien Mazarguil dv_attr.comp_mask |= MLX5DV_CONTEXT_MASK_SWP; 8095f8ba81cSXueming Li #endif 81043e9d979SShachar Beiser /* 81143e9d979SShachar Beiser * Multi-packet send is supported by ConnectX-4 Lx PF as well 81243e9d979SShachar Beiser * as all ConnectX-5 devices. 81343e9d979SShachar Beiser */ 814038e7251SShahaf Shuler #ifdef HAVE_IBV_DEVICE_TUNNEL_SUPPORT 8156057a10bSAdrien Mazarguil dv_attr.comp_mask |= MLX5DV_CONTEXT_MASK_TUNNEL_OFFLOADS; 816038e7251SShahaf Shuler #endif 8177d6bf6b8SYongseok Koh #ifdef HAVE_IBV_DEVICE_STRIDING_RQ_SUPPORT 8186057a10bSAdrien Mazarguil dv_attr.comp_mask |= MLX5DV_CONTEXT_MASK_STRIDING_RQ; 8197d6bf6b8SYongseok Koh #endif 8203ff4b086SAdrien Mazarguil mlx5_glue->dv_query_device(ctx, &dv_attr); 8216057a10bSAdrien Mazarguil if (dv_attr.flags & MLX5DV_CONTEXT_FLAGS_MPW_ALLOWED) { 8226057a10bSAdrien Mazarguil if (dv_attr.flags & MLX5DV_CONTEXT_FLAGS_ENHANCED_MPW) { 823a170a30dSNélio Laranjeiro DRV_LOG(DEBUG, "enhanced MPW is supported"); 82443e9d979SShachar Beiser mps = MLX5_MPW_ENHANCED; 82543e9d979SShachar Beiser } else { 826a170a30dSNélio Laranjeiro DRV_LOG(DEBUG, "MPW is supported"); 827e589960cSYongseok Koh mps = MLX5_MPW; 828e589960cSYongseok Koh } 829e589960cSYongseok Koh } else { 830a170a30dSNélio Laranjeiro DRV_LOG(DEBUG, "MPW isn't supported"); 83143e9d979SShachar Beiser mps = MLX5_MPW_DISABLED; 83243e9d979SShachar Beiser } 8335f8ba81cSXueming Li #ifdef HAVE_IBV_MLX5_MOD_SWP 8346057a10bSAdrien Mazarguil if (dv_attr.comp_mask & MLX5DV_CONTEXT_MASK_SWP) 8356057a10bSAdrien Mazarguil swp = dv_attr.sw_parsing_caps.sw_parsing_offloads; 8365f8ba81cSXueming Li DRV_LOG(DEBUG, "SWP support: %u", swp); 8375f8ba81cSXueming Li #endif 83868128934SAdrien Mazarguil config.swp = !!swp; 8397d6bf6b8SYongseok Koh #ifdef HAVE_IBV_DEVICE_STRIDING_RQ_SUPPORT 8406057a10bSAdrien Mazarguil if (dv_attr.comp_mask & MLX5DV_CONTEXT_MASK_STRIDING_RQ) { 8417d6bf6b8SYongseok Koh struct mlx5dv_striding_rq_caps mprq_caps = 8426057a10bSAdrien Mazarguil dv_attr.striding_rq_caps; 8437d6bf6b8SYongseok Koh 8447d6bf6b8SYongseok Koh DRV_LOG(DEBUG, "\tmin_single_stride_log_num_of_bytes: %d", 8457d6bf6b8SYongseok Koh mprq_caps.min_single_stride_log_num_of_bytes); 8467d6bf6b8SYongseok Koh DRV_LOG(DEBUG, "\tmax_single_stride_log_num_of_bytes: %d", 8477d6bf6b8SYongseok Koh mprq_caps.max_single_stride_log_num_of_bytes); 8487d6bf6b8SYongseok Koh DRV_LOG(DEBUG, "\tmin_single_wqe_log_num_of_strides: %d", 8497d6bf6b8SYongseok Koh mprq_caps.min_single_wqe_log_num_of_strides); 8507d6bf6b8SYongseok Koh DRV_LOG(DEBUG, "\tmax_single_wqe_log_num_of_strides: %d", 8517d6bf6b8SYongseok Koh mprq_caps.max_single_wqe_log_num_of_strides); 8527d6bf6b8SYongseok Koh DRV_LOG(DEBUG, "\tsupported_qpts: %d", 8537d6bf6b8SYongseok Koh mprq_caps.supported_qpts); 8547d6bf6b8SYongseok Koh DRV_LOG(DEBUG, "device supports Multi-Packet RQ"); 8557d6bf6b8SYongseok Koh mprq = 1; 8567d6bf6b8SYongseok Koh mprq_min_stride_size_n = 8577d6bf6b8SYongseok Koh mprq_caps.min_single_stride_log_num_of_bytes; 8587d6bf6b8SYongseok Koh mprq_max_stride_size_n = 8597d6bf6b8SYongseok Koh mprq_caps.max_single_stride_log_num_of_bytes; 8607d6bf6b8SYongseok Koh mprq_min_stride_num_n = 8617d6bf6b8SYongseok Koh mprq_caps.min_single_wqe_log_num_of_strides; 8627d6bf6b8SYongseok Koh mprq_max_stride_num_n = 8637d6bf6b8SYongseok Koh mprq_caps.max_single_wqe_log_num_of_strides; 86468128934SAdrien Mazarguil config.mprq.stride_num_n = RTE_MAX(MLX5_MPRQ_STRIDE_NUM_N, 86568128934SAdrien Mazarguil mprq_min_stride_num_n); 8667d6bf6b8SYongseok Koh } 8677d6bf6b8SYongseok Koh #endif 868523f5a74SYongseok Koh if (RTE_CACHE_LINE_SIZE == 128 && 8696057a10bSAdrien Mazarguil !(dv_attr.flags & MLX5DV_CONTEXT_FLAGS_CQE_128B_COMP)) 870523f5a74SYongseok Koh cqe_comp = 0; 871523f5a74SYongseok Koh else 872523f5a74SYongseok Koh cqe_comp = 1; 87368128934SAdrien Mazarguil config.cqe_comp = cqe_comp; 874bc91e8dbSYongseok Koh #ifdef HAVE_IBV_MLX5_MOD_CQE_128B_PAD 875bc91e8dbSYongseok Koh /* Whether device supports 128B Rx CQE padding. */ 876bc91e8dbSYongseok Koh cqe_pad = RTE_CACHE_LINE_SIZE == 128 && 877bc91e8dbSYongseok Koh (dv_attr.flags & MLX5DV_CONTEXT_FLAGS_CQE_128B_PAD); 878bc91e8dbSYongseok Koh #endif 879038e7251SShahaf Shuler #ifdef HAVE_IBV_DEVICE_TUNNEL_SUPPORT 8806057a10bSAdrien Mazarguil if (dv_attr.comp_mask & MLX5DV_CONTEXT_MASK_TUNNEL_OFFLOADS) { 8816057a10bSAdrien Mazarguil tunnel_en = ((dv_attr.tunnel_offloads_caps & 882038e7251SShahaf Shuler MLX5DV_RAW_PACKET_CAP_TUNNELED_OFFLOAD_VXLAN) && 8836057a10bSAdrien Mazarguil (dv_attr.tunnel_offloads_caps & 884038e7251SShahaf Shuler MLX5DV_RAW_PACKET_CAP_TUNNELED_OFFLOAD_GRE)); 885038e7251SShahaf Shuler } 886a170a30dSNélio Laranjeiro DRV_LOG(DEBUG, "tunnel offloading is %ssupported", 887a170a30dSNélio Laranjeiro tunnel_en ? "" : "not "); 888038e7251SShahaf Shuler #else 889a170a30dSNélio Laranjeiro DRV_LOG(WARNING, 890a170a30dSNélio Laranjeiro "tunnel offloading disabled due to old OFED/rdma-core version"); 891038e7251SShahaf Shuler #endif 89268128934SAdrien Mazarguil config.tunnel_en = tunnel_en; 8931f106da2SMatan Azrad #ifdef HAVE_IBV_DEVICE_MPLS_SUPPORT 8946057a10bSAdrien Mazarguil mpls_en = ((dv_attr.tunnel_offloads_caps & 8951f106da2SMatan Azrad MLX5DV_RAW_PACKET_CAP_TUNNELED_OFFLOAD_CW_MPLS_OVER_GRE) && 8966057a10bSAdrien Mazarguil (dv_attr.tunnel_offloads_caps & 8971f106da2SMatan Azrad MLX5DV_RAW_PACKET_CAP_TUNNELED_OFFLOAD_CW_MPLS_OVER_UDP)); 8981f106da2SMatan Azrad DRV_LOG(DEBUG, "MPLS over GRE/UDP tunnel offloading is %ssupported", 8991f106da2SMatan Azrad mpls_en ? "" : "not "); 9001f106da2SMatan Azrad #else 9011f106da2SMatan Azrad DRV_LOG(WARNING, "MPLS over GRE/UDP tunnel offloading disabled due to" 9021f106da2SMatan Azrad " old OFED/rdma-core version or firmware configuration"); 9031f106da2SMatan Azrad #endif 90468128934SAdrien Mazarguil config.mpls_en = mpls_en; 9053ff4b086SAdrien Mazarguil err = mlx5_glue->query_device_ex(ctx, NULL, &attr); 906012ad994SShahaf Shuler if (err) { 907012ad994SShahaf Shuler DEBUG("ibv_query_device_ex() failed"); 908771fa900SAdrien Mazarguil goto error; 909a6d83b6aSNélio Laranjeiro } 9102b730263SAdrien Mazarguil DRV_LOG(DEBUG, "naming Ethernet device \"%s\"", name); 91151e7fa8dSNélio Laranjeiro if (rte_eal_process_type() == RTE_PROC_SECONDARY) { 912f8b9a3baSXueming Li eth_dev = rte_eth_dev_attach_secondary(name); 913f8b9a3baSXueming Li if (eth_dev == NULL) { 914a170a30dSNélio Laranjeiro DRV_LOG(ERR, "can not attach rte ethdev"); 915a6d83b6aSNélio Laranjeiro rte_errno = ENOMEM; 916a6d83b6aSNélio Laranjeiro err = rte_errno; 917f8b9a3baSXueming Li goto error; 918f8b9a3baSXueming Li } 919f38c5457SAdrien Mazarguil eth_dev->device = dpdk_dev; 92087ec44ceSXueming Li eth_dev->dev_ops = &mlx5_dev_sec_ops; 921af4f09f2SNélio Laranjeiro err = mlx5_uar_init_secondary(eth_dev); 922012ad994SShahaf Shuler if (err) { 923012ad994SShahaf Shuler err = rte_errno; 9244a984153SXueming Li goto error; 925012ad994SShahaf Shuler } 926f8b9a3baSXueming Li /* Receive command fd from primary process */ 927af4f09f2SNélio Laranjeiro err = mlx5_socket_connect(eth_dev); 928012ad994SShahaf Shuler if (err < 0) { 929012ad994SShahaf Shuler err = rte_errno; 930f8b9a3baSXueming Li goto error; 931012ad994SShahaf Shuler } 932f8b9a3baSXueming Li /* Remap UAR for Tx queues. */ 933af4f09f2SNélio Laranjeiro err = mlx5_tx_uar_remap(eth_dev, err); 934012ad994SShahaf Shuler if (err) { 935012ad994SShahaf Shuler err = rte_errno; 936f8b9a3baSXueming Li goto error; 937012ad994SShahaf Shuler } 9381cfa649bSShahaf Shuler /* 9391cfa649bSShahaf Shuler * Ethdev pointer is still required as input since 9401cfa649bSShahaf Shuler * the primary device is not accessible from the 9411cfa649bSShahaf Shuler * secondary process. 9421cfa649bSShahaf Shuler */ 94368128934SAdrien Mazarguil eth_dev->rx_pkt_burst = mlx5_select_rx_function(eth_dev); 94468128934SAdrien Mazarguil eth_dev->tx_pkt_burst = mlx5_select_tx_function(eth_dev); 9459083982cSAdrien Mazarguil claim_zero(mlx5_glue->close_device(ctx)); 946f38c5457SAdrien Mazarguil return eth_dev; 947e1c3e305SMatan Azrad } 948771fa900SAdrien Mazarguil /* Check port status. */ 9499083982cSAdrien Mazarguil err = mlx5_glue->query_port(ctx, 1, &port_attr); 950771fa900SAdrien Mazarguil if (err) { 951a170a30dSNélio Laranjeiro DRV_LOG(ERR, "port query failed: %s", strerror(err)); 9529083982cSAdrien Mazarguil goto error; 953771fa900SAdrien Mazarguil } 9541371f4dfSOr Ami if (port_attr.link_layer != IBV_LINK_LAYER_ETHERNET) { 9559083982cSAdrien Mazarguil DRV_LOG(ERR, "port is not configured in Ethernet mode"); 956e1c3e305SMatan Azrad err = EINVAL; 9579083982cSAdrien Mazarguil goto error; 9581371f4dfSOr Ami } 959771fa900SAdrien Mazarguil if (port_attr.state != IBV_PORT_ACTIVE) 9609083982cSAdrien Mazarguil DRV_LOG(DEBUG, "port is not active: \"%s\" (%d)", 961a170a30dSNélio Laranjeiro mlx5_glue->port_state_str(port_attr.state), 962771fa900SAdrien Mazarguil port_attr.state); 963771fa900SAdrien Mazarguil /* Allocate protection domain. */ 9640e83b8e5SNelio Laranjeiro pd = mlx5_glue->alloc_pd(ctx); 965771fa900SAdrien Mazarguil if (pd == NULL) { 966a170a30dSNélio Laranjeiro DRV_LOG(ERR, "PD allocation failure"); 967771fa900SAdrien Mazarguil err = ENOMEM; 9689083982cSAdrien Mazarguil goto error; 969771fa900SAdrien Mazarguil } 970771fa900SAdrien Mazarguil priv = rte_zmalloc("ethdev private structure", 971771fa900SAdrien Mazarguil sizeof(*priv), 972771fa900SAdrien Mazarguil RTE_CACHE_LINE_SIZE); 973771fa900SAdrien Mazarguil if (priv == NULL) { 974a170a30dSNélio Laranjeiro DRV_LOG(ERR, "priv allocation failure"); 975771fa900SAdrien Mazarguil err = ENOMEM; 9769083982cSAdrien Mazarguil goto error; 977771fa900SAdrien Mazarguil } 978771fa900SAdrien Mazarguil priv->ctx = ctx; 9792b730263SAdrien Mazarguil strncpy(priv->ibdev_name, priv->ctx->device->name, 9802b730263SAdrien Mazarguil sizeof(priv->ibdev_name)); 98187ec44ceSXueming Li strncpy(priv->ibdev_path, priv->ctx->device->ibdev_path, 98287ec44ceSXueming Li sizeof(priv->ibdev_path)); 9833ff4b086SAdrien Mazarguil priv->device_attr = attr; 984771fa900SAdrien Mazarguil priv->pd = pd; 985771fa900SAdrien Mazarguil priv->mtu = ETHER_MTU; 9866bf10ab6SMoti Haimovsky #ifndef RTE_ARCH_64 9876bf10ab6SMoti Haimovsky /* Initialize UAR access locks for 32bit implementations. */ 9886bf10ab6SMoti Haimovsky rte_spinlock_init(&priv->uar_lock_cq); 9896bf10ab6SMoti Haimovsky for (i = 0; i < MLX5_UAR_PAGE_NUM_MAX; i++) 9906bf10ab6SMoti Haimovsky rte_spinlock_init(&priv->uar_lock[i]); 9916bf10ab6SMoti Haimovsky #endif 99226c08b97SAdrien Mazarguil /* Some internal functions rely on Netlink sockets, open them now. */ 9935366074bSNelio Laranjeiro priv->nl_socket_rdma = mlx5_nl_init(NETLINK_RDMA); 9945366074bSNelio Laranjeiro priv->nl_socket_route = mlx5_nl_init(NETLINK_ROUTE); 99526c08b97SAdrien Mazarguil priv->nl_sn = 0; 9962b730263SAdrien Mazarguil priv->representor = !!switch_info->representor; 9972b730263SAdrien Mazarguil priv->domain_id = RTE_ETH_DEV_SWITCH_DOMAIN_ID_INVALID; 9982b730263SAdrien Mazarguil priv->representor_id = 9992b730263SAdrien Mazarguil switch_info->representor ? switch_info->port_name : -1; 10002b730263SAdrien Mazarguil /* 10012b730263SAdrien Mazarguil * Look for sibling devices in order to reuse their switch domain 10022b730263SAdrien Mazarguil * if any, otherwise allocate one. 10032b730263SAdrien Mazarguil */ 10042b730263SAdrien Mazarguil i = mlx5_dev_to_port_id(dpdk_dev, NULL, 0); 10052b730263SAdrien Mazarguil if (i > 0) { 10062b730263SAdrien Mazarguil uint16_t port_id[i]; 10072b730263SAdrien Mazarguil 10082b730263SAdrien Mazarguil i = RTE_MIN(mlx5_dev_to_port_id(dpdk_dev, port_id, i), i); 10092b730263SAdrien Mazarguil while (i--) { 10102b730263SAdrien Mazarguil const struct priv *opriv = 10112b730263SAdrien Mazarguil rte_eth_devices[port_id[i]].data->dev_private; 10122b730263SAdrien Mazarguil 10132b730263SAdrien Mazarguil if (!opriv || 10142b730263SAdrien Mazarguil opriv->domain_id == 10152b730263SAdrien Mazarguil RTE_ETH_DEV_SWITCH_DOMAIN_ID_INVALID) 10162b730263SAdrien Mazarguil continue; 10172b730263SAdrien Mazarguil priv->domain_id = opriv->domain_id; 10182b730263SAdrien Mazarguil break; 10192b730263SAdrien Mazarguil } 10202b730263SAdrien Mazarguil } 10212b730263SAdrien Mazarguil if (priv->domain_id == RTE_ETH_DEV_SWITCH_DOMAIN_ID_INVALID) { 10222b730263SAdrien Mazarguil err = rte_eth_switch_domain_alloc(&priv->domain_id); 10232b730263SAdrien Mazarguil if (err) { 10242b730263SAdrien Mazarguil err = rte_errno; 10252b730263SAdrien Mazarguil DRV_LOG(ERR, "unable to allocate switch domain: %s", 10262b730263SAdrien Mazarguil strerror(rte_errno)); 10272b730263SAdrien Mazarguil goto error; 10282b730263SAdrien Mazarguil } 10292b730263SAdrien Mazarguil own_domain_id = 1; 10302b730263SAdrien Mazarguil } 1031f38c5457SAdrien Mazarguil err = mlx5_args(&config, dpdk_dev->devargs); 1032e72dd09bSNélio Laranjeiro if (err) { 1033012ad994SShahaf Shuler err = rte_errno; 103493068a9dSAdrien Mazarguil DRV_LOG(ERR, "failed to process device arguments: %s", 103593068a9dSAdrien Mazarguil strerror(rte_errno)); 10369083982cSAdrien Mazarguil goto error; 1037e72dd09bSNélio Laranjeiro } 103868128934SAdrien Mazarguil config.hw_csum = !!(attr.device_cap_flags_ex & IBV_DEVICE_RAW_IP_CSUM); 1039a170a30dSNélio Laranjeiro DRV_LOG(DEBUG, "checksum offloading is %ssupported", 10407fe24446SShahaf Shuler (config.hw_csum ? "" : "not ")); 10412dd8b721SViacheslav Ovsiienko #if !defined(HAVE_IBV_DEVICE_COUNTERS_SET_V42) && \ 10422dd8b721SViacheslav Ovsiienko !defined(HAVE_IBV_DEVICE_COUNTERS_SET_V45) 10432dd8b721SViacheslav Ovsiienko DRV_LOG(DEBUG, "counters are not supported"); 10449a761de8SOri Kam #endif 104558b1312eSYongseok Koh #ifndef HAVE_IBV_FLOW_DV_SUPPORT 104658b1312eSYongseok Koh if (config.dv_flow_en) { 104758b1312eSYongseok Koh DRV_LOG(WARNING, "DV flow is not supported"); 104858b1312eSYongseok Koh config.dv_flow_en = 0; 104958b1312eSYongseok Koh } 105058b1312eSYongseok Koh #endif 10517fe24446SShahaf Shuler config.ind_table_max_size = 10523ff4b086SAdrien Mazarguil attr.rss_caps.max_rwq_indirection_table_size; 105368128934SAdrien Mazarguil /* 105468128934SAdrien Mazarguil * Remove this check once DPDK supports larger/variable 105568128934SAdrien Mazarguil * indirection tables. 105668128934SAdrien Mazarguil */ 105768128934SAdrien Mazarguil if (config.ind_table_max_size > (unsigned int)ETH_RSS_RETA_SIZE_512) 10587fe24446SShahaf Shuler config.ind_table_max_size = ETH_RSS_RETA_SIZE_512; 1059a170a30dSNélio Laranjeiro DRV_LOG(DEBUG, "maximum Rx indirection table size is %u", 10607fe24446SShahaf Shuler config.ind_table_max_size); 10613ff4b086SAdrien Mazarguil config.hw_vlan_strip = !!(attr.raw_packet_caps & 106243e9d979SShachar Beiser IBV_RAW_PACKET_CAP_CVLAN_STRIPPING); 1063a170a30dSNélio Laranjeiro DRV_LOG(DEBUG, "VLAN stripping is %ssupported", 10647fe24446SShahaf Shuler (config.hw_vlan_strip ? "" : "not ")); 10653ff4b086SAdrien Mazarguil config.hw_fcs_strip = !!(attr.raw_packet_caps & 1066cd230a3eSShahaf Shuler IBV_RAW_PACKET_CAP_SCATTER_FCS); 1067a170a30dSNélio Laranjeiro DRV_LOG(DEBUG, "FCS stripping configuration is %ssupported", 10687fe24446SShahaf Shuler (config.hw_fcs_strip ? "" : "not ")); 1069*2014a7fbSYongseok Koh #if defined(HAVE_IBV_WQ_FLAG_RX_END_PADDING) 107078c7a16dSYongseok Koh hw_padding = !!attr.rx_pad_end_addr_align; 1071*2014a7fbSYongseok Koh #elif defined(HAVE_IBV_WQ_FLAGS_PCI_WRITE_END_PADDING) 1072*2014a7fbSYongseok Koh hw_padding = !!(attr.device_cap_flags_ex & 1073*2014a7fbSYongseok Koh IBV_DEVICE_PCI_WRITE_END_PADDING); 107443e9d979SShachar Beiser #endif 107578c7a16dSYongseok Koh if (config.hw_padding && !hw_padding) { 107678c7a16dSYongseok Koh DRV_LOG(DEBUG, "Rx end alignment padding isn't supported"); 107778c7a16dSYongseok Koh config.hw_padding = 0; 107878c7a16dSYongseok Koh } else if (config.hw_padding) { 107978c7a16dSYongseok Koh DRV_LOG(DEBUG, "Rx end alignment padding is enabled"); 108078c7a16dSYongseok Koh } 10813ff4b086SAdrien Mazarguil config.tso = (attr.tso_caps.max_tso > 0 && 10823ff4b086SAdrien Mazarguil (attr.tso_caps.supported_qpts & 108343e9d979SShachar Beiser (1 << IBV_QPT_RAW_PACKET))); 10847fe24446SShahaf Shuler if (config.tso) 10853ff4b086SAdrien Mazarguil config.tso_max_payload_sz = attr.tso_caps.max_tso; 1086f9de8718SShahaf Shuler /* 1087f9de8718SShahaf Shuler * MPW is disabled by default, while the Enhanced MPW is enabled 1088f9de8718SShahaf Shuler * by default. 1089f9de8718SShahaf Shuler */ 1090f9de8718SShahaf Shuler if (config.mps == MLX5_ARG_UNSET) 1091f9de8718SShahaf Shuler config.mps = (mps == MLX5_MPW_ENHANCED) ? MLX5_MPW_ENHANCED : 1092f9de8718SShahaf Shuler MLX5_MPW_DISABLED; 1093f9de8718SShahaf Shuler else 1094f9de8718SShahaf Shuler config.mps = config.mps ? mps : MLX5_MPW_DISABLED; 1095a170a30dSNélio Laranjeiro DRV_LOG(INFO, "%sMPS is %s", 10960f99970bSNélio Laranjeiro config.mps == MLX5_MPW_ENHANCED ? "enhanced " : "", 109768128934SAdrien Mazarguil config.mps != MLX5_MPW_DISABLED ? "enabled" : "disabled"); 10987fe24446SShahaf Shuler if (config.cqe_comp && !cqe_comp) { 1099a170a30dSNélio Laranjeiro DRV_LOG(WARNING, "Rx CQE compression isn't supported"); 11007fe24446SShahaf Shuler config.cqe_comp = 0; 1101523f5a74SYongseok Koh } 1102bc91e8dbSYongseok Koh if (config.cqe_pad && !cqe_pad) { 1103bc91e8dbSYongseok Koh DRV_LOG(WARNING, "Rx CQE padding isn't supported"); 1104bc91e8dbSYongseok Koh config.cqe_pad = 0; 1105bc91e8dbSYongseok Koh } else if (config.cqe_pad) { 1106bc91e8dbSYongseok Koh DRV_LOG(INFO, "Rx CQE padding is enabled"); 1107bc91e8dbSYongseok Koh } 11085c0e2db6SYongseok Koh if (config.mprq.enabled && mprq) { 11097d6bf6b8SYongseok Koh if (config.mprq.stride_num_n > mprq_max_stride_num_n || 11107d6bf6b8SYongseok Koh config.mprq.stride_num_n < mprq_min_stride_num_n) { 11117d6bf6b8SYongseok Koh config.mprq.stride_num_n = 11127d6bf6b8SYongseok Koh RTE_MAX(MLX5_MPRQ_STRIDE_NUM_N, 11137d6bf6b8SYongseok Koh mprq_min_stride_num_n); 11147d6bf6b8SYongseok Koh DRV_LOG(WARNING, 11157d6bf6b8SYongseok Koh "the number of strides" 11167d6bf6b8SYongseok Koh " for Multi-Packet RQ is out of range," 11177d6bf6b8SYongseok Koh " setting default value (%u)", 11187d6bf6b8SYongseok Koh 1 << config.mprq.stride_num_n); 11197d6bf6b8SYongseok Koh } 11207d6bf6b8SYongseok Koh config.mprq.min_stride_size_n = mprq_min_stride_size_n; 11217d6bf6b8SYongseok Koh config.mprq.max_stride_size_n = mprq_max_stride_size_n; 11225c0e2db6SYongseok Koh } else if (config.mprq.enabled && !mprq) { 11235c0e2db6SYongseok Koh DRV_LOG(WARNING, "Multi-Packet RQ isn't supported"); 11245c0e2db6SYongseok Koh config.mprq.enabled = 0; 11257d6bf6b8SYongseok Koh } 1126af4f09f2SNélio Laranjeiro eth_dev = rte_eth_dev_allocate(name); 1127af4f09f2SNélio Laranjeiro if (eth_dev == NULL) { 1128a170a30dSNélio Laranjeiro DRV_LOG(ERR, "can not allocate rte ethdev"); 1129af4f09f2SNélio Laranjeiro err = ENOMEM; 11309083982cSAdrien Mazarguil goto error; 1131af4f09f2SNélio Laranjeiro } 113215febafdSThomas Monjalon /* Flag to call rte_eth_dev_release_port() in rte_eth_dev_close(). */ 113315febafdSThomas Monjalon eth_dev->data->dev_flags |= RTE_ETH_DEV_CLOSE_REMOVE; 1134a7d3c627SThomas Monjalon if (priv->representor) { 11352b730263SAdrien Mazarguil eth_dev->data->dev_flags |= RTE_ETH_DEV_REPRESENTOR; 1136a7d3c627SThomas Monjalon eth_dev->data->representor_id = priv->representor_id; 1137a7d3c627SThomas Monjalon } 1138af4f09f2SNélio Laranjeiro eth_dev->data->dev_private = priv; 1139df428ceeSYongseok Koh priv->dev_data = eth_dev->data; 1140af4f09f2SNélio Laranjeiro eth_dev->data->mac_addrs = priv->mac; 1141f38c5457SAdrien Mazarguil eth_dev->device = dpdk_dev; 1142af4f09f2SNélio Laranjeiro err = mlx5_uar_init_primary(eth_dev); 1143012ad994SShahaf Shuler if (err) { 1144012ad994SShahaf Shuler err = rte_errno; 11459083982cSAdrien Mazarguil goto error; 1146012ad994SShahaf Shuler } 1147771fa900SAdrien Mazarguil /* Configure the first MAC address by default. */ 1148af4f09f2SNélio Laranjeiro if (mlx5_get_mac(eth_dev, &mac.addr_bytes)) { 1149a170a30dSNélio Laranjeiro DRV_LOG(ERR, 1150a170a30dSNélio Laranjeiro "port %u cannot get MAC address, is mlx5_en" 1151a170a30dSNélio Laranjeiro " loaded? (errno: %s)", 11528c3c2372SAdrien Mazarguil eth_dev->data->port_id, strerror(rte_errno)); 1153e1c3e305SMatan Azrad err = ENODEV; 11549083982cSAdrien Mazarguil goto error; 1155771fa900SAdrien Mazarguil } 1156a170a30dSNélio Laranjeiro DRV_LOG(INFO, 1157a170a30dSNélio Laranjeiro "port %u MAC address is %02x:%02x:%02x:%02x:%02x:%02x", 11580f99970bSNélio Laranjeiro eth_dev->data->port_id, 1159771fa900SAdrien Mazarguil mac.addr_bytes[0], mac.addr_bytes[1], 1160771fa900SAdrien Mazarguil mac.addr_bytes[2], mac.addr_bytes[3], 1161771fa900SAdrien Mazarguil mac.addr_bytes[4], mac.addr_bytes[5]); 1162771fa900SAdrien Mazarguil #ifndef NDEBUG 1163771fa900SAdrien Mazarguil { 1164771fa900SAdrien Mazarguil char ifname[IF_NAMESIZE]; 1165771fa900SAdrien Mazarguil 1166af4f09f2SNélio Laranjeiro if (mlx5_get_ifname(eth_dev, &ifname) == 0) 1167a170a30dSNélio Laranjeiro DRV_LOG(DEBUG, "port %u ifname is \"%s\"", 11680f99970bSNélio Laranjeiro eth_dev->data->port_id, ifname); 1169771fa900SAdrien Mazarguil else 1170a170a30dSNélio Laranjeiro DRV_LOG(DEBUG, "port %u ifname is unknown", 11710f99970bSNélio Laranjeiro eth_dev->data->port_id); 1172771fa900SAdrien Mazarguil } 1173771fa900SAdrien Mazarguil #endif 1174771fa900SAdrien Mazarguil /* Get actual MTU if possible. */ 1175a6d83b6aSNélio Laranjeiro err = mlx5_get_mtu(eth_dev, &priv->mtu); 1176012ad994SShahaf Shuler if (err) { 1177012ad994SShahaf Shuler err = rte_errno; 11789083982cSAdrien Mazarguil goto error; 1179012ad994SShahaf Shuler } 1180a170a30dSNélio Laranjeiro DRV_LOG(DEBUG, "port %u MTU is %u", eth_dev->data->port_id, 1181a170a30dSNélio Laranjeiro priv->mtu); 118268128934SAdrien Mazarguil /* Initialize burst functions to prevent crashes before link-up. */ 1183e313ef4cSShahaf Shuler eth_dev->rx_pkt_burst = removed_rx_burst; 1184e313ef4cSShahaf Shuler eth_dev->tx_pkt_burst = removed_tx_burst; 1185771fa900SAdrien Mazarguil eth_dev->dev_ops = &mlx5_dev_ops; 1186272733b5SNélio Laranjeiro /* Register MAC address. */ 1187272733b5SNélio Laranjeiro claim_zero(mlx5_mac_addr_add(eth_dev, &mac, 0, 0)); 1188f87bfa8eSYongseok Koh if (config.vf && config.vf_nl_en) 1189ccdcba53SNélio Laranjeiro mlx5_nl_mac_addr_sync(eth_dev); 1190d53180afSMoti Haimovsky priv->tcf_context = mlx5_flow_tcf_context_create(); 1191d53180afSMoti Haimovsky if (!priv->tcf_context) { 119257123c00SYongseok Koh err = -rte_errno; 119357123c00SYongseok Koh DRV_LOG(WARNING, 119457123c00SYongseok Koh "flow rules relying on switch offloads will not be" 119557123c00SYongseok Koh " supported: cannot open libmnl socket: %s", 119657123c00SYongseok Koh strerror(rte_errno)); 119757123c00SYongseok Koh } else { 119857123c00SYongseok Koh struct rte_flow_error error; 119957123c00SYongseok Koh unsigned int ifindex = mlx5_ifindex(eth_dev); 120057123c00SYongseok Koh 120157123c00SYongseok Koh if (!ifindex) { 120257123c00SYongseok Koh err = -rte_errno; 120357123c00SYongseok Koh error.message = 120457123c00SYongseok Koh "cannot retrieve network interface index"; 120557123c00SYongseok Koh } else { 1206d53180afSMoti Haimovsky err = mlx5_flow_tcf_init(priv->tcf_context, 1207d53180afSMoti Haimovsky ifindex, &error); 120857123c00SYongseok Koh } 120957123c00SYongseok Koh if (err) { 121057123c00SYongseok Koh DRV_LOG(WARNING, 121157123c00SYongseok Koh "flow rules relying on switch offloads will" 121257123c00SYongseok Koh " not be supported: %s: %s", 121357123c00SYongseok Koh error.message, strerror(rte_errno)); 1214d53180afSMoti Haimovsky mlx5_flow_tcf_context_destroy(priv->tcf_context); 1215d53180afSMoti Haimovsky priv->tcf_context = NULL; 121657123c00SYongseok Koh } 121757123c00SYongseok Koh } 1218c8ffb8a9SNélio Laranjeiro TAILQ_INIT(&priv->flows); 12191b37f5d8SNélio Laranjeiro TAILQ_INIT(&priv->ctrl_flows); 12201e3a39f7SXueming Li /* Hint libmlx5 to use PMD allocator for data plane resources */ 12211e3a39f7SXueming Li struct mlx5dv_ctx_allocators alctr = { 12221e3a39f7SXueming Li .alloc = &mlx5_alloc_verbs_buf, 12231e3a39f7SXueming Li .free = &mlx5_free_verbs_buf, 12241e3a39f7SXueming Li .data = priv, 12251e3a39f7SXueming Li }; 122668128934SAdrien Mazarguil mlx5_glue->dv_set_context_attr(ctx, MLX5DV_CTX_ATTR_BUF_ALLOCATORS, 12271e3a39f7SXueming Li (void *)((uintptr_t)&alctr)); 1228771fa900SAdrien Mazarguil /* Bring Ethernet device up. */ 1229a170a30dSNélio Laranjeiro DRV_LOG(DEBUG, "port %u forcing Ethernet interface up", 12300f99970bSNélio Laranjeiro eth_dev->data->port_id); 12317ba5320bSNélio Laranjeiro mlx5_set_link_up(eth_dev); 1232a85a606cSShahaf Shuler /* 1233a85a606cSShahaf Shuler * Even though the interrupt handler is not installed yet, 1234a85a606cSShahaf Shuler * interrupts will still trigger on the asyn_fd from 1235a85a606cSShahaf Shuler * Verbs context returned by ibv_open_device(). 1236a85a606cSShahaf Shuler */ 1237a85a606cSShahaf Shuler mlx5_link_update(eth_dev, 0); 12387fe24446SShahaf Shuler /* Store device configuration on private structure. */ 12397fe24446SShahaf Shuler priv->config = config; 124078be8852SNelio Laranjeiro /* Supported Verbs flow priority number detection. */ 12412815702bSNelio Laranjeiro err = mlx5_flow_discover_priorities(eth_dev); 12422815702bSNelio Laranjeiro if (err < 0) 12439083982cSAdrien Mazarguil goto error; 12442815702bSNelio Laranjeiro priv->config.flow_prio = err; 12450ace586dSXueming Li /* 12460ace586dSXueming Li * Once the device is added to the list of memory event 12470ace586dSXueming Li * callback, its global MR cache table cannot be expanded 12480ace586dSXueming Li * on the fly because of deadlock. If it overflows, lookup 12490ace586dSXueming Li * should be done by searching MR list linearly, which is slow. 12500ace586dSXueming Li */ 12510ace586dSXueming Li err = mlx5_mr_btree_init(&priv->mr.cache, 12520ace586dSXueming Li MLX5_MR_BTREE_CACHE_N * 2, 12530ace586dSXueming Li eth_dev->device->numa_node); 12540ace586dSXueming Li if (err) { 12550ace586dSXueming Li err = rte_errno; 12569083982cSAdrien Mazarguil goto error; 12570ace586dSXueming Li } 1258e89c15b6SAdrien Mazarguil /* Add device to memory callback list. */ 1259e89c15b6SAdrien Mazarguil rte_rwlock_write_lock(&mlx5_shared_data->mem_event_rwlock); 1260e89c15b6SAdrien Mazarguil LIST_INSERT_HEAD(&mlx5_shared_data->mem_event_cb_list, 1261e89c15b6SAdrien Mazarguil priv, mem_event_cb); 1262e89c15b6SAdrien Mazarguil rte_rwlock_write_unlock(&mlx5_shared_data->mem_event_rwlock); 1263f38c5457SAdrien Mazarguil return eth_dev; 12649083982cSAdrien Mazarguil error: 126526c08b97SAdrien Mazarguil if (priv) { 126626c08b97SAdrien Mazarguil if (priv->nl_socket_route >= 0) 126726c08b97SAdrien Mazarguil close(priv->nl_socket_route); 126826c08b97SAdrien Mazarguil if (priv->nl_socket_rdma >= 0) 126926c08b97SAdrien Mazarguil close(priv->nl_socket_rdma); 1270d53180afSMoti Haimovsky if (priv->tcf_context) 1271d53180afSMoti Haimovsky mlx5_flow_tcf_context_destroy(priv->tcf_context); 12722b730263SAdrien Mazarguil if (own_domain_id) 12732b730263SAdrien Mazarguil claim_zero(rte_eth_switch_domain_free(priv->domain_id)); 1274771fa900SAdrien Mazarguil rte_free(priv); 1275e16adf08SThomas Monjalon if (eth_dev != NULL) 1276e16adf08SThomas Monjalon eth_dev->data->dev_private = NULL; 127726c08b97SAdrien Mazarguil } 1278771fa900SAdrien Mazarguil if (pd) 12790e83b8e5SNelio Laranjeiro claim_zero(mlx5_glue->dealloc_pd(pd)); 1280e16adf08SThomas Monjalon if (eth_dev != NULL) { 1281e16adf08SThomas Monjalon /* mac_addrs must not be freed alone because part of dev_private */ 1282e16adf08SThomas Monjalon eth_dev->data->mac_addrs = NULL; 1283690de285SRaslan Darawsheh rte_eth_dev_release_port(eth_dev); 1284e16adf08SThomas Monjalon } 12853ff4b086SAdrien Mazarguil if (ctx) 12863ff4b086SAdrien Mazarguil claim_zero(mlx5_glue->close_device(ctx)); 1287f38c5457SAdrien Mazarguil assert(err > 0); 1288a6d83b6aSNélio Laranjeiro rte_errno = err; 1289f38c5457SAdrien Mazarguil return NULL; 1290f38c5457SAdrien Mazarguil } 1291f38c5457SAdrien Mazarguil 1292116f90adSAdrien Mazarguil /** Data associated with devices to spawn. */ 1293116f90adSAdrien Mazarguil struct mlx5_dev_spawn_data { 1294116f90adSAdrien Mazarguil unsigned int ifindex; /**< Network interface index. */ 1295116f90adSAdrien Mazarguil struct mlx5_switch_info info; /**< Switch information. */ 1296116f90adSAdrien Mazarguil struct ibv_device *ibv_dev; /**< Associated IB device. */ 1297116f90adSAdrien Mazarguil struct rte_eth_dev *eth_dev; /**< Associated Ethernet device. */ 1298116f90adSAdrien Mazarguil }; 1299116f90adSAdrien Mazarguil 1300116f90adSAdrien Mazarguil /** 1301116f90adSAdrien Mazarguil * Comparison callback to sort device data. 1302116f90adSAdrien Mazarguil * 1303116f90adSAdrien Mazarguil * This is meant to be used with qsort(). 1304116f90adSAdrien Mazarguil * 1305116f90adSAdrien Mazarguil * @param a[in] 1306116f90adSAdrien Mazarguil * Pointer to pointer to first data object. 1307116f90adSAdrien Mazarguil * @param b[in] 1308116f90adSAdrien Mazarguil * Pointer to pointer to second data object. 1309116f90adSAdrien Mazarguil * 1310116f90adSAdrien Mazarguil * @return 1311116f90adSAdrien Mazarguil * 0 if both objects are equal, less than 0 if the first argument is less 1312116f90adSAdrien Mazarguil * than the second, greater than 0 otherwise. 1313116f90adSAdrien Mazarguil */ 1314116f90adSAdrien Mazarguil static int 1315116f90adSAdrien Mazarguil mlx5_dev_spawn_data_cmp(const void *a, const void *b) 1316116f90adSAdrien Mazarguil { 1317116f90adSAdrien Mazarguil const struct mlx5_switch_info *si_a = 1318116f90adSAdrien Mazarguil &((const struct mlx5_dev_spawn_data *)a)->info; 1319116f90adSAdrien Mazarguil const struct mlx5_switch_info *si_b = 1320116f90adSAdrien Mazarguil &((const struct mlx5_dev_spawn_data *)b)->info; 1321116f90adSAdrien Mazarguil int ret; 1322116f90adSAdrien Mazarguil 1323116f90adSAdrien Mazarguil /* Master device first. */ 1324116f90adSAdrien Mazarguil ret = si_b->master - si_a->master; 1325116f90adSAdrien Mazarguil if (ret) 1326116f90adSAdrien Mazarguil return ret; 1327116f90adSAdrien Mazarguil /* Then representor devices. */ 1328116f90adSAdrien Mazarguil ret = si_b->representor - si_a->representor; 1329116f90adSAdrien Mazarguil if (ret) 1330116f90adSAdrien Mazarguil return ret; 1331116f90adSAdrien Mazarguil /* Unidentified devices come last in no specific order. */ 1332116f90adSAdrien Mazarguil if (!si_a->representor) 1333116f90adSAdrien Mazarguil return 0; 1334116f90adSAdrien Mazarguil /* Order representors by name. */ 1335116f90adSAdrien Mazarguil return si_a->port_name - si_b->port_name; 1336116f90adSAdrien Mazarguil } 1337116f90adSAdrien Mazarguil 1338f38c5457SAdrien Mazarguil /** 1339f38c5457SAdrien Mazarguil * DPDK callback to register a PCI device. 1340f38c5457SAdrien Mazarguil * 13412b730263SAdrien Mazarguil * This function spawns Ethernet devices out of a given PCI device. 1342f38c5457SAdrien Mazarguil * 1343f38c5457SAdrien Mazarguil * @param[in] pci_drv 1344f38c5457SAdrien Mazarguil * PCI driver structure (mlx5_driver). 1345f38c5457SAdrien Mazarguil * @param[in] pci_dev 1346f38c5457SAdrien Mazarguil * PCI device information. 1347f38c5457SAdrien Mazarguil * 1348f38c5457SAdrien Mazarguil * @return 1349f38c5457SAdrien Mazarguil * 0 on success, a negative errno value otherwise and rte_errno is set. 1350f38c5457SAdrien Mazarguil */ 1351f38c5457SAdrien Mazarguil static int 1352f38c5457SAdrien Mazarguil mlx5_pci_probe(struct rte_pci_driver *pci_drv __rte_unused, 1353f38c5457SAdrien Mazarguil struct rte_pci_device *pci_dev) 1354f38c5457SAdrien Mazarguil { 1355f38c5457SAdrien Mazarguil struct ibv_device **ibv_list; 135626c08b97SAdrien Mazarguil unsigned int n = 0; 1357f87bfa8eSYongseok Koh struct mlx5_dev_config dev_config; 1358f38c5457SAdrien Mazarguil int ret; 1359f38c5457SAdrien Mazarguil 1360f38c5457SAdrien Mazarguil assert(pci_drv == &mlx5_driver); 1361f38c5457SAdrien Mazarguil errno = 0; 1362f38c5457SAdrien Mazarguil ibv_list = mlx5_glue->get_device_list(&ret); 1363f38c5457SAdrien Mazarguil if (!ibv_list) { 1364f38c5457SAdrien Mazarguil rte_errno = errno ? errno : ENOSYS; 1365f38c5457SAdrien Mazarguil DRV_LOG(ERR, "cannot list devices, is ib_uverbs loaded?"); 1366a6d83b6aSNélio Laranjeiro return -rte_errno; 1367a6d83b6aSNélio Laranjeiro } 136826c08b97SAdrien Mazarguil 136926c08b97SAdrien Mazarguil struct ibv_device *ibv_match[ret + 1]; 137026c08b97SAdrien Mazarguil 1371f38c5457SAdrien Mazarguil while (ret-- > 0) { 1372f38c5457SAdrien Mazarguil struct rte_pci_addr pci_addr; 1373f38c5457SAdrien Mazarguil 1374f38c5457SAdrien Mazarguil DRV_LOG(DEBUG, "checking device \"%s\"", ibv_list[ret]->name); 1375f38c5457SAdrien Mazarguil if (mlx5_ibv_device_to_pci_addr(ibv_list[ret], &pci_addr)) 1376f38c5457SAdrien Mazarguil continue; 1377f38c5457SAdrien Mazarguil if (pci_dev->addr.domain != pci_addr.domain || 1378f38c5457SAdrien Mazarguil pci_dev->addr.bus != pci_addr.bus || 1379f38c5457SAdrien Mazarguil pci_dev->addr.devid != pci_addr.devid || 1380f38c5457SAdrien Mazarguil pci_dev->addr.function != pci_addr.function) 1381f38c5457SAdrien Mazarguil continue; 138226c08b97SAdrien Mazarguil DRV_LOG(INFO, "PCI information matches for device \"%s\"", 1383f38c5457SAdrien Mazarguil ibv_list[ret]->name); 138426c08b97SAdrien Mazarguil ibv_match[n++] = ibv_list[ret]; 138526c08b97SAdrien Mazarguil } 138626c08b97SAdrien Mazarguil ibv_match[n] = NULL; 138726c08b97SAdrien Mazarguil 1388116f90adSAdrien Mazarguil struct mlx5_dev_spawn_data list[n]; 13895366074bSNelio Laranjeiro int nl_route = n ? mlx5_nl_init(NETLINK_ROUTE) : -1; 13905366074bSNelio Laranjeiro int nl_rdma = n ? mlx5_nl_init(NETLINK_RDMA) : -1; 139126c08b97SAdrien Mazarguil unsigned int i; 13922b730263SAdrien Mazarguil unsigned int u; 139326c08b97SAdrien Mazarguil 139426c08b97SAdrien Mazarguil /* 139526c08b97SAdrien Mazarguil * The existence of several matching entries (n > 1) means port 139626c08b97SAdrien Mazarguil * representors have been instantiated. No existing Verbs call nor 139726c08b97SAdrien Mazarguil * /sys entries can tell them apart, this can only be done through 139826c08b97SAdrien Mazarguil * Netlink calls assuming kernel drivers are recent enough to 139926c08b97SAdrien Mazarguil * support them. 140026c08b97SAdrien Mazarguil * 1401f872b4b9SNelio Laranjeiro * In the event of identification failure through Netlink, try again 1402f872b4b9SNelio Laranjeiro * through sysfs, then either: 140326c08b97SAdrien Mazarguil * 140426c08b97SAdrien Mazarguil * 1. No device matches (n == 0), complain and bail out. 140526c08b97SAdrien Mazarguil * 2. A single IB device matches (n == 1) and is not a representor, 140626c08b97SAdrien Mazarguil * assume no switch support. 140726c08b97SAdrien Mazarguil * 3. Otherwise no safe assumptions can be made; complain louder and 140826c08b97SAdrien Mazarguil * bail out. 140926c08b97SAdrien Mazarguil */ 141026c08b97SAdrien Mazarguil for (i = 0; i != n; ++i) { 1411116f90adSAdrien Mazarguil list[i].ibv_dev = ibv_match[i]; 1412116f90adSAdrien Mazarguil list[i].eth_dev = NULL; 141326c08b97SAdrien Mazarguil if (nl_rdma < 0) 1414116f90adSAdrien Mazarguil list[i].ifindex = 0; 141526c08b97SAdrien Mazarguil else 1416116f90adSAdrien Mazarguil list[i].ifindex = mlx5_nl_ifindex 1417116f90adSAdrien Mazarguil (nl_rdma, list[i].ibv_dev->name); 141826c08b97SAdrien Mazarguil if (nl_route < 0 || 1419116f90adSAdrien Mazarguil !list[i].ifindex || 1420116f90adSAdrien Mazarguil mlx5_nl_switch_info(nl_route, list[i].ifindex, 1421f872b4b9SNelio Laranjeiro &list[i].info) || 1422f872b4b9SNelio Laranjeiro ((!list[i].info.representor && !list[i].info.master) && 1423f872b4b9SNelio Laranjeiro mlx5_sysfs_switch_info(list[i].ifindex, &list[i].info))) { 1424116f90adSAdrien Mazarguil list[i].ifindex = 0; 1425116f90adSAdrien Mazarguil memset(&list[i].info, 0, sizeof(list[i].info)); 142626c08b97SAdrien Mazarguil continue; 142726c08b97SAdrien Mazarguil } 142826c08b97SAdrien Mazarguil } 142926c08b97SAdrien Mazarguil if (nl_rdma >= 0) 143026c08b97SAdrien Mazarguil close(nl_rdma); 143126c08b97SAdrien Mazarguil if (nl_route >= 0) 143226c08b97SAdrien Mazarguil close(nl_route); 14332b730263SAdrien Mazarguil /* Count unidentified devices. */ 14342b730263SAdrien Mazarguil for (u = 0, i = 0; i != n; ++i) 1435116f90adSAdrien Mazarguil if (!list[i].info.master && !list[i].info.representor) 14362b730263SAdrien Mazarguil ++u; 14372b730263SAdrien Mazarguil if (u) { 14382b730263SAdrien Mazarguil if (n == 1 && u == 1) { 143926c08b97SAdrien Mazarguil /* Case #2. */ 144026c08b97SAdrien Mazarguil DRV_LOG(INFO, "no switch support detected"); 144126c08b97SAdrien Mazarguil } else { 144226c08b97SAdrien Mazarguil /* Case #3. */ 144326c08b97SAdrien Mazarguil DRV_LOG(ERR, 144426c08b97SAdrien Mazarguil "unable to tell which of the matching devices" 144526c08b97SAdrien Mazarguil " is the master (lack of kernel support?)"); 144626c08b97SAdrien Mazarguil n = 0; 144726c08b97SAdrien Mazarguil } 1448f38c5457SAdrien Mazarguil } 1449116f90adSAdrien Mazarguil /* 1450116f90adSAdrien Mazarguil * Sort list to probe devices in natural order for users convenience 1451116f90adSAdrien Mazarguil * (i.e. master first, then representors from lowest to highest ID). 1452116f90adSAdrien Mazarguil */ 1453116f90adSAdrien Mazarguil if (n) 1454116f90adSAdrien Mazarguil qsort(list, n, sizeof(*list), mlx5_dev_spawn_data_cmp); 1455f87bfa8eSYongseok Koh /* Default configuration. */ 1456f87bfa8eSYongseok Koh dev_config = (struct mlx5_dev_config){ 145778c7a16dSYongseok Koh .hw_padding = 0, 1458f87bfa8eSYongseok Koh .mps = MLX5_ARG_UNSET, 1459f87bfa8eSYongseok Koh .tx_vec_en = 1, 1460f87bfa8eSYongseok Koh .rx_vec_en = 1, 1461f87bfa8eSYongseok Koh .txq_inline = MLX5_ARG_UNSET, 1462f87bfa8eSYongseok Koh .txqs_inline = MLX5_ARG_UNSET, 146309d8b416SYongseok Koh .txqs_vec = MLX5_ARG_UNSET, 1464f87bfa8eSYongseok Koh .inline_max_packet_sz = MLX5_ARG_UNSET, 1465f87bfa8eSYongseok Koh .vf_nl_en = 1, 1466f87bfa8eSYongseok Koh .mprq = { 1467f87bfa8eSYongseok Koh .enabled = 0, /* Disabled by default. */ 1468f87bfa8eSYongseok Koh .stride_num_n = MLX5_MPRQ_STRIDE_NUM_N, 1469f87bfa8eSYongseok Koh .max_memcpy_len = MLX5_MPRQ_MEMCPY_DEFAULT_LEN, 1470f87bfa8eSYongseok Koh .min_rxqs_num = MLX5_MPRQ_MIN_RXQS, 1471f87bfa8eSYongseok Koh }, 1472f87bfa8eSYongseok Koh }; 1473f87bfa8eSYongseok Koh /* Device speicific configuration. */ 1474f38c5457SAdrien Mazarguil switch (pci_dev->id.device_id) { 147509d8b416SYongseok Koh case PCI_DEVICE_ID_MELLANOX_CONNECTX5BF: 147609d8b416SYongseok Koh dev_config.txqs_vec = MLX5_VPMD_MAX_TXQS_BLUEFIELD; 147709d8b416SYongseok Koh break; 1478f38c5457SAdrien Mazarguil case PCI_DEVICE_ID_MELLANOX_CONNECTX4VF: 1479f38c5457SAdrien Mazarguil case PCI_DEVICE_ID_MELLANOX_CONNECTX4LXVF: 1480f38c5457SAdrien Mazarguil case PCI_DEVICE_ID_MELLANOX_CONNECTX5VF: 1481f38c5457SAdrien Mazarguil case PCI_DEVICE_ID_MELLANOX_CONNECTX5EXVF: 1482f87bfa8eSYongseok Koh dev_config.vf = 1; 1483f38c5457SAdrien Mazarguil break; 1484f38c5457SAdrien Mazarguil default: 1485f87bfa8eSYongseok Koh break; 1486f38c5457SAdrien Mazarguil } 148709d8b416SYongseok Koh /* Set architecture-dependent default value if unset. */ 148809d8b416SYongseok Koh if (dev_config.txqs_vec == MLX5_ARG_UNSET) 148909d8b416SYongseok Koh dev_config.txqs_vec = MLX5_VPMD_MAX_TXQS; 14902b730263SAdrien Mazarguil for (i = 0; i != n; ++i) { 14912b730263SAdrien Mazarguil uint32_t restore; 14922b730263SAdrien Mazarguil 1493f87bfa8eSYongseok Koh list[i].eth_dev = mlx5_dev_spawn(&pci_dev->device, 1494f87bfa8eSYongseok Koh list[i].ibv_dev, dev_config, 1495f87bfa8eSYongseok Koh &list[i].info); 14966de569f5SAdrien Mazarguil if (!list[i].eth_dev) { 1497206254b7SOphir Munk if (rte_errno != EBUSY && rte_errno != EEXIST) 14982b730263SAdrien Mazarguil break; 1499206254b7SOphir Munk /* Device is disabled or already spawned. Ignore it. */ 15006de569f5SAdrien Mazarguil continue; 15016de569f5SAdrien Mazarguil } 1502116f90adSAdrien Mazarguil restore = list[i].eth_dev->data->dev_flags; 1503116f90adSAdrien Mazarguil rte_eth_copy_pci_info(list[i].eth_dev, pci_dev); 15042b730263SAdrien Mazarguil /* Restore non-PCI flags cleared by the above call. */ 1505116f90adSAdrien Mazarguil list[i].eth_dev->data->dev_flags |= restore; 1506116f90adSAdrien Mazarguil rte_eth_dev_probing_finish(list[i].eth_dev); 15072b730263SAdrien Mazarguil } 1508f38c5457SAdrien Mazarguil mlx5_glue->free_device_list(ibv_list); 150926c08b97SAdrien Mazarguil if (!n) { 1510f38c5457SAdrien Mazarguil DRV_LOG(WARNING, 1511f38c5457SAdrien Mazarguil "no Verbs device matches PCI device " PCI_PRI_FMT "," 1512f38c5457SAdrien Mazarguil " are kernel drivers loaded?", 1513f38c5457SAdrien Mazarguil pci_dev->addr.domain, pci_dev->addr.bus, 1514f38c5457SAdrien Mazarguil pci_dev->addr.devid, pci_dev->addr.function); 1515f38c5457SAdrien Mazarguil rte_errno = ENOENT; 1516f38c5457SAdrien Mazarguil ret = -rte_errno; 15172b730263SAdrien Mazarguil } else if (i != n) { 1518f38c5457SAdrien Mazarguil DRV_LOG(ERR, 1519f38c5457SAdrien Mazarguil "probe of PCI device " PCI_PRI_FMT " aborted after" 1520f38c5457SAdrien Mazarguil " encountering an error: %s", 1521f38c5457SAdrien Mazarguil pci_dev->addr.domain, pci_dev->addr.bus, 1522f38c5457SAdrien Mazarguil pci_dev->addr.devid, pci_dev->addr.function, 1523f38c5457SAdrien Mazarguil strerror(rte_errno)); 1524f38c5457SAdrien Mazarguil ret = -rte_errno; 15252b730263SAdrien Mazarguil /* Roll back. */ 15262b730263SAdrien Mazarguil while (i--) { 15276de569f5SAdrien Mazarguil if (!list[i].eth_dev) 15286de569f5SAdrien Mazarguil continue; 1529116f90adSAdrien Mazarguil mlx5_dev_close(list[i].eth_dev); 1530e16adf08SThomas Monjalon /* mac_addrs must not be freed because in dev_private */ 1531e16adf08SThomas Monjalon list[i].eth_dev->data->mac_addrs = NULL; 1532116f90adSAdrien Mazarguil claim_zero(rte_eth_dev_release_port(list[i].eth_dev)); 15332b730263SAdrien Mazarguil } 15342b730263SAdrien Mazarguil /* Restore original error. */ 15352b730263SAdrien Mazarguil rte_errno = -ret; 1536f38c5457SAdrien Mazarguil } else { 1537f38c5457SAdrien Mazarguil ret = 0; 1538f38c5457SAdrien Mazarguil } 1539f38c5457SAdrien Mazarguil return ret; 1540771fa900SAdrien Mazarguil } 1541771fa900SAdrien Mazarguil 15423a820742SOphir Munk /** 15433a820742SOphir Munk * DPDK callback to remove a PCI device. 15443a820742SOphir Munk * 15453a820742SOphir Munk * This function removes all Ethernet devices belong to a given PCI device. 15463a820742SOphir Munk * 15473a820742SOphir Munk * @param[in] pci_dev 15483a820742SOphir Munk * Pointer to the PCI device. 15493a820742SOphir Munk * 15503a820742SOphir Munk * @return 15513a820742SOphir Munk * 0 on success, the function cannot fail. 15523a820742SOphir Munk */ 15533a820742SOphir Munk static int 15543a820742SOphir Munk mlx5_pci_remove(struct rte_pci_device *pci_dev) 15553a820742SOphir Munk { 15563a820742SOphir Munk uint16_t port_id; 15573a820742SOphir Munk struct rte_eth_dev *port; 15583a820742SOphir Munk 15593a820742SOphir Munk for (port_id = 0; port_id < RTE_MAX_ETHPORTS; port_id++) { 15603a820742SOphir Munk port = &rte_eth_devices[port_id]; 15613a820742SOphir Munk if (port->state != RTE_ETH_DEV_UNUSED && 15623a820742SOphir Munk port->device == &pci_dev->device) 15633a820742SOphir Munk rte_eth_dev_close(port_id); 15643a820742SOphir Munk } 15653a820742SOphir Munk return 0; 15663a820742SOphir Munk } 15673a820742SOphir Munk 1568771fa900SAdrien Mazarguil static const struct rte_pci_id mlx5_pci_id_map[] = { 1569771fa900SAdrien Mazarguil { 15701d1bc870SNélio Laranjeiro RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX, 15711d1bc870SNélio Laranjeiro PCI_DEVICE_ID_MELLANOX_CONNECTX4) 1572771fa900SAdrien Mazarguil }, 1573771fa900SAdrien Mazarguil { 15741d1bc870SNélio Laranjeiro RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX, 15751d1bc870SNélio Laranjeiro PCI_DEVICE_ID_MELLANOX_CONNECTX4VF) 1576771fa900SAdrien Mazarguil }, 1577771fa900SAdrien Mazarguil { 15781d1bc870SNélio Laranjeiro RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX, 15791d1bc870SNélio Laranjeiro PCI_DEVICE_ID_MELLANOX_CONNECTX4LX) 1580771fa900SAdrien Mazarguil }, 1581771fa900SAdrien Mazarguil { 15821d1bc870SNélio Laranjeiro RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX, 15831d1bc870SNélio Laranjeiro PCI_DEVICE_ID_MELLANOX_CONNECTX4LXVF) 1584771fa900SAdrien Mazarguil }, 1585771fa900SAdrien Mazarguil { 1586528a9fbeSYongseok Koh RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX, 1587528a9fbeSYongseok Koh PCI_DEVICE_ID_MELLANOX_CONNECTX5) 1588528a9fbeSYongseok Koh }, 1589528a9fbeSYongseok Koh { 1590528a9fbeSYongseok Koh RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX, 1591528a9fbeSYongseok Koh PCI_DEVICE_ID_MELLANOX_CONNECTX5VF) 1592528a9fbeSYongseok Koh }, 1593528a9fbeSYongseok Koh { 1594528a9fbeSYongseok Koh RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX, 1595528a9fbeSYongseok Koh PCI_DEVICE_ID_MELLANOX_CONNECTX5EX) 1596528a9fbeSYongseok Koh }, 1597528a9fbeSYongseok Koh { 1598528a9fbeSYongseok Koh RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX, 1599528a9fbeSYongseok Koh PCI_DEVICE_ID_MELLANOX_CONNECTX5EXVF) 1600528a9fbeSYongseok Koh }, 1601528a9fbeSYongseok Koh { 1602dd3331c6SShahaf Shuler RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX, 1603dd3331c6SShahaf Shuler PCI_DEVICE_ID_MELLANOX_CONNECTX5BF) 1604dd3331c6SShahaf Shuler }, 1605dd3331c6SShahaf Shuler { 1606c322c0e5SOri Kam RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX, 1607c322c0e5SOri Kam PCI_DEVICE_ID_MELLANOX_CONNECTX5BFVF) 1608c322c0e5SOri Kam }, 1609c322c0e5SOri Kam { 1610f0354d84SWisam Jaddo RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX, 1611f0354d84SWisam Jaddo PCI_DEVICE_ID_MELLANOX_CONNECTX6) 1612f0354d84SWisam Jaddo }, 1613f0354d84SWisam Jaddo { 1614f0354d84SWisam Jaddo RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX, 1615f0354d84SWisam Jaddo PCI_DEVICE_ID_MELLANOX_CONNECTX6VF) 1616f0354d84SWisam Jaddo }, 1617f0354d84SWisam Jaddo { 1618771fa900SAdrien Mazarguil .vendor_id = 0 1619771fa900SAdrien Mazarguil } 1620771fa900SAdrien Mazarguil }; 1621771fa900SAdrien Mazarguil 1622fdf91e0fSJan Blunck static struct rte_pci_driver mlx5_driver = { 16232f3193cfSJan Viktorin .driver = { 16242f3193cfSJan Viktorin .name = MLX5_DRIVER_NAME 16252f3193cfSJan Viktorin }, 1626771fa900SAdrien Mazarguil .id_table = mlx5_pci_id_map, 1627af424af8SShreyansh Jain .probe = mlx5_pci_probe, 16283a820742SOphir Munk .remove = mlx5_pci_remove, 1629206254b7SOphir Munk .drv_flags = (RTE_PCI_DRV_INTR_LSC | RTE_PCI_DRV_INTR_RMV | 1630206254b7SOphir Munk RTE_PCI_DRV_PROBE_AGAIN), 1631771fa900SAdrien Mazarguil }; 1632771fa900SAdrien Mazarguil 163372b934adSThomas Monjalon #ifdef RTE_IBVERBS_LINK_DLOPEN 163459b91becSAdrien Mazarguil 163559b91becSAdrien Mazarguil /** 163608c028d0SAdrien Mazarguil * Suffix RTE_EAL_PMD_PATH with "-glue". 163708c028d0SAdrien Mazarguil * 163808c028d0SAdrien Mazarguil * This function performs a sanity check on RTE_EAL_PMD_PATH before 163908c028d0SAdrien Mazarguil * suffixing its last component. 164008c028d0SAdrien Mazarguil * 164108c028d0SAdrien Mazarguil * @param buf[out] 164208c028d0SAdrien Mazarguil * Output buffer, should be large enough otherwise NULL is returned. 164308c028d0SAdrien Mazarguil * @param size 164408c028d0SAdrien Mazarguil * Size of @p out. 164508c028d0SAdrien Mazarguil * 164608c028d0SAdrien Mazarguil * @return 164708c028d0SAdrien Mazarguil * Pointer to @p buf or @p NULL in case suffix cannot be appended. 164808c028d0SAdrien Mazarguil */ 164908c028d0SAdrien Mazarguil static char * 165008c028d0SAdrien Mazarguil mlx5_glue_path(char *buf, size_t size) 165108c028d0SAdrien Mazarguil { 165208c028d0SAdrien Mazarguil static const char *const bad[] = { "/", ".", "..", NULL }; 165308c028d0SAdrien Mazarguil const char *path = RTE_EAL_PMD_PATH; 165408c028d0SAdrien Mazarguil size_t len = strlen(path); 165508c028d0SAdrien Mazarguil size_t off; 165608c028d0SAdrien Mazarguil int i; 165708c028d0SAdrien Mazarguil 165808c028d0SAdrien Mazarguil while (len && path[len - 1] == '/') 165908c028d0SAdrien Mazarguil --len; 166008c028d0SAdrien Mazarguil for (off = len; off && path[off - 1] != '/'; --off) 166108c028d0SAdrien Mazarguil ; 166208c028d0SAdrien Mazarguil for (i = 0; bad[i]; ++i) 166308c028d0SAdrien Mazarguil if (!strncmp(path + off, bad[i], (int)(len - off))) 166408c028d0SAdrien Mazarguil goto error; 166508c028d0SAdrien Mazarguil i = snprintf(buf, size, "%.*s-glue", (int)len, path); 166608c028d0SAdrien Mazarguil if (i == -1 || (size_t)i >= size) 166708c028d0SAdrien Mazarguil goto error; 166808c028d0SAdrien Mazarguil return buf; 166908c028d0SAdrien Mazarguil error: 1670a170a30dSNélio Laranjeiro DRV_LOG(ERR, 1671a170a30dSNélio Laranjeiro "unable to append \"-glue\" to last component of" 167208c028d0SAdrien Mazarguil " RTE_EAL_PMD_PATH (\"" RTE_EAL_PMD_PATH "\")," 167308c028d0SAdrien Mazarguil " please re-configure DPDK"); 167408c028d0SAdrien Mazarguil return NULL; 167508c028d0SAdrien Mazarguil } 167608c028d0SAdrien Mazarguil 167708c028d0SAdrien Mazarguil /** 167859b91becSAdrien Mazarguil * Initialization routine for run-time dependency on rdma-core. 167959b91becSAdrien Mazarguil */ 168059b91becSAdrien Mazarguil static int 168159b91becSAdrien Mazarguil mlx5_glue_init(void) 168259b91becSAdrien Mazarguil { 168308c028d0SAdrien Mazarguil char glue_path[sizeof(RTE_EAL_PMD_PATH) - 1 + sizeof("-glue")]; 1684f6242d06SAdrien Mazarguil const char *path[] = { 1685f6242d06SAdrien Mazarguil /* 1686f6242d06SAdrien Mazarguil * A basic security check is necessary before trusting 1687f6242d06SAdrien Mazarguil * MLX5_GLUE_PATH, which may override RTE_EAL_PMD_PATH. 1688f6242d06SAdrien Mazarguil */ 1689f6242d06SAdrien Mazarguil (geteuid() == getuid() && getegid() == getgid() ? 1690f6242d06SAdrien Mazarguil getenv("MLX5_GLUE_PATH") : NULL), 169108c028d0SAdrien Mazarguil /* 169208c028d0SAdrien Mazarguil * When RTE_EAL_PMD_PATH is set, use its glue-suffixed 169308c028d0SAdrien Mazarguil * variant, otherwise let dlopen() look up libraries on its 169408c028d0SAdrien Mazarguil * own. 169508c028d0SAdrien Mazarguil */ 169608c028d0SAdrien Mazarguil (*RTE_EAL_PMD_PATH ? 169708c028d0SAdrien Mazarguil mlx5_glue_path(glue_path, sizeof(glue_path)) : ""), 1698f6242d06SAdrien Mazarguil }; 1699f6242d06SAdrien Mazarguil unsigned int i = 0; 170059b91becSAdrien Mazarguil void *handle = NULL; 170159b91becSAdrien Mazarguil void **sym; 170259b91becSAdrien Mazarguil const char *dlmsg; 170359b91becSAdrien Mazarguil 1704f6242d06SAdrien Mazarguil while (!handle && i != RTE_DIM(path)) { 1705f6242d06SAdrien Mazarguil const char *end; 1706f6242d06SAdrien Mazarguil size_t len; 1707f6242d06SAdrien Mazarguil int ret; 1708f6242d06SAdrien Mazarguil 1709f6242d06SAdrien Mazarguil if (!path[i]) { 1710f6242d06SAdrien Mazarguil ++i; 1711f6242d06SAdrien Mazarguil continue; 1712f6242d06SAdrien Mazarguil } 1713f6242d06SAdrien Mazarguil end = strpbrk(path[i], ":;"); 1714f6242d06SAdrien Mazarguil if (!end) 1715f6242d06SAdrien Mazarguil end = path[i] + strlen(path[i]); 1716f6242d06SAdrien Mazarguil len = end - path[i]; 1717f6242d06SAdrien Mazarguil ret = 0; 1718f6242d06SAdrien Mazarguil do { 1719f6242d06SAdrien Mazarguil char name[ret + 1]; 1720f6242d06SAdrien Mazarguil 1721f6242d06SAdrien Mazarguil ret = snprintf(name, sizeof(name), "%.*s%s" MLX5_GLUE, 1722f6242d06SAdrien Mazarguil (int)len, path[i], 1723f6242d06SAdrien Mazarguil (!len || *(end - 1) == '/') ? "" : "/"); 1724f6242d06SAdrien Mazarguil if (ret == -1) 1725f6242d06SAdrien Mazarguil break; 1726f6242d06SAdrien Mazarguil if (sizeof(name) != (size_t)ret + 1) 1727f6242d06SAdrien Mazarguil continue; 1728a170a30dSNélio Laranjeiro DRV_LOG(DEBUG, "looking for rdma-core glue as \"%s\"", 1729a170a30dSNélio Laranjeiro name); 1730f6242d06SAdrien Mazarguil handle = dlopen(name, RTLD_LAZY); 1731f6242d06SAdrien Mazarguil break; 1732f6242d06SAdrien Mazarguil } while (1); 1733f6242d06SAdrien Mazarguil path[i] = end + 1; 1734f6242d06SAdrien Mazarguil if (!*end) 1735f6242d06SAdrien Mazarguil ++i; 1736f6242d06SAdrien Mazarguil } 173759b91becSAdrien Mazarguil if (!handle) { 173859b91becSAdrien Mazarguil rte_errno = EINVAL; 173959b91becSAdrien Mazarguil dlmsg = dlerror(); 174059b91becSAdrien Mazarguil if (dlmsg) 1741a170a30dSNélio Laranjeiro DRV_LOG(WARNING, "cannot load glue library: %s", dlmsg); 174259b91becSAdrien Mazarguil goto glue_error; 174359b91becSAdrien Mazarguil } 174459b91becSAdrien Mazarguil sym = dlsym(handle, "mlx5_glue"); 174559b91becSAdrien Mazarguil if (!sym || !*sym) { 174659b91becSAdrien Mazarguil rte_errno = EINVAL; 174759b91becSAdrien Mazarguil dlmsg = dlerror(); 174859b91becSAdrien Mazarguil if (dlmsg) 1749a170a30dSNélio Laranjeiro DRV_LOG(ERR, "cannot resolve glue symbol: %s", dlmsg); 175059b91becSAdrien Mazarguil goto glue_error; 175159b91becSAdrien Mazarguil } 175259b91becSAdrien Mazarguil mlx5_glue = *sym; 175359b91becSAdrien Mazarguil return 0; 175459b91becSAdrien Mazarguil glue_error: 175559b91becSAdrien Mazarguil if (handle) 175659b91becSAdrien Mazarguil dlclose(handle); 1757a170a30dSNélio Laranjeiro DRV_LOG(WARNING, 1758a170a30dSNélio Laranjeiro "cannot initialize PMD due to missing run-time dependency on" 1759a170a30dSNélio Laranjeiro " rdma-core libraries (libibverbs, libmlx5)"); 176059b91becSAdrien Mazarguil return -rte_errno; 176159b91becSAdrien Mazarguil } 176259b91becSAdrien Mazarguil 176359b91becSAdrien Mazarguil #endif 176459b91becSAdrien Mazarguil 1765771fa900SAdrien Mazarguil /** 1766771fa900SAdrien Mazarguil * Driver initialization routine. 1767771fa900SAdrien Mazarguil */ 1768f8e99896SThomas Monjalon RTE_INIT(rte_mlx5_pmd_init) 1769771fa900SAdrien Mazarguil { 17703d96644aSStephen Hemminger /* Initialize driver log type. */ 17713d96644aSStephen Hemminger mlx5_logtype = rte_log_register("pmd.net.mlx5"); 17723d96644aSStephen Hemminger if (mlx5_logtype >= 0) 17733d96644aSStephen Hemminger rte_log_set_level(mlx5_logtype, RTE_LOG_NOTICE); 17743d96644aSStephen Hemminger 17755f8ba81cSXueming Li /* Build the static tables for Verbs conversion. */ 1776ea16068cSYongseok Koh mlx5_set_ptype_table(); 17775f8ba81cSXueming Li mlx5_set_cksum_table(); 17785f8ba81cSXueming Li mlx5_set_swp_types_table(); 1779771fa900SAdrien Mazarguil /* 1780771fa900SAdrien Mazarguil * RDMAV_HUGEPAGES_SAFE tells ibv_fork_init() we intend to use 1781771fa900SAdrien Mazarguil * huge pages. Calling ibv_fork_init() during init allows 1782771fa900SAdrien Mazarguil * applications to use fork() safely for purposes other than 1783771fa900SAdrien Mazarguil * using this PMD, which is not supported in forked processes. 1784771fa900SAdrien Mazarguil */ 1785771fa900SAdrien Mazarguil setenv("RDMAV_HUGEPAGES_SAFE", "1", 1); 1786161b93e5SYongseok Koh /* Match the size of Rx completion entry to the size of a cacheline. */ 1787161b93e5SYongseok Koh if (RTE_CACHE_LINE_SIZE == 128) 1788161b93e5SYongseok Koh setenv("MLX5_CQE_SIZE", "128", 0); 17891ff30d18SMatan Azrad /* 17901ff30d18SMatan Azrad * MLX5_DEVICE_FATAL_CLEANUP tells ibv_destroy functions to 17911ff30d18SMatan Azrad * cleanup all the Verbs resources even when the device was removed. 17921ff30d18SMatan Azrad */ 17931ff30d18SMatan Azrad setenv("MLX5_DEVICE_FATAL_CLEANUP", "1", 1); 179472b934adSThomas Monjalon #ifdef RTE_IBVERBS_LINK_DLOPEN 179559b91becSAdrien Mazarguil if (mlx5_glue_init()) 179659b91becSAdrien Mazarguil return; 179759b91becSAdrien Mazarguil assert(mlx5_glue); 179859b91becSAdrien Mazarguil #endif 17992a3b0097SAdrien Mazarguil #ifndef NDEBUG 18002a3b0097SAdrien Mazarguil /* Glue structure must not contain any NULL pointers. */ 18012a3b0097SAdrien Mazarguil { 18022a3b0097SAdrien Mazarguil unsigned int i; 18032a3b0097SAdrien Mazarguil 18042a3b0097SAdrien Mazarguil for (i = 0; i != sizeof(*mlx5_glue) / sizeof(void *); ++i) 18052a3b0097SAdrien Mazarguil assert(((const void *const *)mlx5_glue)[i]); 18062a3b0097SAdrien Mazarguil } 18072a3b0097SAdrien Mazarguil #endif 18086d5df2eaSAdrien Mazarguil if (strcmp(mlx5_glue->version, MLX5_GLUE_VERSION)) { 1809a170a30dSNélio Laranjeiro DRV_LOG(ERR, 1810a170a30dSNélio Laranjeiro "rdma-core glue \"%s\" mismatch: \"%s\" is required", 18116d5df2eaSAdrien Mazarguil mlx5_glue->version, MLX5_GLUE_VERSION); 18126d5df2eaSAdrien Mazarguil return; 18136d5df2eaSAdrien Mazarguil } 18140e83b8e5SNelio Laranjeiro mlx5_glue->fork_init(); 18153dcfe039SThomas Monjalon rte_pci_register(&mlx5_driver); 1816771fa900SAdrien Mazarguil } 1817771fa900SAdrien Mazarguil 181801f19227SShreyansh Jain RTE_PMD_EXPORT_NAME(net_mlx5, __COUNTER__); 181901f19227SShreyansh Jain RTE_PMD_REGISTER_PCI_TABLE(net_mlx5, mlx5_pci_id_map); 18200880c401SOlivier Matz RTE_PMD_REGISTER_KMOD_DEP(net_mlx5, "* ib_uverbs & mlx5_core & mlx5_ib"); 1821