xref: /dpdk/drivers/net/mlx5/mlx5.c (revision 51e7fa8d20876cb221b11013cd23b1881cc9b75c)
1771fa900SAdrien Mazarguil /*-
2771fa900SAdrien Mazarguil  *   BSD LICENSE
3771fa900SAdrien Mazarguil  *
4771fa900SAdrien Mazarguil  *   Copyright 2015 6WIND S.A.
5771fa900SAdrien Mazarguil  *   Copyright 2015 Mellanox.
6771fa900SAdrien Mazarguil  *
7771fa900SAdrien Mazarguil  *   Redistribution and use in source and binary forms, with or without
8771fa900SAdrien Mazarguil  *   modification, are permitted provided that the following conditions
9771fa900SAdrien Mazarguil  *   are met:
10771fa900SAdrien Mazarguil  *
11771fa900SAdrien Mazarguil  *     * Redistributions of source code must retain the above copyright
12771fa900SAdrien Mazarguil  *       notice, this list of conditions and the following disclaimer.
13771fa900SAdrien Mazarguil  *     * Redistributions in binary form must reproduce the above copyright
14771fa900SAdrien Mazarguil  *       notice, this list of conditions and the following disclaimer in
15771fa900SAdrien Mazarguil  *       the documentation and/or other materials provided with the
16771fa900SAdrien Mazarguil  *       distribution.
17771fa900SAdrien Mazarguil  *     * Neither the name of 6WIND S.A. nor the names of its
18771fa900SAdrien Mazarguil  *       contributors may be used to endorse or promote products derived
19771fa900SAdrien Mazarguil  *       from this software without specific prior written permission.
20771fa900SAdrien Mazarguil  *
21771fa900SAdrien Mazarguil  *   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
22771fa900SAdrien Mazarguil  *   "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
23771fa900SAdrien Mazarguil  *   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
24771fa900SAdrien Mazarguil  *   A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
25771fa900SAdrien Mazarguil  *   OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
26771fa900SAdrien Mazarguil  *   SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
27771fa900SAdrien Mazarguil  *   LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
28771fa900SAdrien Mazarguil  *   DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
29771fa900SAdrien Mazarguil  *   THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
30771fa900SAdrien Mazarguil  *   (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
31771fa900SAdrien Mazarguil  *   OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
32771fa900SAdrien Mazarguil  */
33771fa900SAdrien Mazarguil 
34771fa900SAdrien Mazarguil #include <stddef.h>
35771fa900SAdrien Mazarguil #include <unistd.h>
36771fa900SAdrien Mazarguil #include <string.h>
37771fa900SAdrien Mazarguil #include <assert.h>
38771fa900SAdrien Mazarguil #include <stdint.h>
39771fa900SAdrien Mazarguil #include <stdlib.h>
40e72dd09bSNélio Laranjeiro #include <errno.h>
41771fa900SAdrien Mazarguil #include <net/if.h>
42771fa900SAdrien Mazarguil 
43771fa900SAdrien Mazarguil /* Verbs header. */
44771fa900SAdrien Mazarguil /* ISO C doesn't support unnamed structs/unions, disabling -pedantic. */
45771fa900SAdrien Mazarguil #ifdef PEDANTIC
46fc5b160fSBruce Richardson #pragma GCC diagnostic ignored "-Wpedantic"
47771fa900SAdrien Mazarguil #endif
48771fa900SAdrien Mazarguil #include <infiniband/verbs.h>
49771fa900SAdrien Mazarguil #ifdef PEDANTIC
50fc5b160fSBruce Richardson #pragma GCC diagnostic error "-Wpedantic"
51771fa900SAdrien Mazarguil #endif
52771fa900SAdrien Mazarguil 
53771fa900SAdrien Mazarguil #include <rte_malloc.h>
54771fa900SAdrien Mazarguil #include <rte_ethdev.h>
55fdf91e0fSJan Blunck #include <rte_ethdev_pci.h>
56771fa900SAdrien Mazarguil #include <rte_pci.h>
57c752998bSGaetan Rivet #include <rte_bus_pci.h>
58771fa900SAdrien Mazarguil #include <rte_common.h>
59e72dd09bSNélio Laranjeiro #include <rte_kvargs.h>
60771fa900SAdrien Mazarguil 
61771fa900SAdrien Mazarguil #include "mlx5.h"
62771fa900SAdrien Mazarguil #include "mlx5_utils.h"
632e22920bSAdrien Mazarguil #include "mlx5_rxtx.h"
64771fa900SAdrien Mazarguil #include "mlx5_autoconf.h"
6513d57bd5SAdrien Mazarguil #include "mlx5_defs.h"
66771fa900SAdrien Mazarguil 
6799c12dccSNélio Laranjeiro /* Device parameter to enable RX completion queue compression. */
6899c12dccSNélio Laranjeiro #define MLX5_RXQ_CQE_COMP_EN "rxq_cqe_comp_en"
6999c12dccSNélio Laranjeiro 
702a66cf37SYaacov Hazan /* Device parameter to configure inline send. */
712a66cf37SYaacov Hazan #define MLX5_TXQ_INLINE "txq_inline"
722a66cf37SYaacov Hazan 
732a66cf37SYaacov Hazan /*
742a66cf37SYaacov Hazan  * Device parameter to configure the number of TX queues threshold for
752a66cf37SYaacov Hazan  * enabling inline send.
762a66cf37SYaacov Hazan  */
772a66cf37SYaacov Hazan #define MLX5_TXQS_MIN_INLINE "txqs_min_inline"
782a66cf37SYaacov Hazan 
79230189d9SNélio Laranjeiro /* Device parameter to enable multi-packet send WQEs. */
80230189d9SNélio Laranjeiro #define MLX5_TXQ_MPW_EN "txq_mpw_en"
81230189d9SNélio Laranjeiro 
826ce84bd8SYongseok Koh /* Device parameter to include 2 dsegs in the title WQEBB. */
836ce84bd8SYongseok Koh #define MLX5_TXQ_MPW_HDR_DSEG_EN "txq_mpw_hdr_dseg_en"
846ce84bd8SYongseok Koh 
856ce84bd8SYongseok Koh /* Device parameter to limit the size of inlining packet. */
866ce84bd8SYongseok Koh #define MLX5_TXQ_MAX_INLINE_LEN "txq_max_inline_len"
876ce84bd8SYongseok Koh 
883f13f8c2SShahaf Shuler /* Device parameter to enable hardware TSO offload. */
893f13f8c2SShahaf Shuler #define MLX5_TSO "tso"
903f13f8c2SShahaf Shuler 
915644d5b9SNelio Laranjeiro /* Device parameter to enable hardware Tx vector. */
925644d5b9SNelio Laranjeiro #define MLX5_TX_VEC_EN "tx_vec_en"
935644d5b9SNelio Laranjeiro 
945644d5b9SNelio Laranjeiro /* Device parameter to enable hardware Rx vector. */
955644d5b9SNelio Laranjeiro #define MLX5_RX_VEC_EN "rx_vec_en"
965644d5b9SNelio Laranjeiro 
9750b244a1SShahaf Shuler /* Default PMD specific parameter value. */
9850b244a1SShahaf Shuler #define MLX5_ARG_UNSET (-1)
9950b244a1SShahaf Shuler 
10043e9d979SShachar Beiser #ifndef HAVE_IBV_MLX5_MOD_MPW
10143e9d979SShachar Beiser #define MLX5DV_CONTEXT_FLAGS_MPW_ALLOWED (1 << 2)
10243e9d979SShachar Beiser #define MLX5DV_CONTEXT_FLAGS_ENHANCED_MPW (1 << 3)
10343e9d979SShachar Beiser #endif
10443e9d979SShachar Beiser 
105523f5a74SYongseok Koh #ifndef HAVE_IBV_MLX5_MOD_CQE_128B_COMP
106523f5a74SYongseok Koh #define MLX5DV_CONTEXT_FLAGS_CQE_128B_COMP (1 << 4)
107523f5a74SYongseok Koh #endif
108523f5a74SYongseok Koh 
10950b244a1SShahaf Shuler struct mlx5_args {
11050b244a1SShahaf Shuler 	int cqe_comp;
11150b244a1SShahaf Shuler 	int txq_inline;
11250b244a1SShahaf Shuler 	int txqs_inline;
11350b244a1SShahaf Shuler 	int mps;
11450b244a1SShahaf Shuler 	int mpw_hdr_dseg;
11550b244a1SShahaf Shuler 	int inline_max_packet_sz;
11650b244a1SShahaf Shuler 	int tso;
1175644d5b9SNelio Laranjeiro 	int tx_vec_en;
1185644d5b9SNelio Laranjeiro 	int rx_vec_en;
11950b244a1SShahaf Shuler };
120771fa900SAdrien Mazarguil /**
1214d803a72SOlga Shern  * Retrieve integer value from environment variable.
1224d803a72SOlga Shern  *
1234d803a72SOlga Shern  * @param[in] name
1244d803a72SOlga Shern  *   Environment variable name.
1254d803a72SOlga Shern  *
1264d803a72SOlga Shern  * @return
1274d803a72SOlga Shern  *   Integer value, 0 if the variable is not set.
1284d803a72SOlga Shern  */
1294d803a72SOlga Shern int
1304d803a72SOlga Shern mlx5_getenv_int(const char *name)
1314d803a72SOlga Shern {
1324d803a72SOlga Shern 	const char *val = getenv(name);
1334d803a72SOlga Shern 
1344d803a72SOlga Shern 	if (val == NULL)
1354d803a72SOlga Shern 		return 0;
1364d803a72SOlga Shern 	return atoi(val);
1374d803a72SOlga Shern }
1384d803a72SOlga Shern 
1394d803a72SOlga Shern /**
1401e3a39f7SXueming Li  * Verbs callback to allocate a memory. This function should allocate the space
1411e3a39f7SXueming Li  * according to the size provided residing inside a huge page.
1421e3a39f7SXueming Li  * Please note that all allocation must respect the alignment from libmlx5
1431e3a39f7SXueming Li  * (i.e. currently sysconf(_SC_PAGESIZE)).
1441e3a39f7SXueming Li  *
1451e3a39f7SXueming Li  * @param[in] size
1461e3a39f7SXueming Li  *   The size in bytes of the memory to allocate.
1471e3a39f7SXueming Li  * @param[in] data
1481e3a39f7SXueming Li  *   A pointer to the callback data.
1491e3a39f7SXueming Li  *
1501e3a39f7SXueming Li  * @return
1511e3a39f7SXueming Li  *   a pointer to the allocate space.
1521e3a39f7SXueming Li  */
1531e3a39f7SXueming Li static void *
1541e3a39f7SXueming Li mlx5_alloc_verbs_buf(size_t size, void *data)
1551e3a39f7SXueming Li {
1561e3a39f7SXueming Li 	struct priv *priv = data;
1571e3a39f7SXueming Li 	void *ret;
1581e3a39f7SXueming Li 	size_t alignment = sysconf(_SC_PAGESIZE);
1591e3a39f7SXueming Li 
1601e3a39f7SXueming Li 	assert(data != NULL);
1611e3a39f7SXueming Li 	ret = rte_malloc_socket(__func__, size, alignment,
1621e3a39f7SXueming Li 				priv->dev->device->numa_node);
1631e3a39f7SXueming Li 	DEBUG("Extern alloc size: %lu, align: %lu: %p", size, alignment, ret);
1641e3a39f7SXueming Li 	return ret;
1651e3a39f7SXueming Li }
1661e3a39f7SXueming Li 
1671e3a39f7SXueming Li /**
1681e3a39f7SXueming Li  * Verbs callback to free a memory.
1691e3a39f7SXueming Li  *
1701e3a39f7SXueming Li  * @param[in] ptr
1711e3a39f7SXueming Li  *   A pointer to the memory to free.
1721e3a39f7SXueming Li  * @param[in] data
1731e3a39f7SXueming Li  *   A pointer to the callback data.
1741e3a39f7SXueming Li  */
1751e3a39f7SXueming Li static void
1761e3a39f7SXueming Li mlx5_free_verbs_buf(void *ptr, void *data __rte_unused)
1771e3a39f7SXueming Li {
1781e3a39f7SXueming Li 	assert(data != NULL);
1791e3a39f7SXueming Li 	DEBUG("Extern free request: %p", ptr);
1801e3a39f7SXueming Li 	rte_free(ptr);
1811e3a39f7SXueming Li }
1821e3a39f7SXueming Li 
1831e3a39f7SXueming Li /**
184771fa900SAdrien Mazarguil  * DPDK callback to close the device.
185771fa900SAdrien Mazarguil  *
186771fa900SAdrien Mazarguil  * Destroy all queues and objects, free memory.
187771fa900SAdrien Mazarguil  *
188771fa900SAdrien Mazarguil  * @param dev
189771fa900SAdrien Mazarguil  *   Pointer to Ethernet device structure.
190771fa900SAdrien Mazarguil  */
191771fa900SAdrien Mazarguil static void
192771fa900SAdrien Mazarguil mlx5_dev_close(struct rte_eth_dev *dev)
193771fa900SAdrien Mazarguil {
19401d79216SNélio Laranjeiro 	struct priv *priv = dev->data->dev_private;
1952e22920bSAdrien Mazarguil 	unsigned int i;
1966af6b973SNélio Laranjeiro 	int ret;
197771fa900SAdrien Mazarguil 
198771fa900SAdrien Mazarguil 	priv_lock(priv);
199771fa900SAdrien Mazarguil 	DEBUG("%p: closing device \"%s\"",
200771fa900SAdrien Mazarguil 	      (void *)dev,
201771fa900SAdrien Mazarguil 	      ((priv->ctx != NULL) ? priv->ctx->device->name : ""));
202ecc1c29dSAdrien Mazarguil 	/* In case mlx5_dev_stop() has not been called. */
203198a3c33SNelio Laranjeiro 	priv_dev_interrupt_handler_uninstall(priv, dev);
204272733b5SNélio Laranjeiro 	priv_dev_traffic_disable(priv, dev);
2052e22920bSAdrien Mazarguil 	/* Prevent crashes when queues are still in use. */
2062e22920bSAdrien Mazarguil 	dev->rx_pkt_burst = removed_rx_burst;
2072e22920bSAdrien Mazarguil 	dev->tx_pkt_burst = removed_tx_burst;
2082e22920bSAdrien Mazarguil 	if (priv->rxqs != NULL) {
2092e22920bSAdrien Mazarguil 		/* XXX race condition if mlx5_rx_burst() is still running. */
2102e22920bSAdrien Mazarguil 		usleep(1000);
211a1366b1aSNélio Laranjeiro 		for (i = 0; (i != priv->rxqs_n); ++i)
212a1366b1aSNélio Laranjeiro 			mlx5_priv_rxq_release(priv, i);
2132e22920bSAdrien Mazarguil 		priv->rxqs_n = 0;
2142e22920bSAdrien Mazarguil 		priv->rxqs = NULL;
2152e22920bSAdrien Mazarguil 	}
2162e22920bSAdrien Mazarguil 	if (priv->txqs != NULL) {
2172e22920bSAdrien Mazarguil 		/* XXX race condition if mlx5_tx_burst() is still running. */
2182e22920bSAdrien Mazarguil 		usleep(1000);
2196e78005aSNélio Laranjeiro 		for (i = 0; (i != priv->txqs_n); ++i)
2206e78005aSNélio Laranjeiro 			mlx5_priv_txq_release(priv, i);
2212e22920bSAdrien Mazarguil 		priv->txqs_n = 0;
2222e22920bSAdrien Mazarguil 		priv->txqs = NULL;
2232e22920bSAdrien Mazarguil 	}
224771fa900SAdrien Mazarguil 	if (priv->pd != NULL) {
225771fa900SAdrien Mazarguil 		assert(priv->ctx != NULL);
226771fa900SAdrien Mazarguil 		claim_zero(ibv_dealloc_pd(priv->pd));
227771fa900SAdrien Mazarguil 		claim_zero(ibv_close_device(priv->ctx));
228771fa900SAdrien Mazarguil 	} else
229771fa900SAdrien Mazarguil 		assert(priv->ctx == NULL);
23029c1d8bbSNélio Laranjeiro 	if (priv->rss_conf.rss_key != NULL)
23129c1d8bbSNélio Laranjeiro 		rte_free(priv->rss_conf.rss_key);
232634efbc2SNelio Laranjeiro 	if (priv->reta_idx != NULL)
233634efbc2SNelio Laranjeiro 		rte_free(priv->reta_idx);
234f8b9a3baSXueming Li 	priv_socket_uninit(priv);
235f5479b68SNélio Laranjeiro 	ret = mlx5_priv_hrxq_ibv_verify(priv);
236f5479b68SNélio Laranjeiro 	if (ret)
237f5479b68SNélio Laranjeiro 		WARN("%p: some Hash Rx queue still remain", (void *)priv);
2384c7a0f5fSNélio Laranjeiro 	ret = mlx5_priv_ind_table_ibv_verify(priv);
2394c7a0f5fSNélio Laranjeiro 	if (ret)
2404c7a0f5fSNélio Laranjeiro 		WARN("%p: some Indirection table still remain", (void *)priv);
24109cb5b58SNélio Laranjeiro 	ret = mlx5_priv_rxq_ibv_verify(priv);
24209cb5b58SNélio Laranjeiro 	if (ret)
24309cb5b58SNélio Laranjeiro 		WARN("%p: some Verbs Rx queue still remain", (void *)priv);
244a1366b1aSNélio Laranjeiro 	ret = mlx5_priv_rxq_verify(priv);
245a1366b1aSNélio Laranjeiro 	if (ret)
246a1366b1aSNélio Laranjeiro 		WARN("%p: some Rx Queues still remain", (void *)priv);
247faf2667fSNélio Laranjeiro 	ret = mlx5_priv_txq_ibv_verify(priv);
248faf2667fSNélio Laranjeiro 	if (ret)
249faf2667fSNélio Laranjeiro 		WARN("%p: some Verbs Tx queue still remain", (void *)priv);
2506e78005aSNélio Laranjeiro 	ret = mlx5_priv_txq_verify(priv);
2516e78005aSNélio Laranjeiro 	if (ret)
2526e78005aSNélio Laranjeiro 		WARN("%p: some Tx Queues still remain", (void *)priv);
2536af6b973SNélio Laranjeiro 	ret = priv_flow_verify(priv);
2546af6b973SNélio Laranjeiro 	if (ret)
2556af6b973SNélio Laranjeiro 		WARN("%p: some flows still remain", (void *)priv);
256f8fb87d5SNélio Laranjeiro 	ret = priv_mr_verify(priv);
257f8fb87d5SNélio Laranjeiro 	if (ret)
258f8fb87d5SNélio Laranjeiro 		WARN("%p: some Memory Region still remain", (void *)priv);
259771fa900SAdrien Mazarguil 	priv_unlock(priv);
260771fa900SAdrien Mazarguil 	memset(priv, 0, sizeof(*priv));
261771fa900SAdrien Mazarguil }
262771fa900SAdrien Mazarguil 
2630887aa7fSNélio Laranjeiro const struct eth_dev_ops mlx5_dev_ops = {
264e60fbd5bSAdrien Mazarguil 	.dev_configure = mlx5_dev_configure,
265e60fbd5bSAdrien Mazarguil 	.dev_start = mlx5_dev_start,
266e60fbd5bSAdrien Mazarguil 	.dev_stop = mlx5_dev_stop,
26762072098SOr Ami 	.dev_set_link_down = mlx5_set_link_down,
26862072098SOr Ami 	.dev_set_link_up = mlx5_set_link_up,
269771fa900SAdrien Mazarguil 	.dev_close = mlx5_dev_close,
2701bdbe1afSAdrien Mazarguil 	.promiscuous_enable = mlx5_promiscuous_enable,
2711bdbe1afSAdrien Mazarguil 	.promiscuous_disable = mlx5_promiscuous_disable,
2721bdbe1afSAdrien Mazarguil 	.allmulticast_enable = mlx5_allmulticast_enable,
2731bdbe1afSAdrien Mazarguil 	.allmulticast_disable = mlx5_allmulticast_disable,
274cb8faed7SAdrien Mazarguil 	.link_update = mlx5_link_update,
27587011737SAdrien Mazarguil 	.stats_get = mlx5_stats_get,
27687011737SAdrien Mazarguil 	.stats_reset = mlx5_stats_reset,
277a4193ae3SShahaf Shuler 	.xstats_get = mlx5_xstats_get,
278a4193ae3SShahaf Shuler 	.xstats_reset = mlx5_xstats_reset,
279a4193ae3SShahaf Shuler 	.xstats_get_names = mlx5_xstats_get_names,
280e60fbd5bSAdrien Mazarguil 	.dev_infos_get = mlx5_dev_infos_get,
28178a38edfSJianfeng Tan 	.dev_supported_ptypes_get = mlx5_dev_supported_ptypes_get,
282e9086978SAdrien Mazarguil 	.vlan_filter_set = mlx5_vlan_filter_set,
2832e22920bSAdrien Mazarguil 	.rx_queue_setup = mlx5_rx_queue_setup,
2842e22920bSAdrien Mazarguil 	.tx_queue_setup = mlx5_tx_queue_setup,
2852e22920bSAdrien Mazarguil 	.rx_queue_release = mlx5_rx_queue_release,
2862e22920bSAdrien Mazarguil 	.tx_queue_release = mlx5_tx_queue_release,
28702d75430SAdrien Mazarguil 	.flow_ctrl_get = mlx5_dev_get_flow_ctrl,
28802d75430SAdrien Mazarguil 	.flow_ctrl_set = mlx5_dev_set_flow_ctrl,
2893318aef7SAdrien Mazarguil 	.mac_addr_remove = mlx5_mac_addr_remove,
2903318aef7SAdrien Mazarguil 	.mac_addr_add = mlx5_mac_addr_add,
29186977fccSDavid Marchand 	.mac_addr_set = mlx5_mac_addr_set,
292cf37ca95SAdrien Mazarguil 	.mtu_set = mlx5_dev_set_mtu,
293f3db9489SYaacov Hazan 	.vlan_strip_queue_set = mlx5_vlan_strip_queue_set,
294f3db9489SYaacov Hazan 	.vlan_offload_set = mlx5_vlan_offload_set,
295634efbc2SNelio Laranjeiro 	.reta_update = mlx5_dev_rss_reta_update,
296634efbc2SNelio Laranjeiro 	.reta_query = mlx5_dev_rss_reta_query,
2972f97422eSNelio Laranjeiro 	.rss_hash_update = mlx5_rss_hash_update,
2982f97422eSNelio Laranjeiro 	.rss_hash_conf_get = mlx5_rss_hash_conf_get,
29976f5c99eSYaacov Hazan 	.filter_ctrl = mlx5_dev_filter_ctrl,
3008788fec1SOlivier Matz 	.rx_descriptor_status = mlx5_rx_descriptor_status,
3018788fec1SOlivier Matz 	.tx_descriptor_status = mlx5_tx_descriptor_status,
3023c7d44afSShahaf Shuler 	.rx_queue_intr_enable = mlx5_rx_intr_enable,
3033c7d44afSShahaf Shuler 	.rx_queue_intr_disable = mlx5_rx_intr_disable,
304771fa900SAdrien Mazarguil };
305771fa900SAdrien Mazarguil 
30687ec44ceSXueming Li static const struct eth_dev_ops mlx5_dev_sec_ops = {
30787ec44ceSXueming Li 	.stats_get = mlx5_stats_get,
30887ec44ceSXueming Li 	.stats_reset = mlx5_stats_reset,
30987ec44ceSXueming Li 	.xstats_get = mlx5_xstats_get,
31087ec44ceSXueming Li 	.xstats_reset = mlx5_xstats_reset,
31187ec44ceSXueming Li 	.xstats_get_names = mlx5_xstats_get_names,
31287ec44ceSXueming Li 	.dev_infos_get = mlx5_dev_infos_get,
31387ec44ceSXueming Li 	.rx_descriptor_status = mlx5_rx_descriptor_status,
31487ec44ceSXueming Li 	.tx_descriptor_status = mlx5_tx_descriptor_status,
31587ec44ceSXueming Li };
31687ec44ceSXueming Li 
3170887aa7fSNélio Laranjeiro /* Available operators in flow isolated mode. */
3180887aa7fSNélio Laranjeiro const struct eth_dev_ops mlx5_dev_ops_isolate = {
3190887aa7fSNélio Laranjeiro 	.dev_configure = mlx5_dev_configure,
3200887aa7fSNélio Laranjeiro 	.dev_start = mlx5_dev_start,
3210887aa7fSNélio Laranjeiro 	.dev_stop = mlx5_dev_stop,
3220887aa7fSNélio Laranjeiro 	.dev_set_link_down = mlx5_set_link_down,
3230887aa7fSNélio Laranjeiro 	.dev_set_link_up = mlx5_set_link_up,
3240887aa7fSNélio Laranjeiro 	.dev_close = mlx5_dev_close,
3250887aa7fSNélio Laranjeiro 	.link_update = mlx5_link_update,
3260887aa7fSNélio Laranjeiro 	.stats_get = mlx5_stats_get,
3270887aa7fSNélio Laranjeiro 	.stats_reset = mlx5_stats_reset,
3280887aa7fSNélio Laranjeiro 	.xstats_get = mlx5_xstats_get,
3290887aa7fSNélio Laranjeiro 	.xstats_reset = mlx5_xstats_reset,
3300887aa7fSNélio Laranjeiro 	.xstats_get_names = mlx5_xstats_get_names,
3310887aa7fSNélio Laranjeiro 	.dev_infos_get = mlx5_dev_infos_get,
3320887aa7fSNélio Laranjeiro 	.dev_supported_ptypes_get = mlx5_dev_supported_ptypes_get,
3330887aa7fSNélio Laranjeiro 	.vlan_filter_set = mlx5_vlan_filter_set,
3340887aa7fSNélio Laranjeiro 	.rx_queue_setup = mlx5_rx_queue_setup,
3350887aa7fSNélio Laranjeiro 	.tx_queue_setup = mlx5_tx_queue_setup,
3360887aa7fSNélio Laranjeiro 	.rx_queue_release = mlx5_rx_queue_release,
3370887aa7fSNélio Laranjeiro 	.tx_queue_release = mlx5_tx_queue_release,
3380887aa7fSNélio Laranjeiro 	.flow_ctrl_get = mlx5_dev_get_flow_ctrl,
3390887aa7fSNélio Laranjeiro 	.flow_ctrl_set = mlx5_dev_set_flow_ctrl,
3400887aa7fSNélio Laranjeiro 	.mac_addr_remove = mlx5_mac_addr_remove,
3410887aa7fSNélio Laranjeiro 	.mac_addr_add = mlx5_mac_addr_add,
3420887aa7fSNélio Laranjeiro 	.mac_addr_set = mlx5_mac_addr_set,
3430887aa7fSNélio Laranjeiro 	.mtu_set = mlx5_dev_set_mtu,
3440887aa7fSNélio Laranjeiro 	.vlan_strip_queue_set = mlx5_vlan_strip_queue_set,
3450887aa7fSNélio Laranjeiro 	.vlan_offload_set = mlx5_vlan_offload_set,
3460887aa7fSNélio Laranjeiro 	.filter_ctrl = mlx5_dev_filter_ctrl,
3470887aa7fSNélio Laranjeiro 	.rx_descriptor_status = mlx5_rx_descriptor_status,
3480887aa7fSNélio Laranjeiro 	.tx_descriptor_status = mlx5_tx_descriptor_status,
3490887aa7fSNélio Laranjeiro 	.rx_queue_intr_enable = mlx5_rx_intr_enable,
3500887aa7fSNélio Laranjeiro 	.rx_queue_intr_disable = mlx5_rx_intr_disable,
3510887aa7fSNélio Laranjeiro };
3520887aa7fSNélio Laranjeiro 
353771fa900SAdrien Mazarguil static struct {
354771fa900SAdrien Mazarguil 	struct rte_pci_addr pci_addr; /* associated PCI address */
355771fa900SAdrien Mazarguil 	uint32_t ports; /* physical ports bitfield. */
356771fa900SAdrien Mazarguil } mlx5_dev[32];
357771fa900SAdrien Mazarguil 
358771fa900SAdrien Mazarguil /**
359771fa900SAdrien Mazarguil  * Get device index in mlx5_dev[] from PCI bus address.
360771fa900SAdrien Mazarguil  *
361771fa900SAdrien Mazarguil  * @param[in] pci_addr
362771fa900SAdrien Mazarguil  *   PCI bus address to look for.
363771fa900SAdrien Mazarguil  *
364771fa900SAdrien Mazarguil  * @return
365771fa900SAdrien Mazarguil  *   mlx5_dev[] index on success, -1 on failure.
366771fa900SAdrien Mazarguil  */
367771fa900SAdrien Mazarguil static int
368771fa900SAdrien Mazarguil mlx5_dev_idx(struct rte_pci_addr *pci_addr)
369771fa900SAdrien Mazarguil {
370771fa900SAdrien Mazarguil 	unsigned int i;
371771fa900SAdrien Mazarguil 	int ret = -1;
372771fa900SAdrien Mazarguil 
373771fa900SAdrien Mazarguil 	assert(pci_addr != NULL);
374771fa900SAdrien Mazarguil 	for (i = 0; (i != RTE_DIM(mlx5_dev)); ++i) {
375771fa900SAdrien Mazarguil 		if ((mlx5_dev[i].pci_addr.domain == pci_addr->domain) &&
376771fa900SAdrien Mazarguil 		    (mlx5_dev[i].pci_addr.bus == pci_addr->bus) &&
377771fa900SAdrien Mazarguil 		    (mlx5_dev[i].pci_addr.devid == pci_addr->devid) &&
378771fa900SAdrien Mazarguil 		    (mlx5_dev[i].pci_addr.function == pci_addr->function))
379771fa900SAdrien Mazarguil 			return i;
380771fa900SAdrien Mazarguil 		if ((mlx5_dev[i].ports == 0) && (ret == -1))
381771fa900SAdrien Mazarguil 			ret = i;
382771fa900SAdrien Mazarguil 	}
383771fa900SAdrien Mazarguil 	return ret;
384771fa900SAdrien Mazarguil }
385771fa900SAdrien Mazarguil 
386e72dd09bSNélio Laranjeiro /**
387e72dd09bSNélio Laranjeiro  * Verify and store value for device argument.
388e72dd09bSNélio Laranjeiro  *
389e72dd09bSNélio Laranjeiro  * @param[in] key
390e72dd09bSNélio Laranjeiro  *   Key argument to verify.
391e72dd09bSNélio Laranjeiro  * @param[in] val
392e72dd09bSNélio Laranjeiro  *   Value associated with key.
393e72dd09bSNélio Laranjeiro  * @param opaque
394e72dd09bSNélio Laranjeiro  *   User data.
395e72dd09bSNélio Laranjeiro  *
396e72dd09bSNélio Laranjeiro  * @return
397e72dd09bSNélio Laranjeiro  *   0 on success, negative errno value on failure.
398e72dd09bSNélio Laranjeiro  */
399e72dd09bSNélio Laranjeiro static int
400e72dd09bSNélio Laranjeiro mlx5_args_check(const char *key, const char *val, void *opaque)
401e72dd09bSNélio Laranjeiro {
40250b244a1SShahaf Shuler 	struct mlx5_args *args = opaque;
40399c12dccSNélio Laranjeiro 	unsigned long tmp;
404e72dd09bSNélio Laranjeiro 
40599c12dccSNélio Laranjeiro 	errno = 0;
40699c12dccSNélio Laranjeiro 	tmp = strtoul(val, NULL, 0);
40799c12dccSNélio Laranjeiro 	if (errno) {
40899c12dccSNélio Laranjeiro 		WARN("%s: \"%s\" is not a valid integer", key, val);
40999c12dccSNélio Laranjeiro 		return errno;
41099c12dccSNélio Laranjeiro 	}
41199c12dccSNélio Laranjeiro 	if (strcmp(MLX5_RXQ_CQE_COMP_EN, key) == 0) {
41250b244a1SShahaf Shuler 		args->cqe_comp = !!tmp;
4132a66cf37SYaacov Hazan 	} else if (strcmp(MLX5_TXQ_INLINE, key) == 0) {
41450b244a1SShahaf Shuler 		args->txq_inline = tmp;
4152a66cf37SYaacov Hazan 	} else if (strcmp(MLX5_TXQS_MIN_INLINE, key) == 0) {
41650b244a1SShahaf Shuler 		args->txqs_inline = tmp;
417230189d9SNélio Laranjeiro 	} else if (strcmp(MLX5_TXQ_MPW_EN, key) == 0) {
41850b244a1SShahaf Shuler 		args->mps = !!tmp;
4196ce84bd8SYongseok Koh 	} else if (strcmp(MLX5_TXQ_MPW_HDR_DSEG_EN, key) == 0) {
42050b244a1SShahaf Shuler 		args->mpw_hdr_dseg = !!tmp;
4216ce84bd8SYongseok Koh 	} else if (strcmp(MLX5_TXQ_MAX_INLINE_LEN, key) == 0) {
42250b244a1SShahaf Shuler 		args->inline_max_packet_sz = tmp;
4233f13f8c2SShahaf Shuler 	} else if (strcmp(MLX5_TSO, key) == 0) {
42450b244a1SShahaf Shuler 		args->tso = !!tmp;
4255644d5b9SNelio Laranjeiro 	} else if (strcmp(MLX5_TX_VEC_EN, key) == 0) {
4265644d5b9SNelio Laranjeiro 		args->tx_vec_en = !!tmp;
4275644d5b9SNelio Laranjeiro 	} else if (strcmp(MLX5_RX_VEC_EN, key) == 0) {
4285644d5b9SNelio Laranjeiro 		args->rx_vec_en = !!tmp;
42999c12dccSNélio Laranjeiro 	} else {
430e72dd09bSNélio Laranjeiro 		WARN("%s: unknown parameter", key);
431e72dd09bSNélio Laranjeiro 		return -EINVAL;
432e72dd09bSNélio Laranjeiro 	}
43399c12dccSNélio Laranjeiro 	return 0;
43499c12dccSNélio Laranjeiro }
435e72dd09bSNélio Laranjeiro 
436e72dd09bSNélio Laranjeiro /**
437e72dd09bSNélio Laranjeiro  * Parse device parameters.
438e72dd09bSNélio Laranjeiro  *
439e72dd09bSNélio Laranjeiro  * @param priv
440e72dd09bSNélio Laranjeiro  *   Pointer to private structure.
441e72dd09bSNélio Laranjeiro  * @param devargs
442e72dd09bSNélio Laranjeiro  *   Device arguments structure.
443e72dd09bSNélio Laranjeiro  *
444e72dd09bSNélio Laranjeiro  * @return
445e72dd09bSNélio Laranjeiro  *   0 on success, errno value on failure.
446e72dd09bSNélio Laranjeiro  */
447e72dd09bSNélio Laranjeiro static int
44850b244a1SShahaf Shuler mlx5_args(struct mlx5_args *args, struct rte_devargs *devargs)
449e72dd09bSNélio Laranjeiro {
450e72dd09bSNélio Laranjeiro 	const char **params = (const char *[]){
45199c12dccSNélio Laranjeiro 		MLX5_RXQ_CQE_COMP_EN,
4522a66cf37SYaacov Hazan 		MLX5_TXQ_INLINE,
4532a66cf37SYaacov Hazan 		MLX5_TXQS_MIN_INLINE,
454230189d9SNélio Laranjeiro 		MLX5_TXQ_MPW_EN,
4556ce84bd8SYongseok Koh 		MLX5_TXQ_MPW_HDR_DSEG_EN,
4566ce84bd8SYongseok Koh 		MLX5_TXQ_MAX_INLINE_LEN,
4573f13f8c2SShahaf Shuler 		MLX5_TSO,
4585644d5b9SNelio Laranjeiro 		MLX5_TX_VEC_EN,
4595644d5b9SNelio Laranjeiro 		MLX5_RX_VEC_EN,
460e72dd09bSNélio Laranjeiro 		NULL,
461e72dd09bSNélio Laranjeiro 	};
462e72dd09bSNélio Laranjeiro 	struct rte_kvargs *kvlist;
463e72dd09bSNélio Laranjeiro 	int ret = 0;
464e72dd09bSNélio Laranjeiro 	int i;
465e72dd09bSNélio Laranjeiro 
466e72dd09bSNélio Laranjeiro 	if (devargs == NULL)
467e72dd09bSNélio Laranjeiro 		return 0;
468e72dd09bSNélio Laranjeiro 	/* Following UGLY cast is done to pass checkpatch. */
469e72dd09bSNélio Laranjeiro 	kvlist = rte_kvargs_parse(devargs->args, params);
470e72dd09bSNélio Laranjeiro 	if (kvlist == NULL)
471e72dd09bSNélio Laranjeiro 		return 0;
472e72dd09bSNélio Laranjeiro 	/* Process parameters. */
473e72dd09bSNélio Laranjeiro 	for (i = 0; (params[i] != NULL); ++i) {
474e72dd09bSNélio Laranjeiro 		if (rte_kvargs_count(kvlist, params[i])) {
475e72dd09bSNélio Laranjeiro 			ret = rte_kvargs_process(kvlist, params[i],
47650b244a1SShahaf Shuler 						 mlx5_args_check, args);
477a67323e4SShahaf Shuler 			if (ret != 0) {
478a67323e4SShahaf Shuler 				rte_kvargs_free(kvlist);
479e72dd09bSNélio Laranjeiro 				return ret;
480e72dd09bSNélio Laranjeiro 			}
481e72dd09bSNélio Laranjeiro 		}
482a67323e4SShahaf Shuler 	}
483e72dd09bSNélio Laranjeiro 	rte_kvargs_free(kvlist);
484e72dd09bSNélio Laranjeiro 	return 0;
485e72dd09bSNélio Laranjeiro }
486e72dd09bSNélio Laranjeiro 
487fdf91e0fSJan Blunck static struct rte_pci_driver mlx5_driver;
488771fa900SAdrien Mazarguil 
489771fa900SAdrien Mazarguil /**
49050b244a1SShahaf Shuler  * Assign parameters from args into priv, only non default
49150b244a1SShahaf Shuler  * values are considered.
49250b244a1SShahaf Shuler  *
49350b244a1SShahaf Shuler  * @param[out] priv
49450b244a1SShahaf Shuler  *   Pointer to private structure.
49550b244a1SShahaf Shuler  * @param[in] args
49650b244a1SShahaf Shuler  *   Pointer to args values.
49750b244a1SShahaf Shuler  */
49850b244a1SShahaf Shuler static void
49950b244a1SShahaf Shuler mlx5_args_assign(struct priv *priv, struct mlx5_args *args)
50050b244a1SShahaf Shuler {
50150b244a1SShahaf Shuler 	if (args->cqe_comp != MLX5_ARG_UNSET)
50250b244a1SShahaf Shuler 		priv->cqe_comp = args->cqe_comp;
50350b244a1SShahaf Shuler 	if (args->txq_inline != MLX5_ARG_UNSET)
50450b244a1SShahaf Shuler 		priv->txq_inline = args->txq_inline;
50550b244a1SShahaf Shuler 	if (args->txqs_inline != MLX5_ARG_UNSET)
50650b244a1SShahaf Shuler 		priv->txqs_inline = args->txqs_inline;
50750b244a1SShahaf Shuler 	if (args->mps != MLX5_ARG_UNSET)
50850b244a1SShahaf Shuler 		priv->mps = args->mps ? priv->mps : 0;
50950b244a1SShahaf Shuler 	if (args->mpw_hdr_dseg != MLX5_ARG_UNSET)
51050b244a1SShahaf Shuler 		priv->mpw_hdr_dseg = args->mpw_hdr_dseg;
51150b244a1SShahaf Shuler 	if (args->inline_max_packet_sz != MLX5_ARG_UNSET)
51250b244a1SShahaf Shuler 		priv->inline_max_packet_sz = args->inline_max_packet_sz;
51350b244a1SShahaf Shuler 	if (args->tso != MLX5_ARG_UNSET)
51450b244a1SShahaf Shuler 		priv->tso = args->tso;
5155644d5b9SNelio Laranjeiro 	if (args->tx_vec_en != MLX5_ARG_UNSET)
5165644d5b9SNelio Laranjeiro 		priv->tx_vec_en = args->tx_vec_en;
5175644d5b9SNelio Laranjeiro 	if (args->rx_vec_en != MLX5_ARG_UNSET)
5185644d5b9SNelio Laranjeiro 		priv->rx_vec_en = args->rx_vec_en;
51950b244a1SShahaf Shuler }
52050b244a1SShahaf Shuler 
52150b244a1SShahaf Shuler /**
522771fa900SAdrien Mazarguil  * DPDK callback to register a PCI device.
523771fa900SAdrien Mazarguil  *
524771fa900SAdrien Mazarguil  * This function creates an Ethernet device for each port of a given
525771fa900SAdrien Mazarguil  * PCI device.
526771fa900SAdrien Mazarguil  *
527771fa900SAdrien Mazarguil  * @param[in] pci_drv
528771fa900SAdrien Mazarguil  *   PCI driver structure (mlx5_driver).
529771fa900SAdrien Mazarguil  * @param[in] pci_dev
530771fa900SAdrien Mazarguil  *   PCI device information.
531771fa900SAdrien Mazarguil  *
532771fa900SAdrien Mazarguil  * @return
533771fa900SAdrien Mazarguil  *   0 on success, negative errno value on failure.
534771fa900SAdrien Mazarguil  */
535771fa900SAdrien Mazarguil static int
536af424af8SShreyansh Jain mlx5_pci_probe(struct rte_pci_driver *pci_drv, struct rte_pci_device *pci_dev)
537771fa900SAdrien Mazarguil {
538771fa900SAdrien Mazarguil 	struct ibv_device **list;
539771fa900SAdrien Mazarguil 	struct ibv_device *ibv_dev;
540771fa900SAdrien Mazarguil 	int err = 0;
541771fa900SAdrien Mazarguil 	struct ibv_context *attr_ctx = NULL;
54243e9d979SShachar Beiser 	struct ibv_device_attr_ex device_attr;
54385e347dbSNélio Laranjeiro 	unsigned int sriov;
544e192ef80SYaacov Hazan 	unsigned int mps;
545523f5a74SYongseok Koh 	unsigned int cqe_comp;
546772d3435SXueming Li 	unsigned int tunnel_en = 0;
547771fa900SAdrien Mazarguil 	int idx;
548771fa900SAdrien Mazarguil 	int i;
54943e9d979SShachar Beiser 	struct mlx5dv_context attrs_out;
5509a761de8SOri Kam #ifdef HAVE_IBV_DEVICE_COUNTERS_SET_SUPPORT
5519a761de8SOri Kam 	struct ibv_counter_set_description cs_desc;
5529a761de8SOri Kam #endif
553771fa900SAdrien Mazarguil 
554771fa900SAdrien Mazarguil 	(void)pci_drv;
555fdf91e0fSJan Blunck 	assert(pci_drv == &mlx5_driver);
556771fa900SAdrien Mazarguil 	/* Get mlx5_dev[] index. */
557771fa900SAdrien Mazarguil 	idx = mlx5_dev_idx(&pci_dev->addr);
558771fa900SAdrien Mazarguil 	if (idx == -1) {
559771fa900SAdrien Mazarguil 		ERROR("this driver cannot support any more adapters");
560771fa900SAdrien Mazarguil 		return -ENOMEM;
561771fa900SAdrien Mazarguil 	}
562771fa900SAdrien Mazarguil 	DEBUG("using driver device index %d", idx);
563771fa900SAdrien Mazarguil 
564771fa900SAdrien Mazarguil 	/* Save PCI address. */
565771fa900SAdrien Mazarguil 	mlx5_dev[idx].pci_addr = pci_dev->addr;
566771fa900SAdrien Mazarguil 	list = ibv_get_device_list(&i);
567771fa900SAdrien Mazarguil 	if (list == NULL) {
568771fa900SAdrien Mazarguil 		assert(errno);
5695525aa8fSGaetan Rivet 		if (errno == ENOSYS)
5705525aa8fSGaetan Rivet 			ERROR("cannot list devices, is ib_uverbs loaded?");
571771fa900SAdrien Mazarguil 		return -errno;
572771fa900SAdrien Mazarguil 	}
573771fa900SAdrien Mazarguil 	assert(i >= 0);
574771fa900SAdrien Mazarguil 	/*
575771fa900SAdrien Mazarguil 	 * For each listed device, check related sysfs entry against
576771fa900SAdrien Mazarguil 	 * the provided PCI ID.
577771fa900SAdrien Mazarguil 	 */
578771fa900SAdrien Mazarguil 	while (i != 0) {
579771fa900SAdrien Mazarguil 		struct rte_pci_addr pci_addr;
580771fa900SAdrien Mazarguil 
581771fa900SAdrien Mazarguil 		--i;
582771fa900SAdrien Mazarguil 		DEBUG("checking device \"%s\"", list[i]->name);
583771fa900SAdrien Mazarguil 		if (mlx5_ibv_device_to_pci_addr(list[i], &pci_addr))
584771fa900SAdrien Mazarguil 			continue;
585771fa900SAdrien Mazarguil 		if ((pci_dev->addr.domain != pci_addr.domain) ||
586771fa900SAdrien Mazarguil 		    (pci_dev->addr.bus != pci_addr.bus) ||
587771fa900SAdrien Mazarguil 		    (pci_dev->addr.devid != pci_addr.devid) ||
588771fa900SAdrien Mazarguil 		    (pci_dev->addr.function != pci_addr.function))
589771fa900SAdrien Mazarguil 			continue;
59085e347dbSNélio Laranjeiro 		sriov = ((pci_dev->id.device_id ==
591771fa900SAdrien Mazarguil 		       PCI_DEVICE_ID_MELLANOX_CONNECTX4VF) ||
592771fa900SAdrien Mazarguil 		      (pci_dev->id.device_id ==
593528a9fbeSYongseok Koh 		       PCI_DEVICE_ID_MELLANOX_CONNECTX4LXVF) ||
594528a9fbeSYongseok Koh 		      (pci_dev->id.device_id ==
595528a9fbeSYongseok Koh 		       PCI_DEVICE_ID_MELLANOX_CONNECTX5VF) ||
596528a9fbeSYongseok Koh 		      (pci_dev->id.device_id ==
597528a9fbeSYongseok Koh 		       PCI_DEVICE_ID_MELLANOX_CONNECTX5EXVF));
598528a9fbeSYongseok Koh 		switch (pci_dev->id.device_id) {
599f5fde520SShahaf Shuler 		case PCI_DEVICE_ID_MELLANOX_CONNECTX4:
600f5fde520SShahaf Shuler 			tunnel_en = 1;
601f5fde520SShahaf Shuler 			break;
602528a9fbeSYongseok Koh 		case PCI_DEVICE_ID_MELLANOX_CONNECTX4LX:
603528a9fbeSYongseok Koh 		case PCI_DEVICE_ID_MELLANOX_CONNECTX5:
604528a9fbeSYongseok Koh 		case PCI_DEVICE_ID_MELLANOX_CONNECTX5VF:
605528a9fbeSYongseok Koh 		case PCI_DEVICE_ID_MELLANOX_CONNECTX5EX:
606528a9fbeSYongseok Koh 		case PCI_DEVICE_ID_MELLANOX_CONNECTX5EXVF:
607f5fde520SShahaf Shuler 			tunnel_en = 1;
608528a9fbeSYongseok Koh 			break;
609528a9fbeSYongseok Koh 		default:
61043e9d979SShachar Beiser 			break;
611528a9fbeSYongseok Koh 		}
61285e347dbSNélio Laranjeiro 		INFO("PCI information matches, using device \"%s\""
61343e9d979SShachar Beiser 		     " (SR-IOV: %s)",
614e192ef80SYaacov Hazan 		     list[i]->name,
61543e9d979SShachar Beiser 		     sriov ? "true" : "false");
616771fa900SAdrien Mazarguil 		attr_ctx = ibv_open_device(list[i]);
617771fa900SAdrien Mazarguil 		err = errno;
618771fa900SAdrien Mazarguil 		break;
619771fa900SAdrien Mazarguil 	}
620771fa900SAdrien Mazarguil 	if (attr_ctx == NULL) {
621771fa900SAdrien Mazarguil 		ibv_free_device_list(list);
622771fa900SAdrien Mazarguil 		switch (err) {
623771fa900SAdrien Mazarguil 		case 0:
6245525aa8fSGaetan Rivet 			ERROR("cannot access device, is mlx5_ib loaded?");
6255525aa8fSGaetan Rivet 			return -ENODEV;
626771fa900SAdrien Mazarguil 		case EINVAL:
6275525aa8fSGaetan Rivet 			ERROR("cannot use device, are drivers up to date?");
6285525aa8fSGaetan Rivet 			return -EINVAL;
629771fa900SAdrien Mazarguil 		}
630771fa900SAdrien Mazarguil 		assert(err > 0);
631771fa900SAdrien Mazarguil 		return -err;
632771fa900SAdrien Mazarguil 	}
633771fa900SAdrien Mazarguil 	ibv_dev = list[i];
634771fa900SAdrien Mazarguil 
635771fa900SAdrien Mazarguil 	DEBUG("device opened");
63643e9d979SShachar Beiser 	/*
63743e9d979SShachar Beiser 	 * Multi-packet send is supported by ConnectX-4 Lx PF as well
63843e9d979SShachar Beiser 	 * as all ConnectX-5 devices.
63943e9d979SShachar Beiser 	 */
64043e9d979SShachar Beiser 	mlx5dv_query_device(attr_ctx, &attrs_out);
641e589960cSYongseok Koh 	if (attrs_out.flags & MLX5DV_CONTEXT_FLAGS_MPW_ALLOWED) {
642e589960cSYongseok Koh 		if (attrs_out.flags & MLX5DV_CONTEXT_FLAGS_ENHANCED_MPW) {
643e589960cSYongseok Koh 			DEBUG("Enhanced MPW is supported");
64443e9d979SShachar Beiser 			mps = MLX5_MPW_ENHANCED;
64543e9d979SShachar Beiser 		} else {
646e589960cSYongseok Koh 			DEBUG("MPW is supported");
647e589960cSYongseok Koh 			mps = MLX5_MPW;
648e589960cSYongseok Koh 		}
649e589960cSYongseok Koh 	} else {
650e589960cSYongseok Koh 		DEBUG("MPW isn't supported");
65143e9d979SShachar Beiser 		mps = MLX5_MPW_DISABLED;
65243e9d979SShachar Beiser 	}
653523f5a74SYongseok Koh 	if (RTE_CACHE_LINE_SIZE == 128 &&
654523f5a74SYongseok Koh 	    !(attrs_out.flags & MLX5DV_CONTEXT_FLAGS_CQE_128B_COMP))
655523f5a74SYongseok Koh 		cqe_comp = 0;
656523f5a74SYongseok Koh 	else
657523f5a74SYongseok Koh 		cqe_comp = 1;
65843e9d979SShachar Beiser 	if (ibv_query_device_ex(attr_ctx, NULL, &device_attr))
659771fa900SAdrien Mazarguil 		goto error;
66043e9d979SShachar Beiser 	INFO("%u port(s) detected", device_attr.orig_attr.phys_port_cnt);
661771fa900SAdrien Mazarguil 
66243e9d979SShachar Beiser 	for (i = 0; i < device_attr.orig_attr.phys_port_cnt; i++) {
663771fa900SAdrien Mazarguil 		uint32_t port = i + 1; /* ports are indexed from one */
664771fa900SAdrien Mazarguil 		uint32_t test = (1 << i);
665771fa900SAdrien Mazarguil 		struct ibv_context *ctx = NULL;
666771fa900SAdrien Mazarguil 		struct ibv_port_attr port_attr;
667771fa900SAdrien Mazarguil 		struct ibv_pd *pd = NULL;
668771fa900SAdrien Mazarguil 		struct priv *priv = NULL;
669771fa900SAdrien Mazarguil 		struct rte_eth_dev *eth_dev;
67043e9d979SShachar Beiser 		struct ibv_device_attr_ex device_attr_ex;
671771fa900SAdrien Mazarguil 		struct ether_addr mac;
67285e347dbSNélio Laranjeiro 		uint16_t num_vfs = 0;
6739a761de8SOri Kam 		struct ibv_device_attr_ex device_attr;
67450b244a1SShahaf Shuler 		struct mlx5_args args = {
67550b244a1SShahaf Shuler 			.cqe_comp = MLX5_ARG_UNSET,
67650b244a1SShahaf Shuler 			.txq_inline = MLX5_ARG_UNSET,
67750b244a1SShahaf Shuler 			.txqs_inline = MLX5_ARG_UNSET,
67850b244a1SShahaf Shuler 			.mps = MLX5_ARG_UNSET,
67950b244a1SShahaf Shuler 			.mpw_hdr_dseg = MLX5_ARG_UNSET,
68050b244a1SShahaf Shuler 			.inline_max_packet_sz = MLX5_ARG_UNSET,
68150b244a1SShahaf Shuler 			.tso = MLX5_ARG_UNSET,
6825644d5b9SNelio Laranjeiro 			.tx_vec_en = MLX5_ARG_UNSET,
6835644d5b9SNelio Laranjeiro 			.rx_vec_en = MLX5_ARG_UNSET,
68450b244a1SShahaf Shuler 		};
685771fa900SAdrien Mazarguil 
686f8b9a3baSXueming Li 		mlx5_dev[idx].ports |= test;
687f8b9a3baSXueming Li 
688*51e7fa8dSNélio Laranjeiro 		if (rte_eal_process_type() == RTE_PROC_SECONDARY) {
689f8b9a3baSXueming Li 			/* from rte_ethdev.c */
690f8b9a3baSXueming Li 			char name[RTE_ETH_NAME_MAX_LEN];
691f8b9a3baSXueming Li 
692f8b9a3baSXueming Li 			snprintf(name, sizeof(name), "%s port %u",
693f8b9a3baSXueming Li 				 ibv_get_device_name(ibv_dev), port);
694f8b9a3baSXueming Li 			eth_dev = rte_eth_dev_attach_secondary(name);
695f8b9a3baSXueming Li 			if (eth_dev == NULL) {
696f8b9a3baSXueming Li 				ERROR("can not attach rte ethdev");
697f8b9a3baSXueming Li 				err = ENOMEM;
698f8b9a3baSXueming Li 				goto error;
699f8b9a3baSXueming Li 			}
700f8b9a3baSXueming Li 			eth_dev->device = &pci_dev->device;
70187ec44ceSXueming Li 			eth_dev->dev_ops = &mlx5_dev_sec_ops;
702f8b9a3baSXueming Li 			priv = eth_dev->data->dev_private;
703f8b9a3baSXueming Li 			/* Receive command fd from primary process */
704f8b9a3baSXueming Li 			err = priv_socket_connect(priv);
705f8b9a3baSXueming Li 			if (err < 0) {
706f8b9a3baSXueming Li 				err = -err;
707f8b9a3baSXueming Li 				goto error;
708f8b9a3baSXueming Li 			}
709f8b9a3baSXueming Li 			/* Remap UAR for Tx queues. */
710f8b9a3baSXueming Li 			err = priv_tx_uar_remap(priv, err);
711f8b9a3baSXueming Li 			if (err < 0) {
712f8b9a3baSXueming Li 				err = -err;
713f8b9a3baSXueming Li 				goto error;
714f8b9a3baSXueming Li 			}
715f8b9a3baSXueming Li 			priv_dev_select_rx_function(priv, eth_dev);
716f8b9a3baSXueming Li 			priv_dev_select_tx_function(priv, eth_dev);
717f8b9a3baSXueming Li 			continue;
718f8b9a3baSXueming Li 		}
719f8b9a3baSXueming Li 
720771fa900SAdrien Mazarguil 		DEBUG("using port %u (%08" PRIx32 ")", port, test);
721771fa900SAdrien Mazarguil 
722771fa900SAdrien Mazarguil 		ctx = ibv_open_device(ibv_dev);
723e1c3e305SMatan Azrad 		if (ctx == NULL) {
724e1c3e305SMatan Azrad 			err = ENODEV;
725771fa900SAdrien Mazarguil 			goto port_error;
726e1c3e305SMatan Azrad 		}
727771fa900SAdrien Mazarguil 
7289a761de8SOri Kam 		ibv_query_device_ex(ctx, NULL, &device_attr);
729771fa900SAdrien Mazarguil 		/* Check port status. */
730771fa900SAdrien Mazarguil 		err = ibv_query_port(ctx, port, &port_attr);
731771fa900SAdrien Mazarguil 		if (err) {
732771fa900SAdrien Mazarguil 			ERROR("port query failed: %s", strerror(err));
733771fa900SAdrien Mazarguil 			goto port_error;
734771fa900SAdrien Mazarguil 		}
7351371f4dfSOr Ami 
7361371f4dfSOr Ami 		if (port_attr.link_layer != IBV_LINK_LAYER_ETHERNET) {
7371371f4dfSOr Ami 			ERROR("port %d is not configured in Ethernet mode",
7381371f4dfSOr Ami 			      port);
739e1c3e305SMatan Azrad 			err = EINVAL;
7401371f4dfSOr Ami 			goto port_error;
7411371f4dfSOr Ami 		}
7421371f4dfSOr Ami 
743771fa900SAdrien Mazarguil 		if (port_attr.state != IBV_PORT_ACTIVE)
744771fa900SAdrien Mazarguil 			DEBUG("port %d is not active: \"%s\" (%d)",
745771fa900SAdrien Mazarguil 			      port, ibv_port_state_str(port_attr.state),
746771fa900SAdrien Mazarguil 			      port_attr.state);
747771fa900SAdrien Mazarguil 
748771fa900SAdrien Mazarguil 		/* Allocate protection domain. */
749771fa900SAdrien Mazarguil 		pd = ibv_alloc_pd(ctx);
750771fa900SAdrien Mazarguil 		if (pd == NULL) {
751771fa900SAdrien Mazarguil 			ERROR("PD allocation failure");
752771fa900SAdrien Mazarguil 			err = ENOMEM;
753771fa900SAdrien Mazarguil 			goto port_error;
754771fa900SAdrien Mazarguil 		}
755771fa900SAdrien Mazarguil 
756771fa900SAdrien Mazarguil 		mlx5_dev[idx].ports |= test;
757771fa900SAdrien Mazarguil 
758771fa900SAdrien Mazarguil 		/* from rte_ethdev.c */
759771fa900SAdrien Mazarguil 		priv = rte_zmalloc("ethdev private structure",
760771fa900SAdrien Mazarguil 				   sizeof(*priv),
761771fa900SAdrien Mazarguil 				   RTE_CACHE_LINE_SIZE);
762771fa900SAdrien Mazarguil 		if (priv == NULL) {
763771fa900SAdrien Mazarguil 			ERROR("priv allocation failure");
764771fa900SAdrien Mazarguil 			err = ENOMEM;
765771fa900SAdrien Mazarguil 			goto port_error;
766771fa900SAdrien Mazarguil 		}
767771fa900SAdrien Mazarguil 
768771fa900SAdrien Mazarguil 		priv->ctx = ctx;
76987ec44ceSXueming Li 		strncpy(priv->ibdev_path, priv->ctx->device->ibdev_path,
77087ec44ceSXueming Li 			sizeof(priv->ibdev_path));
771771fa900SAdrien Mazarguil 		priv->device_attr = device_attr;
772771fa900SAdrien Mazarguil 		priv->port = port;
773771fa900SAdrien Mazarguil 		priv->pd = pd;
774771fa900SAdrien Mazarguil 		priv->mtu = ETHER_MTU;
775230189d9SNélio Laranjeiro 		priv->mps = mps; /* Enable MPW by default if supported. */
776523f5a74SYongseok Koh 		priv->cqe_comp = cqe_comp;
777f5fde520SShahaf Shuler 		priv->tunnel_en = tunnel_en;
7785644d5b9SNelio Laranjeiro 		/* Enable vector by default if supported. */
7795644d5b9SNelio Laranjeiro 		priv->tx_vec_en = 1;
7805644d5b9SNelio Laranjeiro 		priv->rx_vec_en = 1;
78150b244a1SShahaf Shuler 		err = mlx5_args(&args, pci_dev->device.devargs);
782e72dd09bSNélio Laranjeiro 		if (err) {
783e72dd09bSNélio Laranjeiro 			ERROR("failed to process device arguments: %s",
784e72dd09bSNélio Laranjeiro 			      strerror(err));
785e72dd09bSNélio Laranjeiro 			goto port_error;
786e72dd09bSNélio Laranjeiro 		}
78750b244a1SShahaf Shuler 		mlx5_args_assign(priv, &args);
78843e9d979SShachar Beiser 		if (ibv_query_device_ex(ctx, NULL, &device_attr_ex)) {
78943e9d979SShachar Beiser 			ERROR("ibv_query_device_ex() failed");
790771fa900SAdrien Mazarguil 			goto port_error;
791771fa900SAdrien Mazarguil 		}
792771fa900SAdrien Mazarguil 
793771fa900SAdrien Mazarguil 		priv->hw_csum =
79443e9d979SShachar Beiser 			!!(device_attr_ex.device_cap_flags_ex &
79543e9d979SShachar Beiser 			   IBV_DEVICE_RAW_IP_CSUM);
796771fa900SAdrien Mazarguil 		DEBUG("checksum offloading is %ssupported",
797771fa900SAdrien Mazarguil 		      (priv->hw_csum ? "" : "not "));
798771fa900SAdrien Mazarguil 
79943e9d979SShachar Beiser #ifdef HAVE_IBV_DEVICE_VXLAN_SUPPORT
800771fa900SAdrien Mazarguil 		priv->hw_csum_l2tun = !!(exp_device_attr.exp_device_cap_flags &
80143e9d979SShachar Beiser 					 IBV_DEVICE_VXLAN_SUPPORT);
80243e9d979SShachar Beiser #endif
803771fa900SAdrien Mazarguil 		DEBUG("L2 tunnel checksum offloads are %ssupported",
804771fa900SAdrien Mazarguil 		      (priv->hw_csum_l2tun ? "" : "not "));
805771fa900SAdrien Mazarguil 
8069a761de8SOri Kam #ifdef HAVE_IBV_DEVICE_COUNTERS_SET_SUPPORT
8079a761de8SOri Kam 		priv->counter_set_supported = !!(device_attr.max_counter_sets);
8089a761de8SOri Kam 		ibv_describe_counter_set(ctx, 0, &cs_desc);
8099a761de8SOri Kam 		DEBUG("counter type = %d, num of cs = %ld, attributes = %d",
8109a761de8SOri Kam 		      cs_desc.counter_type, cs_desc.num_of_cs,
8119a761de8SOri Kam 		      cs_desc.attributes);
8129a761de8SOri Kam #endif
81343e9d979SShachar Beiser 		priv->ind_table_max_size =
81443e9d979SShachar Beiser 			device_attr_ex.rss_caps.max_rwq_indirection_table_size;
81513d57bd5SAdrien Mazarguil 		/* Remove this check once DPDK supports larger/variable
81613d57bd5SAdrien Mazarguil 		 * indirection tables. */
817ec1fed22SYongseok Koh 		if (priv->ind_table_max_size >
818ec1fed22SYongseok Koh 				(unsigned int)ETH_RSS_RETA_SIZE_512)
819ec1fed22SYongseok Koh 			priv->ind_table_max_size = ETH_RSS_RETA_SIZE_512;
82095e16ef3SNelio Laranjeiro 		DEBUG("maximum RX indirection table size is %u",
82195e16ef3SNelio Laranjeiro 		      priv->ind_table_max_size);
82243e9d979SShachar Beiser 		priv->hw_vlan_strip = !!(device_attr_ex.raw_packet_caps &
82343e9d979SShachar Beiser 					 IBV_RAW_PACKET_CAP_CVLAN_STRIPPING);
824f3db9489SYaacov Hazan 		DEBUG("VLAN stripping is %ssupported",
825f3db9489SYaacov Hazan 		      (priv->hw_vlan_strip ? "" : "not "));
82695e16ef3SNelio Laranjeiro 
82743e9d979SShachar Beiser 		priv->hw_fcs_strip =
82843e9d979SShachar Beiser 				!!(device_attr_ex.orig_attr.device_cap_flags &
82943e9d979SShachar Beiser 				IBV_WQ_FLAGS_SCATTER_FCS);
8304d326709SOlga Shern 		DEBUG("FCS stripping configuration is %ssupported",
8314d326709SOlga Shern 		      (priv->hw_fcs_strip ? "" : "not "));
8324d326709SOlga Shern 
83343e9d979SShachar Beiser #ifdef HAVE_IBV_WQ_FLAG_RX_END_PADDING
83443e9d979SShachar Beiser 		priv->hw_padding = !!device_attr_ex.rx_pad_end_addr_align;
83543e9d979SShachar Beiser #endif
8364d803a72SOlga Shern 		DEBUG("hardware RX end alignment padding is %ssupported",
8374d803a72SOlga Shern 		      (priv->hw_padding ? "" : "not "));
8384d803a72SOlga Shern 
83985e347dbSNélio Laranjeiro 		priv_get_num_vfs(priv, &num_vfs);
84085e347dbSNélio Laranjeiro 		priv->sriov = (num_vfs || sriov);
8413f13f8c2SShahaf Shuler 		priv->tso = ((priv->tso) &&
84243e9d979SShachar Beiser 			    (device_attr_ex.tso_caps.max_tso > 0) &&
84343e9d979SShachar Beiser 			    (device_attr_ex.tso_caps.supported_qpts &
84443e9d979SShachar Beiser 			    (1 << IBV_QPT_RAW_PACKET)));
8453f13f8c2SShahaf Shuler 		if (priv->tso)
8463f13f8c2SShahaf Shuler 			priv->max_tso_payload_sz =
84743e9d979SShachar Beiser 				device_attr_ex.tso_caps.max_tso;
848230189d9SNélio Laranjeiro 		if (priv->mps && !mps) {
849230189d9SNélio Laranjeiro 			ERROR("multi-packet send not supported on this device"
850230189d9SNélio Laranjeiro 			      " (" MLX5_TXQ_MPW_EN ")");
851230189d9SNélio Laranjeiro 			err = ENOTSUP;
852230189d9SNélio Laranjeiro 			goto port_error;
8533f13f8c2SShahaf Shuler 		} else if (priv->mps && priv->tso) {
8543f13f8c2SShahaf Shuler 			WARN("multi-packet send not supported in conjunction "
8553f13f8c2SShahaf Shuler 			      "with TSO. MPS disabled");
8563f13f8c2SShahaf Shuler 			priv->mps = 0;
857230189d9SNélio Laranjeiro 		}
8586ce84bd8SYongseok Koh 		INFO("%sMPS is %s",
8596ce84bd8SYongseok Koh 		     priv->mps == MLX5_MPW_ENHANCED ? "Enhanced " : "",
8606ce84bd8SYongseok Koh 		     priv->mps != MLX5_MPW_DISABLED ? "enabled" : "disabled");
8612dfbbd92SShahaf Shuler 		/* Set default values for Enhanced MPW, a.k.a MPWv2. */
8622dfbbd92SShahaf Shuler 		if (priv->mps == MLX5_MPW_ENHANCED) {
8632dfbbd92SShahaf Shuler 			if (args.txqs_inline == MLX5_ARG_UNSET)
8642dfbbd92SShahaf Shuler 				priv->txqs_inline = MLX5_EMPW_MIN_TXQS;
8652dfbbd92SShahaf Shuler 			if (args.inline_max_packet_sz == MLX5_ARG_UNSET)
8662dfbbd92SShahaf Shuler 				priv->inline_max_packet_sz =
8672dfbbd92SShahaf Shuler 					MLX5_EMPW_MAX_INLINE_LEN;
8682dfbbd92SShahaf Shuler 			if (args.txq_inline == MLX5_ARG_UNSET)
8692dfbbd92SShahaf Shuler 				priv->txq_inline = MLX5_WQE_SIZE_MAX -
8702dfbbd92SShahaf Shuler 						   MLX5_WQE_SIZE;
8712dfbbd92SShahaf Shuler 		}
872523f5a74SYongseok Koh 		if (priv->cqe_comp && !cqe_comp) {
873523f5a74SYongseok Koh 			WARN("Rx CQE compression isn't supported");
874523f5a74SYongseok Koh 			priv->cqe_comp = 0;
875523f5a74SYongseok Koh 		}
876771fa900SAdrien Mazarguil 		/* Configure the first MAC address by default. */
877771fa900SAdrien Mazarguil 		if (priv_get_mac(priv, &mac.addr_bytes)) {
878771fa900SAdrien Mazarguil 			ERROR("cannot get MAC address, is mlx5_en loaded?"
879771fa900SAdrien Mazarguil 			      " (errno: %s)", strerror(errno));
880e1c3e305SMatan Azrad 			err = ENODEV;
881771fa900SAdrien Mazarguil 			goto port_error;
882771fa900SAdrien Mazarguil 		}
883771fa900SAdrien Mazarguil 		INFO("port %u MAC address is %02x:%02x:%02x:%02x:%02x:%02x",
884771fa900SAdrien Mazarguil 		     priv->port,
885771fa900SAdrien Mazarguil 		     mac.addr_bytes[0], mac.addr_bytes[1],
886771fa900SAdrien Mazarguil 		     mac.addr_bytes[2], mac.addr_bytes[3],
887771fa900SAdrien Mazarguil 		     mac.addr_bytes[4], mac.addr_bytes[5]);
888771fa900SAdrien Mazarguil #ifndef NDEBUG
889771fa900SAdrien Mazarguil 		{
890771fa900SAdrien Mazarguil 			char ifname[IF_NAMESIZE];
891771fa900SAdrien Mazarguil 
892771fa900SAdrien Mazarguil 			if (priv_get_ifname(priv, &ifname) == 0)
893771fa900SAdrien Mazarguil 				DEBUG("port %u ifname is \"%s\"",
894771fa900SAdrien Mazarguil 				      priv->port, ifname);
895771fa900SAdrien Mazarguil 			else
896771fa900SAdrien Mazarguil 				DEBUG("port %u ifname is unknown", priv->port);
897771fa900SAdrien Mazarguil 		}
898771fa900SAdrien Mazarguil #endif
899771fa900SAdrien Mazarguil 		/* Get actual MTU if possible. */
900771fa900SAdrien Mazarguil 		priv_get_mtu(priv, &priv->mtu);
901771fa900SAdrien Mazarguil 		DEBUG("port %u MTU is %u", priv->port, priv->mtu);
902771fa900SAdrien Mazarguil 
903771fa900SAdrien Mazarguil 		/* from rte_ethdev.c */
904771fa900SAdrien Mazarguil 		{
905771fa900SAdrien Mazarguil 			char name[RTE_ETH_NAME_MAX_LEN];
906771fa900SAdrien Mazarguil 
907771fa900SAdrien Mazarguil 			snprintf(name, sizeof(name), "%s port %u",
908771fa900SAdrien Mazarguil 				 ibv_get_device_name(ibv_dev), port);
9096751f6deSDavid Marchand 			eth_dev = rte_eth_dev_allocate(name);
910771fa900SAdrien Mazarguil 		}
911771fa900SAdrien Mazarguil 		if (eth_dev == NULL) {
912771fa900SAdrien Mazarguil 			ERROR("can not allocate rte ethdev");
913771fa900SAdrien Mazarguil 			err = ENOMEM;
914771fa900SAdrien Mazarguil 			goto port_error;
915771fa900SAdrien Mazarguil 		}
916771fa900SAdrien Mazarguil 		eth_dev->data->dev_private = priv;
917a48deadaSOr Ami 		eth_dev->data->mac_addrs = priv->mac;
918eac901ceSJan Blunck 		eth_dev->device = &pci_dev->device;
919a48deadaSOr Ami 		rte_eth_copy_pci_info(eth_dev, pci_dev);
920fdf91e0fSJan Blunck 		eth_dev->device->driver = &mlx5_driver.driver;
921771fa900SAdrien Mazarguil 		priv->dev = eth_dev;
922771fa900SAdrien Mazarguil 		eth_dev->dev_ops = &mlx5_dev_ops;
923272733b5SNélio Laranjeiro 		/* Register MAC address. */
924272733b5SNélio Laranjeiro 		claim_zero(mlx5_mac_addr_add(eth_dev, &mac, 0, 0));
925c8ffb8a9SNélio Laranjeiro 		TAILQ_INIT(&priv->flows);
9261b37f5d8SNélio Laranjeiro 		TAILQ_INIT(&priv->ctrl_flows);
927a48deadaSOr Ami 
9281e3a39f7SXueming Li 		/* Hint libmlx5 to use PMD allocator for data plane resources */
9291e3a39f7SXueming Li 		struct mlx5dv_ctx_allocators alctr = {
9301e3a39f7SXueming Li 			.alloc = &mlx5_alloc_verbs_buf,
9311e3a39f7SXueming Li 			.free = &mlx5_free_verbs_buf,
9321e3a39f7SXueming Li 			.data = priv,
9331e3a39f7SXueming Li 		};
9341e3a39f7SXueming Li 		mlx5dv_set_context_attr(ctx, MLX5DV_CTX_ATTR_BUF_ALLOCATORS,
9351e3a39f7SXueming Li 					(void *)((uintptr_t)&alctr));
9361e3a39f7SXueming Li 
937771fa900SAdrien Mazarguil 		/* Bring Ethernet device up. */
938771fa900SAdrien Mazarguil 		DEBUG("forcing Ethernet interface up");
939771fa900SAdrien Mazarguil 		priv_set_flags(priv, ~IFF_UP, IFF_UP);
9402c960a51SMatthieu Ternisien d'Ouville 		mlx5_link_update(priv->dev, 1);
941771fa900SAdrien Mazarguil 		continue;
942771fa900SAdrien Mazarguil 
943771fa900SAdrien Mazarguil port_error:
94429c1d8bbSNélio Laranjeiro 		if (priv)
945771fa900SAdrien Mazarguil 			rte_free(priv);
946771fa900SAdrien Mazarguil 		if (pd)
947771fa900SAdrien Mazarguil 			claim_zero(ibv_dealloc_pd(pd));
948771fa900SAdrien Mazarguil 		if (ctx)
949771fa900SAdrien Mazarguil 			claim_zero(ibv_close_device(ctx));
950771fa900SAdrien Mazarguil 		break;
951771fa900SAdrien Mazarguil 	}
952771fa900SAdrien Mazarguil 
953771fa900SAdrien Mazarguil 	/*
954771fa900SAdrien Mazarguil 	 * XXX if something went wrong in the loop above, there is a resource
955771fa900SAdrien Mazarguil 	 * leak (ctx, pd, priv, dpdk ethdev) but we can do nothing about it as
956771fa900SAdrien Mazarguil 	 * long as the dpdk does not provide a way to deallocate a ethdev and a
957771fa900SAdrien Mazarguil 	 * way to enumerate the registered ethdevs to free the previous ones.
958771fa900SAdrien Mazarguil 	 */
959771fa900SAdrien Mazarguil 
960771fa900SAdrien Mazarguil 	/* no port found, complain */
961771fa900SAdrien Mazarguil 	if (!mlx5_dev[idx].ports) {
962771fa900SAdrien Mazarguil 		err = ENODEV;
963771fa900SAdrien Mazarguil 		goto error;
964771fa900SAdrien Mazarguil 	}
965771fa900SAdrien Mazarguil 
966771fa900SAdrien Mazarguil error:
967771fa900SAdrien Mazarguil 	if (attr_ctx)
968771fa900SAdrien Mazarguil 		claim_zero(ibv_close_device(attr_ctx));
969771fa900SAdrien Mazarguil 	if (list)
970771fa900SAdrien Mazarguil 		ibv_free_device_list(list);
971771fa900SAdrien Mazarguil 	assert(err >= 0);
972771fa900SAdrien Mazarguil 	return -err;
973771fa900SAdrien Mazarguil }
974771fa900SAdrien Mazarguil 
975771fa900SAdrien Mazarguil static const struct rte_pci_id mlx5_pci_id_map[] = {
976771fa900SAdrien Mazarguil 	{
9771d1bc870SNélio Laranjeiro 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
9781d1bc870SNélio Laranjeiro 			       PCI_DEVICE_ID_MELLANOX_CONNECTX4)
979771fa900SAdrien Mazarguil 	},
980771fa900SAdrien Mazarguil 	{
9811d1bc870SNélio Laranjeiro 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
9821d1bc870SNélio Laranjeiro 			       PCI_DEVICE_ID_MELLANOX_CONNECTX4VF)
983771fa900SAdrien Mazarguil 	},
984771fa900SAdrien Mazarguil 	{
9851d1bc870SNélio Laranjeiro 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
9861d1bc870SNélio Laranjeiro 			       PCI_DEVICE_ID_MELLANOX_CONNECTX4LX)
987771fa900SAdrien Mazarguil 	},
988771fa900SAdrien Mazarguil 	{
9891d1bc870SNélio Laranjeiro 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
9901d1bc870SNélio Laranjeiro 			       PCI_DEVICE_ID_MELLANOX_CONNECTX4LXVF)
991771fa900SAdrien Mazarguil 	},
992771fa900SAdrien Mazarguil 	{
993528a9fbeSYongseok Koh 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
994528a9fbeSYongseok Koh 			       PCI_DEVICE_ID_MELLANOX_CONNECTX5)
995528a9fbeSYongseok Koh 	},
996528a9fbeSYongseok Koh 	{
997528a9fbeSYongseok Koh 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
998528a9fbeSYongseok Koh 			       PCI_DEVICE_ID_MELLANOX_CONNECTX5VF)
999528a9fbeSYongseok Koh 	},
1000528a9fbeSYongseok Koh 	{
1001528a9fbeSYongseok Koh 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
1002528a9fbeSYongseok Koh 			       PCI_DEVICE_ID_MELLANOX_CONNECTX5EX)
1003528a9fbeSYongseok Koh 	},
1004528a9fbeSYongseok Koh 	{
1005528a9fbeSYongseok Koh 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
1006528a9fbeSYongseok Koh 			       PCI_DEVICE_ID_MELLANOX_CONNECTX5EXVF)
1007528a9fbeSYongseok Koh 	},
1008528a9fbeSYongseok Koh 	{
1009771fa900SAdrien Mazarguil 		.vendor_id = 0
1010771fa900SAdrien Mazarguil 	}
1011771fa900SAdrien Mazarguil };
1012771fa900SAdrien Mazarguil 
1013fdf91e0fSJan Blunck static struct rte_pci_driver mlx5_driver = {
10142f3193cfSJan Viktorin 	.driver = {
10152f3193cfSJan Viktorin 		.name = MLX5_DRIVER_NAME
10162f3193cfSJan Viktorin 	},
1017771fa900SAdrien Mazarguil 	.id_table = mlx5_pci_id_map,
1018af424af8SShreyansh Jain 	.probe = mlx5_pci_probe,
10197d7d7ad1SMatan Azrad 	.drv_flags = RTE_PCI_DRV_INTR_LSC | RTE_PCI_DRV_INTR_RMV,
1020771fa900SAdrien Mazarguil };
1021771fa900SAdrien Mazarguil 
1022771fa900SAdrien Mazarguil /**
1023771fa900SAdrien Mazarguil  * Driver initialization routine.
1024771fa900SAdrien Mazarguil  */
1025c830cb29SDavid Marchand RTE_INIT(rte_mlx5_pmd_init);
1026c830cb29SDavid Marchand static void
1027c830cb29SDavid Marchand rte_mlx5_pmd_init(void)
1028771fa900SAdrien Mazarguil {
1029ea16068cSYongseok Koh 	/* Build the static table for ptype conversion. */
1030ea16068cSYongseok Koh 	mlx5_set_ptype_table();
1031771fa900SAdrien Mazarguil 	/*
1032771fa900SAdrien Mazarguil 	 * RDMAV_HUGEPAGES_SAFE tells ibv_fork_init() we intend to use
1033771fa900SAdrien Mazarguil 	 * huge pages. Calling ibv_fork_init() during init allows
1034771fa900SAdrien Mazarguil 	 * applications to use fork() safely for purposes other than
1035771fa900SAdrien Mazarguil 	 * using this PMD, which is not supported in forked processes.
1036771fa900SAdrien Mazarguil 	 */
1037771fa900SAdrien Mazarguil 	setenv("RDMAV_HUGEPAGES_SAFE", "1", 1);
1038161b93e5SYongseok Koh 	/* Match the size of Rx completion entry to the size of a cacheline. */
1039161b93e5SYongseok Koh 	if (RTE_CACHE_LINE_SIZE == 128)
1040161b93e5SYongseok Koh 		setenv("MLX5_CQE_SIZE", "128", 0);
1041771fa900SAdrien Mazarguil 	ibv_fork_init();
10423dcfe039SThomas Monjalon 	rte_pci_register(&mlx5_driver);
1043771fa900SAdrien Mazarguil }
1044771fa900SAdrien Mazarguil 
104501f19227SShreyansh Jain RTE_PMD_EXPORT_NAME(net_mlx5, __COUNTER__);
104601f19227SShreyansh Jain RTE_PMD_REGISTER_PCI_TABLE(net_mlx5, mlx5_pci_id_map);
10470880c401SOlivier Matz RTE_PMD_REGISTER_KMOD_DEP(net_mlx5, "* ib_uverbs & mlx5_core & mlx5_ib");
1048