xref: /dpdk/drivers/net/mlx5/mlx5.c (revision 495b2ed40a39b2bc7c6c146535c511e983ae2b64)
18fd92a66SOlivier Matz /* SPDX-License-Identifier: BSD-3-Clause
2771fa900SAdrien Mazarguil  * Copyright 2015 6WIND S.A.
35feecc57SShahaf Shuler  * Copyright 2015 Mellanox Technologies, Ltd
4771fa900SAdrien Mazarguil  */
5771fa900SAdrien Mazarguil 
6771fa900SAdrien Mazarguil #include <stddef.h>
7771fa900SAdrien Mazarguil #include <unistd.h>
8771fa900SAdrien Mazarguil #include <string.h>
9771fa900SAdrien Mazarguil #include <stdint.h>
10771fa900SAdrien Mazarguil #include <stdlib.h>
11e72dd09bSNélio Laranjeiro #include <errno.h>
12771fa900SAdrien Mazarguil 
13771fa900SAdrien Mazarguil #include <rte_malloc.h>
14ffc905f3SFerruh Yigit #include <rte_ethdev_driver.h>
15fdf91e0fSJan Blunck #include <rte_ethdev_pci.h>
16771fa900SAdrien Mazarguil #include <rte_pci.h>
17c752998bSGaetan Rivet #include <rte_bus_pci.h>
18771fa900SAdrien Mazarguil #include <rte_common.h>
19e72dd09bSNélio Laranjeiro #include <rte_kvargs.h>
20e89c15b6SAdrien Mazarguil #include <rte_rwlock.h>
21e89c15b6SAdrien Mazarguil #include <rte_spinlock.h>
22f38c5457SAdrien Mazarguil #include <rte_string_fns.h>
23f15db67dSMatan Azrad #include <rte_alarm.h>
24771fa900SAdrien Mazarguil 
257b4f1e6bSMatan Azrad #include <mlx5_glue.h>
267b4f1e6bSMatan Azrad #include <mlx5_devx_cmds.h>
2793e30982SMatan Azrad #include <mlx5_common.h>
28391b8bccSOphir Munk #include <mlx5_common_os.h>
29a4de9586SVu Pham #include <mlx5_common_mp.h>
30392bf908SParav Pandit #include <mlx5_common_pci.h>
3183c2047cSSuanming Mou #include <mlx5_malloc.h>
327b4f1e6bSMatan Azrad 
337b4f1e6bSMatan Azrad #include "mlx5_defs.h"
34771fa900SAdrien Mazarguil #include "mlx5.h"
35771fa900SAdrien Mazarguil #include "mlx5_utils.h"
362e22920bSAdrien Mazarguil #include "mlx5_rxtx.h"
37771fa900SAdrien Mazarguil #include "mlx5_autoconf.h"
38974f1e7eSYongseok Koh #include "mlx5_mr.h"
3984c406e7SOri Kam #include "mlx5_flow.h"
40efa79e68SOri Kam #include "rte_pmd_mlx5.h"
41771fa900SAdrien Mazarguil 
/* Device parameter: turn on compression of the Rx completion queue. */
#define MLX5_RXQ_CQE_COMP_EN "rxq_cqe_comp_en"

/* Device parameter: pad Rx completion entries to 128B. */
#define MLX5_RXQ_CQE_PAD_EN "rxq_cqe_pad_en"

/* Device parameter: pad Rx packets to the cacheline size. */
#define MLX5_RXQ_PKT_PAD_EN "rxq_pkt_pad_en"

/* Device parameter: enable the Multi-Packet Rx queue (MPRQ). */
#define MLX5_RX_MPRQ_EN "mprq_en"

/* Device parameter: log 2 of the number of strides used for MPRQ. */
#define MLX5_RX_MPRQ_LOG_STRIDE_NUM "mprq_log_stride_num"

/* Device parameter: log 2 of the stride size used for MPRQ. */
#define MLX5_RX_MPRQ_LOG_STRIDE_SIZE "mprq_log_stride_size"

/* Device parameter: size limit of a memcpy'd packet for MPRQ. */
#define MLX5_RX_MPRQ_MAX_MEMCPY_LEN "mprq_max_memcpy_len"

/* Device parameter: minimum number of Rx queues needed to enable MPRQ. */
#define MLX5_RXQS_MIN_MPRQ "rxqs_min_mprq"

/* Device parameter: inline send configuration. Deprecated, ignored. */
#define MLX5_TXQ_INLINE "txq_inline"

/* Device parameter: packet size limit for inlining with ordinary SEND. */
#define MLX5_TXQ_INLINE_MAX "txq_inline_max"

/* Device parameter: minimal data size to inline. */
#define MLX5_TXQ_INLINE_MIN "txq_inline_min"

/* Device parameter: packet size limit for inlining with Enhanced MPW. */
#define MLX5_TXQ_INLINE_MPW "txq_inline_mpw"

/*
 * Device parameter: threshold on the number of Tx queues for
 * enabling inline send.
 */
#define MLX5_TXQS_MIN_INLINE "txqs_min_inline"

/*
 * Device parameter: threshold on the number of Tx queues for enabling
 * vectorized Tx. Deprecated, ignored (there are no vectorized Tx routines).
 */
#define MLX5_TXQS_MAX_VEC "txqs_max_vec"

/* Device parameter: enable multi-packet send WQEs. */
#define MLX5_TXQ_MPW_EN "txq_mpw_en"

/*
 * Device parameter: force the doorbell register mapping to a non-cached
 * region, which eliminates the extra write memory barrier.
 */
#define MLX5_TX_DB_NC "tx_db_nc"

/*
 * Device parameter: include 2 dsegs in the title WQEBB.
 * Deprecated, ignored.
 */
#define MLX5_TXQ_MPW_HDR_DSEG_EN "txq_mpw_hdr_dseg_en"

/*
 * Device parameter: size limit of an inlined packet.
 * Deprecated, ignored.
 */
#define MLX5_TXQ_MAX_INLINE_LEN "txq_max_inline_len"

/*
 * Device parameter: enable Tx scheduling on timestamps and give the
 * packet pacing granularity in nanoseconds.
 */
#define MLX5_TX_PP "tx_pp"

/*
 * Device parameter: skew in nanoseconds on the Tx datapath, i.e. the time
 * between the SQ starting to process a WQE and the actual packet data
 * appearing on the wire.
 */
#define MLX5_TX_SKEW "tx_skew"

/*
 * Device parameter: enable hardware Tx vector.
 * Deprecated, ignored (there are no vectorized Tx routines anymore).
 */
#define MLX5_TX_VEC_EN "tx_vec_en"

/* Device parameter: enable hardware Rx vector. */
#define MLX5_RX_VEC_EN "rx_vec_en"

/* Device parameter: allow L3 VXLAN flow creation. */
#define MLX5_L3_VXLAN_EN "l3_vxlan_en"

/* Device parameter: activate DV E-Switch flow steering. */
#define MLX5_DV_ESW_EN "dv_esw_en"

/* Device parameter: activate DV flow steering. */
#define MLX5_DV_FLOW_EN "dv_flow_en"

/* Device parameter: enable extensive flow metadata support. */
#define MLX5_DV_XMETA_EN "dv_xmeta_en"

/* Device parameter: let the user manage the LACP traffic of a bonded device. */
#define MLX5_LACP_BY_USER "lacp_by_user"

/* Device parameter: activate Netlink support in VF mode. */
#define MLX5_VF_NL_EN "vf_nl_en"

/* Device parameter: enable extending memsegs when a MR is created. */
#define MLX5_MR_EXT_MEMSEG_EN "mr_ext_memseg_en"

/* Device parameter: select the port representors to instantiate. */
#define MLX5_REPRESENTOR "representor"

/* Device parameter: maximum number of dump files per queue. */
#define MLX5_MAX_DUMP_FILES_NUM "max_dump_files_num"

/* Device parameter: timeout of an LRO session (in microseconds). */
#define MLX5_LRO_TIMEOUT_USEC "lro_timeout_usec"

/*
 * Device parameter: total data buffer size of a single hairpin queue
 * (logarithm value).
 */
#define MLX5_HP_BUF_SIZE "hp_buf_log_sz"

/* Device parameter: flow memory reclaim mode. */
#define MLX5_RECLAIM_MEM "reclaim_mem_mode"

/* Device parameter: the default memory allocator used in the PMD. */
#define MLX5_SYS_MEM_EN "sys_mem_en"

/* Device parameter: whether decap will be used or not. */
#define MLX5_DECAP_EN "decap_en"
1765522da6bSSuanming Mou 
/* Memory shared between the primary process and the secondary processes. */
struct mlx5_shared_data *mlx5_shared_data;

/** Log type of the driver-specific log messages. */
int mlx5_logtype;

/*
 * List of mlx5_dev_ctx_shared objects and its companion mutex.
 * NOTE(review): the mutex presumably serializes access to the list;
 * the users are outside this part of the file - confirm.
 */
static pthread_mutex_t mlx5_dev_ctx_list_mutex = PTHREAD_MUTEX_INITIALIZER;
static LIST_HEAD(, mlx5_dev_ctx_shared) mlx5_dev_ctx_list =
	LIST_HEAD_INITIALIZER(mlx5_dev_ctx_list);
18617e19bc4SViacheslav Ovsiienko 
1875c761238SGregory Etelson static const struct mlx5_indexed_pool_config mlx5_ipool_cfg[] = {
188b88341caSSuanming Mou #ifdef HAVE_IBV_FLOW_DV_SUPPORT
1899cac7dedSGregory Etelson 	[MLX5_IPOOL_DECAP_ENCAP] = {
190014d1cbeSSuanming Mou 		.size = sizeof(struct mlx5_flow_dv_encap_decap_resource),
191014d1cbeSSuanming Mou 		.trunk_size = 64,
192014d1cbeSSuanming Mou 		.grow_trunk = 3,
193014d1cbeSSuanming Mou 		.grow_shift = 2,
1942f3dc1f4SSuanming Mou 		.need_lock = 1,
195014d1cbeSSuanming Mou 		.release_mem_en = 1,
19683c2047cSSuanming Mou 		.malloc = mlx5_malloc,
19783c2047cSSuanming Mou 		.free = mlx5_free,
198014d1cbeSSuanming Mou 		.type = "mlx5_encap_decap_ipool",
199014d1cbeSSuanming Mou 	},
2009cac7dedSGregory Etelson 	[MLX5_IPOOL_PUSH_VLAN] = {
2018acf8ac9SSuanming Mou 		.size = sizeof(struct mlx5_flow_dv_push_vlan_action_resource),
2028acf8ac9SSuanming Mou 		.trunk_size = 64,
2038acf8ac9SSuanming Mou 		.grow_trunk = 3,
2048acf8ac9SSuanming Mou 		.grow_shift = 2,
2052f3dc1f4SSuanming Mou 		.need_lock = 1,
2068acf8ac9SSuanming Mou 		.release_mem_en = 1,
20783c2047cSSuanming Mou 		.malloc = mlx5_malloc,
20883c2047cSSuanming Mou 		.free = mlx5_free,
2098acf8ac9SSuanming Mou 		.type = "mlx5_push_vlan_ipool",
2108acf8ac9SSuanming Mou 	},
2119cac7dedSGregory Etelson 	[MLX5_IPOOL_TAG] = {
2125f114269SSuanming Mou 		.size = sizeof(struct mlx5_flow_dv_tag_resource),
2135f114269SSuanming Mou 		.trunk_size = 64,
2145f114269SSuanming Mou 		.grow_trunk = 3,
2155f114269SSuanming Mou 		.grow_shift = 2,
2162f3dc1f4SSuanming Mou 		.need_lock = 1,
2175f114269SSuanming Mou 		.release_mem_en = 1,
21883c2047cSSuanming Mou 		.malloc = mlx5_malloc,
21983c2047cSSuanming Mou 		.free = mlx5_free,
2205f114269SSuanming Mou 		.type = "mlx5_tag_ipool",
2215f114269SSuanming Mou 	},
2229cac7dedSGregory Etelson 	[MLX5_IPOOL_PORT_ID] = {
223f3faf9eaSSuanming Mou 		.size = sizeof(struct mlx5_flow_dv_port_id_action_resource),
224f3faf9eaSSuanming Mou 		.trunk_size = 64,
225f3faf9eaSSuanming Mou 		.grow_trunk = 3,
226f3faf9eaSSuanming Mou 		.grow_shift = 2,
2272f3dc1f4SSuanming Mou 		.need_lock = 1,
228f3faf9eaSSuanming Mou 		.release_mem_en = 1,
22983c2047cSSuanming Mou 		.malloc = mlx5_malloc,
23083c2047cSSuanming Mou 		.free = mlx5_free,
231f3faf9eaSSuanming Mou 		.type = "mlx5_port_id_ipool",
232f3faf9eaSSuanming Mou 	},
2339cac7dedSGregory Etelson 	[MLX5_IPOOL_JUMP] = {
2347ac99475SSuanming Mou 		.size = sizeof(struct mlx5_flow_tbl_data_entry),
2357ac99475SSuanming Mou 		.trunk_size = 64,
2367ac99475SSuanming Mou 		.grow_trunk = 3,
2377ac99475SSuanming Mou 		.grow_shift = 2,
2382f3dc1f4SSuanming Mou 		.need_lock = 1,
2397ac99475SSuanming Mou 		.release_mem_en = 1,
24083c2047cSSuanming Mou 		.malloc = mlx5_malloc,
24183c2047cSSuanming Mou 		.free = mlx5_free,
2427ac99475SSuanming Mou 		.type = "mlx5_jump_ipool",
2437ac99475SSuanming Mou 	},
2449cac7dedSGregory Etelson 	[MLX5_IPOOL_SAMPLE] = {
245b4c0ddbfSJiawei Wang 		.size = sizeof(struct mlx5_flow_dv_sample_resource),
246b4c0ddbfSJiawei Wang 		.trunk_size = 64,
247b4c0ddbfSJiawei Wang 		.grow_trunk = 3,
248b4c0ddbfSJiawei Wang 		.grow_shift = 2,
2492f3dc1f4SSuanming Mou 		.need_lock = 1,
250b4c0ddbfSJiawei Wang 		.release_mem_en = 1,
251b4c0ddbfSJiawei Wang 		.malloc = mlx5_malloc,
252b4c0ddbfSJiawei Wang 		.free = mlx5_free,
253b4c0ddbfSJiawei Wang 		.type = "mlx5_sample_ipool",
254b4c0ddbfSJiawei Wang 	},
2559cac7dedSGregory Etelson 	[MLX5_IPOOL_DEST_ARRAY] = {
25600c10c22SJiawei Wang 		.size = sizeof(struct mlx5_flow_dv_dest_array_resource),
25700c10c22SJiawei Wang 		.trunk_size = 64,
25800c10c22SJiawei Wang 		.grow_trunk = 3,
25900c10c22SJiawei Wang 		.grow_shift = 2,
2602f3dc1f4SSuanming Mou 		.need_lock = 1,
26100c10c22SJiawei Wang 		.release_mem_en = 1,
26200c10c22SJiawei Wang 		.malloc = mlx5_malloc,
26300c10c22SJiawei Wang 		.free = mlx5_free,
26400c10c22SJiawei Wang 		.type = "mlx5_dest_array_ipool",
26500c10c22SJiawei Wang 	},
2669cac7dedSGregory Etelson 	[MLX5_IPOOL_TUNNEL_ID] = {
2679cac7dedSGregory Etelson 		.size = sizeof(struct mlx5_flow_tunnel),
268*495b2ed4SSuanming Mou 		.trunk_size = MLX5_MAX_TUNNELS,
2699cac7dedSGregory Etelson 		.need_lock = 1,
2709cac7dedSGregory Etelson 		.release_mem_en = 1,
2719cac7dedSGregory Etelson 		.type = "mlx5_tunnel_offload",
2729cac7dedSGregory Etelson 	},
2739cac7dedSGregory Etelson 	[MLX5_IPOOL_TNL_TBL_ID] = {
2749cac7dedSGregory Etelson 		.size = 0,
2759cac7dedSGregory Etelson 		.need_lock = 1,
2769cac7dedSGregory Etelson 		.type = "mlx5_flow_tnl_tbl_ipool",
2779cac7dedSGregory Etelson 	},
278b88341caSSuanming Mou #endif
2799cac7dedSGregory Etelson 	[MLX5_IPOOL_MTR] = {
2808638e2b0SSuanming Mou 		.size = sizeof(struct mlx5_flow_meter),
2818638e2b0SSuanming Mou 		.trunk_size = 64,
2828638e2b0SSuanming Mou 		.grow_trunk = 3,
2838638e2b0SSuanming Mou 		.grow_shift = 2,
2842f3dc1f4SSuanming Mou 		.need_lock = 1,
2858638e2b0SSuanming Mou 		.release_mem_en = 1,
28683c2047cSSuanming Mou 		.malloc = mlx5_malloc,
28783c2047cSSuanming Mou 		.free = mlx5_free,
2888638e2b0SSuanming Mou 		.type = "mlx5_meter_ipool",
2898638e2b0SSuanming Mou 	},
2909cac7dedSGregory Etelson 	[MLX5_IPOOL_MCP] = {
29190e6053aSSuanming Mou 		.size = sizeof(struct mlx5_flow_mreg_copy_resource),
29290e6053aSSuanming Mou 		.trunk_size = 64,
29390e6053aSSuanming Mou 		.grow_trunk = 3,
29490e6053aSSuanming Mou 		.grow_shift = 2,
2952f3dc1f4SSuanming Mou 		.need_lock = 1,
29690e6053aSSuanming Mou 		.release_mem_en = 1,
29783c2047cSSuanming Mou 		.malloc = mlx5_malloc,
29883c2047cSSuanming Mou 		.free = mlx5_free,
29990e6053aSSuanming Mou 		.type = "mlx5_mcp_ipool",
30090e6053aSSuanming Mou 	},
3019cac7dedSGregory Etelson 	[MLX5_IPOOL_HRXQ] = {
302772dc0ebSSuanming Mou 		.size = (sizeof(struct mlx5_hrxq) + MLX5_RSS_HASH_KEY_LEN),
303772dc0ebSSuanming Mou 		.trunk_size = 64,
304772dc0ebSSuanming Mou 		.grow_trunk = 3,
305772dc0ebSSuanming Mou 		.grow_shift = 2,
3062f3dc1f4SSuanming Mou 		.need_lock = 1,
307772dc0ebSSuanming Mou 		.release_mem_en = 1,
30883c2047cSSuanming Mou 		.malloc = mlx5_malloc,
30983c2047cSSuanming Mou 		.free = mlx5_free,
310772dc0ebSSuanming Mou 		.type = "mlx5_hrxq_ipool",
311772dc0ebSSuanming Mou 	},
3129cac7dedSGregory Etelson 	[MLX5_IPOOL_MLX5_FLOW] = {
3135c761238SGregory Etelson 		/*
3145c761238SGregory Etelson 		 * MLX5_IPOOL_MLX5_FLOW size varies for DV and VERBS flows.
3155c761238SGregory Etelson 		 * It set in run time according to PCI function configuration.
3165c761238SGregory Etelson 		 */
3175c761238SGregory Etelson 		.size = 0,
318b88341caSSuanming Mou 		.trunk_size = 64,
319b88341caSSuanming Mou 		.grow_trunk = 3,
320b88341caSSuanming Mou 		.grow_shift = 2,
3212f3dc1f4SSuanming Mou 		.need_lock = 1,
322b88341caSSuanming Mou 		.release_mem_en = 1,
32383c2047cSSuanming Mou 		.malloc = mlx5_malloc,
32483c2047cSSuanming Mou 		.free = mlx5_free,
325b88341caSSuanming Mou 		.type = "mlx5_flow_handle_ipool",
326b88341caSSuanming Mou 	},
3279cac7dedSGregory Etelson 	[MLX5_IPOOL_RTE_FLOW] = {
328ab612adcSSuanming Mou 		.size = sizeof(struct rte_flow),
329ab612adcSSuanming Mou 		.trunk_size = 4096,
330ab612adcSSuanming Mou 		.need_lock = 1,
331ab612adcSSuanming Mou 		.release_mem_en = 1,
33283c2047cSSuanming Mou 		.malloc = mlx5_malloc,
33383c2047cSSuanming Mou 		.free = mlx5_free,
334ab612adcSSuanming Mou 		.type = "rte_flow_ipool",
335ab612adcSSuanming Mou 	},
3369cac7dedSGregory Etelson 	[MLX5_IPOOL_RSS_EXPANTION_FLOW_ID] = {
3374ae8825cSXueming Li 		.size = 0,
3384ae8825cSXueming Li 		.need_lock = 1,
3394ae8825cSXueming Li 		.type = "mlx5_flow_rss_id_ipool",
3404ae8825cSXueming Li 	},
3419cac7dedSGregory Etelson 	[MLX5_IPOOL_RSS_SHARED_ACTIONS] = {
3424a42ac1fSMatan Azrad 		.size = sizeof(struct mlx5_shared_action_rss),
3434a42ac1fSMatan Azrad 		.trunk_size = 64,
3444a42ac1fSMatan Azrad 		.grow_trunk = 3,
3454a42ac1fSMatan Azrad 		.grow_shift = 2,
3464a42ac1fSMatan Azrad 		.need_lock = 1,
3474a42ac1fSMatan Azrad 		.release_mem_en = 1,
3484a42ac1fSMatan Azrad 		.malloc = mlx5_malloc,
3494a42ac1fSMatan Azrad 		.free = mlx5_free,
3504a42ac1fSMatan Azrad 		.type = "mlx5_shared_action_rss",
3514a42ac1fSMatan Azrad 	},
352014d1cbeSSuanming Mou };
353014d1cbeSSuanming Mou 
354014d1cbeSSuanming Mou 
/*
 * Sizing constants for the flow ID pool.
 * NOTE(review): their users are outside this part of the file; the meaning
 * is inferred from the names only - confirm.
 */
#define MLX5_FLOW_MIN_ID_POOL_SIZE 512
#define MLX5_ID_GENERATION_ARRAY_FACTOR 16

/* Array size of the flow table hash list, judging by the name (TODO confirm). */
#define MLX5_FLOW_TABLE_HLIST_ARRAY_SIZE 4096
359860897d2SBing Zhao 
360830d2091SOri Kam /**
361f935ed4bSDekel Peled  * Initialize the ASO aging management structure.
362f935ed4bSDekel Peled  *
363f935ed4bSDekel Peled  * @param[in] sh
364f935ed4bSDekel Peled  *   Pointer to mlx5_dev_ctx_shared object to free
365f935ed4bSDekel Peled  *
366f935ed4bSDekel Peled  * @return
367f935ed4bSDekel Peled  *   0 on success, a negative errno value otherwise and rte_errno is set.
368f935ed4bSDekel Peled  */
369f935ed4bSDekel Peled int
370f935ed4bSDekel Peled mlx5_flow_aso_age_mng_init(struct mlx5_dev_ctx_shared *sh)
371f935ed4bSDekel Peled {
372f935ed4bSDekel Peled 	int err;
373f935ed4bSDekel Peled 
374f935ed4bSDekel Peled 	if (sh->aso_age_mng)
375f935ed4bSDekel Peled 		return 0;
376f935ed4bSDekel Peled 	sh->aso_age_mng = mlx5_malloc(MLX5_MEM_ZERO, sizeof(*sh->aso_age_mng),
377f935ed4bSDekel Peled 				      RTE_CACHE_LINE_SIZE, SOCKET_ID_ANY);
378f935ed4bSDekel Peled 	if (!sh->aso_age_mng) {
379f935ed4bSDekel Peled 		DRV_LOG(ERR, "aso_age_mng allocation was failed.");
380f935ed4bSDekel Peled 		rte_errno = ENOMEM;
381f935ed4bSDekel Peled 		return -ENOMEM;
382f935ed4bSDekel Peled 	}
383f935ed4bSDekel Peled 	err = mlx5_aso_queue_init(sh);
384f935ed4bSDekel Peled 	if (err) {
385f935ed4bSDekel Peled 		mlx5_free(sh->aso_age_mng);
386f935ed4bSDekel Peled 		return -1;
387f935ed4bSDekel Peled 	}
388f935ed4bSDekel Peled 	rte_spinlock_init(&sh->aso_age_mng->resize_sl);
389f935ed4bSDekel Peled 	rte_spinlock_init(&sh->aso_age_mng->free_sl);
390f935ed4bSDekel Peled 	LIST_INIT(&sh->aso_age_mng->free);
391f935ed4bSDekel Peled 	return 0;
392f935ed4bSDekel Peled }
393f935ed4bSDekel Peled 
394f935ed4bSDekel Peled /**
395f935ed4bSDekel Peled  * Close and release all the resources of the ASO aging management structure.
396f935ed4bSDekel Peled  *
397f935ed4bSDekel Peled  * @param[in] sh
398f935ed4bSDekel Peled  *   Pointer to mlx5_dev_ctx_shared object to free.
399f935ed4bSDekel Peled  */
400f935ed4bSDekel Peled static void
401f935ed4bSDekel Peled mlx5_flow_aso_age_mng_close(struct mlx5_dev_ctx_shared *sh)
402f935ed4bSDekel Peled {
403f935ed4bSDekel Peled 	int i, j;
404f935ed4bSDekel Peled 
405f935ed4bSDekel Peled 	mlx5_aso_queue_stop(sh);
406f935ed4bSDekel Peled 	mlx5_aso_queue_uninit(sh);
407f935ed4bSDekel Peled 	if (sh->aso_age_mng->pools) {
408f935ed4bSDekel Peled 		struct mlx5_aso_age_pool *pool;
409f935ed4bSDekel Peled 
410f935ed4bSDekel Peled 		for (i = 0; i < sh->aso_age_mng->next; ++i) {
411f935ed4bSDekel Peled 			pool = sh->aso_age_mng->pools[i];
412f935ed4bSDekel Peled 			claim_zero(mlx5_devx_cmd_destroy
413f935ed4bSDekel Peled 						(pool->flow_hit_aso_obj));
414f935ed4bSDekel Peled 			for (j = 0; j < MLX5_COUNTERS_PER_POOL; ++j)
415f935ed4bSDekel Peled 				if (pool->actions[j].dr_action)
416f935ed4bSDekel Peled 					claim_zero
417f935ed4bSDekel Peled 						(mlx5_glue->destroy_flow_action
418f935ed4bSDekel Peled 						  (pool->actions[j].dr_action));
419f935ed4bSDekel Peled 			mlx5_free(pool);
420f935ed4bSDekel Peled 		}
421f935ed4bSDekel Peled 		mlx5_free(sh->aso_age_mng->pools);
422f935ed4bSDekel Peled 	}
4237ad0b6d9SDekel Peled 	mlx5_free(sh->aso_age_mng);
424f935ed4bSDekel Peled }
425f935ed4bSDekel Peled 
426f935ed4bSDekel Peled /**
427fa2d01c8SDong Zhou  * Initialize the shared aging list information per port.
428fa2d01c8SDong Zhou  *
429fa2d01c8SDong Zhou  * @param[in] sh
4306e88bc42SOphir Munk  *   Pointer to mlx5_dev_ctx_shared object.
431fa2d01c8SDong Zhou  */
432fa2d01c8SDong Zhou static void
4336e88bc42SOphir Munk mlx5_flow_aging_init(struct mlx5_dev_ctx_shared *sh)
434fa2d01c8SDong Zhou {
435fa2d01c8SDong Zhou 	uint32_t i;
436fa2d01c8SDong Zhou 	struct mlx5_age_info *age_info;
437fa2d01c8SDong Zhou 
438fa2d01c8SDong Zhou 	for (i = 0; i < sh->max_port; i++) {
439fa2d01c8SDong Zhou 		age_info = &sh->port[i].age_info;
440fa2d01c8SDong Zhou 		age_info->flags = 0;
441fa2d01c8SDong Zhou 		TAILQ_INIT(&age_info->aged_counters);
442f9bc5274SMatan Azrad 		LIST_INIT(&age_info->aged_aso);
443fa2d01c8SDong Zhou 		rte_spinlock_init(&age_info->aged_sl);
444fa2d01c8SDong Zhou 		MLX5_AGE_SET(age_info, MLX5_AGE_TRIGGER);
445fa2d01c8SDong Zhou 	}
446fa2d01c8SDong Zhou }
447fa2d01c8SDong Zhou 
448fa2d01c8SDong Zhou /**
4495382d28cSMatan Azrad  * Initialize the counters management structure.
4505382d28cSMatan Azrad  *
4515382d28cSMatan Azrad  * @param[in] sh
4526e88bc42SOphir Munk  *   Pointer to mlx5_dev_ctx_shared object to free
4535382d28cSMatan Azrad  */
4545382d28cSMatan Azrad static void
4556e88bc42SOphir Munk mlx5_flow_counters_mng_init(struct mlx5_dev_ctx_shared *sh)
4565382d28cSMatan Azrad {
457994829e6SSuanming Mou 	int i;
4585382d28cSMatan Azrad 
4595af61440SMatan Azrad 	memset(&sh->cmng, 0, sizeof(sh->cmng));
4605382d28cSMatan Azrad 	TAILQ_INIT(&sh->cmng.flow_counters);
461994829e6SSuanming Mou 	sh->cmng.min_id = MLX5_CNT_BATCH_OFFSET;
462994829e6SSuanming Mou 	sh->cmng.max_id = -1;
463994829e6SSuanming Mou 	sh->cmng.last_pool_idx = POOL_IDX_INVALID;
4643aa27915SSuanming Mou 	rte_spinlock_init(&sh->cmng.pool_update_sl);
465994829e6SSuanming Mou 	for (i = 0; i < MLX5_COUNTER_TYPE_MAX; i++) {
466994829e6SSuanming Mou 		TAILQ_INIT(&sh->cmng.counters[i]);
467994829e6SSuanming Mou 		rte_spinlock_init(&sh->cmng.csl[i]);
468fa2d01c8SDong Zhou 	}
4695382d28cSMatan Azrad }
4705382d28cSMatan Azrad 
4715382d28cSMatan Azrad /**
4725382d28cSMatan Azrad  * Destroy all the resources allocated for a counter memory management.
4735382d28cSMatan Azrad  *
4745382d28cSMatan Azrad  * @param[in] mng
4755382d28cSMatan Azrad  *   Pointer to the memory management structure.
4765382d28cSMatan Azrad  */
4775382d28cSMatan Azrad static void
4785382d28cSMatan Azrad mlx5_flow_destroy_counter_stat_mem_mng(struct mlx5_counter_stats_mem_mng *mng)
4795382d28cSMatan Azrad {
4805382d28cSMatan Azrad 	uint8_t *mem = (uint8_t *)(uintptr_t)mng->raws[0].data;
4815382d28cSMatan Azrad 
4825382d28cSMatan Azrad 	LIST_REMOVE(mng, next);
4835382d28cSMatan Azrad 	claim_zero(mlx5_devx_cmd_destroy(mng->dm));
4845382d28cSMatan Azrad 	claim_zero(mlx5_glue->devx_umem_dereg(mng->umem));
48583c2047cSSuanming Mou 	mlx5_free(mem);
4865382d28cSMatan Azrad }
4875382d28cSMatan Azrad 
4885382d28cSMatan Azrad /**
4895382d28cSMatan Azrad  * Close and release all the resources of the counters management.
4905382d28cSMatan Azrad  *
4915382d28cSMatan Azrad  * @param[in] sh
4926e88bc42SOphir Munk  *   Pointer to mlx5_dev_ctx_shared object to free.
4935382d28cSMatan Azrad  */
4945382d28cSMatan Azrad static void
4956e88bc42SOphir Munk mlx5_flow_counters_mng_close(struct mlx5_dev_ctx_shared *sh)
4965382d28cSMatan Azrad {
4975382d28cSMatan Azrad 	struct mlx5_counter_stats_mem_mng *mng;
4983aa27915SSuanming Mou 	int i, j;
499f15db67dSMatan Azrad 	int retries = 1024;
5005382d28cSMatan Azrad 
501f15db67dSMatan Azrad 	rte_errno = 0;
502f15db67dSMatan Azrad 	while (--retries) {
503f15db67dSMatan Azrad 		rte_eal_alarm_cancel(mlx5_flow_query_alarm, sh);
504f15db67dSMatan Azrad 		if (rte_errno != EINPROGRESS)
505f15db67dSMatan Azrad 			break;
506f15db67dSMatan Azrad 		rte_pause();
507f15db67dSMatan Azrad 	}
5085382d28cSMatan Azrad 
509994829e6SSuanming Mou 	if (sh->cmng.pools) {
510994829e6SSuanming Mou 		struct mlx5_flow_counter_pool *pool;
5113aa27915SSuanming Mou 		uint16_t n_valid = sh->cmng.n_valid;
5122b5b1aebSSuanming Mou 		bool fallback = sh->cmng.counter_fallback;
513994829e6SSuanming Mou 
5143aa27915SSuanming Mou 		for (i = 0; i < n_valid; ++i) {
5153aa27915SSuanming Mou 			pool = sh->cmng.pools[i];
5162b5b1aebSSuanming Mou 			if (!fallback && pool->min_dcs)
5175af61440SMatan Azrad 				claim_zero(mlx5_devx_cmd_destroy
518fa2d01c8SDong Zhou 							       (pool->min_dcs));
5195382d28cSMatan Azrad 			for (j = 0; j < MLX5_COUNTERS_PER_POOL; ++j) {
5202b5b1aebSSuanming Mou 				struct mlx5_flow_counter *cnt =
5212b5b1aebSSuanming Mou 						MLX5_POOL_GET_CNT(pool, j);
5222b5b1aebSSuanming Mou 
5232b5b1aebSSuanming Mou 				if (cnt->action)
5245382d28cSMatan Azrad 					claim_zero
5255382d28cSMatan Azrad 					 (mlx5_glue->destroy_flow_action
5262b5b1aebSSuanming Mou 					  (cnt->action));
5272b5b1aebSSuanming Mou 				if (fallback && MLX5_POOL_GET_CNT
5282b5b1aebSSuanming Mou 				    (pool, j)->dcs_when_free)
5295382d28cSMatan Azrad 					claim_zero(mlx5_devx_cmd_destroy
5302b5b1aebSSuanming Mou 						   (cnt->dcs_when_free));
5315382d28cSMatan Azrad 			}
53283c2047cSSuanming Mou 			mlx5_free(pool);
5335382d28cSMatan Azrad 		}
534994829e6SSuanming Mou 		mlx5_free(sh->cmng.pools);
5355382d28cSMatan Azrad 	}
5365382d28cSMatan Azrad 	mng = LIST_FIRST(&sh->cmng.mem_mngs);
5375382d28cSMatan Azrad 	while (mng) {
5385382d28cSMatan Azrad 		mlx5_flow_destroy_counter_stat_mem_mng(mng);
5395382d28cSMatan Azrad 		mng = LIST_FIRST(&sh->cmng.mem_mngs);
5405382d28cSMatan Azrad 	}
5415382d28cSMatan Azrad 	memset(&sh->cmng, 0, sizeof(sh->cmng));
5425382d28cSMatan Azrad }
5435382d28cSMatan Azrad 
544f935ed4bSDekel Peled /* Send FLOW_AGED event if needed. */
545f935ed4bSDekel Peled void
546f935ed4bSDekel Peled mlx5_age_event_prepare(struct mlx5_dev_ctx_shared *sh)
547f935ed4bSDekel Peled {
548f935ed4bSDekel Peled 	struct mlx5_age_info *age_info;
549f935ed4bSDekel Peled 	uint32_t i;
550f935ed4bSDekel Peled 
551f935ed4bSDekel Peled 	for (i = 0; i < sh->max_port; i++) {
552f935ed4bSDekel Peled 		age_info = &sh->port[i].age_info;
553f935ed4bSDekel Peled 		if (!MLX5_AGE_GET(age_info, MLX5_AGE_EVENT_NEW))
554f935ed4bSDekel Peled 			continue;
555f935ed4bSDekel Peled 		if (MLX5_AGE_GET(age_info, MLX5_AGE_TRIGGER))
556f935ed4bSDekel Peled 			rte_eth_dev_callback_process
557f935ed4bSDekel Peled 				(&rte_eth_devices[sh->port[i].devx_ih_port_id],
558f935ed4bSDekel Peled 				RTE_ETH_EVENT_FLOW_AGED, NULL);
559f935ed4bSDekel Peled 		age_info->flags = 0;
560f935ed4bSDekel Peled 	}
561f935ed4bSDekel Peled }
562f935ed4bSDekel Peled 
5635382d28cSMatan Azrad /**
564014d1cbeSSuanming Mou  * Initialize the flow resources' indexed mempool.
565014d1cbeSSuanming Mou  *
566014d1cbeSSuanming Mou  * @param[in] sh
5676e88bc42SOphir Munk  *   Pointer to mlx5_dev_ctx_shared object.
568b88341caSSuanming Mou  * @param[in] sh
569b88341caSSuanming Mou  *   Pointer to user dev config.
570014d1cbeSSuanming Mou  */
571014d1cbeSSuanming Mou static void
5726e88bc42SOphir Munk mlx5_flow_ipool_create(struct mlx5_dev_ctx_shared *sh,
5735c761238SGregory Etelson 		       const struct mlx5_dev_config *config)
574014d1cbeSSuanming Mou {
575014d1cbeSSuanming Mou 	uint8_t i;
5765c761238SGregory Etelson 	struct mlx5_indexed_pool_config cfg;
577014d1cbeSSuanming Mou 
578a1da6f62SSuanming Mou 	for (i = 0; i < MLX5_IPOOL_MAX; ++i) {
5795c761238SGregory Etelson 		cfg = mlx5_ipool_cfg[i];
5805c761238SGregory Etelson 		switch (i) {
5815c761238SGregory Etelson 		default:
5825c761238SGregory Etelson 			break;
5835c761238SGregory Etelson 		/*
5845c761238SGregory Etelson 		 * Set MLX5_IPOOL_MLX5_FLOW ipool size
5855c761238SGregory Etelson 		 * according to PCI function flow configuration.
5865c761238SGregory Etelson 		 */
5875c761238SGregory Etelson 		case MLX5_IPOOL_MLX5_FLOW:
5885c761238SGregory Etelson 			cfg.size = config->dv_flow_en ?
5895c761238SGregory Etelson 				sizeof(struct mlx5_flow_handle) :
5905c761238SGregory Etelson 				MLX5_FLOW_HANDLE_VERBS_SIZE;
5915c761238SGregory Etelson 			break;
5925c761238SGregory Etelson 		}
593a1da6f62SSuanming Mou 		if (config->reclaim_mode)
5945c761238SGregory Etelson 			cfg.release_mem_en = 1;
5955c761238SGregory Etelson 		sh->ipool[i] = mlx5_ipool_create(&cfg);
596014d1cbeSSuanming Mou 	}
597a1da6f62SSuanming Mou }
598014d1cbeSSuanming Mou 
599014d1cbeSSuanming Mou /**
600014d1cbeSSuanming Mou  * Release the flow resources' indexed mempool.
601014d1cbeSSuanming Mou  *
602014d1cbeSSuanming Mou  * @param[in] sh
6036e88bc42SOphir Munk  *   Pointer to mlx5_dev_ctx_shared object.
604014d1cbeSSuanming Mou  */
605014d1cbeSSuanming Mou static void
6066e88bc42SOphir Munk mlx5_flow_ipool_destroy(struct mlx5_dev_ctx_shared *sh)
607014d1cbeSSuanming Mou {
608014d1cbeSSuanming Mou 	uint8_t i;
609014d1cbeSSuanming Mou 
610014d1cbeSSuanming Mou 	for (i = 0; i < MLX5_IPOOL_MAX; ++i)
611014d1cbeSSuanming Mou 		mlx5_ipool_destroy(sh->ipool[i]);
612014d1cbeSSuanming Mou }
613014d1cbeSSuanming Mou 
614daa38a89SBing Zhao /*
615daa38a89SBing Zhao  * Check if dynamic flex parser for eCPRI already exists.
616daa38a89SBing Zhao  *
617daa38a89SBing Zhao  * @param dev
618daa38a89SBing Zhao  *   Pointer to Ethernet device structure.
619daa38a89SBing Zhao  *
620daa38a89SBing Zhao  * @return
621daa38a89SBing Zhao  *   true on exists, false on not.
622daa38a89SBing Zhao  */
623daa38a89SBing Zhao bool
624daa38a89SBing Zhao mlx5_flex_parser_ecpri_exist(struct rte_eth_dev *dev)
625daa38a89SBing Zhao {
626daa38a89SBing Zhao 	struct mlx5_priv *priv = dev->data->dev_private;
627daa38a89SBing Zhao 	struct mlx5_flex_parser_profiles *prf =
628daa38a89SBing Zhao 				&priv->sh->fp[MLX5_FLEX_PARSER_ECPRI_0];
629daa38a89SBing Zhao 
630daa38a89SBing Zhao 	return !!prf->obj;
631daa38a89SBing Zhao }
632daa38a89SBing Zhao 
633daa38a89SBing Zhao /*
634daa38a89SBing Zhao  * Allocation of a flex parser for eCPRI. Once created, this parser related
635daa38a89SBing Zhao  * resources will be held until the device is closed.
636daa38a89SBing Zhao  *
637daa38a89SBing Zhao  * @param dev
638daa38a89SBing Zhao  *   Pointer to Ethernet device structure.
639daa38a89SBing Zhao  *
640daa38a89SBing Zhao  * @return
641daa38a89SBing Zhao  *   0 on success, a negative errno value otherwise and rte_errno is set.
642daa38a89SBing Zhao  */
643daa38a89SBing Zhao int
644daa38a89SBing Zhao mlx5_flex_parser_ecpri_alloc(struct rte_eth_dev *dev)
645daa38a89SBing Zhao {
646daa38a89SBing Zhao 	struct mlx5_priv *priv = dev->data->dev_private;
647daa38a89SBing Zhao 	struct mlx5_flex_parser_profiles *prf =
648daa38a89SBing Zhao 				&priv->sh->fp[MLX5_FLEX_PARSER_ECPRI_0];
6491c506404SBing Zhao 	struct mlx5_devx_graph_node_attr node = {
6501c506404SBing Zhao 		.modify_field_select = 0,
6511c506404SBing Zhao 	};
6521c506404SBing Zhao 	uint32_t ids[8];
6531c506404SBing Zhao 	int ret;
654daa38a89SBing Zhao 
655d7c49561SBing Zhao 	if (!priv->config.hca_attr.parse_graph_flex_node) {
656d7c49561SBing Zhao 		DRV_LOG(ERR, "Dynamic flex parser is not supported "
657d7c49561SBing Zhao 			"for device %s.", priv->dev_data->name);
658d7c49561SBing Zhao 		return -ENOTSUP;
659d7c49561SBing Zhao 	}
6601c506404SBing Zhao 	node.header_length_mode = MLX5_GRAPH_NODE_LEN_FIXED;
6611c506404SBing Zhao 	/* 8 bytes now: 4B common header + 4B message body header. */
6621c506404SBing Zhao 	node.header_length_base_value = 0x8;
6631c506404SBing Zhao 	/* After MAC layer: Ether / VLAN. */
6641c506404SBing Zhao 	node.in[0].arc_parse_graph_node = MLX5_GRAPH_ARC_NODE_MAC;
6651c506404SBing Zhao 	/* Type of compared condition should be 0xAEFE in the L2 layer. */
6661c506404SBing Zhao 	node.in[0].compare_condition_value = RTE_ETHER_TYPE_ECPRI;
6671c506404SBing Zhao 	/* Sample #0: type in common header. */
6681c506404SBing Zhao 	node.sample[0].flow_match_sample_en = 1;
6691c506404SBing Zhao 	/* Fixed offset. */
6701c506404SBing Zhao 	node.sample[0].flow_match_sample_offset_mode = 0x0;
6711c506404SBing Zhao 	/* Only the 2nd byte will be used. */
6721c506404SBing Zhao 	node.sample[0].flow_match_sample_field_base_offset = 0x0;
6731c506404SBing Zhao 	/* Sample #1: message payload. */
6741c506404SBing Zhao 	node.sample[1].flow_match_sample_en = 1;
6751c506404SBing Zhao 	/* Fixed offset. */
6761c506404SBing Zhao 	node.sample[1].flow_match_sample_offset_mode = 0x0;
6771c506404SBing Zhao 	/*
6781c506404SBing Zhao 	 * Only the first two bytes will be used right now, and its offset will
6791c506404SBing Zhao 	 * start after the common header that with the length of a DW(u32).
6801c506404SBing Zhao 	 */
6811c506404SBing Zhao 	node.sample[1].flow_match_sample_field_base_offset = sizeof(uint32_t);
6821c506404SBing Zhao 	prf->obj = mlx5_devx_cmd_create_flex_parser(priv->sh->ctx, &node);
6831c506404SBing Zhao 	if (!prf->obj) {
6841c506404SBing Zhao 		DRV_LOG(ERR, "Failed to create flex parser node object.");
6851c506404SBing Zhao 		return (rte_errno == 0) ? -ENODEV : -rte_errno;
6861c506404SBing Zhao 	}
6871c506404SBing Zhao 	prf->num = 2;
6881c506404SBing Zhao 	ret = mlx5_devx_cmd_query_parse_samples(prf->obj, ids, prf->num);
6891c506404SBing Zhao 	if (ret) {
6901c506404SBing Zhao 		DRV_LOG(ERR, "Failed to query sample IDs.");
6911c506404SBing Zhao 		return (rte_errno == 0) ? -ENODEV : -rte_errno;
6921c506404SBing Zhao 	}
6931c506404SBing Zhao 	prf->offset[0] = 0x0;
6941c506404SBing Zhao 	prf->offset[1] = sizeof(uint32_t);
6951c506404SBing Zhao 	prf->ids[0] = ids[0];
6961c506404SBing Zhao 	prf->ids[1] = ids[1];
697daa38a89SBing Zhao 	return 0;
698daa38a89SBing Zhao }
699daa38a89SBing Zhao 
7001c506404SBing Zhao /*
7011c506404SBing Zhao  * Destroy the flex parser node, including the parser itself, input / output
7021c506404SBing Zhao  * arcs and DW samples. Resources could be reused then.
7031c506404SBing Zhao  *
7041c506404SBing Zhao  * @param dev
7051c506404SBing Zhao  *   Pointer to Ethernet device structure.
7061c506404SBing Zhao  */
7071c506404SBing Zhao static void
7081c506404SBing Zhao mlx5_flex_parser_ecpri_release(struct rte_eth_dev *dev)
7091c506404SBing Zhao {
7101c506404SBing Zhao 	struct mlx5_priv *priv = dev->data->dev_private;
7111c506404SBing Zhao 	struct mlx5_flex_parser_profiles *prf =
7121c506404SBing Zhao 				&priv->sh->fp[MLX5_FLEX_PARSER_ECPRI_0];
7131c506404SBing Zhao 
7141c506404SBing Zhao 	if (prf->obj)
7151c506404SBing Zhao 		mlx5_devx_cmd_destroy(prf->obj);
7161c506404SBing Zhao 	prf->obj = NULL;
7171c506404SBing Zhao }
7181c506404SBing Zhao 
719a0bfe9d5SViacheslav Ovsiienko /*
720a0bfe9d5SViacheslav Ovsiienko  * Allocate Rx and Tx UARs in robust fashion.
721a0bfe9d5SViacheslav Ovsiienko  * This routine handles the following UAR allocation issues:
722a0bfe9d5SViacheslav Ovsiienko  *
723a0bfe9d5SViacheslav Ovsiienko  *  - tries to allocate the UAR with the most appropriate memory
724a0bfe9d5SViacheslav Ovsiienko  *    mapping type from the ones supported by the host
725a0bfe9d5SViacheslav Ovsiienko  *
726a0bfe9d5SViacheslav Ovsiienko  *  - tries to allocate the UAR with non-NULL base address
727a0bfe9d5SViacheslav Ovsiienko  *    OFED 5.0.x and Upstream rdma_core before v29 returned the NULL as
728a0bfe9d5SViacheslav Ovsiienko  *    UAR base address if UAR was not the first object in the UAR page.
729a0bfe9d5SViacheslav Ovsiienko  *    It caused the PMD failure and we should try to get another UAR
730a0bfe9d5SViacheslav Ovsiienko  *    till we get the first one with non-NULL base address returned.
731a0bfe9d5SViacheslav Ovsiienko  */
732a0bfe9d5SViacheslav Ovsiienko static int
733a0bfe9d5SViacheslav Ovsiienko mlx5_alloc_rxtx_uars(struct mlx5_dev_ctx_shared *sh,
734a0bfe9d5SViacheslav Ovsiienko 		     const struct mlx5_dev_config *config)
735a0bfe9d5SViacheslav Ovsiienko {
736a0bfe9d5SViacheslav Ovsiienko 	uint32_t uar_mapping, retry;
737a0bfe9d5SViacheslav Ovsiienko 	int err = 0;
7381f66ac5bSOphir Munk 	void *base_addr;
739a0bfe9d5SViacheslav Ovsiienko 
740a0bfe9d5SViacheslav Ovsiienko 	for (retry = 0; retry < MLX5_ALLOC_UAR_RETRY; ++retry) {
741a0bfe9d5SViacheslav Ovsiienko #ifdef MLX5DV_UAR_ALLOC_TYPE_NC
742a0bfe9d5SViacheslav Ovsiienko 		/* Control the mapping type according to the settings. */
743a0bfe9d5SViacheslav Ovsiienko 		uar_mapping = (config->dbnc == MLX5_TXDB_NCACHED) ?
744a0bfe9d5SViacheslav Ovsiienko 			      MLX5DV_UAR_ALLOC_TYPE_NC :
745a0bfe9d5SViacheslav Ovsiienko 			      MLX5DV_UAR_ALLOC_TYPE_BF;
746a0bfe9d5SViacheslav Ovsiienko #else
747a0bfe9d5SViacheslav Ovsiienko 		RTE_SET_USED(config);
748a0bfe9d5SViacheslav Ovsiienko 		/*
749a0bfe9d5SViacheslav Ovsiienko 		 * It seems we have no way to control the memory mapping type
750a0bfe9d5SViacheslav Ovsiienko 		 * for the UAR, the default "Write-Combining" type is supposed.
751a0bfe9d5SViacheslav Ovsiienko 		 * The UAR initialization on queue creation queries the
752a0bfe9d5SViacheslav Ovsiienko 		 * actual mapping type done by Verbs/kernel and setups the
753a0bfe9d5SViacheslav Ovsiienko 		 * PMD datapath accordingly.
754a0bfe9d5SViacheslav Ovsiienko 		 */
755a0bfe9d5SViacheslav Ovsiienko 		uar_mapping = 0;
756a0bfe9d5SViacheslav Ovsiienko #endif
757a0bfe9d5SViacheslav Ovsiienko 		sh->tx_uar = mlx5_glue->devx_alloc_uar(sh->ctx, uar_mapping);
758a0bfe9d5SViacheslav Ovsiienko #ifdef MLX5DV_UAR_ALLOC_TYPE_NC
759a0bfe9d5SViacheslav Ovsiienko 		if (!sh->tx_uar &&
760a0bfe9d5SViacheslav Ovsiienko 		    uar_mapping == MLX5DV_UAR_ALLOC_TYPE_BF) {
761a0bfe9d5SViacheslav Ovsiienko 			if (config->dbnc == MLX5_TXDB_CACHED ||
762a0bfe9d5SViacheslav Ovsiienko 			    config->dbnc == MLX5_TXDB_HEURISTIC)
763a0bfe9d5SViacheslav Ovsiienko 				DRV_LOG(WARNING, "Devarg tx_db_nc setting "
764a0bfe9d5SViacheslav Ovsiienko 						 "is not supported by DevX");
765a0bfe9d5SViacheslav Ovsiienko 			/*
766a0bfe9d5SViacheslav Ovsiienko 			 * In some environments like virtual machine
767a0bfe9d5SViacheslav Ovsiienko 			 * the Write Combining mapped might be not supported
768a0bfe9d5SViacheslav Ovsiienko 			 * and UAR allocation fails. We try "Non-Cached"
769a0bfe9d5SViacheslav Ovsiienko 			 * mapping for the case. The tx_burst routines take
770a0bfe9d5SViacheslav Ovsiienko 			 * the UAR mapping type into account on UAR setup
771a0bfe9d5SViacheslav Ovsiienko 			 * on queue creation.
772a0bfe9d5SViacheslav Ovsiienko 			 */
773a0bfe9d5SViacheslav Ovsiienko 			DRV_LOG(WARNING, "Failed to allocate Tx DevX UAR (BF)");
774a0bfe9d5SViacheslav Ovsiienko 			uar_mapping = MLX5DV_UAR_ALLOC_TYPE_NC;
775a0bfe9d5SViacheslav Ovsiienko 			sh->tx_uar = mlx5_glue->devx_alloc_uar
776a0bfe9d5SViacheslav Ovsiienko 							(sh->ctx, uar_mapping);
777a0bfe9d5SViacheslav Ovsiienko 		} else if (!sh->tx_uar &&
778a0bfe9d5SViacheslav Ovsiienko 			   uar_mapping == MLX5DV_UAR_ALLOC_TYPE_NC) {
779a0bfe9d5SViacheslav Ovsiienko 			if (config->dbnc == MLX5_TXDB_NCACHED)
780a0bfe9d5SViacheslav Ovsiienko 				DRV_LOG(WARNING, "Devarg tx_db_nc settings "
781a0bfe9d5SViacheslav Ovsiienko 						 "is not supported by DevX");
782a0bfe9d5SViacheslav Ovsiienko 			/*
783a0bfe9d5SViacheslav Ovsiienko 			 * If Verbs/kernel does not support "Non-Cached"
784a0bfe9d5SViacheslav Ovsiienko 			 * try the "Write-Combining".
785a0bfe9d5SViacheslav Ovsiienko 			 */
786a0bfe9d5SViacheslav Ovsiienko 			DRV_LOG(WARNING, "Failed to allocate Tx DevX UAR (NC)");
787a0bfe9d5SViacheslav Ovsiienko 			uar_mapping = MLX5DV_UAR_ALLOC_TYPE_BF;
788a0bfe9d5SViacheslav Ovsiienko 			sh->tx_uar = mlx5_glue->devx_alloc_uar
789a0bfe9d5SViacheslav Ovsiienko 							(sh->ctx, uar_mapping);
790a0bfe9d5SViacheslav Ovsiienko 		}
791a0bfe9d5SViacheslav Ovsiienko #endif
792a0bfe9d5SViacheslav Ovsiienko 		if (!sh->tx_uar) {
793a0bfe9d5SViacheslav Ovsiienko 			DRV_LOG(ERR, "Failed to allocate Tx DevX UAR (BF/NC)");
794a0bfe9d5SViacheslav Ovsiienko 			err = ENOMEM;
795a0bfe9d5SViacheslav Ovsiienko 			goto exit;
796a0bfe9d5SViacheslav Ovsiienko 		}
7971f66ac5bSOphir Munk 		base_addr = mlx5_os_get_devx_uar_base_addr(sh->tx_uar);
7981f66ac5bSOphir Munk 		if (base_addr)
799a0bfe9d5SViacheslav Ovsiienko 			break;
800a0bfe9d5SViacheslav Ovsiienko 		/*
801a0bfe9d5SViacheslav Ovsiienko 		 * The UARs are allocated by rdma_core within the
802a0bfe9d5SViacheslav Ovsiienko 		 * IB device context, on context closure all UARs
803a0bfe9d5SViacheslav Ovsiienko 		 * will be freed, should be no memory/object leakage.
804a0bfe9d5SViacheslav Ovsiienko 		 */
805a0bfe9d5SViacheslav Ovsiienko 		DRV_LOG(WARNING, "Retrying to allocate Tx DevX UAR");
806a0bfe9d5SViacheslav Ovsiienko 		sh->tx_uar = NULL;
807a0bfe9d5SViacheslav Ovsiienko 	}
808a0bfe9d5SViacheslav Ovsiienko 	/* Check whether we finally succeeded with valid UAR allocation. */
809a0bfe9d5SViacheslav Ovsiienko 	if (!sh->tx_uar) {
810a0bfe9d5SViacheslav Ovsiienko 		DRV_LOG(ERR, "Failed to allocate Tx DevX UAR (NULL base)");
811a0bfe9d5SViacheslav Ovsiienko 		err = ENOMEM;
812a0bfe9d5SViacheslav Ovsiienko 		goto exit;
813a0bfe9d5SViacheslav Ovsiienko 	}
814a0bfe9d5SViacheslav Ovsiienko 	for (retry = 0; retry < MLX5_ALLOC_UAR_RETRY; ++retry) {
815a0bfe9d5SViacheslav Ovsiienko 		uar_mapping = 0;
816a0bfe9d5SViacheslav Ovsiienko 		sh->devx_rx_uar = mlx5_glue->devx_alloc_uar
817a0bfe9d5SViacheslav Ovsiienko 							(sh->ctx, uar_mapping);
818a0bfe9d5SViacheslav Ovsiienko #ifdef MLX5DV_UAR_ALLOC_TYPE_NC
819a0bfe9d5SViacheslav Ovsiienko 		if (!sh->devx_rx_uar &&
820a0bfe9d5SViacheslav Ovsiienko 		    uar_mapping == MLX5DV_UAR_ALLOC_TYPE_BF) {
821a0bfe9d5SViacheslav Ovsiienko 			/*
822a0bfe9d5SViacheslav Ovsiienko 			 * Rx UAR is used to control interrupts only,
823a0bfe9d5SViacheslav Ovsiienko 			 * should be no datapath noticeable impact,
824a0bfe9d5SViacheslav Ovsiienko 			 * can try "Non-Cached" mapping safely.
825a0bfe9d5SViacheslav Ovsiienko 			 */
826a0bfe9d5SViacheslav Ovsiienko 			DRV_LOG(WARNING, "Failed to allocate Rx DevX UAR (BF)");
827a0bfe9d5SViacheslav Ovsiienko 			uar_mapping = MLX5DV_UAR_ALLOC_TYPE_NC;
828a0bfe9d5SViacheslav Ovsiienko 			sh->devx_rx_uar = mlx5_glue->devx_alloc_uar
829a0bfe9d5SViacheslav Ovsiienko 							(sh->ctx, uar_mapping);
830a0bfe9d5SViacheslav Ovsiienko 		}
831a0bfe9d5SViacheslav Ovsiienko #endif
832a0bfe9d5SViacheslav Ovsiienko 		if (!sh->devx_rx_uar) {
833a0bfe9d5SViacheslav Ovsiienko 			DRV_LOG(ERR, "Failed to allocate Rx DevX UAR (BF/NC)");
834a0bfe9d5SViacheslav Ovsiienko 			err = ENOMEM;
835a0bfe9d5SViacheslav Ovsiienko 			goto exit;
836a0bfe9d5SViacheslav Ovsiienko 		}
8371f66ac5bSOphir Munk 		base_addr = mlx5_os_get_devx_uar_base_addr(sh->devx_rx_uar);
8381f66ac5bSOphir Munk 		if (base_addr)
839a0bfe9d5SViacheslav Ovsiienko 			break;
840a0bfe9d5SViacheslav Ovsiienko 		/*
841a0bfe9d5SViacheslav Ovsiienko 		 * The UARs are allocated by rdma_core within the
842a0bfe9d5SViacheslav Ovsiienko 		 * IB device context, on context closure all UARs
843a0bfe9d5SViacheslav Ovsiienko 		 * will be freed, should be no memory/object leakage.
844a0bfe9d5SViacheslav Ovsiienko 		 */
845a0bfe9d5SViacheslav Ovsiienko 		DRV_LOG(WARNING, "Retrying to allocate Rx DevX UAR");
846a0bfe9d5SViacheslav Ovsiienko 		sh->devx_rx_uar = NULL;
847a0bfe9d5SViacheslav Ovsiienko 	}
848a0bfe9d5SViacheslav Ovsiienko 	/* Check whether we finally succeeded with valid UAR allocation. */
849a0bfe9d5SViacheslav Ovsiienko 	if (!sh->devx_rx_uar) {
850a0bfe9d5SViacheslav Ovsiienko 		DRV_LOG(ERR, "Failed to allocate Rx DevX UAR (NULL base)");
851a0bfe9d5SViacheslav Ovsiienko 		err = ENOMEM;
852a0bfe9d5SViacheslav Ovsiienko 	}
853a0bfe9d5SViacheslav Ovsiienko exit:
854a0bfe9d5SViacheslav Ovsiienko 	return err;
855a0bfe9d5SViacheslav Ovsiienko }
856a0bfe9d5SViacheslav Ovsiienko 
857014d1cbeSSuanming Mou /**
85891389890SOphir Munk  * Allocate shared device context. If there is multiport device the
85917e19bc4SViacheslav Ovsiienko  * master and representors will share this context, if there is single
86091389890SOphir Munk  * port dedicated device, the context will be used by only given
86117e19bc4SViacheslav Ovsiienko  * port due to unification.
86217e19bc4SViacheslav Ovsiienko  *
86391389890SOphir Munk  * Routine first searches the context for the specified device name,
86417e19bc4SViacheslav Ovsiienko  * if found the shared context assumed and reference counter is incremented.
86517e19bc4SViacheslav Ovsiienko  * If no context found the new one is created and initialized with specified
86691389890SOphir Munk  * device context and parameters.
86717e19bc4SViacheslav Ovsiienko  *
86817e19bc4SViacheslav Ovsiienko  * @param[in] spawn
86991389890SOphir Munk  *   Pointer to the device attributes (name, port, etc).
8708409a285SViacheslav Ovsiienko  * @param[in] config
8718409a285SViacheslav Ovsiienko  *   Pointer to device configuration structure.
87217e19bc4SViacheslav Ovsiienko  *
87317e19bc4SViacheslav Ovsiienko  * @return
8746e88bc42SOphir Munk  *   Pointer to mlx5_dev_ctx_shared object on success,
87517e19bc4SViacheslav Ovsiienko  *   otherwise NULL and rte_errno is set.
87617e19bc4SViacheslav Ovsiienko  */
8772eb4d010SOphir Munk struct mlx5_dev_ctx_shared *
87891389890SOphir Munk mlx5_alloc_shared_dev_ctx(const struct mlx5_dev_spawn_data *spawn,
8798409a285SViacheslav Ovsiienko 			   const struct mlx5_dev_config *config)
88017e19bc4SViacheslav Ovsiienko {
8816e88bc42SOphir Munk 	struct mlx5_dev_ctx_shared *sh;
88217e19bc4SViacheslav Ovsiienko 	int err = 0;
88353e5a82fSViacheslav Ovsiienko 	uint32_t i;
884ae18a1aeSOri Kam 	struct mlx5_devx_tis_attr tis_attr = { 0 };
88517e19bc4SViacheslav Ovsiienko 
8868e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(spawn);
88717e19bc4SViacheslav Ovsiienko 	/* Secondary process should not create the shared context. */
8888e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(rte_eal_process_type() == RTE_PROC_PRIMARY);
88991389890SOphir Munk 	pthread_mutex_lock(&mlx5_dev_ctx_list_mutex);
89017e19bc4SViacheslav Ovsiienko 	/* Search for IB context by device name. */
89191389890SOphir Munk 	LIST_FOREACH(sh, &mlx5_dev_ctx_list, next) {
892834a9019SOphir Munk 		if (!strcmp(sh->ibdev_name,
893834a9019SOphir Munk 			mlx5_os_get_dev_device_name(spawn->phys_dev))) {
89417e19bc4SViacheslav Ovsiienko 			sh->refcnt++;
89517e19bc4SViacheslav Ovsiienko 			goto exit;
89617e19bc4SViacheslav Ovsiienko 		}
89717e19bc4SViacheslav Ovsiienko 	}
898ae4eb7dcSViacheslav Ovsiienko 	/* No device found, we have to create new shared context. */
8998e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(spawn->max_port);
9002175c4dcSSuanming Mou 	sh = mlx5_malloc(MLX5_MEM_ZERO | MLX5_MEM_RTE,
9016e88bc42SOphir Munk 			 sizeof(struct mlx5_dev_ctx_shared) +
90217e19bc4SViacheslav Ovsiienko 			 spawn->max_port *
90391389890SOphir Munk 			 sizeof(struct mlx5_dev_shared_port),
9042175c4dcSSuanming Mou 			 RTE_CACHE_LINE_SIZE, SOCKET_ID_ANY);
90517e19bc4SViacheslav Ovsiienko 	if (!sh) {
90617e19bc4SViacheslav Ovsiienko 		DRV_LOG(ERR, "shared context allocation failure");
90717e19bc4SViacheslav Ovsiienko 		rte_errno  = ENOMEM;
90817e19bc4SViacheslav Ovsiienko 		goto exit;
90917e19bc4SViacheslav Ovsiienko 	}
9102eb4d010SOphir Munk 	err = mlx5_os_open_device(spawn, config, sh);
91106f78b5eSViacheslav Ovsiienko 	if (!sh->ctx)
91217e19bc4SViacheslav Ovsiienko 		goto error;
913e85f623eSOphir Munk 	err = mlx5_os_get_dev_attr(sh->ctx, &sh->device_attr);
91417e19bc4SViacheslav Ovsiienko 	if (err) {
915e85f623eSOphir Munk 		DRV_LOG(DEBUG, "mlx5_os_get_dev_attr() failed");
91617e19bc4SViacheslav Ovsiienko 		goto error;
91717e19bc4SViacheslav Ovsiienko 	}
91817e19bc4SViacheslav Ovsiienko 	sh->refcnt = 1;
919e6818853SXueming Li 	sh->bond_dev = UINT16_MAX;
92017e19bc4SViacheslav Ovsiienko 	sh->max_port = spawn->max_port;
921f44b09f9SOphir Munk 	strncpy(sh->ibdev_name, mlx5_os_get_ctx_device_name(sh->ctx),
922f44b09f9SOphir Munk 		sizeof(sh->ibdev_name) - 1);
923f44b09f9SOphir Munk 	strncpy(sh->ibdev_path, mlx5_os_get_ctx_device_path(sh->ctx),
924f44b09f9SOphir Munk 		sizeof(sh->ibdev_path) - 1);
92553e5a82fSViacheslav Ovsiienko 	/*
92653e5a82fSViacheslav Ovsiienko 	 * Setting port_id to max unallowed value means
92753e5a82fSViacheslav Ovsiienko 	 * there is no interrupt subhandler installed for
92853e5a82fSViacheslav Ovsiienko 	 * the given port index i.
92953e5a82fSViacheslav Ovsiienko 	 */
93023242063SMatan Azrad 	for (i = 0; i < sh->max_port; i++) {
93153e5a82fSViacheslav Ovsiienko 		sh->port[i].ih_port_id = RTE_MAX_ETHPORTS;
93223242063SMatan Azrad 		sh->port[i].devx_ih_port_id = RTE_MAX_ETHPORTS;
93323242063SMatan Azrad 	}
93417e19bc4SViacheslav Ovsiienko 	sh->pd = mlx5_glue->alloc_pd(sh->ctx);
93517e19bc4SViacheslav Ovsiienko 	if (sh->pd == NULL) {
93617e19bc4SViacheslav Ovsiienko 		DRV_LOG(ERR, "PD allocation failure");
93717e19bc4SViacheslav Ovsiienko 		err = ENOMEM;
93817e19bc4SViacheslav Ovsiienko 		goto error;
93917e19bc4SViacheslav Ovsiienko 	}
940ae18a1aeSOri Kam 	if (sh->devx) {
941e7055bbfSMichael Baum 		/* Query the EQN for this core. */
9428dc775d8SMatan Azrad 		err = mlx5_glue->devx_query_eqn(sh->ctx, 0, &sh->eqn);
943e7055bbfSMichael Baum 		if (err) {
944e7055bbfSMichael Baum 			rte_errno = errno;
945e7055bbfSMichael Baum 			DRV_LOG(ERR, "Failed to query event queue number %d.",
946e7055bbfSMichael Baum 				rte_errno);
947e7055bbfSMichael Baum 			goto error;
948e7055bbfSMichael Baum 		}
9492eb4d010SOphir Munk 		err = mlx5_os_get_pdn(sh->pd, &sh->pdn);
950b9d86122SDekel Peled 		if (err) {
951b9d86122SDekel Peled 			DRV_LOG(ERR, "Fail to extract pdn from PD");
952b9d86122SDekel Peled 			goto error;
953b9d86122SDekel Peled 		}
954ae18a1aeSOri Kam 		sh->td = mlx5_devx_cmd_create_td(sh->ctx);
955ae18a1aeSOri Kam 		if (!sh->td) {
956ae18a1aeSOri Kam 			DRV_LOG(ERR, "TD allocation failure");
957ae18a1aeSOri Kam 			err = ENOMEM;
958ae18a1aeSOri Kam 			goto error;
959ae18a1aeSOri Kam 		}
960ae18a1aeSOri Kam 		tis_attr.transport_domain = sh->td->id;
961ae18a1aeSOri Kam 		sh->tis = mlx5_devx_cmd_create_tis(sh->ctx, &tis_attr);
962ae18a1aeSOri Kam 		if (!sh->tis) {
963ae18a1aeSOri Kam 			DRV_LOG(ERR, "TIS allocation failure");
964ae18a1aeSOri Kam 			err = ENOMEM;
965ae18a1aeSOri Kam 			goto error;
966ae18a1aeSOri Kam 		}
967a0bfe9d5SViacheslav Ovsiienko 		err = mlx5_alloc_rxtx_uars(sh, config);
968a0bfe9d5SViacheslav Ovsiienko 		if (err)
969fc4d4f73SViacheslav Ovsiienko 			goto error;
9701f66ac5bSOphir Munk 		MLX5_ASSERT(sh->tx_uar);
9711f66ac5bSOphir Munk 		MLX5_ASSERT(mlx5_os_get_devx_uar_base_addr(sh->tx_uar));
9721f66ac5bSOphir Munk 
9731f66ac5bSOphir Munk 		MLX5_ASSERT(sh->devx_rx_uar);
9741f66ac5bSOphir Munk 		MLX5_ASSERT(mlx5_os_get_devx_uar_base_addr(sh->devx_rx_uar));
975ae18a1aeSOri Kam 	}
97624feb045SViacheslav Ovsiienko #ifndef RTE_ARCH_64
97724feb045SViacheslav Ovsiienko 	/* Initialize UAR access locks for 32bit implementations. */
97824feb045SViacheslav Ovsiienko 	rte_spinlock_init(&sh->uar_lock_cq);
97924feb045SViacheslav Ovsiienko 	for (i = 0; i < MLX5_UAR_PAGE_NUM_MAX; i++)
98024feb045SViacheslav Ovsiienko 		rte_spinlock_init(&sh->uar_lock[i]);
98124feb045SViacheslav Ovsiienko #endif
982ab3cffcfSViacheslav Ovsiienko 	/*
983ab3cffcfSViacheslav Ovsiienko 	 * Once the device is added to the list of memory event
984ab3cffcfSViacheslav Ovsiienko 	 * callback, its global MR cache table cannot be expanded
985ab3cffcfSViacheslav Ovsiienko 	 * on the fly because of deadlock. If it overflows, lookup
986ab3cffcfSViacheslav Ovsiienko 	 * should be done by searching MR list linearly, which is slow.
987ab3cffcfSViacheslav Ovsiienko 	 *
988ab3cffcfSViacheslav Ovsiienko 	 * At this point the device is not added to the memory
989ab3cffcfSViacheslav Ovsiienko 	 * event list yet, context is just being created.
990ab3cffcfSViacheslav Ovsiienko 	 */
991b8dc6b0eSVu Pham 	err = mlx5_mr_btree_init(&sh->share_cache.cache,
992ab3cffcfSViacheslav Ovsiienko 				 MLX5_MR_BTREE_CACHE_N * 2,
99346e10a4cSViacheslav Ovsiienko 				 spawn->pci_dev->device.numa_node);
994ab3cffcfSViacheslav Ovsiienko 	if (err) {
995ab3cffcfSViacheslav Ovsiienko 		err = rte_errno;
996ab3cffcfSViacheslav Ovsiienko 		goto error;
997ab3cffcfSViacheslav Ovsiienko 	}
998d5ed8aa9SOphir Munk 	mlx5_os_set_reg_mr_cb(&sh->share_cache.reg_mr_cb,
999d5ed8aa9SOphir Munk 			      &sh->share_cache.dereg_mr_cb);
10002eb4d010SOphir Munk 	mlx5_os_dev_shared_handler_install(sh);
1001632f0f19SSuanming Mou 	sh->cnt_id_tbl = mlx5_l3t_create(MLX5_L3T_TYPE_DWORD);
1002632f0f19SSuanming Mou 	if (!sh->cnt_id_tbl) {
1003632f0f19SSuanming Mou 		err = rte_errno;
1004632f0f19SSuanming Mou 		goto error;
1005632f0f19SSuanming Mou 	}
1006fa2d01c8SDong Zhou 	mlx5_flow_aging_init(sh);
10075382d28cSMatan Azrad 	mlx5_flow_counters_mng_init(sh);
1008b88341caSSuanming Mou 	mlx5_flow_ipool_create(sh, config);
10090e3d0525SViacheslav Ovsiienko 	/* Add device to memory callback list. */
10100e3d0525SViacheslav Ovsiienko 	rte_rwlock_write_lock(&mlx5_shared_data->mem_event_rwlock);
10110e3d0525SViacheslav Ovsiienko 	LIST_INSERT_HEAD(&mlx5_shared_data->mem_event_cb_list,
10120e3d0525SViacheslav Ovsiienko 			 sh, mem_event_cb);
10130e3d0525SViacheslav Ovsiienko 	rte_rwlock_write_unlock(&mlx5_shared_data->mem_event_rwlock);
10140e3d0525SViacheslav Ovsiienko 	/* Add context to the global device list. */
101591389890SOphir Munk 	LIST_INSERT_HEAD(&mlx5_dev_ctx_list, sh, next);
101617e19bc4SViacheslav Ovsiienko exit:
101791389890SOphir Munk 	pthread_mutex_unlock(&mlx5_dev_ctx_list_mutex);
101817e19bc4SViacheslav Ovsiienko 	return sh;
101917e19bc4SViacheslav Ovsiienko error:
1020d133f4cdSViacheslav Ovsiienko 	pthread_mutex_destroy(&sh->txpp.mutex);
102191389890SOphir Munk 	pthread_mutex_unlock(&mlx5_dev_ctx_list_mutex);
10228e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(sh);
1023a0bfe9d5SViacheslav Ovsiienko 	if (sh->cnt_id_tbl)
1024632f0f19SSuanming Mou 		mlx5_l3t_destroy(sh->cnt_id_tbl);
1025ae18a1aeSOri Kam 	if (sh->tis)
1026ae18a1aeSOri Kam 		claim_zero(mlx5_devx_cmd_destroy(sh->tis));
1027ae18a1aeSOri Kam 	if (sh->td)
1028ae18a1aeSOri Kam 		claim_zero(mlx5_devx_cmd_destroy(sh->td));
102908d1838fSDekel Peled 	if (sh->devx_rx_uar)
103008d1838fSDekel Peled 		mlx5_glue->devx_free_uar(sh->devx_rx_uar);
1031a0bfe9d5SViacheslav Ovsiienko 	if (sh->tx_uar)
1032a0bfe9d5SViacheslav Ovsiienko 		mlx5_glue->devx_free_uar(sh->tx_uar);
103317e19bc4SViacheslav Ovsiienko 	if (sh->pd)
103417e19bc4SViacheslav Ovsiienko 		claim_zero(mlx5_glue->dealloc_pd(sh->pd));
103517e19bc4SViacheslav Ovsiienko 	if (sh->ctx)
103617e19bc4SViacheslav Ovsiienko 		claim_zero(mlx5_glue->close_device(sh->ctx));
10372175c4dcSSuanming Mou 	mlx5_free(sh);
10388e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(err > 0);
103917e19bc4SViacheslav Ovsiienko 	rte_errno = err;
104017e19bc4SViacheslav Ovsiienko 	return NULL;
104117e19bc4SViacheslav Ovsiienko }
104217e19bc4SViacheslav Ovsiienko 
104317e19bc4SViacheslav Ovsiienko /**
104417e19bc4SViacheslav Ovsiienko  * Free shared IB device context. Decrement counter and if zero free
104517e19bc4SViacheslav Ovsiienko  * all allocated resources and close handles.
104617e19bc4SViacheslav Ovsiienko  *
104717e19bc4SViacheslav Ovsiienko  * @param[in] sh
10486e88bc42SOphir Munk  *   Pointer to mlx5_dev_ctx_shared object to free
104917e19bc4SViacheslav Ovsiienko  */
10502eb4d010SOphir Munk void
105191389890SOphir Munk mlx5_free_shared_dev_ctx(struct mlx5_dev_ctx_shared *sh)
105217e19bc4SViacheslav Ovsiienko {
105391389890SOphir Munk 	pthread_mutex_lock(&mlx5_dev_ctx_list_mutex);
10540afacb04SAlexander Kozyrev #ifdef RTE_LIBRTE_MLX5_DEBUG
105517e19bc4SViacheslav Ovsiienko 	/* Check the object presence in the list. */
10566e88bc42SOphir Munk 	struct mlx5_dev_ctx_shared *lctx;
105717e19bc4SViacheslav Ovsiienko 
105891389890SOphir Munk 	LIST_FOREACH(lctx, &mlx5_dev_ctx_list, next)
105917e19bc4SViacheslav Ovsiienko 		if (lctx == sh)
106017e19bc4SViacheslav Ovsiienko 			break;
10618e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(lctx);
106217e19bc4SViacheslav Ovsiienko 	if (lctx != sh) {
106317e19bc4SViacheslav Ovsiienko 		DRV_LOG(ERR, "Freeing non-existing shared IB context");
106417e19bc4SViacheslav Ovsiienko 		goto exit;
106517e19bc4SViacheslav Ovsiienko 	}
106617e19bc4SViacheslav Ovsiienko #endif
10678e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(sh);
10688e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(sh->refcnt);
106917e19bc4SViacheslav Ovsiienko 	/* Secondary process should not free the shared context. */
10708e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(rte_eal_process_type() == RTE_PROC_PRIMARY);
107117e19bc4SViacheslav Ovsiienko 	if (--sh->refcnt)
107217e19bc4SViacheslav Ovsiienko 		goto exit;
10730e3d0525SViacheslav Ovsiienko 	/* Remove from memory callback device list. */
10740e3d0525SViacheslav Ovsiienko 	rte_rwlock_write_lock(&mlx5_shared_data->mem_event_rwlock);
10750e3d0525SViacheslav Ovsiienko 	LIST_REMOVE(sh, mem_event_cb);
10760e3d0525SViacheslav Ovsiienko 	rte_rwlock_write_unlock(&mlx5_shared_data->mem_event_rwlock);
10774f8e6befSMichael Baum 	/* Release created Memory Regions. */
1078b8dc6b0eSVu Pham 	mlx5_mr_release_cache(&sh->share_cache);
10790e3d0525SViacheslav Ovsiienko 	/* Remove context from the global device list. */
108017e19bc4SViacheslav Ovsiienko 	LIST_REMOVE(sh, next);
1081f4a08731SMichael Baum 	pthread_mutex_unlock(&mlx5_dev_ctx_list_mutex);
108253e5a82fSViacheslav Ovsiienko 	/*
108353e5a82fSViacheslav Ovsiienko 	 *  Ensure there is no async event handler installed.
108453e5a82fSViacheslav Ovsiienko 	 *  Only primary process handles async device events.
108553e5a82fSViacheslav Ovsiienko 	 **/
10865382d28cSMatan Azrad 	mlx5_flow_counters_mng_close(sh);
1087f935ed4bSDekel Peled 	if (sh->aso_age_mng) {
1088f935ed4bSDekel Peled 		mlx5_flow_aso_age_mng_close(sh);
1089f935ed4bSDekel Peled 		sh->aso_age_mng = NULL;
1090f935ed4bSDekel Peled 	}
1091014d1cbeSSuanming Mou 	mlx5_flow_ipool_destroy(sh);
10922eb4d010SOphir Munk 	mlx5_os_dev_shared_handler_uninstall(sh);
1093632f0f19SSuanming Mou 	if (sh->cnt_id_tbl) {
1094632f0f19SSuanming Mou 		mlx5_l3t_destroy(sh->cnt_id_tbl);
1095632f0f19SSuanming Mou 		sh->cnt_id_tbl = NULL;
1096632f0f19SSuanming Mou 	}
1097fc4d4f73SViacheslav Ovsiienko 	if (sh->tx_uar) {
1098fc4d4f73SViacheslav Ovsiienko 		mlx5_glue->devx_free_uar(sh->tx_uar);
1099fc4d4f73SViacheslav Ovsiienko 		sh->tx_uar = NULL;
1100fc4d4f73SViacheslav Ovsiienko 	}
110117e19bc4SViacheslav Ovsiienko 	if (sh->pd)
110217e19bc4SViacheslav Ovsiienko 		claim_zero(mlx5_glue->dealloc_pd(sh->pd));
1103ae18a1aeSOri Kam 	if (sh->tis)
1104ae18a1aeSOri Kam 		claim_zero(mlx5_devx_cmd_destroy(sh->tis));
1105ae18a1aeSOri Kam 	if (sh->td)
1106ae18a1aeSOri Kam 		claim_zero(mlx5_devx_cmd_destroy(sh->td));
110708d1838fSDekel Peled 	if (sh->devx_rx_uar)
110808d1838fSDekel Peled 		mlx5_glue->devx_free_uar(sh->devx_rx_uar);
110917e19bc4SViacheslav Ovsiienko 	if (sh->ctx)
111017e19bc4SViacheslav Ovsiienko 		claim_zero(mlx5_glue->close_device(sh->ctx));
1111d133f4cdSViacheslav Ovsiienko 	pthread_mutex_destroy(&sh->txpp.mutex);
11122175c4dcSSuanming Mou 	mlx5_free(sh);
1113f4a08731SMichael Baum 	return;
111417e19bc4SViacheslav Ovsiienko exit:
111591389890SOphir Munk 	pthread_mutex_unlock(&mlx5_dev_ctx_list_mutex);
111617e19bc4SViacheslav Ovsiienko }
111717e19bc4SViacheslav Ovsiienko 
1118771fa900SAdrien Mazarguil /**
1119afd7a625SXueming Li  * Destroy table hash list.
112054534725SMatan Azrad  *
112154534725SMatan Azrad  * @param[in] priv
112254534725SMatan Azrad  *   Pointer to the private device data structure.
112354534725SMatan Azrad  */
11242eb4d010SOphir Munk void
112554534725SMatan Azrad mlx5_free_table_hash_list(struct mlx5_priv *priv)
112654534725SMatan Azrad {
11276e88bc42SOphir Munk 	struct mlx5_dev_ctx_shared *sh = priv->sh;
112854534725SMatan Azrad 
112954534725SMatan Azrad 	if (!sh->flow_tbls)
113054534725SMatan Azrad 		return;
1131e69a5922SXueming Li 	mlx5_hlist_destroy(sh->flow_tbls);
113254534725SMatan Azrad }
113354534725SMatan Azrad 
113454534725SMatan Azrad /**
113554534725SMatan Azrad  * Initialize flow table hash list and create the root tables entry
113654534725SMatan Azrad  * for each domain.
113754534725SMatan Azrad  *
113854534725SMatan Azrad  * @param[in] priv
113954534725SMatan Azrad  *   Pointer to the private device data structure.
114054534725SMatan Azrad  *
114154534725SMatan Azrad  * @return
114254534725SMatan Azrad  *   Zero on success, positive error code otherwise.
114354534725SMatan Azrad  */
11442eb4d010SOphir Munk int
1145afd7a625SXueming Li mlx5_alloc_table_hash_list(struct mlx5_priv *priv __rte_unused)
114654534725SMatan Azrad {
1147afd7a625SXueming Li 	int err = 0;
1148afd7a625SXueming Li 	/* Tables are only used in DV and DR modes. */
1149afd7a625SXueming Li #ifdef HAVE_IBV_FLOW_DV_SUPPORT
11506e88bc42SOphir Munk 	struct mlx5_dev_ctx_shared *sh = priv->sh;
115154534725SMatan Azrad 	char s[MLX5_HLIST_NAMESIZE];
115254534725SMatan Azrad 
11538e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(sh);
115454534725SMatan Azrad 	snprintf(s, sizeof(s), "%s_flow_table", priv->sh->ibdev_name);
1155e69a5922SXueming Li 	sh->flow_tbls = mlx5_hlist_create(s, MLX5_FLOW_TABLE_HLIST_ARRAY_SIZE,
1156f5b0aed2SSuanming Mou 					  0, 0, flow_dv_tbl_create_cb,
1157f5b0aed2SSuanming Mou 					  flow_dv_tbl_match_cb,
1158afd7a625SXueming Li 					  flow_dv_tbl_remove_cb);
115954534725SMatan Azrad 	if (!sh->flow_tbls) {
116063783b01SDavid Marchand 		DRV_LOG(ERR, "flow tables with hash creation failed.");
116154534725SMatan Azrad 		err = ENOMEM;
116254534725SMatan Azrad 		return err;
116354534725SMatan Azrad 	}
1164afd7a625SXueming Li 	sh->flow_tbls->ctx = sh;
116554534725SMatan Azrad #ifndef HAVE_MLX5DV_DR
1166afd7a625SXueming Li 	struct rte_flow_error error;
1167afd7a625SXueming Li 	struct rte_eth_dev *dev = &rte_eth_devices[priv->dev_data->port_id];
1168afd7a625SXueming Li 
116954534725SMatan Azrad 	/*
117054534725SMatan Azrad 	 * In case we have not DR support, the zero tables should be created
117154534725SMatan Azrad 	 * because DV expect to see them even if they cannot be created by
117254534725SMatan Azrad 	 * RDMA-CORE.
117354534725SMatan Azrad 	 */
1174afd7a625SXueming Li 	if (!flow_dv_tbl_resource_get(dev, 0, 0, 0, 0, NULL, 0, 1, &error) ||
1175afd7a625SXueming Li 	    !flow_dv_tbl_resource_get(dev, 0, 1, 0, 0, NULL, 0, 1, &error) ||
1176afd7a625SXueming Li 	    !flow_dv_tbl_resource_get(dev, 0, 0, 1, 0, NULL, 0, 1, &error)) {
117754534725SMatan Azrad 		err = ENOMEM;
117854534725SMatan Azrad 		goto error;
117954534725SMatan Azrad 	}
118054534725SMatan Azrad 	return err;
118154534725SMatan Azrad error:
118254534725SMatan Azrad 	mlx5_free_table_hash_list(priv);
118354534725SMatan Azrad #endif /* HAVE_MLX5DV_DR */
1184afd7a625SXueming Li #endif
118554534725SMatan Azrad 	return err;
118654534725SMatan Azrad }
118754534725SMatan Azrad 
/**
 * Retrieve integer value from environment variable.
 *
 * The value is parsed as a decimal number. As with atoi(), leading white
 * space is skipped and parsing stops at the first character that cannot
 * belong to the number, so "12abc" yields 12 and "abc" yields 0.
 * The caller's errno is left untouched.
 *
 * @param[in] name
 *   Environment variable name.
 *
 * @return
 *   Integer value, 0 if the variable is not set, holds no number, or holds
 *   a number that does not fit in an int.
 */
int
mlx5_getenv_int(const char *name)
{
	const char *val = getenv(name);
	int saved_errno;
	long parsed;
	int ret;

	if (val == NULL)
		return 0;
	/*
	 * atoi() has undefined behavior when the value cannot be
	 * represented; strtol() reports that case through errno instead.
	 */
	saved_errno = errno;
	errno = 0;
	parsed = strtol(val, NULL, 10);
	ret = (int)parsed;
	/*
	 * Reject what overflowed long (ERANGE) and what fits in long but
	 * does not survive the round trip through int.
	 */
	if (errno == ERANGE || (long)ret != parsed)
		ret = 0;
	errno = saved_errno;
	return ret;
}
12064d803a72SOlga Shern 
12074d803a72SOlga Shern /**
1208c9ba7523SRaslan Darawsheh  * DPDK callback to add udp tunnel port
1209c9ba7523SRaslan Darawsheh  *
1210c9ba7523SRaslan Darawsheh  * @param[in] dev
1211c9ba7523SRaslan Darawsheh  *   A pointer to eth_dev
1212c9ba7523SRaslan Darawsheh  * @param[in] udp_tunnel
1213c9ba7523SRaslan Darawsheh  *   A pointer to udp tunnel
1214c9ba7523SRaslan Darawsheh  *
1215c9ba7523SRaslan Darawsheh  * @return
1216c9ba7523SRaslan Darawsheh  *   0 on valid udp ports and tunnels, -ENOTSUP otherwise.
1217c9ba7523SRaslan Darawsheh  */
1218c9ba7523SRaslan Darawsheh int
1219c9ba7523SRaslan Darawsheh mlx5_udp_tunnel_port_add(struct rte_eth_dev *dev __rte_unused,
1220c9ba7523SRaslan Darawsheh 			 struct rte_eth_udp_tunnel *udp_tunnel)
1221c9ba7523SRaslan Darawsheh {
12228e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(udp_tunnel != NULL);
1223c9ba7523SRaslan Darawsheh 	if (udp_tunnel->prot_type == RTE_TUNNEL_TYPE_VXLAN &&
1224c9ba7523SRaslan Darawsheh 	    udp_tunnel->udp_port == 4789)
1225c9ba7523SRaslan Darawsheh 		return 0;
1226c9ba7523SRaslan Darawsheh 	if (udp_tunnel->prot_type == RTE_TUNNEL_TYPE_VXLAN_GPE &&
1227c9ba7523SRaslan Darawsheh 	    udp_tunnel->udp_port == 4790)
1228c9ba7523SRaslan Darawsheh 		return 0;
1229c9ba7523SRaslan Darawsheh 	return -ENOTSUP;
1230c9ba7523SRaslan Darawsheh }
1231c9ba7523SRaslan Darawsheh 
1232c9ba7523SRaslan Darawsheh /**
1233120dc4a7SYongseok Koh  * Initialize process private data structure.
1234120dc4a7SYongseok Koh  *
1235120dc4a7SYongseok Koh  * @param dev
1236120dc4a7SYongseok Koh  *   Pointer to Ethernet device structure.
1237120dc4a7SYongseok Koh  *
1238120dc4a7SYongseok Koh  * @return
1239120dc4a7SYongseok Koh  *   0 on success, a negative errno value otherwise and rte_errno is set.
1240120dc4a7SYongseok Koh  */
1241120dc4a7SYongseok Koh int
1242120dc4a7SYongseok Koh mlx5_proc_priv_init(struct rte_eth_dev *dev)
1243120dc4a7SYongseok Koh {
1244120dc4a7SYongseok Koh 	struct mlx5_priv *priv = dev->data->dev_private;
1245120dc4a7SYongseok Koh 	struct mlx5_proc_priv *ppriv;
1246120dc4a7SYongseok Koh 	size_t ppriv_size;
1247120dc4a7SYongseok Koh 
1248120dc4a7SYongseok Koh 	/*
1249120dc4a7SYongseok Koh 	 * UAR register table follows the process private structure. BlueFlame
1250120dc4a7SYongseok Koh 	 * registers for Tx queues are stored in the table.
1251120dc4a7SYongseok Koh 	 */
1252120dc4a7SYongseok Koh 	ppriv_size =
1253120dc4a7SYongseok Koh 		sizeof(struct mlx5_proc_priv) + priv->txqs_n * sizeof(void *);
12542175c4dcSSuanming Mou 	ppriv = mlx5_malloc(MLX5_MEM_RTE, ppriv_size, RTE_CACHE_LINE_SIZE,
12552175c4dcSSuanming Mou 			    dev->device->numa_node);
1256120dc4a7SYongseok Koh 	if (!ppriv) {
1257120dc4a7SYongseok Koh 		rte_errno = ENOMEM;
1258120dc4a7SYongseok Koh 		return -rte_errno;
1259120dc4a7SYongseok Koh 	}
1260120dc4a7SYongseok Koh 	ppriv->uar_table_sz = ppriv_size;
1261120dc4a7SYongseok Koh 	dev->process_private = ppriv;
1262120dc4a7SYongseok Koh 	return 0;
1263120dc4a7SYongseok Koh }
1264120dc4a7SYongseok Koh 
1265120dc4a7SYongseok Koh /**
1266120dc4a7SYongseok Koh  * Un-initialize process private data structure.
1267120dc4a7SYongseok Koh  *
1268120dc4a7SYongseok Koh  * @param dev
1269120dc4a7SYongseok Koh  *   Pointer to Ethernet device structure.
1270120dc4a7SYongseok Koh  */
1271120dc4a7SYongseok Koh static void
1272120dc4a7SYongseok Koh mlx5_proc_priv_uninit(struct rte_eth_dev *dev)
1273120dc4a7SYongseok Koh {
1274120dc4a7SYongseok Koh 	if (!dev->process_private)
1275120dc4a7SYongseok Koh 		return;
12762175c4dcSSuanming Mou 	mlx5_free(dev->process_private);
1277120dc4a7SYongseok Koh 	dev->process_private = NULL;
1278120dc4a7SYongseok Koh }
1279120dc4a7SYongseok Koh 
1280120dc4a7SYongseok Koh /**
1281771fa900SAdrien Mazarguil  * DPDK callback to close the device.
1282771fa900SAdrien Mazarguil  *
1283771fa900SAdrien Mazarguil  * Destroy all queues and objects, free memory.
1284771fa900SAdrien Mazarguil  *
1285771fa900SAdrien Mazarguil  * @param dev
1286771fa900SAdrien Mazarguil  *   Pointer to Ethernet device structure.
1287771fa900SAdrien Mazarguil  */
1288b142387bSThomas Monjalon int
1289771fa900SAdrien Mazarguil mlx5_dev_close(struct rte_eth_dev *dev)
1290771fa900SAdrien Mazarguil {
1291dbeba4cfSThomas Monjalon 	struct mlx5_priv *priv = dev->data->dev_private;
12922e22920bSAdrien Mazarguil 	unsigned int i;
12936af6b973SNélio Laranjeiro 	int ret;
1294771fa900SAdrien Mazarguil 
12952786b7bfSSuanming Mou 	if (rte_eal_process_type() == RTE_PROC_SECONDARY) {
12962786b7bfSSuanming Mou 		/* Check if process_private released. */
12972786b7bfSSuanming Mou 		if (!dev->process_private)
1298b142387bSThomas Monjalon 			return 0;
12992786b7bfSSuanming Mou 		mlx5_tx_uar_uninit_secondary(dev);
13002786b7bfSSuanming Mou 		mlx5_proc_priv_uninit(dev);
13012786b7bfSSuanming Mou 		rte_eth_dev_release_port(dev);
1302b142387bSThomas Monjalon 		return 0;
13032786b7bfSSuanming Mou 	}
13042786b7bfSSuanming Mou 	if (!priv->sh)
1305b142387bSThomas Monjalon 		return 0;
1306a170a30dSNélio Laranjeiro 	DRV_LOG(DEBUG, "port %u closing device \"%s\"",
13070f99970bSNélio Laranjeiro 		dev->data->port_id,
1308f44b09f9SOphir Munk 		((priv->sh->ctx != NULL) ?
1309f44b09f9SOphir Munk 		mlx5_os_get_ctx_device_name(priv->sh->ctx) : ""));
13108db7e3b6SBing Zhao 	/*
13118db7e3b6SBing Zhao 	 * If default mreg copy action is removed at the stop stage,
13128db7e3b6SBing Zhao 	 * the search will return none and nothing will be done anymore.
13138db7e3b6SBing Zhao 	 */
13148db7e3b6SBing Zhao 	mlx5_flow_stop_default(dev);
1315af4f09f2SNélio Laranjeiro 	mlx5_traffic_disable(dev);
13168db7e3b6SBing Zhao 	/*
13178db7e3b6SBing Zhao 	 * If all the flows are already flushed in the device stop stage,
13188db7e3b6SBing Zhao 	 * then this will return directly without any action.
13198db7e3b6SBing Zhao 	 */
13208db7e3b6SBing Zhao 	mlx5_flow_list_flush(dev, &priv->flows, true);
1321d7cfcdddSAndrey Vesnovaty 	mlx5_shared_action_flush(dev);
132202e76468SSuanming Mou 	mlx5_flow_meter_flush(dev, NULL);
13232e22920bSAdrien Mazarguil 	/* Prevent crashes when queues are still in use. */
13242e22920bSAdrien Mazarguil 	dev->rx_pkt_burst = removed_rx_burst;
13252e22920bSAdrien Mazarguil 	dev->tx_pkt_burst = removed_tx_burst;
13262aac5b5dSYongseok Koh 	rte_wmb();
13272aac5b5dSYongseok Koh 	/* Disable datapath on secondary process. */
13282e86c4e5SOphir Munk 	mlx5_mp_os_req_stop_rxtx(dev);
13291c506404SBing Zhao 	/* Free the eCPRI flex parser resource. */
13301c506404SBing Zhao 	mlx5_flex_parser_ecpri_release(dev);
13312e22920bSAdrien Mazarguil 	if (priv->rxqs != NULL) {
13322e22920bSAdrien Mazarguil 		/* XXX race condition if mlx5_rx_burst() is still running. */
13332e22920bSAdrien Mazarguil 		usleep(1000);
1334a1366b1aSNélio Laranjeiro 		for (i = 0; (i != priv->rxqs_n); ++i)
1335af4f09f2SNélio Laranjeiro 			mlx5_rxq_release(dev, i);
13362e22920bSAdrien Mazarguil 		priv->rxqs_n = 0;
13372e22920bSAdrien Mazarguil 		priv->rxqs = NULL;
13382e22920bSAdrien Mazarguil 	}
13392e22920bSAdrien Mazarguil 	if (priv->txqs != NULL) {
13402e22920bSAdrien Mazarguil 		/* XXX race condition if mlx5_tx_burst() is still running. */
13412e22920bSAdrien Mazarguil 		usleep(1000);
13426e78005aSNélio Laranjeiro 		for (i = 0; (i != priv->txqs_n); ++i)
1343af4f09f2SNélio Laranjeiro 			mlx5_txq_release(dev, i);
13442e22920bSAdrien Mazarguil 		priv->txqs_n = 0;
13452e22920bSAdrien Mazarguil 		priv->txqs = NULL;
13462e22920bSAdrien Mazarguil 	}
1347120dc4a7SYongseok Koh 	mlx5_proc_priv_uninit(dev);
134865b3cd0dSSuanming Mou 	if (priv->drop_queue.hrxq)
134965b3cd0dSSuanming Mou 		mlx5_drop_action_destroy(dev);
1350dd3c774fSViacheslav Ovsiienko 	if (priv->mreg_cp_tbl)
1351e69a5922SXueming Li 		mlx5_hlist_destroy(priv->mreg_cp_tbl);
13527d6bf6b8SYongseok Koh 	mlx5_mprq_free_mp(dev);
13532eb4d010SOphir Munk 	mlx5_os_free_shared_dr(priv);
135429c1d8bbSNélio Laranjeiro 	if (priv->rss_conf.rss_key != NULL)
135583c2047cSSuanming Mou 		mlx5_free(priv->rss_conf.rss_key);
1356634efbc2SNelio Laranjeiro 	if (priv->reta_idx != NULL)
135783c2047cSSuanming Mou 		mlx5_free(priv->reta_idx);
1358ccdcba53SNélio Laranjeiro 	if (priv->config.vf)
1359f00f6562SOphir Munk 		mlx5_os_mac_addr_flush(dev);
136026c08b97SAdrien Mazarguil 	if (priv->nl_socket_route >= 0)
136126c08b97SAdrien Mazarguil 		close(priv->nl_socket_route);
136226c08b97SAdrien Mazarguil 	if (priv->nl_socket_rdma >= 0)
136326c08b97SAdrien Mazarguil 		close(priv->nl_socket_rdma);
1364dfedf3e3SViacheslav Ovsiienko 	if (priv->vmwa_context)
1365dfedf3e3SViacheslav Ovsiienko 		mlx5_vlan_vmwa_exit(priv->vmwa_context);
136623820a79SDekel Peled 	ret = mlx5_hrxq_verify(dev);
1367f5479b68SNélio Laranjeiro 	if (ret)
1368a170a30dSNélio Laranjeiro 		DRV_LOG(WARNING, "port %u some hash Rx queue still remain",
13690f99970bSNélio Laranjeiro 			dev->data->port_id);
137015c80a12SDekel Peled 	ret = mlx5_ind_table_obj_verify(dev);
13714c7a0f5fSNélio Laranjeiro 	if (ret)
1372a170a30dSNélio Laranjeiro 		DRV_LOG(WARNING, "port %u some indirection table still remain",
13730f99970bSNélio Laranjeiro 			dev->data->port_id);
137493403560SDekel Peled 	ret = mlx5_rxq_obj_verify(dev);
137509cb5b58SNélio Laranjeiro 	if (ret)
137693403560SDekel Peled 		DRV_LOG(WARNING, "port %u some Rx queue objects still remain",
13770f99970bSNélio Laranjeiro 			dev->data->port_id);
1378af4f09f2SNélio Laranjeiro 	ret = mlx5_rxq_verify(dev);
1379a1366b1aSNélio Laranjeiro 	if (ret)
1380a170a30dSNélio Laranjeiro 		DRV_LOG(WARNING, "port %u some Rx queues still remain",
13810f99970bSNélio Laranjeiro 			dev->data->port_id);
1382894c4a8eSOri Kam 	ret = mlx5_txq_obj_verify(dev);
1383faf2667fSNélio Laranjeiro 	if (ret)
1384a170a30dSNélio Laranjeiro 		DRV_LOG(WARNING, "port %u some Verbs Tx queue still remain",
13850f99970bSNélio Laranjeiro 			dev->data->port_id);
1386af4f09f2SNélio Laranjeiro 	ret = mlx5_txq_verify(dev);
13876e78005aSNélio Laranjeiro 	if (ret)
1388a170a30dSNélio Laranjeiro 		DRV_LOG(WARNING, "port %u some Tx queues still remain",
13890f99970bSNélio Laranjeiro 			dev->data->port_id);
1390af4f09f2SNélio Laranjeiro 	ret = mlx5_flow_verify(dev);
13916af6b973SNélio Laranjeiro 	if (ret)
1392a170a30dSNélio Laranjeiro 		DRV_LOG(WARNING, "port %u some flows still remain",
1393a170a30dSNélio Laranjeiro 			dev->data->port_id);
1394e1592b6cSSuanming Mou 	mlx5_cache_list_destroy(&priv->hrxqs);
1395772dc0ebSSuanming Mou 	/*
1396772dc0ebSSuanming Mou 	 * Free the shared context in last turn, because the cleanup
1397772dc0ebSSuanming Mou 	 * routines above may use some shared fields, like
1398f00f6562SOphir Munk 	 * mlx5_os_mac_addr_flush() uses ibdev_path for retrieveing
1399772dc0ebSSuanming Mou 	 * ifindex if Netlink fails.
1400772dc0ebSSuanming Mou 	 */
140191389890SOphir Munk 	mlx5_free_shared_dev_ctx(priv->sh);
14022b730263SAdrien Mazarguil 	if (priv->domain_id != RTE_ETH_DEV_SWITCH_DOMAIN_ID_INVALID) {
14032b730263SAdrien Mazarguil 		unsigned int c = 0;
1404d874a4eeSThomas Monjalon 		uint16_t port_id;
14052b730263SAdrien Mazarguil 
1406fbc83412SViacheslav Ovsiienko 		MLX5_ETH_FOREACH_DEV(port_id, priv->pci_dev) {
1407dbeba4cfSThomas Monjalon 			struct mlx5_priv *opriv =
1408d874a4eeSThomas Monjalon 				rte_eth_devices[port_id].data->dev_private;
14092b730263SAdrien Mazarguil 
14102b730263SAdrien Mazarguil 			if (!opriv ||
14112b730263SAdrien Mazarguil 			    opriv->domain_id != priv->domain_id ||
1412d874a4eeSThomas Monjalon 			    &rte_eth_devices[port_id] == dev)
14132b730263SAdrien Mazarguil 				continue;
14142b730263SAdrien Mazarguil 			++c;
1415f7e95215SViacheslav Ovsiienko 			break;
14162b730263SAdrien Mazarguil 		}
14172b730263SAdrien Mazarguil 		if (!c)
14182b730263SAdrien Mazarguil 			claim_zero(rte_eth_switch_domain_free(priv->domain_id));
14192b730263SAdrien Mazarguil 	}
1420771fa900SAdrien Mazarguil 	memset(priv, 0, sizeof(*priv));
14212b730263SAdrien Mazarguil 	priv->domain_id = RTE_ETH_DEV_SWITCH_DOMAIN_ID_INVALID;
142242603bbdSOphir Munk 	/*
142342603bbdSOphir Munk 	 * Reset mac_addrs to NULL such that it is not freed as part of
142442603bbdSOphir Munk 	 * rte_eth_dev_release_port(). mac_addrs is part of dev_private so
142542603bbdSOphir Munk 	 * it is freed when dev_private is freed.
142642603bbdSOphir Munk 	 */
142742603bbdSOphir Munk 	dev->data->mac_addrs = NULL;
1428b142387bSThomas Monjalon 	return 0;
1429771fa900SAdrien Mazarguil }
1430771fa900SAdrien Mazarguil 
1431e72dd09bSNélio Laranjeiro /**
1432e72dd09bSNélio Laranjeiro  * Verify and store value for device argument.
1433e72dd09bSNélio Laranjeiro  *
1434e72dd09bSNélio Laranjeiro  * @param[in] key
1435e72dd09bSNélio Laranjeiro  *   Key argument to verify.
1436e72dd09bSNélio Laranjeiro  * @param[in] val
1437e72dd09bSNélio Laranjeiro  *   Value associated with key.
1438e72dd09bSNélio Laranjeiro  * @param opaque
1439e72dd09bSNélio Laranjeiro  *   User data.
1440e72dd09bSNélio Laranjeiro  *
1441e72dd09bSNélio Laranjeiro  * @return
1442a6d83b6aSNélio Laranjeiro  *   0 on success, a negative errno value otherwise and rte_errno is set.
1443e72dd09bSNélio Laranjeiro  */
1444e72dd09bSNélio Laranjeiro static int
1445e72dd09bSNélio Laranjeiro mlx5_args_check(const char *key, const char *val, void *opaque)
1446e72dd09bSNélio Laranjeiro {
14477fe24446SShahaf Shuler 	struct mlx5_dev_config *config = opaque;
14488f848f32SViacheslav Ovsiienko 	unsigned long mod;
14498f848f32SViacheslav Ovsiienko 	signed long tmp;
1450e72dd09bSNélio Laranjeiro 
14516de569f5SAdrien Mazarguil 	/* No-op, port representors are processed in mlx5_dev_spawn(). */
14526de569f5SAdrien Mazarguil 	if (!strcmp(MLX5_REPRESENTOR, key))
14536de569f5SAdrien Mazarguil 		return 0;
145499c12dccSNélio Laranjeiro 	errno = 0;
14558f848f32SViacheslav Ovsiienko 	tmp = strtol(val, NULL, 0);
145699c12dccSNélio Laranjeiro 	if (errno) {
1457a6d83b6aSNélio Laranjeiro 		rte_errno = errno;
1458a170a30dSNélio Laranjeiro 		DRV_LOG(WARNING, "%s: \"%s\" is not a valid integer", key, val);
1459a6d83b6aSNélio Laranjeiro 		return -rte_errno;
146099c12dccSNélio Laranjeiro 	}
14618f848f32SViacheslav Ovsiienko 	if (tmp < 0 && strcmp(MLX5_TX_PP, key) && strcmp(MLX5_TX_SKEW, key)) {
14628f848f32SViacheslav Ovsiienko 		/* Negative values are acceptable for some keys only. */
14638f848f32SViacheslav Ovsiienko 		rte_errno = EINVAL;
14648f848f32SViacheslav Ovsiienko 		DRV_LOG(WARNING, "%s: invalid negative value \"%s\"", key, val);
14658f848f32SViacheslav Ovsiienko 		return -rte_errno;
14668f848f32SViacheslav Ovsiienko 	}
14678f848f32SViacheslav Ovsiienko 	mod = tmp >= 0 ? tmp : -tmp;
146899c12dccSNélio Laranjeiro 	if (strcmp(MLX5_RXQ_CQE_COMP_EN, key) == 0) {
146954c2d46bSAlexander Kozyrev 		if (tmp > MLX5_CQE_RESP_FORMAT_L34H_STRIDX) {
147054c2d46bSAlexander Kozyrev 			DRV_LOG(ERR, "invalid CQE compression "
147154c2d46bSAlexander Kozyrev 				     "format parameter");
147254c2d46bSAlexander Kozyrev 			rte_errno = EINVAL;
147354c2d46bSAlexander Kozyrev 			return -rte_errno;
147454c2d46bSAlexander Kozyrev 		}
14757fe24446SShahaf Shuler 		config->cqe_comp = !!tmp;
147654c2d46bSAlexander Kozyrev 		config->cqe_comp_fmt = tmp;
1477bc91e8dbSYongseok Koh 	} else if (strcmp(MLX5_RXQ_CQE_PAD_EN, key) == 0) {
1478bc91e8dbSYongseok Koh 		config->cqe_pad = !!tmp;
147978c7a16dSYongseok Koh 	} else if (strcmp(MLX5_RXQ_PKT_PAD_EN, key) == 0) {
148078c7a16dSYongseok Koh 		config->hw_padding = !!tmp;
14817d6bf6b8SYongseok Koh 	} else if (strcmp(MLX5_RX_MPRQ_EN, key) == 0) {
14827d6bf6b8SYongseok Koh 		config->mprq.enabled = !!tmp;
14837d6bf6b8SYongseok Koh 	} else if (strcmp(MLX5_RX_MPRQ_LOG_STRIDE_NUM, key) == 0) {
14847d6bf6b8SYongseok Koh 		config->mprq.stride_num_n = tmp;
1485ecb16045SAlexander Kozyrev 	} else if (strcmp(MLX5_RX_MPRQ_LOG_STRIDE_SIZE, key) == 0) {
1486ecb16045SAlexander Kozyrev 		config->mprq.stride_size_n = tmp;
14877d6bf6b8SYongseok Koh 	} else if (strcmp(MLX5_RX_MPRQ_MAX_MEMCPY_LEN, key) == 0) {
14887d6bf6b8SYongseok Koh 		config->mprq.max_memcpy_len = tmp;
14897d6bf6b8SYongseok Koh 	} else if (strcmp(MLX5_RXQS_MIN_MPRQ, key) == 0) {
14907d6bf6b8SYongseok Koh 		config->mprq.min_rxqs_num = tmp;
14912a66cf37SYaacov Hazan 	} else if (strcmp(MLX5_TXQ_INLINE, key) == 0) {
1492505f1fe4SViacheslav Ovsiienko 		DRV_LOG(WARNING, "%s: deprecated parameter,"
1493505f1fe4SViacheslav Ovsiienko 				 " converted to txq_inline_max", key);
1494505f1fe4SViacheslav Ovsiienko 		config->txq_inline_max = tmp;
1495505f1fe4SViacheslav Ovsiienko 	} else if (strcmp(MLX5_TXQ_INLINE_MAX, key) == 0) {
1496505f1fe4SViacheslav Ovsiienko 		config->txq_inline_max = tmp;
1497505f1fe4SViacheslav Ovsiienko 	} else if (strcmp(MLX5_TXQ_INLINE_MIN, key) == 0) {
1498505f1fe4SViacheslav Ovsiienko 		config->txq_inline_min = tmp;
1499505f1fe4SViacheslav Ovsiienko 	} else if (strcmp(MLX5_TXQ_INLINE_MPW, key) == 0) {
1500505f1fe4SViacheslav Ovsiienko 		config->txq_inline_mpw = tmp;
15012a66cf37SYaacov Hazan 	} else if (strcmp(MLX5_TXQS_MIN_INLINE, key) == 0) {
15027fe24446SShahaf Shuler 		config->txqs_inline = tmp;
150309d8b416SYongseok Koh 	} else if (strcmp(MLX5_TXQS_MAX_VEC, key) == 0) {
1504a6bd4911SViacheslav Ovsiienko 		DRV_LOG(WARNING, "%s: deprecated parameter, ignored", key);
1505230189d9SNélio Laranjeiro 	} else if (strcmp(MLX5_TXQ_MPW_EN, key) == 0) {
1506f9de8718SShahaf Shuler 		config->mps = !!tmp;
15078409a285SViacheslav Ovsiienko 	} else if (strcmp(MLX5_TX_DB_NC, key) == 0) {
1508f078ceb6SViacheslav Ovsiienko 		if (tmp != MLX5_TXDB_CACHED &&
1509f078ceb6SViacheslav Ovsiienko 		    tmp != MLX5_TXDB_NCACHED &&
1510f078ceb6SViacheslav Ovsiienko 		    tmp != MLX5_TXDB_HEURISTIC) {
1511f078ceb6SViacheslav Ovsiienko 			DRV_LOG(ERR, "invalid Tx doorbell "
1512f078ceb6SViacheslav Ovsiienko 				     "mapping parameter");
1513f078ceb6SViacheslav Ovsiienko 			rte_errno = EINVAL;
1514f078ceb6SViacheslav Ovsiienko 			return -rte_errno;
1515f078ceb6SViacheslav Ovsiienko 		}
1516f078ceb6SViacheslav Ovsiienko 		config->dbnc = tmp;
15176ce84bd8SYongseok Koh 	} else if (strcmp(MLX5_TXQ_MPW_HDR_DSEG_EN, key) == 0) {
1518a6bd4911SViacheslav Ovsiienko 		DRV_LOG(WARNING, "%s: deprecated parameter, ignored", key);
15196ce84bd8SYongseok Koh 	} else if (strcmp(MLX5_TXQ_MAX_INLINE_LEN, key) == 0) {
1520505f1fe4SViacheslav Ovsiienko 		DRV_LOG(WARNING, "%s: deprecated parameter,"
1521505f1fe4SViacheslav Ovsiienko 				 " converted to txq_inline_mpw", key);
1522505f1fe4SViacheslav Ovsiienko 		config->txq_inline_mpw = tmp;
15235644d5b9SNelio Laranjeiro 	} else if (strcmp(MLX5_TX_VEC_EN, key) == 0) {
1524a6bd4911SViacheslav Ovsiienko 		DRV_LOG(WARNING, "%s: deprecated parameter, ignored", key);
15258f848f32SViacheslav Ovsiienko 	} else if (strcmp(MLX5_TX_PP, key) == 0) {
15268f848f32SViacheslav Ovsiienko 		if (!mod) {
15278f848f32SViacheslav Ovsiienko 			DRV_LOG(ERR, "Zero Tx packet pacing parameter");
15288f848f32SViacheslav Ovsiienko 			rte_errno = EINVAL;
15298f848f32SViacheslav Ovsiienko 			return -rte_errno;
15308f848f32SViacheslav Ovsiienko 		}
15318f848f32SViacheslav Ovsiienko 		config->tx_pp = tmp;
15328f848f32SViacheslav Ovsiienko 	} else if (strcmp(MLX5_TX_SKEW, key) == 0) {
15338f848f32SViacheslav Ovsiienko 		config->tx_skew = tmp;
15345644d5b9SNelio Laranjeiro 	} else if (strcmp(MLX5_RX_VEC_EN, key) == 0) {
15357fe24446SShahaf Shuler 		config->rx_vec_en = !!tmp;
153678a54648SXueming Li 	} else if (strcmp(MLX5_L3_VXLAN_EN, key) == 0) {
153778a54648SXueming Li 		config->l3_vxlan_en = !!tmp;
1538db209cc3SNélio Laranjeiro 	} else if (strcmp(MLX5_VF_NL_EN, key) == 0) {
1539db209cc3SNélio Laranjeiro 		config->vf_nl_en = !!tmp;
1540e2b4925eSOri Kam 	} else if (strcmp(MLX5_DV_ESW_EN, key) == 0) {
1541e2b4925eSOri Kam 		config->dv_esw_en = !!tmp;
154251e72d38SOri Kam 	} else if (strcmp(MLX5_DV_FLOW_EN, key) == 0) {
154351e72d38SOri Kam 		config->dv_flow_en = !!tmp;
15442d241515SViacheslav Ovsiienko 	} else if (strcmp(MLX5_DV_XMETA_EN, key) == 0) {
15452d241515SViacheslav Ovsiienko 		if (tmp != MLX5_XMETA_MODE_LEGACY &&
15462d241515SViacheslav Ovsiienko 		    tmp != MLX5_XMETA_MODE_META16 &&
15474ec6360dSGregory Etelson 		    tmp != MLX5_XMETA_MODE_META32 &&
15484ec6360dSGregory Etelson 		    tmp != MLX5_XMETA_MODE_MISS_INFO) {
1549f078ceb6SViacheslav Ovsiienko 			DRV_LOG(ERR, "invalid extensive "
15502d241515SViacheslav Ovsiienko 				     "metadata parameter");
15512d241515SViacheslav Ovsiienko 			rte_errno = EINVAL;
15522d241515SViacheslav Ovsiienko 			return -rte_errno;
15532d241515SViacheslav Ovsiienko 		}
15544ec6360dSGregory Etelson 		if (tmp != MLX5_XMETA_MODE_MISS_INFO)
15552d241515SViacheslav Ovsiienko 			config->dv_xmeta_en = tmp;
15564ec6360dSGregory Etelson 		else
15574ec6360dSGregory Etelson 			config->dv_miss_info = 1;
15580f0ae73aSShiri Kuzin 	} else if (strcmp(MLX5_LACP_BY_USER, key) == 0) {
15590f0ae73aSShiri Kuzin 		config->lacp_by_user = !!tmp;
1560dceb5029SYongseok Koh 	} else if (strcmp(MLX5_MR_EXT_MEMSEG_EN, key) == 0) {
1561dceb5029SYongseok Koh 		config->mr_ext_memseg_en = !!tmp;
1562066cfecdSMatan Azrad 	} else if (strcmp(MLX5_MAX_DUMP_FILES_NUM, key) == 0) {
1563066cfecdSMatan Azrad 		config->max_dump_files_num = tmp;
156421bb6c7eSDekel Peled 	} else if (strcmp(MLX5_LRO_TIMEOUT_USEC, key) == 0) {
156521bb6c7eSDekel Peled 		config->lro.timeout = tmp;
1566d768f324SMatan Azrad 	} else if (strcmp(MLX5_CLASS_ARG_NAME, key) == 0) {
1567d768f324SMatan Azrad 		DRV_LOG(DEBUG, "class argument is %s.", val);
15681ad9a3d0SBing Zhao 	} else if (strcmp(MLX5_HP_BUF_SIZE, key) == 0) {
15691ad9a3d0SBing Zhao 		config->log_hp_size = tmp;
1570a1da6f62SSuanming Mou 	} else if (strcmp(MLX5_RECLAIM_MEM, key) == 0) {
1571a1da6f62SSuanming Mou 		if (tmp != MLX5_RCM_NONE &&
1572a1da6f62SSuanming Mou 		    tmp != MLX5_RCM_LIGHT &&
1573a1da6f62SSuanming Mou 		    tmp != MLX5_RCM_AGGR) {
1574a1da6f62SSuanming Mou 			DRV_LOG(ERR, "Unrecognize %s: \"%s\"", key, val);
1575a1da6f62SSuanming Mou 			rte_errno = EINVAL;
1576a1da6f62SSuanming Mou 			return -rte_errno;
1577a1da6f62SSuanming Mou 		}
1578a1da6f62SSuanming Mou 		config->reclaim_mode = tmp;
15795522da6bSSuanming Mou 	} else if (strcmp(MLX5_SYS_MEM_EN, key) == 0) {
15805522da6bSSuanming Mou 		config->sys_mem_en = !!tmp;
158150f95b23SSuanming Mou 	} else if (strcmp(MLX5_DECAP_EN, key) == 0) {
158250f95b23SSuanming Mou 		config->decap_en = !!tmp;
158399c12dccSNélio Laranjeiro 	} else {
1584a170a30dSNélio Laranjeiro 		DRV_LOG(WARNING, "%s: unknown parameter", key);
1585a6d83b6aSNélio Laranjeiro 		rte_errno = EINVAL;
1586a6d83b6aSNélio Laranjeiro 		return -rte_errno;
1587e72dd09bSNélio Laranjeiro 	}
158899c12dccSNélio Laranjeiro 	return 0;
158999c12dccSNélio Laranjeiro }
1590e72dd09bSNélio Laranjeiro 
1591e72dd09bSNélio Laranjeiro /**
1592e72dd09bSNélio Laranjeiro  * Parse device parameters.
1593e72dd09bSNélio Laranjeiro  *
15947fe24446SShahaf Shuler  * @param config
15957fe24446SShahaf Shuler  *   Pointer to device configuration structure.
1596e72dd09bSNélio Laranjeiro  * @param devargs
1597e72dd09bSNélio Laranjeiro  *   Device arguments structure.
1598e72dd09bSNélio Laranjeiro  *
1599e72dd09bSNélio Laranjeiro  * @return
1600a6d83b6aSNélio Laranjeiro  *   0 on success, a negative errno value otherwise and rte_errno is set.
1601e72dd09bSNélio Laranjeiro  */
16022eb4d010SOphir Munk int
16037fe24446SShahaf Shuler mlx5_args(struct mlx5_dev_config *config, struct rte_devargs *devargs)
1604e72dd09bSNélio Laranjeiro {
1605e72dd09bSNélio Laranjeiro 	const char **params = (const char *[]){
160699c12dccSNélio Laranjeiro 		MLX5_RXQ_CQE_COMP_EN,
1607bc91e8dbSYongseok Koh 		MLX5_RXQ_CQE_PAD_EN,
160878c7a16dSYongseok Koh 		MLX5_RXQ_PKT_PAD_EN,
16097d6bf6b8SYongseok Koh 		MLX5_RX_MPRQ_EN,
16107d6bf6b8SYongseok Koh 		MLX5_RX_MPRQ_LOG_STRIDE_NUM,
1611ecb16045SAlexander Kozyrev 		MLX5_RX_MPRQ_LOG_STRIDE_SIZE,
16127d6bf6b8SYongseok Koh 		MLX5_RX_MPRQ_MAX_MEMCPY_LEN,
16137d6bf6b8SYongseok Koh 		MLX5_RXQS_MIN_MPRQ,
16142a66cf37SYaacov Hazan 		MLX5_TXQ_INLINE,
1615505f1fe4SViacheslav Ovsiienko 		MLX5_TXQ_INLINE_MIN,
1616505f1fe4SViacheslav Ovsiienko 		MLX5_TXQ_INLINE_MAX,
1617505f1fe4SViacheslav Ovsiienko 		MLX5_TXQ_INLINE_MPW,
16182a66cf37SYaacov Hazan 		MLX5_TXQS_MIN_INLINE,
161909d8b416SYongseok Koh 		MLX5_TXQS_MAX_VEC,
1620230189d9SNélio Laranjeiro 		MLX5_TXQ_MPW_EN,
16216ce84bd8SYongseok Koh 		MLX5_TXQ_MPW_HDR_DSEG_EN,
16226ce84bd8SYongseok Koh 		MLX5_TXQ_MAX_INLINE_LEN,
16238409a285SViacheslav Ovsiienko 		MLX5_TX_DB_NC,
16248f848f32SViacheslav Ovsiienko 		MLX5_TX_PP,
16258f848f32SViacheslav Ovsiienko 		MLX5_TX_SKEW,
16265644d5b9SNelio Laranjeiro 		MLX5_TX_VEC_EN,
16275644d5b9SNelio Laranjeiro 		MLX5_RX_VEC_EN,
162878a54648SXueming Li 		MLX5_L3_VXLAN_EN,
1629db209cc3SNélio Laranjeiro 		MLX5_VF_NL_EN,
1630e2b4925eSOri Kam 		MLX5_DV_ESW_EN,
163151e72d38SOri Kam 		MLX5_DV_FLOW_EN,
16322d241515SViacheslav Ovsiienko 		MLX5_DV_XMETA_EN,
16330f0ae73aSShiri Kuzin 		MLX5_LACP_BY_USER,
1634dceb5029SYongseok Koh 		MLX5_MR_EXT_MEMSEG_EN,
16356de569f5SAdrien Mazarguil 		MLX5_REPRESENTOR,
1636066cfecdSMatan Azrad 		MLX5_MAX_DUMP_FILES_NUM,
163721bb6c7eSDekel Peled 		MLX5_LRO_TIMEOUT_USEC,
1638d768f324SMatan Azrad 		MLX5_CLASS_ARG_NAME,
16391ad9a3d0SBing Zhao 		MLX5_HP_BUF_SIZE,
1640a1da6f62SSuanming Mou 		MLX5_RECLAIM_MEM,
16415522da6bSSuanming Mou 		MLX5_SYS_MEM_EN,
164250f95b23SSuanming Mou 		MLX5_DECAP_EN,
1643e72dd09bSNélio Laranjeiro 		NULL,
1644e72dd09bSNélio Laranjeiro 	};
1645e72dd09bSNélio Laranjeiro 	struct rte_kvargs *kvlist;
1646e72dd09bSNélio Laranjeiro 	int ret = 0;
1647e72dd09bSNélio Laranjeiro 	int i;
1648e72dd09bSNélio Laranjeiro 
1649e72dd09bSNélio Laranjeiro 	if (devargs == NULL)
1650e72dd09bSNélio Laranjeiro 		return 0;
1651e72dd09bSNélio Laranjeiro 	/* Following UGLY cast is done to pass checkpatch. */
1652e72dd09bSNélio Laranjeiro 	kvlist = rte_kvargs_parse(devargs->args, params);
165315b0ea00SMatan Azrad 	if (kvlist == NULL) {
165415b0ea00SMatan Azrad 		rte_errno = EINVAL;
165515b0ea00SMatan Azrad 		return -rte_errno;
165615b0ea00SMatan Azrad 	}
1657e72dd09bSNélio Laranjeiro 	/* Process parameters. */
1658e72dd09bSNélio Laranjeiro 	for (i = 0; (params[i] != NULL); ++i) {
1659e72dd09bSNélio Laranjeiro 		if (rte_kvargs_count(kvlist, params[i])) {
1660e72dd09bSNélio Laranjeiro 			ret = rte_kvargs_process(kvlist, params[i],
16617fe24446SShahaf Shuler 						 mlx5_args_check, config);
1662a6d83b6aSNélio Laranjeiro 			if (ret) {
1663a6d83b6aSNélio Laranjeiro 				rte_errno = EINVAL;
1664a67323e4SShahaf Shuler 				rte_kvargs_free(kvlist);
1665a6d83b6aSNélio Laranjeiro 				return -rte_errno;
1666e72dd09bSNélio Laranjeiro 			}
1667e72dd09bSNélio Laranjeiro 		}
1668a67323e4SShahaf Shuler 	}
1669e72dd09bSNélio Laranjeiro 	rte_kvargs_free(kvlist);
1670e72dd09bSNélio Laranjeiro 	return 0;
1671e72dd09bSNélio Laranjeiro }
1672e72dd09bSNélio Laranjeiro 
16737be600c8SYongseok Koh /**
167438b4b397SViacheslav Ovsiienko  * Configures the minimal amount of data to inline into WQE
167538b4b397SViacheslav Ovsiienko  * while sending packets.
167638b4b397SViacheslav Ovsiienko  *
167738b4b397SViacheslav Ovsiienko  * - the txq_inline_min has the maximal priority, if this
167838b4b397SViacheslav Ovsiienko  *   key is specified in devargs
167938b4b397SViacheslav Ovsiienko  * - if DevX is enabled the inline mode is queried from the
168038b4b397SViacheslav Ovsiienko  *   device (HCA attributes and NIC vport context if needed).
1681ee76bddcSThomas Monjalon  * - otherwise L2 mode (18 bytes) is assumed for ConnectX-4/4 Lx
168238b4b397SViacheslav Ovsiienko  *   and none (0 bytes) for other NICs
168338b4b397SViacheslav Ovsiienko  *
168438b4b397SViacheslav Ovsiienko  * @param spawn
168538b4b397SViacheslav Ovsiienko  *   Verbs device parameters (name, port, switch_info) to spawn.
168638b4b397SViacheslav Ovsiienko  * @param config
168738b4b397SViacheslav Ovsiienko  *   Device configuration parameters.
168838b4b397SViacheslav Ovsiienko  */
16892eb4d010SOphir Munk void
169038b4b397SViacheslav Ovsiienko mlx5_set_min_inline(struct mlx5_dev_spawn_data *spawn,
169138b4b397SViacheslav Ovsiienko 		    struct mlx5_dev_config *config)
169238b4b397SViacheslav Ovsiienko {
169338b4b397SViacheslav Ovsiienko 	if (config->txq_inline_min != MLX5_ARG_UNSET) {
169438b4b397SViacheslav Ovsiienko 		/* Application defines size of inlined data explicitly. */
169538b4b397SViacheslav Ovsiienko 		switch (spawn->pci_dev->id.device_id) {
169638b4b397SViacheslav Ovsiienko 		case PCI_DEVICE_ID_MELLANOX_CONNECTX4:
169738b4b397SViacheslav Ovsiienko 		case PCI_DEVICE_ID_MELLANOX_CONNECTX4VF:
169838b4b397SViacheslav Ovsiienko 			if (config->txq_inline_min <
169938b4b397SViacheslav Ovsiienko 				       (int)MLX5_INLINE_HSIZE_L2) {
170038b4b397SViacheslav Ovsiienko 				DRV_LOG(DEBUG,
170138b4b397SViacheslav Ovsiienko 					"txq_inline_mix aligned to minimal"
170238b4b397SViacheslav Ovsiienko 					" ConnectX-4 required value %d",
170338b4b397SViacheslav Ovsiienko 					(int)MLX5_INLINE_HSIZE_L2);
170438b4b397SViacheslav Ovsiienko 				config->txq_inline_min = MLX5_INLINE_HSIZE_L2;
170538b4b397SViacheslav Ovsiienko 			}
170638b4b397SViacheslav Ovsiienko 			break;
170738b4b397SViacheslav Ovsiienko 		}
170838b4b397SViacheslav Ovsiienko 		goto exit;
170938b4b397SViacheslav Ovsiienko 	}
171038b4b397SViacheslav Ovsiienko 	if (config->hca_attr.eth_net_offloads) {
171138b4b397SViacheslav Ovsiienko 		/* We have DevX enabled, inline mode queried successfully. */
171238b4b397SViacheslav Ovsiienko 		switch (config->hca_attr.wqe_inline_mode) {
171338b4b397SViacheslav Ovsiienko 		case MLX5_CAP_INLINE_MODE_L2:
171438b4b397SViacheslav Ovsiienko 			/* outer L2 header must be inlined. */
171538b4b397SViacheslav Ovsiienko 			config->txq_inline_min = MLX5_INLINE_HSIZE_L2;
171638b4b397SViacheslav Ovsiienko 			goto exit;
171738b4b397SViacheslav Ovsiienko 		case MLX5_CAP_INLINE_MODE_NOT_REQUIRED:
171838b4b397SViacheslav Ovsiienko 			/* No inline data are required by NIC. */
171938b4b397SViacheslav Ovsiienko 			config->txq_inline_min = MLX5_INLINE_HSIZE_NONE;
172038b4b397SViacheslav Ovsiienko 			config->hw_vlan_insert =
172138b4b397SViacheslav Ovsiienko 				config->hca_attr.wqe_vlan_insert;
172238b4b397SViacheslav Ovsiienko 			DRV_LOG(DEBUG, "Tx VLAN insertion is supported");
172338b4b397SViacheslav Ovsiienko 			goto exit;
172438b4b397SViacheslav Ovsiienko 		case MLX5_CAP_INLINE_MODE_VPORT_CONTEXT:
172538b4b397SViacheslav Ovsiienko 			/* inline mode is defined by NIC vport context. */
172638b4b397SViacheslav Ovsiienko 			if (!config->hca_attr.eth_virt)
172738b4b397SViacheslav Ovsiienko 				break;
172838b4b397SViacheslav Ovsiienko 			switch (config->hca_attr.vport_inline_mode) {
172938b4b397SViacheslav Ovsiienko 			case MLX5_INLINE_MODE_NONE:
173038b4b397SViacheslav Ovsiienko 				config->txq_inline_min =
173138b4b397SViacheslav Ovsiienko 					MLX5_INLINE_HSIZE_NONE;
173238b4b397SViacheslav Ovsiienko 				goto exit;
173338b4b397SViacheslav Ovsiienko 			case MLX5_INLINE_MODE_L2:
173438b4b397SViacheslav Ovsiienko 				config->txq_inline_min =
173538b4b397SViacheslav Ovsiienko 					MLX5_INLINE_HSIZE_L2;
173638b4b397SViacheslav Ovsiienko 				goto exit;
173738b4b397SViacheslav Ovsiienko 			case MLX5_INLINE_MODE_IP:
173838b4b397SViacheslav Ovsiienko 				config->txq_inline_min =
173938b4b397SViacheslav Ovsiienko 					MLX5_INLINE_HSIZE_L3;
174038b4b397SViacheslav Ovsiienko 				goto exit;
174138b4b397SViacheslav Ovsiienko 			case MLX5_INLINE_MODE_TCP_UDP:
174238b4b397SViacheslav Ovsiienko 				config->txq_inline_min =
174338b4b397SViacheslav Ovsiienko 					MLX5_INLINE_HSIZE_L4;
174438b4b397SViacheslav Ovsiienko 				goto exit;
174538b4b397SViacheslav Ovsiienko 			case MLX5_INLINE_MODE_INNER_L2:
174638b4b397SViacheslav Ovsiienko 				config->txq_inline_min =
174738b4b397SViacheslav Ovsiienko 					MLX5_INLINE_HSIZE_INNER_L2;
174838b4b397SViacheslav Ovsiienko 				goto exit;
174938b4b397SViacheslav Ovsiienko 			case MLX5_INLINE_MODE_INNER_IP:
175038b4b397SViacheslav Ovsiienko 				config->txq_inline_min =
175138b4b397SViacheslav Ovsiienko 					MLX5_INLINE_HSIZE_INNER_L3;
175238b4b397SViacheslav Ovsiienko 				goto exit;
175338b4b397SViacheslav Ovsiienko 			case MLX5_INLINE_MODE_INNER_TCP_UDP:
175438b4b397SViacheslav Ovsiienko 				config->txq_inline_min =
175538b4b397SViacheslav Ovsiienko 					MLX5_INLINE_HSIZE_INNER_L4;
175638b4b397SViacheslav Ovsiienko 				goto exit;
175738b4b397SViacheslav Ovsiienko 			}
175838b4b397SViacheslav Ovsiienko 		}
175938b4b397SViacheslav Ovsiienko 	}
176038b4b397SViacheslav Ovsiienko 	/*
176138b4b397SViacheslav Ovsiienko 	 * We get here if we are unable to deduce
176238b4b397SViacheslav Ovsiienko 	 * inline data size with DevX. Try PCI ID
176338b4b397SViacheslav Ovsiienko 	 * to determine old NICs.
176438b4b397SViacheslav Ovsiienko 	 */
176538b4b397SViacheslav Ovsiienko 	switch (spawn->pci_dev->id.device_id) {
176638b4b397SViacheslav Ovsiienko 	case PCI_DEVICE_ID_MELLANOX_CONNECTX4:
176738b4b397SViacheslav Ovsiienko 	case PCI_DEVICE_ID_MELLANOX_CONNECTX4VF:
176838b4b397SViacheslav Ovsiienko 	case PCI_DEVICE_ID_MELLANOX_CONNECTX4LX:
176938b4b397SViacheslav Ovsiienko 	case PCI_DEVICE_ID_MELLANOX_CONNECTX4LXVF:
1770614de6c8SViacheslav Ovsiienko 		config->txq_inline_min = MLX5_INLINE_HSIZE_L2;
177138b4b397SViacheslav Ovsiienko 		config->hw_vlan_insert = 0;
177238b4b397SViacheslav Ovsiienko 		break;
177338b4b397SViacheslav Ovsiienko 	case PCI_DEVICE_ID_MELLANOX_CONNECTX5:
177438b4b397SViacheslav Ovsiienko 	case PCI_DEVICE_ID_MELLANOX_CONNECTX5VF:
177538b4b397SViacheslav Ovsiienko 	case PCI_DEVICE_ID_MELLANOX_CONNECTX5EX:
177638b4b397SViacheslav Ovsiienko 	case PCI_DEVICE_ID_MELLANOX_CONNECTX5EXVF:
177738b4b397SViacheslav Ovsiienko 		/*
177838b4b397SViacheslav Ovsiienko 		 * These NICs support VLAN insertion from WQE and
177938b4b397SViacheslav Ovsiienko 		 * report the wqe_vlan_insert flag. But there is the bug
178038b4b397SViacheslav Ovsiienko 		 * and PFC control may be broken, so disable feature.
178138b4b397SViacheslav Ovsiienko 		 */
178238b4b397SViacheslav Ovsiienko 		config->hw_vlan_insert = 0;
178320215627SDavid Christensen 		config->txq_inline_min = MLX5_INLINE_HSIZE_NONE;
178438b4b397SViacheslav Ovsiienko 		break;
178538b4b397SViacheslav Ovsiienko 	default:
178638b4b397SViacheslav Ovsiienko 		config->txq_inline_min = MLX5_INLINE_HSIZE_NONE;
178738b4b397SViacheslav Ovsiienko 		break;
178838b4b397SViacheslav Ovsiienko 	}
178938b4b397SViacheslav Ovsiienko exit:
179038b4b397SViacheslav Ovsiienko 	DRV_LOG(DEBUG, "min tx inline configured: %d", config->txq_inline_min);
179138b4b397SViacheslav Ovsiienko }
179238b4b397SViacheslav Ovsiienko 
179338b4b397SViacheslav Ovsiienko /**
179439139371SViacheslav Ovsiienko  * Configures the metadata mask fields in the shared context.
179539139371SViacheslav Ovsiienko  *
179639139371SViacheslav Ovsiienko  * @param [in] dev
179739139371SViacheslav Ovsiienko  *   Pointer to Ethernet device.
179839139371SViacheslav Ovsiienko  */
17992eb4d010SOphir Munk void
180039139371SViacheslav Ovsiienko mlx5_set_metadata_mask(struct rte_eth_dev *dev)
180139139371SViacheslav Ovsiienko {
180239139371SViacheslav Ovsiienko 	struct mlx5_priv *priv = dev->data->dev_private;
18036e88bc42SOphir Munk 	struct mlx5_dev_ctx_shared *sh = priv->sh;
180439139371SViacheslav Ovsiienko 	uint32_t meta, mark, reg_c0;
180539139371SViacheslav Ovsiienko 
180639139371SViacheslav Ovsiienko 	reg_c0 = ~priv->vport_meta_mask;
180739139371SViacheslav Ovsiienko 	switch (priv->config.dv_xmeta_en) {
180839139371SViacheslav Ovsiienko 	case MLX5_XMETA_MODE_LEGACY:
180939139371SViacheslav Ovsiienko 		meta = UINT32_MAX;
181039139371SViacheslav Ovsiienko 		mark = MLX5_FLOW_MARK_MASK;
181139139371SViacheslav Ovsiienko 		break;
181239139371SViacheslav Ovsiienko 	case MLX5_XMETA_MODE_META16:
181339139371SViacheslav Ovsiienko 		meta = reg_c0 >> rte_bsf32(reg_c0);
181439139371SViacheslav Ovsiienko 		mark = MLX5_FLOW_MARK_MASK;
181539139371SViacheslav Ovsiienko 		break;
181639139371SViacheslav Ovsiienko 	case MLX5_XMETA_MODE_META32:
181739139371SViacheslav Ovsiienko 		meta = UINT32_MAX;
181839139371SViacheslav Ovsiienko 		mark = (reg_c0 >> rte_bsf32(reg_c0)) & MLX5_FLOW_MARK_MASK;
181939139371SViacheslav Ovsiienko 		break;
182039139371SViacheslav Ovsiienko 	default:
182139139371SViacheslav Ovsiienko 		meta = 0;
182239139371SViacheslav Ovsiienko 		mark = 0;
18238e46d4e1SAlexander Kozyrev 		MLX5_ASSERT(false);
182439139371SViacheslav Ovsiienko 		break;
182539139371SViacheslav Ovsiienko 	}
182639139371SViacheslav Ovsiienko 	if (sh->dv_mark_mask && sh->dv_mark_mask != mark)
182739139371SViacheslav Ovsiienko 		DRV_LOG(WARNING, "metadata MARK mask mismatche %08X:%08X",
182839139371SViacheslav Ovsiienko 				 sh->dv_mark_mask, mark);
182939139371SViacheslav Ovsiienko 	else
183039139371SViacheslav Ovsiienko 		sh->dv_mark_mask = mark;
183139139371SViacheslav Ovsiienko 	if (sh->dv_meta_mask && sh->dv_meta_mask != meta)
183239139371SViacheslav Ovsiienko 		DRV_LOG(WARNING, "metadata META mask mismatche %08X:%08X",
183339139371SViacheslav Ovsiienko 				 sh->dv_meta_mask, meta);
183439139371SViacheslav Ovsiienko 	else
183539139371SViacheslav Ovsiienko 		sh->dv_meta_mask = meta;
183639139371SViacheslav Ovsiienko 	if (sh->dv_regc0_mask && sh->dv_regc0_mask != reg_c0)
183739139371SViacheslav Ovsiienko 		DRV_LOG(WARNING, "metadata reg_c0 mask mismatche %08X:%08X",
183839139371SViacheslav Ovsiienko 				 sh->dv_meta_mask, reg_c0);
183939139371SViacheslav Ovsiienko 	else
184039139371SViacheslav Ovsiienko 		sh->dv_regc0_mask = reg_c0;
184139139371SViacheslav Ovsiienko 	DRV_LOG(DEBUG, "metadata mode %u", priv->config.dv_xmeta_en);
184239139371SViacheslav Ovsiienko 	DRV_LOG(DEBUG, "metadata MARK mask %08X", sh->dv_mark_mask);
184339139371SViacheslav Ovsiienko 	DRV_LOG(DEBUG, "metadata META mask %08X", sh->dv_meta_mask);
184439139371SViacheslav Ovsiienko 	DRV_LOG(DEBUG, "metadata reg_c0 mask %08X", sh->dv_regc0_mask);
184539139371SViacheslav Ovsiienko }
184639139371SViacheslav Ovsiienko 
1847efa79e68SOri Kam int
1848efa79e68SOri Kam rte_pmd_mlx5_get_dyn_flag_names(char *names[], unsigned int n)
1849efa79e68SOri Kam {
1850efa79e68SOri Kam 	static const char *const dynf_names[] = {
1851efa79e68SOri Kam 		RTE_PMD_MLX5_FINE_GRANULARITY_INLINE,
18528f848f32SViacheslav Ovsiienko 		RTE_MBUF_DYNFLAG_METADATA_NAME,
18538f848f32SViacheslav Ovsiienko 		RTE_MBUF_DYNFLAG_TX_TIMESTAMP_NAME
1854efa79e68SOri Kam 	};
1855efa79e68SOri Kam 	unsigned int i;
1856efa79e68SOri Kam 
1857efa79e68SOri Kam 	if (n < RTE_DIM(dynf_names))
1858efa79e68SOri Kam 		return -ENOMEM;
1859efa79e68SOri Kam 	for (i = 0; i < RTE_DIM(dynf_names); i++) {
1860efa79e68SOri Kam 		if (names[i] == NULL)
1861efa79e68SOri Kam 			return -EINVAL;
1862efa79e68SOri Kam 		strcpy(names[i], dynf_names[i]);
1863efa79e68SOri Kam 	}
1864efa79e68SOri Kam 	return RTE_DIM(dynf_names);
1865efa79e68SOri Kam }
1866efa79e68SOri Kam 
186721cae858SDekel Peled /**
18682eb4d010SOphir Munk  * Comparison callback to sort device data.
186992d5dd48SViacheslav Ovsiienko  *
18702eb4d010SOphir Munk  * This is meant to be used with qsort().
187192d5dd48SViacheslav Ovsiienko  *
18722eb4d010SOphir Munk  * @param a[in]
18732eb4d010SOphir Munk  *   Pointer to pointer to first data object.
18742eb4d010SOphir Munk  * @param b[in]
18752eb4d010SOphir Munk  *   Pointer to pointer to second data object.
187692d5dd48SViacheslav Ovsiienko  *
187792d5dd48SViacheslav Ovsiienko  * @return
18782eb4d010SOphir Munk  *   0 if both objects are equal, less than 0 if the first argument is less
18792eb4d010SOphir Munk  *   than the second, greater than 0 otherwise.
188092d5dd48SViacheslav Ovsiienko  */
18812eb4d010SOphir Munk int
188292d5dd48SViacheslav Ovsiienko mlx5_dev_check_sibling_config(struct mlx5_priv *priv,
188392d5dd48SViacheslav Ovsiienko 			      struct mlx5_dev_config *config)
188492d5dd48SViacheslav Ovsiienko {
18856e88bc42SOphir Munk 	struct mlx5_dev_ctx_shared *sh = priv->sh;
188692d5dd48SViacheslav Ovsiienko 	struct mlx5_dev_config *sh_conf = NULL;
188792d5dd48SViacheslav Ovsiienko 	uint16_t port_id;
188892d5dd48SViacheslav Ovsiienko 
18898e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(sh);
189092d5dd48SViacheslav Ovsiienko 	/* Nothing to compare for the single/first device. */
189192d5dd48SViacheslav Ovsiienko 	if (sh->refcnt == 1)
189292d5dd48SViacheslav Ovsiienko 		return 0;
189392d5dd48SViacheslav Ovsiienko 	/* Find the device with shared context. */
1894fbc83412SViacheslav Ovsiienko 	MLX5_ETH_FOREACH_DEV(port_id, priv->pci_dev) {
189592d5dd48SViacheslav Ovsiienko 		struct mlx5_priv *opriv =
189692d5dd48SViacheslav Ovsiienko 			rte_eth_devices[port_id].data->dev_private;
189792d5dd48SViacheslav Ovsiienko 
189892d5dd48SViacheslav Ovsiienko 		if (opriv && opriv != priv && opriv->sh == sh) {
189992d5dd48SViacheslav Ovsiienko 			sh_conf = &opriv->config;
190092d5dd48SViacheslav Ovsiienko 			break;
190192d5dd48SViacheslav Ovsiienko 		}
190292d5dd48SViacheslav Ovsiienko 	}
190392d5dd48SViacheslav Ovsiienko 	if (!sh_conf)
190492d5dd48SViacheslav Ovsiienko 		return 0;
190592d5dd48SViacheslav Ovsiienko 	if (sh_conf->dv_flow_en ^ config->dv_flow_en) {
190692d5dd48SViacheslav Ovsiienko 		DRV_LOG(ERR, "\"dv_flow_en\" configuration mismatch"
190792d5dd48SViacheslav Ovsiienko 			     " for shared %s context", sh->ibdev_name);
190892d5dd48SViacheslav Ovsiienko 		rte_errno = EINVAL;
190992d5dd48SViacheslav Ovsiienko 		return rte_errno;
191092d5dd48SViacheslav Ovsiienko 	}
19112d241515SViacheslav Ovsiienko 	if (sh_conf->dv_xmeta_en ^ config->dv_xmeta_en) {
19122d241515SViacheslav Ovsiienko 		DRV_LOG(ERR, "\"dv_xmeta_en\" configuration mismatch"
19132d241515SViacheslav Ovsiienko 			     " for shared %s context", sh->ibdev_name);
19142d241515SViacheslav Ovsiienko 		rte_errno = EINVAL;
19152d241515SViacheslav Ovsiienko 		return rte_errno;
19162d241515SViacheslav Ovsiienko 	}
191792d5dd48SViacheslav Ovsiienko 	return 0;
191892d5dd48SViacheslav Ovsiienko }
1919771fa900SAdrien Mazarguil 
1920fbc83412SViacheslav Ovsiienko /**
1921fbc83412SViacheslav Ovsiienko  * Look for the ethernet device belonging to mlx5 driver.
1922fbc83412SViacheslav Ovsiienko  *
1923fbc83412SViacheslav Ovsiienko  * @param[in] port_id
1924fbc83412SViacheslav Ovsiienko  *   port_id to start looking for device.
1925fbc83412SViacheslav Ovsiienko  * @param[in] pci_dev
1926fbc83412SViacheslav Ovsiienko  *   Pointer to the hint PCI device. When device is being probed
1927fbc83412SViacheslav Ovsiienko  *   the its siblings (master and preceding representors might
19282eb4d010SOphir Munk  *   not have assigned driver yet (because the mlx5_os_pci_probe()
1929fbc83412SViacheslav Ovsiienko  *   is not completed yet, for this case match on hint PCI
1930fbc83412SViacheslav Ovsiienko  *   device may be used to detect sibling device.
1931fbc83412SViacheslav Ovsiienko  *
1932fbc83412SViacheslav Ovsiienko  * @return
1933fbc83412SViacheslav Ovsiienko  *   port_id of found device, RTE_MAX_ETHPORT if not found.
1934fbc83412SViacheslav Ovsiienko  */
1935f7e95215SViacheslav Ovsiienko uint16_t
1936fbc83412SViacheslav Ovsiienko mlx5_eth_find_next(uint16_t port_id, struct rte_pci_device *pci_dev)
1937f7e95215SViacheslav Ovsiienko {
1938f7e95215SViacheslav Ovsiienko 	while (port_id < RTE_MAX_ETHPORTS) {
1939f7e95215SViacheslav Ovsiienko 		struct rte_eth_dev *dev = &rte_eth_devices[port_id];
1940f7e95215SViacheslav Ovsiienko 
1941f7e95215SViacheslav Ovsiienko 		if (dev->state != RTE_ETH_DEV_UNUSED &&
1942f7e95215SViacheslav Ovsiienko 		    dev->device &&
1943fbc83412SViacheslav Ovsiienko 		    (dev->device == &pci_dev->device ||
1944fbc83412SViacheslav Ovsiienko 		     (dev->device->driver &&
1945f7e95215SViacheslav Ovsiienko 		     dev->device->driver->name &&
1946fbc83412SViacheslav Ovsiienko 		     !strcmp(dev->device->driver->name, MLX5_DRIVER_NAME))))
1947f7e95215SViacheslav Ovsiienko 			break;
1948f7e95215SViacheslav Ovsiienko 		port_id++;
1949f7e95215SViacheslav Ovsiienko 	}
1950f7e95215SViacheslav Ovsiienko 	if (port_id >= RTE_MAX_ETHPORTS)
1951f7e95215SViacheslav Ovsiienko 		return RTE_MAX_ETHPORTS;
1952f7e95215SViacheslav Ovsiienko 	return port_id;
1953f7e95215SViacheslav Ovsiienko }
1954f7e95215SViacheslav Ovsiienko 
19553a820742SOphir Munk /**
19563a820742SOphir Munk  * DPDK callback to remove a PCI device.
19573a820742SOphir Munk  *
19583a820742SOphir Munk  * This function removes all Ethernet devices belong to a given PCI device.
19593a820742SOphir Munk  *
19603a820742SOphir Munk  * @param[in] pci_dev
19613a820742SOphir Munk  *   Pointer to the PCI device.
19623a820742SOphir Munk  *
19633a820742SOphir Munk  * @return
19643a820742SOphir Munk  *   0 on success, the function cannot fail.
19653a820742SOphir Munk  */
19663a820742SOphir Munk static int
19673a820742SOphir Munk mlx5_pci_remove(struct rte_pci_device *pci_dev)
19683a820742SOphir Munk {
19693a820742SOphir Munk 	uint16_t port_id;
19708a5a0aadSThomas Monjalon 	int ret = 0;
19713a820742SOphir Munk 
19722786b7bfSSuanming Mou 	RTE_ETH_FOREACH_DEV_OF(port_id, &pci_dev->device) {
19732786b7bfSSuanming Mou 		/*
19742786b7bfSSuanming Mou 		 * mlx5_dev_close() is not registered to secondary process,
19752786b7bfSSuanming Mou 		 * call the close function explicitly for secondary process.
19762786b7bfSSuanming Mou 		 */
19772786b7bfSSuanming Mou 		if (rte_eal_process_type() == RTE_PROC_SECONDARY)
19788a5a0aadSThomas Monjalon 			ret |= mlx5_dev_close(&rte_eth_devices[port_id]);
19792786b7bfSSuanming Mou 		else
19808a5a0aadSThomas Monjalon 			ret |= rte_eth_dev_close(port_id);
19812786b7bfSSuanming Mou 	}
19828a5a0aadSThomas Monjalon 	return ret == 0 ? 0 : -EIO;
19833a820742SOphir Munk }
19843a820742SOphir Munk 
1985771fa900SAdrien Mazarguil static const struct rte_pci_id mlx5_pci_id_map[] = {
1986771fa900SAdrien Mazarguil 	{
19871d1bc870SNélio Laranjeiro 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
19881d1bc870SNélio Laranjeiro 			       PCI_DEVICE_ID_MELLANOX_CONNECTX4)
1989771fa900SAdrien Mazarguil 	},
1990771fa900SAdrien Mazarguil 	{
19911d1bc870SNélio Laranjeiro 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
19921d1bc870SNélio Laranjeiro 			       PCI_DEVICE_ID_MELLANOX_CONNECTX4VF)
1993771fa900SAdrien Mazarguil 	},
1994771fa900SAdrien Mazarguil 	{
19951d1bc870SNélio Laranjeiro 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
19961d1bc870SNélio Laranjeiro 			       PCI_DEVICE_ID_MELLANOX_CONNECTX4LX)
1997771fa900SAdrien Mazarguil 	},
1998771fa900SAdrien Mazarguil 	{
19991d1bc870SNélio Laranjeiro 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
20001d1bc870SNélio Laranjeiro 			       PCI_DEVICE_ID_MELLANOX_CONNECTX4LXVF)
2001771fa900SAdrien Mazarguil 	},
2002771fa900SAdrien Mazarguil 	{
2003528a9fbeSYongseok Koh 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
2004528a9fbeSYongseok Koh 			       PCI_DEVICE_ID_MELLANOX_CONNECTX5)
2005528a9fbeSYongseok Koh 	},
2006528a9fbeSYongseok Koh 	{
2007528a9fbeSYongseok Koh 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
2008528a9fbeSYongseok Koh 			       PCI_DEVICE_ID_MELLANOX_CONNECTX5VF)
2009528a9fbeSYongseok Koh 	},
2010528a9fbeSYongseok Koh 	{
2011528a9fbeSYongseok Koh 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
2012528a9fbeSYongseok Koh 			       PCI_DEVICE_ID_MELLANOX_CONNECTX5EX)
2013528a9fbeSYongseok Koh 	},
2014528a9fbeSYongseok Koh 	{
2015528a9fbeSYongseok Koh 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
2016528a9fbeSYongseok Koh 			       PCI_DEVICE_ID_MELLANOX_CONNECTX5EXVF)
2017528a9fbeSYongseok Koh 	},
2018528a9fbeSYongseok Koh 	{
2019dd3331c6SShahaf Shuler 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
2020dd3331c6SShahaf Shuler 			       PCI_DEVICE_ID_MELLANOX_CONNECTX5BF)
2021dd3331c6SShahaf Shuler 	},
2022dd3331c6SShahaf Shuler 	{
2023c322c0e5SOri Kam 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
2024c322c0e5SOri Kam 			       PCI_DEVICE_ID_MELLANOX_CONNECTX5BFVF)
2025c322c0e5SOri Kam 	},
2026c322c0e5SOri Kam 	{
2027f0354d84SWisam Jaddo 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
2028f0354d84SWisam Jaddo 				PCI_DEVICE_ID_MELLANOX_CONNECTX6)
2029f0354d84SWisam Jaddo 	},
2030f0354d84SWisam Jaddo 	{
2031f0354d84SWisam Jaddo 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
2032f0354d84SWisam Jaddo 				PCI_DEVICE_ID_MELLANOX_CONNECTX6VF)
2033f0354d84SWisam Jaddo 	},
2034f0354d84SWisam Jaddo 	{
20355fc66630SRaslan Darawsheh 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
20365fc66630SRaslan Darawsheh 				PCI_DEVICE_ID_MELLANOX_CONNECTX6DX)
20375fc66630SRaslan Darawsheh 	},
20385fc66630SRaslan Darawsheh 	{
20395fc66630SRaslan Darawsheh 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
20403ea12cadSRaslan Darawsheh 				PCI_DEVICE_ID_MELLANOX_CONNECTXVF)
20415fc66630SRaslan Darawsheh 	},
20425fc66630SRaslan Darawsheh 	{
204358b4a2b1SRaslan Darawsheh 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
204458b4a2b1SRaslan Darawsheh 				PCI_DEVICE_ID_MELLANOX_CONNECTX6DXBF)
204558b4a2b1SRaslan Darawsheh 	},
204658b4a2b1SRaslan Darawsheh 	{
204728c9a7d7SAli Alnubani 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
204828c9a7d7SAli Alnubani 				PCI_DEVICE_ID_MELLANOX_CONNECTX6LX)
204928c9a7d7SAli Alnubani 	},
205028c9a7d7SAli Alnubani 	{
20516ca37b06SRaslan Darawsheh 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
20526ca37b06SRaslan Darawsheh 				PCI_DEVICE_ID_MELLANOX_CONNECTX7)
20536ca37b06SRaslan Darawsheh 	},
20546ca37b06SRaslan Darawsheh 	{
20556ca37b06SRaslan Darawsheh 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
20566ca37b06SRaslan Darawsheh 				PCI_DEVICE_ID_MELLANOX_CONNECTX7BF)
20576ca37b06SRaslan Darawsheh 	},
20586ca37b06SRaslan Darawsheh 	{
2059771fa900SAdrien Mazarguil 		.vendor_id = 0
2060771fa900SAdrien Mazarguil 	}
2061771fa900SAdrien Mazarguil };
2062771fa900SAdrien Mazarguil 
2063392bf908SParav Pandit static struct mlx5_pci_driver mlx5_driver = {
2064392bf908SParav Pandit 	.driver_class = MLX5_CLASS_NET,
2065392bf908SParav Pandit 	.pci_driver = {
20662f3193cfSJan Viktorin 		.driver = {
2067392bf908SParav Pandit 			.name = MLX5_DRIVER_NAME,
20682f3193cfSJan Viktorin 		},
2069771fa900SAdrien Mazarguil 		.id_table = mlx5_pci_id_map,
20702eb4d010SOphir Munk 		.probe = mlx5_os_pci_probe,
20713a820742SOphir Munk 		.remove = mlx5_pci_remove,
2072989e999dSShahaf Shuler 		.dma_map = mlx5_dma_map,
2073989e999dSShahaf Shuler 		.dma_unmap = mlx5_dma_unmap,
207410f3581dSOphir Munk 		.drv_flags = PCI_DRV_FLAGS,
2075392bf908SParav Pandit 	},
2076771fa900SAdrien Mazarguil };
2077771fa900SAdrien Mazarguil 
20789c99878aSJerin Jacob /* Initialize driver log type. */
20799c99878aSJerin Jacob RTE_LOG_REGISTER(mlx5_logtype, pmd.net.mlx5, NOTICE)
20809c99878aSJerin Jacob 
2081771fa900SAdrien Mazarguil /**
2082771fa900SAdrien Mazarguil  * Driver initialization routine.
2083771fa900SAdrien Mazarguil  */
2084f8e99896SThomas Monjalon RTE_INIT(rte_mlx5_pmd_init)
2085771fa900SAdrien Mazarguil {
208682088001SParav Pandit 	mlx5_common_init();
20875f8ba81cSXueming Li 	/* Build the static tables for Verbs conversion. */
2088ea16068cSYongseok Koh 	mlx5_set_ptype_table();
20895f8ba81cSXueming Li 	mlx5_set_cksum_table();
20905f8ba81cSXueming Li 	mlx5_set_swp_types_table();
20917b4f1e6bSMatan Azrad 	if (mlx5_glue)
2092392bf908SParav Pandit 		mlx5_pci_driver_register(&mlx5_driver);
2093771fa900SAdrien Mazarguil }
2094771fa900SAdrien Mazarguil 
/*
 * PMD registration for the name net_mlx5: name export, the PCI ID table
 * (mlx5_pci_id_map) and the kernel module dependency string.
 */
RTE_PMD_EXPORT_NAME(net_mlx5, __COUNTER__);
RTE_PMD_REGISTER_PCI_TABLE(net_mlx5, mlx5_pci_id_map);
RTE_PMD_REGISTER_KMOD_DEP(net_mlx5, "* ib_uverbs & mlx5_core & mlx5_ib");
2098