xref: /dpdk/drivers/net/mlx5/mlx5.c (revision 7ad0b6d91f802b11451f25a19e498228777dc84d)
18fd92a66SOlivier Matz /* SPDX-License-Identifier: BSD-3-Clause
2771fa900SAdrien Mazarguil  * Copyright 2015 6WIND S.A.
35feecc57SShahaf Shuler  * Copyright 2015 Mellanox Technologies, Ltd
4771fa900SAdrien Mazarguil  */
5771fa900SAdrien Mazarguil 
6771fa900SAdrien Mazarguil #include <stddef.h>
7771fa900SAdrien Mazarguil #include <unistd.h>
8771fa900SAdrien Mazarguil #include <string.h>
9771fa900SAdrien Mazarguil #include <stdint.h>
10771fa900SAdrien Mazarguil #include <stdlib.h>
11e72dd09bSNélio Laranjeiro #include <errno.h>
12771fa900SAdrien Mazarguil 
13771fa900SAdrien Mazarguil #include <rte_malloc.h>
14ffc905f3SFerruh Yigit #include <rte_ethdev_driver.h>
15fdf91e0fSJan Blunck #include <rte_ethdev_pci.h>
16771fa900SAdrien Mazarguil #include <rte_pci.h>
17c752998bSGaetan Rivet #include <rte_bus_pci.h>
18771fa900SAdrien Mazarguil #include <rte_common.h>
19e72dd09bSNélio Laranjeiro #include <rte_kvargs.h>
20e89c15b6SAdrien Mazarguil #include <rte_rwlock.h>
21e89c15b6SAdrien Mazarguil #include <rte_spinlock.h>
22f38c5457SAdrien Mazarguil #include <rte_string_fns.h>
23f15db67dSMatan Azrad #include <rte_alarm.h>
24771fa900SAdrien Mazarguil 
257b4f1e6bSMatan Azrad #include <mlx5_glue.h>
267b4f1e6bSMatan Azrad #include <mlx5_devx_cmds.h>
2793e30982SMatan Azrad #include <mlx5_common.h>
28391b8bccSOphir Munk #include <mlx5_common_os.h>
29a4de9586SVu Pham #include <mlx5_common_mp.h>
30392bf908SParav Pandit #include <mlx5_common_pci.h>
3183c2047cSSuanming Mou #include <mlx5_malloc.h>
327b4f1e6bSMatan Azrad 
337b4f1e6bSMatan Azrad #include "mlx5_defs.h"
34771fa900SAdrien Mazarguil #include "mlx5.h"
35771fa900SAdrien Mazarguil #include "mlx5_utils.h"
362e22920bSAdrien Mazarguil #include "mlx5_rxtx.h"
37771fa900SAdrien Mazarguil #include "mlx5_autoconf.h"
38974f1e7eSYongseok Koh #include "mlx5_mr.h"
3984c406e7SOri Kam #include "mlx5_flow.h"
40efa79e68SOri Kam #include "rte_pmd_mlx5.h"
41771fa900SAdrien Mazarguil 
4299c12dccSNélio Laranjeiro /* Device parameter to enable RX completion queue compression. */
4399c12dccSNélio Laranjeiro #define MLX5_RXQ_CQE_COMP_EN "rxq_cqe_comp_en"
4499c12dccSNélio Laranjeiro 
45bc91e8dbSYongseok Koh /* Device parameter to enable RX completion entry padding to 128B. */
46bc91e8dbSYongseok Koh #define MLX5_RXQ_CQE_PAD_EN "rxq_cqe_pad_en"
47bc91e8dbSYongseok Koh 
4878c7a16dSYongseok Koh /* Device parameter to enable padding Rx packet to cacheline size. */
4978c7a16dSYongseok Koh #define MLX5_RXQ_PKT_PAD_EN "rxq_pkt_pad_en"
5078c7a16dSYongseok Koh 
517d6bf6b8SYongseok Koh /* Device parameter to enable Multi-Packet Rx queue. */
527d6bf6b8SYongseok Koh #define MLX5_RX_MPRQ_EN "mprq_en"
537d6bf6b8SYongseok Koh 
547d6bf6b8SYongseok Koh /* Device parameter to configure log 2 of the number of strides for MPRQ. */
557d6bf6b8SYongseok Koh #define MLX5_RX_MPRQ_LOG_STRIDE_NUM "mprq_log_stride_num"
567d6bf6b8SYongseok Koh 
57ecb16045SAlexander Kozyrev /* Device parameter to configure log 2 of the stride size for MPRQ. */
58ecb16045SAlexander Kozyrev #define MLX5_RX_MPRQ_LOG_STRIDE_SIZE "mprq_log_stride_size"
59ecb16045SAlexander Kozyrev 
607d6bf6b8SYongseok Koh /* Device parameter to limit the size of memcpy'd packet for MPRQ. */
617d6bf6b8SYongseok Koh #define MLX5_RX_MPRQ_MAX_MEMCPY_LEN "mprq_max_memcpy_len"
627d6bf6b8SYongseok Koh 
637d6bf6b8SYongseok Koh /* Device parameter to set the minimum number of Rx queues to enable MPRQ. */
647d6bf6b8SYongseok Koh #define MLX5_RXQS_MIN_MPRQ "rxqs_min_mprq"
657d6bf6b8SYongseok Koh 
66a6bd4911SViacheslav Ovsiienko /* Device parameter to configure inline send. Deprecated, ignored.*/
672a66cf37SYaacov Hazan #define MLX5_TXQ_INLINE "txq_inline"
682a66cf37SYaacov Hazan 
69505f1fe4SViacheslav Ovsiienko /* Device parameter to limit packet size to inline with ordinary SEND. */
70505f1fe4SViacheslav Ovsiienko #define MLX5_TXQ_INLINE_MAX "txq_inline_max"
71505f1fe4SViacheslav Ovsiienko 
72505f1fe4SViacheslav Ovsiienko /* Device parameter to configure minimal data size to inline. */
73505f1fe4SViacheslav Ovsiienko #define MLX5_TXQ_INLINE_MIN "txq_inline_min"
74505f1fe4SViacheslav Ovsiienko 
75505f1fe4SViacheslav Ovsiienko /* Device parameter to limit packet size to inline with Enhanced MPW. */
76505f1fe4SViacheslav Ovsiienko #define MLX5_TXQ_INLINE_MPW "txq_inline_mpw"
77505f1fe4SViacheslav Ovsiienko 
782a66cf37SYaacov Hazan /*
792a66cf37SYaacov Hazan  * Device parameter to configure the number of TX queues threshold for
802a66cf37SYaacov Hazan  * enabling inline send.
812a66cf37SYaacov Hazan  */
822a66cf37SYaacov Hazan #define MLX5_TXQS_MIN_INLINE "txqs_min_inline"
832a66cf37SYaacov Hazan 
8409d8b416SYongseok Koh /*
8509d8b416SYongseok Koh  * Device parameter to configure the number of TX queues threshold for
86a6bd4911SViacheslav Ovsiienko  * enabling vectorized Tx, deprecated, ignored (no vectorized Tx routines).
8709d8b416SYongseok Koh  */
8809d8b416SYongseok Koh #define MLX5_TXQS_MAX_VEC "txqs_max_vec"
8909d8b416SYongseok Koh 
90230189d9SNélio Laranjeiro /* Device parameter to enable multi-packet send WQEs. */
91230189d9SNélio Laranjeiro #define MLX5_TXQ_MPW_EN "txq_mpw_en"
92230189d9SNélio Laranjeiro 
93a6bd4911SViacheslav Ovsiienko /*
948409a285SViacheslav Ovsiienko  * Device parameter to force doorbell register mapping
958409a285SViacheslav Ovsiienko  * to non-cahed region eliminating the extra write memory barrier.
968409a285SViacheslav Ovsiienko  */
978409a285SViacheslav Ovsiienko #define MLX5_TX_DB_NC "tx_db_nc"
988409a285SViacheslav Ovsiienko 
998409a285SViacheslav Ovsiienko /*
100a6bd4911SViacheslav Ovsiienko  * Device parameter to include 2 dsegs in the title WQEBB.
101a6bd4911SViacheslav Ovsiienko  * Deprecated, ignored.
102a6bd4911SViacheslav Ovsiienko  */
1036ce84bd8SYongseok Koh #define MLX5_TXQ_MPW_HDR_DSEG_EN "txq_mpw_hdr_dseg_en"
1046ce84bd8SYongseok Koh 
105a6bd4911SViacheslav Ovsiienko /*
106a6bd4911SViacheslav Ovsiienko  * Device parameter to limit the size of inlining packet.
107a6bd4911SViacheslav Ovsiienko  * Deprecated, ignored.
108a6bd4911SViacheslav Ovsiienko  */
1096ce84bd8SYongseok Koh #define MLX5_TXQ_MAX_INLINE_LEN "txq_max_inline_len"
1106ce84bd8SYongseok Koh 
111a6bd4911SViacheslav Ovsiienko /*
1128f848f32SViacheslav Ovsiienko  * Device parameter to enable Tx scheduling on timestamps
1138f848f32SViacheslav Ovsiienko  * and specify the packet pacing granularity in nanoseconds.
1148f848f32SViacheslav Ovsiienko  */
1158f848f32SViacheslav Ovsiienko #define MLX5_TX_PP "tx_pp"
1168f848f32SViacheslav Ovsiienko 
1178f848f32SViacheslav Ovsiienko /*
1188f848f32SViacheslav Ovsiienko  * Device parameter to specify skew in nanoseconds on Tx datapath,
1198f848f32SViacheslav Ovsiienko  * it represents the time between SQ start WQE processing and
1208f848f32SViacheslav Ovsiienko  * appearing actual packet data on the wire.
1218f848f32SViacheslav Ovsiienko  */
1228f848f32SViacheslav Ovsiienko #define MLX5_TX_SKEW "tx_skew"
1238f848f32SViacheslav Ovsiienko 
1248f848f32SViacheslav Ovsiienko /*
125a6bd4911SViacheslav Ovsiienko  * Device parameter to enable hardware Tx vector.
126a6bd4911SViacheslav Ovsiienko  * Deprecated, ignored (no vectorized Tx routines anymore).
127a6bd4911SViacheslav Ovsiienko  */
1285644d5b9SNelio Laranjeiro #define MLX5_TX_VEC_EN "tx_vec_en"
1295644d5b9SNelio Laranjeiro 
1305644d5b9SNelio Laranjeiro /* Device parameter to enable hardware Rx vector. */
1315644d5b9SNelio Laranjeiro #define MLX5_RX_VEC_EN "rx_vec_en"
1325644d5b9SNelio Laranjeiro 
13378a54648SXueming Li /* Allow L3 VXLAN flow creation. */
13478a54648SXueming Li #define MLX5_L3_VXLAN_EN "l3_vxlan_en"
13578a54648SXueming Li 
136e2b4925eSOri Kam /* Activate DV E-Switch flow steering. */
137e2b4925eSOri Kam #define MLX5_DV_ESW_EN "dv_esw_en"
138e2b4925eSOri Kam 
13951e72d38SOri Kam /* Activate DV flow steering. */
14051e72d38SOri Kam #define MLX5_DV_FLOW_EN "dv_flow_en"
14151e72d38SOri Kam 
1422d241515SViacheslav Ovsiienko /* Enable extensive flow metadata support. */
1432d241515SViacheslav Ovsiienko #define MLX5_DV_XMETA_EN "dv_xmeta_en"
1442d241515SViacheslav Ovsiienko 
1450f0ae73aSShiri Kuzin /* Device parameter to let the user manage the lacp traffic of bonded device */
1460f0ae73aSShiri Kuzin #define MLX5_LACP_BY_USER "lacp_by_user"
1470f0ae73aSShiri Kuzin 
148db209cc3SNélio Laranjeiro /* Activate Netlink support in VF mode. */
149db209cc3SNélio Laranjeiro #define MLX5_VF_NL_EN "vf_nl_en"
150db209cc3SNélio Laranjeiro 
151dceb5029SYongseok Koh /* Enable extending memsegs when creating a MR. */
152dceb5029SYongseok Koh #define MLX5_MR_EXT_MEMSEG_EN "mr_ext_memseg_en"
153dceb5029SYongseok Koh 
1546de569f5SAdrien Mazarguil /* Select port representors to instantiate. */
1556de569f5SAdrien Mazarguil #define MLX5_REPRESENTOR "representor"
1566de569f5SAdrien Mazarguil 
157066cfecdSMatan Azrad /* Device parameter to configure the maximum number of dump files per queue. */
158066cfecdSMatan Azrad #define MLX5_MAX_DUMP_FILES_NUM "max_dump_files_num"
159066cfecdSMatan Azrad 
16021bb6c7eSDekel Peled /* Configure timeout of LRO session (in microseconds). */
16121bb6c7eSDekel Peled #define MLX5_LRO_TIMEOUT_USEC "lro_timeout_usec"
16221bb6c7eSDekel Peled 
1631ad9a3d0SBing Zhao /*
1641ad9a3d0SBing Zhao  * Device parameter to configure the total data buffer size for a single
1651ad9a3d0SBing Zhao  * hairpin queue (logarithm value).
1661ad9a3d0SBing Zhao  */
1671ad9a3d0SBing Zhao #define MLX5_HP_BUF_SIZE "hp_buf_log_sz"
1681ad9a3d0SBing Zhao 
169a1da6f62SSuanming Mou /* Flow memory reclaim mode. */
170a1da6f62SSuanming Mou #define MLX5_RECLAIM_MEM "reclaim_mem_mode"
171a1da6f62SSuanming Mou 
1725522da6bSSuanming Mou /* The default memory allocator used in PMD. */
1735522da6bSSuanming Mou #define MLX5_SYS_MEM_EN "sys_mem_en"
17450f95b23SSuanming Mou /* Decap will be used or not. */
17550f95b23SSuanming Mou #define MLX5_DECAP_EN "decap_en"
1765522da6bSSuanming Mou 
177974f1e7eSYongseok Koh /* Shared memory between primary and secondary processes. */
178974f1e7eSYongseok Koh struct mlx5_shared_data *mlx5_shared_data;
179974f1e7eSYongseok Koh 
1802e86c4e5SOphir Munk /** Driver-specific log messages type. */
1812e86c4e5SOphir Munk int mlx5_logtype;
182a170a30dSNélio Laranjeiro 
18391389890SOphir Munk static LIST_HEAD(, mlx5_dev_ctx_shared) mlx5_dev_ctx_list =
18491389890SOphir Munk 						LIST_HEAD_INITIALIZER();
18591389890SOphir Munk static pthread_mutex_t mlx5_dev_ctx_list_mutex = PTHREAD_MUTEX_INITIALIZER;
18617e19bc4SViacheslav Ovsiienko 
1875c761238SGregory Etelson static const struct mlx5_indexed_pool_config mlx5_ipool_cfg[] = {
188b88341caSSuanming Mou #ifdef HAVE_IBV_FLOW_DV_SUPPORT
1899cac7dedSGregory Etelson 	[MLX5_IPOOL_DECAP_ENCAP] = {
190014d1cbeSSuanming Mou 		.size = sizeof(struct mlx5_flow_dv_encap_decap_resource),
191014d1cbeSSuanming Mou 		.trunk_size = 64,
192014d1cbeSSuanming Mou 		.grow_trunk = 3,
193014d1cbeSSuanming Mou 		.grow_shift = 2,
1942f3dc1f4SSuanming Mou 		.need_lock = 1,
195014d1cbeSSuanming Mou 		.release_mem_en = 1,
19683c2047cSSuanming Mou 		.malloc = mlx5_malloc,
19783c2047cSSuanming Mou 		.free = mlx5_free,
198014d1cbeSSuanming Mou 		.type = "mlx5_encap_decap_ipool",
199014d1cbeSSuanming Mou 	},
2009cac7dedSGregory Etelson 	[MLX5_IPOOL_PUSH_VLAN] = {
2018acf8ac9SSuanming Mou 		.size = sizeof(struct mlx5_flow_dv_push_vlan_action_resource),
2028acf8ac9SSuanming Mou 		.trunk_size = 64,
2038acf8ac9SSuanming Mou 		.grow_trunk = 3,
2048acf8ac9SSuanming Mou 		.grow_shift = 2,
2052f3dc1f4SSuanming Mou 		.need_lock = 1,
2068acf8ac9SSuanming Mou 		.release_mem_en = 1,
20783c2047cSSuanming Mou 		.malloc = mlx5_malloc,
20883c2047cSSuanming Mou 		.free = mlx5_free,
2098acf8ac9SSuanming Mou 		.type = "mlx5_push_vlan_ipool",
2108acf8ac9SSuanming Mou 	},
2119cac7dedSGregory Etelson 	[MLX5_IPOOL_TAG] = {
2125f114269SSuanming Mou 		.size = sizeof(struct mlx5_flow_dv_tag_resource),
2135f114269SSuanming Mou 		.trunk_size = 64,
2145f114269SSuanming Mou 		.grow_trunk = 3,
2155f114269SSuanming Mou 		.grow_shift = 2,
2162f3dc1f4SSuanming Mou 		.need_lock = 1,
2175f114269SSuanming Mou 		.release_mem_en = 1,
21883c2047cSSuanming Mou 		.malloc = mlx5_malloc,
21983c2047cSSuanming Mou 		.free = mlx5_free,
2205f114269SSuanming Mou 		.type = "mlx5_tag_ipool",
2215f114269SSuanming Mou 	},
2229cac7dedSGregory Etelson 	[MLX5_IPOOL_PORT_ID] = {
223f3faf9eaSSuanming Mou 		.size = sizeof(struct mlx5_flow_dv_port_id_action_resource),
224f3faf9eaSSuanming Mou 		.trunk_size = 64,
225f3faf9eaSSuanming Mou 		.grow_trunk = 3,
226f3faf9eaSSuanming Mou 		.grow_shift = 2,
2272f3dc1f4SSuanming Mou 		.need_lock = 1,
228f3faf9eaSSuanming Mou 		.release_mem_en = 1,
22983c2047cSSuanming Mou 		.malloc = mlx5_malloc,
23083c2047cSSuanming Mou 		.free = mlx5_free,
231f3faf9eaSSuanming Mou 		.type = "mlx5_port_id_ipool",
232f3faf9eaSSuanming Mou 	},
2339cac7dedSGregory Etelson 	[MLX5_IPOOL_JUMP] = {
2347ac99475SSuanming Mou 		.size = sizeof(struct mlx5_flow_tbl_data_entry),
2357ac99475SSuanming Mou 		.trunk_size = 64,
2367ac99475SSuanming Mou 		.grow_trunk = 3,
2377ac99475SSuanming Mou 		.grow_shift = 2,
2382f3dc1f4SSuanming Mou 		.need_lock = 1,
2397ac99475SSuanming Mou 		.release_mem_en = 1,
24083c2047cSSuanming Mou 		.malloc = mlx5_malloc,
24183c2047cSSuanming Mou 		.free = mlx5_free,
2427ac99475SSuanming Mou 		.type = "mlx5_jump_ipool",
2437ac99475SSuanming Mou 	},
2449cac7dedSGregory Etelson 	[MLX5_IPOOL_SAMPLE] = {
245b4c0ddbfSJiawei Wang 		.size = sizeof(struct mlx5_flow_dv_sample_resource),
246b4c0ddbfSJiawei Wang 		.trunk_size = 64,
247b4c0ddbfSJiawei Wang 		.grow_trunk = 3,
248b4c0ddbfSJiawei Wang 		.grow_shift = 2,
2492f3dc1f4SSuanming Mou 		.need_lock = 1,
250b4c0ddbfSJiawei Wang 		.release_mem_en = 1,
251b4c0ddbfSJiawei Wang 		.malloc = mlx5_malloc,
252b4c0ddbfSJiawei Wang 		.free = mlx5_free,
253b4c0ddbfSJiawei Wang 		.type = "mlx5_sample_ipool",
254b4c0ddbfSJiawei Wang 	},
2559cac7dedSGregory Etelson 	[MLX5_IPOOL_DEST_ARRAY] = {
25600c10c22SJiawei Wang 		.size = sizeof(struct mlx5_flow_dv_dest_array_resource),
25700c10c22SJiawei Wang 		.trunk_size = 64,
25800c10c22SJiawei Wang 		.grow_trunk = 3,
25900c10c22SJiawei Wang 		.grow_shift = 2,
2602f3dc1f4SSuanming Mou 		.need_lock = 1,
26100c10c22SJiawei Wang 		.release_mem_en = 1,
26200c10c22SJiawei Wang 		.malloc = mlx5_malloc,
26300c10c22SJiawei Wang 		.free = mlx5_free,
26400c10c22SJiawei Wang 		.type = "mlx5_dest_array_ipool",
26500c10c22SJiawei Wang 	},
2669cac7dedSGregory Etelson 	[MLX5_IPOOL_TUNNEL_ID] = {
2679cac7dedSGregory Etelson 		.size = sizeof(struct mlx5_flow_tunnel),
2689cac7dedSGregory Etelson 		.need_lock = 1,
2699cac7dedSGregory Etelson 		.release_mem_en = 1,
2709cac7dedSGregory Etelson 		.type = "mlx5_tunnel_offload",
2719cac7dedSGregory Etelson 	},
2729cac7dedSGregory Etelson 	[MLX5_IPOOL_TNL_TBL_ID] = {
2739cac7dedSGregory Etelson 		.size = 0,
2749cac7dedSGregory Etelson 		.need_lock = 1,
2759cac7dedSGregory Etelson 		.type = "mlx5_flow_tnl_tbl_ipool",
2769cac7dedSGregory Etelson 	},
277b88341caSSuanming Mou #endif
2789cac7dedSGregory Etelson 	[MLX5_IPOOL_MTR] = {
2798638e2b0SSuanming Mou 		.size = sizeof(struct mlx5_flow_meter),
2808638e2b0SSuanming Mou 		.trunk_size = 64,
2818638e2b0SSuanming Mou 		.grow_trunk = 3,
2828638e2b0SSuanming Mou 		.grow_shift = 2,
2832f3dc1f4SSuanming Mou 		.need_lock = 1,
2848638e2b0SSuanming Mou 		.release_mem_en = 1,
28583c2047cSSuanming Mou 		.malloc = mlx5_malloc,
28683c2047cSSuanming Mou 		.free = mlx5_free,
2878638e2b0SSuanming Mou 		.type = "mlx5_meter_ipool",
2888638e2b0SSuanming Mou 	},
2899cac7dedSGregory Etelson 	[MLX5_IPOOL_MCP] = {
29090e6053aSSuanming Mou 		.size = sizeof(struct mlx5_flow_mreg_copy_resource),
29190e6053aSSuanming Mou 		.trunk_size = 64,
29290e6053aSSuanming Mou 		.grow_trunk = 3,
29390e6053aSSuanming Mou 		.grow_shift = 2,
2942f3dc1f4SSuanming Mou 		.need_lock = 1,
29590e6053aSSuanming Mou 		.release_mem_en = 1,
29683c2047cSSuanming Mou 		.malloc = mlx5_malloc,
29783c2047cSSuanming Mou 		.free = mlx5_free,
29890e6053aSSuanming Mou 		.type = "mlx5_mcp_ipool",
29990e6053aSSuanming Mou 	},
3009cac7dedSGregory Etelson 	[MLX5_IPOOL_HRXQ] = {
301772dc0ebSSuanming Mou 		.size = (sizeof(struct mlx5_hrxq) + MLX5_RSS_HASH_KEY_LEN),
302772dc0ebSSuanming Mou 		.trunk_size = 64,
303772dc0ebSSuanming Mou 		.grow_trunk = 3,
304772dc0ebSSuanming Mou 		.grow_shift = 2,
3052f3dc1f4SSuanming Mou 		.need_lock = 1,
306772dc0ebSSuanming Mou 		.release_mem_en = 1,
30783c2047cSSuanming Mou 		.malloc = mlx5_malloc,
30883c2047cSSuanming Mou 		.free = mlx5_free,
309772dc0ebSSuanming Mou 		.type = "mlx5_hrxq_ipool",
310772dc0ebSSuanming Mou 	},
3119cac7dedSGregory Etelson 	[MLX5_IPOOL_MLX5_FLOW] = {
3125c761238SGregory Etelson 		/*
3135c761238SGregory Etelson 		 * MLX5_IPOOL_MLX5_FLOW size varies for DV and VERBS flows.
3145c761238SGregory Etelson 		 * It set in run time according to PCI function configuration.
3155c761238SGregory Etelson 		 */
3165c761238SGregory Etelson 		.size = 0,
317b88341caSSuanming Mou 		.trunk_size = 64,
318b88341caSSuanming Mou 		.grow_trunk = 3,
319b88341caSSuanming Mou 		.grow_shift = 2,
3202f3dc1f4SSuanming Mou 		.need_lock = 1,
321b88341caSSuanming Mou 		.release_mem_en = 1,
32283c2047cSSuanming Mou 		.malloc = mlx5_malloc,
32383c2047cSSuanming Mou 		.free = mlx5_free,
324b88341caSSuanming Mou 		.type = "mlx5_flow_handle_ipool",
325b88341caSSuanming Mou 	},
3269cac7dedSGregory Etelson 	[MLX5_IPOOL_RTE_FLOW] = {
327ab612adcSSuanming Mou 		.size = sizeof(struct rte_flow),
328ab612adcSSuanming Mou 		.trunk_size = 4096,
329ab612adcSSuanming Mou 		.need_lock = 1,
330ab612adcSSuanming Mou 		.release_mem_en = 1,
33183c2047cSSuanming Mou 		.malloc = mlx5_malloc,
33283c2047cSSuanming Mou 		.free = mlx5_free,
333ab612adcSSuanming Mou 		.type = "rte_flow_ipool",
334ab612adcSSuanming Mou 	},
3359cac7dedSGregory Etelson 	[MLX5_IPOOL_RSS_EXPANTION_FLOW_ID] = {
3364ae8825cSXueming Li 		.size = 0,
3374ae8825cSXueming Li 		.need_lock = 1,
3384ae8825cSXueming Li 		.type = "mlx5_flow_rss_id_ipool",
3394ae8825cSXueming Li 	},
3409cac7dedSGregory Etelson 	[MLX5_IPOOL_RSS_SHARED_ACTIONS] = {
3414a42ac1fSMatan Azrad 		.size = sizeof(struct mlx5_shared_action_rss),
3424a42ac1fSMatan Azrad 		.trunk_size = 64,
3434a42ac1fSMatan Azrad 		.grow_trunk = 3,
3444a42ac1fSMatan Azrad 		.grow_shift = 2,
3454a42ac1fSMatan Azrad 		.need_lock = 1,
3464a42ac1fSMatan Azrad 		.release_mem_en = 1,
3474a42ac1fSMatan Azrad 		.malloc = mlx5_malloc,
3484a42ac1fSMatan Azrad 		.free = mlx5_free,
3494a42ac1fSMatan Azrad 		.type = "mlx5_shared_action_rss",
3504a42ac1fSMatan Azrad 	},
351014d1cbeSSuanming Mou };
352014d1cbeSSuanming Mou 
353014d1cbeSSuanming Mou 
354830d2091SOri Kam #define MLX5_FLOW_MIN_ID_POOL_SIZE 512
355830d2091SOri Kam #define MLX5_ID_GENERATION_ARRAY_FACTOR 16
356830d2091SOri Kam 
357860897d2SBing Zhao #define MLX5_FLOW_TABLE_HLIST_ARRAY_SIZE 4096
358860897d2SBing Zhao 
359830d2091SOri Kam /**
360f935ed4bSDekel Peled  * Initialize the ASO aging management structure.
361f935ed4bSDekel Peled  *
362f935ed4bSDekel Peled  * @param[in] sh
363f935ed4bSDekel Peled  *   Pointer to mlx5_dev_ctx_shared object to free
364f935ed4bSDekel Peled  *
365f935ed4bSDekel Peled  * @return
366f935ed4bSDekel Peled  *   0 on success, a negative errno value otherwise and rte_errno is set.
367f935ed4bSDekel Peled  */
368f935ed4bSDekel Peled int
369f935ed4bSDekel Peled mlx5_flow_aso_age_mng_init(struct mlx5_dev_ctx_shared *sh)
370f935ed4bSDekel Peled {
371f935ed4bSDekel Peled 	int err;
372f935ed4bSDekel Peled 
373f935ed4bSDekel Peled 	if (sh->aso_age_mng)
374f935ed4bSDekel Peled 		return 0;
375f935ed4bSDekel Peled 	sh->aso_age_mng = mlx5_malloc(MLX5_MEM_ZERO, sizeof(*sh->aso_age_mng),
376f935ed4bSDekel Peled 				      RTE_CACHE_LINE_SIZE, SOCKET_ID_ANY);
377f935ed4bSDekel Peled 	if (!sh->aso_age_mng) {
378f935ed4bSDekel Peled 		DRV_LOG(ERR, "aso_age_mng allocation was failed.");
379f935ed4bSDekel Peled 		rte_errno = ENOMEM;
380f935ed4bSDekel Peled 		return -ENOMEM;
381f935ed4bSDekel Peled 	}
382f935ed4bSDekel Peled 	err = mlx5_aso_queue_init(sh);
383f935ed4bSDekel Peled 	if (err) {
384f935ed4bSDekel Peled 		mlx5_free(sh->aso_age_mng);
385f935ed4bSDekel Peled 		return -1;
386f935ed4bSDekel Peled 	}
387f935ed4bSDekel Peled 	rte_spinlock_init(&sh->aso_age_mng->resize_sl);
388f935ed4bSDekel Peled 	rte_spinlock_init(&sh->aso_age_mng->free_sl);
389f935ed4bSDekel Peled 	LIST_INIT(&sh->aso_age_mng->free);
390f935ed4bSDekel Peled 	return 0;
391f935ed4bSDekel Peled }
392f935ed4bSDekel Peled 
393f935ed4bSDekel Peled /**
394f935ed4bSDekel Peled  * Close and release all the resources of the ASO aging management structure.
395f935ed4bSDekel Peled  *
396f935ed4bSDekel Peled  * @param[in] sh
397f935ed4bSDekel Peled  *   Pointer to mlx5_dev_ctx_shared object to free.
398f935ed4bSDekel Peled  */
399f935ed4bSDekel Peled static void
400f935ed4bSDekel Peled mlx5_flow_aso_age_mng_close(struct mlx5_dev_ctx_shared *sh)
401f935ed4bSDekel Peled {
402f935ed4bSDekel Peled 	int i, j;
403f935ed4bSDekel Peled 
404f935ed4bSDekel Peled 	mlx5_aso_queue_stop(sh);
405f935ed4bSDekel Peled 	mlx5_aso_queue_uninit(sh);
406f935ed4bSDekel Peled 	if (sh->aso_age_mng->pools) {
407f935ed4bSDekel Peled 		struct mlx5_aso_age_pool *pool;
408f935ed4bSDekel Peled 
409f935ed4bSDekel Peled 		for (i = 0; i < sh->aso_age_mng->next; ++i) {
410f935ed4bSDekel Peled 			pool = sh->aso_age_mng->pools[i];
411f935ed4bSDekel Peled 			claim_zero(mlx5_devx_cmd_destroy
412f935ed4bSDekel Peled 						(pool->flow_hit_aso_obj));
413f935ed4bSDekel Peled 			for (j = 0; j < MLX5_COUNTERS_PER_POOL; ++j)
414f935ed4bSDekel Peled 				if (pool->actions[j].dr_action)
415f935ed4bSDekel Peled 					claim_zero
416f935ed4bSDekel Peled 						(mlx5_glue->destroy_flow_action
417f935ed4bSDekel Peled 						  (pool->actions[j].dr_action));
418f935ed4bSDekel Peled 			mlx5_free(pool);
419f935ed4bSDekel Peled 		}
420f935ed4bSDekel Peled 		mlx5_free(sh->aso_age_mng->pools);
421f935ed4bSDekel Peled 	}
422*7ad0b6d9SDekel Peled 	mlx5_free(sh->aso_age_mng);
423f935ed4bSDekel Peled }
424f935ed4bSDekel Peled 
425f935ed4bSDekel Peled /**
426fa2d01c8SDong Zhou  * Initialize the shared aging list information per port.
427fa2d01c8SDong Zhou  *
428fa2d01c8SDong Zhou  * @param[in] sh
4296e88bc42SOphir Munk  *   Pointer to mlx5_dev_ctx_shared object.
430fa2d01c8SDong Zhou  */
431fa2d01c8SDong Zhou static void
4326e88bc42SOphir Munk mlx5_flow_aging_init(struct mlx5_dev_ctx_shared *sh)
433fa2d01c8SDong Zhou {
434fa2d01c8SDong Zhou 	uint32_t i;
435fa2d01c8SDong Zhou 	struct mlx5_age_info *age_info;
436fa2d01c8SDong Zhou 
437fa2d01c8SDong Zhou 	for (i = 0; i < sh->max_port; i++) {
438fa2d01c8SDong Zhou 		age_info = &sh->port[i].age_info;
439fa2d01c8SDong Zhou 		age_info->flags = 0;
440fa2d01c8SDong Zhou 		TAILQ_INIT(&age_info->aged_counters);
441f9bc5274SMatan Azrad 		LIST_INIT(&age_info->aged_aso);
442fa2d01c8SDong Zhou 		rte_spinlock_init(&age_info->aged_sl);
443fa2d01c8SDong Zhou 		MLX5_AGE_SET(age_info, MLX5_AGE_TRIGGER);
444fa2d01c8SDong Zhou 	}
445fa2d01c8SDong Zhou }
446fa2d01c8SDong Zhou 
447fa2d01c8SDong Zhou /**
4485382d28cSMatan Azrad  * Initialize the counters management structure.
4495382d28cSMatan Azrad  *
4505382d28cSMatan Azrad  * @param[in] sh
4516e88bc42SOphir Munk  *   Pointer to mlx5_dev_ctx_shared object to free
4525382d28cSMatan Azrad  */
4535382d28cSMatan Azrad static void
4546e88bc42SOphir Munk mlx5_flow_counters_mng_init(struct mlx5_dev_ctx_shared *sh)
4555382d28cSMatan Azrad {
456994829e6SSuanming Mou 	int i;
4575382d28cSMatan Azrad 
4585af61440SMatan Azrad 	memset(&sh->cmng, 0, sizeof(sh->cmng));
4595382d28cSMatan Azrad 	TAILQ_INIT(&sh->cmng.flow_counters);
460994829e6SSuanming Mou 	sh->cmng.min_id = MLX5_CNT_BATCH_OFFSET;
461994829e6SSuanming Mou 	sh->cmng.max_id = -1;
462994829e6SSuanming Mou 	sh->cmng.last_pool_idx = POOL_IDX_INVALID;
4633aa27915SSuanming Mou 	rte_spinlock_init(&sh->cmng.pool_update_sl);
464994829e6SSuanming Mou 	for (i = 0; i < MLX5_COUNTER_TYPE_MAX; i++) {
465994829e6SSuanming Mou 		TAILQ_INIT(&sh->cmng.counters[i]);
466994829e6SSuanming Mou 		rte_spinlock_init(&sh->cmng.csl[i]);
467fa2d01c8SDong Zhou 	}
4685382d28cSMatan Azrad }
4695382d28cSMatan Azrad 
4705382d28cSMatan Azrad /**
4715382d28cSMatan Azrad  * Destroy all the resources allocated for a counter memory management.
4725382d28cSMatan Azrad  *
4735382d28cSMatan Azrad  * @param[in] mng
4745382d28cSMatan Azrad  *   Pointer to the memory management structure.
4755382d28cSMatan Azrad  */
4765382d28cSMatan Azrad static void
4775382d28cSMatan Azrad mlx5_flow_destroy_counter_stat_mem_mng(struct mlx5_counter_stats_mem_mng *mng)
4785382d28cSMatan Azrad {
4795382d28cSMatan Azrad 	uint8_t *mem = (uint8_t *)(uintptr_t)mng->raws[0].data;
4805382d28cSMatan Azrad 
4815382d28cSMatan Azrad 	LIST_REMOVE(mng, next);
4825382d28cSMatan Azrad 	claim_zero(mlx5_devx_cmd_destroy(mng->dm));
4835382d28cSMatan Azrad 	claim_zero(mlx5_glue->devx_umem_dereg(mng->umem));
48483c2047cSSuanming Mou 	mlx5_free(mem);
4855382d28cSMatan Azrad }
4865382d28cSMatan Azrad 
4875382d28cSMatan Azrad /**
4885382d28cSMatan Azrad  * Close and release all the resources of the counters management.
4895382d28cSMatan Azrad  *
4905382d28cSMatan Azrad  * @param[in] sh
4916e88bc42SOphir Munk  *   Pointer to mlx5_dev_ctx_shared object to free.
4925382d28cSMatan Azrad  */
4935382d28cSMatan Azrad static void
4946e88bc42SOphir Munk mlx5_flow_counters_mng_close(struct mlx5_dev_ctx_shared *sh)
4955382d28cSMatan Azrad {
4965382d28cSMatan Azrad 	struct mlx5_counter_stats_mem_mng *mng;
4973aa27915SSuanming Mou 	int i, j;
498f15db67dSMatan Azrad 	int retries = 1024;
4995382d28cSMatan Azrad 
500f15db67dSMatan Azrad 	rte_errno = 0;
501f15db67dSMatan Azrad 	while (--retries) {
502f15db67dSMatan Azrad 		rte_eal_alarm_cancel(mlx5_flow_query_alarm, sh);
503f15db67dSMatan Azrad 		if (rte_errno != EINPROGRESS)
504f15db67dSMatan Azrad 			break;
505f15db67dSMatan Azrad 		rte_pause();
506f15db67dSMatan Azrad 	}
5075382d28cSMatan Azrad 
508994829e6SSuanming Mou 	if (sh->cmng.pools) {
509994829e6SSuanming Mou 		struct mlx5_flow_counter_pool *pool;
5103aa27915SSuanming Mou 		uint16_t n_valid = sh->cmng.n_valid;
5112b5b1aebSSuanming Mou 		bool fallback = sh->cmng.counter_fallback;
512994829e6SSuanming Mou 
5133aa27915SSuanming Mou 		for (i = 0; i < n_valid; ++i) {
5143aa27915SSuanming Mou 			pool = sh->cmng.pools[i];
5152b5b1aebSSuanming Mou 			if (!fallback && pool->min_dcs)
5165af61440SMatan Azrad 				claim_zero(mlx5_devx_cmd_destroy
517fa2d01c8SDong Zhou 							       (pool->min_dcs));
5185382d28cSMatan Azrad 			for (j = 0; j < MLX5_COUNTERS_PER_POOL; ++j) {
5192b5b1aebSSuanming Mou 				struct mlx5_flow_counter *cnt =
5202b5b1aebSSuanming Mou 						MLX5_POOL_GET_CNT(pool, j);
5212b5b1aebSSuanming Mou 
5222b5b1aebSSuanming Mou 				if (cnt->action)
5235382d28cSMatan Azrad 					claim_zero
5245382d28cSMatan Azrad 					 (mlx5_glue->destroy_flow_action
5252b5b1aebSSuanming Mou 					  (cnt->action));
5262b5b1aebSSuanming Mou 				if (fallback && MLX5_POOL_GET_CNT
5272b5b1aebSSuanming Mou 				    (pool, j)->dcs_when_free)
5285382d28cSMatan Azrad 					claim_zero(mlx5_devx_cmd_destroy
5292b5b1aebSSuanming Mou 						   (cnt->dcs_when_free));
5305382d28cSMatan Azrad 			}
53183c2047cSSuanming Mou 			mlx5_free(pool);
5325382d28cSMatan Azrad 		}
533994829e6SSuanming Mou 		mlx5_free(sh->cmng.pools);
5345382d28cSMatan Azrad 	}
5355382d28cSMatan Azrad 	mng = LIST_FIRST(&sh->cmng.mem_mngs);
5365382d28cSMatan Azrad 	while (mng) {
5375382d28cSMatan Azrad 		mlx5_flow_destroy_counter_stat_mem_mng(mng);
5385382d28cSMatan Azrad 		mng = LIST_FIRST(&sh->cmng.mem_mngs);
5395382d28cSMatan Azrad 	}
5405382d28cSMatan Azrad 	memset(&sh->cmng, 0, sizeof(sh->cmng));
5415382d28cSMatan Azrad }
5425382d28cSMatan Azrad 
543f935ed4bSDekel Peled /* Send FLOW_AGED event if needed. */
544f935ed4bSDekel Peled void
545f935ed4bSDekel Peled mlx5_age_event_prepare(struct mlx5_dev_ctx_shared *sh)
546f935ed4bSDekel Peled {
547f935ed4bSDekel Peled 	struct mlx5_age_info *age_info;
548f935ed4bSDekel Peled 	uint32_t i;
549f935ed4bSDekel Peled 
550f935ed4bSDekel Peled 	for (i = 0; i < sh->max_port; i++) {
551f935ed4bSDekel Peled 		age_info = &sh->port[i].age_info;
552f935ed4bSDekel Peled 		if (!MLX5_AGE_GET(age_info, MLX5_AGE_EVENT_NEW))
553f935ed4bSDekel Peled 			continue;
554f935ed4bSDekel Peled 		if (MLX5_AGE_GET(age_info, MLX5_AGE_TRIGGER))
555f935ed4bSDekel Peled 			rte_eth_dev_callback_process
556f935ed4bSDekel Peled 				(&rte_eth_devices[sh->port[i].devx_ih_port_id],
557f935ed4bSDekel Peled 				RTE_ETH_EVENT_FLOW_AGED, NULL);
558f935ed4bSDekel Peled 		age_info->flags = 0;
559f935ed4bSDekel Peled 	}
560f935ed4bSDekel Peled }
561f935ed4bSDekel Peled 
5625382d28cSMatan Azrad /**
563014d1cbeSSuanming Mou  * Initialize the flow resources' indexed mempool.
564014d1cbeSSuanming Mou  *
565014d1cbeSSuanming Mou  * @param[in] sh
5666e88bc42SOphir Munk  *   Pointer to mlx5_dev_ctx_shared object.
567b88341caSSuanming Mou  * @param[in] sh
568b88341caSSuanming Mou  *   Pointer to user dev config.
569014d1cbeSSuanming Mou  */
570014d1cbeSSuanming Mou static void
5716e88bc42SOphir Munk mlx5_flow_ipool_create(struct mlx5_dev_ctx_shared *sh,
5725c761238SGregory Etelson 		       const struct mlx5_dev_config *config)
573014d1cbeSSuanming Mou {
574014d1cbeSSuanming Mou 	uint8_t i;
5755c761238SGregory Etelson 	struct mlx5_indexed_pool_config cfg;
576014d1cbeSSuanming Mou 
577a1da6f62SSuanming Mou 	for (i = 0; i < MLX5_IPOOL_MAX; ++i) {
5785c761238SGregory Etelson 		cfg = mlx5_ipool_cfg[i];
5795c761238SGregory Etelson 		switch (i) {
5805c761238SGregory Etelson 		default:
5815c761238SGregory Etelson 			break;
5825c761238SGregory Etelson 		/*
5835c761238SGregory Etelson 		 * Set MLX5_IPOOL_MLX5_FLOW ipool size
5845c761238SGregory Etelson 		 * according to PCI function flow configuration.
5855c761238SGregory Etelson 		 */
5865c761238SGregory Etelson 		case MLX5_IPOOL_MLX5_FLOW:
5875c761238SGregory Etelson 			cfg.size = config->dv_flow_en ?
5885c761238SGregory Etelson 				sizeof(struct mlx5_flow_handle) :
5895c761238SGregory Etelson 				MLX5_FLOW_HANDLE_VERBS_SIZE;
5905c761238SGregory Etelson 			break;
5915c761238SGregory Etelson 		}
592a1da6f62SSuanming Mou 		if (config->reclaim_mode)
5935c761238SGregory Etelson 			cfg.release_mem_en = 1;
5945c761238SGregory Etelson 		sh->ipool[i] = mlx5_ipool_create(&cfg);
595014d1cbeSSuanming Mou 	}
596a1da6f62SSuanming Mou }
597014d1cbeSSuanming Mou 
598014d1cbeSSuanming Mou /**
599014d1cbeSSuanming Mou  * Release the flow resources' indexed mempool.
600014d1cbeSSuanming Mou  *
601014d1cbeSSuanming Mou  * @param[in] sh
6026e88bc42SOphir Munk  *   Pointer to mlx5_dev_ctx_shared object.
603014d1cbeSSuanming Mou  */
604014d1cbeSSuanming Mou static void
6056e88bc42SOphir Munk mlx5_flow_ipool_destroy(struct mlx5_dev_ctx_shared *sh)
606014d1cbeSSuanming Mou {
607014d1cbeSSuanming Mou 	uint8_t i;
608014d1cbeSSuanming Mou 
609014d1cbeSSuanming Mou 	for (i = 0; i < MLX5_IPOOL_MAX; ++i)
610014d1cbeSSuanming Mou 		mlx5_ipool_destroy(sh->ipool[i]);
611014d1cbeSSuanming Mou }
612014d1cbeSSuanming Mou 
613daa38a89SBing Zhao /*
614daa38a89SBing Zhao  * Check if dynamic flex parser for eCPRI already exists.
615daa38a89SBing Zhao  *
616daa38a89SBing Zhao  * @param dev
617daa38a89SBing Zhao  *   Pointer to Ethernet device structure.
618daa38a89SBing Zhao  *
619daa38a89SBing Zhao  * @return
620daa38a89SBing Zhao  *   true on exists, false on not.
621daa38a89SBing Zhao  */
622daa38a89SBing Zhao bool
623daa38a89SBing Zhao mlx5_flex_parser_ecpri_exist(struct rte_eth_dev *dev)
624daa38a89SBing Zhao {
625daa38a89SBing Zhao 	struct mlx5_priv *priv = dev->data->dev_private;
626daa38a89SBing Zhao 	struct mlx5_flex_parser_profiles *prf =
627daa38a89SBing Zhao 				&priv->sh->fp[MLX5_FLEX_PARSER_ECPRI_0];
628daa38a89SBing Zhao 
629daa38a89SBing Zhao 	return !!prf->obj;
630daa38a89SBing Zhao }
631daa38a89SBing Zhao 
632daa38a89SBing Zhao /*
633daa38a89SBing Zhao  * Allocation of a flex parser for eCPRI. Once created, this parser related
634daa38a89SBing Zhao  * resources will be held until the device is closed.
635daa38a89SBing Zhao  *
636daa38a89SBing Zhao  * @param dev
637daa38a89SBing Zhao  *   Pointer to Ethernet device structure.
638daa38a89SBing Zhao  *
639daa38a89SBing Zhao  * @return
640daa38a89SBing Zhao  *   0 on success, a negative errno value otherwise and rte_errno is set.
641daa38a89SBing Zhao  */
642daa38a89SBing Zhao int
643daa38a89SBing Zhao mlx5_flex_parser_ecpri_alloc(struct rte_eth_dev *dev)
644daa38a89SBing Zhao {
645daa38a89SBing Zhao 	struct mlx5_priv *priv = dev->data->dev_private;
646daa38a89SBing Zhao 	struct mlx5_flex_parser_profiles *prf =
647daa38a89SBing Zhao 				&priv->sh->fp[MLX5_FLEX_PARSER_ECPRI_0];
6481c506404SBing Zhao 	struct mlx5_devx_graph_node_attr node = {
6491c506404SBing Zhao 		.modify_field_select = 0,
6501c506404SBing Zhao 	};
6511c506404SBing Zhao 	uint32_t ids[8];
6521c506404SBing Zhao 	int ret;
653daa38a89SBing Zhao 
654d7c49561SBing Zhao 	if (!priv->config.hca_attr.parse_graph_flex_node) {
655d7c49561SBing Zhao 		DRV_LOG(ERR, "Dynamic flex parser is not supported "
656d7c49561SBing Zhao 			"for device %s.", priv->dev_data->name);
657d7c49561SBing Zhao 		return -ENOTSUP;
658d7c49561SBing Zhao 	}
6591c506404SBing Zhao 	node.header_length_mode = MLX5_GRAPH_NODE_LEN_FIXED;
6601c506404SBing Zhao 	/* 8 bytes now: 4B common header + 4B message body header. */
6611c506404SBing Zhao 	node.header_length_base_value = 0x8;
6621c506404SBing Zhao 	/* After MAC layer: Ether / VLAN. */
6631c506404SBing Zhao 	node.in[0].arc_parse_graph_node = MLX5_GRAPH_ARC_NODE_MAC;
6641c506404SBing Zhao 	/* Type of compared condition should be 0xAEFE in the L2 layer. */
6651c506404SBing Zhao 	node.in[0].compare_condition_value = RTE_ETHER_TYPE_ECPRI;
6661c506404SBing Zhao 	/* Sample #0: type in common header. */
6671c506404SBing Zhao 	node.sample[0].flow_match_sample_en = 1;
6681c506404SBing Zhao 	/* Fixed offset. */
6691c506404SBing Zhao 	node.sample[0].flow_match_sample_offset_mode = 0x0;
6701c506404SBing Zhao 	/* Only the 2nd byte will be used. */
6711c506404SBing Zhao 	node.sample[0].flow_match_sample_field_base_offset = 0x0;
6721c506404SBing Zhao 	/* Sample #1: message payload. */
6731c506404SBing Zhao 	node.sample[1].flow_match_sample_en = 1;
6741c506404SBing Zhao 	/* Fixed offset. */
6751c506404SBing Zhao 	node.sample[1].flow_match_sample_offset_mode = 0x0;
6761c506404SBing Zhao 	/*
6771c506404SBing Zhao 	 * Only the first two bytes will be used right now, and its offset will
6781c506404SBing Zhao 	 * start after the common header that with the length of a DW(u32).
6791c506404SBing Zhao 	 */
6801c506404SBing Zhao 	node.sample[1].flow_match_sample_field_base_offset = sizeof(uint32_t);
6811c506404SBing Zhao 	prf->obj = mlx5_devx_cmd_create_flex_parser(priv->sh->ctx, &node);
6821c506404SBing Zhao 	if (!prf->obj) {
6831c506404SBing Zhao 		DRV_LOG(ERR, "Failed to create flex parser node object.");
6841c506404SBing Zhao 		return (rte_errno == 0) ? -ENODEV : -rte_errno;
6851c506404SBing Zhao 	}
6861c506404SBing Zhao 	prf->num = 2;
6871c506404SBing Zhao 	ret = mlx5_devx_cmd_query_parse_samples(prf->obj, ids, prf->num);
6881c506404SBing Zhao 	if (ret) {
6891c506404SBing Zhao 		DRV_LOG(ERR, "Failed to query sample IDs.");
6901c506404SBing Zhao 		return (rte_errno == 0) ? -ENODEV : -rte_errno;
6911c506404SBing Zhao 	}
6921c506404SBing Zhao 	prf->offset[0] = 0x0;
6931c506404SBing Zhao 	prf->offset[1] = sizeof(uint32_t);
6941c506404SBing Zhao 	prf->ids[0] = ids[0];
6951c506404SBing Zhao 	prf->ids[1] = ids[1];
696daa38a89SBing Zhao 	return 0;
697daa38a89SBing Zhao }
698daa38a89SBing Zhao 
6991c506404SBing Zhao /*
7001c506404SBing Zhao  * Destroy the flex parser node, including the parser itself, input / output
7011c506404SBing Zhao  * arcs and DW samples. Resources could be reused then.
7021c506404SBing Zhao  *
7031c506404SBing Zhao  * @param dev
7041c506404SBing Zhao  *   Pointer to Ethernet device structure.
7051c506404SBing Zhao  */
7061c506404SBing Zhao static void
7071c506404SBing Zhao mlx5_flex_parser_ecpri_release(struct rte_eth_dev *dev)
7081c506404SBing Zhao {
7091c506404SBing Zhao 	struct mlx5_priv *priv = dev->data->dev_private;
7101c506404SBing Zhao 	struct mlx5_flex_parser_profiles *prf =
7111c506404SBing Zhao 				&priv->sh->fp[MLX5_FLEX_PARSER_ECPRI_0];
7121c506404SBing Zhao 
7131c506404SBing Zhao 	if (prf->obj)
7141c506404SBing Zhao 		mlx5_devx_cmd_destroy(prf->obj);
7151c506404SBing Zhao 	prf->obj = NULL;
7161c506404SBing Zhao }
7171c506404SBing Zhao 
718a0bfe9d5SViacheslav Ovsiienko /*
719a0bfe9d5SViacheslav Ovsiienko  * Allocate Rx and Tx UARs in robust fashion.
720a0bfe9d5SViacheslav Ovsiienko  * This routine handles the following UAR allocation issues:
721a0bfe9d5SViacheslav Ovsiienko  *
722a0bfe9d5SViacheslav Ovsiienko  *  - tries to allocate the UAR with the most appropriate memory
723a0bfe9d5SViacheslav Ovsiienko  *    mapping type from the ones supported by the host
724a0bfe9d5SViacheslav Ovsiienko  *
725a0bfe9d5SViacheslav Ovsiienko  *  - tries to allocate the UAR with non-NULL base address
726a0bfe9d5SViacheslav Ovsiienko  *    OFED 5.0.x and Upstream rdma_core before v29 returned the NULL as
727a0bfe9d5SViacheslav Ovsiienko  *    UAR base address if UAR was not the first object in the UAR page.
728a0bfe9d5SViacheslav Ovsiienko  *    It caused the PMD failure and we should try to get another UAR
729a0bfe9d5SViacheslav Ovsiienko  *    till we get the first one with non-NULL base address returned.
730a0bfe9d5SViacheslav Ovsiienko  */
731a0bfe9d5SViacheslav Ovsiienko static int
732a0bfe9d5SViacheslav Ovsiienko mlx5_alloc_rxtx_uars(struct mlx5_dev_ctx_shared *sh,
733a0bfe9d5SViacheslav Ovsiienko 		     const struct mlx5_dev_config *config)
734a0bfe9d5SViacheslav Ovsiienko {
735a0bfe9d5SViacheslav Ovsiienko 	uint32_t uar_mapping, retry;
736a0bfe9d5SViacheslav Ovsiienko 	int err = 0;
7371f66ac5bSOphir Munk 	void *base_addr;
738a0bfe9d5SViacheslav Ovsiienko 
739a0bfe9d5SViacheslav Ovsiienko 	for (retry = 0; retry < MLX5_ALLOC_UAR_RETRY; ++retry) {
740a0bfe9d5SViacheslav Ovsiienko #ifdef MLX5DV_UAR_ALLOC_TYPE_NC
741a0bfe9d5SViacheslav Ovsiienko 		/* Control the mapping type according to the settings. */
742a0bfe9d5SViacheslav Ovsiienko 		uar_mapping = (config->dbnc == MLX5_TXDB_NCACHED) ?
743a0bfe9d5SViacheslav Ovsiienko 			      MLX5DV_UAR_ALLOC_TYPE_NC :
744a0bfe9d5SViacheslav Ovsiienko 			      MLX5DV_UAR_ALLOC_TYPE_BF;
745a0bfe9d5SViacheslav Ovsiienko #else
746a0bfe9d5SViacheslav Ovsiienko 		RTE_SET_USED(config);
747a0bfe9d5SViacheslav Ovsiienko 		/*
748a0bfe9d5SViacheslav Ovsiienko 		 * It seems we have no way to control the memory mapping type
749a0bfe9d5SViacheslav Ovsiienko 		 * for the UAR, the default "Write-Combining" type is supposed.
750a0bfe9d5SViacheslav Ovsiienko 		 * The UAR initialization on queue creation queries the
751a0bfe9d5SViacheslav Ovsiienko 		 * actual mapping type done by Verbs/kernel and setups the
752a0bfe9d5SViacheslav Ovsiienko 		 * PMD datapath accordingly.
753a0bfe9d5SViacheslav Ovsiienko 		 */
754a0bfe9d5SViacheslav Ovsiienko 		uar_mapping = 0;
755a0bfe9d5SViacheslav Ovsiienko #endif
756a0bfe9d5SViacheslav Ovsiienko 		sh->tx_uar = mlx5_glue->devx_alloc_uar(sh->ctx, uar_mapping);
757a0bfe9d5SViacheslav Ovsiienko #ifdef MLX5DV_UAR_ALLOC_TYPE_NC
758a0bfe9d5SViacheslav Ovsiienko 		if (!sh->tx_uar &&
759a0bfe9d5SViacheslav Ovsiienko 		    uar_mapping == MLX5DV_UAR_ALLOC_TYPE_BF) {
760a0bfe9d5SViacheslav Ovsiienko 			if (config->dbnc == MLX5_TXDB_CACHED ||
761a0bfe9d5SViacheslav Ovsiienko 			    config->dbnc == MLX5_TXDB_HEURISTIC)
762a0bfe9d5SViacheslav Ovsiienko 				DRV_LOG(WARNING, "Devarg tx_db_nc setting "
763a0bfe9d5SViacheslav Ovsiienko 						 "is not supported by DevX");
764a0bfe9d5SViacheslav Ovsiienko 			/*
765a0bfe9d5SViacheslav Ovsiienko 			 * In some environments like virtual machine
766a0bfe9d5SViacheslav Ovsiienko 			 * the Write Combining mapped might be not supported
767a0bfe9d5SViacheslav Ovsiienko 			 * and UAR allocation fails. We try "Non-Cached"
768a0bfe9d5SViacheslav Ovsiienko 			 * mapping for the case. The tx_burst routines take
769a0bfe9d5SViacheslav Ovsiienko 			 * the UAR mapping type into account on UAR setup
770a0bfe9d5SViacheslav Ovsiienko 			 * on queue creation.
771a0bfe9d5SViacheslav Ovsiienko 			 */
772a0bfe9d5SViacheslav Ovsiienko 			DRV_LOG(WARNING, "Failed to allocate Tx DevX UAR (BF)");
773a0bfe9d5SViacheslav Ovsiienko 			uar_mapping = MLX5DV_UAR_ALLOC_TYPE_NC;
774a0bfe9d5SViacheslav Ovsiienko 			sh->tx_uar = mlx5_glue->devx_alloc_uar
775a0bfe9d5SViacheslav Ovsiienko 							(sh->ctx, uar_mapping);
776a0bfe9d5SViacheslav Ovsiienko 		} else if (!sh->tx_uar &&
777a0bfe9d5SViacheslav Ovsiienko 			   uar_mapping == MLX5DV_UAR_ALLOC_TYPE_NC) {
778a0bfe9d5SViacheslav Ovsiienko 			if (config->dbnc == MLX5_TXDB_NCACHED)
779a0bfe9d5SViacheslav Ovsiienko 				DRV_LOG(WARNING, "Devarg tx_db_nc settings "
780a0bfe9d5SViacheslav Ovsiienko 						 "is not supported by DevX");
781a0bfe9d5SViacheslav Ovsiienko 			/*
782a0bfe9d5SViacheslav Ovsiienko 			 * If Verbs/kernel does not support "Non-Cached"
783a0bfe9d5SViacheslav Ovsiienko 			 * try the "Write-Combining".
784a0bfe9d5SViacheslav Ovsiienko 			 */
785a0bfe9d5SViacheslav Ovsiienko 			DRV_LOG(WARNING, "Failed to allocate Tx DevX UAR (NC)");
786a0bfe9d5SViacheslav Ovsiienko 			uar_mapping = MLX5DV_UAR_ALLOC_TYPE_BF;
787a0bfe9d5SViacheslav Ovsiienko 			sh->tx_uar = mlx5_glue->devx_alloc_uar
788a0bfe9d5SViacheslav Ovsiienko 							(sh->ctx, uar_mapping);
789a0bfe9d5SViacheslav Ovsiienko 		}
790a0bfe9d5SViacheslav Ovsiienko #endif
791a0bfe9d5SViacheslav Ovsiienko 		if (!sh->tx_uar) {
792a0bfe9d5SViacheslav Ovsiienko 			DRV_LOG(ERR, "Failed to allocate Tx DevX UAR (BF/NC)");
793a0bfe9d5SViacheslav Ovsiienko 			err = ENOMEM;
794a0bfe9d5SViacheslav Ovsiienko 			goto exit;
795a0bfe9d5SViacheslav Ovsiienko 		}
7961f66ac5bSOphir Munk 		base_addr = mlx5_os_get_devx_uar_base_addr(sh->tx_uar);
7971f66ac5bSOphir Munk 		if (base_addr)
798a0bfe9d5SViacheslav Ovsiienko 			break;
799a0bfe9d5SViacheslav Ovsiienko 		/*
800a0bfe9d5SViacheslav Ovsiienko 		 * The UARs are allocated by rdma_core within the
801a0bfe9d5SViacheslav Ovsiienko 		 * IB device context, on context closure all UARs
802a0bfe9d5SViacheslav Ovsiienko 		 * will be freed, should be no memory/object leakage.
803a0bfe9d5SViacheslav Ovsiienko 		 */
804a0bfe9d5SViacheslav Ovsiienko 		DRV_LOG(WARNING, "Retrying to allocate Tx DevX UAR");
805a0bfe9d5SViacheslav Ovsiienko 		sh->tx_uar = NULL;
806a0bfe9d5SViacheslav Ovsiienko 	}
807a0bfe9d5SViacheslav Ovsiienko 	/* Check whether we finally succeeded with valid UAR allocation. */
808a0bfe9d5SViacheslav Ovsiienko 	if (!sh->tx_uar) {
809a0bfe9d5SViacheslav Ovsiienko 		DRV_LOG(ERR, "Failed to allocate Tx DevX UAR (NULL base)");
810a0bfe9d5SViacheslav Ovsiienko 		err = ENOMEM;
811a0bfe9d5SViacheslav Ovsiienko 		goto exit;
812a0bfe9d5SViacheslav Ovsiienko 	}
813a0bfe9d5SViacheslav Ovsiienko 	for (retry = 0; retry < MLX5_ALLOC_UAR_RETRY; ++retry) {
814a0bfe9d5SViacheslav Ovsiienko 		uar_mapping = 0;
815a0bfe9d5SViacheslav Ovsiienko 		sh->devx_rx_uar = mlx5_glue->devx_alloc_uar
816a0bfe9d5SViacheslav Ovsiienko 							(sh->ctx, uar_mapping);
817a0bfe9d5SViacheslav Ovsiienko #ifdef MLX5DV_UAR_ALLOC_TYPE_NC
818a0bfe9d5SViacheslav Ovsiienko 		if (!sh->devx_rx_uar &&
819a0bfe9d5SViacheslav Ovsiienko 		    uar_mapping == MLX5DV_UAR_ALLOC_TYPE_BF) {
820a0bfe9d5SViacheslav Ovsiienko 			/*
821a0bfe9d5SViacheslav Ovsiienko 			 * Rx UAR is used to control interrupts only,
822a0bfe9d5SViacheslav Ovsiienko 			 * should be no datapath noticeable impact,
823a0bfe9d5SViacheslav Ovsiienko 			 * can try "Non-Cached" mapping safely.
824a0bfe9d5SViacheslav Ovsiienko 			 */
825a0bfe9d5SViacheslav Ovsiienko 			DRV_LOG(WARNING, "Failed to allocate Rx DevX UAR (BF)");
826a0bfe9d5SViacheslav Ovsiienko 			uar_mapping = MLX5DV_UAR_ALLOC_TYPE_NC;
827a0bfe9d5SViacheslav Ovsiienko 			sh->devx_rx_uar = mlx5_glue->devx_alloc_uar
828a0bfe9d5SViacheslav Ovsiienko 							(sh->ctx, uar_mapping);
829a0bfe9d5SViacheslav Ovsiienko 		}
830a0bfe9d5SViacheslav Ovsiienko #endif
831a0bfe9d5SViacheslav Ovsiienko 		if (!sh->devx_rx_uar) {
832a0bfe9d5SViacheslav Ovsiienko 			DRV_LOG(ERR, "Failed to allocate Rx DevX UAR (BF/NC)");
833a0bfe9d5SViacheslav Ovsiienko 			err = ENOMEM;
834a0bfe9d5SViacheslav Ovsiienko 			goto exit;
835a0bfe9d5SViacheslav Ovsiienko 		}
8361f66ac5bSOphir Munk 		base_addr = mlx5_os_get_devx_uar_base_addr(sh->devx_rx_uar);
8371f66ac5bSOphir Munk 		if (base_addr)
838a0bfe9d5SViacheslav Ovsiienko 			break;
839a0bfe9d5SViacheslav Ovsiienko 		/*
840a0bfe9d5SViacheslav Ovsiienko 		 * The UARs are allocated by rdma_core within the
841a0bfe9d5SViacheslav Ovsiienko 		 * IB device context, on context closure all UARs
842a0bfe9d5SViacheslav Ovsiienko 		 * will be freed, should be no memory/object leakage.
843a0bfe9d5SViacheslav Ovsiienko 		 */
844a0bfe9d5SViacheslav Ovsiienko 		DRV_LOG(WARNING, "Retrying to allocate Rx DevX UAR");
845a0bfe9d5SViacheslav Ovsiienko 		sh->devx_rx_uar = NULL;
846a0bfe9d5SViacheslav Ovsiienko 	}
847a0bfe9d5SViacheslav Ovsiienko 	/* Check whether we finally succeeded with valid UAR allocation. */
848a0bfe9d5SViacheslav Ovsiienko 	if (!sh->devx_rx_uar) {
849a0bfe9d5SViacheslav Ovsiienko 		DRV_LOG(ERR, "Failed to allocate Rx DevX UAR (NULL base)");
850a0bfe9d5SViacheslav Ovsiienko 		err = ENOMEM;
851a0bfe9d5SViacheslav Ovsiienko 	}
852a0bfe9d5SViacheslav Ovsiienko exit:
853a0bfe9d5SViacheslav Ovsiienko 	return err;
854a0bfe9d5SViacheslav Ovsiienko }
855a0bfe9d5SViacheslav Ovsiienko 
856014d1cbeSSuanming Mou /**
85791389890SOphir Munk  * Allocate shared device context. If there is multiport device the
85817e19bc4SViacheslav Ovsiienko  * master and representors will share this context, if there is single
85991389890SOphir Munk  * port dedicated device, the context will be used by only given
86017e19bc4SViacheslav Ovsiienko  * port due to unification.
86117e19bc4SViacheslav Ovsiienko  *
86291389890SOphir Munk  * Routine first searches the context for the specified device name,
86317e19bc4SViacheslav Ovsiienko  * if found the shared context assumed and reference counter is incremented.
86417e19bc4SViacheslav Ovsiienko  * If no context found the new one is created and initialized with specified
86591389890SOphir Munk  * device context and parameters.
86617e19bc4SViacheslav Ovsiienko  *
86717e19bc4SViacheslav Ovsiienko  * @param[in] spawn
86891389890SOphir Munk  *   Pointer to the device attributes (name, port, etc).
8698409a285SViacheslav Ovsiienko  * @param[in] config
8708409a285SViacheslav Ovsiienko  *   Pointer to device configuration structure.
87117e19bc4SViacheslav Ovsiienko  *
87217e19bc4SViacheslav Ovsiienko  * @return
8736e88bc42SOphir Munk  *   Pointer to mlx5_dev_ctx_shared object on success,
87417e19bc4SViacheslav Ovsiienko  *   otherwise NULL and rte_errno is set.
87517e19bc4SViacheslav Ovsiienko  */
8762eb4d010SOphir Munk struct mlx5_dev_ctx_shared *
87791389890SOphir Munk mlx5_alloc_shared_dev_ctx(const struct mlx5_dev_spawn_data *spawn,
8788409a285SViacheslav Ovsiienko 			   const struct mlx5_dev_config *config)
87917e19bc4SViacheslav Ovsiienko {
8806e88bc42SOphir Munk 	struct mlx5_dev_ctx_shared *sh;
88117e19bc4SViacheslav Ovsiienko 	int err = 0;
88253e5a82fSViacheslav Ovsiienko 	uint32_t i;
883ae18a1aeSOri Kam 	struct mlx5_devx_tis_attr tis_attr = { 0 };
88417e19bc4SViacheslav Ovsiienko 
8858e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(spawn);
88617e19bc4SViacheslav Ovsiienko 	/* Secondary process should not create the shared context. */
8878e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(rte_eal_process_type() == RTE_PROC_PRIMARY);
88891389890SOphir Munk 	pthread_mutex_lock(&mlx5_dev_ctx_list_mutex);
88917e19bc4SViacheslav Ovsiienko 	/* Search for IB context by device name. */
89091389890SOphir Munk 	LIST_FOREACH(sh, &mlx5_dev_ctx_list, next) {
891834a9019SOphir Munk 		if (!strcmp(sh->ibdev_name,
892834a9019SOphir Munk 			mlx5_os_get_dev_device_name(spawn->phys_dev))) {
89317e19bc4SViacheslav Ovsiienko 			sh->refcnt++;
89417e19bc4SViacheslav Ovsiienko 			goto exit;
89517e19bc4SViacheslav Ovsiienko 		}
89617e19bc4SViacheslav Ovsiienko 	}
897ae4eb7dcSViacheslav Ovsiienko 	/* No device found, we have to create new shared context. */
8988e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(spawn->max_port);
8992175c4dcSSuanming Mou 	sh = mlx5_malloc(MLX5_MEM_ZERO | MLX5_MEM_RTE,
9006e88bc42SOphir Munk 			 sizeof(struct mlx5_dev_ctx_shared) +
90117e19bc4SViacheslav Ovsiienko 			 spawn->max_port *
90291389890SOphir Munk 			 sizeof(struct mlx5_dev_shared_port),
9032175c4dcSSuanming Mou 			 RTE_CACHE_LINE_SIZE, SOCKET_ID_ANY);
90417e19bc4SViacheslav Ovsiienko 	if (!sh) {
90517e19bc4SViacheslav Ovsiienko 		DRV_LOG(ERR, "shared context allocation failure");
90617e19bc4SViacheslav Ovsiienko 		rte_errno  = ENOMEM;
90717e19bc4SViacheslav Ovsiienko 		goto exit;
90817e19bc4SViacheslav Ovsiienko 	}
9092eb4d010SOphir Munk 	err = mlx5_os_open_device(spawn, config, sh);
91006f78b5eSViacheslav Ovsiienko 	if (!sh->ctx)
91117e19bc4SViacheslav Ovsiienko 		goto error;
912e85f623eSOphir Munk 	err = mlx5_os_get_dev_attr(sh->ctx, &sh->device_attr);
91317e19bc4SViacheslav Ovsiienko 	if (err) {
914e85f623eSOphir Munk 		DRV_LOG(DEBUG, "mlx5_os_get_dev_attr() failed");
91517e19bc4SViacheslav Ovsiienko 		goto error;
91617e19bc4SViacheslav Ovsiienko 	}
91717e19bc4SViacheslav Ovsiienko 	sh->refcnt = 1;
918e6818853SXueming Li 	sh->bond_dev = UINT16_MAX;
91917e19bc4SViacheslav Ovsiienko 	sh->max_port = spawn->max_port;
920f44b09f9SOphir Munk 	strncpy(sh->ibdev_name, mlx5_os_get_ctx_device_name(sh->ctx),
921f44b09f9SOphir Munk 		sizeof(sh->ibdev_name) - 1);
922f44b09f9SOphir Munk 	strncpy(sh->ibdev_path, mlx5_os_get_ctx_device_path(sh->ctx),
923f44b09f9SOphir Munk 		sizeof(sh->ibdev_path) - 1);
92453e5a82fSViacheslav Ovsiienko 	/*
92553e5a82fSViacheslav Ovsiienko 	 * Setting port_id to max unallowed value means
92653e5a82fSViacheslav Ovsiienko 	 * there is no interrupt subhandler installed for
92753e5a82fSViacheslav Ovsiienko 	 * the given port index i.
92853e5a82fSViacheslav Ovsiienko 	 */
92923242063SMatan Azrad 	for (i = 0; i < sh->max_port; i++) {
93053e5a82fSViacheslav Ovsiienko 		sh->port[i].ih_port_id = RTE_MAX_ETHPORTS;
93123242063SMatan Azrad 		sh->port[i].devx_ih_port_id = RTE_MAX_ETHPORTS;
93223242063SMatan Azrad 	}
93317e19bc4SViacheslav Ovsiienko 	sh->pd = mlx5_glue->alloc_pd(sh->ctx);
93417e19bc4SViacheslav Ovsiienko 	if (sh->pd == NULL) {
93517e19bc4SViacheslav Ovsiienko 		DRV_LOG(ERR, "PD allocation failure");
93617e19bc4SViacheslav Ovsiienko 		err = ENOMEM;
93717e19bc4SViacheslav Ovsiienko 		goto error;
93817e19bc4SViacheslav Ovsiienko 	}
939ae18a1aeSOri Kam 	if (sh->devx) {
940e7055bbfSMichael Baum 		/* Query the EQN for this core. */
9418dc775d8SMatan Azrad 		err = mlx5_glue->devx_query_eqn(sh->ctx, 0, &sh->eqn);
942e7055bbfSMichael Baum 		if (err) {
943e7055bbfSMichael Baum 			rte_errno = errno;
944e7055bbfSMichael Baum 			DRV_LOG(ERR, "Failed to query event queue number %d.",
945e7055bbfSMichael Baum 				rte_errno);
946e7055bbfSMichael Baum 			goto error;
947e7055bbfSMichael Baum 		}
9482eb4d010SOphir Munk 		err = mlx5_os_get_pdn(sh->pd, &sh->pdn);
949b9d86122SDekel Peled 		if (err) {
950b9d86122SDekel Peled 			DRV_LOG(ERR, "Fail to extract pdn from PD");
951b9d86122SDekel Peled 			goto error;
952b9d86122SDekel Peled 		}
953ae18a1aeSOri Kam 		sh->td = mlx5_devx_cmd_create_td(sh->ctx);
954ae18a1aeSOri Kam 		if (!sh->td) {
955ae18a1aeSOri Kam 			DRV_LOG(ERR, "TD allocation failure");
956ae18a1aeSOri Kam 			err = ENOMEM;
957ae18a1aeSOri Kam 			goto error;
958ae18a1aeSOri Kam 		}
959ae18a1aeSOri Kam 		tis_attr.transport_domain = sh->td->id;
960ae18a1aeSOri Kam 		sh->tis = mlx5_devx_cmd_create_tis(sh->ctx, &tis_attr);
961ae18a1aeSOri Kam 		if (!sh->tis) {
962ae18a1aeSOri Kam 			DRV_LOG(ERR, "TIS allocation failure");
963ae18a1aeSOri Kam 			err = ENOMEM;
964ae18a1aeSOri Kam 			goto error;
965ae18a1aeSOri Kam 		}
966a0bfe9d5SViacheslav Ovsiienko 		err = mlx5_alloc_rxtx_uars(sh, config);
967a0bfe9d5SViacheslav Ovsiienko 		if (err)
968fc4d4f73SViacheslav Ovsiienko 			goto error;
9691f66ac5bSOphir Munk 		MLX5_ASSERT(sh->tx_uar);
9701f66ac5bSOphir Munk 		MLX5_ASSERT(mlx5_os_get_devx_uar_base_addr(sh->tx_uar));
9711f66ac5bSOphir Munk 
9721f66ac5bSOphir Munk 		MLX5_ASSERT(sh->devx_rx_uar);
9731f66ac5bSOphir Munk 		MLX5_ASSERT(mlx5_os_get_devx_uar_base_addr(sh->devx_rx_uar));
974ae18a1aeSOri Kam 	}
97524feb045SViacheslav Ovsiienko #ifndef RTE_ARCH_64
97624feb045SViacheslav Ovsiienko 	/* Initialize UAR access locks for 32bit implementations. */
97724feb045SViacheslav Ovsiienko 	rte_spinlock_init(&sh->uar_lock_cq);
97824feb045SViacheslav Ovsiienko 	for (i = 0; i < MLX5_UAR_PAGE_NUM_MAX; i++)
97924feb045SViacheslav Ovsiienko 		rte_spinlock_init(&sh->uar_lock[i]);
98024feb045SViacheslav Ovsiienko #endif
981ab3cffcfSViacheslav Ovsiienko 	/*
982ab3cffcfSViacheslav Ovsiienko 	 * Once the device is added to the list of memory event
983ab3cffcfSViacheslav Ovsiienko 	 * callback, its global MR cache table cannot be expanded
984ab3cffcfSViacheslav Ovsiienko 	 * on the fly because of deadlock. If it overflows, lookup
985ab3cffcfSViacheslav Ovsiienko 	 * should be done by searching MR list linearly, which is slow.
986ab3cffcfSViacheslav Ovsiienko 	 *
987ab3cffcfSViacheslav Ovsiienko 	 * At this point the device is not added to the memory
988ab3cffcfSViacheslav Ovsiienko 	 * event list yet, context is just being created.
989ab3cffcfSViacheslav Ovsiienko 	 */
990b8dc6b0eSVu Pham 	err = mlx5_mr_btree_init(&sh->share_cache.cache,
991ab3cffcfSViacheslav Ovsiienko 				 MLX5_MR_BTREE_CACHE_N * 2,
99246e10a4cSViacheslav Ovsiienko 				 spawn->pci_dev->device.numa_node);
993ab3cffcfSViacheslav Ovsiienko 	if (err) {
994ab3cffcfSViacheslav Ovsiienko 		err = rte_errno;
995ab3cffcfSViacheslav Ovsiienko 		goto error;
996ab3cffcfSViacheslav Ovsiienko 	}
997d5ed8aa9SOphir Munk 	mlx5_os_set_reg_mr_cb(&sh->share_cache.reg_mr_cb,
998d5ed8aa9SOphir Munk 			      &sh->share_cache.dereg_mr_cb);
9992eb4d010SOphir Munk 	mlx5_os_dev_shared_handler_install(sh);
1000632f0f19SSuanming Mou 	sh->cnt_id_tbl = mlx5_l3t_create(MLX5_L3T_TYPE_DWORD);
1001632f0f19SSuanming Mou 	if (!sh->cnt_id_tbl) {
1002632f0f19SSuanming Mou 		err = rte_errno;
1003632f0f19SSuanming Mou 		goto error;
1004632f0f19SSuanming Mou 	}
1005fa2d01c8SDong Zhou 	mlx5_flow_aging_init(sh);
10065382d28cSMatan Azrad 	mlx5_flow_counters_mng_init(sh);
1007b88341caSSuanming Mou 	mlx5_flow_ipool_create(sh, config);
10080e3d0525SViacheslav Ovsiienko 	/* Add device to memory callback list. */
10090e3d0525SViacheslav Ovsiienko 	rte_rwlock_write_lock(&mlx5_shared_data->mem_event_rwlock);
10100e3d0525SViacheslav Ovsiienko 	LIST_INSERT_HEAD(&mlx5_shared_data->mem_event_cb_list,
10110e3d0525SViacheslav Ovsiienko 			 sh, mem_event_cb);
10120e3d0525SViacheslav Ovsiienko 	rte_rwlock_write_unlock(&mlx5_shared_data->mem_event_rwlock);
10130e3d0525SViacheslav Ovsiienko 	/* Add context to the global device list. */
101491389890SOphir Munk 	LIST_INSERT_HEAD(&mlx5_dev_ctx_list, sh, next);
101517e19bc4SViacheslav Ovsiienko exit:
101691389890SOphir Munk 	pthread_mutex_unlock(&mlx5_dev_ctx_list_mutex);
101717e19bc4SViacheslav Ovsiienko 	return sh;
101817e19bc4SViacheslav Ovsiienko error:
1019d133f4cdSViacheslav Ovsiienko 	pthread_mutex_destroy(&sh->txpp.mutex);
102091389890SOphir Munk 	pthread_mutex_unlock(&mlx5_dev_ctx_list_mutex);
10218e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(sh);
1022a0bfe9d5SViacheslav Ovsiienko 	if (sh->cnt_id_tbl)
1023632f0f19SSuanming Mou 		mlx5_l3t_destroy(sh->cnt_id_tbl);
1024ae18a1aeSOri Kam 	if (sh->tis)
1025ae18a1aeSOri Kam 		claim_zero(mlx5_devx_cmd_destroy(sh->tis));
1026ae18a1aeSOri Kam 	if (sh->td)
1027ae18a1aeSOri Kam 		claim_zero(mlx5_devx_cmd_destroy(sh->td));
102808d1838fSDekel Peled 	if (sh->devx_rx_uar)
102908d1838fSDekel Peled 		mlx5_glue->devx_free_uar(sh->devx_rx_uar);
1030a0bfe9d5SViacheslav Ovsiienko 	if (sh->tx_uar)
1031a0bfe9d5SViacheslav Ovsiienko 		mlx5_glue->devx_free_uar(sh->tx_uar);
103217e19bc4SViacheslav Ovsiienko 	if (sh->pd)
103317e19bc4SViacheslav Ovsiienko 		claim_zero(mlx5_glue->dealloc_pd(sh->pd));
103417e19bc4SViacheslav Ovsiienko 	if (sh->ctx)
103517e19bc4SViacheslav Ovsiienko 		claim_zero(mlx5_glue->close_device(sh->ctx));
10362175c4dcSSuanming Mou 	mlx5_free(sh);
10378e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(err > 0);
103817e19bc4SViacheslav Ovsiienko 	rte_errno = err;
103917e19bc4SViacheslav Ovsiienko 	return NULL;
104017e19bc4SViacheslav Ovsiienko }
104117e19bc4SViacheslav Ovsiienko 
104217e19bc4SViacheslav Ovsiienko /**
104317e19bc4SViacheslav Ovsiienko  * Free shared IB device context. Decrement counter and if zero free
104417e19bc4SViacheslav Ovsiienko  * all allocated resources and close handles.
104517e19bc4SViacheslav Ovsiienko  *
104617e19bc4SViacheslav Ovsiienko  * @param[in] sh
10476e88bc42SOphir Munk  *   Pointer to mlx5_dev_ctx_shared object to free
104817e19bc4SViacheslav Ovsiienko  */
10492eb4d010SOphir Munk void
105091389890SOphir Munk mlx5_free_shared_dev_ctx(struct mlx5_dev_ctx_shared *sh)
105117e19bc4SViacheslav Ovsiienko {
105291389890SOphir Munk 	pthread_mutex_lock(&mlx5_dev_ctx_list_mutex);
10530afacb04SAlexander Kozyrev #ifdef RTE_LIBRTE_MLX5_DEBUG
105417e19bc4SViacheslav Ovsiienko 	/* Check the object presence in the list. */
10556e88bc42SOphir Munk 	struct mlx5_dev_ctx_shared *lctx;
105617e19bc4SViacheslav Ovsiienko 
105791389890SOphir Munk 	LIST_FOREACH(lctx, &mlx5_dev_ctx_list, next)
105817e19bc4SViacheslav Ovsiienko 		if (lctx == sh)
105917e19bc4SViacheslav Ovsiienko 			break;
10608e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(lctx);
106117e19bc4SViacheslav Ovsiienko 	if (lctx != sh) {
106217e19bc4SViacheslav Ovsiienko 		DRV_LOG(ERR, "Freeing non-existing shared IB context");
106317e19bc4SViacheslav Ovsiienko 		goto exit;
106417e19bc4SViacheslav Ovsiienko 	}
106517e19bc4SViacheslav Ovsiienko #endif
10668e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(sh);
10678e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(sh->refcnt);
106817e19bc4SViacheslav Ovsiienko 	/* Secondary process should not free the shared context. */
10698e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(rte_eal_process_type() == RTE_PROC_PRIMARY);
107017e19bc4SViacheslav Ovsiienko 	if (--sh->refcnt)
107117e19bc4SViacheslav Ovsiienko 		goto exit;
10720e3d0525SViacheslav Ovsiienko 	/* Remove from memory callback device list. */
10730e3d0525SViacheslav Ovsiienko 	rte_rwlock_write_lock(&mlx5_shared_data->mem_event_rwlock);
10740e3d0525SViacheslav Ovsiienko 	LIST_REMOVE(sh, mem_event_cb);
10750e3d0525SViacheslav Ovsiienko 	rte_rwlock_write_unlock(&mlx5_shared_data->mem_event_rwlock);
10764f8e6befSMichael Baum 	/* Release created Memory Regions. */
1077b8dc6b0eSVu Pham 	mlx5_mr_release_cache(&sh->share_cache);
10780e3d0525SViacheslav Ovsiienko 	/* Remove context from the global device list. */
107917e19bc4SViacheslav Ovsiienko 	LIST_REMOVE(sh, next);
1080f4a08731SMichael Baum 	pthread_mutex_unlock(&mlx5_dev_ctx_list_mutex);
108153e5a82fSViacheslav Ovsiienko 	/*
108253e5a82fSViacheslav Ovsiienko 	 *  Ensure there is no async event handler installed.
108353e5a82fSViacheslav Ovsiienko 	 *  Only primary process handles async device events.
108453e5a82fSViacheslav Ovsiienko 	 **/
10855382d28cSMatan Azrad 	mlx5_flow_counters_mng_close(sh);
1086f935ed4bSDekel Peled 	if (sh->aso_age_mng) {
1087f935ed4bSDekel Peled 		mlx5_flow_aso_age_mng_close(sh);
1088f935ed4bSDekel Peled 		sh->aso_age_mng = NULL;
1089f935ed4bSDekel Peled 	}
1090014d1cbeSSuanming Mou 	mlx5_flow_ipool_destroy(sh);
10912eb4d010SOphir Munk 	mlx5_os_dev_shared_handler_uninstall(sh);
1092632f0f19SSuanming Mou 	if (sh->cnt_id_tbl) {
1093632f0f19SSuanming Mou 		mlx5_l3t_destroy(sh->cnt_id_tbl);
1094632f0f19SSuanming Mou 		sh->cnt_id_tbl = NULL;
1095632f0f19SSuanming Mou 	}
1096fc4d4f73SViacheslav Ovsiienko 	if (sh->tx_uar) {
1097fc4d4f73SViacheslav Ovsiienko 		mlx5_glue->devx_free_uar(sh->tx_uar);
1098fc4d4f73SViacheslav Ovsiienko 		sh->tx_uar = NULL;
1099fc4d4f73SViacheslav Ovsiienko 	}
110017e19bc4SViacheslav Ovsiienko 	if (sh->pd)
110117e19bc4SViacheslav Ovsiienko 		claim_zero(mlx5_glue->dealloc_pd(sh->pd));
1102ae18a1aeSOri Kam 	if (sh->tis)
1103ae18a1aeSOri Kam 		claim_zero(mlx5_devx_cmd_destroy(sh->tis));
1104ae18a1aeSOri Kam 	if (sh->td)
1105ae18a1aeSOri Kam 		claim_zero(mlx5_devx_cmd_destroy(sh->td));
110608d1838fSDekel Peled 	if (sh->devx_rx_uar)
110708d1838fSDekel Peled 		mlx5_glue->devx_free_uar(sh->devx_rx_uar);
110817e19bc4SViacheslav Ovsiienko 	if (sh->ctx)
110917e19bc4SViacheslav Ovsiienko 		claim_zero(mlx5_glue->close_device(sh->ctx));
1110d133f4cdSViacheslav Ovsiienko 	pthread_mutex_destroy(&sh->txpp.mutex);
11112175c4dcSSuanming Mou 	mlx5_free(sh);
1112f4a08731SMichael Baum 	return;
111317e19bc4SViacheslav Ovsiienko exit:
111491389890SOphir Munk 	pthread_mutex_unlock(&mlx5_dev_ctx_list_mutex);
111517e19bc4SViacheslav Ovsiienko }
111617e19bc4SViacheslav Ovsiienko 
1117771fa900SAdrien Mazarguil /**
1118afd7a625SXueming Li  * Destroy table hash list.
111954534725SMatan Azrad  *
112054534725SMatan Azrad  * @param[in] priv
112154534725SMatan Azrad  *   Pointer to the private device data structure.
112254534725SMatan Azrad  */
11232eb4d010SOphir Munk void
112454534725SMatan Azrad mlx5_free_table_hash_list(struct mlx5_priv *priv)
112554534725SMatan Azrad {
11266e88bc42SOphir Munk 	struct mlx5_dev_ctx_shared *sh = priv->sh;
112754534725SMatan Azrad 
112854534725SMatan Azrad 	if (!sh->flow_tbls)
112954534725SMatan Azrad 		return;
1130e69a5922SXueming Li 	mlx5_hlist_destroy(sh->flow_tbls);
113154534725SMatan Azrad }
113254534725SMatan Azrad 
113354534725SMatan Azrad /**
113454534725SMatan Azrad  * Initialize flow table hash list and create the root tables entry
113554534725SMatan Azrad  * for each domain.
113654534725SMatan Azrad  *
113754534725SMatan Azrad  * @param[in] priv
113854534725SMatan Azrad  *   Pointer to the private device data structure.
113954534725SMatan Azrad  *
114054534725SMatan Azrad  * @return
114154534725SMatan Azrad  *   Zero on success, positive error code otherwise.
114254534725SMatan Azrad  */
11432eb4d010SOphir Munk int
1144afd7a625SXueming Li mlx5_alloc_table_hash_list(struct mlx5_priv *priv __rte_unused)
114554534725SMatan Azrad {
1146afd7a625SXueming Li 	int err = 0;
1147afd7a625SXueming Li 	/* Tables are only used in DV and DR modes. */
1148afd7a625SXueming Li #ifdef HAVE_IBV_FLOW_DV_SUPPORT
11496e88bc42SOphir Munk 	struct mlx5_dev_ctx_shared *sh = priv->sh;
115054534725SMatan Azrad 	char s[MLX5_HLIST_NAMESIZE];
115154534725SMatan Azrad 
11528e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(sh);
115354534725SMatan Azrad 	snprintf(s, sizeof(s), "%s_flow_table", priv->sh->ibdev_name);
1154e69a5922SXueming Li 	sh->flow_tbls = mlx5_hlist_create(s, MLX5_FLOW_TABLE_HLIST_ARRAY_SIZE,
1155afd7a625SXueming Li 					  0, 0, flow_dv_tbl_create_cb, NULL,
1156afd7a625SXueming Li 					  flow_dv_tbl_remove_cb);
115754534725SMatan Azrad 	if (!sh->flow_tbls) {
115863783b01SDavid Marchand 		DRV_LOG(ERR, "flow tables with hash creation failed.");
115954534725SMatan Azrad 		err = ENOMEM;
116054534725SMatan Azrad 		return err;
116154534725SMatan Azrad 	}
1162afd7a625SXueming Li 	sh->flow_tbls->ctx = sh;
116354534725SMatan Azrad #ifndef HAVE_MLX5DV_DR
1164afd7a625SXueming Li 	struct rte_flow_error error;
1165afd7a625SXueming Li 	struct rte_eth_dev *dev = &rte_eth_devices[priv->dev_data->port_id];
1166afd7a625SXueming Li 
116754534725SMatan Azrad 	/*
116854534725SMatan Azrad 	 * In case we have not DR support, the zero tables should be created
116954534725SMatan Azrad 	 * because DV expect to see them even if they cannot be created by
117054534725SMatan Azrad 	 * RDMA-CORE.
117154534725SMatan Azrad 	 */
1172afd7a625SXueming Li 	if (!flow_dv_tbl_resource_get(dev, 0, 0, 0, 0, NULL, 0, 1, &error) ||
1173afd7a625SXueming Li 	    !flow_dv_tbl_resource_get(dev, 0, 1, 0, 0, NULL, 0, 1, &error) ||
1174afd7a625SXueming Li 	    !flow_dv_tbl_resource_get(dev, 0, 0, 1, 0, NULL, 0, 1, &error)) {
117554534725SMatan Azrad 		err = ENOMEM;
117654534725SMatan Azrad 		goto error;
117754534725SMatan Azrad 	}
117854534725SMatan Azrad 	return err;
117954534725SMatan Azrad error:
118054534725SMatan Azrad 	mlx5_free_table_hash_list(priv);
118154534725SMatan Azrad #endif /* HAVE_MLX5DV_DR */
1182afd7a625SXueming Li #endif
118354534725SMatan Azrad 	return err;
118454534725SMatan Azrad }
118554534725SMatan Azrad 
118654534725SMatan Azrad /**
11874d803a72SOlga Shern  * Retrieve integer value from environment variable.
11884d803a72SOlga Shern  *
11894d803a72SOlga Shern  * @param[in] name
11904d803a72SOlga Shern  *   Environment variable name.
11914d803a72SOlga Shern  *
11924d803a72SOlga Shern  * @return
11934d803a72SOlga Shern  *   Integer value, 0 if the variable is not set.
11944d803a72SOlga Shern  */
11954d803a72SOlga Shern int
11964d803a72SOlga Shern mlx5_getenv_int(const char *name)
11974d803a72SOlga Shern {
11984d803a72SOlga Shern 	const char *val = getenv(name);
11994d803a72SOlga Shern 
12004d803a72SOlga Shern 	if (val == NULL)
12014d803a72SOlga Shern 		return 0;
12024d803a72SOlga Shern 	return atoi(val);
12034d803a72SOlga Shern }
12044d803a72SOlga Shern 
12054d803a72SOlga Shern /**
1206c9ba7523SRaslan Darawsheh  * DPDK callback to add udp tunnel port
1207c9ba7523SRaslan Darawsheh  *
1208c9ba7523SRaslan Darawsheh  * @param[in] dev
1209c9ba7523SRaslan Darawsheh  *   A pointer to eth_dev
1210c9ba7523SRaslan Darawsheh  * @param[in] udp_tunnel
1211c9ba7523SRaslan Darawsheh  *   A pointer to udp tunnel
1212c9ba7523SRaslan Darawsheh  *
1213c9ba7523SRaslan Darawsheh  * @return
1214c9ba7523SRaslan Darawsheh  *   0 on valid udp ports and tunnels, -ENOTSUP otherwise.
1215c9ba7523SRaslan Darawsheh  */
1216c9ba7523SRaslan Darawsheh int
1217c9ba7523SRaslan Darawsheh mlx5_udp_tunnel_port_add(struct rte_eth_dev *dev __rte_unused,
1218c9ba7523SRaslan Darawsheh 			 struct rte_eth_udp_tunnel *udp_tunnel)
1219c9ba7523SRaslan Darawsheh {
12208e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(udp_tunnel != NULL);
1221c9ba7523SRaslan Darawsheh 	if (udp_tunnel->prot_type == RTE_TUNNEL_TYPE_VXLAN &&
1222c9ba7523SRaslan Darawsheh 	    udp_tunnel->udp_port == 4789)
1223c9ba7523SRaslan Darawsheh 		return 0;
1224c9ba7523SRaslan Darawsheh 	if (udp_tunnel->prot_type == RTE_TUNNEL_TYPE_VXLAN_GPE &&
1225c9ba7523SRaslan Darawsheh 	    udp_tunnel->udp_port == 4790)
1226c9ba7523SRaslan Darawsheh 		return 0;
1227c9ba7523SRaslan Darawsheh 	return -ENOTSUP;
1228c9ba7523SRaslan Darawsheh }
1229c9ba7523SRaslan Darawsheh 
1230c9ba7523SRaslan Darawsheh /**
1231120dc4a7SYongseok Koh  * Initialize process private data structure.
1232120dc4a7SYongseok Koh  *
1233120dc4a7SYongseok Koh  * @param dev
1234120dc4a7SYongseok Koh  *   Pointer to Ethernet device structure.
1235120dc4a7SYongseok Koh  *
1236120dc4a7SYongseok Koh  * @return
1237120dc4a7SYongseok Koh  *   0 on success, a negative errno value otherwise and rte_errno is set.
1238120dc4a7SYongseok Koh  */
1239120dc4a7SYongseok Koh int
1240120dc4a7SYongseok Koh mlx5_proc_priv_init(struct rte_eth_dev *dev)
1241120dc4a7SYongseok Koh {
1242120dc4a7SYongseok Koh 	struct mlx5_priv *priv = dev->data->dev_private;
1243120dc4a7SYongseok Koh 	struct mlx5_proc_priv *ppriv;
1244120dc4a7SYongseok Koh 	size_t ppriv_size;
1245120dc4a7SYongseok Koh 
1246120dc4a7SYongseok Koh 	/*
1247120dc4a7SYongseok Koh 	 * UAR register table follows the process private structure. BlueFlame
1248120dc4a7SYongseok Koh 	 * registers for Tx queues are stored in the table.
1249120dc4a7SYongseok Koh 	 */
1250120dc4a7SYongseok Koh 	ppriv_size =
1251120dc4a7SYongseok Koh 		sizeof(struct mlx5_proc_priv) + priv->txqs_n * sizeof(void *);
12522175c4dcSSuanming Mou 	ppriv = mlx5_malloc(MLX5_MEM_RTE, ppriv_size, RTE_CACHE_LINE_SIZE,
12532175c4dcSSuanming Mou 			    dev->device->numa_node);
1254120dc4a7SYongseok Koh 	if (!ppriv) {
1255120dc4a7SYongseok Koh 		rte_errno = ENOMEM;
1256120dc4a7SYongseok Koh 		return -rte_errno;
1257120dc4a7SYongseok Koh 	}
1258120dc4a7SYongseok Koh 	ppriv->uar_table_sz = ppriv_size;
1259120dc4a7SYongseok Koh 	dev->process_private = ppriv;
1260120dc4a7SYongseok Koh 	return 0;
1261120dc4a7SYongseok Koh }
1262120dc4a7SYongseok Koh 
1263120dc4a7SYongseok Koh /**
1264120dc4a7SYongseok Koh  * Un-initialize process private data structure.
1265120dc4a7SYongseok Koh  *
1266120dc4a7SYongseok Koh  * @param dev
1267120dc4a7SYongseok Koh  *   Pointer to Ethernet device structure.
1268120dc4a7SYongseok Koh  */
1269120dc4a7SYongseok Koh static void
1270120dc4a7SYongseok Koh mlx5_proc_priv_uninit(struct rte_eth_dev *dev)
1271120dc4a7SYongseok Koh {
1272120dc4a7SYongseok Koh 	if (!dev->process_private)
1273120dc4a7SYongseok Koh 		return;
12742175c4dcSSuanming Mou 	mlx5_free(dev->process_private);
1275120dc4a7SYongseok Koh 	dev->process_private = NULL;
1276120dc4a7SYongseok Koh }
1277120dc4a7SYongseok Koh 
1278120dc4a7SYongseok Koh /**
1279771fa900SAdrien Mazarguil  * DPDK callback to close the device.
1280771fa900SAdrien Mazarguil  *
1281771fa900SAdrien Mazarguil  * Destroy all queues and objects, free memory.
1282771fa900SAdrien Mazarguil  *
1283771fa900SAdrien Mazarguil  * @param dev
1284771fa900SAdrien Mazarguil  *   Pointer to Ethernet device structure.
1285771fa900SAdrien Mazarguil  */
1286b142387bSThomas Monjalon int
1287771fa900SAdrien Mazarguil mlx5_dev_close(struct rte_eth_dev *dev)
1288771fa900SAdrien Mazarguil {
1289dbeba4cfSThomas Monjalon 	struct mlx5_priv *priv = dev->data->dev_private;
12902e22920bSAdrien Mazarguil 	unsigned int i;
12916af6b973SNélio Laranjeiro 	int ret;
1292771fa900SAdrien Mazarguil 
12932786b7bfSSuanming Mou 	if (rte_eal_process_type() == RTE_PROC_SECONDARY) {
12942786b7bfSSuanming Mou 		/* Check if process_private released. */
12952786b7bfSSuanming Mou 		if (!dev->process_private)
1296b142387bSThomas Monjalon 			return 0;
12972786b7bfSSuanming Mou 		mlx5_tx_uar_uninit_secondary(dev);
12982786b7bfSSuanming Mou 		mlx5_proc_priv_uninit(dev);
12992786b7bfSSuanming Mou 		rte_eth_dev_release_port(dev);
1300b142387bSThomas Monjalon 		return 0;
13012786b7bfSSuanming Mou 	}
13022786b7bfSSuanming Mou 	if (!priv->sh)
1303b142387bSThomas Monjalon 		return 0;
1304a170a30dSNélio Laranjeiro 	DRV_LOG(DEBUG, "port %u closing device \"%s\"",
13050f99970bSNélio Laranjeiro 		dev->data->port_id,
1306f44b09f9SOphir Munk 		((priv->sh->ctx != NULL) ?
1307f44b09f9SOphir Munk 		mlx5_os_get_ctx_device_name(priv->sh->ctx) : ""));
13088db7e3b6SBing Zhao 	/*
13098db7e3b6SBing Zhao 	 * If default mreg copy action is removed at the stop stage,
13108db7e3b6SBing Zhao 	 * the search will return none and nothing will be done anymore.
13118db7e3b6SBing Zhao 	 */
13128db7e3b6SBing Zhao 	mlx5_flow_stop_default(dev);
1313af4f09f2SNélio Laranjeiro 	mlx5_traffic_disable(dev);
13148db7e3b6SBing Zhao 	/*
13158db7e3b6SBing Zhao 	 * If all the flows are already flushed in the device stop stage,
13168db7e3b6SBing Zhao 	 * then this will return directly without any action.
13178db7e3b6SBing Zhao 	 */
13188db7e3b6SBing Zhao 	mlx5_flow_list_flush(dev, &priv->flows, true);
1319d7cfcdddSAndrey Vesnovaty 	mlx5_shared_action_flush(dev);
132002e76468SSuanming Mou 	mlx5_flow_meter_flush(dev, NULL);
13212e22920bSAdrien Mazarguil 	/* Prevent crashes when queues are still in use. */
13222e22920bSAdrien Mazarguil 	dev->rx_pkt_burst = removed_rx_burst;
13232e22920bSAdrien Mazarguil 	dev->tx_pkt_burst = removed_tx_burst;
13242aac5b5dSYongseok Koh 	rte_wmb();
13252aac5b5dSYongseok Koh 	/* Disable datapath on secondary process. */
13262e86c4e5SOphir Munk 	mlx5_mp_os_req_stop_rxtx(dev);
13271c506404SBing Zhao 	/* Free the eCPRI flex parser resource. */
13281c506404SBing Zhao 	mlx5_flex_parser_ecpri_release(dev);
13292e22920bSAdrien Mazarguil 	if (priv->rxqs != NULL) {
13302e22920bSAdrien Mazarguil 		/* XXX race condition if mlx5_rx_burst() is still running. */
13312e22920bSAdrien Mazarguil 		usleep(1000);
1332a1366b1aSNélio Laranjeiro 		for (i = 0; (i != priv->rxqs_n); ++i)
1333af4f09f2SNélio Laranjeiro 			mlx5_rxq_release(dev, i);
13342e22920bSAdrien Mazarguil 		priv->rxqs_n = 0;
13352e22920bSAdrien Mazarguil 		priv->rxqs = NULL;
13362e22920bSAdrien Mazarguil 	}
13372e22920bSAdrien Mazarguil 	if (priv->txqs != NULL) {
13382e22920bSAdrien Mazarguil 		/* XXX race condition if mlx5_tx_burst() is still running. */
13392e22920bSAdrien Mazarguil 		usleep(1000);
13406e78005aSNélio Laranjeiro 		for (i = 0; (i != priv->txqs_n); ++i)
1341af4f09f2SNélio Laranjeiro 			mlx5_txq_release(dev, i);
13422e22920bSAdrien Mazarguil 		priv->txqs_n = 0;
13432e22920bSAdrien Mazarguil 		priv->txqs = NULL;
13442e22920bSAdrien Mazarguil 	}
1345120dc4a7SYongseok Koh 	mlx5_proc_priv_uninit(dev);
134665b3cd0dSSuanming Mou 	if (priv->drop_queue.hrxq)
134765b3cd0dSSuanming Mou 		mlx5_drop_action_destroy(dev);
1348dd3c774fSViacheslav Ovsiienko 	if (priv->mreg_cp_tbl)
1349e69a5922SXueming Li 		mlx5_hlist_destroy(priv->mreg_cp_tbl);
13507d6bf6b8SYongseok Koh 	mlx5_mprq_free_mp(dev);
13512eb4d010SOphir Munk 	mlx5_os_free_shared_dr(priv);
135229c1d8bbSNélio Laranjeiro 	if (priv->rss_conf.rss_key != NULL)
135383c2047cSSuanming Mou 		mlx5_free(priv->rss_conf.rss_key);
1354634efbc2SNelio Laranjeiro 	if (priv->reta_idx != NULL)
135583c2047cSSuanming Mou 		mlx5_free(priv->reta_idx);
1356ccdcba53SNélio Laranjeiro 	if (priv->config.vf)
1357f00f6562SOphir Munk 		mlx5_os_mac_addr_flush(dev);
135826c08b97SAdrien Mazarguil 	if (priv->nl_socket_route >= 0)
135926c08b97SAdrien Mazarguil 		close(priv->nl_socket_route);
136026c08b97SAdrien Mazarguil 	if (priv->nl_socket_rdma >= 0)
136126c08b97SAdrien Mazarguil 		close(priv->nl_socket_rdma);
1362dfedf3e3SViacheslav Ovsiienko 	if (priv->vmwa_context)
1363dfedf3e3SViacheslav Ovsiienko 		mlx5_vlan_vmwa_exit(priv->vmwa_context);
136423820a79SDekel Peled 	ret = mlx5_hrxq_verify(dev);
1365f5479b68SNélio Laranjeiro 	if (ret)
1366a170a30dSNélio Laranjeiro 		DRV_LOG(WARNING, "port %u some hash Rx queue still remain",
13670f99970bSNélio Laranjeiro 			dev->data->port_id);
136815c80a12SDekel Peled 	ret = mlx5_ind_table_obj_verify(dev);
13694c7a0f5fSNélio Laranjeiro 	if (ret)
1370a170a30dSNélio Laranjeiro 		DRV_LOG(WARNING, "port %u some indirection table still remain",
13710f99970bSNélio Laranjeiro 			dev->data->port_id);
137293403560SDekel Peled 	ret = mlx5_rxq_obj_verify(dev);
137309cb5b58SNélio Laranjeiro 	if (ret)
137493403560SDekel Peled 		DRV_LOG(WARNING, "port %u some Rx queue objects still remain",
13750f99970bSNélio Laranjeiro 			dev->data->port_id);
1376af4f09f2SNélio Laranjeiro 	ret = mlx5_rxq_verify(dev);
1377a1366b1aSNélio Laranjeiro 	if (ret)
1378a170a30dSNélio Laranjeiro 		DRV_LOG(WARNING, "port %u some Rx queues still remain",
13790f99970bSNélio Laranjeiro 			dev->data->port_id);
1380894c4a8eSOri Kam 	ret = mlx5_txq_obj_verify(dev);
1381faf2667fSNélio Laranjeiro 	if (ret)
1382a170a30dSNélio Laranjeiro 		DRV_LOG(WARNING, "port %u some Verbs Tx queue still remain",
13830f99970bSNélio Laranjeiro 			dev->data->port_id);
1384af4f09f2SNélio Laranjeiro 	ret = mlx5_txq_verify(dev);
13856e78005aSNélio Laranjeiro 	if (ret)
1386a170a30dSNélio Laranjeiro 		DRV_LOG(WARNING, "port %u some Tx queues still remain",
13870f99970bSNélio Laranjeiro 			dev->data->port_id);
1388af4f09f2SNélio Laranjeiro 	ret = mlx5_flow_verify(dev);
13896af6b973SNélio Laranjeiro 	if (ret)
1390a170a30dSNélio Laranjeiro 		DRV_LOG(WARNING, "port %u some flows still remain",
1391a170a30dSNélio Laranjeiro 			dev->data->port_id);
1392e1592b6cSSuanming Mou 	mlx5_cache_list_destroy(&priv->hrxqs);
1393772dc0ebSSuanming Mou 	/*
1394772dc0ebSSuanming Mou 	 * Free the shared context in last turn, because the cleanup
1395772dc0ebSSuanming Mou 	 * routines above may use some shared fields, like
1396f00f6562SOphir Munk 	 * mlx5_os_mac_addr_flush() uses ibdev_path for retrieveing
1397772dc0ebSSuanming Mou 	 * ifindex if Netlink fails.
1398772dc0ebSSuanming Mou 	 */
139991389890SOphir Munk 	mlx5_free_shared_dev_ctx(priv->sh);
14002b730263SAdrien Mazarguil 	if (priv->domain_id != RTE_ETH_DEV_SWITCH_DOMAIN_ID_INVALID) {
14012b730263SAdrien Mazarguil 		unsigned int c = 0;
1402d874a4eeSThomas Monjalon 		uint16_t port_id;
14032b730263SAdrien Mazarguil 
1404fbc83412SViacheslav Ovsiienko 		MLX5_ETH_FOREACH_DEV(port_id, priv->pci_dev) {
1405dbeba4cfSThomas Monjalon 			struct mlx5_priv *opriv =
1406d874a4eeSThomas Monjalon 				rte_eth_devices[port_id].data->dev_private;
14072b730263SAdrien Mazarguil 
14082b730263SAdrien Mazarguil 			if (!opriv ||
14092b730263SAdrien Mazarguil 			    opriv->domain_id != priv->domain_id ||
1410d874a4eeSThomas Monjalon 			    &rte_eth_devices[port_id] == dev)
14112b730263SAdrien Mazarguil 				continue;
14122b730263SAdrien Mazarguil 			++c;
1413f7e95215SViacheslav Ovsiienko 			break;
14142b730263SAdrien Mazarguil 		}
14152b730263SAdrien Mazarguil 		if (!c)
14162b730263SAdrien Mazarguil 			claim_zero(rte_eth_switch_domain_free(priv->domain_id));
14172b730263SAdrien Mazarguil 	}
1418771fa900SAdrien Mazarguil 	memset(priv, 0, sizeof(*priv));
14192b730263SAdrien Mazarguil 	priv->domain_id = RTE_ETH_DEV_SWITCH_DOMAIN_ID_INVALID;
142042603bbdSOphir Munk 	/*
142142603bbdSOphir Munk 	 * Reset mac_addrs to NULL such that it is not freed as part of
142242603bbdSOphir Munk 	 * rte_eth_dev_release_port(). mac_addrs is part of dev_private so
142342603bbdSOphir Munk 	 * it is freed when dev_private is freed.
142442603bbdSOphir Munk 	 */
142542603bbdSOphir Munk 	dev->data->mac_addrs = NULL;
1426b142387bSThomas Monjalon 	return 0;
1427771fa900SAdrien Mazarguil }
1428771fa900SAdrien Mazarguil 
1429e72dd09bSNélio Laranjeiro /**
1430e72dd09bSNélio Laranjeiro  * Verify and store value for device argument.
1431e72dd09bSNélio Laranjeiro  *
1432e72dd09bSNélio Laranjeiro  * @param[in] key
1433e72dd09bSNélio Laranjeiro  *   Key argument to verify.
1434e72dd09bSNélio Laranjeiro  * @param[in] val
1435e72dd09bSNélio Laranjeiro  *   Value associated with key.
1436e72dd09bSNélio Laranjeiro  * @param opaque
1437e72dd09bSNélio Laranjeiro  *   User data.
1438e72dd09bSNélio Laranjeiro  *
1439e72dd09bSNélio Laranjeiro  * @return
1440a6d83b6aSNélio Laranjeiro  *   0 on success, a negative errno value otherwise and rte_errno is set.
1441e72dd09bSNélio Laranjeiro  */
1442e72dd09bSNélio Laranjeiro static int
1443e72dd09bSNélio Laranjeiro mlx5_args_check(const char *key, const char *val, void *opaque)
1444e72dd09bSNélio Laranjeiro {
14457fe24446SShahaf Shuler 	struct mlx5_dev_config *config = opaque;
14468f848f32SViacheslav Ovsiienko 	unsigned long mod;
14478f848f32SViacheslav Ovsiienko 	signed long tmp;
1448e72dd09bSNélio Laranjeiro 
14496de569f5SAdrien Mazarguil 	/* No-op, port representors are processed in mlx5_dev_spawn(). */
14506de569f5SAdrien Mazarguil 	if (!strcmp(MLX5_REPRESENTOR, key))
14516de569f5SAdrien Mazarguil 		return 0;
145299c12dccSNélio Laranjeiro 	errno = 0;
14538f848f32SViacheslav Ovsiienko 	tmp = strtol(val, NULL, 0);
145499c12dccSNélio Laranjeiro 	if (errno) {
1455a6d83b6aSNélio Laranjeiro 		rte_errno = errno;
1456a170a30dSNélio Laranjeiro 		DRV_LOG(WARNING, "%s: \"%s\" is not a valid integer", key, val);
1457a6d83b6aSNélio Laranjeiro 		return -rte_errno;
145899c12dccSNélio Laranjeiro 	}
14598f848f32SViacheslav Ovsiienko 	if (tmp < 0 && strcmp(MLX5_TX_PP, key) && strcmp(MLX5_TX_SKEW, key)) {
14608f848f32SViacheslav Ovsiienko 		/* Negative values are acceptable for some keys only. */
14618f848f32SViacheslav Ovsiienko 		rte_errno = EINVAL;
14628f848f32SViacheslav Ovsiienko 		DRV_LOG(WARNING, "%s: invalid negative value \"%s\"", key, val);
14638f848f32SViacheslav Ovsiienko 		return -rte_errno;
14648f848f32SViacheslav Ovsiienko 	}
14658f848f32SViacheslav Ovsiienko 	mod = tmp >= 0 ? tmp : -tmp;
146699c12dccSNélio Laranjeiro 	if (strcmp(MLX5_RXQ_CQE_COMP_EN, key) == 0) {
146754c2d46bSAlexander Kozyrev 		if (tmp > MLX5_CQE_RESP_FORMAT_L34H_STRIDX) {
146854c2d46bSAlexander Kozyrev 			DRV_LOG(ERR, "invalid CQE compression "
146954c2d46bSAlexander Kozyrev 				     "format parameter");
147054c2d46bSAlexander Kozyrev 			rte_errno = EINVAL;
147154c2d46bSAlexander Kozyrev 			return -rte_errno;
147254c2d46bSAlexander Kozyrev 		}
14737fe24446SShahaf Shuler 		config->cqe_comp = !!tmp;
147454c2d46bSAlexander Kozyrev 		config->cqe_comp_fmt = tmp;
1475bc91e8dbSYongseok Koh 	} else if (strcmp(MLX5_RXQ_CQE_PAD_EN, key) == 0) {
1476bc91e8dbSYongseok Koh 		config->cqe_pad = !!tmp;
147778c7a16dSYongseok Koh 	} else if (strcmp(MLX5_RXQ_PKT_PAD_EN, key) == 0) {
147878c7a16dSYongseok Koh 		config->hw_padding = !!tmp;
14797d6bf6b8SYongseok Koh 	} else if (strcmp(MLX5_RX_MPRQ_EN, key) == 0) {
14807d6bf6b8SYongseok Koh 		config->mprq.enabled = !!tmp;
14817d6bf6b8SYongseok Koh 	} else if (strcmp(MLX5_RX_MPRQ_LOG_STRIDE_NUM, key) == 0) {
14827d6bf6b8SYongseok Koh 		config->mprq.stride_num_n = tmp;
1483ecb16045SAlexander Kozyrev 	} else if (strcmp(MLX5_RX_MPRQ_LOG_STRIDE_SIZE, key) == 0) {
1484ecb16045SAlexander Kozyrev 		config->mprq.stride_size_n = tmp;
14857d6bf6b8SYongseok Koh 	} else if (strcmp(MLX5_RX_MPRQ_MAX_MEMCPY_LEN, key) == 0) {
14867d6bf6b8SYongseok Koh 		config->mprq.max_memcpy_len = tmp;
14877d6bf6b8SYongseok Koh 	} else if (strcmp(MLX5_RXQS_MIN_MPRQ, key) == 0) {
14887d6bf6b8SYongseok Koh 		config->mprq.min_rxqs_num = tmp;
14892a66cf37SYaacov Hazan 	} else if (strcmp(MLX5_TXQ_INLINE, key) == 0) {
1490505f1fe4SViacheslav Ovsiienko 		DRV_LOG(WARNING, "%s: deprecated parameter,"
1491505f1fe4SViacheslav Ovsiienko 				 " converted to txq_inline_max", key);
1492505f1fe4SViacheslav Ovsiienko 		config->txq_inline_max = tmp;
1493505f1fe4SViacheslav Ovsiienko 	} else if (strcmp(MLX5_TXQ_INLINE_MAX, key) == 0) {
1494505f1fe4SViacheslav Ovsiienko 		config->txq_inline_max = tmp;
1495505f1fe4SViacheslav Ovsiienko 	} else if (strcmp(MLX5_TXQ_INLINE_MIN, key) == 0) {
1496505f1fe4SViacheslav Ovsiienko 		config->txq_inline_min = tmp;
1497505f1fe4SViacheslav Ovsiienko 	} else if (strcmp(MLX5_TXQ_INLINE_MPW, key) == 0) {
1498505f1fe4SViacheslav Ovsiienko 		config->txq_inline_mpw = tmp;
14992a66cf37SYaacov Hazan 	} else if (strcmp(MLX5_TXQS_MIN_INLINE, key) == 0) {
15007fe24446SShahaf Shuler 		config->txqs_inline = tmp;
150109d8b416SYongseok Koh 	} else if (strcmp(MLX5_TXQS_MAX_VEC, key) == 0) {
1502a6bd4911SViacheslav Ovsiienko 		DRV_LOG(WARNING, "%s: deprecated parameter, ignored", key);
1503230189d9SNélio Laranjeiro 	} else if (strcmp(MLX5_TXQ_MPW_EN, key) == 0) {
1504f9de8718SShahaf Shuler 		config->mps = !!tmp;
15058409a285SViacheslav Ovsiienko 	} else if (strcmp(MLX5_TX_DB_NC, key) == 0) {
1506f078ceb6SViacheslav Ovsiienko 		if (tmp != MLX5_TXDB_CACHED &&
1507f078ceb6SViacheslav Ovsiienko 		    tmp != MLX5_TXDB_NCACHED &&
1508f078ceb6SViacheslav Ovsiienko 		    tmp != MLX5_TXDB_HEURISTIC) {
1509f078ceb6SViacheslav Ovsiienko 			DRV_LOG(ERR, "invalid Tx doorbell "
1510f078ceb6SViacheslav Ovsiienko 				     "mapping parameter");
1511f078ceb6SViacheslav Ovsiienko 			rte_errno = EINVAL;
1512f078ceb6SViacheslav Ovsiienko 			return -rte_errno;
1513f078ceb6SViacheslav Ovsiienko 		}
1514f078ceb6SViacheslav Ovsiienko 		config->dbnc = tmp;
15156ce84bd8SYongseok Koh 	} else if (strcmp(MLX5_TXQ_MPW_HDR_DSEG_EN, key) == 0) {
1516a6bd4911SViacheslav Ovsiienko 		DRV_LOG(WARNING, "%s: deprecated parameter, ignored", key);
15176ce84bd8SYongseok Koh 	} else if (strcmp(MLX5_TXQ_MAX_INLINE_LEN, key) == 0) {
1518505f1fe4SViacheslav Ovsiienko 		DRV_LOG(WARNING, "%s: deprecated parameter,"
1519505f1fe4SViacheslav Ovsiienko 				 " converted to txq_inline_mpw", key);
1520505f1fe4SViacheslav Ovsiienko 		config->txq_inline_mpw = tmp;
15215644d5b9SNelio Laranjeiro 	} else if (strcmp(MLX5_TX_VEC_EN, key) == 0) {
1522a6bd4911SViacheslav Ovsiienko 		DRV_LOG(WARNING, "%s: deprecated parameter, ignored", key);
15238f848f32SViacheslav Ovsiienko 	} else if (strcmp(MLX5_TX_PP, key) == 0) {
15248f848f32SViacheslav Ovsiienko 		if (!mod) {
15258f848f32SViacheslav Ovsiienko 			DRV_LOG(ERR, "Zero Tx packet pacing parameter");
15268f848f32SViacheslav Ovsiienko 			rte_errno = EINVAL;
15278f848f32SViacheslav Ovsiienko 			return -rte_errno;
15288f848f32SViacheslav Ovsiienko 		}
15298f848f32SViacheslav Ovsiienko 		config->tx_pp = tmp;
15308f848f32SViacheslav Ovsiienko 	} else if (strcmp(MLX5_TX_SKEW, key) == 0) {
15318f848f32SViacheslav Ovsiienko 		config->tx_skew = tmp;
15325644d5b9SNelio Laranjeiro 	} else if (strcmp(MLX5_RX_VEC_EN, key) == 0) {
15337fe24446SShahaf Shuler 		config->rx_vec_en = !!tmp;
153478a54648SXueming Li 	} else if (strcmp(MLX5_L3_VXLAN_EN, key) == 0) {
153578a54648SXueming Li 		config->l3_vxlan_en = !!tmp;
1536db209cc3SNélio Laranjeiro 	} else if (strcmp(MLX5_VF_NL_EN, key) == 0) {
1537db209cc3SNélio Laranjeiro 		config->vf_nl_en = !!tmp;
1538e2b4925eSOri Kam 	} else if (strcmp(MLX5_DV_ESW_EN, key) == 0) {
1539e2b4925eSOri Kam 		config->dv_esw_en = !!tmp;
154051e72d38SOri Kam 	} else if (strcmp(MLX5_DV_FLOW_EN, key) == 0) {
154151e72d38SOri Kam 		config->dv_flow_en = !!tmp;
15422d241515SViacheslav Ovsiienko 	} else if (strcmp(MLX5_DV_XMETA_EN, key) == 0) {
15432d241515SViacheslav Ovsiienko 		if (tmp != MLX5_XMETA_MODE_LEGACY &&
15442d241515SViacheslav Ovsiienko 		    tmp != MLX5_XMETA_MODE_META16 &&
15454ec6360dSGregory Etelson 		    tmp != MLX5_XMETA_MODE_META32 &&
15464ec6360dSGregory Etelson 		    tmp != MLX5_XMETA_MODE_MISS_INFO) {
1547f078ceb6SViacheslav Ovsiienko 			DRV_LOG(ERR, "invalid extensive "
15482d241515SViacheslav Ovsiienko 				     "metadata parameter");
15492d241515SViacheslav Ovsiienko 			rte_errno = EINVAL;
15502d241515SViacheslav Ovsiienko 			return -rte_errno;
15512d241515SViacheslav Ovsiienko 		}
15524ec6360dSGregory Etelson 		if (tmp != MLX5_XMETA_MODE_MISS_INFO)
15532d241515SViacheslav Ovsiienko 			config->dv_xmeta_en = tmp;
15544ec6360dSGregory Etelson 		else
15554ec6360dSGregory Etelson 			config->dv_miss_info = 1;
15560f0ae73aSShiri Kuzin 	} else if (strcmp(MLX5_LACP_BY_USER, key) == 0) {
15570f0ae73aSShiri Kuzin 		config->lacp_by_user = !!tmp;
1558dceb5029SYongseok Koh 	} else if (strcmp(MLX5_MR_EXT_MEMSEG_EN, key) == 0) {
1559dceb5029SYongseok Koh 		config->mr_ext_memseg_en = !!tmp;
1560066cfecdSMatan Azrad 	} else if (strcmp(MLX5_MAX_DUMP_FILES_NUM, key) == 0) {
1561066cfecdSMatan Azrad 		config->max_dump_files_num = tmp;
156221bb6c7eSDekel Peled 	} else if (strcmp(MLX5_LRO_TIMEOUT_USEC, key) == 0) {
156321bb6c7eSDekel Peled 		config->lro.timeout = tmp;
1564d768f324SMatan Azrad 	} else if (strcmp(MLX5_CLASS_ARG_NAME, key) == 0) {
1565d768f324SMatan Azrad 		DRV_LOG(DEBUG, "class argument is %s.", val);
15661ad9a3d0SBing Zhao 	} else if (strcmp(MLX5_HP_BUF_SIZE, key) == 0) {
15671ad9a3d0SBing Zhao 		config->log_hp_size = tmp;
1568a1da6f62SSuanming Mou 	} else if (strcmp(MLX5_RECLAIM_MEM, key) == 0) {
1569a1da6f62SSuanming Mou 		if (tmp != MLX5_RCM_NONE &&
1570a1da6f62SSuanming Mou 		    tmp != MLX5_RCM_LIGHT &&
1571a1da6f62SSuanming Mou 		    tmp != MLX5_RCM_AGGR) {
1572a1da6f62SSuanming Mou 			DRV_LOG(ERR, "Unrecognize %s: \"%s\"", key, val);
1573a1da6f62SSuanming Mou 			rte_errno = EINVAL;
1574a1da6f62SSuanming Mou 			return -rte_errno;
1575a1da6f62SSuanming Mou 		}
1576a1da6f62SSuanming Mou 		config->reclaim_mode = tmp;
15775522da6bSSuanming Mou 	} else if (strcmp(MLX5_SYS_MEM_EN, key) == 0) {
15785522da6bSSuanming Mou 		config->sys_mem_en = !!tmp;
157950f95b23SSuanming Mou 	} else if (strcmp(MLX5_DECAP_EN, key) == 0) {
158050f95b23SSuanming Mou 		config->decap_en = !!tmp;
158199c12dccSNélio Laranjeiro 	} else {
1582a170a30dSNélio Laranjeiro 		DRV_LOG(WARNING, "%s: unknown parameter", key);
1583a6d83b6aSNélio Laranjeiro 		rte_errno = EINVAL;
1584a6d83b6aSNélio Laranjeiro 		return -rte_errno;
1585e72dd09bSNélio Laranjeiro 	}
158699c12dccSNélio Laranjeiro 	return 0;
158799c12dccSNélio Laranjeiro }
1588e72dd09bSNélio Laranjeiro 
1589e72dd09bSNélio Laranjeiro /**
1590e72dd09bSNélio Laranjeiro  * Parse device parameters.
1591e72dd09bSNélio Laranjeiro  *
15927fe24446SShahaf Shuler  * @param config
15937fe24446SShahaf Shuler  *   Pointer to device configuration structure.
1594e72dd09bSNélio Laranjeiro  * @param devargs
1595e72dd09bSNélio Laranjeiro  *   Device arguments structure.
1596e72dd09bSNélio Laranjeiro  *
1597e72dd09bSNélio Laranjeiro  * @return
1598a6d83b6aSNélio Laranjeiro  *   0 on success, a negative errno value otherwise and rte_errno is set.
1599e72dd09bSNélio Laranjeiro  */
16002eb4d010SOphir Munk int
16017fe24446SShahaf Shuler mlx5_args(struct mlx5_dev_config *config, struct rte_devargs *devargs)
1602e72dd09bSNélio Laranjeiro {
1603e72dd09bSNélio Laranjeiro 	const char **params = (const char *[]){
160499c12dccSNélio Laranjeiro 		MLX5_RXQ_CQE_COMP_EN,
1605bc91e8dbSYongseok Koh 		MLX5_RXQ_CQE_PAD_EN,
160678c7a16dSYongseok Koh 		MLX5_RXQ_PKT_PAD_EN,
16077d6bf6b8SYongseok Koh 		MLX5_RX_MPRQ_EN,
16087d6bf6b8SYongseok Koh 		MLX5_RX_MPRQ_LOG_STRIDE_NUM,
1609ecb16045SAlexander Kozyrev 		MLX5_RX_MPRQ_LOG_STRIDE_SIZE,
16107d6bf6b8SYongseok Koh 		MLX5_RX_MPRQ_MAX_MEMCPY_LEN,
16117d6bf6b8SYongseok Koh 		MLX5_RXQS_MIN_MPRQ,
16122a66cf37SYaacov Hazan 		MLX5_TXQ_INLINE,
1613505f1fe4SViacheslav Ovsiienko 		MLX5_TXQ_INLINE_MIN,
1614505f1fe4SViacheslav Ovsiienko 		MLX5_TXQ_INLINE_MAX,
1615505f1fe4SViacheslav Ovsiienko 		MLX5_TXQ_INLINE_MPW,
16162a66cf37SYaacov Hazan 		MLX5_TXQS_MIN_INLINE,
161709d8b416SYongseok Koh 		MLX5_TXQS_MAX_VEC,
1618230189d9SNélio Laranjeiro 		MLX5_TXQ_MPW_EN,
16196ce84bd8SYongseok Koh 		MLX5_TXQ_MPW_HDR_DSEG_EN,
16206ce84bd8SYongseok Koh 		MLX5_TXQ_MAX_INLINE_LEN,
16218409a285SViacheslav Ovsiienko 		MLX5_TX_DB_NC,
16228f848f32SViacheslav Ovsiienko 		MLX5_TX_PP,
16238f848f32SViacheslav Ovsiienko 		MLX5_TX_SKEW,
16245644d5b9SNelio Laranjeiro 		MLX5_TX_VEC_EN,
16255644d5b9SNelio Laranjeiro 		MLX5_RX_VEC_EN,
162678a54648SXueming Li 		MLX5_L3_VXLAN_EN,
1627db209cc3SNélio Laranjeiro 		MLX5_VF_NL_EN,
1628e2b4925eSOri Kam 		MLX5_DV_ESW_EN,
162951e72d38SOri Kam 		MLX5_DV_FLOW_EN,
16302d241515SViacheslav Ovsiienko 		MLX5_DV_XMETA_EN,
16310f0ae73aSShiri Kuzin 		MLX5_LACP_BY_USER,
1632dceb5029SYongseok Koh 		MLX5_MR_EXT_MEMSEG_EN,
16336de569f5SAdrien Mazarguil 		MLX5_REPRESENTOR,
1634066cfecdSMatan Azrad 		MLX5_MAX_DUMP_FILES_NUM,
163521bb6c7eSDekel Peled 		MLX5_LRO_TIMEOUT_USEC,
1636d768f324SMatan Azrad 		MLX5_CLASS_ARG_NAME,
16371ad9a3d0SBing Zhao 		MLX5_HP_BUF_SIZE,
1638a1da6f62SSuanming Mou 		MLX5_RECLAIM_MEM,
16395522da6bSSuanming Mou 		MLX5_SYS_MEM_EN,
164050f95b23SSuanming Mou 		MLX5_DECAP_EN,
1641e72dd09bSNélio Laranjeiro 		NULL,
1642e72dd09bSNélio Laranjeiro 	};
1643e72dd09bSNélio Laranjeiro 	struct rte_kvargs *kvlist;
1644e72dd09bSNélio Laranjeiro 	int ret = 0;
1645e72dd09bSNélio Laranjeiro 	int i;
1646e72dd09bSNélio Laranjeiro 
1647e72dd09bSNélio Laranjeiro 	if (devargs == NULL)
1648e72dd09bSNélio Laranjeiro 		return 0;
1649e72dd09bSNélio Laranjeiro 	/* Following UGLY cast is done to pass checkpatch. */
1650e72dd09bSNélio Laranjeiro 	kvlist = rte_kvargs_parse(devargs->args, params);
165115b0ea00SMatan Azrad 	if (kvlist == NULL) {
165215b0ea00SMatan Azrad 		rte_errno = EINVAL;
165315b0ea00SMatan Azrad 		return -rte_errno;
165415b0ea00SMatan Azrad 	}
1655e72dd09bSNélio Laranjeiro 	/* Process parameters. */
1656e72dd09bSNélio Laranjeiro 	for (i = 0; (params[i] != NULL); ++i) {
1657e72dd09bSNélio Laranjeiro 		if (rte_kvargs_count(kvlist, params[i])) {
1658e72dd09bSNélio Laranjeiro 			ret = rte_kvargs_process(kvlist, params[i],
16597fe24446SShahaf Shuler 						 mlx5_args_check, config);
1660a6d83b6aSNélio Laranjeiro 			if (ret) {
1661a6d83b6aSNélio Laranjeiro 				rte_errno = EINVAL;
1662a67323e4SShahaf Shuler 				rte_kvargs_free(kvlist);
1663a6d83b6aSNélio Laranjeiro 				return -rte_errno;
1664e72dd09bSNélio Laranjeiro 			}
1665e72dd09bSNélio Laranjeiro 		}
1666a67323e4SShahaf Shuler 	}
1667e72dd09bSNélio Laranjeiro 	rte_kvargs_free(kvlist);
1668e72dd09bSNélio Laranjeiro 	return 0;
1669e72dd09bSNélio Laranjeiro }
1670e72dd09bSNélio Laranjeiro 
16717be600c8SYongseok Koh /**
167238b4b397SViacheslav Ovsiienko  * Configures the minimal amount of data to inline into WQE
167338b4b397SViacheslav Ovsiienko  * while sending packets.
167438b4b397SViacheslav Ovsiienko  *
167538b4b397SViacheslav Ovsiienko  * - the txq_inline_min has the maximal priority, if this
167638b4b397SViacheslav Ovsiienko  *   key is specified in devargs
167738b4b397SViacheslav Ovsiienko  * - if DevX is enabled the inline mode is queried from the
167838b4b397SViacheslav Ovsiienko  *   device (HCA attributes and NIC vport context if needed).
1679ee76bddcSThomas Monjalon  * - otherwise L2 mode (18 bytes) is assumed for ConnectX-4/4 Lx
168038b4b397SViacheslav Ovsiienko  *   and none (0 bytes) for other NICs
168138b4b397SViacheslav Ovsiienko  *
168238b4b397SViacheslav Ovsiienko  * @param spawn
168338b4b397SViacheslav Ovsiienko  *   Verbs device parameters (name, port, switch_info) to spawn.
168438b4b397SViacheslav Ovsiienko  * @param config
168538b4b397SViacheslav Ovsiienko  *   Device configuration parameters.
168638b4b397SViacheslav Ovsiienko  */
16872eb4d010SOphir Munk void
168838b4b397SViacheslav Ovsiienko mlx5_set_min_inline(struct mlx5_dev_spawn_data *spawn,
168938b4b397SViacheslav Ovsiienko 		    struct mlx5_dev_config *config)
169038b4b397SViacheslav Ovsiienko {
169138b4b397SViacheslav Ovsiienko 	if (config->txq_inline_min != MLX5_ARG_UNSET) {
169238b4b397SViacheslav Ovsiienko 		/* Application defines size of inlined data explicitly. */
169338b4b397SViacheslav Ovsiienko 		switch (spawn->pci_dev->id.device_id) {
169438b4b397SViacheslav Ovsiienko 		case PCI_DEVICE_ID_MELLANOX_CONNECTX4:
169538b4b397SViacheslav Ovsiienko 		case PCI_DEVICE_ID_MELLANOX_CONNECTX4VF:
169638b4b397SViacheslav Ovsiienko 			if (config->txq_inline_min <
169738b4b397SViacheslav Ovsiienko 				       (int)MLX5_INLINE_HSIZE_L2) {
169838b4b397SViacheslav Ovsiienko 				DRV_LOG(DEBUG,
169938b4b397SViacheslav Ovsiienko 					"txq_inline_mix aligned to minimal"
170038b4b397SViacheslav Ovsiienko 					" ConnectX-4 required value %d",
170138b4b397SViacheslav Ovsiienko 					(int)MLX5_INLINE_HSIZE_L2);
170238b4b397SViacheslav Ovsiienko 				config->txq_inline_min = MLX5_INLINE_HSIZE_L2;
170338b4b397SViacheslav Ovsiienko 			}
170438b4b397SViacheslav Ovsiienko 			break;
170538b4b397SViacheslav Ovsiienko 		}
170638b4b397SViacheslav Ovsiienko 		goto exit;
170738b4b397SViacheslav Ovsiienko 	}
170838b4b397SViacheslav Ovsiienko 	if (config->hca_attr.eth_net_offloads) {
170938b4b397SViacheslav Ovsiienko 		/* We have DevX enabled, inline mode queried successfully. */
171038b4b397SViacheslav Ovsiienko 		switch (config->hca_attr.wqe_inline_mode) {
171138b4b397SViacheslav Ovsiienko 		case MLX5_CAP_INLINE_MODE_L2:
171238b4b397SViacheslav Ovsiienko 			/* outer L2 header must be inlined. */
171338b4b397SViacheslav Ovsiienko 			config->txq_inline_min = MLX5_INLINE_HSIZE_L2;
171438b4b397SViacheslav Ovsiienko 			goto exit;
171538b4b397SViacheslav Ovsiienko 		case MLX5_CAP_INLINE_MODE_NOT_REQUIRED:
171638b4b397SViacheslav Ovsiienko 			/* No inline data are required by NIC. */
171738b4b397SViacheslav Ovsiienko 			config->txq_inline_min = MLX5_INLINE_HSIZE_NONE;
171838b4b397SViacheslav Ovsiienko 			config->hw_vlan_insert =
171938b4b397SViacheslav Ovsiienko 				config->hca_attr.wqe_vlan_insert;
172038b4b397SViacheslav Ovsiienko 			DRV_LOG(DEBUG, "Tx VLAN insertion is supported");
172138b4b397SViacheslav Ovsiienko 			goto exit;
172238b4b397SViacheslav Ovsiienko 		case MLX5_CAP_INLINE_MODE_VPORT_CONTEXT:
172338b4b397SViacheslav Ovsiienko 			/* inline mode is defined by NIC vport context. */
172438b4b397SViacheslav Ovsiienko 			if (!config->hca_attr.eth_virt)
172538b4b397SViacheslav Ovsiienko 				break;
172638b4b397SViacheslav Ovsiienko 			switch (config->hca_attr.vport_inline_mode) {
172738b4b397SViacheslav Ovsiienko 			case MLX5_INLINE_MODE_NONE:
172838b4b397SViacheslav Ovsiienko 				config->txq_inline_min =
172938b4b397SViacheslav Ovsiienko 					MLX5_INLINE_HSIZE_NONE;
173038b4b397SViacheslav Ovsiienko 				goto exit;
173138b4b397SViacheslav Ovsiienko 			case MLX5_INLINE_MODE_L2:
173238b4b397SViacheslav Ovsiienko 				config->txq_inline_min =
173338b4b397SViacheslav Ovsiienko 					MLX5_INLINE_HSIZE_L2;
173438b4b397SViacheslav Ovsiienko 				goto exit;
173538b4b397SViacheslav Ovsiienko 			case MLX5_INLINE_MODE_IP:
173638b4b397SViacheslav Ovsiienko 				config->txq_inline_min =
173738b4b397SViacheslav Ovsiienko 					MLX5_INLINE_HSIZE_L3;
173838b4b397SViacheslav Ovsiienko 				goto exit;
173938b4b397SViacheslav Ovsiienko 			case MLX5_INLINE_MODE_TCP_UDP:
174038b4b397SViacheslav Ovsiienko 				config->txq_inline_min =
174138b4b397SViacheslav Ovsiienko 					MLX5_INLINE_HSIZE_L4;
174238b4b397SViacheslav Ovsiienko 				goto exit;
174338b4b397SViacheslav Ovsiienko 			case MLX5_INLINE_MODE_INNER_L2:
174438b4b397SViacheslav Ovsiienko 				config->txq_inline_min =
174538b4b397SViacheslav Ovsiienko 					MLX5_INLINE_HSIZE_INNER_L2;
174638b4b397SViacheslav Ovsiienko 				goto exit;
174738b4b397SViacheslav Ovsiienko 			case MLX5_INLINE_MODE_INNER_IP:
174838b4b397SViacheslav Ovsiienko 				config->txq_inline_min =
174938b4b397SViacheslav Ovsiienko 					MLX5_INLINE_HSIZE_INNER_L3;
175038b4b397SViacheslav Ovsiienko 				goto exit;
175138b4b397SViacheslav Ovsiienko 			case MLX5_INLINE_MODE_INNER_TCP_UDP:
175238b4b397SViacheslav Ovsiienko 				config->txq_inline_min =
175338b4b397SViacheslav Ovsiienko 					MLX5_INLINE_HSIZE_INNER_L4;
175438b4b397SViacheslav Ovsiienko 				goto exit;
175538b4b397SViacheslav Ovsiienko 			}
175638b4b397SViacheslav Ovsiienko 		}
175738b4b397SViacheslav Ovsiienko 	}
175838b4b397SViacheslav Ovsiienko 	/*
175938b4b397SViacheslav Ovsiienko 	 * We get here if we are unable to deduce
176038b4b397SViacheslav Ovsiienko 	 * inline data size with DevX. Try PCI ID
176138b4b397SViacheslav Ovsiienko 	 * to determine old NICs.
176238b4b397SViacheslav Ovsiienko 	 */
176338b4b397SViacheslav Ovsiienko 	switch (spawn->pci_dev->id.device_id) {
176438b4b397SViacheslav Ovsiienko 	case PCI_DEVICE_ID_MELLANOX_CONNECTX4:
176538b4b397SViacheslav Ovsiienko 	case PCI_DEVICE_ID_MELLANOX_CONNECTX4VF:
176638b4b397SViacheslav Ovsiienko 	case PCI_DEVICE_ID_MELLANOX_CONNECTX4LX:
176738b4b397SViacheslav Ovsiienko 	case PCI_DEVICE_ID_MELLANOX_CONNECTX4LXVF:
1768614de6c8SViacheslav Ovsiienko 		config->txq_inline_min = MLX5_INLINE_HSIZE_L2;
176938b4b397SViacheslav Ovsiienko 		config->hw_vlan_insert = 0;
177038b4b397SViacheslav Ovsiienko 		break;
177138b4b397SViacheslav Ovsiienko 	case PCI_DEVICE_ID_MELLANOX_CONNECTX5:
177238b4b397SViacheslav Ovsiienko 	case PCI_DEVICE_ID_MELLANOX_CONNECTX5VF:
177338b4b397SViacheslav Ovsiienko 	case PCI_DEVICE_ID_MELLANOX_CONNECTX5EX:
177438b4b397SViacheslav Ovsiienko 	case PCI_DEVICE_ID_MELLANOX_CONNECTX5EXVF:
177538b4b397SViacheslav Ovsiienko 		/*
177638b4b397SViacheslav Ovsiienko 		 * These NICs support VLAN insertion from WQE and
177738b4b397SViacheslav Ovsiienko 		 * report the wqe_vlan_insert flag. But there is the bug
177838b4b397SViacheslav Ovsiienko 		 * and PFC control may be broken, so disable feature.
177938b4b397SViacheslav Ovsiienko 		 */
178038b4b397SViacheslav Ovsiienko 		config->hw_vlan_insert = 0;
178120215627SDavid Christensen 		config->txq_inline_min = MLX5_INLINE_HSIZE_NONE;
178238b4b397SViacheslav Ovsiienko 		break;
178338b4b397SViacheslav Ovsiienko 	default:
178438b4b397SViacheslav Ovsiienko 		config->txq_inline_min = MLX5_INLINE_HSIZE_NONE;
178538b4b397SViacheslav Ovsiienko 		break;
178638b4b397SViacheslav Ovsiienko 	}
178738b4b397SViacheslav Ovsiienko exit:
178838b4b397SViacheslav Ovsiienko 	DRV_LOG(DEBUG, "min tx inline configured: %d", config->txq_inline_min);
178938b4b397SViacheslav Ovsiienko }
179038b4b397SViacheslav Ovsiienko 
179138b4b397SViacheslav Ovsiienko /**
179239139371SViacheslav Ovsiienko  * Configures the metadata mask fields in the shared context.
179339139371SViacheslav Ovsiienko  *
179439139371SViacheslav Ovsiienko  * @param [in] dev
179539139371SViacheslav Ovsiienko  *   Pointer to Ethernet device.
179639139371SViacheslav Ovsiienko  */
17972eb4d010SOphir Munk void
179839139371SViacheslav Ovsiienko mlx5_set_metadata_mask(struct rte_eth_dev *dev)
179939139371SViacheslav Ovsiienko {
180039139371SViacheslav Ovsiienko 	struct mlx5_priv *priv = dev->data->dev_private;
18016e88bc42SOphir Munk 	struct mlx5_dev_ctx_shared *sh = priv->sh;
180239139371SViacheslav Ovsiienko 	uint32_t meta, mark, reg_c0;
180339139371SViacheslav Ovsiienko 
180439139371SViacheslav Ovsiienko 	reg_c0 = ~priv->vport_meta_mask;
180539139371SViacheslav Ovsiienko 	switch (priv->config.dv_xmeta_en) {
180639139371SViacheslav Ovsiienko 	case MLX5_XMETA_MODE_LEGACY:
180739139371SViacheslav Ovsiienko 		meta = UINT32_MAX;
180839139371SViacheslav Ovsiienko 		mark = MLX5_FLOW_MARK_MASK;
180939139371SViacheslav Ovsiienko 		break;
181039139371SViacheslav Ovsiienko 	case MLX5_XMETA_MODE_META16:
181139139371SViacheslav Ovsiienko 		meta = reg_c0 >> rte_bsf32(reg_c0);
181239139371SViacheslav Ovsiienko 		mark = MLX5_FLOW_MARK_MASK;
181339139371SViacheslav Ovsiienko 		break;
181439139371SViacheslav Ovsiienko 	case MLX5_XMETA_MODE_META32:
181539139371SViacheslav Ovsiienko 		meta = UINT32_MAX;
181639139371SViacheslav Ovsiienko 		mark = (reg_c0 >> rte_bsf32(reg_c0)) & MLX5_FLOW_MARK_MASK;
181739139371SViacheslav Ovsiienko 		break;
181839139371SViacheslav Ovsiienko 	default:
181939139371SViacheslav Ovsiienko 		meta = 0;
182039139371SViacheslav Ovsiienko 		mark = 0;
18218e46d4e1SAlexander Kozyrev 		MLX5_ASSERT(false);
182239139371SViacheslav Ovsiienko 		break;
182339139371SViacheslav Ovsiienko 	}
182439139371SViacheslav Ovsiienko 	if (sh->dv_mark_mask && sh->dv_mark_mask != mark)
182539139371SViacheslav Ovsiienko 		DRV_LOG(WARNING, "metadata MARK mask mismatche %08X:%08X",
182639139371SViacheslav Ovsiienko 				 sh->dv_mark_mask, mark);
182739139371SViacheslav Ovsiienko 	else
182839139371SViacheslav Ovsiienko 		sh->dv_mark_mask = mark;
182939139371SViacheslav Ovsiienko 	if (sh->dv_meta_mask && sh->dv_meta_mask != meta)
183039139371SViacheslav Ovsiienko 		DRV_LOG(WARNING, "metadata META mask mismatche %08X:%08X",
183139139371SViacheslav Ovsiienko 				 sh->dv_meta_mask, meta);
183239139371SViacheslav Ovsiienko 	else
183339139371SViacheslav Ovsiienko 		sh->dv_meta_mask = meta;
183439139371SViacheslav Ovsiienko 	if (sh->dv_regc0_mask && sh->dv_regc0_mask != reg_c0)
183539139371SViacheslav Ovsiienko 		DRV_LOG(WARNING, "metadata reg_c0 mask mismatche %08X:%08X",
183639139371SViacheslav Ovsiienko 				 sh->dv_meta_mask, reg_c0);
183739139371SViacheslav Ovsiienko 	else
183839139371SViacheslav Ovsiienko 		sh->dv_regc0_mask = reg_c0;
183939139371SViacheslav Ovsiienko 	DRV_LOG(DEBUG, "metadata mode %u", priv->config.dv_xmeta_en);
184039139371SViacheslav Ovsiienko 	DRV_LOG(DEBUG, "metadata MARK mask %08X", sh->dv_mark_mask);
184139139371SViacheslav Ovsiienko 	DRV_LOG(DEBUG, "metadata META mask %08X", sh->dv_meta_mask);
184239139371SViacheslav Ovsiienko 	DRV_LOG(DEBUG, "metadata reg_c0 mask %08X", sh->dv_regc0_mask);
184339139371SViacheslav Ovsiienko }
184439139371SViacheslav Ovsiienko 
1845efa79e68SOri Kam int
1846efa79e68SOri Kam rte_pmd_mlx5_get_dyn_flag_names(char *names[], unsigned int n)
1847efa79e68SOri Kam {
1848efa79e68SOri Kam 	static const char *const dynf_names[] = {
1849efa79e68SOri Kam 		RTE_PMD_MLX5_FINE_GRANULARITY_INLINE,
18508f848f32SViacheslav Ovsiienko 		RTE_MBUF_DYNFLAG_METADATA_NAME,
18518f848f32SViacheslav Ovsiienko 		RTE_MBUF_DYNFLAG_TX_TIMESTAMP_NAME
1852efa79e68SOri Kam 	};
1853efa79e68SOri Kam 	unsigned int i;
1854efa79e68SOri Kam 
1855efa79e68SOri Kam 	if (n < RTE_DIM(dynf_names))
1856efa79e68SOri Kam 		return -ENOMEM;
1857efa79e68SOri Kam 	for (i = 0; i < RTE_DIM(dynf_names); i++) {
1858efa79e68SOri Kam 		if (names[i] == NULL)
1859efa79e68SOri Kam 			return -EINVAL;
1860efa79e68SOri Kam 		strcpy(names[i], dynf_names[i]);
1861efa79e68SOri Kam 	}
1862efa79e68SOri Kam 	return RTE_DIM(dynf_names);
1863efa79e68SOri Kam }
1864efa79e68SOri Kam 
186521cae858SDekel Peled /**
18662eb4d010SOphir Munk  * Comparison callback to sort device data.
186792d5dd48SViacheslav Ovsiienko  *
18682eb4d010SOphir Munk  * This is meant to be used with qsort().
186992d5dd48SViacheslav Ovsiienko  *
18702eb4d010SOphir Munk  * @param a[in]
18712eb4d010SOphir Munk  *   Pointer to pointer to first data object.
18722eb4d010SOphir Munk  * @param b[in]
18732eb4d010SOphir Munk  *   Pointer to pointer to second data object.
187492d5dd48SViacheslav Ovsiienko  *
187592d5dd48SViacheslav Ovsiienko  * @return
18762eb4d010SOphir Munk  *   0 if both objects are equal, less than 0 if the first argument is less
18772eb4d010SOphir Munk  *   than the second, greater than 0 otherwise.
187892d5dd48SViacheslav Ovsiienko  */
18792eb4d010SOphir Munk int
188092d5dd48SViacheslav Ovsiienko mlx5_dev_check_sibling_config(struct mlx5_priv *priv,
188192d5dd48SViacheslav Ovsiienko 			      struct mlx5_dev_config *config)
188292d5dd48SViacheslav Ovsiienko {
18836e88bc42SOphir Munk 	struct mlx5_dev_ctx_shared *sh = priv->sh;
188492d5dd48SViacheslav Ovsiienko 	struct mlx5_dev_config *sh_conf = NULL;
188592d5dd48SViacheslav Ovsiienko 	uint16_t port_id;
188692d5dd48SViacheslav Ovsiienko 
18878e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(sh);
188892d5dd48SViacheslav Ovsiienko 	/* Nothing to compare for the single/first device. */
188992d5dd48SViacheslav Ovsiienko 	if (sh->refcnt == 1)
189092d5dd48SViacheslav Ovsiienko 		return 0;
189192d5dd48SViacheslav Ovsiienko 	/* Find the device with shared context. */
1892fbc83412SViacheslav Ovsiienko 	MLX5_ETH_FOREACH_DEV(port_id, priv->pci_dev) {
189392d5dd48SViacheslav Ovsiienko 		struct mlx5_priv *opriv =
189492d5dd48SViacheslav Ovsiienko 			rte_eth_devices[port_id].data->dev_private;
189592d5dd48SViacheslav Ovsiienko 
189692d5dd48SViacheslav Ovsiienko 		if (opriv && opriv != priv && opriv->sh == sh) {
189792d5dd48SViacheslav Ovsiienko 			sh_conf = &opriv->config;
189892d5dd48SViacheslav Ovsiienko 			break;
189992d5dd48SViacheslav Ovsiienko 		}
190092d5dd48SViacheslav Ovsiienko 	}
190192d5dd48SViacheslav Ovsiienko 	if (!sh_conf)
190292d5dd48SViacheslav Ovsiienko 		return 0;
190392d5dd48SViacheslav Ovsiienko 	if (sh_conf->dv_flow_en ^ config->dv_flow_en) {
190492d5dd48SViacheslav Ovsiienko 		DRV_LOG(ERR, "\"dv_flow_en\" configuration mismatch"
190592d5dd48SViacheslav Ovsiienko 			     " for shared %s context", sh->ibdev_name);
190692d5dd48SViacheslav Ovsiienko 		rte_errno = EINVAL;
190792d5dd48SViacheslav Ovsiienko 		return rte_errno;
190892d5dd48SViacheslav Ovsiienko 	}
19092d241515SViacheslav Ovsiienko 	if (sh_conf->dv_xmeta_en ^ config->dv_xmeta_en) {
19102d241515SViacheslav Ovsiienko 		DRV_LOG(ERR, "\"dv_xmeta_en\" configuration mismatch"
19112d241515SViacheslav Ovsiienko 			     " for shared %s context", sh->ibdev_name);
19122d241515SViacheslav Ovsiienko 		rte_errno = EINVAL;
19132d241515SViacheslav Ovsiienko 		return rte_errno;
19142d241515SViacheslav Ovsiienko 	}
191592d5dd48SViacheslav Ovsiienko 	return 0;
191692d5dd48SViacheslav Ovsiienko }
1917771fa900SAdrien Mazarguil 
1918fbc83412SViacheslav Ovsiienko /**
1919fbc83412SViacheslav Ovsiienko  * Look for the ethernet device belonging to mlx5 driver.
1920fbc83412SViacheslav Ovsiienko  *
1921fbc83412SViacheslav Ovsiienko  * @param[in] port_id
1922fbc83412SViacheslav Ovsiienko  *   port_id to start looking for device.
1923fbc83412SViacheslav Ovsiienko  * @param[in] pci_dev
1924fbc83412SViacheslav Ovsiienko  *   Pointer to the hint PCI device. When device is being probed
1925fbc83412SViacheslav Ovsiienko  *   the its siblings (master and preceding representors might
19262eb4d010SOphir Munk  *   not have assigned driver yet (because the mlx5_os_pci_probe()
1927fbc83412SViacheslav Ovsiienko  *   is not completed yet, for this case match on hint PCI
1928fbc83412SViacheslav Ovsiienko  *   device may be used to detect sibling device.
1929fbc83412SViacheslav Ovsiienko  *
1930fbc83412SViacheslav Ovsiienko  * @return
1931fbc83412SViacheslav Ovsiienko  *   port_id of found device, RTE_MAX_ETHPORT if not found.
1932fbc83412SViacheslav Ovsiienko  */
1933f7e95215SViacheslav Ovsiienko uint16_t
1934fbc83412SViacheslav Ovsiienko mlx5_eth_find_next(uint16_t port_id, struct rte_pci_device *pci_dev)
1935f7e95215SViacheslav Ovsiienko {
1936f7e95215SViacheslav Ovsiienko 	while (port_id < RTE_MAX_ETHPORTS) {
1937f7e95215SViacheslav Ovsiienko 		struct rte_eth_dev *dev = &rte_eth_devices[port_id];
1938f7e95215SViacheslav Ovsiienko 
1939f7e95215SViacheslav Ovsiienko 		if (dev->state != RTE_ETH_DEV_UNUSED &&
1940f7e95215SViacheslav Ovsiienko 		    dev->device &&
1941fbc83412SViacheslav Ovsiienko 		    (dev->device == &pci_dev->device ||
1942fbc83412SViacheslav Ovsiienko 		     (dev->device->driver &&
1943f7e95215SViacheslav Ovsiienko 		     dev->device->driver->name &&
1944fbc83412SViacheslav Ovsiienko 		     !strcmp(dev->device->driver->name, MLX5_DRIVER_NAME))))
1945f7e95215SViacheslav Ovsiienko 			break;
1946f7e95215SViacheslav Ovsiienko 		port_id++;
1947f7e95215SViacheslav Ovsiienko 	}
1948f7e95215SViacheslav Ovsiienko 	if (port_id >= RTE_MAX_ETHPORTS)
1949f7e95215SViacheslav Ovsiienko 		return RTE_MAX_ETHPORTS;
1950f7e95215SViacheslav Ovsiienko 	return port_id;
1951f7e95215SViacheslav Ovsiienko }
1952f7e95215SViacheslav Ovsiienko 
19533a820742SOphir Munk /**
19543a820742SOphir Munk  * DPDK callback to remove a PCI device.
19553a820742SOphir Munk  *
19563a820742SOphir Munk  * This function removes all Ethernet devices belong to a given PCI device.
19573a820742SOphir Munk  *
19583a820742SOphir Munk  * @param[in] pci_dev
19593a820742SOphir Munk  *   Pointer to the PCI device.
19603a820742SOphir Munk  *
19613a820742SOphir Munk  * @return
19623a820742SOphir Munk  *   0 on success, the function cannot fail.
19633a820742SOphir Munk  */
19643a820742SOphir Munk static int
19653a820742SOphir Munk mlx5_pci_remove(struct rte_pci_device *pci_dev)
19663a820742SOphir Munk {
19673a820742SOphir Munk 	uint16_t port_id;
19688a5a0aadSThomas Monjalon 	int ret = 0;
19693a820742SOphir Munk 
19702786b7bfSSuanming Mou 	RTE_ETH_FOREACH_DEV_OF(port_id, &pci_dev->device) {
19712786b7bfSSuanming Mou 		/*
19722786b7bfSSuanming Mou 		 * mlx5_dev_close() is not registered to secondary process,
19732786b7bfSSuanming Mou 		 * call the close function explicitly for secondary process.
19742786b7bfSSuanming Mou 		 */
19752786b7bfSSuanming Mou 		if (rte_eal_process_type() == RTE_PROC_SECONDARY)
19768a5a0aadSThomas Monjalon 			ret |= mlx5_dev_close(&rte_eth_devices[port_id]);
19772786b7bfSSuanming Mou 		else
19788a5a0aadSThomas Monjalon 			ret |= rte_eth_dev_close(port_id);
19792786b7bfSSuanming Mou 	}
19808a5a0aadSThomas Monjalon 	return ret == 0 ? 0 : -EIO;
19813a820742SOphir Munk }
19823a820742SOphir Munk 
1983771fa900SAdrien Mazarguil static const struct rte_pci_id mlx5_pci_id_map[] = {
1984771fa900SAdrien Mazarguil 	{
19851d1bc870SNélio Laranjeiro 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
19861d1bc870SNélio Laranjeiro 			       PCI_DEVICE_ID_MELLANOX_CONNECTX4)
1987771fa900SAdrien Mazarguil 	},
1988771fa900SAdrien Mazarguil 	{
19891d1bc870SNélio Laranjeiro 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
19901d1bc870SNélio Laranjeiro 			       PCI_DEVICE_ID_MELLANOX_CONNECTX4VF)
1991771fa900SAdrien Mazarguil 	},
1992771fa900SAdrien Mazarguil 	{
19931d1bc870SNélio Laranjeiro 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
19941d1bc870SNélio Laranjeiro 			       PCI_DEVICE_ID_MELLANOX_CONNECTX4LX)
1995771fa900SAdrien Mazarguil 	},
1996771fa900SAdrien Mazarguil 	{
19971d1bc870SNélio Laranjeiro 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
19981d1bc870SNélio Laranjeiro 			       PCI_DEVICE_ID_MELLANOX_CONNECTX4LXVF)
1999771fa900SAdrien Mazarguil 	},
2000771fa900SAdrien Mazarguil 	{
2001528a9fbeSYongseok Koh 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
2002528a9fbeSYongseok Koh 			       PCI_DEVICE_ID_MELLANOX_CONNECTX5)
2003528a9fbeSYongseok Koh 	},
2004528a9fbeSYongseok Koh 	{
2005528a9fbeSYongseok Koh 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
2006528a9fbeSYongseok Koh 			       PCI_DEVICE_ID_MELLANOX_CONNECTX5VF)
2007528a9fbeSYongseok Koh 	},
2008528a9fbeSYongseok Koh 	{
2009528a9fbeSYongseok Koh 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
2010528a9fbeSYongseok Koh 			       PCI_DEVICE_ID_MELLANOX_CONNECTX5EX)
2011528a9fbeSYongseok Koh 	},
2012528a9fbeSYongseok Koh 	{
2013528a9fbeSYongseok Koh 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
2014528a9fbeSYongseok Koh 			       PCI_DEVICE_ID_MELLANOX_CONNECTX5EXVF)
2015528a9fbeSYongseok Koh 	},
2016528a9fbeSYongseok Koh 	{
2017dd3331c6SShahaf Shuler 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
2018dd3331c6SShahaf Shuler 			       PCI_DEVICE_ID_MELLANOX_CONNECTX5BF)
2019dd3331c6SShahaf Shuler 	},
2020dd3331c6SShahaf Shuler 	{
2021c322c0e5SOri Kam 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
2022c322c0e5SOri Kam 			       PCI_DEVICE_ID_MELLANOX_CONNECTX5BFVF)
2023c322c0e5SOri Kam 	},
2024c322c0e5SOri Kam 	{
2025f0354d84SWisam Jaddo 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
2026f0354d84SWisam Jaddo 				PCI_DEVICE_ID_MELLANOX_CONNECTX6)
2027f0354d84SWisam Jaddo 	},
2028f0354d84SWisam Jaddo 	{
2029f0354d84SWisam Jaddo 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
2030f0354d84SWisam Jaddo 				PCI_DEVICE_ID_MELLANOX_CONNECTX6VF)
2031f0354d84SWisam Jaddo 	},
2032f0354d84SWisam Jaddo 	{
20335fc66630SRaslan Darawsheh 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
20345fc66630SRaslan Darawsheh 				PCI_DEVICE_ID_MELLANOX_CONNECTX6DX)
20355fc66630SRaslan Darawsheh 	},
20365fc66630SRaslan Darawsheh 	{
20375fc66630SRaslan Darawsheh 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
20383ea12cadSRaslan Darawsheh 				PCI_DEVICE_ID_MELLANOX_CONNECTXVF)
20395fc66630SRaslan Darawsheh 	},
20405fc66630SRaslan Darawsheh 	{
204158b4a2b1SRaslan Darawsheh 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
204258b4a2b1SRaslan Darawsheh 				PCI_DEVICE_ID_MELLANOX_CONNECTX6DXBF)
204358b4a2b1SRaslan Darawsheh 	},
204458b4a2b1SRaslan Darawsheh 	{
204528c9a7d7SAli Alnubani 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
204628c9a7d7SAli Alnubani 				PCI_DEVICE_ID_MELLANOX_CONNECTX6LX)
204728c9a7d7SAli Alnubani 	},
204828c9a7d7SAli Alnubani 	{
20496ca37b06SRaslan Darawsheh 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
20506ca37b06SRaslan Darawsheh 				PCI_DEVICE_ID_MELLANOX_CONNECTX7)
20516ca37b06SRaslan Darawsheh 	},
20526ca37b06SRaslan Darawsheh 	{
20536ca37b06SRaslan Darawsheh 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
20546ca37b06SRaslan Darawsheh 				PCI_DEVICE_ID_MELLANOX_CONNECTX7BF)
20556ca37b06SRaslan Darawsheh 	},
20566ca37b06SRaslan Darawsheh 	{
2057771fa900SAdrien Mazarguil 		.vendor_id = 0
2058771fa900SAdrien Mazarguil 	}
2059771fa900SAdrien Mazarguil };
2060771fa900SAdrien Mazarguil 
2061392bf908SParav Pandit static struct mlx5_pci_driver mlx5_driver = {
2062392bf908SParav Pandit 	.driver_class = MLX5_CLASS_NET,
2063392bf908SParav Pandit 	.pci_driver = {
20642f3193cfSJan Viktorin 		.driver = {
2065392bf908SParav Pandit 			.name = MLX5_DRIVER_NAME,
20662f3193cfSJan Viktorin 		},
2067771fa900SAdrien Mazarguil 		.id_table = mlx5_pci_id_map,
20682eb4d010SOphir Munk 		.probe = mlx5_os_pci_probe,
20693a820742SOphir Munk 		.remove = mlx5_pci_remove,
2070989e999dSShahaf Shuler 		.dma_map = mlx5_dma_map,
2071989e999dSShahaf Shuler 		.dma_unmap = mlx5_dma_unmap,
207210f3581dSOphir Munk 		.drv_flags = PCI_DRV_FLAGS,
2073392bf908SParav Pandit 	},
2074771fa900SAdrien Mazarguil };
2075771fa900SAdrien Mazarguil 
20769c99878aSJerin Jacob /* Initialize driver log type. */
20779c99878aSJerin Jacob RTE_LOG_REGISTER(mlx5_logtype, pmd.net.mlx5, NOTICE)
20789c99878aSJerin Jacob 
2079771fa900SAdrien Mazarguil /**
2080771fa900SAdrien Mazarguil  * Driver initialization routine.
2081771fa900SAdrien Mazarguil  */
2082f8e99896SThomas Monjalon RTE_INIT(rte_mlx5_pmd_init)
2083771fa900SAdrien Mazarguil {
208482088001SParav Pandit 	mlx5_common_init();
20855f8ba81cSXueming Li 	/* Build the static tables for Verbs conversion. */
2086ea16068cSYongseok Koh 	mlx5_set_ptype_table();
20875f8ba81cSXueming Li 	mlx5_set_cksum_table();
20885f8ba81cSXueming Li 	mlx5_set_swp_types_table();
20897b4f1e6bSMatan Azrad 	if (mlx5_glue)
2090392bf908SParav Pandit 		mlx5_pci_driver_register(&mlx5_driver);
2091771fa900SAdrien Mazarguil }
2092771fa900SAdrien Mazarguil 
209301f19227SShreyansh Jain RTE_PMD_EXPORT_NAME(net_mlx5, __COUNTER__);
209401f19227SShreyansh Jain RTE_PMD_REGISTER_PCI_TABLE(net_mlx5, mlx5_pci_id_map);
20950880c401SOlivier Matz RTE_PMD_REGISTER_KMOD_DEP(net_mlx5, "* ib_uverbs & mlx5_core & mlx5_ib");
2096