xref: /dpdk/drivers/net/mlx5/mlx5.c (revision 1cb210abddfaa2f00f0a804ce41b7a81e6093945)
18fd92a66SOlivier Matz /* SPDX-License-Identifier: BSD-3-Clause
2771fa900SAdrien Mazarguil  * Copyright 2015 6WIND S.A.
35feecc57SShahaf Shuler  * Copyright 2015 Mellanox Technologies, Ltd
4771fa900SAdrien Mazarguil  */
5771fa900SAdrien Mazarguil 
6771fa900SAdrien Mazarguil #include <stddef.h>
7771fa900SAdrien Mazarguil #include <unistd.h>
8771fa900SAdrien Mazarguil #include <string.h>
9771fa900SAdrien Mazarguil #include <stdint.h>
10771fa900SAdrien Mazarguil #include <stdlib.h>
11e72dd09bSNélio Laranjeiro #include <errno.h>
12771fa900SAdrien Mazarguil 
13771fa900SAdrien Mazarguil #include <rte_malloc.h>
14ffc905f3SFerruh Yigit #include <rte_ethdev_driver.h>
15fdf91e0fSJan Blunck #include <rte_ethdev_pci.h>
16771fa900SAdrien Mazarguil #include <rte_pci.h>
17c752998bSGaetan Rivet #include <rte_bus_pci.h>
18771fa900SAdrien Mazarguil #include <rte_common.h>
19e72dd09bSNélio Laranjeiro #include <rte_kvargs.h>
20e89c15b6SAdrien Mazarguil #include <rte_rwlock.h>
21e89c15b6SAdrien Mazarguil #include <rte_spinlock.h>
22f38c5457SAdrien Mazarguil #include <rte_string_fns.h>
23f15db67dSMatan Azrad #include <rte_alarm.h>
2420698c9fSOphir Munk #include <rte_cycles.h>
25771fa900SAdrien Mazarguil 
267b4f1e6bSMatan Azrad #include <mlx5_glue.h>
277b4f1e6bSMatan Azrad #include <mlx5_devx_cmds.h>
2893e30982SMatan Azrad #include <mlx5_common.h>
29391b8bccSOphir Munk #include <mlx5_common_os.h>
30a4de9586SVu Pham #include <mlx5_common_mp.h>
31392bf908SParav Pandit #include <mlx5_common_pci.h>
3283c2047cSSuanming Mou #include <mlx5_malloc.h>
337b4f1e6bSMatan Azrad 
347b4f1e6bSMatan Azrad #include "mlx5_defs.h"
35771fa900SAdrien Mazarguil #include "mlx5.h"
36771fa900SAdrien Mazarguil #include "mlx5_utils.h"
372e22920bSAdrien Mazarguil #include "mlx5_rxtx.h"
38771fa900SAdrien Mazarguil #include "mlx5_autoconf.h"
39974f1e7eSYongseok Koh #include "mlx5_mr.h"
4084c406e7SOri Kam #include "mlx5_flow.h"
41efa79e68SOri Kam #include "rte_pmd_mlx5.h"
42771fa900SAdrien Mazarguil 
4399c12dccSNélio Laranjeiro /* Device parameter to enable RX completion queue compression. */
4499c12dccSNélio Laranjeiro #define MLX5_RXQ_CQE_COMP_EN "rxq_cqe_comp_en"
4599c12dccSNélio Laranjeiro 
46bc91e8dbSYongseok Koh /* Device parameter to enable RX completion entry padding to 128B. */
47bc91e8dbSYongseok Koh #define MLX5_RXQ_CQE_PAD_EN "rxq_cqe_pad_en"
48bc91e8dbSYongseok Koh 
4978c7a16dSYongseok Koh /* Device parameter to enable padding Rx packet to cacheline size. */
5078c7a16dSYongseok Koh #define MLX5_RXQ_PKT_PAD_EN "rxq_pkt_pad_en"
5178c7a16dSYongseok Koh 
527d6bf6b8SYongseok Koh /* Device parameter to enable Multi-Packet Rx queue. */
537d6bf6b8SYongseok Koh #define MLX5_RX_MPRQ_EN "mprq_en"
547d6bf6b8SYongseok Koh 
557d6bf6b8SYongseok Koh /* Device parameter to configure log 2 of the number of strides for MPRQ. */
567d6bf6b8SYongseok Koh #define MLX5_RX_MPRQ_LOG_STRIDE_NUM "mprq_log_stride_num"
577d6bf6b8SYongseok Koh 
58ecb16045SAlexander Kozyrev /* Device parameter to configure log 2 of the stride size for MPRQ. */
59ecb16045SAlexander Kozyrev #define MLX5_RX_MPRQ_LOG_STRIDE_SIZE "mprq_log_stride_size"
60ecb16045SAlexander Kozyrev 
617d6bf6b8SYongseok Koh /* Device parameter to limit the size of memcpy'd packet for MPRQ. */
627d6bf6b8SYongseok Koh #define MLX5_RX_MPRQ_MAX_MEMCPY_LEN "mprq_max_memcpy_len"
637d6bf6b8SYongseok Koh 
647d6bf6b8SYongseok Koh /* Device parameter to set the minimum number of Rx queues to enable MPRQ. */
657d6bf6b8SYongseok Koh #define MLX5_RXQS_MIN_MPRQ "rxqs_min_mprq"
667d6bf6b8SYongseok Koh 
67a6bd4911SViacheslav Ovsiienko /* Device parameter to configure inline send. Deprecated, ignored.*/
682a66cf37SYaacov Hazan #define MLX5_TXQ_INLINE "txq_inline"
692a66cf37SYaacov Hazan 
70505f1fe4SViacheslav Ovsiienko /* Device parameter to limit packet size to inline with ordinary SEND. */
71505f1fe4SViacheslav Ovsiienko #define MLX5_TXQ_INLINE_MAX "txq_inline_max"
72505f1fe4SViacheslav Ovsiienko 
73505f1fe4SViacheslav Ovsiienko /* Device parameter to configure minimal data size to inline. */
74505f1fe4SViacheslav Ovsiienko #define MLX5_TXQ_INLINE_MIN "txq_inline_min"
75505f1fe4SViacheslav Ovsiienko 
76505f1fe4SViacheslav Ovsiienko /* Device parameter to limit packet size to inline with Enhanced MPW. */
77505f1fe4SViacheslav Ovsiienko #define MLX5_TXQ_INLINE_MPW "txq_inline_mpw"
78505f1fe4SViacheslav Ovsiienko 
792a66cf37SYaacov Hazan /*
802a66cf37SYaacov Hazan  * Device parameter to configure the number of TX queues threshold for
812a66cf37SYaacov Hazan  * enabling inline send.
822a66cf37SYaacov Hazan  */
832a66cf37SYaacov Hazan #define MLX5_TXQS_MIN_INLINE "txqs_min_inline"
842a66cf37SYaacov Hazan 
8509d8b416SYongseok Koh /*
8609d8b416SYongseok Koh  * Device parameter to configure the number of TX queues threshold for
87a6bd4911SViacheslav Ovsiienko  * enabling vectorized Tx, deprecated, ignored (no vectorized Tx routines).
8809d8b416SYongseok Koh  */
8909d8b416SYongseok Koh #define MLX5_TXQS_MAX_VEC "txqs_max_vec"
9009d8b416SYongseok Koh 
91230189d9SNélio Laranjeiro /* Device parameter to enable multi-packet send WQEs. */
92230189d9SNélio Laranjeiro #define MLX5_TXQ_MPW_EN "txq_mpw_en"
93230189d9SNélio Laranjeiro 
94a6bd4911SViacheslav Ovsiienko /*
958409a285SViacheslav Ovsiienko  * Device parameter to force doorbell register mapping
968409a285SViacheslav Ovsiienko  * to non-cahed region eliminating the extra write memory barrier.
978409a285SViacheslav Ovsiienko  */
988409a285SViacheslav Ovsiienko #define MLX5_TX_DB_NC "tx_db_nc"
998409a285SViacheslav Ovsiienko 
1008409a285SViacheslav Ovsiienko /*
101a6bd4911SViacheslav Ovsiienko  * Device parameter to include 2 dsegs in the title WQEBB.
102a6bd4911SViacheslav Ovsiienko  * Deprecated, ignored.
103a6bd4911SViacheslav Ovsiienko  */
1046ce84bd8SYongseok Koh #define MLX5_TXQ_MPW_HDR_DSEG_EN "txq_mpw_hdr_dseg_en"
1056ce84bd8SYongseok Koh 
106a6bd4911SViacheslav Ovsiienko /*
107a6bd4911SViacheslav Ovsiienko  * Device parameter to limit the size of inlining packet.
108a6bd4911SViacheslav Ovsiienko  * Deprecated, ignored.
109a6bd4911SViacheslav Ovsiienko  */
1106ce84bd8SYongseok Koh #define MLX5_TXQ_MAX_INLINE_LEN "txq_max_inline_len"
1116ce84bd8SYongseok Koh 
112a6bd4911SViacheslav Ovsiienko /*
1138f848f32SViacheslav Ovsiienko  * Device parameter to enable Tx scheduling on timestamps
1148f848f32SViacheslav Ovsiienko  * and specify the packet pacing granularity in nanoseconds.
1158f848f32SViacheslav Ovsiienko  */
1168f848f32SViacheslav Ovsiienko #define MLX5_TX_PP "tx_pp"
1178f848f32SViacheslav Ovsiienko 
1188f848f32SViacheslav Ovsiienko /*
1198f848f32SViacheslav Ovsiienko  * Device parameter to specify skew in nanoseconds on Tx datapath,
1208f848f32SViacheslav Ovsiienko  * it represents the time between SQ start WQE processing and
1218f848f32SViacheslav Ovsiienko  * appearing actual packet data on the wire.
1228f848f32SViacheslav Ovsiienko  */
1238f848f32SViacheslav Ovsiienko #define MLX5_TX_SKEW "tx_skew"
1248f848f32SViacheslav Ovsiienko 
1258f848f32SViacheslav Ovsiienko /*
126a6bd4911SViacheslav Ovsiienko  * Device parameter to enable hardware Tx vector.
127a6bd4911SViacheslav Ovsiienko  * Deprecated, ignored (no vectorized Tx routines anymore).
128a6bd4911SViacheslav Ovsiienko  */
1295644d5b9SNelio Laranjeiro #define MLX5_TX_VEC_EN "tx_vec_en"
1305644d5b9SNelio Laranjeiro 
1315644d5b9SNelio Laranjeiro /* Device parameter to enable hardware Rx vector. */
1325644d5b9SNelio Laranjeiro #define MLX5_RX_VEC_EN "rx_vec_en"
1335644d5b9SNelio Laranjeiro 
13478a54648SXueming Li /* Allow L3 VXLAN flow creation. */
13578a54648SXueming Li #define MLX5_L3_VXLAN_EN "l3_vxlan_en"
13678a54648SXueming Li 
137e2b4925eSOri Kam /* Activate DV E-Switch flow steering. */
138e2b4925eSOri Kam #define MLX5_DV_ESW_EN "dv_esw_en"
139e2b4925eSOri Kam 
14051e72d38SOri Kam /* Activate DV flow steering. */
14151e72d38SOri Kam #define MLX5_DV_FLOW_EN "dv_flow_en"
14251e72d38SOri Kam 
1432d241515SViacheslav Ovsiienko /* Enable extensive flow metadata support. */
1442d241515SViacheslav Ovsiienko #define MLX5_DV_XMETA_EN "dv_xmeta_en"
1452d241515SViacheslav Ovsiienko 
1460f0ae73aSShiri Kuzin /* Device parameter to let the user manage the lacp traffic of bonded device */
1470f0ae73aSShiri Kuzin #define MLX5_LACP_BY_USER "lacp_by_user"
1480f0ae73aSShiri Kuzin 
149db209cc3SNélio Laranjeiro /* Activate Netlink support in VF mode. */
150db209cc3SNélio Laranjeiro #define MLX5_VF_NL_EN "vf_nl_en"
151db209cc3SNélio Laranjeiro 
152dceb5029SYongseok Koh /* Enable extending memsegs when creating a MR. */
153dceb5029SYongseok Koh #define MLX5_MR_EXT_MEMSEG_EN "mr_ext_memseg_en"
154dceb5029SYongseok Koh 
1556de569f5SAdrien Mazarguil /* Select port representors to instantiate. */
1566de569f5SAdrien Mazarguil #define MLX5_REPRESENTOR "representor"
1576de569f5SAdrien Mazarguil 
158066cfecdSMatan Azrad /* Device parameter to configure the maximum number of dump files per queue. */
159066cfecdSMatan Azrad #define MLX5_MAX_DUMP_FILES_NUM "max_dump_files_num"
160066cfecdSMatan Azrad 
16121bb6c7eSDekel Peled /* Configure timeout of LRO session (in microseconds). */
16221bb6c7eSDekel Peled #define MLX5_LRO_TIMEOUT_USEC "lro_timeout_usec"
16321bb6c7eSDekel Peled 
1641ad9a3d0SBing Zhao /*
1651ad9a3d0SBing Zhao  * Device parameter to configure the total data buffer size for a single
1661ad9a3d0SBing Zhao  * hairpin queue (logarithm value).
1671ad9a3d0SBing Zhao  */
1681ad9a3d0SBing Zhao #define MLX5_HP_BUF_SIZE "hp_buf_log_sz"
1691ad9a3d0SBing Zhao 
170a1da6f62SSuanming Mou /* Flow memory reclaim mode. */
171a1da6f62SSuanming Mou #define MLX5_RECLAIM_MEM "reclaim_mem_mode"
172a1da6f62SSuanming Mou 
1735522da6bSSuanming Mou /* The default memory allocator used in PMD. */
1745522da6bSSuanming Mou #define MLX5_SYS_MEM_EN "sys_mem_en"
17550f95b23SSuanming Mou /* Decap will be used or not. */
17650f95b23SSuanming Mou #define MLX5_DECAP_EN "decap_en"
1775522da6bSSuanming Mou 
178974f1e7eSYongseok Koh /* Shared memory between primary and secondary processes. */
179974f1e7eSYongseok Koh struct mlx5_shared_data *mlx5_shared_data;
180974f1e7eSYongseok Koh 
1812e86c4e5SOphir Munk /** Driver-specific log messages type. */
1822e86c4e5SOphir Munk int mlx5_logtype;
183a170a30dSNélio Laranjeiro 
18491389890SOphir Munk static LIST_HEAD(, mlx5_dev_ctx_shared) mlx5_dev_ctx_list =
18591389890SOphir Munk 						LIST_HEAD_INITIALIZER();
18691389890SOphir Munk static pthread_mutex_t mlx5_dev_ctx_list_mutex = PTHREAD_MUTEX_INITIALIZER;
18717e19bc4SViacheslav Ovsiienko 
1885c761238SGregory Etelson static const struct mlx5_indexed_pool_config mlx5_ipool_cfg[] = {
189b88341caSSuanming Mou #ifdef HAVE_IBV_FLOW_DV_SUPPORT
1909cac7dedSGregory Etelson 	[MLX5_IPOOL_DECAP_ENCAP] = {
191014d1cbeSSuanming Mou 		.size = sizeof(struct mlx5_flow_dv_encap_decap_resource),
192014d1cbeSSuanming Mou 		.trunk_size = 64,
193014d1cbeSSuanming Mou 		.grow_trunk = 3,
194014d1cbeSSuanming Mou 		.grow_shift = 2,
1952f3dc1f4SSuanming Mou 		.need_lock = 1,
196014d1cbeSSuanming Mou 		.release_mem_en = 1,
19783c2047cSSuanming Mou 		.malloc = mlx5_malloc,
19883c2047cSSuanming Mou 		.free = mlx5_free,
199014d1cbeSSuanming Mou 		.type = "mlx5_encap_decap_ipool",
200014d1cbeSSuanming Mou 	},
2019cac7dedSGregory Etelson 	[MLX5_IPOOL_PUSH_VLAN] = {
2028acf8ac9SSuanming Mou 		.size = sizeof(struct mlx5_flow_dv_push_vlan_action_resource),
2038acf8ac9SSuanming Mou 		.trunk_size = 64,
2048acf8ac9SSuanming Mou 		.grow_trunk = 3,
2058acf8ac9SSuanming Mou 		.grow_shift = 2,
2062f3dc1f4SSuanming Mou 		.need_lock = 1,
2078acf8ac9SSuanming Mou 		.release_mem_en = 1,
20883c2047cSSuanming Mou 		.malloc = mlx5_malloc,
20983c2047cSSuanming Mou 		.free = mlx5_free,
2108acf8ac9SSuanming Mou 		.type = "mlx5_push_vlan_ipool",
2118acf8ac9SSuanming Mou 	},
2129cac7dedSGregory Etelson 	[MLX5_IPOOL_TAG] = {
2135f114269SSuanming Mou 		.size = sizeof(struct mlx5_flow_dv_tag_resource),
2145f114269SSuanming Mou 		.trunk_size = 64,
2155f114269SSuanming Mou 		.grow_trunk = 3,
2165f114269SSuanming Mou 		.grow_shift = 2,
2172f3dc1f4SSuanming Mou 		.need_lock = 1,
2185f114269SSuanming Mou 		.release_mem_en = 1,
21983c2047cSSuanming Mou 		.malloc = mlx5_malloc,
22083c2047cSSuanming Mou 		.free = mlx5_free,
2215f114269SSuanming Mou 		.type = "mlx5_tag_ipool",
2225f114269SSuanming Mou 	},
2239cac7dedSGregory Etelson 	[MLX5_IPOOL_PORT_ID] = {
224f3faf9eaSSuanming Mou 		.size = sizeof(struct mlx5_flow_dv_port_id_action_resource),
225f3faf9eaSSuanming Mou 		.trunk_size = 64,
226f3faf9eaSSuanming Mou 		.grow_trunk = 3,
227f3faf9eaSSuanming Mou 		.grow_shift = 2,
2282f3dc1f4SSuanming Mou 		.need_lock = 1,
229f3faf9eaSSuanming Mou 		.release_mem_en = 1,
23083c2047cSSuanming Mou 		.malloc = mlx5_malloc,
23183c2047cSSuanming Mou 		.free = mlx5_free,
232f3faf9eaSSuanming Mou 		.type = "mlx5_port_id_ipool",
233f3faf9eaSSuanming Mou 	},
2349cac7dedSGregory Etelson 	[MLX5_IPOOL_JUMP] = {
2357ac99475SSuanming Mou 		.size = sizeof(struct mlx5_flow_tbl_data_entry),
2367ac99475SSuanming Mou 		.trunk_size = 64,
2377ac99475SSuanming Mou 		.grow_trunk = 3,
2387ac99475SSuanming Mou 		.grow_shift = 2,
2392f3dc1f4SSuanming Mou 		.need_lock = 1,
2407ac99475SSuanming Mou 		.release_mem_en = 1,
24183c2047cSSuanming Mou 		.malloc = mlx5_malloc,
24283c2047cSSuanming Mou 		.free = mlx5_free,
2437ac99475SSuanming Mou 		.type = "mlx5_jump_ipool",
2447ac99475SSuanming Mou 	},
2459cac7dedSGregory Etelson 	[MLX5_IPOOL_SAMPLE] = {
246b4c0ddbfSJiawei Wang 		.size = sizeof(struct mlx5_flow_dv_sample_resource),
247b4c0ddbfSJiawei Wang 		.trunk_size = 64,
248b4c0ddbfSJiawei Wang 		.grow_trunk = 3,
249b4c0ddbfSJiawei Wang 		.grow_shift = 2,
2502f3dc1f4SSuanming Mou 		.need_lock = 1,
251b4c0ddbfSJiawei Wang 		.release_mem_en = 1,
252b4c0ddbfSJiawei Wang 		.malloc = mlx5_malloc,
253b4c0ddbfSJiawei Wang 		.free = mlx5_free,
254b4c0ddbfSJiawei Wang 		.type = "mlx5_sample_ipool",
255b4c0ddbfSJiawei Wang 	},
2569cac7dedSGregory Etelson 	[MLX5_IPOOL_DEST_ARRAY] = {
25700c10c22SJiawei Wang 		.size = sizeof(struct mlx5_flow_dv_dest_array_resource),
25800c10c22SJiawei Wang 		.trunk_size = 64,
25900c10c22SJiawei Wang 		.grow_trunk = 3,
26000c10c22SJiawei Wang 		.grow_shift = 2,
2612f3dc1f4SSuanming Mou 		.need_lock = 1,
26200c10c22SJiawei Wang 		.release_mem_en = 1,
26300c10c22SJiawei Wang 		.malloc = mlx5_malloc,
26400c10c22SJiawei Wang 		.free = mlx5_free,
26500c10c22SJiawei Wang 		.type = "mlx5_dest_array_ipool",
26600c10c22SJiawei Wang 	},
2679cac7dedSGregory Etelson 	[MLX5_IPOOL_TUNNEL_ID] = {
2689cac7dedSGregory Etelson 		.size = sizeof(struct mlx5_flow_tunnel),
269495b2ed4SSuanming Mou 		.trunk_size = MLX5_MAX_TUNNELS,
2709cac7dedSGregory Etelson 		.need_lock = 1,
2719cac7dedSGregory Etelson 		.release_mem_en = 1,
2729cac7dedSGregory Etelson 		.type = "mlx5_tunnel_offload",
2739cac7dedSGregory Etelson 	},
2749cac7dedSGregory Etelson 	[MLX5_IPOOL_TNL_TBL_ID] = {
2759cac7dedSGregory Etelson 		.size = 0,
2769cac7dedSGregory Etelson 		.need_lock = 1,
2779cac7dedSGregory Etelson 		.type = "mlx5_flow_tnl_tbl_ipool",
2789cac7dedSGregory Etelson 	},
279b88341caSSuanming Mou #endif
2809cac7dedSGregory Etelson 	[MLX5_IPOOL_MTR] = {
2818638e2b0SSuanming Mou 		.size = sizeof(struct mlx5_flow_meter),
2828638e2b0SSuanming Mou 		.trunk_size = 64,
2838638e2b0SSuanming Mou 		.grow_trunk = 3,
2848638e2b0SSuanming Mou 		.grow_shift = 2,
2852f3dc1f4SSuanming Mou 		.need_lock = 1,
2868638e2b0SSuanming Mou 		.release_mem_en = 1,
28783c2047cSSuanming Mou 		.malloc = mlx5_malloc,
28883c2047cSSuanming Mou 		.free = mlx5_free,
2898638e2b0SSuanming Mou 		.type = "mlx5_meter_ipool",
2908638e2b0SSuanming Mou 	},
2919cac7dedSGregory Etelson 	[MLX5_IPOOL_MCP] = {
29290e6053aSSuanming Mou 		.size = sizeof(struct mlx5_flow_mreg_copy_resource),
29390e6053aSSuanming Mou 		.trunk_size = 64,
29490e6053aSSuanming Mou 		.grow_trunk = 3,
29590e6053aSSuanming Mou 		.grow_shift = 2,
2962f3dc1f4SSuanming Mou 		.need_lock = 1,
29790e6053aSSuanming Mou 		.release_mem_en = 1,
29883c2047cSSuanming Mou 		.malloc = mlx5_malloc,
29983c2047cSSuanming Mou 		.free = mlx5_free,
30090e6053aSSuanming Mou 		.type = "mlx5_mcp_ipool",
30190e6053aSSuanming Mou 	},
3029cac7dedSGregory Etelson 	[MLX5_IPOOL_HRXQ] = {
303772dc0ebSSuanming Mou 		.size = (sizeof(struct mlx5_hrxq) + MLX5_RSS_HASH_KEY_LEN),
304772dc0ebSSuanming Mou 		.trunk_size = 64,
305772dc0ebSSuanming Mou 		.grow_trunk = 3,
306772dc0ebSSuanming Mou 		.grow_shift = 2,
3072f3dc1f4SSuanming Mou 		.need_lock = 1,
308772dc0ebSSuanming Mou 		.release_mem_en = 1,
30983c2047cSSuanming Mou 		.malloc = mlx5_malloc,
31083c2047cSSuanming Mou 		.free = mlx5_free,
311772dc0ebSSuanming Mou 		.type = "mlx5_hrxq_ipool",
312772dc0ebSSuanming Mou 	},
3139cac7dedSGregory Etelson 	[MLX5_IPOOL_MLX5_FLOW] = {
3145c761238SGregory Etelson 		/*
3155c761238SGregory Etelson 		 * MLX5_IPOOL_MLX5_FLOW size varies for DV and VERBS flows.
3165c761238SGregory Etelson 		 * It set in run time according to PCI function configuration.
3175c761238SGregory Etelson 		 */
3185c761238SGregory Etelson 		.size = 0,
319b88341caSSuanming Mou 		.trunk_size = 64,
320b88341caSSuanming Mou 		.grow_trunk = 3,
321b88341caSSuanming Mou 		.grow_shift = 2,
3222f3dc1f4SSuanming Mou 		.need_lock = 1,
323b88341caSSuanming Mou 		.release_mem_en = 1,
32483c2047cSSuanming Mou 		.malloc = mlx5_malloc,
32583c2047cSSuanming Mou 		.free = mlx5_free,
326b88341caSSuanming Mou 		.type = "mlx5_flow_handle_ipool",
327b88341caSSuanming Mou 	},
3289cac7dedSGregory Etelson 	[MLX5_IPOOL_RTE_FLOW] = {
329ab612adcSSuanming Mou 		.size = sizeof(struct rte_flow),
330ab612adcSSuanming Mou 		.trunk_size = 4096,
331ab612adcSSuanming Mou 		.need_lock = 1,
332ab612adcSSuanming Mou 		.release_mem_en = 1,
33383c2047cSSuanming Mou 		.malloc = mlx5_malloc,
33483c2047cSSuanming Mou 		.free = mlx5_free,
335ab612adcSSuanming Mou 		.type = "rte_flow_ipool",
336ab612adcSSuanming Mou 	},
3379cac7dedSGregory Etelson 	[MLX5_IPOOL_RSS_EXPANTION_FLOW_ID] = {
3384ae8825cSXueming Li 		.size = 0,
3394ae8825cSXueming Li 		.need_lock = 1,
3404ae8825cSXueming Li 		.type = "mlx5_flow_rss_id_ipool",
3414ae8825cSXueming Li 	},
3429cac7dedSGregory Etelson 	[MLX5_IPOOL_RSS_SHARED_ACTIONS] = {
3434a42ac1fSMatan Azrad 		.size = sizeof(struct mlx5_shared_action_rss),
3444a42ac1fSMatan Azrad 		.trunk_size = 64,
3454a42ac1fSMatan Azrad 		.grow_trunk = 3,
3464a42ac1fSMatan Azrad 		.grow_shift = 2,
3474a42ac1fSMatan Azrad 		.need_lock = 1,
3484a42ac1fSMatan Azrad 		.release_mem_en = 1,
3494a42ac1fSMatan Azrad 		.malloc = mlx5_malloc,
3504a42ac1fSMatan Azrad 		.free = mlx5_free,
3514a42ac1fSMatan Azrad 		.type = "mlx5_shared_action_rss",
3524a42ac1fSMatan Azrad 	},
353014d1cbeSSuanming Mou };
354014d1cbeSSuanming Mou 
355014d1cbeSSuanming Mou 
356830d2091SOri Kam #define MLX5_FLOW_MIN_ID_POOL_SIZE 512
357830d2091SOri Kam #define MLX5_ID_GENERATION_ARRAY_FACTOR 16
358830d2091SOri Kam 
359860897d2SBing Zhao #define MLX5_FLOW_TABLE_HLIST_ARRAY_SIZE 4096
360860897d2SBing Zhao 
361830d2091SOri Kam /**
362f935ed4bSDekel Peled  * Initialize the ASO aging management structure.
363f935ed4bSDekel Peled  *
364f935ed4bSDekel Peled  * @param[in] sh
365f935ed4bSDekel Peled  *   Pointer to mlx5_dev_ctx_shared object to free
366f935ed4bSDekel Peled  *
367f935ed4bSDekel Peled  * @return
368f935ed4bSDekel Peled  *   0 on success, a negative errno value otherwise and rte_errno is set.
369f935ed4bSDekel Peled  */
370f935ed4bSDekel Peled int
371f935ed4bSDekel Peled mlx5_flow_aso_age_mng_init(struct mlx5_dev_ctx_shared *sh)
372f935ed4bSDekel Peled {
373f935ed4bSDekel Peled 	int err;
374f935ed4bSDekel Peled 
375f935ed4bSDekel Peled 	if (sh->aso_age_mng)
376f935ed4bSDekel Peled 		return 0;
377f935ed4bSDekel Peled 	sh->aso_age_mng = mlx5_malloc(MLX5_MEM_ZERO, sizeof(*sh->aso_age_mng),
378f935ed4bSDekel Peled 				      RTE_CACHE_LINE_SIZE, SOCKET_ID_ANY);
379f935ed4bSDekel Peled 	if (!sh->aso_age_mng) {
380f935ed4bSDekel Peled 		DRV_LOG(ERR, "aso_age_mng allocation was failed.");
381f935ed4bSDekel Peled 		rte_errno = ENOMEM;
382f935ed4bSDekel Peled 		return -ENOMEM;
383f935ed4bSDekel Peled 	}
384f935ed4bSDekel Peled 	err = mlx5_aso_queue_init(sh);
385f935ed4bSDekel Peled 	if (err) {
386f935ed4bSDekel Peled 		mlx5_free(sh->aso_age_mng);
387f935ed4bSDekel Peled 		return -1;
388f935ed4bSDekel Peled 	}
389f935ed4bSDekel Peled 	rte_spinlock_init(&sh->aso_age_mng->resize_sl);
390f935ed4bSDekel Peled 	rte_spinlock_init(&sh->aso_age_mng->free_sl);
391f935ed4bSDekel Peled 	LIST_INIT(&sh->aso_age_mng->free);
392f935ed4bSDekel Peled 	return 0;
393f935ed4bSDekel Peled }
394f935ed4bSDekel Peled 
395f935ed4bSDekel Peled /**
396f935ed4bSDekel Peled  * Close and release all the resources of the ASO aging management structure.
397f935ed4bSDekel Peled  *
398f935ed4bSDekel Peled  * @param[in] sh
399f935ed4bSDekel Peled  *   Pointer to mlx5_dev_ctx_shared object to free.
400f935ed4bSDekel Peled  */
401f935ed4bSDekel Peled static void
402f935ed4bSDekel Peled mlx5_flow_aso_age_mng_close(struct mlx5_dev_ctx_shared *sh)
403f935ed4bSDekel Peled {
404f935ed4bSDekel Peled 	int i, j;
405f935ed4bSDekel Peled 
406f935ed4bSDekel Peled 	mlx5_aso_queue_stop(sh);
407f935ed4bSDekel Peled 	mlx5_aso_queue_uninit(sh);
408f935ed4bSDekel Peled 	if (sh->aso_age_mng->pools) {
409f935ed4bSDekel Peled 		struct mlx5_aso_age_pool *pool;
410f935ed4bSDekel Peled 
411f935ed4bSDekel Peled 		for (i = 0; i < sh->aso_age_mng->next; ++i) {
412f935ed4bSDekel Peled 			pool = sh->aso_age_mng->pools[i];
413f935ed4bSDekel Peled 			claim_zero(mlx5_devx_cmd_destroy
414f935ed4bSDekel Peled 						(pool->flow_hit_aso_obj));
415f935ed4bSDekel Peled 			for (j = 0; j < MLX5_COUNTERS_PER_POOL; ++j)
416f935ed4bSDekel Peled 				if (pool->actions[j].dr_action)
417f935ed4bSDekel Peled 					claim_zero
418f935ed4bSDekel Peled 						(mlx5_glue->destroy_flow_action
419f935ed4bSDekel Peled 						  (pool->actions[j].dr_action));
420f935ed4bSDekel Peled 			mlx5_free(pool);
421f935ed4bSDekel Peled 		}
422f935ed4bSDekel Peled 		mlx5_free(sh->aso_age_mng->pools);
423f935ed4bSDekel Peled 	}
4247ad0b6d9SDekel Peled 	mlx5_free(sh->aso_age_mng);
425f935ed4bSDekel Peled }
426f935ed4bSDekel Peled 
427f935ed4bSDekel Peled /**
428fa2d01c8SDong Zhou  * Initialize the shared aging list information per port.
429fa2d01c8SDong Zhou  *
430fa2d01c8SDong Zhou  * @param[in] sh
4316e88bc42SOphir Munk  *   Pointer to mlx5_dev_ctx_shared object.
432fa2d01c8SDong Zhou  */
433fa2d01c8SDong Zhou static void
4346e88bc42SOphir Munk mlx5_flow_aging_init(struct mlx5_dev_ctx_shared *sh)
435fa2d01c8SDong Zhou {
436fa2d01c8SDong Zhou 	uint32_t i;
437fa2d01c8SDong Zhou 	struct mlx5_age_info *age_info;
438fa2d01c8SDong Zhou 
439fa2d01c8SDong Zhou 	for (i = 0; i < sh->max_port; i++) {
440fa2d01c8SDong Zhou 		age_info = &sh->port[i].age_info;
441fa2d01c8SDong Zhou 		age_info->flags = 0;
442fa2d01c8SDong Zhou 		TAILQ_INIT(&age_info->aged_counters);
443f9bc5274SMatan Azrad 		LIST_INIT(&age_info->aged_aso);
444fa2d01c8SDong Zhou 		rte_spinlock_init(&age_info->aged_sl);
445fa2d01c8SDong Zhou 		MLX5_AGE_SET(age_info, MLX5_AGE_TRIGGER);
446fa2d01c8SDong Zhou 	}
447fa2d01c8SDong Zhou }
448fa2d01c8SDong Zhou 
449fa2d01c8SDong Zhou /**
4505382d28cSMatan Azrad  * Initialize the counters management structure.
4515382d28cSMatan Azrad  *
4525382d28cSMatan Azrad  * @param[in] sh
4536e88bc42SOphir Munk  *   Pointer to mlx5_dev_ctx_shared object to free
4545382d28cSMatan Azrad  */
4555382d28cSMatan Azrad static void
4566e88bc42SOphir Munk mlx5_flow_counters_mng_init(struct mlx5_dev_ctx_shared *sh)
4575382d28cSMatan Azrad {
458994829e6SSuanming Mou 	int i;
4595382d28cSMatan Azrad 
4605af61440SMatan Azrad 	memset(&sh->cmng, 0, sizeof(sh->cmng));
4615382d28cSMatan Azrad 	TAILQ_INIT(&sh->cmng.flow_counters);
462994829e6SSuanming Mou 	sh->cmng.min_id = MLX5_CNT_BATCH_OFFSET;
463994829e6SSuanming Mou 	sh->cmng.max_id = -1;
464994829e6SSuanming Mou 	sh->cmng.last_pool_idx = POOL_IDX_INVALID;
4653aa27915SSuanming Mou 	rte_spinlock_init(&sh->cmng.pool_update_sl);
466994829e6SSuanming Mou 	for (i = 0; i < MLX5_COUNTER_TYPE_MAX; i++) {
467994829e6SSuanming Mou 		TAILQ_INIT(&sh->cmng.counters[i]);
468994829e6SSuanming Mou 		rte_spinlock_init(&sh->cmng.csl[i]);
469fa2d01c8SDong Zhou 	}
4705382d28cSMatan Azrad }
4715382d28cSMatan Azrad 
4725382d28cSMatan Azrad /**
4735382d28cSMatan Azrad  * Destroy all the resources allocated for a counter memory management.
4745382d28cSMatan Azrad  *
4755382d28cSMatan Azrad  * @param[in] mng
4765382d28cSMatan Azrad  *   Pointer to the memory management structure.
4775382d28cSMatan Azrad  */
4785382d28cSMatan Azrad static void
4795382d28cSMatan Azrad mlx5_flow_destroy_counter_stat_mem_mng(struct mlx5_counter_stats_mem_mng *mng)
4805382d28cSMatan Azrad {
4815382d28cSMatan Azrad 	uint8_t *mem = (uint8_t *)(uintptr_t)mng->raws[0].data;
4825382d28cSMatan Azrad 
4835382d28cSMatan Azrad 	LIST_REMOVE(mng, next);
4845382d28cSMatan Azrad 	claim_zero(mlx5_devx_cmd_destroy(mng->dm));
4855382d28cSMatan Azrad 	claim_zero(mlx5_glue->devx_umem_dereg(mng->umem));
48683c2047cSSuanming Mou 	mlx5_free(mem);
4875382d28cSMatan Azrad }
4885382d28cSMatan Azrad 
4895382d28cSMatan Azrad /**
4905382d28cSMatan Azrad  * Close and release all the resources of the counters management.
4915382d28cSMatan Azrad  *
4925382d28cSMatan Azrad  * @param[in] sh
4936e88bc42SOphir Munk  *   Pointer to mlx5_dev_ctx_shared object to free.
4945382d28cSMatan Azrad  */
4955382d28cSMatan Azrad static void
4966e88bc42SOphir Munk mlx5_flow_counters_mng_close(struct mlx5_dev_ctx_shared *sh)
4975382d28cSMatan Azrad {
4985382d28cSMatan Azrad 	struct mlx5_counter_stats_mem_mng *mng;
4993aa27915SSuanming Mou 	int i, j;
500f15db67dSMatan Azrad 	int retries = 1024;
5015382d28cSMatan Azrad 
502f15db67dSMatan Azrad 	rte_errno = 0;
503f15db67dSMatan Azrad 	while (--retries) {
504f15db67dSMatan Azrad 		rte_eal_alarm_cancel(mlx5_flow_query_alarm, sh);
505f15db67dSMatan Azrad 		if (rte_errno != EINPROGRESS)
506f15db67dSMatan Azrad 			break;
507f15db67dSMatan Azrad 		rte_pause();
508f15db67dSMatan Azrad 	}
5095382d28cSMatan Azrad 
510994829e6SSuanming Mou 	if (sh->cmng.pools) {
511994829e6SSuanming Mou 		struct mlx5_flow_counter_pool *pool;
5123aa27915SSuanming Mou 		uint16_t n_valid = sh->cmng.n_valid;
5132b5b1aebSSuanming Mou 		bool fallback = sh->cmng.counter_fallback;
514994829e6SSuanming Mou 
5153aa27915SSuanming Mou 		for (i = 0; i < n_valid; ++i) {
5163aa27915SSuanming Mou 			pool = sh->cmng.pools[i];
5172b5b1aebSSuanming Mou 			if (!fallback && pool->min_dcs)
5185af61440SMatan Azrad 				claim_zero(mlx5_devx_cmd_destroy
519fa2d01c8SDong Zhou 							       (pool->min_dcs));
5205382d28cSMatan Azrad 			for (j = 0; j < MLX5_COUNTERS_PER_POOL; ++j) {
5212b5b1aebSSuanming Mou 				struct mlx5_flow_counter *cnt =
5222b5b1aebSSuanming Mou 						MLX5_POOL_GET_CNT(pool, j);
5232b5b1aebSSuanming Mou 
5242b5b1aebSSuanming Mou 				if (cnt->action)
5255382d28cSMatan Azrad 					claim_zero
5265382d28cSMatan Azrad 					 (mlx5_glue->destroy_flow_action
5272b5b1aebSSuanming Mou 					  (cnt->action));
5282b5b1aebSSuanming Mou 				if (fallback && MLX5_POOL_GET_CNT
5292b5b1aebSSuanming Mou 				    (pool, j)->dcs_when_free)
5305382d28cSMatan Azrad 					claim_zero(mlx5_devx_cmd_destroy
5312b5b1aebSSuanming Mou 						   (cnt->dcs_when_free));
5325382d28cSMatan Azrad 			}
53383c2047cSSuanming Mou 			mlx5_free(pool);
5345382d28cSMatan Azrad 		}
535994829e6SSuanming Mou 		mlx5_free(sh->cmng.pools);
5365382d28cSMatan Azrad 	}
5375382d28cSMatan Azrad 	mng = LIST_FIRST(&sh->cmng.mem_mngs);
5385382d28cSMatan Azrad 	while (mng) {
5395382d28cSMatan Azrad 		mlx5_flow_destroy_counter_stat_mem_mng(mng);
5405382d28cSMatan Azrad 		mng = LIST_FIRST(&sh->cmng.mem_mngs);
5415382d28cSMatan Azrad 	}
5425382d28cSMatan Azrad 	memset(&sh->cmng, 0, sizeof(sh->cmng));
5435382d28cSMatan Azrad }
5445382d28cSMatan Azrad 
545f935ed4bSDekel Peled /* Send FLOW_AGED event if needed. */
546f935ed4bSDekel Peled void
547f935ed4bSDekel Peled mlx5_age_event_prepare(struct mlx5_dev_ctx_shared *sh)
548f935ed4bSDekel Peled {
549f935ed4bSDekel Peled 	struct mlx5_age_info *age_info;
550f935ed4bSDekel Peled 	uint32_t i;
551f935ed4bSDekel Peled 
552f935ed4bSDekel Peled 	for (i = 0; i < sh->max_port; i++) {
553f935ed4bSDekel Peled 		age_info = &sh->port[i].age_info;
554f935ed4bSDekel Peled 		if (!MLX5_AGE_GET(age_info, MLX5_AGE_EVENT_NEW))
555f935ed4bSDekel Peled 			continue;
556f935ed4bSDekel Peled 		if (MLX5_AGE_GET(age_info, MLX5_AGE_TRIGGER))
557f935ed4bSDekel Peled 			rte_eth_dev_callback_process
558f935ed4bSDekel Peled 				(&rte_eth_devices[sh->port[i].devx_ih_port_id],
559f935ed4bSDekel Peled 				RTE_ETH_EVENT_FLOW_AGED, NULL);
560f935ed4bSDekel Peled 		age_info->flags = 0;
561f935ed4bSDekel Peled 	}
562f935ed4bSDekel Peled }
563f935ed4bSDekel Peled 
5645382d28cSMatan Azrad /**
565014d1cbeSSuanming Mou  * Initialize the flow resources' indexed mempool.
566014d1cbeSSuanming Mou  *
567014d1cbeSSuanming Mou  * @param[in] sh
5686e88bc42SOphir Munk  *   Pointer to mlx5_dev_ctx_shared object.
569b88341caSSuanming Mou  * @param[in] sh
570b88341caSSuanming Mou  *   Pointer to user dev config.
571014d1cbeSSuanming Mou  */
572014d1cbeSSuanming Mou static void
5736e88bc42SOphir Munk mlx5_flow_ipool_create(struct mlx5_dev_ctx_shared *sh,
5745c761238SGregory Etelson 		       const struct mlx5_dev_config *config)
575014d1cbeSSuanming Mou {
576014d1cbeSSuanming Mou 	uint8_t i;
5775c761238SGregory Etelson 	struct mlx5_indexed_pool_config cfg;
578014d1cbeSSuanming Mou 
579a1da6f62SSuanming Mou 	for (i = 0; i < MLX5_IPOOL_MAX; ++i) {
5805c761238SGregory Etelson 		cfg = mlx5_ipool_cfg[i];
5815c761238SGregory Etelson 		switch (i) {
5825c761238SGregory Etelson 		default:
5835c761238SGregory Etelson 			break;
5845c761238SGregory Etelson 		/*
5855c761238SGregory Etelson 		 * Set MLX5_IPOOL_MLX5_FLOW ipool size
5865c761238SGregory Etelson 		 * according to PCI function flow configuration.
5875c761238SGregory Etelson 		 */
5885c761238SGregory Etelson 		case MLX5_IPOOL_MLX5_FLOW:
5895c761238SGregory Etelson 			cfg.size = config->dv_flow_en ?
5905c761238SGregory Etelson 				sizeof(struct mlx5_flow_handle) :
5915c761238SGregory Etelson 				MLX5_FLOW_HANDLE_VERBS_SIZE;
5925c761238SGregory Etelson 			break;
5935c761238SGregory Etelson 		}
594a1da6f62SSuanming Mou 		if (config->reclaim_mode)
5955c761238SGregory Etelson 			cfg.release_mem_en = 1;
5965c761238SGregory Etelson 		sh->ipool[i] = mlx5_ipool_create(&cfg);
597014d1cbeSSuanming Mou 	}
598a1da6f62SSuanming Mou }
599014d1cbeSSuanming Mou 
600014d1cbeSSuanming Mou /**
601014d1cbeSSuanming Mou  * Release the flow resources' indexed mempool.
602014d1cbeSSuanming Mou  *
603014d1cbeSSuanming Mou  * @param[in] sh
6046e88bc42SOphir Munk  *   Pointer to mlx5_dev_ctx_shared object.
605014d1cbeSSuanming Mou  */
606014d1cbeSSuanming Mou static void
6076e88bc42SOphir Munk mlx5_flow_ipool_destroy(struct mlx5_dev_ctx_shared *sh)
608014d1cbeSSuanming Mou {
609014d1cbeSSuanming Mou 	uint8_t i;
610014d1cbeSSuanming Mou 
611014d1cbeSSuanming Mou 	for (i = 0; i < MLX5_IPOOL_MAX; ++i)
612014d1cbeSSuanming Mou 		mlx5_ipool_destroy(sh->ipool[i]);
613014d1cbeSSuanming Mou }
614014d1cbeSSuanming Mou 
615daa38a89SBing Zhao /*
616daa38a89SBing Zhao  * Check if dynamic flex parser for eCPRI already exists.
617daa38a89SBing Zhao  *
618daa38a89SBing Zhao  * @param dev
619daa38a89SBing Zhao  *   Pointer to Ethernet device structure.
620daa38a89SBing Zhao  *
621daa38a89SBing Zhao  * @return
622daa38a89SBing Zhao  *   true on exists, false on not.
623daa38a89SBing Zhao  */
624daa38a89SBing Zhao bool
625daa38a89SBing Zhao mlx5_flex_parser_ecpri_exist(struct rte_eth_dev *dev)
626daa38a89SBing Zhao {
627daa38a89SBing Zhao 	struct mlx5_priv *priv = dev->data->dev_private;
628daa38a89SBing Zhao 	struct mlx5_flex_parser_profiles *prf =
629daa38a89SBing Zhao 				&priv->sh->fp[MLX5_FLEX_PARSER_ECPRI_0];
630daa38a89SBing Zhao 
631daa38a89SBing Zhao 	return !!prf->obj;
632daa38a89SBing Zhao }
633daa38a89SBing Zhao 
634daa38a89SBing Zhao /*
635daa38a89SBing Zhao  * Allocation of a flex parser for eCPRI. Once created, this parser related
636daa38a89SBing Zhao  * resources will be held until the device is closed.
637daa38a89SBing Zhao  *
638daa38a89SBing Zhao  * @param dev
639daa38a89SBing Zhao  *   Pointer to Ethernet device structure.
640daa38a89SBing Zhao  *
641daa38a89SBing Zhao  * @return
642daa38a89SBing Zhao  *   0 on success, a negative errno value otherwise and rte_errno is set.
643daa38a89SBing Zhao  */
644daa38a89SBing Zhao int
645daa38a89SBing Zhao mlx5_flex_parser_ecpri_alloc(struct rte_eth_dev *dev)
646daa38a89SBing Zhao {
647daa38a89SBing Zhao 	struct mlx5_priv *priv = dev->data->dev_private;
648daa38a89SBing Zhao 	struct mlx5_flex_parser_profiles *prf =
649daa38a89SBing Zhao 				&priv->sh->fp[MLX5_FLEX_PARSER_ECPRI_0];
6501c506404SBing Zhao 	struct mlx5_devx_graph_node_attr node = {
6511c506404SBing Zhao 		.modify_field_select = 0,
6521c506404SBing Zhao 	};
6531c506404SBing Zhao 	uint32_t ids[8];
6541c506404SBing Zhao 	int ret;
655daa38a89SBing Zhao 
656d7c49561SBing Zhao 	if (!priv->config.hca_attr.parse_graph_flex_node) {
657d7c49561SBing Zhao 		DRV_LOG(ERR, "Dynamic flex parser is not supported "
658d7c49561SBing Zhao 			"for device %s.", priv->dev_data->name);
659d7c49561SBing Zhao 		return -ENOTSUP;
660d7c49561SBing Zhao 	}
6611c506404SBing Zhao 	node.header_length_mode = MLX5_GRAPH_NODE_LEN_FIXED;
6621c506404SBing Zhao 	/* 8 bytes now: 4B common header + 4B message body header. */
6631c506404SBing Zhao 	node.header_length_base_value = 0x8;
6641c506404SBing Zhao 	/* After MAC layer: Ether / VLAN. */
6651c506404SBing Zhao 	node.in[0].arc_parse_graph_node = MLX5_GRAPH_ARC_NODE_MAC;
6661c506404SBing Zhao 	/* Type of compared condition should be 0xAEFE in the L2 layer. */
6671c506404SBing Zhao 	node.in[0].compare_condition_value = RTE_ETHER_TYPE_ECPRI;
6681c506404SBing Zhao 	/* Sample #0: type in common header. */
6691c506404SBing Zhao 	node.sample[0].flow_match_sample_en = 1;
6701c506404SBing Zhao 	/* Fixed offset. */
6711c506404SBing Zhao 	node.sample[0].flow_match_sample_offset_mode = 0x0;
6721c506404SBing Zhao 	/* Only the 2nd byte will be used. */
6731c506404SBing Zhao 	node.sample[0].flow_match_sample_field_base_offset = 0x0;
6741c506404SBing Zhao 	/* Sample #1: message payload. */
6751c506404SBing Zhao 	node.sample[1].flow_match_sample_en = 1;
6761c506404SBing Zhao 	/* Fixed offset. */
6771c506404SBing Zhao 	node.sample[1].flow_match_sample_offset_mode = 0x0;
6781c506404SBing Zhao 	/*
6791c506404SBing Zhao 	 * Only the first two bytes will be used right now, and its offset will
6801c506404SBing Zhao 	 * start after the common header that with the length of a DW(u32).
6811c506404SBing Zhao 	 */
6821c506404SBing Zhao 	node.sample[1].flow_match_sample_field_base_offset = sizeof(uint32_t);
6831c506404SBing Zhao 	prf->obj = mlx5_devx_cmd_create_flex_parser(priv->sh->ctx, &node);
6841c506404SBing Zhao 	if (!prf->obj) {
6851c506404SBing Zhao 		DRV_LOG(ERR, "Failed to create flex parser node object.");
6861c506404SBing Zhao 		return (rte_errno == 0) ? -ENODEV : -rte_errno;
6871c506404SBing Zhao 	}
6881c506404SBing Zhao 	prf->num = 2;
6891c506404SBing Zhao 	ret = mlx5_devx_cmd_query_parse_samples(prf->obj, ids, prf->num);
6901c506404SBing Zhao 	if (ret) {
6911c506404SBing Zhao 		DRV_LOG(ERR, "Failed to query sample IDs.");
6921c506404SBing Zhao 		return (rte_errno == 0) ? -ENODEV : -rte_errno;
6931c506404SBing Zhao 	}
6941c506404SBing Zhao 	prf->offset[0] = 0x0;
6951c506404SBing Zhao 	prf->offset[1] = sizeof(uint32_t);
6961c506404SBing Zhao 	prf->ids[0] = ids[0];
6971c506404SBing Zhao 	prf->ids[1] = ids[1];
698daa38a89SBing Zhao 	return 0;
699daa38a89SBing Zhao }
700daa38a89SBing Zhao 
7011c506404SBing Zhao /*
7021c506404SBing Zhao  * Destroy the flex parser node, including the parser itself, input / output
7031c506404SBing Zhao  * arcs and DW samples. Resources could be reused then.
7041c506404SBing Zhao  *
7051c506404SBing Zhao  * @param dev
7061c506404SBing Zhao  *   Pointer to Ethernet device structure.
7071c506404SBing Zhao  */
7081c506404SBing Zhao static void
7091c506404SBing Zhao mlx5_flex_parser_ecpri_release(struct rte_eth_dev *dev)
7101c506404SBing Zhao {
7111c506404SBing Zhao 	struct mlx5_priv *priv = dev->data->dev_private;
7121c506404SBing Zhao 	struct mlx5_flex_parser_profiles *prf =
7131c506404SBing Zhao 				&priv->sh->fp[MLX5_FLEX_PARSER_ECPRI_0];
7141c506404SBing Zhao 
7151c506404SBing Zhao 	if (prf->obj)
7161c506404SBing Zhao 		mlx5_devx_cmd_destroy(prf->obj);
7171c506404SBing Zhao 	prf->obj = NULL;
7181c506404SBing Zhao }
7191c506404SBing Zhao 
720a0bfe9d5SViacheslav Ovsiienko /*
721a0bfe9d5SViacheslav Ovsiienko  * Allocate Rx and Tx UARs in robust fashion.
722a0bfe9d5SViacheslav Ovsiienko  * This routine handles the following UAR allocation issues:
723a0bfe9d5SViacheslav Ovsiienko  *
724a0bfe9d5SViacheslav Ovsiienko  *  - tries to allocate the UAR with the most appropriate memory
725a0bfe9d5SViacheslav Ovsiienko  *    mapping type from the ones supported by the host
726a0bfe9d5SViacheslav Ovsiienko  *
727a0bfe9d5SViacheslav Ovsiienko  *  - tries to allocate the UAR with non-NULL base address
728a0bfe9d5SViacheslav Ovsiienko  *    OFED 5.0.x and Upstream rdma_core before v29 returned the NULL as
729a0bfe9d5SViacheslav Ovsiienko  *    UAR base address if UAR was not the first object in the UAR page.
730a0bfe9d5SViacheslav Ovsiienko  *    It caused the PMD failure and we should try to get another UAR
731a0bfe9d5SViacheslav Ovsiienko  *    till we get the first one with non-NULL base address returned.
732a0bfe9d5SViacheslav Ovsiienko  */
733a0bfe9d5SViacheslav Ovsiienko static int
734a0bfe9d5SViacheslav Ovsiienko mlx5_alloc_rxtx_uars(struct mlx5_dev_ctx_shared *sh,
735a0bfe9d5SViacheslav Ovsiienko 		     const struct mlx5_dev_config *config)
736a0bfe9d5SViacheslav Ovsiienko {
737a0bfe9d5SViacheslav Ovsiienko 	uint32_t uar_mapping, retry;
738a0bfe9d5SViacheslav Ovsiienko 	int err = 0;
7391f66ac5bSOphir Munk 	void *base_addr;
740a0bfe9d5SViacheslav Ovsiienko 
741a0bfe9d5SViacheslav Ovsiienko 	for (retry = 0; retry < MLX5_ALLOC_UAR_RETRY; ++retry) {
742a0bfe9d5SViacheslav Ovsiienko #ifdef MLX5DV_UAR_ALLOC_TYPE_NC
743a0bfe9d5SViacheslav Ovsiienko 		/* Control the mapping type according to the settings. */
744a0bfe9d5SViacheslav Ovsiienko 		uar_mapping = (config->dbnc == MLX5_TXDB_NCACHED) ?
745a0bfe9d5SViacheslav Ovsiienko 			      MLX5DV_UAR_ALLOC_TYPE_NC :
746a0bfe9d5SViacheslav Ovsiienko 			      MLX5DV_UAR_ALLOC_TYPE_BF;
747a0bfe9d5SViacheslav Ovsiienko #else
748a0bfe9d5SViacheslav Ovsiienko 		RTE_SET_USED(config);
749a0bfe9d5SViacheslav Ovsiienko 		/*
750a0bfe9d5SViacheslav Ovsiienko 		 * It seems we have no way to control the memory mapping type
751a0bfe9d5SViacheslav Ovsiienko 		 * for the UAR, the default "Write-Combining" type is supposed.
752a0bfe9d5SViacheslav Ovsiienko 		 * The UAR initialization on queue creation queries the
753a0bfe9d5SViacheslav Ovsiienko 		 * actual mapping type done by Verbs/kernel and setups the
754a0bfe9d5SViacheslav Ovsiienko 		 * PMD datapath accordingly.
755a0bfe9d5SViacheslav Ovsiienko 		 */
756a0bfe9d5SViacheslav Ovsiienko 		uar_mapping = 0;
757a0bfe9d5SViacheslav Ovsiienko #endif
758a0bfe9d5SViacheslav Ovsiienko 		sh->tx_uar = mlx5_glue->devx_alloc_uar(sh->ctx, uar_mapping);
759a0bfe9d5SViacheslav Ovsiienko #ifdef MLX5DV_UAR_ALLOC_TYPE_NC
760a0bfe9d5SViacheslav Ovsiienko 		if (!sh->tx_uar &&
761a0bfe9d5SViacheslav Ovsiienko 		    uar_mapping == MLX5DV_UAR_ALLOC_TYPE_BF) {
762a0bfe9d5SViacheslav Ovsiienko 			if (config->dbnc == MLX5_TXDB_CACHED ||
763a0bfe9d5SViacheslav Ovsiienko 			    config->dbnc == MLX5_TXDB_HEURISTIC)
764a0bfe9d5SViacheslav Ovsiienko 				DRV_LOG(WARNING, "Devarg tx_db_nc setting "
765a0bfe9d5SViacheslav Ovsiienko 						 "is not supported by DevX");
766a0bfe9d5SViacheslav Ovsiienko 			/*
767a0bfe9d5SViacheslav Ovsiienko 			 * In some environments like virtual machine
768a0bfe9d5SViacheslav Ovsiienko 			 * the Write Combining mapped might be not supported
769a0bfe9d5SViacheslav Ovsiienko 			 * and UAR allocation fails. We try "Non-Cached"
770a0bfe9d5SViacheslav Ovsiienko 			 * mapping for the case. The tx_burst routines take
771a0bfe9d5SViacheslav Ovsiienko 			 * the UAR mapping type into account on UAR setup
772a0bfe9d5SViacheslav Ovsiienko 			 * on queue creation.
773a0bfe9d5SViacheslav Ovsiienko 			 */
774a0bfe9d5SViacheslav Ovsiienko 			DRV_LOG(WARNING, "Failed to allocate Tx DevX UAR (BF)");
775a0bfe9d5SViacheslav Ovsiienko 			uar_mapping = MLX5DV_UAR_ALLOC_TYPE_NC;
776a0bfe9d5SViacheslav Ovsiienko 			sh->tx_uar = mlx5_glue->devx_alloc_uar
777a0bfe9d5SViacheslav Ovsiienko 							(sh->ctx, uar_mapping);
778a0bfe9d5SViacheslav Ovsiienko 		} else if (!sh->tx_uar &&
779a0bfe9d5SViacheslav Ovsiienko 			   uar_mapping == MLX5DV_UAR_ALLOC_TYPE_NC) {
780a0bfe9d5SViacheslav Ovsiienko 			if (config->dbnc == MLX5_TXDB_NCACHED)
781a0bfe9d5SViacheslav Ovsiienko 				DRV_LOG(WARNING, "Devarg tx_db_nc settings "
782a0bfe9d5SViacheslav Ovsiienko 						 "is not supported by DevX");
783a0bfe9d5SViacheslav Ovsiienko 			/*
784a0bfe9d5SViacheslav Ovsiienko 			 * If Verbs/kernel does not support "Non-Cached"
785a0bfe9d5SViacheslav Ovsiienko 			 * try the "Write-Combining".
786a0bfe9d5SViacheslav Ovsiienko 			 */
787a0bfe9d5SViacheslav Ovsiienko 			DRV_LOG(WARNING, "Failed to allocate Tx DevX UAR (NC)");
788a0bfe9d5SViacheslav Ovsiienko 			uar_mapping = MLX5DV_UAR_ALLOC_TYPE_BF;
789a0bfe9d5SViacheslav Ovsiienko 			sh->tx_uar = mlx5_glue->devx_alloc_uar
790a0bfe9d5SViacheslav Ovsiienko 							(sh->ctx, uar_mapping);
791a0bfe9d5SViacheslav Ovsiienko 		}
792a0bfe9d5SViacheslav Ovsiienko #endif
793a0bfe9d5SViacheslav Ovsiienko 		if (!sh->tx_uar) {
794a0bfe9d5SViacheslav Ovsiienko 			DRV_LOG(ERR, "Failed to allocate Tx DevX UAR (BF/NC)");
795a0bfe9d5SViacheslav Ovsiienko 			err = ENOMEM;
796a0bfe9d5SViacheslav Ovsiienko 			goto exit;
797a0bfe9d5SViacheslav Ovsiienko 		}
7981f66ac5bSOphir Munk 		base_addr = mlx5_os_get_devx_uar_base_addr(sh->tx_uar);
7991f66ac5bSOphir Munk 		if (base_addr)
800a0bfe9d5SViacheslav Ovsiienko 			break;
801a0bfe9d5SViacheslav Ovsiienko 		/*
802a0bfe9d5SViacheslav Ovsiienko 		 * The UARs are allocated by rdma_core within the
803a0bfe9d5SViacheslav Ovsiienko 		 * IB device context, on context closure all UARs
804a0bfe9d5SViacheslav Ovsiienko 		 * will be freed, should be no memory/object leakage.
805a0bfe9d5SViacheslav Ovsiienko 		 */
806a0bfe9d5SViacheslav Ovsiienko 		DRV_LOG(WARNING, "Retrying to allocate Tx DevX UAR");
807a0bfe9d5SViacheslav Ovsiienko 		sh->tx_uar = NULL;
808a0bfe9d5SViacheslav Ovsiienko 	}
809a0bfe9d5SViacheslav Ovsiienko 	/* Check whether we finally succeeded with valid UAR allocation. */
810a0bfe9d5SViacheslav Ovsiienko 	if (!sh->tx_uar) {
811a0bfe9d5SViacheslav Ovsiienko 		DRV_LOG(ERR, "Failed to allocate Tx DevX UAR (NULL base)");
812a0bfe9d5SViacheslav Ovsiienko 		err = ENOMEM;
813a0bfe9d5SViacheslav Ovsiienko 		goto exit;
814a0bfe9d5SViacheslav Ovsiienko 	}
815a0bfe9d5SViacheslav Ovsiienko 	for (retry = 0; retry < MLX5_ALLOC_UAR_RETRY; ++retry) {
816a0bfe9d5SViacheslav Ovsiienko 		uar_mapping = 0;
817a0bfe9d5SViacheslav Ovsiienko 		sh->devx_rx_uar = mlx5_glue->devx_alloc_uar
818a0bfe9d5SViacheslav Ovsiienko 							(sh->ctx, uar_mapping);
819a0bfe9d5SViacheslav Ovsiienko #ifdef MLX5DV_UAR_ALLOC_TYPE_NC
820a0bfe9d5SViacheslav Ovsiienko 		if (!sh->devx_rx_uar &&
821a0bfe9d5SViacheslav Ovsiienko 		    uar_mapping == MLX5DV_UAR_ALLOC_TYPE_BF) {
822a0bfe9d5SViacheslav Ovsiienko 			/*
823a0bfe9d5SViacheslav Ovsiienko 			 * Rx UAR is used to control interrupts only,
824a0bfe9d5SViacheslav Ovsiienko 			 * should be no datapath noticeable impact,
825a0bfe9d5SViacheslav Ovsiienko 			 * can try "Non-Cached" mapping safely.
826a0bfe9d5SViacheslav Ovsiienko 			 */
827a0bfe9d5SViacheslav Ovsiienko 			DRV_LOG(WARNING, "Failed to allocate Rx DevX UAR (BF)");
828a0bfe9d5SViacheslav Ovsiienko 			uar_mapping = MLX5DV_UAR_ALLOC_TYPE_NC;
829a0bfe9d5SViacheslav Ovsiienko 			sh->devx_rx_uar = mlx5_glue->devx_alloc_uar
830a0bfe9d5SViacheslav Ovsiienko 							(sh->ctx, uar_mapping);
831a0bfe9d5SViacheslav Ovsiienko 		}
832a0bfe9d5SViacheslav Ovsiienko #endif
833a0bfe9d5SViacheslav Ovsiienko 		if (!sh->devx_rx_uar) {
834a0bfe9d5SViacheslav Ovsiienko 			DRV_LOG(ERR, "Failed to allocate Rx DevX UAR (BF/NC)");
835a0bfe9d5SViacheslav Ovsiienko 			err = ENOMEM;
836a0bfe9d5SViacheslav Ovsiienko 			goto exit;
837a0bfe9d5SViacheslav Ovsiienko 		}
8381f66ac5bSOphir Munk 		base_addr = mlx5_os_get_devx_uar_base_addr(sh->devx_rx_uar);
8391f66ac5bSOphir Munk 		if (base_addr)
840a0bfe9d5SViacheslav Ovsiienko 			break;
841a0bfe9d5SViacheslav Ovsiienko 		/*
842a0bfe9d5SViacheslav Ovsiienko 		 * The UARs are allocated by rdma_core within the
843a0bfe9d5SViacheslav Ovsiienko 		 * IB device context, on context closure all UARs
844a0bfe9d5SViacheslav Ovsiienko 		 * will be freed, should be no memory/object leakage.
845a0bfe9d5SViacheslav Ovsiienko 		 */
846a0bfe9d5SViacheslav Ovsiienko 		DRV_LOG(WARNING, "Retrying to allocate Rx DevX UAR");
847a0bfe9d5SViacheslav Ovsiienko 		sh->devx_rx_uar = NULL;
848a0bfe9d5SViacheslav Ovsiienko 	}
849a0bfe9d5SViacheslav Ovsiienko 	/* Check whether we finally succeeded with valid UAR allocation. */
850a0bfe9d5SViacheslav Ovsiienko 	if (!sh->devx_rx_uar) {
851a0bfe9d5SViacheslav Ovsiienko 		DRV_LOG(ERR, "Failed to allocate Rx DevX UAR (NULL base)");
852a0bfe9d5SViacheslav Ovsiienko 		err = ENOMEM;
853a0bfe9d5SViacheslav Ovsiienko 	}
854a0bfe9d5SViacheslav Ovsiienko exit:
855a0bfe9d5SViacheslav Ovsiienko 	return err;
856a0bfe9d5SViacheslav Ovsiienko }
857a0bfe9d5SViacheslav Ovsiienko 
858014d1cbeSSuanming Mou /**
85991389890SOphir Munk  * Allocate shared device context. If there is multiport device the
86017e19bc4SViacheslav Ovsiienko  * master and representors will share this context, if there is single
86191389890SOphir Munk  * port dedicated device, the context will be used by only given
86217e19bc4SViacheslav Ovsiienko  * port due to unification.
86317e19bc4SViacheslav Ovsiienko  *
86491389890SOphir Munk  * Routine first searches the context for the specified device name,
86517e19bc4SViacheslav Ovsiienko  * if found the shared context assumed and reference counter is incremented.
86617e19bc4SViacheslav Ovsiienko  * If no context found the new one is created and initialized with specified
86791389890SOphir Munk  * device context and parameters.
86817e19bc4SViacheslav Ovsiienko  *
86917e19bc4SViacheslav Ovsiienko  * @param[in] spawn
87091389890SOphir Munk  *   Pointer to the device attributes (name, port, etc).
8718409a285SViacheslav Ovsiienko  * @param[in] config
8728409a285SViacheslav Ovsiienko  *   Pointer to device configuration structure.
87317e19bc4SViacheslav Ovsiienko  *
87417e19bc4SViacheslav Ovsiienko  * @return
8756e88bc42SOphir Munk  *   Pointer to mlx5_dev_ctx_shared object on success,
87617e19bc4SViacheslav Ovsiienko  *   otherwise NULL and rte_errno is set.
87717e19bc4SViacheslav Ovsiienko  */
8782eb4d010SOphir Munk struct mlx5_dev_ctx_shared *
87991389890SOphir Munk mlx5_alloc_shared_dev_ctx(const struct mlx5_dev_spawn_data *spawn,
8808409a285SViacheslav Ovsiienko 			   const struct mlx5_dev_config *config)
88117e19bc4SViacheslav Ovsiienko {
8826e88bc42SOphir Munk 	struct mlx5_dev_ctx_shared *sh;
88317e19bc4SViacheslav Ovsiienko 	int err = 0;
88453e5a82fSViacheslav Ovsiienko 	uint32_t i;
885ae18a1aeSOri Kam 	struct mlx5_devx_tis_attr tis_attr = { 0 };
88617e19bc4SViacheslav Ovsiienko 
8878e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(spawn);
88817e19bc4SViacheslav Ovsiienko 	/* Secondary process should not create the shared context. */
8898e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(rte_eal_process_type() == RTE_PROC_PRIMARY);
89091389890SOphir Munk 	pthread_mutex_lock(&mlx5_dev_ctx_list_mutex);
89117e19bc4SViacheslav Ovsiienko 	/* Search for IB context by device name. */
89291389890SOphir Munk 	LIST_FOREACH(sh, &mlx5_dev_ctx_list, next) {
893834a9019SOphir Munk 		if (!strcmp(sh->ibdev_name,
894834a9019SOphir Munk 			mlx5_os_get_dev_device_name(spawn->phys_dev))) {
89517e19bc4SViacheslav Ovsiienko 			sh->refcnt++;
89617e19bc4SViacheslav Ovsiienko 			goto exit;
89717e19bc4SViacheslav Ovsiienko 		}
89817e19bc4SViacheslav Ovsiienko 	}
899ae4eb7dcSViacheslav Ovsiienko 	/* No device found, we have to create new shared context. */
9008e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(spawn->max_port);
9012175c4dcSSuanming Mou 	sh = mlx5_malloc(MLX5_MEM_ZERO | MLX5_MEM_RTE,
9026e88bc42SOphir Munk 			 sizeof(struct mlx5_dev_ctx_shared) +
90317e19bc4SViacheslav Ovsiienko 			 spawn->max_port *
90491389890SOphir Munk 			 sizeof(struct mlx5_dev_shared_port),
9052175c4dcSSuanming Mou 			 RTE_CACHE_LINE_SIZE, SOCKET_ID_ANY);
90617e19bc4SViacheslav Ovsiienko 	if (!sh) {
90717e19bc4SViacheslav Ovsiienko 		DRV_LOG(ERR, "shared context allocation failure");
90817e19bc4SViacheslav Ovsiienko 		rte_errno  = ENOMEM;
90917e19bc4SViacheslav Ovsiienko 		goto exit;
91017e19bc4SViacheslav Ovsiienko 	}
9112eb4d010SOphir Munk 	err = mlx5_os_open_device(spawn, config, sh);
91206f78b5eSViacheslav Ovsiienko 	if (!sh->ctx)
91317e19bc4SViacheslav Ovsiienko 		goto error;
914e85f623eSOphir Munk 	err = mlx5_os_get_dev_attr(sh->ctx, &sh->device_attr);
91517e19bc4SViacheslav Ovsiienko 	if (err) {
916e85f623eSOphir Munk 		DRV_LOG(DEBUG, "mlx5_os_get_dev_attr() failed");
91717e19bc4SViacheslav Ovsiienko 		goto error;
91817e19bc4SViacheslav Ovsiienko 	}
91917e19bc4SViacheslav Ovsiienko 	sh->refcnt = 1;
920e6818853SXueming Li 	sh->bond_dev = UINT16_MAX;
92117e19bc4SViacheslav Ovsiienko 	sh->max_port = spawn->max_port;
922f44b09f9SOphir Munk 	strncpy(sh->ibdev_name, mlx5_os_get_ctx_device_name(sh->ctx),
923f44b09f9SOphir Munk 		sizeof(sh->ibdev_name) - 1);
924f44b09f9SOphir Munk 	strncpy(sh->ibdev_path, mlx5_os_get_ctx_device_path(sh->ctx),
925f44b09f9SOphir Munk 		sizeof(sh->ibdev_path) - 1);
92653e5a82fSViacheslav Ovsiienko 	/*
92753e5a82fSViacheslav Ovsiienko 	 * Setting port_id to max unallowed value means
92853e5a82fSViacheslav Ovsiienko 	 * there is no interrupt subhandler installed for
92953e5a82fSViacheslav Ovsiienko 	 * the given port index i.
93053e5a82fSViacheslav Ovsiienko 	 */
93123242063SMatan Azrad 	for (i = 0; i < sh->max_port; i++) {
93253e5a82fSViacheslav Ovsiienko 		sh->port[i].ih_port_id = RTE_MAX_ETHPORTS;
93323242063SMatan Azrad 		sh->port[i].devx_ih_port_id = RTE_MAX_ETHPORTS;
93423242063SMatan Azrad 	}
935*1cb210abSOphir Munk 	sh->pd = mlx5_os_alloc_pd(sh->ctx);
93617e19bc4SViacheslav Ovsiienko 	if (sh->pd == NULL) {
93717e19bc4SViacheslav Ovsiienko 		DRV_LOG(ERR, "PD allocation failure");
93817e19bc4SViacheslav Ovsiienko 		err = ENOMEM;
93917e19bc4SViacheslav Ovsiienko 		goto error;
94017e19bc4SViacheslav Ovsiienko 	}
941ae18a1aeSOri Kam 	if (sh->devx) {
942e7055bbfSMichael Baum 		/* Query the EQN for this core. */
9438dc775d8SMatan Azrad 		err = mlx5_glue->devx_query_eqn(sh->ctx, 0, &sh->eqn);
944e7055bbfSMichael Baum 		if (err) {
945e7055bbfSMichael Baum 			rte_errno = errno;
946e7055bbfSMichael Baum 			DRV_LOG(ERR, "Failed to query event queue number %d.",
947e7055bbfSMichael Baum 				rte_errno);
948e7055bbfSMichael Baum 			goto error;
949e7055bbfSMichael Baum 		}
9502eb4d010SOphir Munk 		err = mlx5_os_get_pdn(sh->pd, &sh->pdn);
951b9d86122SDekel Peled 		if (err) {
952b9d86122SDekel Peled 			DRV_LOG(ERR, "Fail to extract pdn from PD");
953b9d86122SDekel Peled 			goto error;
954b9d86122SDekel Peled 		}
955ae18a1aeSOri Kam 		sh->td = mlx5_devx_cmd_create_td(sh->ctx);
956ae18a1aeSOri Kam 		if (!sh->td) {
957ae18a1aeSOri Kam 			DRV_LOG(ERR, "TD allocation failure");
958ae18a1aeSOri Kam 			err = ENOMEM;
959ae18a1aeSOri Kam 			goto error;
960ae18a1aeSOri Kam 		}
961ae18a1aeSOri Kam 		tis_attr.transport_domain = sh->td->id;
962ae18a1aeSOri Kam 		sh->tis = mlx5_devx_cmd_create_tis(sh->ctx, &tis_attr);
963ae18a1aeSOri Kam 		if (!sh->tis) {
964ae18a1aeSOri Kam 			DRV_LOG(ERR, "TIS allocation failure");
965ae18a1aeSOri Kam 			err = ENOMEM;
966ae18a1aeSOri Kam 			goto error;
967ae18a1aeSOri Kam 		}
968a0bfe9d5SViacheslav Ovsiienko 		err = mlx5_alloc_rxtx_uars(sh, config);
969a0bfe9d5SViacheslav Ovsiienko 		if (err)
970fc4d4f73SViacheslav Ovsiienko 			goto error;
9711f66ac5bSOphir Munk 		MLX5_ASSERT(sh->tx_uar);
9721f66ac5bSOphir Munk 		MLX5_ASSERT(mlx5_os_get_devx_uar_base_addr(sh->tx_uar));
9731f66ac5bSOphir Munk 
9741f66ac5bSOphir Munk 		MLX5_ASSERT(sh->devx_rx_uar);
9751f66ac5bSOphir Munk 		MLX5_ASSERT(mlx5_os_get_devx_uar_base_addr(sh->devx_rx_uar));
976ae18a1aeSOri Kam 	}
97724feb045SViacheslav Ovsiienko #ifndef RTE_ARCH_64
97824feb045SViacheslav Ovsiienko 	/* Initialize UAR access locks for 32bit implementations. */
97924feb045SViacheslav Ovsiienko 	rte_spinlock_init(&sh->uar_lock_cq);
98024feb045SViacheslav Ovsiienko 	for (i = 0; i < MLX5_UAR_PAGE_NUM_MAX; i++)
98124feb045SViacheslav Ovsiienko 		rte_spinlock_init(&sh->uar_lock[i]);
98224feb045SViacheslav Ovsiienko #endif
983ab3cffcfSViacheslav Ovsiienko 	/*
984ab3cffcfSViacheslav Ovsiienko 	 * Once the device is added to the list of memory event
985ab3cffcfSViacheslav Ovsiienko 	 * callback, its global MR cache table cannot be expanded
986ab3cffcfSViacheslav Ovsiienko 	 * on the fly because of deadlock. If it overflows, lookup
987ab3cffcfSViacheslav Ovsiienko 	 * should be done by searching MR list linearly, which is slow.
988ab3cffcfSViacheslav Ovsiienko 	 *
989ab3cffcfSViacheslav Ovsiienko 	 * At this point the device is not added to the memory
990ab3cffcfSViacheslav Ovsiienko 	 * event list yet, context is just being created.
991ab3cffcfSViacheslav Ovsiienko 	 */
992b8dc6b0eSVu Pham 	err = mlx5_mr_btree_init(&sh->share_cache.cache,
993ab3cffcfSViacheslav Ovsiienko 				 MLX5_MR_BTREE_CACHE_N * 2,
99446e10a4cSViacheslav Ovsiienko 				 spawn->pci_dev->device.numa_node);
995ab3cffcfSViacheslav Ovsiienko 	if (err) {
996ab3cffcfSViacheslav Ovsiienko 		err = rte_errno;
997ab3cffcfSViacheslav Ovsiienko 		goto error;
998ab3cffcfSViacheslav Ovsiienko 	}
999d5ed8aa9SOphir Munk 	mlx5_os_set_reg_mr_cb(&sh->share_cache.reg_mr_cb,
1000d5ed8aa9SOphir Munk 			      &sh->share_cache.dereg_mr_cb);
10012eb4d010SOphir Munk 	mlx5_os_dev_shared_handler_install(sh);
1002632f0f19SSuanming Mou 	sh->cnt_id_tbl = mlx5_l3t_create(MLX5_L3T_TYPE_DWORD);
1003632f0f19SSuanming Mou 	if (!sh->cnt_id_tbl) {
1004632f0f19SSuanming Mou 		err = rte_errno;
1005632f0f19SSuanming Mou 		goto error;
1006632f0f19SSuanming Mou 	}
1007fa2d01c8SDong Zhou 	mlx5_flow_aging_init(sh);
10085382d28cSMatan Azrad 	mlx5_flow_counters_mng_init(sh);
1009b88341caSSuanming Mou 	mlx5_flow_ipool_create(sh, config);
10100e3d0525SViacheslav Ovsiienko 	/* Add device to memory callback list. */
10110e3d0525SViacheslav Ovsiienko 	rte_rwlock_write_lock(&mlx5_shared_data->mem_event_rwlock);
10120e3d0525SViacheslav Ovsiienko 	LIST_INSERT_HEAD(&mlx5_shared_data->mem_event_cb_list,
10130e3d0525SViacheslav Ovsiienko 			 sh, mem_event_cb);
10140e3d0525SViacheslav Ovsiienko 	rte_rwlock_write_unlock(&mlx5_shared_data->mem_event_rwlock);
10150e3d0525SViacheslav Ovsiienko 	/* Add context to the global device list. */
101691389890SOphir Munk 	LIST_INSERT_HEAD(&mlx5_dev_ctx_list, sh, next);
101717e19bc4SViacheslav Ovsiienko exit:
101891389890SOphir Munk 	pthread_mutex_unlock(&mlx5_dev_ctx_list_mutex);
101917e19bc4SViacheslav Ovsiienko 	return sh;
102017e19bc4SViacheslav Ovsiienko error:
1021d133f4cdSViacheslav Ovsiienko 	pthread_mutex_destroy(&sh->txpp.mutex);
102291389890SOphir Munk 	pthread_mutex_unlock(&mlx5_dev_ctx_list_mutex);
10238e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(sh);
1024a0bfe9d5SViacheslav Ovsiienko 	if (sh->cnt_id_tbl)
1025632f0f19SSuanming Mou 		mlx5_l3t_destroy(sh->cnt_id_tbl);
1026ae18a1aeSOri Kam 	if (sh->tis)
1027ae18a1aeSOri Kam 		claim_zero(mlx5_devx_cmd_destroy(sh->tis));
1028ae18a1aeSOri Kam 	if (sh->td)
1029ae18a1aeSOri Kam 		claim_zero(mlx5_devx_cmd_destroy(sh->td));
103008d1838fSDekel Peled 	if (sh->devx_rx_uar)
103108d1838fSDekel Peled 		mlx5_glue->devx_free_uar(sh->devx_rx_uar);
1032a0bfe9d5SViacheslav Ovsiienko 	if (sh->tx_uar)
1033a0bfe9d5SViacheslav Ovsiienko 		mlx5_glue->devx_free_uar(sh->tx_uar);
103417e19bc4SViacheslav Ovsiienko 	if (sh->pd)
1035*1cb210abSOphir Munk 		claim_zero(mlx5_os_dealloc_pd(sh->pd));
103617e19bc4SViacheslav Ovsiienko 	if (sh->ctx)
103717e19bc4SViacheslav Ovsiienko 		claim_zero(mlx5_glue->close_device(sh->ctx));
10382175c4dcSSuanming Mou 	mlx5_free(sh);
10398e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(err > 0);
104017e19bc4SViacheslav Ovsiienko 	rte_errno = err;
104117e19bc4SViacheslav Ovsiienko 	return NULL;
104217e19bc4SViacheslav Ovsiienko }
104317e19bc4SViacheslav Ovsiienko 
104417e19bc4SViacheslav Ovsiienko /**
104517e19bc4SViacheslav Ovsiienko  * Free shared IB device context. Decrement counter and if zero free
104617e19bc4SViacheslav Ovsiienko  * all allocated resources and close handles.
104717e19bc4SViacheslav Ovsiienko  *
104817e19bc4SViacheslav Ovsiienko  * @param[in] sh
10496e88bc42SOphir Munk  *   Pointer to mlx5_dev_ctx_shared object to free
105017e19bc4SViacheslav Ovsiienko  */
10512eb4d010SOphir Munk void
105291389890SOphir Munk mlx5_free_shared_dev_ctx(struct mlx5_dev_ctx_shared *sh)
105317e19bc4SViacheslav Ovsiienko {
105491389890SOphir Munk 	pthread_mutex_lock(&mlx5_dev_ctx_list_mutex);
10550afacb04SAlexander Kozyrev #ifdef RTE_LIBRTE_MLX5_DEBUG
105617e19bc4SViacheslav Ovsiienko 	/* Check the object presence in the list. */
10576e88bc42SOphir Munk 	struct mlx5_dev_ctx_shared *lctx;
105817e19bc4SViacheslav Ovsiienko 
105991389890SOphir Munk 	LIST_FOREACH(lctx, &mlx5_dev_ctx_list, next)
106017e19bc4SViacheslav Ovsiienko 		if (lctx == sh)
106117e19bc4SViacheslav Ovsiienko 			break;
10628e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(lctx);
106317e19bc4SViacheslav Ovsiienko 	if (lctx != sh) {
106417e19bc4SViacheslav Ovsiienko 		DRV_LOG(ERR, "Freeing non-existing shared IB context");
106517e19bc4SViacheslav Ovsiienko 		goto exit;
106617e19bc4SViacheslav Ovsiienko 	}
106717e19bc4SViacheslav Ovsiienko #endif
10688e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(sh);
10698e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(sh->refcnt);
107017e19bc4SViacheslav Ovsiienko 	/* Secondary process should not free the shared context. */
10718e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(rte_eal_process_type() == RTE_PROC_PRIMARY);
107217e19bc4SViacheslav Ovsiienko 	if (--sh->refcnt)
107317e19bc4SViacheslav Ovsiienko 		goto exit;
10740e3d0525SViacheslav Ovsiienko 	/* Remove from memory callback device list. */
10750e3d0525SViacheslav Ovsiienko 	rte_rwlock_write_lock(&mlx5_shared_data->mem_event_rwlock);
10760e3d0525SViacheslav Ovsiienko 	LIST_REMOVE(sh, mem_event_cb);
10770e3d0525SViacheslav Ovsiienko 	rte_rwlock_write_unlock(&mlx5_shared_data->mem_event_rwlock);
10784f8e6befSMichael Baum 	/* Release created Memory Regions. */
1079b8dc6b0eSVu Pham 	mlx5_mr_release_cache(&sh->share_cache);
10800e3d0525SViacheslav Ovsiienko 	/* Remove context from the global device list. */
108117e19bc4SViacheslav Ovsiienko 	LIST_REMOVE(sh, next);
1082f4a08731SMichael Baum 	pthread_mutex_unlock(&mlx5_dev_ctx_list_mutex);
108353e5a82fSViacheslav Ovsiienko 	/*
108453e5a82fSViacheslav Ovsiienko 	 *  Ensure there is no async event handler installed.
108553e5a82fSViacheslav Ovsiienko 	 *  Only primary process handles async device events.
108653e5a82fSViacheslav Ovsiienko 	 **/
10875382d28cSMatan Azrad 	mlx5_flow_counters_mng_close(sh);
1088f935ed4bSDekel Peled 	if (sh->aso_age_mng) {
1089f935ed4bSDekel Peled 		mlx5_flow_aso_age_mng_close(sh);
1090f935ed4bSDekel Peled 		sh->aso_age_mng = NULL;
1091f935ed4bSDekel Peled 	}
1092014d1cbeSSuanming Mou 	mlx5_flow_ipool_destroy(sh);
10932eb4d010SOphir Munk 	mlx5_os_dev_shared_handler_uninstall(sh);
1094632f0f19SSuanming Mou 	if (sh->cnt_id_tbl) {
1095632f0f19SSuanming Mou 		mlx5_l3t_destroy(sh->cnt_id_tbl);
1096632f0f19SSuanming Mou 		sh->cnt_id_tbl = NULL;
1097632f0f19SSuanming Mou 	}
1098fc4d4f73SViacheslav Ovsiienko 	if (sh->tx_uar) {
1099fc4d4f73SViacheslav Ovsiienko 		mlx5_glue->devx_free_uar(sh->tx_uar);
1100fc4d4f73SViacheslav Ovsiienko 		sh->tx_uar = NULL;
1101fc4d4f73SViacheslav Ovsiienko 	}
110217e19bc4SViacheslav Ovsiienko 	if (sh->pd)
1103*1cb210abSOphir Munk 		claim_zero(mlx5_os_dealloc_pd(sh->pd));
1104ae18a1aeSOri Kam 	if (sh->tis)
1105ae18a1aeSOri Kam 		claim_zero(mlx5_devx_cmd_destroy(sh->tis));
1106ae18a1aeSOri Kam 	if (sh->td)
1107ae18a1aeSOri Kam 		claim_zero(mlx5_devx_cmd_destroy(sh->td));
110808d1838fSDekel Peled 	if (sh->devx_rx_uar)
110908d1838fSDekel Peled 		mlx5_glue->devx_free_uar(sh->devx_rx_uar);
111017e19bc4SViacheslav Ovsiienko 	if (sh->ctx)
111117e19bc4SViacheslav Ovsiienko 		claim_zero(mlx5_glue->close_device(sh->ctx));
1112d133f4cdSViacheslav Ovsiienko 	pthread_mutex_destroy(&sh->txpp.mutex);
11132175c4dcSSuanming Mou 	mlx5_free(sh);
1114f4a08731SMichael Baum 	return;
111517e19bc4SViacheslav Ovsiienko exit:
111691389890SOphir Munk 	pthread_mutex_unlock(&mlx5_dev_ctx_list_mutex);
111717e19bc4SViacheslav Ovsiienko }
111817e19bc4SViacheslav Ovsiienko 
1119771fa900SAdrien Mazarguil /**
1120afd7a625SXueming Li  * Destroy table hash list.
112154534725SMatan Azrad  *
112254534725SMatan Azrad  * @param[in] priv
112354534725SMatan Azrad  *   Pointer to the private device data structure.
112454534725SMatan Azrad  */
11252eb4d010SOphir Munk void
112654534725SMatan Azrad mlx5_free_table_hash_list(struct mlx5_priv *priv)
112754534725SMatan Azrad {
11286e88bc42SOphir Munk 	struct mlx5_dev_ctx_shared *sh = priv->sh;
112954534725SMatan Azrad 
113054534725SMatan Azrad 	if (!sh->flow_tbls)
113154534725SMatan Azrad 		return;
1132e69a5922SXueming Li 	mlx5_hlist_destroy(sh->flow_tbls);
113354534725SMatan Azrad }
113454534725SMatan Azrad 
113554534725SMatan Azrad /**
113654534725SMatan Azrad  * Initialize flow table hash list and create the root tables entry
113754534725SMatan Azrad  * for each domain.
113854534725SMatan Azrad  *
113954534725SMatan Azrad  * @param[in] priv
114054534725SMatan Azrad  *   Pointer to the private device data structure.
114154534725SMatan Azrad  *
114254534725SMatan Azrad  * @return
114354534725SMatan Azrad  *   Zero on success, positive error code otherwise.
114454534725SMatan Azrad  */
11452eb4d010SOphir Munk int
1146afd7a625SXueming Li mlx5_alloc_table_hash_list(struct mlx5_priv *priv __rte_unused)
114754534725SMatan Azrad {
1148afd7a625SXueming Li 	int err = 0;
1149afd7a625SXueming Li 	/* Tables are only used in DV and DR modes. */
1150afd7a625SXueming Li #ifdef HAVE_IBV_FLOW_DV_SUPPORT
11516e88bc42SOphir Munk 	struct mlx5_dev_ctx_shared *sh = priv->sh;
115254534725SMatan Azrad 	char s[MLX5_HLIST_NAMESIZE];
115354534725SMatan Azrad 
11548e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(sh);
115554534725SMatan Azrad 	snprintf(s, sizeof(s), "%s_flow_table", priv->sh->ibdev_name);
1156e69a5922SXueming Li 	sh->flow_tbls = mlx5_hlist_create(s, MLX5_FLOW_TABLE_HLIST_ARRAY_SIZE,
1157f5b0aed2SSuanming Mou 					  0, 0, flow_dv_tbl_create_cb,
1158f5b0aed2SSuanming Mou 					  flow_dv_tbl_match_cb,
1159afd7a625SXueming Li 					  flow_dv_tbl_remove_cb);
116054534725SMatan Azrad 	if (!sh->flow_tbls) {
116163783b01SDavid Marchand 		DRV_LOG(ERR, "flow tables with hash creation failed.");
116254534725SMatan Azrad 		err = ENOMEM;
116354534725SMatan Azrad 		return err;
116454534725SMatan Azrad 	}
1165afd7a625SXueming Li 	sh->flow_tbls->ctx = sh;
116654534725SMatan Azrad #ifndef HAVE_MLX5DV_DR
1167afd7a625SXueming Li 	struct rte_flow_error error;
1168afd7a625SXueming Li 	struct rte_eth_dev *dev = &rte_eth_devices[priv->dev_data->port_id];
1169afd7a625SXueming Li 
117054534725SMatan Azrad 	/*
117154534725SMatan Azrad 	 * In case we have not DR support, the zero tables should be created
117254534725SMatan Azrad 	 * because DV expect to see them even if they cannot be created by
117354534725SMatan Azrad 	 * RDMA-CORE.
117454534725SMatan Azrad 	 */
1175afd7a625SXueming Li 	if (!flow_dv_tbl_resource_get(dev, 0, 0, 0, 0, NULL, 0, 1, &error) ||
1176afd7a625SXueming Li 	    !flow_dv_tbl_resource_get(dev, 0, 1, 0, 0, NULL, 0, 1, &error) ||
1177afd7a625SXueming Li 	    !flow_dv_tbl_resource_get(dev, 0, 0, 1, 0, NULL, 0, 1, &error)) {
117854534725SMatan Azrad 		err = ENOMEM;
117954534725SMatan Azrad 		goto error;
118054534725SMatan Azrad 	}
118154534725SMatan Azrad 	return err;
118254534725SMatan Azrad error:
118354534725SMatan Azrad 	mlx5_free_table_hash_list(priv);
118454534725SMatan Azrad #endif /* HAVE_MLX5DV_DR */
1185afd7a625SXueming Li #endif
118654534725SMatan Azrad 	return err;
118754534725SMatan Azrad }
118854534725SMatan Azrad 
118954534725SMatan Azrad /**
11904d803a72SOlga Shern  * Retrieve integer value from environment variable.
11914d803a72SOlga Shern  *
11924d803a72SOlga Shern  * @param[in] name
11934d803a72SOlga Shern  *   Environment variable name.
11944d803a72SOlga Shern  *
11954d803a72SOlga Shern  * @return
11964d803a72SOlga Shern  *   Integer value, 0 if the variable is not set.
11974d803a72SOlga Shern  */
11984d803a72SOlga Shern int
11994d803a72SOlga Shern mlx5_getenv_int(const char *name)
12004d803a72SOlga Shern {
12014d803a72SOlga Shern 	const char *val = getenv(name);
12024d803a72SOlga Shern 
12034d803a72SOlga Shern 	if (val == NULL)
12044d803a72SOlga Shern 		return 0;
12054d803a72SOlga Shern 	return atoi(val);
12064d803a72SOlga Shern }
12074d803a72SOlga Shern 
12084d803a72SOlga Shern /**
1209c9ba7523SRaslan Darawsheh  * DPDK callback to add udp tunnel port
1210c9ba7523SRaslan Darawsheh  *
1211c9ba7523SRaslan Darawsheh  * @param[in] dev
1212c9ba7523SRaslan Darawsheh  *   A pointer to eth_dev
1213c9ba7523SRaslan Darawsheh  * @param[in] udp_tunnel
1214c9ba7523SRaslan Darawsheh  *   A pointer to udp tunnel
1215c9ba7523SRaslan Darawsheh  *
1216c9ba7523SRaslan Darawsheh  * @return
1217c9ba7523SRaslan Darawsheh  *   0 on valid udp ports and tunnels, -ENOTSUP otherwise.
1218c9ba7523SRaslan Darawsheh  */
1219c9ba7523SRaslan Darawsheh int
1220c9ba7523SRaslan Darawsheh mlx5_udp_tunnel_port_add(struct rte_eth_dev *dev __rte_unused,
1221c9ba7523SRaslan Darawsheh 			 struct rte_eth_udp_tunnel *udp_tunnel)
1222c9ba7523SRaslan Darawsheh {
12238e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(udp_tunnel != NULL);
1224c9ba7523SRaslan Darawsheh 	if (udp_tunnel->prot_type == RTE_TUNNEL_TYPE_VXLAN &&
1225c9ba7523SRaslan Darawsheh 	    udp_tunnel->udp_port == 4789)
1226c9ba7523SRaslan Darawsheh 		return 0;
1227c9ba7523SRaslan Darawsheh 	if (udp_tunnel->prot_type == RTE_TUNNEL_TYPE_VXLAN_GPE &&
1228c9ba7523SRaslan Darawsheh 	    udp_tunnel->udp_port == 4790)
1229c9ba7523SRaslan Darawsheh 		return 0;
1230c9ba7523SRaslan Darawsheh 	return -ENOTSUP;
1231c9ba7523SRaslan Darawsheh }
1232c9ba7523SRaslan Darawsheh 
1233c9ba7523SRaslan Darawsheh /**
1234120dc4a7SYongseok Koh  * Initialize process private data structure.
1235120dc4a7SYongseok Koh  *
1236120dc4a7SYongseok Koh  * @param dev
1237120dc4a7SYongseok Koh  *   Pointer to Ethernet device structure.
1238120dc4a7SYongseok Koh  *
1239120dc4a7SYongseok Koh  * @return
1240120dc4a7SYongseok Koh  *   0 on success, a negative errno value otherwise and rte_errno is set.
1241120dc4a7SYongseok Koh  */
1242120dc4a7SYongseok Koh int
1243120dc4a7SYongseok Koh mlx5_proc_priv_init(struct rte_eth_dev *dev)
1244120dc4a7SYongseok Koh {
1245120dc4a7SYongseok Koh 	struct mlx5_priv *priv = dev->data->dev_private;
1246120dc4a7SYongseok Koh 	struct mlx5_proc_priv *ppriv;
1247120dc4a7SYongseok Koh 	size_t ppriv_size;
1248120dc4a7SYongseok Koh 
1249120dc4a7SYongseok Koh 	/*
1250120dc4a7SYongseok Koh 	 * UAR register table follows the process private structure. BlueFlame
1251120dc4a7SYongseok Koh 	 * registers for Tx queues are stored in the table.
1252120dc4a7SYongseok Koh 	 */
1253120dc4a7SYongseok Koh 	ppriv_size =
1254120dc4a7SYongseok Koh 		sizeof(struct mlx5_proc_priv) + priv->txqs_n * sizeof(void *);
12552175c4dcSSuanming Mou 	ppriv = mlx5_malloc(MLX5_MEM_RTE, ppriv_size, RTE_CACHE_LINE_SIZE,
12562175c4dcSSuanming Mou 			    dev->device->numa_node);
1257120dc4a7SYongseok Koh 	if (!ppriv) {
1258120dc4a7SYongseok Koh 		rte_errno = ENOMEM;
1259120dc4a7SYongseok Koh 		return -rte_errno;
1260120dc4a7SYongseok Koh 	}
1261120dc4a7SYongseok Koh 	ppriv->uar_table_sz = ppriv_size;
1262120dc4a7SYongseok Koh 	dev->process_private = ppriv;
1263120dc4a7SYongseok Koh 	return 0;
1264120dc4a7SYongseok Koh }
1265120dc4a7SYongseok Koh 
1266120dc4a7SYongseok Koh /**
1267120dc4a7SYongseok Koh  * Un-initialize process private data structure.
1268120dc4a7SYongseok Koh  *
1269120dc4a7SYongseok Koh  * @param dev
1270120dc4a7SYongseok Koh  *   Pointer to Ethernet device structure.
1271120dc4a7SYongseok Koh  */
1272120dc4a7SYongseok Koh static void
1273120dc4a7SYongseok Koh mlx5_proc_priv_uninit(struct rte_eth_dev *dev)
1274120dc4a7SYongseok Koh {
1275120dc4a7SYongseok Koh 	if (!dev->process_private)
1276120dc4a7SYongseok Koh 		return;
12772175c4dcSSuanming Mou 	mlx5_free(dev->process_private);
1278120dc4a7SYongseok Koh 	dev->process_private = NULL;
1279120dc4a7SYongseok Koh }
1280120dc4a7SYongseok Koh 
1281120dc4a7SYongseok Koh /**
1282771fa900SAdrien Mazarguil  * DPDK callback to close the device.
1283771fa900SAdrien Mazarguil  *
1284771fa900SAdrien Mazarguil  * Destroy all queues and objects, free memory.
1285771fa900SAdrien Mazarguil  *
1286771fa900SAdrien Mazarguil  * @param dev
1287771fa900SAdrien Mazarguil  *   Pointer to Ethernet device structure.
1288771fa900SAdrien Mazarguil  */
1289b142387bSThomas Monjalon int
1290771fa900SAdrien Mazarguil mlx5_dev_close(struct rte_eth_dev *dev)
1291771fa900SAdrien Mazarguil {
1292dbeba4cfSThomas Monjalon 	struct mlx5_priv *priv = dev->data->dev_private;
12932e22920bSAdrien Mazarguil 	unsigned int i;
12946af6b973SNélio Laranjeiro 	int ret;
1295771fa900SAdrien Mazarguil 
12962786b7bfSSuanming Mou 	if (rte_eal_process_type() == RTE_PROC_SECONDARY) {
12972786b7bfSSuanming Mou 		/* Check if process_private released. */
12982786b7bfSSuanming Mou 		if (!dev->process_private)
1299b142387bSThomas Monjalon 			return 0;
13002786b7bfSSuanming Mou 		mlx5_tx_uar_uninit_secondary(dev);
13012786b7bfSSuanming Mou 		mlx5_proc_priv_uninit(dev);
13022786b7bfSSuanming Mou 		rte_eth_dev_release_port(dev);
1303b142387bSThomas Monjalon 		return 0;
13042786b7bfSSuanming Mou 	}
13052786b7bfSSuanming Mou 	if (!priv->sh)
1306b142387bSThomas Monjalon 		return 0;
1307a170a30dSNélio Laranjeiro 	DRV_LOG(DEBUG, "port %u closing device \"%s\"",
13080f99970bSNélio Laranjeiro 		dev->data->port_id,
1309f44b09f9SOphir Munk 		((priv->sh->ctx != NULL) ?
1310f44b09f9SOphir Munk 		mlx5_os_get_ctx_device_name(priv->sh->ctx) : ""));
13118db7e3b6SBing Zhao 	/*
13128db7e3b6SBing Zhao 	 * If default mreg copy action is removed at the stop stage,
13138db7e3b6SBing Zhao 	 * the search will return none and nothing will be done anymore.
13148db7e3b6SBing Zhao 	 */
13158db7e3b6SBing Zhao 	mlx5_flow_stop_default(dev);
1316af4f09f2SNélio Laranjeiro 	mlx5_traffic_disable(dev);
13178db7e3b6SBing Zhao 	/*
13188db7e3b6SBing Zhao 	 * If all the flows are already flushed in the device stop stage,
13198db7e3b6SBing Zhao 	 * then this will return directly without any action.
13208db7e3b6SBing Zhao 	 */
13218db7e3b6SBing Zhao 	mlx5_flow_list_flush(dev, &priv->flows, true);
1322d7cfcdddSAndrey Vesnovaty 	mlx5_shared_action_flush(dev);
132302e76468SSuanming Mou 	mlx5_flow_meter_flush(dev, NULL);
13242e22920bSAdrien Mazarguil 	/* Prevent crashes when queues are still in use. */
13252e22920bSAdrien Mazarguil 	dev->rx_pkt_burst = removed_rx_burst;
13262e22920bSAdrien Mazarguil 	dev->tx_pkt_burst = removed_tx_burst;
13272aac5b5dSYongseok Koh 	rte_wmb();
13282aac5b5dSYongseok Koh 	/* Disable datapath on secondary process. */
13292e86c4e5SOphir Munk 	mlx5_mp_os_req_stop_rxtx(dev);
13301c506404SBing Zhao 	/* Free the eCPRI flex parser resource. */
13311c506404SBing Zhao 	mlx5_flex_parser_ecpri_release(dev);
13322e22920bSAdrien Mazarguil 	if (priv->rxqs != NULL) {
13332e22920bSAdrien Mazarguil 		/* XXX race condition if mlx5_rx_burst() is still running. */
133420698c9fSOphir Munk 		rte_delay_us_sleep(1000);
1335a1366b1aSNélio Laranjeiro 		for (i = 0; (i != priv->rxqs_n); ++i)
1336af4f09f2SNélio Laranjeiro 			mlx5_rxq_release(dev, i);
13372e22920bSAdrien Mazarguil 		priv->rxqs_n = 0;
13382e22920bSAdrien Mazarguil 		priv->rxqs = NULL;
13392e22920bSAdrien Mazarguil 	}
13402e22920bSAdrien Mazarguil 	if (priv->txqs != NULL) {
13412e22920bSAdrien Mazarguil 		/* XXX race condition if mlx5_tx_burst() is still running. */
134220698c9fSOphir Munk 		rte_delay_us_sleep(1000);
13436e78005aSNélio Laranjeiro 		for (i = 0; (i != priv->txqs_n); ++i)
1344af4f09f2SNélio Laranjeiro 			mlx5_txq_release(dev, i);
13452e22920bSAdrien Mazarguil 		priv->txqs_n = 0;
13462e22920bSAdrien Mazarguil 		priv->txqs = NULL;
13472e22920bSAdrien Mazarguil 	}
1348120dc4a7SYongseok Koh 	mlx5_proc_priv_uninit(dev);
134965b3cd0dSSuanming Mou 	if (priv->drop_queue.hrxq)
135065b3cd0dSSuanming Mou 		mlx5_drop_action_destroy(dev);
1351dd3c774fSViacheslav Ovsiienko 	if (priv->mreg_cp_tbl)
1352e69a5922SXueming Li 		mlx5_hlist_destroy(priv->mreg_cp_tbl);
13537d6bf6b8SYongseok Koh 	mlx5_mprq_free_mp(dev);
13542eb4d010SOphir Munk 	mlx5_os_free_shared_dr(priv);
135529c1d8bbSNélio Laranjeiro 	if (priv->rss_conf.rss_key != NULL)
135683c2047cSSuanming Mou 		mlx5_free(priv->rss_conf.rss_key);
1357634efbc2SNelio Laranjeiro 	if (priv->reta_idx != NULL)
135883c2047cSSuanming Mou 		mlx5_free(priv->reta_idx);
1359ccdcba53SNélio Laranjeiro 	if (priv->config.vf)
1360f00f6562SOphir Munk 		mlx5_os_mac_addr_flush(dev);
136126c08b97SAdrien Mazarguil 	if (priv->nl_socket_route >= 0)
136226c08b97SAdrien Mazarguil 		close(priv->nl_socket_route);
136326c08b97SAdrien Mazarguil 	if (priv->nl_socket_rdma >= 0)
136426c08b97SAdrien Mazarguil 		close(priv->nl_socket_rdma);
1365dfedf3e3SViacheslav Ovsiienko 	if (priv->vmwa_context)
1366dfedf3e3SViacheslav Ovsiienko 		mlx5_vlan_vmwa_exit(priv->vmwa_context);
136723820a79SDekel Peled 	ret = mlx5_hrxq_verify(dev);
1368f5479b68SNélio Laranjeiro 	if (ret)
1369a170a30dSNélio Laranjeiro 		DRV_LOG(WARNING, "port %u some hash Rx queue still remain",
13700f99970bSNélio Laranjeiro 			dev->data->port_id);
137115c80a12SDekel Peled 	ret = mlx5_ind_table_obj_verify(dev);
13724c7a0f5fSNélio Laranjeiro 	if (ret)
1373a170a30dSNélio Laranjeiro 		DRV_LOG(WARNING, "port %u some indirection table still remain",
13740f99970bSNélio Laranjeiro 			dev->data->port_id);
137593403560SDekel Peled 	ret = mlx5_rxq_obj_verify(dev);
137609cb5b58SNélio Laranjeiro 	if (ret)
137793403560SDekel Peled 		DRV_LOG(WARNING, "port %u some Rx queue objects still remain",
13780f99970bSNélio Laranjeiro 			dev->data->port_id);
1379af4f09f2SNélio Laranjeiro 	ret = mlx5_rxq_verify(dev);
1380a1366b1aSNélio Laranjeiro 	if (ret)
1381a170a30dSNélio Laranjeiro 		DRV_LOG(WARNING, "port %u some Rx queues still remain",
13820f99970bSNélio Laranjeiro 			dev->data->port_id);
1383894c4a8eSOri Kam 	ret = mlx5_txq_obj_verify(dev);
1384faf2667fSNélio Laranjeiro 	if (ret)
1385a170a30dSNélio Laranjeiro 		DRV_LOG(WARNING, "port %u some Verbs Tx queue still remain",
13860f99970bSNélio Laranjeiro 			dev->data->port_id);
1387af4f09f2SNélio Laranjeiro 	ret = mlx5_txq_verify(dev);
13886e78005aSNélio Laranjeiro 	if (ret)
1389a170a30dSNélio Laranjeiro 		DRV_LOG(WARNING, "port %u some Tx queues still remain",
13900f99970bSNélio Laranjeiro 			dev->data->port_id);
1391af4f09f2SNélio Laranjeiro 	ret = mlx5_flow_verify(dev);
13926af6b973SNélio Laranjeiro 	if (ret)
1393a170a30dSNélio Laranjeiro 		DRV_LOG(WARNING, "port %u some flows still remain",
1394a170a30dSNélio Laranjeiro 			dev->data->port_id);
1395e1592b6cSSuanming Mou 	mlx5_cache_list_destroy(&priv->hrxqs);
1396772dc0ebSSuanming Mou 	/*
1397772dc0ebSSuanming Mou 	 * Free the shared context in last turn, because the cleanup
1398772dc0ebSSuanming Mou 	 * routines above may use some shared fields, like
1399f00f6562SOphir Munk 	 * mlx5_os_mac_addr_flush() uses ibdev_path for retrieveing
1400772dc0ebSSuanming Mou 	 * ifindex if Netlink fails.
1401772dc0ebSSuanming Mou 	 */
140291389890SOphir Munk 	mlx5_free_shared_dev_ctx(priv->sh);
14032b730263SAdrien Mazarguil 	if (priv->domain_id != RTE_ETH_DEV_SWITCH_DOMAIN_ID_INVALID) {
14042b730263SAdrien Mazarguil 		unsigned int c = 0;
1405d874a4eeSThomas Monjalon 		uint16_t port_id;
14062b730263SAdrien Mazarguil 
1407fbc83412SViacheslav Ovsiienko 		MLX5_ETH_FOREACH_DEV(port_id, priv->pci_dev) {
1408dbeba4cfSThomas Monjalon 			struct mlx5_priv *opriv =
1409d874a4eeSThomas Monjalon 				rte_eth_devices[port_id].data->dev_private;
14102b730263SAdrien Mazarguil 
14112b730263SAdrien Mazarguil 			if (!opriv ||
14122b730263SAdrien Mazarguil 			    opriv->domain_id != priv->domain_id ||
1413d874a4eeSThomas Monjalon 			    &rte_eth_devices[port_id] == dev)
14142b730263SAdrien Mazarguil 				continue;
14152b730263SAdrien Mazarguil 			++c;
1416f7e95215SViacheslav Ovsiienko 			break;
14172b730263SAdrien Mazarguil 		}
14182b730263SAdrien Mazarguil 		if (!c)
14192b730263SAdrien Mazarguil 			claim_zero(rte_eth_switch_domain_free(priv->domain_id));
14202b730263SAdrien Mazarguil 	}
1421771fa900SAdrien Mazarguil 	memset(priv, 0, sizeof(*priv));
14222b730263SAdrien Mazarguil 	priv->domain_id = RTE_ETH_DEV_SWITCH_DOMAIN_ID_INVALID;
142342603bbdSOphir Munk 	/*
142442603bbdSOphir Munk 	 * Reset mac_addrs to NULL such that it is not freed as part of
142542603bbdSOphir Munk 	 * rte_eth_dev_release_port(). mac_addrs is part of dev_private so
142642603bbdSOphir Munk 	 * it is freed when dev_private is freed.
142742603bbdSOphir Munk 	 */
142842603bbdSOphir Munk 	dev->data->mac_addrs = NULL;
1429b142387bSThomas Monjalon 	return 0;
1430771fa900SAdrien Mazarguil }
1431771fa900SAdrien Mazarguil 
1432e72dd09bSNélio Laranjeiro /**
1433e72dd09bSNélio Laranjeiro  * Verify and store value for device argument.
1434e72dd09bSNélio Laranjeiro  *
1435e72dd09bSNélio Laranjeiro  * @param[in] key
1436e72dd09bSNélio Laranjeiro  *   Key argument to verify.
1437e72dd09bSNélio Laranjeiro  * @param[in] val
1438e72dd09bSNélio Laranjeiro  *   Value associated with key.
1439e72dd09bSNélio Laranjeiro  * @param opaque
1440e72dd09bSNélio Laranjeiro  *   User data.
1441e72dd09bSNélio Laranjeiro  *
1442e72dd09bSNélio Laranjeiro  * @return
1443a6d83b6aSNélio Laranjeiro  *   0 on success, a negative errno value otherwise and rte_errno is set.
1444e72dd09bSNélio Laranjeiro  */
1445e72dd09bSNélio Laranjeiro static int
1446e72dd09bSNélio Laranjeiro mlx5_args_check(const char *key, const char *val, void *opaque)
1447e72dd09bSNélio Laranjeiro {
14487fe24446SShahaf Shuler 	struct mlx5_dev_config *config = opaque;
14498f848f32SViacheslav Ovsiienko 	unsigned long mod;
14508f848f32SViacheslav Ovsiienko 	signed long tmp;
1451e72dd09bSNélio Laranjeiro 
14526de569f5SAdrien Mazarguil 	/* No-op, port representors are processed in mlx5_dev_spawn(). */
14536de569f5SAdrien Mazarguil 	if (!strcmp(MLX5_REPRESENTOR, key))
14546de569f5SAdrien Mazarguil 		return 0;
145599c12dccSNélio Laranjeiro 	errno = 0;
14568f848f32SViacheslav Ovsiienko 	tmp = strtol(val, NULL, 0);
145799c12dccSNélio Laranjeiro 	if (errno) {
1458a6d83b6aSNélio Laranjeiro 		rte_errno = errno;
1459a170a30dSNélio Laranjeiro 		DRV_LOG(WARNING, "%s: \"%s\" is not a valid integer", key, val);
1460a6d83b6aSNélio Laranjeiro 		return -rte_errno;
146199c12dccSNélio Laranjeiro 	}
14628f848f32SViacheslav Ovsiienko 	if (tmp < 0 && strcmp(MLX5_TX_PP, key) && strcmp(MLX5_TX_SKEW, key)) {
14638f848f32SViacheslav Ovsiienko 		/* Negative values are acceptable for some keys only. */
14648f848f32SViacheslav Ovsiienko 		rte_errno = EINVAL;
14658f848f32SViacheslav Ovsiienko 		DRV_LOG(WARNING, "%s: invalid negative value \"%s\"", key, val);
14668f848f32SViacheslav Ovsiienko 		return -rte_errno;
14678f848f32SViacheslav Ovsiienko 	}
14688f848f32SViacheslav Ovsiienko 	mod = tmp >= 0 ? tmp : -tmp;
146999c12dccSNélio Laranjeiro 	if (strcmp(MLX5_RXQ_CQE_COMP_EN, key) == 0) {
147054c2d46bSAlexander Kozyrev 		if (tmp > MLX5_CQE_RESP_FORMAT_L34H_STRIDX) {
147154c2d46bSAlexander Kozyrev 			DRV_LOG(ERR, "invalid CQE compression "
147254c2d46bSAlexander Kozyrev 				     "format parameter");
147354c2d46bSAlexander Kozyrev 			rte_errno = EINVAL;
147454c2d46bSAlexander Kozyrev 			return -rte_errno;
147554c2d46bSAlexander Kozyrev 		}
14767fe24446SShahaf Shuler 		config->cqe_comp = !!tmp;
147754c2d46bSAlexander Kozyrev 		config->cqe_comp_fmt = tmp;
1478bc91e8dbSYongseok Koh 	} else if (strcmp(MLX5_RXQ_CQE_PAD_EN, key) == 0) {
1479bc91e8dbSYongseok Koh 		config->cqe_pad = !!tmp;
148078c7a16dSYongseok Koh 	} else if (strcmp(MLX5_RXQ_PKT_PAD_EN, key) == 0) {
148178c7a16dSYongseok Koh 		config->hw_padding = !!tmp;
14827d6bf6b8SYongseok Koh 	} else if (strcmp(MLX5_RX_MPRQ_EN, key) == 0) {
14837d6bf6b8SYongseok Koh 		config->mprq.enabled = !!tmp;
14847d6bf6b8SYongseok Koh 	} else if (strcmp(MLX5_RX_MPRQ_LOG_STRIDE_NUM, key) == 0) {
14857d6bf6b8SYongseok Koh 		config->mprq.stride_num_n = tmp;
1486ecb16045SAlexander Kozyrev 	} else if (strcmp(MLX5_RX_MPRQ_LOG_STRIDE_SIZE, key) == 0) {
1487ecb16045SAlexander Kozyrev 		config->mprq.stride_size_n = tmp;
14887d6bf6b8SYongseok Koh 	} else if (strcmp(MLX5_RX_MPRQ_MAX_MEMCPY_LEN, key) == 0) {
14897d6bf6b8SYongseok Koh 		config->mprq.max_memcpy_len = tmp;
14907d6bf6b8SYongseok Koh 	} else if (strcmp(MLX5_RXQS_MIN_MPRQ, key) == 0) {
14917d6bf6b8SYongseok Koh 		config->mprq.min_rxqs_num = tmp;
14922a66cf37SYaacov Hazan 	} else if (strcmp(MLX5_TXQ_INLINE, key) == 0) {
1493505f1fe4SViacheslav Ovsiienko 		DRV_LOG(WARNING, "%s: deprecated parameter,"
1494505f1fe4SViacheslav Ovsiienko 				 " converted to txq_inline_max", key);
1495505f1fe4SViacheslav Ovsiienko 		config->txq_inline_max = tmp;
1496505f1fe4SViacheslav Ovsiienko 	} else if (strcmp(MLX5_TXQ_INLINE_MAX, key) == 0) {
1497505f1fe4SViacheslav Ovsiienko 		config->txq_inline_max = tmp;
1498505f1fe4SViacheslav Ovsiienko 	} else if (strcmp(MLX5_TXQ_INLINE_MIN, key) == 0) {
1499505f1fe4SViacheslav Ovsiienko 		config->txq_inline_min = tmp;
1500505f1fe4SViacheslav Ovsiienko 	} else if (strcmp(MLX5_TXQ_INLINE_MPW, key) == 0) {
1501505f1fe4SViacheslav Ovsiienko 		config->txq_inline_mpw = tmp;
15022a66cf37SYaacov Hazan 	} else if (strcmp(MLX5_TXQS_MIN_INLINE, key) == 0) {
15037fe24446SShahaf Shuler 		config->txqs_inline = tmp;
150409d8b416SYongseok Koh 	} else if (strcmp(MLX5_TXQS_MAX_VEC, key) == 0) {
1505a6bd4911SViacheslav Ovsiienko 		DRV_LOG(WARNING, "%s: deprecated parameter, ignored", key);
1506230189d9SNélio Laranjeiro 	} else if (strcmp(MLX5_TXQ_MPW_EN, key) == 0) {
1507f9de8718SShahaf Shuler 		config->mps = !!tmp;
15088409a285SViacheslav Ovsiienko 	} else if (strcmp(MLX5_TX_DB_NC, key) == 0) {
1509f078ceb6SViacheslav Ovsiienko 		if (tmp != MLX5_TXDB_CACHED &&
1510f078ceb6SViacheslav Ovsiienko 		    tmp != MLX5_TXDB_NCACHED &&
1511f078ceb6SViacheslav Ovsiienko 		    tmp != MLX5_TXDB_HEURISTIC) {
1512f078ceb6SViacheslav Ovsiienko 			DRV_LOG(ERR, "invalid Tx doorbell "
1513f078ceb6SViacheslav Ovsiienko 				     "mapping parameter");
1514f078ceb6SViacheslav Ovsiienko 			rte_errno = EINVAL;
1515f078ceb6SViacheslav Ovsiienko 			return -rte_errno;
1516f078ceb6SViacheslav Ovsiienko 		}
1517f078ceb6SViacheslav Ovsiienko 		config->dbnc = tmp;
15186ce84bd8SYongseok Koh 	} else if (strcmp(MLX5_TXQ_MPW_HDR_DSEG_EN, key) == 0) {
1519a6bd4911SViacheslav Ovsiienko 		DRV_LOG(WARNING, "%s: deprecated parameter, ignored", key);
15206ce84bd8SYongseok Koh 	} else if (strcmp(MLX5_TXQ_MAX_INLINE_LEN, key) == 0) {
1521505f1fe4SViacheslav Ovsiienko 		DRV_LOG(WARNING, "%s: deprecated parameter,"
1522505f1fe4SViacheslav Ovsiienko 				 " converted to txq_inline_mpw", key);
1523505f1fe4SViacheslav Ovsiienko 		config->txq_inline_mpw = tmp;
15245644d5b9SNelio Laranjeiro 	} else if (strcmp(MLX5_TX_VEC_EN, key) == 0) {
1525a6bd4911SViacheslav Ovsiienko 		DRV_LOG(WARNING, "%s: deprecated parameter, ignored", key);
15268f848f32SViacheslav Ovsiienko 	} else if (strcmp(MLX5_TX_PP, key) == 0) {
15278f848f32SViacheslav Ovsiienko 		if (!mod) {
15288f848f32SViacheslav Ovsiienko 			DRV_LOG(ERR, "Zero Tx packet pacing parameter");
15298f848f32SViacheslav Ovsiienko 			rte_errno = EINVAL;
15308f848f32SViacheslav Ovsiienko 			return -rte_errno;
15318f848f32SViacheslav Ovsiienko 		}
15328f848f32SViacheslav Ovsiienko 		config->tx_pp = tmp;
15338f848f32SViacheslav Ovsiienko 	} else if (strcmp(MLX5_TX_SKEW, key) == 0) {
15348f848f32SViacheslav Ovsiienko 		config->tx_skew = tmp;
15355644d5b9SNelio Laranjeiro 	} else if (strcmp(MLX5_RX_VEC_EN, key) == 0) {
15367fe24446SShahaf Shuler 		config->rx_vec_en = !!tmp;
153778a54648SXueming Li 	} else if (strcmp(MLX5_L3_VXLAN_EN, key) == 0) {
153878a54648SXueming Li 		config->l3_vxlan_en = !!tmp;
1539db209cc3SNélio Laranjeiro 	} else if (strcmp(MLX5_VF_NL_EN, key) == 0) {
1540db209cc3SNélio Laranjeiro 		config->vf_nl_en = !!tmp;
1541e2b4925eSOri Kam 	} else if (strcmp(MLX5_DV_ESW_EN, key) == 0) {
1542e2b4925eSOri Kam 		config->dv_esw_en = !!tmp;
154351e72d38SOri Kam 	} else if (strcmp(MLX5_DV_FLOW_EN, key) == 0) {
154451e72d38SOri Kam 		config->dv_flow_en = !!tmp;
15452d241515SViacheslav Ovsiienko 	} else if (strcmp(MLX5_DV_XMETA_EN, key) == 0) {
15462d241515SViacheslav Ovsiienko 		if (tmp != MLX5_XMETA_MODE_LEGACY &&
15472d241515SViacheslav Ovsiienko 		    tmp != MLX5_XMETA_MODE_META16 &&
15484ec6360dSGregory Etelson 		    tmp != MLX5_XMETA_MODE_META32 &&
15494ec6360dSGregory Etelson 		    tmp != MLX5_XMETA_MODE_MISS_INFO) {
1550f078ceb6SViacheslav Ovsiienko 			DRV_LOG(ERR, "invalid extensive "
15512d241515SViacheslav Ovsiienko 				     "metadata parameter");
15522d241515SViacheslav Ovsiienko 			rte_errno = EINVAL;
15532d241515SViacheslav Ovsiienko 			return -rte_errno;
15542d241515SViacheslav Ovsiienko 		}
15554ec6360dSGregory Etelson 		if (tmp != MLX5_XMETA_MODE_MISS_INFO)
15562d241515SViacheslav Ovsiienko 			config->dv_xmeta_en = tmp;
15574ec6360dSGregory Etelson 		else
15584ec6360dSGregory Etelson 			config->dv_miss_info = 1;
15590f0ae73aSShiri Kuzin 	} else if (strcmp(MLX5_LACP_BY_USER, key) == 0) {
15600f0ae73aSShiri Kuzin 		config->lacp_by_user = !!tmp;
1561dceb5029SYongseok Koh 	} else if (strcmp(MLX5_MR_EXT_MEMSEG_EN, key) == 0) {
1562dceb5029SYongseok Koh 		config->mr_ext_memseg_en = !!tmp;
1563066cfecdSMatan Azrad 	} else if (strcmp(MLX5_MAX_DUMP_FILES_NUM, key) == 0) {
1564066cfecdSMatan Azrad 		config->max_dump_files_num = tmp;
156521bb6c7eSDekel Peled 	} else if (strcmp(MLX5_LRO_TIMEOUT_USEC, key) == 0) {
156621bb6c7eSDekel Peled 		config->lro.timeout = tmp;
1567d768f324SMatan Azrad 	} else if (strcmp(MLX5_CLASS_ARG_NAME, key) == 0) {
1568d768f324SMatan Azrad 		DRV_LOG(DEBUG, "class argument is %s.", val);
15691ad9a3d0SBing Zhao 	} else if (strcmp(MLX5_HP_BUF_SIZE, key) == 0) {
15701ad9a3d0SBing Zhao 		config->log_hp_size = tmp;
1571a1da6f62SSuanming Mou 	} else if (strcmp(MLX5_RECLAIM_MEM, key) == 0) {
1572a1da6f62SSuanming Mou 		if (tmp != MLX5_RCM_NONE &&
1573a1da6f62SSuanming Mou 		    tmp != MLX5_RCM_LIGHT &&
1574a1da6f62SSuanming Mou 		    tmp != MLX5_RCM_AGGR) {
1575a1da6f62SSuanming Mou 			DRV_LOG(ERR, "Unrecognize %s: \"%s\"", key, val);
1576a1da6f62SSuanming Mou 			rte_errno = EINVAL;
1577a1da6f62SSuanming Mou 			return -rte_errno;
1578a1da6f62SSuanming Mou 		}
1579a1da6f62SSuanming Mou 		config->reclaim_mode = tmp;
15805522da6bSSuanming Mou 	} else if (strcmp(MLX5_SYS_MEM_EN, key) == 0) {
15815522da6bSSuanming Mou 		config->sys_mem_en = !!tmp;
158250f95b23SSuanming Mou 	} else if (strcmp(MLX5_DECAP_EN, key) == 0) {
158350f95b23SSuanming Mou 		config->decap_en = !!tmp;
158499c12dccSNélio Laranjeiro 	} else {
1585a170a30dSNélio Laranjeiro 		DRV_LOG(WARNING, "%s: unknown parameter", key);
1586a6d83b6aSNélio Laranjeiro 		rte_errno = EINVAL;
1587a6d83b6aSNélio Laranjeiro 		return -rte_errno;
1588e72dd09bSNélio Laranjeiro 	}
158999c12dccSNélio Laranjeiro 	return 0;
159099c12dccSNélio Laranjeiro }
1591e72dd09bSNélio Laranjeiro 
1592e72dd09bSNélio Laranjeiro /**
1593e72dd09bSNélio Laranjeiro  * Parse device parameters.
1594e72dd09bSNélio Laranjeiro  *
15957fe24446SShahaf Shuler  * @param config
15967fe24446SShahaf Shuler  *   Pointer to device configuration structure.
1597e72dd09bSNélio Laranjeiro  * @param devargs
1598e72dd09bSNélio Laranjeiro  *   Device arguments structure.
1599e72dd09bSNélio Laranjeiro  *
1600e72dd09bSNélio Laranjeiro  * @return
1601a6d83b6aSNélio Laranjeiro  *   0 on success, a negative errno value otherwise and rte_errno is set.
1602e72dd09bSNélio Laranjeiro  */
16032eb4d010SOphir Munk int
16047fe24446SShahaf Shuler mlx5_args(struct mlx5_dev_config *config, struct rte_devargs *devargs)
1605e72dd09bSNélio Laranjeiro {
1606e72dd09bSNélio Laranjeiro 	const char **params = (const char *[]){
160799c12dccSNélio Laranjeiro 		MLX5_RXQ_CQE_COMP_EN,
1608bc91e8dbSYongseok Koh 		MLX5_RXQ_CQE_PAD_EN,
160978c7a16dSYongseok Koh 		MLX5_RXQ_PKT_PAD_EN,
16107d6bf6b8SYongseok Koh 		MLX5_RX_MPRQ_EN,
16117d6bf6b8SYongseok Koh 		MLX5_RX_MPRQ_LOG_STRIDE_NUM,
1612ecb16045SAlexander Kozyrev 		MLX5_RX_MPRQ_LOG_STRIDE_SIZE,
16137d6bf6b8SYongseok Koh 		MLX5_RX_MPRQ_MAX_MEMCPY_LEN,
16147d6bf6b8SYongseok Koh 		MLX5_RXQS_MIN_MPRQ,
16152a66cf37SYaacov Hazan 		MLX5_TXQ_INLINE,
1616505f1fe4SViacheslav Ovsiienko 		MLX5_TXQ_INLINE_MIN,
1617505f1fe4SViacheslav Ovsiienko 		MLX5_TXQ_INLINE_MAX,
1618505f1fe4SViacheslav Ovsiienko 		MLX5_TXQ_INLINE_MPW,
16192a66cf37SYaacov Hazan 		MLX5_TXQS_MIN_INLINE,
162009d8b416SYongseok Koh 		MLX5_TXQS_MAX_VEC,
1621230189d9SNélio Laranjeiro 		MLX5_TXQ_MPW_EN,
16226ce84bd8SYongseok Koh 		MLX5_TXQ_MPW_HDR_DSEG_EN,
16236ce84bd8SYongseok Koh 		MLX5_TXQ_MAX_INLINE_LEN,
16248409a285SViacheslav Ovsiienko 		MLX5_TX_DB_NC,
16258f848f32SViacheslav Ovsiienko 		MLX5_TX_PP,
16268f848f32SViacheslav Ovsiienko 		MLX5_TX_SKEW,
16275644d5b9SNelio Laranjeiro 		MLX5_TX_VEC_EN,
16285644d5b9SNelio Laranjeiro 		MLX5_RX_VEC_EN,
162978a54648SXueming Li 		MLX5_L3_VXLAN_EN,
1630db209cc3SNélio Laranjeiro 		MLX5_VF_NL_EN,
1631e2b4925eSOri Kam 		MLX5_DV_ESW_EN,
163251e72d38SOri Kam 		MLX5_DV_FLOW_EN,
16332d241515SViacheslav Ovsiienko 		MLX5_DV_XMETA_EN,
16340f0ae73aSShiri Kuzin 		MLX5_LACP_BY_USER,
1635dceb5029SYongseok Koh 		MLX5_MR_EXT_MEMSEG_EN,
16366de569f5SAdrien Mazarguil 		MLX5_REPRESENTOR,
1637066cfecdSMatan Azrad 		MLX5_MAX_DUMP_FILES_NUM,
163821bb6c7eSDekel Peled 		MLX5_LRO_TIMEOUT_USEC,
1639d768f324SMatan Azrad 		MLX5_CLASS_ARG_NAME,
16401ad9a3d0SBing Zhao 		MLX5_HP_BUF_SIZE,
1641a1da6f62SSuanming Mou 		MLX5_RECLAIM_MEM,
16425522da6bSSuanming Mou 		MLX5_SYS_MEM_EN,
164350f95b23SSuanming Mou 		MLX5_DECAP_EN,
1644e72dd09bSNélio Laranjeiro 		NULL,
1645e72dd09bSNélio Laranjeiro 	};
1646e72dd09bSNélio Laranjeiro 	struct rte_kvargs *kvlist;
1647e72dd09bSNélio Laranjeiro 	int ret = 0;
1648e72dd09bSNélio Laranjeiro 	int i;
1649e72dd09bSNélio Laranjeiro 
1650e72dd09bSNélio Laranjeiro 	if (devargs == NULL)
1651e72dd09bSNélio Laranjeiro 		return 0;
1652e72dd09bSNélio Laranjeiro 	/* Following UGLY cast is done to pass checkpatch. */
1653e72dd09bSNélio Laranjeiro 	kvlist = rte_kvargs_parse(devargs->args, params);
165415b0ea00SMatan Azrad 	if (kvlist == NULL) {
165515b0ea00SMatan Azrad 		rte_errno = EINVAL;
165615b0ea00SMatan Azrad 		return -rte_errno;
165715b0ea00SMatan Azrad 	}
1658e72dd09bSNélio Laranjeiro 	/* Process parameters. */
1659e72dd09bSNélio Laranjeiro 	for (i = 0; (params[i] != NULL); ++i) {
1660e72dd09bSNélio Laranjeiro 		if (rte_kvargs_count(kvlist, params[i])) {
1661e72dd09bSNélio Laranjeiro 			ret = rte_kvargs_process(kvlist, params[i],
16627fe24446SShahaf Shuler 						 mlx5_args_check, config);
1663a6d83b6aSNélio Laranjeiro 			if (ret) {
1664a6d83b6aSNélio Laranjeiro 				rte_errno = EINVAL;
1665a67323e4SShahaf Shuler 				rte_kvargs_free(kvlist);
1666a6d83b6aSNélio Laranjeiro 				return -rte_errno;
1667e72dd09bSNélio Laranjeiro 			}
1668e72dd09bSNélio Laranjeiro 		}
1669a67323e4SShahaf Shuler 	}
1670e72dd09bSNélio Laranjeiro 	rte_kvargs_free(kvlist);
1671e72dd09bSNélio Laranjeiro 	return 0;
1672e72dd09bSNélio Laranjeiro }
1673e72dd09bSNélio Laranjeiro 
16747be600c8SYongseok Koh /**
167538b4b397SViacheslav Ovsiienko  * Configures the minimal amount of data to inline into WQE
167638b4b397SViacheslav Ovsiienko  * while sending packets.
167738b4b397SViacheslav Ovsiienko  *
167838b4b397SViacheslav Ovsiienko  * - the txq_inline_min has the maximal priority, if this
167938b4b397SViacheslav Ovsiienko  *   key is specified in devargs
168038b4b397SViacheslav Ovsiienko  * - if DevX is enabled the inline mode is queried from the
168138b4b397SViacheslav Ovsiienko  *   device (HCA attributes and NIC vport context if needed).
1682ee76bddcSThomas Monjalon  * - otherwise L2 mode (18 bytes) is assumed for ConnectX-4/4 Lx
168338b4b397SViacheslav Ovsiienko  *   and none (0 bytes) for other NICs
168438b4b397SViacheslav Ovsiienko  *
168538b4b397SViacheslav Ovsiienko  * @param spawn
168638b4b397SViacheslav Ovsiienko  *   Verbs device parameters (name, port, switch_info) to spawn.
168738b4b397SViacheslav Ovsiienko  * @param config
168838b4b397SViacheslav Ovsiienko  *   Device configuration parameters.
168938b4b397SViacheslav Ovsiienko  */
16902eb4d010SOphir Munk void
169138b4b397SViacheslav Ovsiienko mlx5_set_min_inline(struct mlx5_dev_spawn_data *spawn,
169238b4b397SViacheslav Ovsiienko 		    struct mlx5_dev_config *config)
169338b4b397SViacheslav Ovsiienko {
169438b4b397SViacheslav Ovsiienko 	if (config->txq_inline_min != MLX5_ARG_UNSET) {
169538b4b397SViacheslav Ovsiienko 		/* Application defines size of inlined data explicitly. */
169638b4b397SViacheslav Ovsiienko 		switch (spawn->pci_dev->id.device_id) {
169738b4b397SViacheslav Ovsiienko 		case PCI_DEVICE_ID_MELLANOX_CONNECTX4:
169838b4b397SViacheslav Ovsiienko 		case PCI_DEVICE_ID_MELLANOX_CONNECTX4VF:
169938b4b397SViacheslav Ovsiienko 			if (config->txq_inline_min <
170038b4b397SViacheslav Ovsiienko 				       (int)MLX5_INLINE_HSIZE_L2) {
170138b4b397SViacheslav Ovsiienko 				DRV_LOG(DEBUG,
170238b4b397SViacheslav Ovsiienko 					"txq_inline_mix aligned to minimal"
170338b4b397SViacheslav Ovsiienko 					" ConnectX-4 required value %d",
170438b4b397SViacheslav Ovsiienko 					(int)MLX5_INLINE_HSIZE_L2);
170538b4b397SViacheslav Ovsiienko 				config->txq_inline_min = MLX5_INLINE_HSIZE_L2;
170638b4b397SViacheslav Ovsiienko 			}
170738b4b397SViacheslav Ovsiienko 			break;
170838b4b397SViacheslav Ovsiienko 		}
170938b4b397SViacheslav Ovsiienko 		goto exit;
171038b4b397SViacheslav Ovsiienko 	}
171138b4b397SViacheslav Ovsiienko 	if (config->hca_attr.eth_net_offloads) {
171238b4b397SViacheslav Ovsiienko 		/* We have DevX enabled, inline mode queried successfully. */
171338b4b397SViacheslav Ovsiienko 		switch (config->hca_attr.wqe_inline_mode) {
171438b4b397SViacheslav Ovsiienko 		case MLX5_CAP_INLINE_MODE_L2:
171538b4b397SViacheslav Ovsiienko 			/* outer L2 header must be inlined. */
171638b4b397SViacheslav Ovsiienko 			config->txq_inline_min = MLX5_INLINE_HSIZE_L2;
171738b4b397SViacheslav Ovsiienko 			goto exit;
171838b4b397SViacheslav Ovsiienko 		case MLX5_CAP_INLINE_MODE_NOT_REQUIRED:
171938b4b397SViacheslav Ovsiienko 			/* No inline data are required by NIC. */
172038b4b397SViacheslav Ovsiienko 			config->txq_inline_min = MLX5_INLINE_HSIZE_NONE;
172138b4b397SViacheslav Ovsiienko 			config->hw_vlan_insert =
172238b4b397SViacheslav Ovsiienko 				config->hca_attr.wqe_vlan_insert;
172338b4b397SViacheslav Ovsiienko 			DRV_LOG(DEBUG, "Tx VLAN insertion is supported");
172438b4b397SViacheslav Ovsiienko 			goto exit;
172538b4b397SViacheslav Ovsiienko 		case MLX5_CAP_INLINE_MODE_VPORT_CONTEXT:
172638b4b397SViacheslav Ovsiienko 			/* inline mode is defined by NIC vport context. */
172738b4b397SViacheslav Ovsiienko 			if (!config->hca_attr.eth_virt)
172838b4b397SViacheslav Ovsiienko 				break;
172938b4b397SViacheslav Ovsiienko 			switch (config->hca_attr.vport_inline_mode) {
173038b4b397SViacheslav Ovsiienko 			case MLX5_INLINE_MODE_NONE:
173138b4b397SViacheslav Ovsiienko 				config->txq_inline_min =
173238b4b397SViacheslav Ovsiienko 					MLX5_INLINE_HSIZE_NONE;
173338b4b397SViacheslav Ovsiienko 				goto exit;
173438b4b397SViacheslav Ovsiienko 			case MLX5_INLINE_MODE_L2:
173538b4b397SViacheslav Ovsiienko 				config->txq_inline_min =
173638b4b397SViacheslav Ovsiienko 					MLX5_INLINE_HSIZE_L2;
173738b4b397SViacheslav Ovsiienko 				goto exit;
173838b4b397SViacheslav Ovsiienko 			case MLX5_INLINE_MODE_IP:
173938b4b397SViacheslav Ovsiienko 				config->txq_inline_min =
174038b4b397SViacheslav Ovsiienko 					MLX5_INLINE_HSIZE_L3;
174138b4b397SViacheslav Ovsiienko 				goto exit;
174238b4b397SViacheslav Ovsiienko 			case MLX5_INLINE_MODE_TCP_UDP:
174338b4b397SViacheslav Ovsiienko 				config->txq_inline_min =
174438b4b397SViacheslav Ovsiienko 					MLX5_INLINE_HSIZE_L4;
174538b4b397SViacheslav Ovsiienko 				goto exit;
174638b4b397SViacheslav Ovsiienko 			case MLX5_INLINE_MODE_INNER_L2:
174738b4b397SViacheslav Ovsiienko 				config->txq_inline_min =
174838b4b397SViacheslav Ovsiienko 					MLX5_INLINE_HSIZE_INNER_L2;
174938b4b397SViacheslav Ovsiienko 				goto exit;
175038b4b397SViacheslav Ovsiienko 			case MLX5_INLINE_MODE_INNER_IP:
175138b4b397SViacheslav Ovsiienko 				config->txq_inline_min =
175238b4b397SViacheslav Ovsiienko 					MLX5_INLINE_HSIZE_INNER_L3;
175338b4b397SViacheslav Ovsiienko 				goto exit;
175438b4b397SViacheslav Ovsiienko 			case MLX5_INLINE_MODE_INNER_TCP_UDP:
175538b4b397SViacheslav Ovsiienko 				config->txq_inline_min =
175638b4b397SViacheslav Ovsiienko 					MLX5_INLINE_HSIZE_INNER_L4;
175738b4b397SViacheslav Ovsiienko 				goto exit;
175838b4b397SViacheslav Ovsiienko 			}
175938b4b397SViacheslav Ovsiienko 		}
176038b4b397SViacheslav Ovsiienko 	}
176138b4b397SViacheslav Ovsiienko 	/*
176238b4b397SViacheslav Ovsiienko 	 * We get here if we are unable to deduce
176338b4b397SViacheslav Ovsiienko 	 * inline data size with DevX. Try PCI ID
176438b4b397SViacheslav Ovsiienko 	 * to determine old NICs.
176538b4b397SViacheslav Ovsiienko 	 */
176638b4b397SViacheslav Ovsiienko 	switch (spawn->pci_dev->id.device_id) {
176738b4b397SViacheslav Ovsiienko 	case PCI_DEVICE_ID_MELLANOX_CONNECTX4:
176838b4b397SViacheslav Ovsiienko 	case PCI_DEVICE_ID_MELLANOX_CONNECTX4VF:
176938b4b397SViacheslav Ovsiienko 	case PCI_DEVICE_ID_MELLANOX_CONNECTX4LX:
177038b4b397SViacheslav Ovsiienko 	case PCI_DEVICE_ID_MELLANOX_CONNECTX4LXVF:
1771614de6c8SViacheslav Ovsiienko 		config->txq_inline_min = MLX5_INLINE_HSIZE_L2;
177238b4b397SViacheslav Ovsiienko 		config->hw_vlan_insert = 0;
177338b4b397SViacheslav Ovsiienko 		break;
177438b4b397SViacheslav Ovsiienko 	case PCI_DEVICE_ID_MELLANOX_CONNECTX5:
177538b4b397SViacheslav Ovsiienko 	case PCI_DEVICE_ID_MELLANOX_CONNECTX5VF:
177638b4b397SViacheslav Ovsiienko 	case PCI_DEVICE_ID_MELLANOX_CONNECTX5EX:
177738b4b397SViacheslav Ovsiienko 	case PCI_DEVICE_ID_MELLANOX_CONNECTX5EXVF:
177838b4b397SViacheslav Ovsiienko 		/*
177938b4b397SViacheslav Ovsiienko 		 * These NICs support VLAN insertion from WQE and
178038b4b397SViacheslav Ovsiienko 		 * report the wqe_vlan_insert flag. But there is the bug
178138b4b397SViacheslav Ovsiienko 		 * and PFC control may be broken, so disable feature.
178238b4b397SViacheslav Ovsiienko 		 */
178338b4b397SViacheslav Ovsiienko 		config->hw_vlan_insert = 0;
178420215627SDavid Christensen 		config->txq_inline_min = MLX5_INLINE_HSIZE_NONE;
178538b4b397SViacheslav Ovsiienko 		break;
178638b4b397SViacheslav Ovsiienko 	default:
178738b4b397SViacheslav Ovsiienko 		config->txq_inline_min = MLX5_INLINE_HSIZE_NONE;
178838b4b397SViacheslav Ovsiienko 		break;
178938b4b397SViacheslav Ovsiienko 	}
179038b4b397SViacheslav Ovsiienko exit:
179138b4b397SViacheslav Ovsiienko 	DRV_LOG(DEBUG, "min tx inline configured: %d", config->txq_inline_min);
179238b4b397SViacheslav Ovsiienko }
179338b4b397SViacheslav Ovsiienko 
179438b4b397SViacheslav Ovsiienko /**
179539139371SViacheslav Ovsiienko  * Configures the metadata mask fields in the shared context.
179639139371SViacheslav Ovsiienko  *
179739139371SViacheslav Ovsiienko  * @param [in] dev
179839139371SViacheslav Ovsiienko  *   Pointer to Ethernet device.
179939139371SViacheslav Ovsiienko  */
18002eb4d010SOphir Munk void
180139139371SViacheslav Ovsiienko mlx5_set_metadata_mask(struct rte_eth_dev *dev)
180239139371SViacheslav Ovsiienko {
180339139371SViacheslav Ovsiienko 	struct mlx5_priv *priv = dev->data->dev_private;
18046e88bc42SOphir Munk 	struct mlx5_dev_ctx_shared *sh = priv->sh;
180539139371SViacheslav Ovsiienko 	uint32_t meta, mark, reg_c0;
180639139371SViacheslav Ovsiienko 
180739139371SViacheslav Ovsiienko 	reg_c0 = ~priv->vport_meta_mask;
180839139371SViacheslav Ovsiienko 	switch (priv->config.dv_xmeta_en) {
180939139371SViacheslav Ovsiienko 	case MLX5_XMETA_MODE_LEGACY:
181039139371SViacheslav Ovsiienko 		meta = UINT32_MAX;
181139139371SViacheslav Ovsiienko 		mark = MLX5_FLOW_MARK_MASK;
181239139371SViacheslav Ovsiienko 		break;
181339139371SViacheslav Ovsiienko 	case MLX5_XMETA_MODE_META16:
181439139371SViacheslav Ovsiienko 		meta = reg_c0 >> rte_bsf32(reg_c0);
181539139371SViacheslav Ovsiienko 		mark = MLX5_FLOW_MARK_MASK;
181639139371SViacheslav Ovsiienko 		break;
181739139371SViacheslav Ovsiienko 	case MLX5_XMETA_MODE_META32:
181839139371SViacheslav Ovsiienko 		meta = UINT32_MAX;
181939139371SViacheslav Ovsiienko 		mark = (reg_c0 >> rte_bsf32(reg_c0)) & MLX5_FLOW_MARK_MASK;
182039139371SViacheslav Ovsiienko 		break;
182139139371SViacheslav Ovsiienko 	default:
182239139371SViacheslav Ovsiienko 		meta = 0;
182339139371SViacheslav Ovsiienko 		mark = 0;
18248e46d4e1SAlexander Kozyrev 		MLX5_ASSERT(false);
182539139371SViacheslav Ovsiienko 		break;
182639139371SViacheslav Ovsiienko 	}
182739139371SViacheslav Ovsiienko 	if (sh->dv_mark_mask && sh->dv_mark_mask != mark)
182839139371SViacheslav Ovsiienko 		DRV_LOG(WARNING, "metadata MARK mask mismatche %08X:%08X",
182939139371SViacheslav Ovsiienko 				 sh->dv_mark_mask, mark);
183039139371SViacheslav Ovsiienko 	else
183139139371SViacheslav Ovsiienko 		sh->dv_mark_mask = mark;
183239139371SViacheslav Ovsiienko 	if (sh->dv_meta_mask && sh->dv_meta_mask != meta)
183339139371SViacheslav Ovsiienko 		DRV_LOG(WARNING, "metadata META mask mismatche %08X:%08X",
183439139371SViacheslav Ovsiienko 				 sh->dv_meta_mask, meta);
183539139371SViacheslav Ovsiienko 	else
183639139371SViacheslav Ovsiienko 		sh->dv_meta_mask = meta;
183739139371SViacheslav Ovsiienko 	if (sh->dv_regc0_mask && sh->dv_regc0_mask != reg_c0)
183839139371SViacheslav Ovsiienko 		DRV_LOG(WARNING, "metadata reg_c0 mask mismatche %08X:%08X",
183939139371SViacheslav Ovsiienko 				 sh->dv_meta_mask, reg_c0);
184039139371SViacheslav Ovsiienko 	else
184139139371SViacheslav Ovsiienko 		sh->dv_regc0_mask = reg_c0;
184239139371SViacheslav Ovsiienko 	DRV_LOG(DEBUG, "metadata mode %u", priv->config.dv_xmeta_en);
184339139371SViacheslav Ovsiienko 	DRV_LOG(DEBUG, "metadata MARK mask %08X", sh->dv_mark_mask);
184439139371SViacheslav Ovsiienko 	DRV_LOG(DEBUG, "metadata META mask %08X", sh->dv_meta_mask);
184539139371SViacheslav Ovsiienko 	DRV_LOG(DEBUG, "metadata reg_c0 mask %08X", sh->dv_regc0_mask);
184639139371SViacheslav Ovsiienko }
184739139371SViacheslav Ovsiienko 
1848efa79e68SOri Kam int
1849efa79e68SOri Kam rte_pmd_mlx5_get_dyn_flag_names(char *names[], unsigned int n)
1850efa79e68SOri Kam {
1851efa79e68SOri Kam 	static const char *const dynf_names[] = {
1852efa79e68SOri Kam 		RTE_PMD_MLX5_FINE_GRANULARITY_INLINE,
18538f848f32SViacheslav Ovsiienko 		RTE_MBUF_DYNFLAG_METADATA_NAME,
18548f848f32SViacheslav Ovsiienko 		RTE_MBUF_DYNFLAG_TX_TIMESTAMP_NAME
1855efa79e68SOri Kam 	};
1856efa79e68SOri Kam 	unsigned int i;
1857efa79e68SOri Kam 
1858efa79e68SOri Kam 	if (n < RTE_DIM(dynf_names))
1859efa79e68SOri Kam 		return -ENOMEM;
1860efa79e68SOri Kam 	for (i = 0; i < RTE_DIM(dynf_names); i++) {
1861efa79e68SOri Kam 		if (names[i] == NULL)
1862efa79e68SOri Kam 			return -EINVAL;
1863efa79e68SOri Kam 		strcpy(names[i], dynf_names[i]);
1864efa79e68SOri Kam 	}
1865efa79e68SOri Kam 	return RTE_DIM(dynf_names);
1866efa79e68SOri Kam }
1867efa79e68SOri Kam 
186821cae858SDekel Peled /**
18692eb4d010SOphir Munk  * Comparison callback to sort device data.
187092d5dd48SViacheslav Ovsiienko  *
18712eb4d010SOphir Munk  * This is meant to be used with qsort().
187292d5dd48SViacheslav Ovsiienko  *
18732eb4d010SOphir Munk  * @param a[in]
18742eb4d010SOphir Munk  *   Pointer to pointer to first data object.
18752eb4d010SOphir Munk  * @param b[in]
18762eb4d010SOphir Munk  *   Pointer to pointer to second data object.
187792d5dd48SViacheslav Ovsiienko  *
187892d5dd48SViacheslav Ovsiienko  * @return
18792eb4d010SOphir Munk  *   0 if both objects are equal, less than 0 if the first argument is less
18802eb4d010SOphir Munk  *   than the second, greater than 0 otherwise.
188192d5dd48SViacheslav Ovsiienko  */
18822eb4d010SOphir Munk int
188392d5dd48SViacheslav Ovsiienko mlx5_dev_check_sibling_config(struct mlx5_priv *priv,
188492d5dd48SViacheslav Ovsiienko 			      struct mlx5_dev_config *config)
188592d5dd48SViacheslav Ovsiienko {
18866e88bc42SOphir Munk 	struct mlx5_dev_ctx_shared *sh = priv->sh;
188792d5dd48SViacheslav Ovsiienko 	struct mlx5_dev_config *sh_conf = NULL;
188892d5dd48SViacheslav Ovsiienko 	uint16_t port_id;
188992d5dd48SViacheslav Ovsiienko 
18908e46d4e1SAlexander Kozyrev 	MLX5_ASSERT(sh);
189192d5dd48SViacheslav Ovsiienko 	/* Nothing to compare for the single/first device. */
189292d5dd48SViacheslav Ovsiienko 	if (sh->refcnt == 1)
189392d5dd48SViacheslav Ovsiienko 		return 0;
189492d5dd48SViacheslav Ovsiienko 	/* Find the device with shared context. */
1895fbc83412SViacheslav Ovsiienko 	MLX5_ETH_FOREACH_DEV(port_id, priv->pci_dev) {
189692d5dd48SViacheslav Ovsiienko 		struct mlx5_priv *opriv =
189792d5dd48SViacheslav Ovsiienko 			rte_eth_devices[port_id].data->dev_private;
189892d5dd48SViacheslav Ovsiienko 
189992d5dd48SViacheslav Ovsiienko 		if (opriv && opriv != priv && opriv->sh == sh) {
190092d5dd48SViacheslav Ovsiienko 			sh_conf = &opriv->config;
190192d5dd48SViacheslav Ovsiienko 			break;
190292d5dd48SViacheslav Ovsiienko 		}
190392d5dd48SViacheslav Ovsiienko 	}
190492d5dd48SViacheslav Ovsiienko 	if (!sh_conf)
190592d5dd48SViacheslav Ovsiienko 		return 0;
190692d5dd48SViacheslav Ovsiienko 	if (sh_conf->dv_flow_en ^ config->dv_flow_en) {
190792d5dd48SViacheslav Ovsiienko 		DRV_LOG(ERR, "\"dv_flow_en\" configuration mismatch"
190892d5dd48SViacheslav Ovsiienko 			     " for shared %s context", sh->ibdev_name);
190992d5dd48SViacheslav Ovsiienko 		rte_errno = EINVAL;
191092d5dd48SViacheslav Ovsiienko 		return rte_errno;
191192d5dd48SViacheslav Ovsiienko 	}
19122d241515SViacheslav Ovsiienko 	if (sh_conf->dv_xmeta_en ^ config->dv_xmeta_en) {
19132d241515SViacheslav Ovsiienko 		DRV_LOG(ERR, "\"dv_xmeta_en\" configuration mismatch"
19142d241515SViacheslav Ovsiienko 			     " for shared %s context", sh->ibdev_name);
19152d241515SViacheslav Ovsiienko 		rte_errno = EINVAL;
19162d241515SViacheslav Ovsiienko 		return rte_errno;
19172d241515SViacheslav Ovsiienko 	}
191892d5dd48SViacheslav Ovsiienko 	return 0;
191992d5dd48SViacheslav Ovsiienko }
1920771fa900SAdrien Mazarguil 
1921fbc83412SViacheslav Ovsiienko /**
1922fbc83412SViacheslav Ovsiienko  * Look for the ethernet device belonging to mlx5 driver.
1923fbc83412SViacheslav Ovsiienko  *
1924fbc83412SViacheslav Ovsiienko  * @param[in] port_id
1925fbc83412SViacheslav Ovsiienko  *   port_id to start looking for device.
1926fbc83412SViacheslav Ovsiienko  * @param[in] pci_dev
1927fbc83412SViacheslav Ovsiienko  *   Pointer to the hint PCI device. When device is being probed
1928fbc83412SViacheslav Ovsiienko  *   the its siblings (master and preceding representors might
19292eb4d010SOphir Munk  *   not have assigned driver yet (because the mlx5_os_pci_probe()
1930fbc83412SViacheslav Ovsiienko  *   is not completed yet, for this case match on hint PCI
1931fbc83412SViacheslav Ovsiienko  *   device may be used to detect sibling device.
1932fbc83412SViacheslav Ovsiienko  *
1933fbc83412SViacheslav Ovsiienko  * @return
1934fbc83412SViacheslav Ovsiienko  *   port_id of found device, RTE_MAX_ETHPORT if not found.
1935fbc83412SViacheslav Ovsiienko  */
1936f7e95215SViacheslav Ovsiienko uint16_t
1937fbc83412SViacheslav Ovsiienko mlx5_eth_find_next(uint16_t port_id, struct rte_pci_device *pci_dev)
1938f7e95215SViacheslav Ovsiienko {
1939f7e95215SViacheslav Ovsiienko 	while (port_id < RTE_MAX_ETHPORTS) {
1940f7e95215SViacheslav Ovsiienko 		struct rte_eth_dev *dev = &rte_eth_devices[port_id];
1941f7e95215SViacheslav Ovsiienko 
1942f7e95215SViacheslav Ovsiienko 		if (dev->state != RTE_ETH_DEV_UNUSED &&
1943f7e95215SViacheslav Ovsiienko 		    dev->device &&
1944fbc83412SViacheslav Ovsiienko 		    (dev->device == &pci_dev->device ||
1945fbc83412SViacheslav Ovsiienko 		     (dev->device->driver &&
1946f7e95215SViacheslav Ovsiienko 		     dev->device->driver->name &&
1947fbc83412SViacheslav Ovsiienko 		     !strcmp(dev->device->driver->name, MLX5_DRIVER_NAME))))
1948f7e95215SViacheslav Ovsiienko 			break;
1949f7e95215SViacheslav Ovsiienko 		port_id++;
1950f7e95215SViacheslav Ovsiienko 	}
1951f7e95215SViacheslav Ovsiienko 	if (port_id >= RTE_MAX_ETHPORTS)
1952f7e95215SViacheslav Ovsiienko 		return RTE_MAX_ETHPORTS;
1953f7e95215SViacheslav Ovsiienko 	return port_id;
1954f7e95215SViacheslav Ovsiienko }
1955f7e95215SViacheslav Ovsiienko 
19563a820742SOphir Munk /**
19573a820742SOphir Munk  * DPDK callback to remove a PCI device.
19583a820742SOphir Munk  *
19593a820742SOphir Munk  * This function removes all Ethernet devices belong to a given PCI device.
19603a820742SOphir Munk  *
19613a820742SOphir Munk  * @param[in] pci_dev
19623a820742SOphir Munk  *   Pointer to the PCI device.
19633a820742SOphir Munk  *
19643a820742SOphir Munk  * @return
19653a820742SOphir Munk  *   0 on success, the function cannot fail.
19663a820742SOphir Munk  */
19673a820742SOphir Munk static int
19683a820742SOphir Munk mlx5_pci_remove(struct rte_pci_device *pci_dev)
19693a820742SOphir Munk {
19703a820742SOphir Munk 	uint16_t port_id;
19718a5a0aadSThomas Monjalon 	int ret = 0;
19723a820742SOphir Munk 
19732786b7bfSSuanming Mou 	RTE_ETH_FOREACH_DEV_OF(port_id, &pci_dev->device) {
19742786b7bfSSuanming Mou 		/*
19752786b7bfSSuanming Mou 		 * mlx5_dev_close() is not registered to secondary process,
19762786b7bfSSuanming Mou 		 * call the close function explicitly for secondary process.
19772786b7bfSSuanming Mou 		 */
19782786b7bfSSuanming Mou 		if (rte_eal_process_type() == RTE_PROC_SECONDARY)
19798a5a0aadSThomas Monjalon 			ret |= mlx5_dev_close(&rte_eth_devices[port_id]);
19802786b7bfSSuanming Mou 		else
19818a5a0aadSThomas Monjalon 			ret |= rte_eth_dev_close(port_id);
19822786b7bfSSuanming Mou 	}
19838a5a0aadSThomas Monjalon 	return ret == 0 ? 0 : -EIO;
19843a820742SOphir Munk }
19853a820742SOphir Munk 
1986771fa900SAdrien Mazarguil static const struct rte_pci_id mlx5_pci_id_map[] = {
1987771fa900SAdrien Mazarguil 	{
19881d1bc870SNélio Laranjeiro 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
19891d1bc870SNélio Laranjeiro 			       PCI_DEVICE_ID_MELLANOX_CONNECTX4)
1990771fa900SAdrien Mazarguil 	},
1991771fa900SAdrien Mazarguil 	{
19921d1bc870SNélio Laranjeiro 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
19931d1bc870SNélio Laranjeiro 			       PCI_DEVICE_ID_MELLANOX_CONNECTX4VF)
1994771fa900SAdrien Mazarguil 	},
1995771fa900SAdrien Mazarguil 	{
19961d1bc870SNélio Laranjeiro 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
19971d1bc870SNélio Laranjeiro 			       PCI_DEVICE_ID_MELLANOX_CONNECTX4LX)
1998771fa900SAdrien Mazarguil 	},
1999771fa900SAdrien Mazarguil 	{
20001d1bc870SNélio Laranjeiro 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
20011d1bc870SNélio Laranjeiro 			       PCI_DEVICE_ID_MELLANOX_CONNECTX4LXVF)
2002771fa900SAdrien Mazarguil 	},
2003771fa900SAdrien Mazarguil 	{
2004528a9fbeSYongseok Koh 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
2005528a9fbeSYongseok Koh 			       PCI_DEVICE_ID_MELLANOX_CONNECTX5)
2006528a9fbeSYongseok Koh 	},
2007528a9fbeSYongseok Koh 	{
2008528a9fbeSYongseok Koh 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
2009528a9fbeSYongseok Koh 			       PCI_DEVICE_ID_MELLANOX_CONNECTX5VF)
2010528a9fbeSYongseok Koh 	},
2011528a9fbeSYongseok Koh 	{
2012528a9fbeSYongseok Koh 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
2013528a9fbeSYongseok Koh 			       PCI_DEVICE_ID_MELLANOX_CONNECTX5EX)
2014528a9fbeSYongseok Koh 	},
2015528a9fbeSYongseok Koh 	{
2016528a9fbeSYongseok Koh 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
2017528a9fbeSYongseok Koh 			       PCI_DEVICE_ID_MELLANOX_CONNECTX5EXVF)
2018528a9fbeSYongseok Koh 	},
2019528a9fbeSYongseok Koh 	{
2020dd3331c6SShahaf Shuler 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
2021dd3331c6SShahaf Shuler 			       PCI_DEVICE_ID_MELLANOX_CONNECTX5BF)
2022dd3331c6SShahaf Shuler 	},
2023dd3331c6SShahaf Shuler 	{
2024c322c0e5SOri Kam 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
2025c322c0e5SOri Kam 			       PCI_DEVICE_ID_MELLANOX_CONNECTX5BFVF)
2026c322c0e5SOri Kam 	},
2027c322c0e5SOri Kam 	{
2028f0354d84SWisam Jaddo 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
2029f0354d84SWisam Jaddo 				PCI_DEVICE_ID_MELLANOX_CONNECTX6)
2030f0354d84SWisam Jaddo 	},
2031f0354d84SWisam Jaddo 	{
2032f0354d84SWisam Jaddo 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
2033f0354d84SWisam Jaddo 				PCI_DEVICE_ID_MELLANOX_CONNECTX6VF)
2034f0354d84SWisam Jaddo 	},
2035f0354d84SWisam Jaddo 	{
20365fc66630SRaslan Darawsheh 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
20375fc66630SRaslan Darawsheh 				PCI_DEVICE_ID_MELLANOX_CONNECTX6DX)
20385fc66630SRaslan Darawsheh 	},
20395fc66630SRaslan Darawsheh 	{
20405fc66630SRaslan Darawsheh 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
20413ea12cadSRaslan Darawsheh 				PCI_DEVICE_ID_MELLANOX_CONNECTXVF)
20425fc66630SRaslan Darawsheh 	},
20435fc66630SRaslan Darawsheh 	{
204458b4a2b1SRaslan Darawsheh 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
204558b4a2b1SRaslan Darawsheh 				PCI_DEVICE_ID_MELLANOX_CONNECTX6DXBF)
204658b4a2b1SRaslan Darawsheh 	},
204758b4a2b1SRaslan Darawsheh 	{
204828c9a7d7SAli Alnubani 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
204928c9a7d7SAli Alnubani 				PCI_DEVICE_ID_MELLANOX_CONNECTX6LX)
205028c9a7d7SAli Alnubani 	},
205128c9a7d7SAli Alnubani 	{
20526ca37b06SRaslan Darawsheh 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
20536ca37b06SRaslan Darawsheh 				PCI_DEVICE_ID_MELLANOX_CONNECTX7)
20546ca37b06SRaslan Darawsheh 	},
20556ca37b06SRaslan Darawsheh 	{
20566ca37b06SRaslan Darawsheh 		RTE_PCI_DEVICE(PCI_VENDOR_ID_MELLANOX,
20576ca37b06SRaslan Darawsheh 				PCI_DEVICE_ID_MELLANOX_CONNECTX7BF)
20586ca37b06SRaslan Darawsheh 	},
20596ca37b06SRaslan Darawsheh 	{
2060771fa900SAdrien Mazarguil 		.vendor_id = 0
2061771fa900SAdrien Mazarguil 	}
2062771fa900SAdrien Mazarguil };
2063771fa900SAdrien Mazarguil 
2064392bf908SParav Pandit static struct mlx5_pci_driver mlx5_driver = {
2065392bf908SParav Pandit 	.driver_class = MLX5_CLASS_NET,
2066392bf908SParav Pandit 	.pci_driver = {
20672f3193cfSJan Viktorin 		.driver = {
2068392bf908SParav Pandit 			.name = MLX5_DRIVER_NAME,
20692f3193cfSJan Viktorin 		},
2070771fa900SAdrien Mazarguil 		.id_table = mlx5_pci_id_map,
20712eb4d010SOphir Munk 		.probe = mlx5_os_pci_probe,
20723a820742SOphir Munk 		.remove = mlx5_pci_remove,
2073989e999dSShahaf Shuler 		.dma_map = mlx5_dma_map,
2074989e999dSShahaf Shuler 		.dma_unmap = mlx5_dma_unmap,
207510f3581dSOphir Munk 		.drv_flags = PCI_DRV_FLAGS,
2076392bf908SParav Pandit 	},
2077771fa900SAdrien Mazarguil };
2078771fa900SAdrien Mazarguil 
20799c99878aSJerin Jacob /* Initialize driver log type. */
20809c99878aSJerin Jacob RTE_LOG_REGISTER(mlx5_logtype, pmd.net.mlx5, NOTICE)
20819c99878aSJerin Jacob 
2082771fa900SAdrien Mazarguil /**
2083771fa900SAdrien Mazarguil  * Driver initialization routine.
2084771fa900SAdrien Mazarguil  */
2085f8e99896SThomas Monjalon RTE_INIT(rte_mlx5_pmd_init)
2086771fa900SAdrien Mazarguil {
208782088001SParav Pandit 	mlx5_common_init();
20885f8ba81cSXueming Li 	/* Build the static tables for Verbs conversion. */
2089ea16068cSYongseok Koh 	mlx5_set_ptype_table();
20905f8ba81cSXueming Li 	mlx5_set_cksum_table();
20915f8ba81cSXueming Li 	mlx5_set_swp_types_table();
20927b4f1e6bSMatan Azrad 	if (mlx5_glue)
2093392bf908SParav Pandit 		mlx5_pci_driver_register(&mlx5_driver);
2094771fa900SAdrien Mazarguil }
2095771fa900SAdrien Mazarguil 
209601f19227SShreyansh Jain RTE_PMD_EXPORT_NAME(net_mlx5, __COUNTER__);
209701f19227SShreyansh Jain RTE_PMD_REGISTER_PCI_TABLE(net_mlx5, mlx5_pci_id_map);
20980880c401SOlivier Matz RTE_PMD_REGISTER_KMOD_DEP(net_mlx5, "* ib_uverbs & mlx5_core & mlx5_ib");
2099