xref: /dpdk/drivers/net/mlx5/mlx5_ethdev.c (revision b233b027490b858f740a75fac19632a25d3aefdd)
1771fa900SAdrien Mazarguil /*-
2771fa900SAdrien Mazarguil  *   BSD LICENSE
3771fa900SAdrien Mazarguil  *
4771fa900SAdrien Mazarguil  *   Copyright 2015 6WIND S.A.
5771fa900SAdrien Mazarguil  *   Copyright 2015 Mellanox.
6771fa900SAdrien Mazarguil  *
7771fa900SAdrien Mazarguil  *   Redistribution and use in source and binary forms, with or without
8771fa900SAdrien Mazarguil  *   modification, are permitted provided that the following conditions
9771fa900SAdrien Mazarguil  *   are met:
10771fa900SAdrien Mazarguil  *
11771fa900SAdrien Mazarguil  *     * Redistributions of source code must retain the above copyright
12771fa900SAdrien Mazarguil  *       notice, this list of conditions and the following disclaimer.
13771fa900SAdrien Mazarguil  *     * Redistributions in binary form must reproduce the above copyright
14771fa900SAdrien Mazarguil  *       notice, this list of conditions and the following disclaimer in
15771fa900SAdrien Mazarguil  *       the documentation and/or other materials provided with the
16771fa900SAdrien Mazarguil  *       distribution.
17771fa900SAdrien Mazarguil  *     * Neither the name of 6WIND S.A. nor the names of its
18771fa900SAdrien Mazarguil  *       contributors may be used to endorse or promote products derived
19771fa900SAdrien Mazarguil  *       from this software without specific prior written permission.
20771fa900SAdrien Mazarguil  *
21771fa900SAdrien Mazarguil  *   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
22771fa900SAdrien Mazarguil  *   "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
23771fa900SAdrien Mazarguil  *   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
24771fa900SAdrien Mazarguil  *   A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
25771fa900SAdrien Mazarguil  *   OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
26771fa900SAdrien Mazarguil  *   SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
27771fa900SAdrien Mazarguil  *   LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
28771fa900SAdrien Mazarguil  *   DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
29771fa900SAdrien Mazarguil  *   THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
30771fa900SAdrien Mazarguil  *   (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
31771fa900SAdrien Mazarguil  *   OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
32771fa900SAdrien Mazarguil  */
33771fa900SAdrien Mazarguil 
34f8b9a3baSXueming Li #define _GNU_SOURCE
35f8b9a3baSXueming Li 
36771fa900SAdrien Mazarguil #include <stddef.h>
37e60fbd5bSAdrien Mazarguil #include <assert.h>
38771fa900SAdrien Mazarguil #include <unistd.h>
39771fa900SAdrien Mazarguil #include <stdint.h>
40771fa900SAdrien Mazarguil #include <stdio.h>
41771fa900SAdrien Mazarguil #include <string.h>
42771fa900SAdrien Mazarguil #include <stdlib.h>
43771fa900SAdrien Mazarguil #include <errno.h>
44771fa900SAdrien Mazarguil #include <dirent.h>
45771fa900SAdrien Mazarguil #include <net/if.h>
46771fa900SAdrien Mazarguil #include <sys/ioctl.h>
47771fa900SAdrien Mazarguil #include <sys/socket.h>
483a49ffe3SShahaf Shuler #include <sys/utsname.h>
49771fa900SAdrien Mazarguil #include <netinet/in.h>
50cb8faed7SAdrien Mazarguil #include <linux/ethtool.h>
51cb8faed7SAdrien Mazarguil #include <linux/sockios.h>
523a49ffe3SShahaf Shuler #include <linux/version.h>
53198a3c33SNelio Laranjeiro #include <fcntl.h>
5490260d57SNélio Laranjeiro #include <stdalign.h>
55f8b9a3baSXueming Li #include <sys/un.h>
56771fa900SAdrien Mazarguil 
57771fa900SAdrien Mazarguil #include <rte_atomic.h>
58ffc905f3SFerruh Yigit #include <rte_ethdev_driver.h>
59c752998bSGaetan Rivet #include <rte_bus_pci.h>
60771fa900SAdrien Mazarguil #include <rte_mbuf.h>
61771fa900SAdrien Mazarguil #include <rte_common.h>
62198a3c33SNelio Laranjeiro #include <rte_interrupts.h>
63198a3c33SNelio Laranjeiro #include <rte_alarm.h>
64a48deadaSOr Ami #include <rte_malloc.h>
65771fa900SAdrien Mazarguil 
66771fa900SAdrien Mazarguil #include "mlx5.h"
67e60fbd5bSAdrien Mazarguil #include "mlx5_rxtx.h"
68771fa900SAdrien Mazarguil #include "mlx5_utils.h"
69771fa900SAdrien Mazarguil 
703a49ffe3SShahaf Shuler /* Add defines in case the running kernel is not the same as user headers. */
713a49ffe3SShahaf Shuler #ifndef ETHTOOL_GLINKSETTINGS
723a49ffe3SShahaf Shuler struct ethtool_link_settings {
733a49ffe3SShahaf Shuler 	uint32_t cmd;
743a49ffe3SShahaf Shuler 	uint32_t speed;
753a49ffe3SShahaf Shuler 	uint8_t duplex;
763a49ffe3SShahaf Shuler 	uint8_t port;
773a49ffe3SShahaf Shuler 	uint8_t phy_address;
783a49ffe3SShahaf Shuler 	uint8_t autoneg;
793a49ffe3SShahaf Shuler 	uint8_t mdio_support;
803a49ffe3SShahaf Shuler 	uint8_t eth_to_mdix;
813a49ffe3SShahaf Shuler 	uint8_t eth_tp_mdix_ctrl;
823a49ffe3SShahaf Shuler 	int8_t link_mode_masks_nwords;
833a49ffe3SShahaf Shuler 	uint32_t reserved[8];
843a49ffe3SShahaf Shuler 	uint32_t link_mode_masks[];
853a49ffe3SShahaf Shuler };
863a49ffe3SShahaf Shuler 
873a49ffe3SShahaf Shuler #define ETHTOOL_GLINKSETTINGS 0x0000004c
883a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_1000baseT_Full_BIT 5
893a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_Autoneg_BIT 6
903a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_1000baseKX_Full_BIT 17
913a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_10000baseKX4_Full_BIT 18
923a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_10000baseKR_Full_BIT 19
933a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_10000baseR_FEC_BIT 20
943a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_20000baseMLD2_Full_BIT 21
953a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_20000baseKR2_Full_BIT 22
963a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_40000baseKR4_Full_BIT 23
973a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_40000baseCR4_Full_BIT 24
983a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_40000baseSR4_Full_BIT 25
993a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_40000baseLR4_Full_BIT 26
1003a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_56000baseKR4_Full_BIT 27
1013a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_56000baseCR4_Full_BIT 28
1023a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_56000baseSR4_Full_BIT 29
1033a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_56000baseLR4_Full_BIT 30
1043a49ffe3SShahaf Shuler #endif
1053a49ffe3SShahaf Shuler #ifndef HAVE_ETHTOOL_LINK_MODE_25G
1063a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_25000baseCR_Full_BIT 31
1073a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_25000baseKR_Full_BIT 32
1083a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_25000baseSR_Full_BIT 33
1093a49ffe3SShahaf Shuler #endif
1103a49ffe3SShahaf Shuler #ifndef HAVE_ETHTOOL_LINK_MODE_50G
1113a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_50000baseCR2_Full_BIT 34
1123a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_50000baseKR2_Full_BIT 35
1133a49ffe3SShahaf Shuler #endif
1143a49ffe3SShahaf Shuler #ifndef HAVE_ETHTOOL_LINK_MODE_100G
1153a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_100000baseKR4_Full_BIT 36
1163a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_100000baseSR4_Full_BIT 37
1173a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_100000baseCR4_Full_BIT 38
1183a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_100000baseLR4_ER4_Full_BIT 39
1193a49ffe3SShahaf Shuler #endif
1203a49ffe3SShahaf Shuler 
121771fa900SAdrien Mazarguil /**
122771fa900SAdrien Mazarguil  * Get interface name from private structure.
123771fa900SAdrien Mazarguil  *
124771fa900SAdrien Mazarguil  * @param[in] priv
125771fa900SAdrien Mazarguil  *   Pointer to private structure.
126771fa900SAdrien Mazarguil  * @param[out] ifname
127771fa900SAdrien Mazarguil  *   Interface name output buffer.
128771fa900SAdrien Mazarguil  *
129771fa900SAdrien Mazarguil  * @return
130771fa900SAdrien Mazarguil  *   0 on success, -1 on failure and errno is set.
131771fa900SAdrien Mazarguil  */
132771fa900SAdrien Mazarguil int
133771fa900SAdrien Mazarguil priv_get_ifname(const struct priv *priv, char (*ifname)[IF_NAMESIZE])
134771fa900SAdrien Mazarguil {
135771fa900SAdrien Mazarguil 	DIR *dir;
136771fa900SAdrien Mazarguil 	struct dirent *dent;
137771fa900SAdrien Mazarguil 	unsigned int dev_type = 0;
138771fa900SAdrien Mazarguil 	unsigned int dev_port_prev = ~0u;
139771fa900SAdrien Mazarguil 	char match[IF_NAMESIZE] = "";
140771fa900SAdrien Mazarguil 
141771fa900SAdrien Mazarguil 	{
14287ec44ceSXueming Li 		MKSTR(path, "%s/device/net", priv->ibdev_path);
143771fa900SAdrien Mazarguil 
144771fa900SAdrien Mazarguil 		dir = opendir(path);
145771fa900SAdrien Mazarguil 		if (dir == NULL)
146771fa900SAdrien Mazarguil 			return -1;
147771fa900SAdrien Mazarguil 	}
148771fa900SAdrien Mazarguil 	while ((dent = readdir(dir)) != NULL) {
149771fa900SAdrien Mazarguil 		char *name = dent->d_name;
150771fa900SAdrien Mazarguil 		FILE *file;
151771fa900SAdrien Mazarguil 		unsigned int dev_port;
152771fa900SAdrien Mazarguil 		int r;
153771fa900SAdrien Mazarguil 
154771fa900SAdrien Mazarguil 		if ((name[0] == '.') &&
155771fa900SAdrien Mazarguil 		    ((name[1] == '\0') ||
156771fa900SAdrien Mazarguil 		     ((name[1] == '.') && (name[2] == '\0'))))
157771fa900SAdrien Mazarguil 			continue;
158771fa900SAdrien Mazarguil 
159771fa900SAdrien Mazarguil 		MKSTR(path, "%s/device/net/%s/%s",
16087ec44ceSXueming Li 		      priv->ibdev_path, name,
161771fa900SAdrien Mazarguil 		      (dev_type ? "dev_id" : "dev_port"));
162771fa900SAdrien Mazarguil 
163771fa900SAdrien Mazarguil 		file = fopen(path, "rb");
164771fa900SAdrien Mazarguil 		if (file == NULL) {
165771fa900SAdrien Mazarguil 			if (errno != ENOENT)
166771fa900SAdrien Mazarguil 				continue;
167771fa900SAdrien Mazarguil 			/*
168771fa900SAdrien Mazarguil 			 * Switch to dev_id when dev_port does not exist as
169771fa900SAdrien Mazarguil 			 * is the case with Linux kernel versions < 3.15.
170771fa900SAdrien Mazarguil 			 */
171771fa900SAdrien Mazarguil try_dev_id:
172771fa900SAdrien Mazarguil 			match[0] = '\0';
173771fa900SAdrien Mazarguil 			if (dev_type)
174771fa900SAdrien Mazarguil 				break;
175771fa900SAdrien Mazarguil 			dev_type = 1;
176771fa900SAdrien Mazarguil 			dev_port_prev = ~0u;
177771fa900SAdrien Mazarguil 			rewinddir(dir);
178771fa900SAdrien Mazarguil 			continue;
179771fa900SAdrien Mazarguil 		}
180771fa900SAdrien Mazarguil 		r = fscanf(file, (dev_type ? "%x" : "%u"), &dev_port);
181771fa900SAdrien Mazarguil 		fclose(file);
182771fa900SAdrien Mazarguil 		if (r != 1)
183771fa900SAdrien Mazarguil 			continue;
184771fa900SAdrien Mazarguil 		/*
185771fa900SAdrien Mazarguil 		 * Switch to dev_id when dev_port returns the same value for
186771fa900SAdrien Mazarguil 		 * all ports. May happen when using a MOFED release older than
187771fa900SAdrien Mazarguil 		 * 3.0 with a Linux kernel >= 3.15.
188771fa900SAdrien Mazarguil 		 */
189771fa900SAdrien Mazarguil 		if (dev_port == dev_port_prev)
190771fa900SAdrien Mazarguil 			goto try_dev_id;
191771fa900SAdrien Mazarguil 		dev_port_prev = dev_port;
192771fa900SAdrien Mazarguil 		if (dev_port == (priv->port - 1u))
193771fa900SAdrien Mazarguil 			snprintf(match, sizeof(match), "%s", name);
194771fa900SAdrien Mazarguil 	}
195771fa900SAdrien Mazarguil 	closedir(dir);
196771fa900SAdrien Mazarguil 	if (match[0] == '\0')
197771fa900SAdrien Mazarguil 		return -1;
198771fa900SAdrien Mazarguil 	strncpy(*ifname, match, sizeof(*ifname));
199771fa900SAdrien Mazarguil 	return 0;
200771fa900SAdrien Mazarguil }
201771fa900SAdrien Mazarguil 
202771fa900SAdrien Mazarguil /**
203859081d3SShahaf Shuler  * Check if the counter is located on ib counters file.
204859081d3SShahaf Shuler  *
205859081d3SShahaf Shuler  * @param[in] cntr
206859081d3SShahaf Shuler  *   Counter name.
207859081d3SShahaf Shuler  *
208859081d3SShahaf Shuler  * @return
209859081d3SShahaf Shuler  *   1 if counter is located on ib counters file , 0 otherwise.
210859081d3SShahaf Shuler  */
211859081d3SShahaf Shuler int
212859081d3SShahaf Shuler priv_is_ib_cntr(const char *cntr)
213859081d3SShahaf Shuler {
214859081d3SShahaf Shuler 	if (!strcmp(cntr, "out_of_buffer"))
215859081d3SShahaf Shuler 		return 1;
216859081d3SShahaf Shuler 	return 0;
217859081d3SShahaf Shuler }
218859081d3SShahaf Shuler 
219859081d3SShahaf Shuler /**
220771fa900SAdrien Mazarguil  * Read from sysfs entry.
221771fa900SAdrien Mazarguil  *
222771fa900SAdrien Mazarguil  * @param[in] priv
223771fa900SAdrien Mazarguil  *   Pointer to private structure.
224771fa900SAdrien Mazarguil  * @param[in] entry
225771fa900SAdrien Mazarguil  *   Entry name relative to sysfs path.
226771fa900SAdrien Mazarguil  * @param[out] buf
227771fa900SAdrien Mazarguil  *   Data output buffer.
228771fa900SAdrien Mazarguil  * @param size
229771fa900SAdrien Mazarguil  *   Buffer size.
230771fa900SAdrien Mazarguil  *
231771fa900SAdrien Mazarguil  * @return
232771fa900SAdrien Mazarguil  *   0 on success, -1 on failure and errno is set.
233771fa900SAdrien Mazarguil  */
234771fa900SAdrien Mazarguil static int
235771fa900SAdrien Mazarguil priv_sysfs_read(const struct priv *priv, const char *entry,
236771fa900SAdrien Mazarguil 		char *buf, size_t size)
237771fa900SAdrien Mazarguil {
238771fa900SAdrien Mazarguil 	char ifname[IF_NAMESIZE];
239771fa900SAdrien Mazarguil 	FILE *file;
240771fa900SAdrien Mazarguil 	int ret;
241771fa900SAdrien Mazarguil 	int err;
242771fa900SAdrien Mazarguil 
243771fa900SAdrien Mazarguil 	if (priv_get_ifname(priv, &ifname))
244771fa900SAdrien Mazarguil 		return -1;
245771fa900SAdrien Mazarguil 
246859081d3SShahaf Shuler 	if (priv_is_ib_cntr(entry)) {
247859081d3SShahaf Shuler 		MKSTR(path, "%s/ports/1/hw_counters/%s",
24887ec44ceSXueming Li 		      priv->ibdev_path, entry);
249771fa900SAdrien Mazarguil 		file = fopen(path, "rb");
250859081d3SShahaf Shuler 	} else {
251859081d3SShahaf Shuler 		MKSTR(path, "%s/device/net/%s/%s",
25287ec44ceSXueming Li 		      priv->ibdev_path, ifname, entry);
253859081d3SShahaf Shuler 		file = fopen(path, "rb");
254859081d3SShahaf Shuler 	}
255771fa900SAdrien Mazarguil 	if (file == NULL)
256771fa900SAdrien Mazarguil 		return -1;
257771fa900SAdrien Mazarguil 	ret = fread(buf, 1, size, file);
258771fa900SAdrien Mazarguil 	err = errno;
259771fa900SAdrien Mazarguil 	if (((size_t)ret < size) && (ferror(file)))
260771fa900SAdrien Mazarguil 		ret = -1;
261771fa900SAdrien Mazarguil 	else
262771fa900SAdrien Mazarguil 		ret = size;
263771fa900SAdrien Mazarguil 	fclose(file);
264771fa900SAdrien Mazarguil 	errno = err;
265771fa900SAdrien Mazarguil 	return ret;
266771fa900SAdrien Mazarguil }
267771fa900SAdrien Mazarguil 
268771fa900SAdrien Mazarguil /**
269771fa900SAdrien Mazarguil  * Write to sysfs entry.
270771fa900SAdrien Mazarguil  *
271771fa900SAdrien Mazarguil  * @param[in] priv
272771fa900SAdrien Mazarguil  *   Pointer to private structure.
273771fa900SAdrien Mazarguil  * @param[in] entry
274771fa900SAdrien Mazarguil  *   Entry name relative to sysfs path.
275771fa900SAdrien Mazarguil  * @param[in] buf
276771fa900SAdrien Mazarguil  *   Data buffer.
277771fa900SAdrien Mazarguil  * @param size
278771fa900SAdrien Mazarguil  *   Buffer size.
279771fa900SAdrien Mazarguil  *
280771fa900SAdrien Mazarguil  * @return
281771fa900SAdrien Mazarguil  *   0 on success, -1 on failure and errno is set.
282771fa900SAdrien Mazarguil  */
283771fa900SAdrien Mazarguil static int
284771fa900SAdrien Mazarguil priv_sysfs_write(const struct priv *priv, const char *entry,
285771fa900SAdrien Mazarguil 		 char *buf, size_t size)
286771fa900SAdrien Mazarguil {
287771fa900SAdrien Mazarguil 	char ifname[IF_NAMESIZE];
288771fa900SAdrien Mazarguil 	FILE *file;
289771fa900SAdrien Mazarguil 	int ret;
290771fa900SAdrien Mazarguil 	int err;
291771fa900SAdrien Mazarguil 
292771fa900SAdrien Mazarguil 	if (priv_get_ifname(priv, &ifname))
293771fa900SAdrien Mazarguil 		return -1;
294771fa900SAdrien Mazarguil 
29587ec44ceSXueming Li 	MKSTR(path, "%s/device/net/%s/%s", priv->ibdev_path, ifname, entry);
296771fa900SAdrien Mazarguil 
297771fa900SAdrien Mazarguil 	file = fopen(path, "wb");
298771fa900SAdrien Mazarguil 	if (file == NULL)
299771fa900SAdrien Mazarguil 		return -1;
300771fa900SAdrien Mazarguil 	ret = fwrite(buf, 1, size, file);
301771fa900SAdrien Mazarguil 	err = errno;
302771fa900SAdrien Mazarguil 	if (((size_t)ret < size) || (ferror(file)))
303771fa900SAdrien Mazarguil 		ret = -1;
304771fa900SAdrien Mazarguil 	else
305771fa900SAdrien Mazarguil 		ret = size;
306771fa900SAdrien Mazarguil 	fclose(file);
307771fa900SAdrien Mazarguil 	errno = err;
308771fa900SAdrien Mazarguil 	return ret;
309771fa900SAdrien Mazarguil }
310771fa900SAdrien Mazarguil 
311771fa900SAdrien Mazarguil /**
312771fa900SAdrien Mazarguil  * Get unsigned long sysfs property.
313771fa900SAdrien Mazarguil  *
314771fa900SAdrien Mazarguil  * @param priv
315771fa900SAdrien Mazarguil  *   Pointer to private structure.
316771fa900SAdrien Mazarguil  * @param[in] name
317771fa900SAdrien Mazarguil  *   Entry name relative to sysfs path.
318771fa900SAdrien Mazarguil  * @param[out] value
319771fa900SAdrien Mazarguil  *   Value output buffer.
320771fa900SAdrien Mazarguil  *
321771fa900SAdrien Mazarguil  * @return
322771fa900SAdrien Mazarguil  *   0 on success, -1 on failure and errno is set.
323771fa900SAdrien Mazarguil  */
324771fa900SAdrien Mazarguil static int
325771fa900SAdrien Mazarguil priv_get_sysfs_ulong(struct priv *priv, const char *name, unsigned long *value)
326771fa900SAdrien Mazarguil {
327771fa900SAdrien Mazarguil 	int ret;
328771fa900SAdrien Mazarguil 	unsigned long value_ret;
329771fa900SAdrien Mazarguil 	char value_str[32];
330771fa900SAdrien Mazarguil 
331771fa900SAdrien Mazarguil 	ret = priv_sysfs_read(priv, name, value_str, (sizeof(value_str) - 1));
332771fa900SAdrien Mazarguil 	if (ret == -1) {
333771fa900SAdrien Mazarguil 		DEBUG("cannot read %s value from sysfs: %s",
334771fa900SAdrien Mazarguil 		      name, strerror(errno));
335771fa900SAdrien Mazarguil 		return -1;
336771fa900SAdrien Mazarguil 	}
337771fa900SAdrien Mazarguil 	value_str[ret] = '\0';
338771fa900SAdrien Mazarguil 	errno = 0;
339771fa900SAdrien Mazarguil 	value_ret = strtoul(value_str, NULL, 0);
340771fa900SAdrien Mazarguil 	if (errno) {
341771fa900SAdrien Mazarguil 		DEBUG("invalid %s value `%s': %s", name, value_str,
342771fa900SAdrien Mazarguil 		      strerror(errno));
343771fa900SAdrien Mazarguil 		return -1;
344771fa900SAdrien Mazarguil 	}
345771fa900SAdrien Mazarguil 	*value = value_ret;
346771fa900SAdrien Mazarguil 	return 0;
347771fa900SAdrien Mazarguil }
348771fa900SAdrien Mazarguil 
349771fa900SAdrien Mazarguil /**
350771fa900SAdrien Mazarguil  * Set unsigned long sysfs property.
351771fa900SAdrien Mazarguil  *
352771fa900SAdrien Mazarguil  * @param priv
353771fa900SAdrien Mazarguil  *   Pointer to private structure.
354771fa900SAdrien Mazarguil  * @param[in] name
355771fa900SAdrien Mazarguil  *   Entry name relative to sysfs path.
356771fa900SAdrien Mazarguil  * @param value
357771fa900SAdrien Mazarguil  *   Value to set.
358771fa900SAdrien Mazarguil  *
359771fa900SAdrien Mazarguil  * @return
360771fa900SAdrien Mazarguil  *   0 on success, -1 on failure and errno is set.
361771fa900SAdrien Mazarguil  */
362771fa900SAdrien Mazarguil static int
363771fa900SAdrien Mazarguil priv_set_sysfs_ulong(struct priv *priv, const char *name, unsigned long value)
364771fa900SAdrien Mazarguil {
365771fa900SAdrien Mazarguil 	int ret;
366771fa900SAdrien Mazarguil 	MKSTR(value_str, "%lu", value);
367771fa900SAdrien Mazarguil 
368771fa900SAdrien Mazarguil 	ret = priv_sysfs_write(priv, name, value_str, (sizeof(value_str) - 1));
369771fa900SAdrien Mazarguil 	if (ret == -1) {
370771fa900SAdrien Mazarguil 		DEBUG("cannot write %s `%s' (%lu) to sysfs: %s",
371771fa900SAdrien Mazarguil 		      name, value_str, value, strerror(errno));
372771fa900SAdrien Mazarguil 		return -1;
373771fa900SAdrien Mazarguil 	}
374771fa900SAdrien Mazarguil 	return 0;
375771fa900SAdrien Mazarguil }
376771fa900SAdrien Mazarguil 
377771fa900SAdrien Mazarguil /**
378771fa900SAdrien Mazarguil  * Perform ifreq ioctl() on associated Ethernet device.
379771fa900SAdrien Mazarguil  *
380771fa900SAdrien Mazarguil  * @param[in] priv
381771fa900SAdrien Mazarguil  *   Pointer to private structure.
382771fa900SAdrien Mazarguil  * @param req
383771fa900SAdrien Mazarguil  *   Request number to pass to ioctl().
384771fa900SAdrien Mazarguil  * @param[out] ifr
385771fa900SAdrien Mazarguil  *   Interface request structure output buffer.
386771fa900SAdrien Mazarguil  *
387771fa900SAdrien Mazarguil  * @return
388771fa900SAdrien Mazarguil  *   0 on success, -1 on failure and errno is set.
389771fa900SAdrien Mazarguil  */
390771fa900SAdrien Mazarguil int
391771fa900SAdrien Mazarguil priv_ifreq(const struct priv *priv, int req, struct ifreq *ifr)
392771fa900SAdrien Mazarguil {
393771fa900SAdrien Mazarguil 	int sock = socket(PF_INET, SOCK_DGRAM, IPPROTO_IP);
394771fa900SAdrien Mazarguil 	int ret = -1;
395771fa900SAdrien Mazarguil 
396771fa900SAdrien Mazarguil 	if (sock == -1)
397771fa900SAdrien Mazarguil 		return ret;
398771fa900SAdrien Mazarguil 	if (priv_get_ifname(priv, &ifr->ifr_name) == 0)
399771fa900SAdrien Mazarguil 		ret = ioctl(sock, req, ifr);
400771fa900SAdrien Mazarguil 	close(sock);
401771fa900SAdrien Mazarguil 	return ret;
402771fa900SAdrien Mazarguil }
403771fa900SAdrien Mazarguil 
404771fa900SAdrien Mazarguil /**
40585e347dbSNélio Laranjeiro  * Return the number of active VFs for the current device.
40685e347dbSNélio Laranjeiro  *
40785e347dbSNélio Laranjeiro  * @param[in] priv
40885e347dbSNélio Laranjeiro  *   Pointer to private structure.
40985e347dbSNélio Laranjeiro  * @param[out] num_vfs
41085e347dbSNélio Laranjeiro  *   Number of active VFs.
41185e347dbSNélio Laranjeiro  *
41285e347dbSNélio Laranjeiro  * @return
41385e347dbSNélio Laranjeiro  *   0 on success, -1 on failure and errno is set.
41485e347dbSNélio Laranjeiro  */
41585e347dbSNélio Laranjeiro int
41685e347dbSNélio Laranjeiro priv_get_num_vfs(struct priv *priv, uint16_t *num_vfs)
41785e347dbSNélio Laranjeiro {
41885e347dbSNélio Laranjeiro 	/* The sysfs entry name depends on the operating system. */
41985e347dbSNélio Laranjeiro 	const char **name = (const char *[]){
42085e347dbSNélio Laranjeiro 		"device/sriov_numvfs",
42185e347dbSNélio Laranjeiro 		"device/mlx5_num_vfs",
42285e347dbSNélio Laranjeiro 		NULL,
42385e347dbSNélio Laranjeiro 	};
42485e347dbSNélio Laranjeiro 	int ret;
42585e347dbSNélio Laranjeiro 
42685e347dbSNélio Laranjeiro 	do {
42785e347dbSNélio Laranjeiro 		unsigned long ulong_num_vfs;
42885e347dbSNélio Laranjeiro 
42985e347dbSNélio Laranjeiro 		ret = priv_get_sysfs_ulong(priv, *name, &ulong_num_vfs);
43085e347dbSNélio Laranjeiro 		if (!ret)
43185e347dbSNélio Laranjeiro 			*num_vfs = ulong_num_vfs;
43285e347dbSNélio Laranjeiro 	} while (*(++name) && ret);
43385e347dbSNélio Laranjeiro 	return ret;
43485e347dbSNélio Laranjeiro }
43585e347dbSNélio Laranjeiro 
43685e347dbSNélio Laranjeiro /**
437771fa900SAdrien Mazarguil  * Get device MTU.
438771fa900SAdrien Mazarguil  *
439771fa900SAdrien Mazarguil  * @param priv
440771fa900SAdrien Mazarguil  *   Pointer to private structure.
441771fa900SAdrien Mazarguil  * @param[out] mtu
442771fa900SAdrien Mazarguil  *   MTU value output buffer.
443771fa900SAdrien Mazarguil  *
444771fa900SAdrien Mazarguil  * @return
445771fa900SAdrien Mazarguil  *   0 on success, -1 on failure and errno is set.
446771fa900SAdrien Mazarguil  */
447771fa900SAdrien Mazarguil int
448771fa900SAdrien Mazarguil priv_get_mtu(struct priv *priv, uint16_t *mtu)
449771fa900SAdrien Mazarguil {
450771fa900SAdrien Mazarguil 	unsigned long ulong_mtu;
451771fa900SAdrien Mazarguil 
452771fa900SAdrien Mazarguil 	if (priv_get_sysfs_ulong(priv, "mtu", &ulong_mtu) == -1)
453771fa900SAdrien Mazarguil 		return -1;
454771fa900SAdrien Mazarguil 	*mtu = ulong_mtu;
455771fa900SAdrien Mazarguil 	return 0;
456771fa900SAdrien Mazarguil }
457771fa900SAdrien Mazarguil 
458771fa900SAdrien Mazarguil /**
459859081d3SShahaf Shuler  * Read device counter from sysfs.
460859081d3SShahaf Shuler  *
461859081d3SShahaf Shuler  * @param priv
462859081d3SShahaf Shuler  *   Pointer to private structure.
463859081d3SShahaf Shuler  * @param name
464859081d3SShahaf Shuler  *   Counter name.
465859081d3SShahaf Shuler  * @param[out] cntr
466859081d3SShahaf Shuler  *   Counter output buffer.
467859081d3SShahaf Shuler  *
468859081d3SShahaf Shuler  * @return
469859081d3SShahaf Shuler  *   0 on success, -1 on failure and errno is set.
470859081d3SShahaf Shuler  */
471859081d3SShahaf Shuler int
472859081d3SShahaf Shuler priv_get_cntr_sysfs(struct priv *priv, const char *name, uint64_t *cntr)
473859081d3SShahaf Shuler {
474859081d3SShahaf Shuler 	unsigned long ulong_ctr;
475859081d3SShahaf Shuler 
476859081d3SShahaf Shuler 	if (priv_get_sysfs_ulong(priv, name, &ulong_ctr) == -1)
477859081d3SShahaf Shuler 		return -1;
478859081d3SShahaf Shuler 	*cntr = ulong_ctr;
479859081d3SShahaf Shuler 	return 0;
480859081d3SShahaf Shuler }
481859081d3SShahaf Shuler 
482859081d3SShahaf Shuler /**
483cf37ca95SAdrien Mazarguil  * Set device MTU.
484cf37ca95SAdrien Mazarguil  *
485cf37ca95SAdrien Mazarguil  * @param priv
486cf37ca95SAdrien Mazarguil  *   Pointer to private structure.
487cf37ca95SAdrien Mazarguil  * @param mtu
488cf37ca95SAdrien Mazarguil  *   MTU value to set.
489cf37ca95SAdrien Mazarguil  *
490cf37ca95SAdrien Mazarguil  * @return
491cf37ca95SAdrien Mazarguil  *   0 on success, -1 on failure and errno is set.
492cf37ca95SAdrien Mazarguil  */
493cf37ca95SAdrien Mazarguil static int
494cf37ca95SAdrien Mazarguil priv_set_mtu(struct priv *priv, uint16_t mtu)
495cf37ca95SAdrien Mazarguil {
496f3b492d7SAdrien Mazarguil 	uint16_t new_mtu;
497f3b492d7SAdrien Mazarguil 
498f3b492d7SAdrien Mazarguil 	if (priv_set_sysfs_ulong(priv, "mtu", mtu) ||
499f3b492d7SAdrien Mazarguil 	    priv_get_mtu(priv, &new_mtu))
500f3b492d7SAdrien Mazarguil 		return -1;
501f3b492d7SAdrien Mazarguil 	if (new_mtu == mtu)
502f3b492d7SAdrien Mazarguil 		return 0;
503f3b492d7SAdrien Mazarguil 	errno = EINVAL;
504f3b492d7SAdrien Mazarguil 	return -1;
505cf37ca95SAdrien Mazarguil }
506cf37ca95SAdrien Mazarguil 
507cf37ca95SAdrien Mazarguil /**
508771fa900SAdrien Mazarguil  * Set device flags.
509771fa900SAdrien Mazarguil  *
510771fa900SAdrien Mazarguil  * @param priv
511771fa900SAdrien Mazarguil  *   Pointer to private structure.
512771fa900SAdrien Mazarguil  * @param keep
513771fa900SAdrien Mazarguil  *   Bitmask for flags that must remain untouched.
514771fa900SAdrien Mazarguil  * @param flags
515771fa900SAdrien Mazarguil  *   Bitmask for flags to modify.
516771fa900SAdrien Mazarguil  *
517771fa900SAdrien Mazarguil  * @return
518771fa900SAdrien Mazarguil  *   0 on success, -1 on failure and errno is set.
519771fa900SAdrien Mazarguil  */
520771fa900SAdrien Mazarguil int
521771fa900SAdrien Mazarguil priv_set_flags(struct priv *priv, unsigned int keep, unsigned int flags)
522771fa900SAdrien Mazarguil {
523771fa900SAdrien Mazarguil 	unsigned long tmp;
524771fa900SAdrien Mazarguil 
525771fa900SAdrien Mazarguil 	if (priv_get_sysfs_ulong(priv, "flags", &tmp) == -1)
526771fa900SAdrien Mazarguil 		return -1;
527771fa900SAdrien Mazarguil 	tmp &= keep;
52833242e3eSOlivier Matz 	tmp |= (flags & (~keep));
529771fa900SAdrien Mazarguil 	return priv_set_sysfs_ulong(priv, "flags", tmp);
530771fa900SAdrien Mazarguil }
531771fa900SAdrien Mazarguil 
532771fa900SAdrien Mazarguil /**
533e60fbd5bSAdrien Mazarguil  * Ethernet device configuration.
534e60fbd5bSAdrien Mazarguil  *
535e60fbd5bSAdrien Mazarguil  * Prepare the driver for a given number of TX and RX queues.
536e60fbd5bSAdrien Mazarguil  *
537e60fbd5bSAdrien Mazarguil  * @param dev
538e60fbd5bSAdrien Mazarguil  *   Pointer to Ethernet device structure.
539e60fbd5bSAdrien Mazarguil  *
540e60fbd5bSAdrien Mazarguil  * @return
541e60fbd5bSAdrien Mazarguil  *   0 on success, errno value on failure.
542e60fbd5bSAdrien Mazarguil  */
543e60fbd5bSAdrien Mazarguil static int
544e60fbd5bSAdrien Mazarguil dev_configure(struct rte_eth_dev *dev)
545e60fbd5bSAdrien Mazarguil {
546e60fbd5bSAdrien Mazarguil 	struct priv *priv = dev->data->dev_private;
547e60fbd5bSAdrien Mazarguil 	unsigned int rxqs_n = dev->data->nb_rx_queues;
548e60fbd5bSAdrien Mazarguil 	unsigned int txqs_n = dev->data->nb_tx_queues;
549634efbc2SNelio Laranjeiro 	unsigned int i;
550634efbc2SNelio Laranjeiro 	unsigned int j;
551634efbc2SNelio Laranjeiro 	unsigned int reta_idx_n;
55229c1d8bbSNélio Laranjeiro 	const uint8_t use_app_rss_key =
55321e3a974SShahaf Shuler 		!!dev->data->dev_conf.rx_adv_conf.rss_conf.rss_key;
554dbccb4cdSShahaf Shuler 	uint64_t supp_tx_offloads = mlx5_priv_get_tx_port_offloads(priv);
555dbccb4cdSShahaf Shuler 	uint64_t tx_offloads = dev->data->dev_conf.txmode.offloads;
55617b843ebSShahaf Shuler 	uint64_t supp_rx_offloads =
55717b843ebSShahaf Shuler 		(mlx5_priv_get_rx_port_offloads(priv) |
55817b843ebSShahaf Shuler 		 mlx5_priv_get_rx_queue_offloads(priv));
55917b843ebSShahaf Shuler 	uint64_t rx_offloads = dev->data->dev_conf.rxmode.offloads;
560e60fbd5bSAdrien Mazarguil 
561dbccb4cdSShahaf Shuler 	if ((tx_offloads & supp_tx_offloads) != tx_offloads) {
562dbccb4cdSShahaf Shuler 		ERROR("Some Tx offloads are not supported "
563dbccb4cdSShahaf Shuler 		      "requested 0x%" PRIx64 " supported 0x%" PRIx64,
564dbccb4cdSShahaf Shuler 		      tx_offloads, supp_tx_offloads);
565dbccb4cdSShahaf Shuler 		return ENOTSUP;
566dbccb4cdSShahaf Shuler 	}
56717b843ebSShahaf Shuler 	if ((rx_offloads & supp_rx_offloads) != rx_offloads) {
56817b843ebSShahaf Shuler 		ERROR("Some Rx offloads are not supported "
56917b843ebSShahaf Shuler 		      "requested 0x%" PRIx64 " supported 0x%" PRIx64,
57017b843ebSShahaf Shuler 		      rx_offloads, supp_rx_offloads);
57117b843ebSShahaf Shuler 		return ENOTSUP;
57217b843ebSShahaf Shuler 	}
57329c1d8bbSNélio Laranjeiro 	if (use_app_rss_key &&
57429c1d8bbSNélio Laranjeiro 	    (dev->data->dev_conf.rx_adv_conf.rss_conf.rss_key_len !=
57529c1d8bbSNélio Laranjeiro 	     rss_hash_default_key_len)) {
57629c1d8bbSNélio Laranjeiro 		/* MLX5 RSS only support 40bytes key. */
57729c1d8bbSNélio Laranjeiro 		return EINVAL;
57829c1d8bbSNélio Laranjeiro 	}
57929c1d8bbSNélio Laranjeiro 	priv->rss_conf.rss_key =
58029c1d8bbSNélio Laranjeiro 		rte_realloc(priv->rss_conf.rss_key,
58129c1d8bbSNélio Laranjeiro 			    rss_hash_default_key_len, 0);
58229c1d8bbSNélio Laranjeiro 	if (!priv->rss_conf.rss_key) {
58329c1d8bbSNélio Laranjeiro 		ERROR("cannot allocate RSS hash key memory (%u)", rxqs_n);
58429c1d8bbSNélio Laranjeiro 		return ENOMEM;
58529c1d8bbSNélio Laranjeiro 	}
58629c1d8bbSNélio Laranjeiro 	memcpy(priv->rss_conf.rss_key,
58729c1d8bbSNélio Laranjeiro 	       use_app_rss_key ?
58829c1d8bbSNélio Laranjeiro 	       dev->data->dev_conf.rx_adv_conf.rss_conf.rss_key :
58929c1d8bbSNélio Laranjeiro 	       rss_hash_default_key,
59029c1d8bbSNélio Laranjeiro 	       rss_hash_default_key_len);
59129c1d8bbSNélio Laranjeiro 	priv->rss_conf.rss_key_len = rss_hash_default_key_len;
59229c1d8bbSNélio Laranjeiro 	priv->rss_conf.rss_hf = dev->data->dev_conf.rx_adv_conf.rss_conf.rss_hf;
593e60fbd5bSAdrien Mazarguil 	priv->rxqs = (void *)dev->data->rx_queues;
594e60fbd5bSAdrien Mazarguil 	priv->txqs = (void *)dev->data->tx_queues;
595e60fbd5bSAdrien Mazarguil 	if (txqs_n != priv->txqs_n) {
596e60fbd5bSAdrien Mazarguil 		INFO("%p: TX queues number update: %u -> %u",
597e60fbd5bSAdrien Mazarguil 		     (void *)dev, priv->txqs_n, txqs_n);
598e60fbd5bSAdrien Mazarguil 		priv->txqs_n = txqs_n;
599e60fbd5bSAdrien Mazarguil 	}
6007fe24446SShahaf Shuler 	if (rxqs_n > priv->config.ind_table_max_size) {
601634efbc2SNelio Laranjeiro 		ERROR("cannot handle this many RX queues (%u)", rxqs_n);
602634efbc2SNelio Laranjeiro 		return EINVAL;
603634efbc2SNelio Laranjeiro 	}
604e60fbd5bSAdrien Mazarguil 	if (rxqs_n == priv->rxqs_n)
605e60fbd5bSAdrien Mazarguil 		return 0;
606e60fbd5bSAdrien Mazarguil 	INFO("%p: RX queues number update: %u -> %u",
607e60fbd5bSAdrien Mazarguil 	     (void *)dev, priv->rxqs_n, rxqs_n);
608e60fbd5bSAdrien Mazarguil 	priv->rxqs_n = rxqs_n;
609634efbc2SNelio Laranjeiro 	/* If the requested number of RX queues is not a power of two, use the
610634efbc2SNelio Laranjeiro 	 * maximum indirection table size for better balancing.
611634efbc2SNelio Laranjeiro 	 * The result is always rounded to the next power of two. */
612634efbc2SNelio Laranjeiro 	reta_idx_n = (1 << log2above((rxqs_n & (rxqs_n - 1)) ?
6137fe24446SShahaf Shuler 				     priv->config.ind_table_max_size :
614634efbc2SNelio Laranjeiro 				     rxqs_n));
615634efbc2SNelio Laranjeiro 	if (priv_rss_reta_index_resize(priv, reta_idx_n))
616634efbc2SNelio Laranjeiro 		return ENOMEM;
617634efbc2SNelio Laranjeiro 	/* When the number of RX queues is not a power of two, the remaining
618634efbc2SNelio Laranjeiro 	 * table entries are padded with reused WQs and hashes are not spread
619634efbc2SNelio Laranjeiro 	 * uniformly. */
620634efbc2SNelio Laranjeiro 	for (i = 0, j = 0; (i != reta_idx_n); ++i) {
621634efbc2SNelio Laranjeiro 		(*priv->reta_idx)[i] = j;
622634efbc2SNelio Laranjeiro 		if (++j == rxqs_n)
623634efbc2SNelio Laranjeiro 			j = 0;
624634efbc2SNelio Laranjeiro 	}
625e60fbd5bSAdrien Mazarguil 	return 0;
626e60fbd5bSAdrien Mazarguil }
627e60fbd5bSAdrien Mazarguil 
628e60fbd5bSAdrien Mazarguil /**
629e60fbd5bSAdrien Mazarguil  * DPDK callback for Ethernet device configuration.
630e60fbd5bSAdrien Mazarguil  *
631e60fbd5bSAdrien Mazarguil  * @param dev
632e60fbd5bSAdrien Mazarguil  *   Pointer to Ethernet device structure.
633e60fbd5bSAdrien Mazarguil  *
634e60fbd5bSAdrien Mazarguil  * @return
635e60fbd5bSAdrien Mazarguil  *   0 on success, negative errno value on failure.
636e60fbd5bSAdrien Mazarguil  */
637e60fbd5bSAdrien Mazarguil int
638e60fbd5bSAdrien Mazarguil mlx5_dev_configure(struct rte_eth_dev *dev)
639e60fbd5bSAdrien Mazarguil {
640e60fbd5bSAdrien Mazarguil 	struct priv *priv = dev->data->dev_private;
641e60fbd5bSAdrien Mazarguil 	int ret;
642e60fbd5bSAdrien Mazarguil 
643e60fbd5bSAdrien Mazarguil 	priv_lock(priv);
644e60fbd5bSAdrien Mazarguil 	ret = dev_configure(dev);
645e60fbd5bSAdrien Mazarguil 	assert(ret >= 0);
646e60fbd5bSAdrien Mazarguil 	priv_unlock(priv);
647e60fbd5bSAdrien Mazarguil 	return -ret;
648e60fbd5bSAdrien Mazarguil }
649e60fbd5bSAdrien Mazarguil 
650e60fbd5bSAdrien Mazarguil /**
651e60fbd5bSAdrien Mazarguil  * DPDK callback to get information about the device.
652e60fbd5bSAdrien Mazarguil  *
653e60fbd5bSAdrien Mazarguil  * @param dev
654e60fbd5bSAdrien Mazarguil  *   Pointer to Ethernet device structure.
655e60fbd5bSAdrien Mazarguil  * @param[out] info
656e60fbd5bSAdrien Mazarguil  *   Info structure output buffer.
657e60fbd5bSAdrien Mazarguil  */
658e60fbd5bSAdrien Mazarguil void
659e60fbd5bSAdrien Mazarguil mlx5_dev_infos_get(struct rte_eth_dev *dev, struct rte_eth_dev_info *info)
660e60fbd5bSAdrien Mazarguil {
66101d79216SNélio Laranjeiro 	struct priv *priv = dev->data->dev_private;
6627fe24446SShahaf Shuler 	struct mlx5_dev_config *config = &priv->config;
663e60fbd5bSAdrien Mazarguil 	unsigned int max;
664e60fbd5bSAdrien Mazarguil 	char ifname[IF_NAMESIZE];
665e60fbd5bSAdrien Mazarguil 
666c0802544SFerruh Yigit 	info->pci_dev = RTE_ETH_DEV_TO_PCI(dev);
667ae34410aSJan Blunck 
668e60fbd5bSAdrien Mazarguil 	priv_lock(priv);
669e60fbd5bSAdrien Mazarguil 	/* FIXME: we should ask the device for these values. */
670e60fbd5bSAdrien Mazarguil 	info->min_rx_bufsize = 32;
671e60fbd5bSAdrien Mazarguil 	info->max_rx_pktlen = 65536;
672e60fbd5bSAdrien Mazarguil 	/*
673e60fbd5bSAdrien Mazarguil 	 * Since we need one CQ per QP, the limit is the minimum number
674e60fbd5bSAdrien Mazarguil 	 * between the two values.
675e60fbd5bSAdrien Mazarguil 	 */
67643e9d979SShachar Beiser 	max = RTE_MIN(priv->device_attr.orig_attr.max_cq,
67743e9d979SShachar Beiser 		      priv->device_attr.orig_attr.max_qp);
678e60fbd5bSAdrien Mazarguil 	/* If max >= 65535 then max = 0, max_rx_queues is uint16_t. */
679e60fbd5bSAdrien Mazarguil 	if (max >= 65535)
680e60fbd5bSAdrien Mazarguil 		max = 65535;
681e60fbd5bSAdrien Mazarguil 	info->max_rx_queues = max;
682e60fbd5bSAdrien Mazarguil 	info->max_tx_queues = max;
6830497ddaaSYaacov Hazan 	info->max_mac_addrs = RTE_DIM(priv->mac);
68417b843ebSShahaf Shuler 	info->rx_queue_offload_capa =
68517b843ebSShahaf Shuler 		mlx5_priv_get_rx_queue_offloads(priv);
68617b843ebSShahaf Shuler 	info->rx_offload_capa = (mlx5_priv_get_rx_port_offloads(priv) |
68717b843ebSShahaf Shuler 				 info->rx_queue_offload_capa);
688dbccb4cdSShahaf Shuler 	info->tx_offload_capa = mlx5_priv_get_tx_port_offloads(priv);
689e60fbd5bSAdrien Mazarguil 	if (priv_get_ifname(priv, &ifname) == 0)
690e60fbd5bSAdrien Mazarguil 		info->if_index = if_nametoindex(ifname);
691d365210eSYongseok Koh 	info->reta_size = priv->reta_idx_n ?
6927fe24446SShahaf Shuler 		priv->reta_idx_n : config->ind_table_max_size;
69329c1d8bbSNélio Laranjeiro 	info->hash_key_size = priv->rss_conf.rss_key_len;
69475ef62a9SNélio Laranjeiro 	info->speed_capa = priv->link_speed_capa;
695*b233b027SShahaf Shuler 	info->flow_type_rss_offloads = ~MLX5_RSS_HF_MASK;
696e60fbd5bSAdrien Mazarguil 	priv_unlock(priv);
697e60fbd5bSAdrien Mazarguil }
698e60fbd5bSAdrien Mazarguil 
69978a38edfSJianfeng Tan const uint32_t *
70078a38edfSJianfeng Tan mlx5_dev_supported_ptypes_get(struct rte_eth_dev *dev)
70178a38edfSJianfeng Tan {
70278a38edfSJianfeng Tan 	static const uint32_t ptypes[] = {
70378a38edfSJianfeng Tan 		/* refers to rxq_cq_to_pkt_type() */
704ea16068cSYongseok Koh 		RTE_PTYPE_L2_ETHER,
705c4ba5434SNélio Laranjeiro 		RTE_PTYPE_L3_IPV4_EXT_UNKNOWN,
706c4ba5434SNélio Laranjeiro 		RTE_PTYPE_L3_IPV6_EXT_UNKNOWN,
707ea16068cSYongseok Koh 		RTE_PTYPE_L4_NONFRAG,
708ea16068cSYongseok Koh 		RTE_PTYPE_L4_FRAG,
709ea16068cSYongseok Koh 		RTE_PTYPE_L4_TCP,
710ea16068cSYongseok Koh 		RTE_PTYPE_L4_UDP,
711c4ba5434SNélio Laranjeiro 		RTE_PTYPE_INNER_L3_IPV4_EXT_UNKNOWN,
712c4ba5434SNélio Laranjeiro 		RTE_PTYPE_INNER_L3_IPV6_EXT_UNKNOWN,
713ea16068cSYongseok Koh 		RTE_PTYPE_INNER_L4_NONFRAG,
714ea16068cSYongseok Koh 		RTE_PTYPE_INNER_L4_FRAG,
715ea16068cSYongseok Koh 		RTE_PTYPE_INNER_L4_TCP,
716ea16068cSYongseok Koh 		RTE_PTYPE_INNER_L4_UDP,
71778a38edfSJianfeng Tan 		RTE_PTYPE_UNKNOWN
71878a38edfSJianfeng Tan 	};
71978a38edfSJianfeng Tan 
7206cb559d6SYongseok Koh 	if (dev->rx_pkt_burst == mlx5_rx_burst ||
7216cb559d6SYongseok Koh 	    dev->rx_pkt_burst == mlx5_rx_burst_vec)
72278a38edfSJianfeng Tan 		return ptypes;
72378a38edfSJianfeng Tan 	return NULL;
72478a38edfSJianfeng Tan }
72578a38edfSJianfeng Tan 
726e60fbd5bSAdrien Mazarguil /**
7272c960a51SMatthieu Ternisien d'Ouville  * DPDK callback to retrieve physical link information.
728cb8faed7SAdrien Mazarguil  *
729cb8faed7SAdrien Mazarguil  * @param dev
730cb8faed7SAdrien Mazarguil  *   Pointer to Ethernet device structure.
731cb8faed7SAdrien Mazarguil  * @param wait_to_complete
732cb8faed7SAdrien Mazarguil  *   Wait for request completion (ignored).
733cb8faed7SAdrien Mazarguil  */
73418840871SNélio Laranjeiro static int
73518840871SNélio Laranjeiro mlx5_link_update_unlocked_gset(struct rte_eth_dev *dev, int wait_to_complete)
736cb8faed7SAdrien Mazarguil {
73701d79216SNélio Laranjeiro 	struct priv *priv = dev->data->dev_private;
738cb8faed7SAdrien Mazarguil 	struct ethtool_cmd edata = {
73975ef62a9SNélio Laranjeiro 		.cmd = ETHTOOL_GSET /* Deprecated since Linux v4.5. */
740cb8faed7SAdrien Mazarguil 	};
741cb8faed7SAdrien Mazarguil 	struct ifreq ifr;
742cb8faed7SAdrien Mazarguil 	struct rte_eth_link dev_link;
743cb8faed7SAdrien Mazarguil 	int link_speed = 0;
744cb8faed7SAdrien Mazarguil 
7452c960a51SMatthieu Ternisien d'Ouville 	/* priv_lock() is not taken to allow concurrent calls. */
7462c960a51SMatthieu Ternisien d'Ouville 
747cb8faed7SAdrien Mazarguil 	(void)wait_to_complete;
748cb8faed7SAdrien Mazarguil 	if (priv_ifreq(priv, SIOCGIFFLAGS, &ifr)) {
749cb8faed7SAdrien Mazarguil 		WARN("ioctl(SIOCGIFFLAGS) failed: %s", strerror(errno));
750cb8faed7SAdrien Mazarguil 		return -1;
751cb8faed7SAdrien Mazarguil 	}
752cb8faed7SAdrien Mazarguil 	memset(&dev_link, 0, sizeof(dev_link));
753cb8faed7SAdrien Mazarguil 	dev_link.link_status = ((ifr.ifr_flags & IFF_UP) &&
754cb8faed7SAdrien Mazarguil 				(ifr.ifr_flags & IFF_RUNNING));
755d06c608cSAdrien Mazarguil 	ifr.ifr_data = (void *)&edata;
756cb8faed7SAdrien Mazarguil 	if (priv_ifreq(priv, SIOCETHTOOL, &ifr)) {
757cb8faed7SAdrien Mazarguil 		WARN("ioctl(SIOCETHTOOL, ETHTOOL_GSET) failed: %s",
758cb8faed7SAdrien Mazarguil 		     strerror(errno));
759cb8faed7SAdrien Mazarguil 		return -1;
760cb8faed7SAdrien Mazarguil 	}
761cb8faed7SAdrien Mazarguil 	link_speed = ethtool_cmd_speed(&edata);
762cb8faed7SAdrien Mazarguil 	if (link_speed == -1)
763cb8faed7SAdrien Mazarguil 		dev_link.link_speed = 0;
764cb8faed7SAdrien Mazarguil 	else
765cb8faed7SAdrien Mazarguil 		dev_link.link_speed = link_speed;
76675ef62a9SNélio Laranjeiro 	priv->link_speed_capa = 0;
76775ef62a9SNélio Laranjeiro 	if (edata.supported & SUPPORTED_Autoneg)
76875ef62a9SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_AUTONEG;
76975ef62a9SNélio Laranjeiro 	if (edata.supported & (SUPPORTED_1000baseT_Full |
77075ef62a9SNélio Laranjeiro 			       SUPPORTED_1000baseKX_Full))
77175ef62a9SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_1G;
77275ef62a9SNélio Laranjeiro 	if (edata.supported & SUPPORTED_10000baseKR_Full)
77375ef62a9SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_10G;
77475ef62a9SNélio Laranjeiro 	if (edata.supported & (SUPPORTED_40000baseKR4_Full |
77575ef62a9SNélio Laranjeiro 			       SUPPORTED_40000baseCR4_Full |
77675ef62a9SNélio Laranjeiro 			       SUPPORTED_40000baseSR4_Full |
77775ef62a9SNélio Laranjeiro 			       SUPPORTED_40000baseLR4_Full))
77875ef62a9SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_40G;
779cb8faed7SAdrien Mazarguil 	dev_link.link_duplex = ((edata.duplex == DUPLEX_HALF) ?
780cb8faed7SAdrien Mazarguil 				ETH_LINK_HALF_DUPLEX : ETH_LINK_FULL_DUPLEX);
78182113036SMarc Sune 	dev_link.link_autoneg = !(dev->data->dev_conf.link_speeds &
78282113036SMarc Sune 			ETH_LINK_SPEED_FIXED);
783cb8faed7SAdrien Mazarguil 	if (memcmp(&dev_link, &dev->data->dev_link, sizeof(dev_link))) {
784cb8faed7SAdrien Mazarguil 		/* Link status changed. */
785cb8faed7SAdrien Mazarguil 		dev->data->dev_link = dev_link;
786cb8faed7SAdrien Mazarguil 		return 0;
787cb8faed7SAdrien Mazarguil 	}
788cb8faed7SAdrien Mazarguil 	/* Link status is still the same. */
789cb8faed7SAdrien Mazarguil 	return -1;
790cb8faed7SAdrien Mazarguil }
791cb8faed7SAdrien Mazarguil 
792cb8faed7SAdrien Mazarguil /**
7933a49ffe3SShahaf Shuler  * Retrieve physical link information (unlocked version using new ioctl).
79418840871SNélio Laranjeiro  *
79518840871SNélio Laranjeiro  * @param dev
79618840871SNélio Laranjeiro  *   Pointer to Ethernet device structure.
79718840871SNélio Laranjeiro  * @param wait_to_complete
79818840871SNélio Laranjeiro  *   Wait for request completion (ignored).
79918840871SNélio Laranjeiro  */
80018840871SNélio Laranjeiro static int
80118840871SNélio Laranjeiro mlx5_link_update_unlocked_gs(struct rte_eth_dev *dev, int wait_to_complete)
80218840871SNélio Laranjeiro {
80301d79216SNélio Laranjeiro 	struct priv *priv = dev->data->dev_private;
80437a4406cSNélio Laranjeiro 	struct ethtool_link_settings gcmd = { .cmd = ETHTOOL_GLINKSETTINGS };
80518840871SNélio Laranjeiro 	struct ifreq ifr;
80618840871SNélio Laranjeiro 	struct rte_eth_link dev_link;
80718840871SNélio Laranjeiro 	uint64_t sc;
80818840871SNélio Laranjeiro 
80918840871SNélio Laranjeiro 	(void)wait_to_complete;
81018840871SNélio Laranjeiro 	if (priv_ifreq(priv, SIOCGIFFLAGS, &ifr)) {
81118840871SNélio Laranjeiro 		WARN("ioctl(SIOCGIFFLAGS) failed: %s", strerror(errno));
81218840871SNélio Laranjeiro 		return -1;
81318840871SNélio Laranjeiro 	}
81418840871SNélio Laranjeiro 	memset(&dev_link, 0, sizeof(dev_link));
81518840871SNélio Laranjeiro 	dev_link.link_status = ((ifr.ifr_flags & IFF_UP) &&
81618840871SNélio Laranjeiro 				(ifr.ifr_flags & IFF_RUNNING));
81737a4406cSNélio Laranjeiro 	ifr.ifr_data = (void *)&gcmd;
81818840871SNélio Laranjeiro 	if (priv_ifreq(priv, SIOCETHTOOL, &ifr)) {
81918840871SNélio Laranjeiro 		DEBUG("ioctl(SIOCETHTOOL, ETHTOOL_GLINKSETTINGS) failed: %s",
82018840871SNélio Laranjeiro 		      strerror(errno));
82118840871SNélio Laranjeiro 		return -1;
82218840871SNélio Laranjeiro 	}
82337a4406cSNélio Laranjeiro 	gcmd.link_mode_masks_nwords = -gcmd.link_mode_masks_nwords;
82437a4406cSNélio Laranjeiro 
82537a4406cSNélio Laranjeiro 	alignas(struct ethtool_link_settings)
82637a4406cSNélio Laranjeiro 	uint8_t data[offsetof(struct ethtool_link_settings, link_mode_masks) +
82737a4406cSNélio Laranjeiro 		     sizeof(uint32_t) * gcmd.link_mode_masks_nwords * 3];
82837a4406cSNélio Laranjeiro 	struct ethtool_link_settings *ecmd = (void *)data;
82937a4406cSNélio Laranjeiro 
83037a4406cSNélio Laranjeiro 	*ecmd = gcmd;
83137a4406cSNélio Laranjeiro 	ifr.ifr_data = (void *)ecmd;
832ef09a7fcSGowrishankar Muthukrishnan 	if (priv_ifreq(priv, SIOCETHTOOL, &ifr)) {
833ef09a7fcSGowrishankar Muthukrishnan 		DEBUG("ioctl(SIOCETHTOOL, ETHTOOL_GLINKSETTINGS) failed: %s",
834ef09a7fcSGowrishankar Muthukrishnan 		      strerror(errno));
835ef09a7fcSGowrishankar Muthukrishnan 		return -1;
836ef09a7fcSGowrishankar Muthukrishnan 	}
83790260d57SNélio Laranjeiro 	dev_link.link_speed = ecmd->speed;
83890260d57SNélio Laranjeiro 	sc = ecmd->link_mode_masks[0] |
83990260d57SNélio Laranjeiro 		((uint64_t)ecmd->link_mode_masks[1] << 32);
84018840871SNélio Laranjeiro 	priv->link_speed_capa = 0;
841b113cb5eSEdward Makarov 	if (sc & MLX5_BITSHIFT(ETHTOOL_LINK_MODE_Autoneg_BIT))
84218840871SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_AUTONEG;
843b113cb5eSEdward Makarov 	if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_1000baseT_Full_BIT) |
844b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_1000baseKX_Full_BIT)))
84518840871SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_1G;
846b113cb5eSEdward Makarov 	if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_10000baseKX4_Full_BIT) |
847b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_10000baseKR_Full_BIT) |
848b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_10000baseR_FEC_BIT)))
84918840871SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_10G;
850b113cb5eSEdward Makarov 	if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_20000baseMLD2_Full_BIT) |
851b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_20000baseKR2_Full_BIT)))
85218840871SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_20G;
853b113cb5eSEdward Makarov 	if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_40000baseKR4_Full_BIT) |
854b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_40000baseCR4_Full_BIT) |
855b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_40000baseSR4_Full_BIT) |
856b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_40000baseLR4_Full_BIT)))
85718840871SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_40G;
858b113cb5eSEdward Makarov 	if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_56000baseKR4_Full_BIT) |
859b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_56000baseCR4_Full_BIT) |
860b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_56000baseSR4_Full_BIT) |
861b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_56000baseLR4_Full_BIT)))
86218840871SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_56G;
863b113cb5eSEdward Makarov 	if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_25000baseCR_Full_BIT) |
864b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_25000baseKR_Full_BIT) |
865b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_25000baseSR_Full_BIT)))
86618840871SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_25G;
867b113cb5eSEdward Makarov 	if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_50000baseCR2_Full_BIT) |
868b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_50000baseKR2_Full_BIT)))
86918840871SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_50G;
870b113cb5eSEdward Makarov 	if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_100000baseKR4_Full_BIT) |
871b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_100000baseSR4_Full_BIT) |
872b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_100000baseCR4_Full_BIT) |
873b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_100000baseLR4_ER4_Full_BIT)))
87418840871SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_100G;
87590260d57SNélio Laranjeiro 	dev_link.link_duplex = ((ecmd->duplex == DUPLEX_HALF) ?
87618840871SNélio Laranjeiro 				ETH_LINK_HALF_DUPLEX : ETH_LINK_FULL_DUPLEX);
87718840871SNélio Laranjeiro 	dev_link.link_autoneg = !(dev->data->dev_conf.link_speeds &
87818840871SNélio Laranjeiro 				  ETH_LINK_SPEED_FIXED);
87918840871SNélio Laranjeiro 	if (memcmp(&dev_link, &dev->data->dev_link, sizeof(dev_link))) {
88018840871SNélio Laranjeiro 		/* Link status changed. */
88118840871SNélio Laranjeiro 		dev->data->dev_link = dev_link;
88218840871SNélio Laranjeiro 		return 0;
88318840871SNélio Laranjeiro 	}
88418840871SNélio Laranjeiro 	/* Link status is still the same. */
88518840871SNélio Laranjeiro 	return -1;
88618840871SNélio Laranjeiro }
88718840871SNélio Laranjeiro 
88818840871SNélio Laranjeiro /**
889c7bf6225SYongseok Koh  * Enable receiving and transmitting traffic.
890c7bf6225SYongseok Koh  *
891c7bf6225SYongseok Koh  * @param priv
892c7bf6225SYongseok Koh  *   Pointer to private structure.
893c7bf6225SYongseok Koh  */
894c7bf6225SYongseok Koh static void
895c7bf6225SYongseok Koh priv_link_start(struct priv *priv)
896c7bf6225SYongseok Koh {
897c7bf6225SYongseok Koh 	struct rte_eth_dev *dev = priv->dev;
898c7bf6225SYongseok Koh 	int err;
899c7bf6225SYongseok Koh 
900c7bf6225SYongseok Koh 	dev->tx_pkt_burst = priv_select_tx_function(priv, dev);
901c7bf6225SYongseok Koh 	dev->rx_pkt_burst = priv_select_rx_function(priv, dev);
902c7bf6225SYongseok Koh 	err = priv_dev_traffic_enable(priv, dev);
903c7bf6225SYongseok Koh 	if (err)
904c7bf6225SYongseok Koh 		ERROR("%p: error occurred while configuring control flows: %s",
905c7bf6225SYongseok Koh 		      (void *)priv, strerror(err));
906c7bf6225SYongseok Koh 	err = priv_flow_start(priv, &priv->flows);
907c7bf6225SYongseok Koh 	if (err)
908c7bf6225SYongseok Koh 		ERROR("%p: error occurred while configuring flows: %s",
909c7bf6225SYongseok Koh 		      (void *)priv, strerror(err));
910c7bf6225SYongseok Koh }
911c7bf6225SYongseok Koh 
912c7bf6225SYongseok Koh /**
913c7bf6225SYongseok Koh  * Disable receiving and transmitting traffic.
914c7bf6225SYongseok Koh  *
915c7bf6225SYongseok Koh  * @param priv
916c7bf6225SYongseok Koh  *   Pointer to private structure.
917c7bf6225SYongseok Koh  */
918c7bf6225SYongseok Koh static void
919c7bf6225SYongseok Koh priv_link_stop(struct priv *priv)
920c7bf6225SYongseok Koh {
921c7bf6225SYongseok Koh 	struct rte_eth_dev *dev = priv->dev;
922c7bf6225SYongseok Koh 
923c7bf6225SYongseok Koh 	priv_flow_stop(priv, &priv->flows);
924c7bf6225SYongseok Koh 	priv_dev_traffic_disable(priv, dev);
925c7bf6225SYongseok Koh 	dev->rx_pkt_burst = removed_rx_burst;
926c7bf6225SYongseok Koh 	dev->tx_pkt_burst = removed_tx_burst;
927c7bf6225SYongseok Koh }
928c7bf6225SYongseok Koh 
929c7bf6225SYongseok Koh /**
930c7bf6225SYongseok Koh  * Retrieve physical link information and update rx/tx_pkt_burst callbacks
931c7bf6225SYongseok Koh  * accordingly.
932c7bf6225SYongseok Koh  *
933c7bf6225SYongseok Koh  * @param priv
934c7bf6225SYongseok Koh  *   Pointer to private structure.
935c7bf6225SYongseok Koh  * @param wait_to_complete
936c7bf6225SYongseok Koh  *   Wait for request completion (ignored).
937c7bf6225SYongseok Koh  */
938c7bf6225SYongseok Koh int
939c7bf6225SYongseok Koh priv_link_update(struct priv *priv, int wait_to_complete)
940c7bf6225SYongseok Koh {
941c7bf6225SYongseok Koh 	struct rte_eth_dev *dev = priv->dev;
942c7bf6225SYongseok Koh 	struct utsname utsname;
943c7bf6225SYongseok Koh 	int ver[3];
944c7bf6225SYongseok Koh 	int ret;
945c7bf6225SYongseok Koh 	struct rte_eth_link dev_link = dev->data->dev_link;
946c7bf6225SYongseok Koh 
947c7bf6225SYongseok Koh 	if (uname(&utsname) == -1 ||
948c7bf6225SYongseok Koh 	    sscanf(utsname.release, "%d.%d.%d",
949c7bf6225SYongseok Koh 		   &ver[0], &ver[1], &ver[2]) != 3 ||
950c7bf6225SYongseok Koh 	    KERNEL_VERSION(ver[0], ver[1], ver[2]) < KERNEL_VERSION(4, 9, 0))
951c7bf6225SYongseok Koh 		ret = mlx5_link_update_unlocked_gset(dev, wait_to_complete);
952c7bf6225SYongseok Koh 	else
953c7bf6225SYongseok Koh 		ret = mlx5_link_update_unlocked_gs(dev, wait_to_complete);
954c7bf6225SYongseok Koh 	/* If lsc interrupt is disabled, should always be ready for traffic. */
955c7bf6225SYongseok Koh 	if (!dev->data->dev_conf.intr_conf.lsc) {
956c7bf6225SYongseok Koh 		priv_link_start(priv);
957c7bf6225SYongseok Koh 		return ret;
958c7bf6225SYongseok Koh 	}
959c7bf6225SYongseok Koh 	/* Re-select burst callbacks only if link status has been changed. */
960c7bf6225SYongseok Koh 	if (!ret && dev_link.link_status != dev->data->dev_link.link_status) {
961c7bf6225SYongseok Koh 		if (dev->data->dev_link.link_status == ETH_LINK_UP)
962c7bf6225SYongseok Koh 			priv_link_start(priv);
963c7bf6225SYongseok Koh 		else
964c7bf6225SYongseok Koh 			priv_link_stop(priv);
965c7bf6225SYongseok Koh 	}
966c7bf6225SYongseok Koh 	return ret;
967c7bf6225SYongseok Koh }
968c7bf6225SYongseok Koh 
969c7bf6225SYongseok Koh /**
970cb8faed7SAdrien Mazarguil  * DPDK callback to retrieve physical link information.
971cb8faed7SAdrien Mazarguil  *
972cb8faed7SAdrien Mazarguil  * @param dev
973cb8faed7SAdrien Mazarguil  *   Pointer to Ethernet device structure.
974cb8faed7SAdrien Mazarguil  * @param wait_to_complete
975cb8faed7SAdrien Mazarguil  *   Wait for request completion (ignored).
976cb8faed7SAdrien Mazarguil  */
977cb8faed7SAdrien Mazarguil int
978cb8faed7SAdrien Mazarguil mlx5_link_update(struct rte_eth_dev *dev, int wait_to_complete)
979cb8faed7SAdrien Mazarguil {
980c7bf6225SYongseok Koh 	struct priv *priv = dev->data->dev_private;
981c7bf6225SYongseok Koh 	int ret;
982cb8faed7SAdrien Mazarguil 
983c7bf6225SYongseok Koh 	priv_lock(priv);
984c7bf6225SYongseok Koh 	ret = priv_link_update(priv, wait_to_complete);
985c7bf6225SYongseok Koh 	priv_unlock(priv);
986c7bf6225SYongseok Koh 	return ret;
987cb8faed7SAdrien Mazarguil }
988cb8faed7SAdrien Mazarguil 
989cb8faed7SAdrien Mazarguil /**
990cf37ca95SAdrien Mazarguil  * DPDK callback to change the MTU.
991cf37ca95SAdrien Mazarguil  *
992cf37ca95SAdrien Mazarguil  * @param dev
993cf37ca95SAdrien Mazarguil  *   Pointer to Ethernet device structure.
994cf37ca95SAdrien Mazarguil  * @param in_mtu
995cf37ca95SAdrien Mazarguil  *   New MTU.
996cf37ca95SAdrien Mazarguil  *
997cf37ca95SAdrien Mazarguil  * @return
998cf37ca95SAdrien Mazarguil  *   0 on success, negative errno value on failure.
999cf37ca95SAdrien Mazarguil  */
1000cf37ca95SAdrien Mazarguil int
1001cf37ca95SAdrien Mazarguil mlx5_dev_set_mtu(struct rte_eth_dev *dev, uint16_t mtu)
1002cf37ca95SAdrien Mazarguil {
1003cf37ca95SAdrien Mazarguil 	struct priv *priv = dev->data->dev_private;
1004a0edafe4SNelio Laranjeiro 	uint16_t kern_mtu;
1005cf37ca95SAdrien Mazarguil 	int ret = 0;
1006cf37ca95SAdrien Mazarguil 
1007cf37ca95SAdrien Mazarguil 	priv_lock(priv);
1008a0edafe4SNelio Laranjeiro 	ret = priv_get_mtu(priv, &kern_mtu);
1009a0edafe4SNelio Laranjeiro 	if (ret)
1010a0edafe4SNelio Laranjeiro 		goto out;
1011cf37ca95SAdrien Mazarguil 	/* Set kernel interface MTU first. */
1012a0edafe4SNelio Laranjeiro 	ret = priv_set_mtu(priv, mtu);
1013a0edafe4SNelio Laranjeiro 	if (ret)
1014a0edafe4SNelio Laranjeiro 		goto out;
1015a0edafe4SNelio Laranjeiro 	ret = priv_get_mtu(priv, &kern_mtu);
1016a0edafe4SNelio Laranjeiro 	if (ret)
1017a0edafe4SNelio Laranjeiro 		goto out;
1018a0edafe4SNelio Laranjeiro 	if (kern_mtu == mtu) {
1019a0edafe4SNelio Laranjeiro 		priv->mtu = mtu;
1020a0edafe4SNelio Laranjeiro 		DEBUG("adapter port %u MTU set to %u", priv->port, mtu);
1021a0edafe4SNelio Laranjeiro 	}
1022a0edafe4SNelio Laranjeiro 	priv_unlock(priv);
1023a0edafe4SNelio Laranjeiro 	return 0;
1024a0edafe4SNelio Laranjeiro out:
1025cf37ca95SAdrien Mazarguil 	ret = errno;
1026cf37ca95SAdrien Mazarguil 	WARN("cannot set port %u MTU to %u: %s", priv->port, mtu,
1027cf37ca95SAdrien Mazarguil 	     strerror(ret));
1028cf37ca95SAdrien Mazarguil 	priv_unlock(priv);
1029cf37ca95SAdrien Mazarguil 	assert(ret >= 0);
1030cf37ca95SAdrien Mazarguil 	return -ret;
1031cf37ca95SAdrien Mazarguil }
1032cf37ca95SAdrien Mazarguil 
1033cf37ca95SAdrien Mazarguil /**
103402d75430SAdrien Mazarguil  * DPDK callback to get flow control status.
103502d75430SAdrien Mazarguil  *
103602d75430SAdrien Mazarguil  * @param dev
103702d75430SAdrien Mazarguil  *   Pointer to Ethernet device structure.
103802d75430SAdrien Mazarguil  * @param[out] fc_conf
103902d75430SAdrien Mazarguil  *   Flow control output buffer.
104002d75430SAdrien Mazarguil  *
104102d75430SAdrien Mazarguil  * @return
104202d75430SAdrien Mazarguil  *   0 on success, negative errno value on failure.
104302d75430SAdrien Mazarguil  */
104402d75430SAdrien Mazarguil int
104502d75430SAdrien Mazarguil mlx5_dev_get_flow_ctrl(struct rte_eth_dev *dev, struct rte_eth_fc_conf *fc_conf)
104602d75430SAdrien Mazarguil {
104702d75430SAdrien Mazarguil 	struct priv *priv = dev->data->dev_private;
104802d75430SAdrien Mazarguil 	struct ifreq ifr;
104902d75430SAdrien Mazarguil 	struct ethtool_pauseparam ethpause = {
105002d75430SAdrien Mazarguil 		.cmd = ETHTOOL_GPAUSEPARAM
105102d75430SAdrien Mazarguil 	};
105202d75430SAdrien Mazarguil 	int ret;
105302d75430SAdrien Mazarguil 
1054d06c608cSAdrien Mazarguil 	ifr.ifr_data = (void *)&ethpause;
105502d75430SAdrien Mazarguil 	priv_lock(priv);
105602d75430SAdrien Mazarguil 	if (priv_ifreq(priv, SIOCETHTOOL, &ifr)) {
105702d75430SAdrien Mazarguil 		ret = errno;
105802d75430SAdrien Mazarguil 		WARN("ioctl(SIOCETHTOOL, ETHTOOL_GPAUSEPARAM)"
105902d75430SAdrien Mazarguil 		     " failed: %s",
106002d75430SAdrien Mazarguil 		     strerror(ret));
106102d75430SAdrien Mazarguil 		goto out;
106202d75430SAdrien Mazarguil 	}
106302d75430SAdrien Mazarguil 
106402d75430SAdrien Mazarguil 	fc_conf->autoneg = ethpause.autoneg;
106502d75430SAdrien Mazarguil 	if (ethpause.rx_pause && ethpause.tx_pause)
106602d75430SAdrien Mazarguil 		fc_conf->mode = RTE_FC_FULL;
106702d75430SAdrien Mazarguil 	else if (ethpause.rx_pause)
106802d75430SAdrien Mazarguil 		fc_conf->mode = RTE_FC_RX_PAUSE;
106902d75430SAdrien Mazarguil 	else if (ethpause.tx_pause)
107002d75430SAdrien Mazarguil 		fc_conf->mode = RTE_FC_TX_PAUSE;
107102d75430SAdrien Mazarguil 	else
107202d75430SAdrien Mazarguil 		fc_conf->mode = RTE_FC_NONE;
107302d75430SAdrien Mazarguil 	ret = 0;
107402d75430SAdrien Mazarguil 
107502d75430SAdrien Mazarguil out:
107602d75430SAdrien Mazarguil 	priv_unlock(priv);
107702d75430SAdrien Mazarguil 	assert(ret >= 0);
107802d75430SAdrien Mazarguil 	return -ret;
107902d75430SAdrien Mazarguil }
108002d75430SAdrien Mazarguil 
108102d75430SAdrien Mazarguil /**
108202d75430SAdrien Mazarguil  * DPDK callback to modify flow control parameters.
108302d75430SAdrien Mazarguil  *
108402d75430SAdrien Mazarguil  * @param dev
108502d75430SAdrien Mazarguil  *   Pointer to Ethernet device structure.
108602d75430SAdrien Mazarguil  * @param[in] fc_conf
108702d75430SAdrien Mazarguil  *   Flow control parameters.
108802d75430SAdrien Mazarguil  *
108902d75430SAdrien Mazarguil  * @return
109002d75430SAdrien Mazarguil  *   0 on success, negative errno value on failure.
109102d75430SAdrien Mazarguil  */
109202d75430SAdrien Mazarguil int
109302d75430SAdrien Mazarguil mlx5_dev_set_flow_ctrl(struct rte_eth_dev *dev, struct rte_eth_fc_conf *fc_conf)
109402d75430SAdrien Mazarguil {
109502d75430SAdrien Mazarguil 	struct priv *priv = dev->data->dev_private;
109602d75430SAdrien Mazarguil 	struct ifreq ifr;
109702d75430SAdrien Mazarguil 	struct ethtool_pauseparam ethpause = {
109802d75430SAdrien Mazarguil 		.cmd = ETHTOOL_SPAUSEPARAM
109902d75430SAdrien Mazarguil 	};
110002d75430SAdrien Mazarguil 	int ret;
110102d75430SAdrien Mazarguil 
1102d06c608cSAdrien Mazarguil 	ifr.ifr_data = (void *)&ethpause;
110302d75430SAdrien Mazarguil 	ethpause.autoneg = fc_conf->autoneg;
110402d75430SAdrien Mazarguil 	if (((fc_conf->mode & RTE_FC_FULL) == RTE_FC_FULL) ||
110502d75430SAdrien Mazarguil 	    (fc_conf->mode & RTE_FC_RX_PAUSE))
110602d75430SAdrien Mazarguil 		ethpause.rx_pause = 1;
110702d75430SAdrien Mazarguil 	else
110802d75430SAdrien Mazarguil 		ethpause.rx_pause = 0;
110902d75430SAdrien Mazarguil 
111002d75430SAdrien Mazarguil 	if (((fc_conf->mode & RTE_FC_FULL) == RTE_FC_FULL) ||
111102d75430SAdrien Mazarguil 	    (fc_conf->mode & RTE_FC_TX_PAUSE))
111202d75430SAdrien Mazarguil 		ethpause.tx_pause = 1;
111302d75430SAdrien Mazarguil 	else
111402d75430SAdrien Mazarguil 		ethpause.tx_pause = 0;
111502d75430SAdrien Mazarguil 
111602d75430SAdrien Mazarguil 	priv_lock(priv);
111702d75430SAdrien Mazarguil 	if (priv_ifreq(priv, SIOCETHTOOL, &ifr)) {
111802d75430SAdrien Mazarguil 		ret = errno;
111902d75430SAdrien Mazarguil 		WARN("ioctl(SIOCETHTOOL, ETHTOOL_SPAUSEPARAM)"
112002d75430SAdrien Mazarguil 		     " failed: %s",
112102d75430SAdrien Mazarguil 		     strerror(ret));
112202d75430SAdrien Mazarguil 		goto out;
112302d75430SAdrien Mazarguil 	}
112402d75430SAdrien Mazarguil 	ret = 0;
112502d75430SAdrien Mazarguil 
112602d75430SAdrien Mazarguil out:
112702d75430SAdrien Mazarguil 	priv_unlock(priv);
112802d75430SAdrien Mazarguil 	assert(ret >= 0);
112902d75430SAdrien Mazarguil 	return -ret;
113002d75430SAdrien Mazarguil }
113102d75430SAdrien Mazarguil 
113202d75430SAdrien Mazarguil /**
1133771fa900SAdrien Mazarguil  * Get PCI information from struct ibv_device.
1134771fa900SAdrien Mazarguil  *
1135771fa900SAdrien Mazarguil  * @param device
1136771fa900SAdrien Mazarguil  *   Pointer to Ethernet device structure.
1137771fa900SAdrien Mazarguil  * @param[out] pci_addr
1138771fa900SAdrien Mazarguil  *   PCI bus address output buffer.
1139771fa900SAdrien Mazarguil  *
1140771fa900SAdrien Mazarguil  * @return
1141771fa900SAdrien Mazarguil  *   0 on success, -1 on failure and errno is set.
1142771fa900SAdrien Mazarguil  */
1143771fa900SAdrien Mazarguil int
1144771fa900SAdrien Mazarguil mlx5_ibv_device_to_pci_addr(const struct ibv_device *device,
1145771fa900SAdrien Mazarguil 			    struct rte_pci_addr *pci_addr)
1146771fa900SAdrien Mazarguil {
1147771fa900SAdrien Mazarguil 	FILE *file;
1148771fa900SAdrien Mazarguil 	char line[32];
1149771fa900SAdrien Mazarguil 	MKSTR(path, "%s/device/uevent", device->ibdev_path);
1150771fa900SAdrien Mazarguil 
1151771fa900SAdrien Mazarguil 	file = fopen(path, "rb");
1152771fa900SAdrien Mazarguil 	if (file == NULL)
1153771fa900SAdrien Mazarguil 		return -1;
1154771fa900SAdrien Mazarguil 	while (fgets(line, sizeof(line), file) == line) {
1155771fa900SAdrien Mazarguil 		size_t len = strlen(line);
1156771fa900SAdrien Mazarguil 		int ret;
1157771fa900SAdrien Mazarguil 
1158771fa900SAdrien Mazarguil 		/* Truncate long lines. */
1159771fa900SAdrien Mazarguil 		if (len == (sizeof(line) - 1))
1160771fa900SAdrien Mazarguil 			while (line[(len - 1)] != '\n') {
1161771fa900SAdrien Mazarguil 				ret = fgetc(file);
1162771fa900SAdrien Mazarguil 				if (ret == EOF)
1163771fa900SAdrien Mazarguil 					break;
1164771fa900SAdrien Mazarguil 				line[(len - 1)] = ret;
1165771fa900SAdrien Mazarguil 			}
1166771fa900SAdrien Mazarguil 		/* Extract information. */
1167771fa900SAdrien Mazarguil 		if (sscanf(line,
1168771fa900SAdrien Mazarguil 			   "PCI_SLOT_NAME="
1169463ced95SStephen Hemminger 			   "%" SCNx32 ":%" SCNx8 ":%" SCNx8 ".%" SCNx8 "\n",
1170771fa900SAdrien Mazarguil 			   &pci_addr->domain,
1171771fa900SAdrien Mazarguil 			   &pci_addr->bus,
1172771fa900SAdrien Mazarguil 			   &pci_addr->devid,
1173771fa900SAdrien Mazarguil 			   &pci_addr->function) == 4) {
1174771fa900SAdrien Mazarguil 			ret = 0;
1175771fa900SAdrien Mazarguil 			break;
1176771fa900SAdrien Mazarguil 		}
1177771fa900SAdrien Mazarguil 	}
1178771fa900SAdrien Mazarguil 	fclose(file);
1179771fa900SAdrien Mazarguil 	return 0;
1180771fa900SAdrien Mazarguil }
1181198a3c33SNelio Laranjeiro 
1182198a3c33SNelio Laranjeiro /**
1183c26ae069SMatan Azrad  * Update the link status.
1184198a3c33SNelio Laranjeiro  *
1185198a3c33SNelio Laranjeiro  * @param priv
1186198a3c33SNelio Laranjeiro  *   Pointer to private structure.
1187198a3c33SNelio Laranjeiro  *
1188198a3c33SNelio Laranjeiro  * @return
1189c26ae069SMatan Azrad  *   Zero if the callback process can be called immediately.
1190198a3c33SNelio Laranjeiro  */
1191198a3c33SNelio Laranjeiro static int
1192c26ae069SMatan Azrad priv_link_status_update(struct priv *priv)
1193c26ae069SMatan Azrad {
1194c26ae069SMatan Azrad 	struct rte_eth_link *link = &priv->dev->data->dev_link;
1195c26ae069SMatan Azrad 
1196c7bf6225SYongseok Koh 	priv_link_update(priv, 0);
1197c26ae069SMatan Azrad 	if (((link->link_speed == 0) && link->link_status) ||
1198c26ae069SMatan Azrad 		((link->link_speed != 0) && !link->link_status)) {
1199c26ae069SMatan Azrad 		/*
1200c26ae069SMatan Azrad 		 * Inconsistent status. Event likely occurred before the
1201c26ae069SMatan Azrad 		 * kernel netdevice exposes the new status.
1202c26ae069SMatan Azrad 		 */
1203c26ae069SMatan Azrad 		if (!priv->pending_alarm) {
1204c26ae069SMatan Azrad 			priv->pending_alarm = 1;
1205c26ae069SMatan Azrad 			rte_eal_alarm_set(MLX5_ALARM_TIMEOUT_US,
1206c26ae069SMatan Azrad 					  mlx5_dev_link_status_handler,
1207c26ae069SMatan Azrad 					  priv->dev);
1208c26ae069SMatan Azrad 		}
1209c26ae069SMatan Azrad 		return 1;
1210c26ae069SMatan Azrad 	} else if (unlikely(priv->pending_alarm)) {
1211c26ae069SMatan Azrad 		/* Link interrupt occurred while alarm is already scheduled. */
1212c26ae069SMatan Azrad 		priv->pending_alarm = 0;
1213c26ae069SMatan Azrad 		rte_eal_alarm_cancel(mlx5_dev_link_status_handler, priv->dev);
1214c26ae069SMatan Azrad 	}
1215c26ae069SMatan Azrad 	return 0;
1216c26ae069SMatan Azrad }
1217c26ae069SMatan Azrad 
1218c26ae069SMatan Azrad /**
1219c26ae069SMatan Azrad  * Device status handler.
1220c26ae069SMatan Azrad  *
1221c26ae069SMatan Azrad  * @param priv
1222c26ae069SMatan Azrad  *   Pointer to private structure.
1223c26ae069SMatan Azrad  * @param events
1224c26ae069SMatan Azrad  *   Pointer to event flags holder.
1225c26ae069SMatan Azrad  *
1226c26ae069SMatan Azrad  * @return
1227c26ae069SMatan Azrad  *   Events bitmap of callback process which can be called immediately.
1228c26ae069SMatan Azrad  */
1229c26ae069SMatan Azrad static uint32_t
1230c26ae069SMatan Azrad priv_dev_status_handler(struct priv *priv)
1231198a3c33SNelio Laranjeiro {
1232198a3c33SNelio Laranjeiro 	struct ibv_async_event event;
1233c26ae069SMatan Azrad 	uint32_t ret = 0;
1234198a3c33SNelio Laranjeiro 
1235198a3c33SNelio Laranjeiro 	/* Read all message and acknowledge them. */
1236198a3c33SNelio Laranjeiro 	for (;;) {
1237198a3c33SNelio Laranjeiro 		if (ibv_get_async_event(priv->ctx, &event))
1238198a3c33SNelio Laranjeiro 			break;
1239c26ae069SMatan Azrad 		if ((event.event_type == IBV_EVENT_PORT_ACTIVE ||
1240c26ae069SMatan Azrad 			event.event_type == IBV_EVENT_PORT_ERR) &&
1241c26ae069SMatan Azrad 			(priv->dev->data->dev_conf.intr_conf.lsc == 1))
1242c26ae069SMatan Azrad 			ret |= (1 << RTE_ETH_EVENT_INTR_LSC);
12437d7d7ad1SMatan Azrad 		else if (event.event_type == IBV_EVENT_DEVICE_FATAL &&
12447d7d7ad1SMatan Azrad 			priv->dev->data->dev_conf.intr_conf.rmv == 1)
12457d7d7ad1SMatan Azrad 			ret |= (1 << RTE_ETH_EVENT_INTR_RMV);
1246c26ae069SMatan Azrad 		else
1247198a3c33SNelio Laranjeiro 			DEBUG("event type %d on port %d not handled",
1248198a3c33SNelio Laranjeiro 			      event.event_type, event.element.port_num);
1249198a3c33SNelio Laranjeiro 		ibv_ack_async_event(&event);
1250198a3c33SNelio Laranjeiro 	}
1251c26ae069SMatan Azrad 	if (ret & (1 << RTE_ETH_EVENT_INTR_LSC))
1252c26ae069SMatan Azrad 		if (priv_link_status_update(priv))
1253c26ae069SMatan Azrad 			ret &= ~(1 << RTE_ETH_EVENT_INTR_LSC);
1254198a3c33SNelio Laranjeiro 	return ret;
1255198a3c33SNelio Laranjeiro }
1256198a3c33SNelio Laranjeiro 
1257198a3c33SNelio Laranjeiro /**
1258198a3c33SNelio Laranjeiro  * Handle delayed link status event.
1259198a3c33SNelio Laranjeiro  *
1260198a3c33SNelio Laranjeiro  * @param arg
1261198a3c33SNelio Laranjeiro  *   Registered argument.
1262198a3c33SNelio Laranjeiro  */
1263198a3c33SNelio Laranjeiro void
1264198a3c33SNelio Laranjeiro mlx5_dev_link_status_handler(void *arg)
1265198a3c33SNelio Laranjeiro {
1266198a3c33SNelio Laranjeiro 	struct rte_eth_dev *dev = arg;
1267198a3c33SNelio Laranjeiro 	struct priv *priv = dev->data->dev_private;
1268198a3c33SNelio Laranjeiro 	int ret;
1269198a3c33SNelio Laranjeiro 
12706817ad38SYongseok Koh 	while (!priv_trylock(priv)) {
12716817ad38SYongseok Koh 		/* Alarm is being canceled. */
12726817ad38SYongseok Koh 		if (priv->pending_alarm == 0)
12736817ad38SYongseok Koh 			return;
12746817ad38SYongseok Koh 		rte_pause();
12756817ad38SYongseok Koh 	}
1276a9f2fbc4SShahaf Shuler 	priv->pending_alarm = 0;
1277c26ae069SMatan Azrad 	ret = priv_link_status_update(priv);
1278198a3c33SNelio Laranjeiro 	priv_unlock(priv);
1279c26ae069SMatan Azrad 	if (!ret)
1280cebe3d7bSThomas Monjalon 		_rte_eth_dev_callback_process(dev, RTE_ETH_EVENT_INTR_LSC, NULL);
1281198a3c33SNelio Laranjeiro }
1282198a3c33SNelio Laranjeiro 
1283198a3c33SNelio Laranjeiro /**
1284198a3c33SNelio Laranjeiro  * Handle interrupts from the NIC.
1285198a3c33SNelio Laranjeiro  *
1286198a3c33SNelio Laranjeiro  * @param[in] intr_handle
1287198a3c33SNelio Laranjeiro  *   Interrupt handler.
1288198a3c33SNelio Laranjeiro  * @param cb_arg
1289198a3c33SNelio Laranjeiro  *   Callback argument.
1290198a3c33SNelio Laranjeiro  */
1291198a3c33SNelio Laranjeiro void
1292c23a1a30SQi Zhang mlx5_dev_interrupt_handler(void *cb_arg)
1293198a3c33SNelio Laranjeiro {
1294198a3c33SNelio Laranjeiro 	struct rte_eth_dev *dev = cb_arg;
1295198a3c33SNelio Laranjeiro 	struct priv *priv = dev->data->dev_private;
1296c26ae069SMatan Azrad 	uint32_t events;
1297198a3c33SNelio Laranjeiro 
1298198a3c33SNelio Laranjeiro 	priv_lock(priv);
1299c26ae069SMatan Azrad 	events = priv_dev_status_handler(priv);
1300198a3c33SNelio Laranjeiro 	priv_unlock(priv);
1301c26ae069SMatan Azrad 	if (events & (1 << RTE_ETH_EVENT_INTR_LSC))
1302cebe3d7bSThomas Monjalon 		_rte_eth_dev_callback_process(dev, RTE_ETH_EVENT_INTR_LSC, NULL);
13037d7d7ad1SMatan Azrad 	if (events & (1 << RTE_ETH_EVENT_INTR_RMV))
1304cebe3d7bSThomas Monjalon 		_rte_eth_dev_callback_process(dev, RTE_ETH_EVENT_INTR_RMV, NULL);
1305198a3c33SNelio Laranjeiro }
1306198a3c33SNelio Laranjeiro 
1307198a3c33SNelio Laranjeiro /**
1308f8b9a3baSXueming Li  * Handle interrupts from the socket.
1309f8b9a3baSXueming Li  *
1310f8b9a3baSXueming Li  * @param cb_arg
1311f8b9a3baSXueming Li  *   Callback argument.
1312f8b9a3baSXueming Li  */
1313f8b9a3baSXueming Li static void
1314f8b9a3baSXueming Li mlx5_dev_handler_socket(void *cb_arg)
1315f8b9a3baSXueming Li {
1316f8b9a3baSXueming Li 	struct rte_eth_dev *dev = cb_arg;
1317f8b9a3baSXueming Li 	struct priv *priv = dev->data->dev_private;
1318f8b9a3baSXueming Li 
1319f8b9a3baSXueming Li 	priv_lock(priv);
1320f8b9a3baSXueming Li 	priv_socket_handle(priv);
1321f8b9a3baSXueming Li 	priv_unlock(priv);
1322f8b9a3baSXueming Li }
1323f8b9a3baSXueming Li 
1324f8b9a3baSXueming Li /**
1325198a3c33SNelio Laranjeiro  * Uninstall interrupt handler.
1326198a3c33SNelio Laranjeiro  *
1327198a3c33SNelio Laranjeiro  * @param priv
1328198a3c33SNelio Laranjeiro  *   Pointer to private structure.
1329198a3c33SNelio Laranjeiro  * @param dev
1330198a3c33SNelio Laranjeiro  *   Pointer to the rte_eth_dev structure.
1331198a3c33SNelio Laranjeiro  */
1332198a3c33SNelio Laranjeiro void
1333198a3c33SNelio Laranjeiro priv_dev_interrupt_handler_uninstall(struct priv *priv, struct rte_eth_dev *dev)
1334198a3c33SNelio Laranjeiro {
1335f8b9a3baSXueming Li 	if (dev->data->dev_conf.intr_conf.lsc ||
1336f8b9a3baSXueming Li 	    dev->data->dev_conf.intr_conf.rmv)
1337198a3c33SNelio Laranjeiro 		rte_intr_callback_unregister(&priv->intr_handle,
1338f8b9a3baSXueming Li 					     mlx5_dev_interrupt_handler, dev);
1339f8b9a3baSXueming Li 	if (priv->primary_socket)
1340f8b9a3baSXueming Li 		rte_intr_callback_unregister(&priv->intr_handle_socket,
1341f8b9a3baSXueming Li 					     mlx5_dev_handler_socket, dev);
13426817ad38SYongseok Koh 	if (priv->pending_alarm) {
1343198a3c33SNelio Laranjeiro 		priv->pending_alarm = 0;
13446817ad38SYongseok Koh 		rte_eal_alarm_cancel(mlx5_dev_link_status_handler, dev);
13456817ad38SYongseok Koh 	}
1346198a3c33SNelio Laranjeiro 	priv->intr_handle.fd = 0;
134736351ea3SFerruh Yigit 	priv->intr_handle.type = RTE_INTR_HANDLE_UNKNOWN;
1348f8b9a3baSXueming Li 	priv->intr_handle_socket.fd = 0;
1349f8b9a3baSXueming Li 	priv->intr_handle_socket.type = RTE_INTR_HANDLE_UNKNOWN;
1350198a3c33SNelio Laranjeiro }
1351198a3c33SNelio Laranjeiro 
1352198a3c33SNelio Laranjeiro /**
1353198a3c33SNelio Laranjeiro  * Install interrupt handler.
1354198a3c33SNelio Laranjeiro  *
1355198a3c33SNelio Laranjeiro  * @param priv
1356198a3c33SNelio Laranjeiro  *   Pointer to private structure.
1357198a3c33SNelio Laranjeiro  * @param dev
1358198a3c33SNelio Laranjeiro  *   Pointer to the rte_eth_dev structure.
1359198a3c33SNelio Laranjeiro  */
1360198a3c33SNelio Laranjeiro void
1361198a3c33SNelio Laranjeiro priv_dev_interrupt_handler_install(struct priv *priv, struct rte_eth_dev *dev)
1362198a3c33SNelio Laranjeiro {
1363198a3c33SNelio Laranjeiro 	int rc, flags;
1364198a3c33SNelio Laranjeiro 
1365198a3c33SNelio Laranjeiro 	assert(priv->ctx->async_fd > 0);
1366198a3c33SNelio Laranjeiro 	flags = fcntl(priv->ctx->async_fd, F_GETFL);
1367198a3c33SNelio Laranjeiro 	rc = fcntl(priv->ctx->async_fd, F_SETFL, flags | O_NONBLOCK);
1368198a3c33SNelio Laranjeiro 	if (rc < 0) {
1369198a3c33SNelio Laranjeiro 		INFO("failed to change file descriptor async event queue");
1370198a3c33SNelio Laranjeiro 		dev->data->dev_conf.intr_conf.lsc = 0;
13717d7d7ad1SMatan Azrad 		dev->data->dev_conf.intr_conf.rmv = 0;
1372f8b9a3baSXueming Li 	}
1373f8b9a3baSXueming Li 	if (dev->data->dev_conf.intr_conf.lsc ||
1374f8b9a3baSXueming Li 	    dev->data->dev_conf.intr_conf.rmv) {
1375198a3c33SNelio Laranjeiro 		priv->intr_handle.fd = priv->ctx->async_fd;
1376198a3c33SNelio Laranjeiro 		priv->intr_handle.type = RTE_INTR_HANDLE_EXT;
1377198a3c33SNelio Laranjeiro 		rte_intr_callback_register(&priv->intr_handle,
1378f8b9a3baSXueming Li 					   mlx5_dev_interrupt_handler, dev);
1379f8b9a3baSXueming Li 	}
1380f8b9a3baSXueming Li 
1381f8b9a3baSXueming Li 	rc = priv_socket_init(priv);
1382f8b9a3baSXueming Li 	if (!rc && priv->primary_socket) {
1383f8b9a3baSXueming Li 		priv->intr_handle_socket.fd = priv->primary_socket;
1384f8b9a3baSXueming Li 		priv->intr_handle_socket.type = RTE_INTR_HANDLE_EXT;
1385f8b9a3baSXueming Li 		rte_intr_callback_register(&priv->intr_handle_socket,
1386f8b9a3baSXueming Li 					   mlx5_dev_handler_socket, dev);
1387198a3c33SNelio Laranjeiro 	}
1388198a3c33SNelio Laranjeiro }
138962072098SOr Ami 
139062072098SOr Ami /**
139162072098SOr Ami  * Change the link state (UP / DOWN).
139262072098SOr Ami  *
13933d04e050SOlivier Matz  * @param priv
1394aee1b165SXueming Li  *   Pointer to private data structure.
139562072098SOr Ami  * @param up
139662072098SOr Ami  *   Nonzero for link up, otherwise link down.
139762072098SOr Ami  *
139862072098SOr Ami  * @return
139962072098SOr Ami  *   0 on success, errno value on failure.
140062072098SOr Ami  */
140162072098SOr Ami static int
1402c7bf6225SYongseok Koh priv_dev_set_link(struct priv *priv, int up)
140362072098SOr Ami {
1404c7bf6225SYongseok Koh 	return priv_set_flags(priv, ~IFF_UP, up ? IFF_UP : ~IFF_UP);
140562072098SOr Ami }
140662072098SOr Ami 
140762072098SOr Ami /**
140862072098SOr Ami  * DPDK callback to bring the link DOWN.
140962072098SOr Ami  *
141062072098SOr Ami  * @param dev
141162072098SOr Ami  *   Pointer to Ethernet device structure.
141262072098SOr Ami  *
141362072098SOr Ami  * @return
141462072098SOr Ami  *   0 on success, errno value on failure.
141562072098SOr Ami  */
141662072098SOr Ami int
141762072098SOr Ami mlx5_set_link_down(struct rte_eth_dev *dev)
141862072098SOr Ami {
141962072098SOr Ami 	struct priv *priv = dev->data->dev_private;
142062072098SOr Ami 	int err;
142162072098SOr Ami 
142262072098SOr Ami 	priv_lock(priv);
1423c7bf6225SYongseok Koh 	err = priv_dev_set_link(priv, 0);
142462072098SOr Ami 	priv_unlock(priv);
142562072098SOr Ami 	return err;
142662072098SOr Ami }
142762072098SOr Ami 
142862072098SOr Ami /**
142962072098SOr Ami  * DPDK callback to bring the link UP.
143062072098SOr Ami  *
143162072098SOr Ami  * @param dev
143262072098SOr Ami  *   Pointer to Ethernet device structure.
143362072098SOr Ami  *
143462072098SOr Ami  * @return
143562072098SOr Ami  *   0 on success, errno value on failure.
143662072098SOr Ami  */
143762072098SOr Ami int
143862072098SOr Ami mlx5_set_link_up(struct rte_eth_dev *dev)
143962072098SOr Ami {
144062072098SOr Ami 	struct priv *priv = dev->data->dev_private;
144162072098SOr Ami 	int err;
144262072098SOr Ami 
144362072098SOr Ami 	priv_lock(priv);
1444c7bf6225SYongseok Koh 	err = priv_dev_set_link(priv, 1);
144562072098SOr Ami 	priv_unlock(priv);
144662072098SOr Ami 	return err;
144762072098SOr Ami }
1448a48deadaSOr Ami 
1449a48deadaSOr Ami /**
1450cdab90cbSNélio Laranjeiro  * Configure the TX function to use.
1451cdab90cbSNélio Laranjeiro  *
1452cdab90cbSNélio Laranjeiro  * @param priv
1453aee1b165SXueming Li  *   Pointer to private data structure.
1454aee1b165SXueming Li  * @param dev
1455aee1b165SXueming Li  *   Pointer to rte_eth_dev structure.
14561cfa649bSShahaf Shuler  *
14571cfa649bSShahaf Shuler  * @return
14581cfa649bSShahaf Shuler  *   Pointer to selected Tx burst function.
1459cdab90cbSNélio Laranjeiro  */
14601cfa649bSShahaf Shuler eth_tx_burst_t
1461dbccb4cdSShahaf Shuler priv_select_tx_function(struct priv *priv, struct rte_eth_dev *dev)
1462cdab90cbSNélio Laranjeiro {
14631cfa649bSShahaf Shuler 	eth_tx_burst_t tx_pkt_burst = mlx5_tx_burst;
14647fe24446SShahaf Shuler 	struct mlx5_dev_config *config = &priv->config;
1465dbccb4cdSShahaf Shuler 	uint64_t tx_offloads = dev->data->dev_conf.txmode.offloads;
1466dbccb4cdSShahaf Shuler 	int tso = !!(tx_offloads & (DEV_TX_OFFLOAD_TCP_TSO |
1467dbccb4cdSShahaf Shuler 				    DEV_TX_OFFLOAD_VXLAN_TNL_TSO |
1468dbccb4cdSShahaf Shuler 				    DEV_TX_OFFLOAD_GRE_TNL_TSO));
1469dbccb4cdSShahaf Shuler 	int vlan_insert = !!(tx_offloads & DEV_TX_OFFLOAD_VLAN_INSERT);
14701cfa649bSShahaf Shuler 
1471aee1b165SXueming Li 	assert(priv != NULL);
1472230189d9SNélio Laranjeiro 	/* Select appropriate TX function. */
1473dbccb4cdSShahaf Shuler 	if (vlan_insert || tso)
1474dbccb4cdSShahaf Shuler 		return tx_pkt_burst;
14757fe24446SShahaf Shuler 	if (config->mps == MLX5_MPW_ENHANCED) {
1476dbccb4cdSShahaf Shuler 		if (priv_check_vec_tx_support(priv, dev) > 0) {
1477dbccb4cdSShahaf Shuler 			if (priv_check_raw_vec_tx_support(priv, dev) > 0)
14781cfa649bSShahaf Shuler 				tx_pkt_burst = mlx5_tx_burst_raw_vec;
14796cb559d6SYongseok Koh 			else
14801cfa649bSShahaf Shuler 				tx_pkt_burst = mlx5_tx_burst_vec;
14816cb559d6SYongseok Koh 			DEBUG("selected Enhanced MPW TX vectorized function");
14826cb559d6SYongseok Koh 		} else {
14831cfa649bSShahaf Shuler 			tx_pkt_burst = mlx5_tx_burst_empw;
14846ce84bd8SYongseok Koh 			DEBUG("selected Enhanced MPW TX function");
14856cb559d6SYongseok Koh 		}
14867fe24446SShahaf Shuler 	} else if (config->mps && (config->txq_inline > 0)) {
14871cfa649bSShahaf Shuler 		tx_pkt_burst = mlx5_tx_burst_mpw_inline;
1488230189d9SNélio Laranjeiro 		DEBUG("selected MPW inline TX function");
14897fe24446SShahaf Shuler 	} else if (config->mps) {
14901cfa649bSShahaf Shuler 		tx_pkt_burst = mlx5_tx_burst_mpw;
1491230189d9SNélio Laranjeiro 		DEBUG("selected MPW TX function");
14922a66cf37SYaacov Hazan 	}
14931cfa649bSShahaf Shuler 	return tx_pkt_burst;
1494cdab90cbSNélio Laranjeiro }
1495cdab90cbSNélio Laranjeiro 
1496cdab90cbSNélio Laranjeiro /**
1497cdab90cbSNélio Laranjeiro  * Configure the RX function to use.
1498cdab90cbSNélio Laranjeiro  *
1499cdab90cbSNélio Laranjeiro  * @param priv
1500aee1b165SXueming Li  *   Pointer to private data structure.
1501aee1b165SXueming Li  * @param dev
1502aee1b165SXueming Li  *   Pointer to rte_eth_dev structure.
15031cfa649bSShahaf Shuler  *
15041cfa649bSShahaf Shuler  * @return
15051cfa649bSShahaf Shuler  *   Pointer to selected Rx burst function.
1506cdab90cbSNélio Laranjeiro  */
15071cfa649bSShahaf Shuler eth_rx_burst_t
15081cfa649bSShahaf Shuler priv_select_rx_function(struct priv *priv, __rte_unused struct rte_eth_dev *dev)
1509cdab90cbSNélio Laranjeiro {
15101cfa649bSShahaf Shuler 	eth_rx_burst_t rx_pkt_burst = mlx5_rx_burst;
15111cfa649bSShahaf Shuler 
1512aee1b165SXueming Li 	assert(priv != NULL);
15136cb559d6SYongseok Koh 	if (priv_check_vec_rx_support(priv) > 0) {
15141cfa649bSShahaf Shuler 		rx_pkt_burst = mlx5_rx_burst_vec;
15156cb559d6SYongseok Koh 		DEBUG("selected RX vectorized function");
1516cdab90cbSNélio Laranjeiro 	}
15171cfa649bSShahaf Shuler 	return rx_pkt_burst;
15186cb559d6SYongseok Koh }
1519d3e0f392SMatan Azrad 
1520d3e0f392SMatan Azrad /**
1521d3e0f392SMatan Azrad  * Check if mlx5 device was removed.
1522d3e0f392SMatan Azrad  *
1523d3e0f392SMatan Azrad  * @param dev
1524d3e0f392SMatan Azrad  *   Pointer to Ethernet device structure.
1525d3e0f392SMatan Azrad  *
1526d3e0f392SMatan Azrad  * @return
1527d3e0f392SMatan Azrad  *   1 when device is removed, otherwise 0.
1528d3e0f392SMatan Azrad  */
1529d3e0f392SMatan Azrad int
1530d3e0f392SMatan Azrad mlx5_is_removed(struct rte_eth_dev *dev)
1531d3e0f392SMatan Azrad {
1532d3e0f392SMatan Azrad 	struct ibv_device_attr device_attr;
1533d3e0f392SMatan Azrad 	struct priv *priv = dev->data->dev_private;
1534d3e0f392SMatan Azrad 
1535d3e0f392SMatan Azrad 	if (ibv_query_device(priv->ctx, &device_attr) == EIO)
1536d3e0f392SMatan Azrad 		return 1;
1537d3e0f392SMatan Azrad 	return 0;
1538d3e0f392SMatan Azrad }
1539