xref: /dpdk/drivers/net/mlx5/mlx5_ethdev.c (revision d11d651f6d972a9802f1dc20ed9eaebcd367bc3b)
18fd92a66SOlivier Matz /* SPDX-License-Identifier: BSD-3-Clause
2771fa900SAdrien Mazarguil  * Copyright 2015 6WIND S.A.
35feecc57SShahaf Shuler  * Copyright 2015 Mellanox Technologies, Ltd
4771fa900SAdrien Mazarguil  */
5771fa900SAdrien Mazarguil 
6f8b9a3baSXueming Li #define _GNU_SOURCE
7f8b9a3baSXueming Li 
8771fa900SAdrien Mazarguil #include <stddef.h>
9e60fbd5bSAdrien Mazarguil #include <assert.h>
10fc40db99SAdrien Mazarguil #include <inttypes.h>
11771fa900SAdrien Mazarguil #include <unistd.h>
12771fa900SAdrien Mazarguil #include <stdint.h>
13771fa900SAdrien Mazarguil #include <stdio.h>
14771fa900SAdrien Mazarguil #include <string.h>
15771fa900SAdrien Mazarguil #include <stdlib.h>
16771fa900SAdrien Mazarguil #include <errno.h>
17771fa900SAdrien Mazarguil #include <dirent.h>
18771fa900SAdrien Mazarguil #include <net/if.h>
19771fa900SAdrien Mazarguil #include <sys/ioctl.h>
20771fa900SAdrien Mazarguil #include <sys/socket.h>
21771fa900SAdrien Mazarguil #include <netinet/in.h>
22cb8faed7SAdrien Mazarguil #include <linux/ethtool.h>
23cb8faed7SAdrien Mazarguil #include <linux/sockios.h>
24198a3c33SNelio Laranjeiro #include <fcntl.h>
2590260d57SNélio Laranjeiro #include <stdalign.h>
26f8b9a3baSXueming Li #include <sys/un.h>
27cfee9475SNélio Laranjeiro #include <time.h>
28771fa900SAdrien Mazarguil 
29771fa900SAdrien Mazarguil #include <rte_atomic.h>
30ffc905f3SFerruh Yigit #include <rte_ethdev_driver.h>
31c752998bSGaetan Rivet #include <rte_bus_pci.h>
32771fa900SAdrien Mazarguil #include <rte_mbuf.h>
33771fa900SAdrien Mazarguil #include <rte_common.h>
34198a3c33SNelio Laranjeiro #include <rte_interrupts.h>
35a48deadaSOr Ami #include <rte_malloc.h>
36c022cb40SBruce Richardson #include <rte_string_fns.h>
37771fa900SAdrien Mazarguil 
38771fa900SAdrien Mazarguil #include "mlx5.h"
390e83b8e5SNelio Laranjeiro #include "mlx5_glue.h"
40e60fbd5bSAdrien Mazarguil #include "mlx5_rxtx.h"
41771fa900SAdrien Mazarguil #include "mlx5_utils.h"
42771fa900SAdrien Mazarguil 
/*
 * Compatibility definitions: the user-space headers used at build time may
 * be older than the kernel the driver eventually runs on, so provide the
 * pieces of the ETHTOOL_GLINKSETTINGS interface that may be missing.
 */
#ifndef ETHTOOL_GLINKSETTINGS

/*
 * Local declaration of the ETHTOOL_GLINKSETTINGS request/reply layout.
 * NOTE(review): the kernel UAPI header appears to call the eth_to_mdix
 * field "eth_tp_mdix"; the name is kept here as-is, confirm before renaming.
 */
struct ethtool_link_settings {
	uint32_t cmd;
	uint32_t speed;
	uint8_t duplex;
	uint8_t port;
	uint8_t phy_address;
	uint8_t autoneg;
	uint8_t mdio_support;
	uint8_t eth_to_mdix;
	uint8_t eth_tp_mdix_ctrl;
	int8_t link_mode_masks_nwords;
	uint32_t reserved[8];
	uint32_t link_mode_masks[]; /* Flexible array of link mode masks. */
};

/* ethtool command number. */
#define ETHTOOL_GLINKSETTINGS 0x0000004c

/* Link mode bit positions: 1G and autonegotiation. */
#define ETHTOOL_LINK_MODE_1000baseT_Full_BIT 5
#define ETHTOOL_LINK_MODE_Autoneg_BIT 6
#define ETHTOOL_LINK_MODE_1000baseKX_Full_BIT 17
/* Link mode bit positions: 10G. */
#define ETHTOOL_LINK_MODE_10000baseKX4_Full_BIT 18
#define ETHTOOL_LINK_MODE_10000baseKR_Full_BIT 19
#define ETHTOOL_LINK_MODE_10000baseR_FEC_BIT 20
/* Link mode bit positions: 20G. */
#define ETHTOOL_LINK_MODE_20000baseMLD2_Full_BIT 21
#define ETHTOOL_LINK_MODE_20000baseKR2_Full_BIT 22
/* Link mode bit positions: 40G. */
#define ETHTOOL_LINK_MODE_40000baseKR4_Full_BIT 23
#define ETHTOOL_LINK_MODE_40000baseCR4_Full_BIT 24
#define ETHTOOL_LINK_MODE_40000baseSR4_Full_BIT 25
#define ETHTOOL_LINK_MODE_40000baseLR4_Full_BIT 26
/* Link mode bit positions: 56G. */
#define ETHTOOL_LINK_MODE_56000baseKR4_Full_BIT 27
#define ETHTOOL_LINK_MODE_56000baseCR4_Full_BIT 28
#define ETHTOOL_LINK_MODE_56000baseSR4_Full_BIT 29
#define ETHTOOL_LINK_MODE_56000baseLR4_Full_BIT 30

#endif /* ETHTOOL_GLINKSETTINGS */

/* Link mode bit positions: 25G (build system did not detect them). */
#ifndef HAVE_ETHTOOL_LINK_MODE_25G
#define ETHTOOL_LINK_MODE_25000baseCR_Full_BIT 31
#define ETHTOOL_LINK_MODE_25000baseKR_Full_BIT 32
#define ETHTOOL_LINK_MODE_25000baseSR_Full_BIT 33
#endif /* HAVE_ETHTOOL_LINK_MODE_25G */

/* Link mode bit positions: 50G (build system did not detect them). */
#ifndef HAVE_ETHTOOL_LINK_MODE_50G
#define ETHTOOL_LINK_MODE_50000baseCR2_Full_BIT 34
#define ETHTOOL_LINK_MODE_50000baseKR2_Full_BIT 35
#endif /* HAVE_ETHTOOL_LINK_MODE_50G */

/* Link mode bit positions: 100G (build system did not detect them). */
#ifndef HAVE_ETHTOOL_LINK_MODE_100G
#define ETHTOOL_LINK_MODE_100000baseKR4_Full_BIT 36
#define ETHTOOL_LINK_MODE_100000baseSR4_Full_BIT 37
#define ETHTOOL_LINK_MODE_100000baseCR4_Full_BIT 38
#define ETHTOOL_LINK_MODE_100000baseLR4_ER4_Full_BIT 39
#endif /* HAVE_ETHTOOL_LINK_MODE_100G */
933a49ffe3SShahaf Shuler 
94771fa900SAdrien Mazarguil /**
95771fa900SAdrien Mazarguil  * Get interface name from private structure.
96771fa900SAdrien Mazarguil  *
97af4f09f2SNélio Laranjeiro  * @param[in] dev
98af4f09f2SNélio Laranjeiro  *   Pointer to Ethernet device.
99771fa900SAdrien Mazarguil  * @param[out] ifname
100771fa900SAdrien Mazarguil  *   Interface name output buffer.
101771fa900SAdrien Mazarguil  *
102771fa900SAdrien Mazarguil  * @return
103a6d83b6aSNélio Laranjeiro  *   0 on success, a negative errno value otherwise and rte_errno is set.
104771fa900SAdrien Mazarguil  */
105771fa900SAdrien Mazarguil int
106af4f09f2SNélio Laranjeiro mlx5_get_ifname(const struct rte_eth_dev *dev, char (*ifname)[IF_NAMESIZE])
107771fa900SAdrien Mazarguil {
108af4f09f2SNélio Laranjeiro 	struct priv *priv = dev->data->dev_private;
109771fa900SAdrien Mazarguil 	DIR *dir;
110771fa900SAdrien Mazarguil 	struct dirent *dent;
111771fa900SAdrien Mazarguil 	unsigned int dev_type = 0;
112771fa900SAdrien Mazarguil 	unsigned int dev_port_prev = ~0u;
113771fa900SAdrien Mazarguil 	char match[IF_NAMESIZE] = "";
114771fa900SAdrien Mazarguil 
115771fa900SAdrien Mazarguil 	{
11687ec44ceSXueming Li 		MKSTR(path, "%s/device/net", priv->ibdev_path);
117771fa900SAdrien Mazarguil 
118771fa900SAdrien Mazarguil 		dir = opendir(path);
119a6d83b6aSNélio Laranjeiro 		if (dir == NULL) {
120a6d83b6aSNélio Laranjeiro 			rte_errno = errno;
121a6d83b6aSNélio Laranjeiro 			return -rte_errno;
122a6d83b6aSNélio Laranjeiro 		}
123771fa900SAdrien Mazarguil 	}
124771fa900SAdrien Mazarguil 	while ((dent = readdir(dir)) != NULL) {
125771fa900SAdrien Mazarguil 		char *name = dent->d_name;
126771fa900SAdrien Mazarguil 		FILE *file;
127771fa900SAdrien Mazarguil 		unsigned int dev_port;
128771fa900SAdrien Mazarguil 		int r;
129771fa900SAdrien Mazarguil 
130771fa900SAdrien Mazarguil 		if ((name[0] == '.') &&
131771fa900SAdrien Mazarguil 		    ((name[1] == '\0') ||
132771fa900SAdrien Mazarguil 		     ((name[1] == '.') && (name[2] == '\0'))))
133771fa900SAdrien Mazarguil 			continue;
134771fa900SAdrien Mazarguil 
135771fa900SAdrien Mazarguil 		MKSTR(path, "%s/device/net/%s/%s",
13687ec44ceSXueming Li 		      priv->ibdev_path, name,
137771fa900SAdrien Mazarguil 		      (dev_type ? "dev_id" : "dev_port"));
138771fa900SAdrien Mazarguil 
139771fa900SAdrien Mazarguil 		file = fopen(path, "rb");
140771fa900SAdrien Mazarguil 		if (file == NULL) {
141771fa900SAdrien Mazarguil 			if (errno != ENOENT)
142771fa900SAdrien Mazarguil 				continue;
143771fa900SAdrien Mazarguil 			/*
144771fa900SAdrien Mazarguil 			 * Switch to dev_id when dev_port does not exist as
145771fa900SAdrien Mazarguil 			 * is the case with Linux kernel versions < 3.15.
146771fa900SAdrien Mazarguil 			 */
147771fa900SAdrien Mazarguil try_dev_id:
148771fa900SAdrien Mazarguil 			match[0] = '\0';
149771fa900SAdrien Mazarguil 			if (dev_type)
150771fa900SAdrien Mazarguil 				break;
151771fa900SAdrien Mazarguil 			dev_type = 1;
152771fa900SAdrien Mazarguil 			dev_port_prev = ~0u;
153771fa900SAdrien Mazarguil 			rewinddir(dir);
154771fa900SAdrien Mazarguil 			continue;
155771fa900SAdrien Mazarguil 		}
156771fa900SAdrien Mazarguil 		r = fscanf(file, (dev_type ? "%x" : "%u"), &dev_port);
157771fa900SAdrien Mazarguil 		fclose(file);
158771fa900SAdrien Mazarguil 		if (r != 1)
159771fa900SAdrien Mazarguil 			continue;
160771fa900SAdrien Mazarguil 		/*
161771fa900SAdrien Mazarguil 		 * Switch to dev_id when dev_port returns the same value for
162771fa900SAdrien Mazarguil 		 * all ports. May happen when using a MOFED release older than
163771fa900SAdrien Mazarguil 		 * 3.0 with a Linux kernel >= 3.15.
164771fa900SAdrien Mazarguil 		 */
165771fa900SAdrien Mazarguil 		if (dev_port == dev_port_prev)
166771fa900SAdrien Mazarguil 			goto try_dev_id;
167771fa900SAdrien Mazarguil 		dev_port_prev = dev_port;
168771fa900SAdrien Mazarguil 		if (dev_port == (priv->port - 1u))
169c022cb40SBruce Richardson 			strlcpy(match, name, sizeof(match));
170771fa900SAdrien Mazarguil 	}
171771fa900SAdrien Mazarguil 	closedir(dir);
172a6d83b6aSNélio Laranjeiro 	if (match[0] == '\0') {
173a6d83b6aSNélio Laranjeiro 		rte_errno = ENOENT;
174a6d83b6aSNélio Laranjeiro 		return -rte_errno;
175a6d83b6aSNélio Laranjeiro 	}
176771fa900SAdrien Mazarguil 	strncpy(*ifname, match, sizeof(*ifname));
177771fa900SAdrien Mazarguil 	return 0;
178771fa900SAdrien Mazarguil }
179771fa900SAdrien Mazarguil 
180771fa900SAdrien Mazarguil /**
181ccdcba53SNélio Laranjeiro  * Get the interface index from device name.
182ccdcba53SNélio Laranjeiro  *
183ccdcba53SNélio Laranjeiro  * @param[in] dev
184ccdcba53SNélio Laranjeiro  *   Pointer to Ethernet device.
185ccdcba53SNélio Laranjeiro  *
186ccdcba53SNélio Laranjeiro  * @return
187ccdcba53SNélio Laranjeiro  *   Interface index on success, a negative errno value otherwise and
188ccdcba53SNélio Laranjeiro  *   rte_errno is set.
189ccdcba53SNélio Laranjeiro  */
190ccdcba53SNélio Laranjeiro int
191ccdcba53SNélio Laranjeiro mlx5_ifindex(const struct rte_eth_dev *dev)
192ccdcba53SNélio Laranjeiro {
193ccdcba53SNélio Laranjeiro 	char ifname[IF_NAMESIZE];
194ccdcba53SNélio Laranjeiro 	int ret;
195ccdcba53SNélio Laranjeiro 
196ccdcba53SNélio Laranjeiro 	ret = mlx5_get_ifname(dev, &ifname);
197ccdcba53SNélio Laranjeiro 	if (ret)
198ccdcba53SNélio Laranjeiro 		return ret;
199ccdcba53SNélio Laranjeiro 	ret = if_nametoindex(ifname);
200ccdcba53SNélio Laranjeiro 	if (ret == -1) {
201ccdcba53SNélio Laranjeiro 		rte_errno = errno;
202ccdcba53SNélio Laranjeiro 		return -rte_errno;
203ccdcba53SNélio Laranjeiro 	}
204ccdcba53SNélio Laranjeiro 	return ret;
205ccdcba53SNélio Laranjeiro }
206ccdcba53SNélio Laranjeiro 
207ccdcba53SNélio Laranjeiro /**
208771fa900SAdrien Mazarguil  * Perform ifreq ioctl() on associated Ethernet device.
209771fa900SAdrien Mazarguil  *
210af4f09f2SNélio Laranjeiro  * @param[in] dev
211af4f09f2SNélio Laranjeiro  *   Pointer to Ethernet device.
212771fa900SAdrien Mazarguil  * @param req
213771fa900SAdrien Mazarguil  *   Request number to pass to ioctl().
214771fa900SAdrien Mazarguil  * @param[out] ifr
215771fa900SAdrien Mazarguil  *   Interface request structure output buffer.
216771fa900SAdrien Mazarguil  *
217771fa900SAdrien Mazarguil  * @return
218a6d83b6aSNélio Laranjeiro  *   0 on success, a negative errno value otherwise and rte_errno is set.
219771fa900SAdrien Mazarguil  */
220771fa900SAdrien Mazarguil int
221af4f09f2SNélio Laranjeiro mlx5_ifreq(const struct rte_eth_dev *dev, int req, struct ifreq *ifr)
222771fa900SAdrien Mazarguil {
223771fa900SAdrien Mazarguil 	int sock = socket(PF_INET, SOCK_DGRAM, IPPROTO_IP);
224a6d83b6aSNélio Laranjeiro 	int ret = 0;
225771fa900SAdrien Mazarguil 
226a6d83b6aSNélio Laranjeiro 	if (sock == -1) {
227a6d83b6aSNélio Laranjeiro 		rte_errno = errno;
228a6d83b6aSNélio Laranjeiro 		return -rte_errno;
229a6d83b6aSNélio Laranjeiro 	}
230a6d83b6aSNélio Laranjeiro 	ret = mlx5_get_ifname(dev, &ifr->ifr_name);
231a6d83b6aSNélio Laranjeiro 	if (ret)
232a6d83b6aSNélio Laranjeiro 		goto error;
233771fa900SAdrien Mazarguil 	ret = ioctl(sock, req, ifr);
234a6d83b6aSNélio Laranjeiro 	if (ret == -1) {
235a6d83b6aSNélio Laranjeiro 		rte_errno = errno;
236a6d83b6aSNélio Laranjeiro 		goto error;
237a6d83b6aSNélio Laranjeiro 	}
238771fa900SAdrien Mazarguil 	close(sock);
239a6d83b6aSNélio Laranjeiro 	return 0;
240a6d83b6aSNélio Laranjeiro error:
241a6d83b6aSNélio Laranjeiro 	close(sock);
242a6d83b6aSNélio Laranjeiro 	return -rte_errno;
243771fa900SAdrien Mazarguil }
244771fa900SAdrien Mazarguil 
245771fa900SAdrien Mazarguil /**
246771fa900SAdrien Mazarguil  * Get device MTU.
247771fa900SAdrien Mazarguil  *
248af4f09f2SNélio Laranjeiro  * @param dev
249af4f09f2SNélio Laranjeiro  *   Pointer to Ethernet device.
250771fa900SAdrien Mazarguil  * @param[out] mtu
251771fa900SAdrien Mazarguil  *   MTU value output buffer.
252771fa900SAdrien Mazarguil  *
253771fa900SAdrien Mazarguil  * @return
254a6d83b6aSNélio Laranjeiro  *   0 on success, a negative errno value otherwise and rte_errno is set.
255771fa900SAdrien Mazarguil  */
256771fa900SAdrien Mazarguil int
257af4f09f2SNélio Laranjeiro mlx5_get_mtu(struct rte_eth_dev *dev, uint16_t *mtu)
258771fa900SAdrien Mazarguil {
259fc40db99SAdrien Mazarguil 	struct ifreq request;
260af4f09f2SNélio Laranjeiro 	int ret = mlx5_ifreq(dev, SIOCGIFMTU, &request);
261771fa900SAdrien Mazarguil 
262fc40db99SAdrien Mazarguil 	if (ret)
263fc40db99SAdrien Mazarguil 		return ret;
264fc40db99SAdrien Mazarguil 	*mtu = request.ifr_mtu;
265859081d3SShahaf Shuler 	return 0;
266859081d3SShahaf Shuler }
267859081d3SShahaf Shuler 
268859081d3SShahaf Shuler /**
269cf37ca95SAdrien Mazarguil  * Set device MTU.
270cf37ca95SAdrien Mazarguil  *
271af4f09f2SNélio Laranjeiro  * @param dev
272af4f09f2SNélio Laranjeiro  *   Pointer to Ethernet device.
273cf37ca95SAdrien Mazarguil  * @param mtu
274cf37ca95SAdrien Mazarguil  *   MTU value to set.
275cf37ca95SAdrien Mazarguil  *
276cf37ca95SAdrien Mazarguil  * @return
277a6d83b6aSNélio Laranjeiro  *   0 on success, a negative errno value otherwise and rte_errno is set.
278cf37ca95SAdrien Mazarguil  */
279cf37ca95SAdrien Mazarguil static int
280af4f09f2SNélio Laranjeiro mlx5_set_mtu(struct rte_eth_dev *dev, uint16_t mtu)
281cf37ca95SAdrien Mazarguil {
282fc40db99SAdrien Mazarguil 	struct ifreq request = { .ifr_mtu = mtu, };
283f3b492d7SAdrien Mazarguil 
284af4f09f2SNélio Laranjeiro 	return mlx5_ifreq(dev, SIOCSIFMTU, &request);
285cf37ca95SAdrien Mazarguil }
286cf37ca95SAdrien Mazarguil 
287cf37ca95SAdrien Mazarguil /**
288771fa900SAdrien Mazarguil  * Set device flags.
289771fa900SAdrien Mazarguil  *
290af4f09f2SNélio Laranjeiro  * @param dev
291af4f09f2SNélio Laranjeiro  *   Pointer to Ethernet device.
292771fa900SAdrien Mazarguil  * @param keep
293771fa900SAdrien Mazarguil  *   Bitmask for flags that must remain untouched.
294771fa900SAdrien Mazarguil  * @param flags
295771fa900SAdrien Mazarguil  *   Bitmask for flags to modify.
296771fa900SAdrien Mazarguil  *
297771fa900SAdrien Mazarguil  * @return
298a6d83b6aSNélio Laranjeiro  *   0 on success, a negative errno value otherwise and rte_errno is set.
299771fa900SAdrien Mazarguil  */
300771fa900SAdrien Mazarguil int
301af4f09f2SNélio Laranjeiro mlx5_set_flags(struct rte_eth_dev *dev, unsigned int keep, unsigned int flags)
302771fa900SAdrien Mazarguil {
303fc40db99SAdrien Mazarguil 	struct ifreq request;
304af4f09f2SNélio Laranjeiro 	int ret = mlx5_ifreq(dev, SIOCGIFFLAGS, &request);
305771fa900SAdrien Mazarguil 
306fc40db99SAdrien Mazarguil 	if (ret)
307fc40db99SAdrien Mazarguil 		return ret;
308fc40db99SAdrien Mazarguil 	request.ifr_flags &= keep;
309fc40db99SAdrien Mazarguil 	request.ifr_flags |= flags & ~keep;
310af4f09f2SNélio Laranjeiro 	return mlx5_ifreq(dev, SIOCSIFFLAGS, &request);
311771fa900SAdrien Mazarguil }
312771fa900SAdrien Mazarguil 
313771fa900SAdrien Mazarguil /**
3147b2423cdSNélio Laranjeiro  * DPDK callback for Ethernet device configuration.
315e60fbd5bSAdrien Mazarguil  *
316e60fbd5bSAdrien Mazarguil  * @param dev
317e60fbd5bSAdrien Mazarguil  *   Pointer to Ethernet device structure.
318e60fbd5bSAdrien Mazarguil  *
319e60fbd5bSAdrien Mazarguil  * @return
320a6d83b6aSNélio Laranjeiro  *   0 on success, a negative errno value otherwise and rte_errno is set.
321e60fbd5bSAdrien Mazarguil  */
3227b2423cdSNélio Laranjeiro int
3237b2423cdSNélio Laranjeiro mlx5_dev_configure(struct rte_eth_dev *dev)
324e60fbd5bSAdrien Mazarguil {
325e60fbd5bSAdrien Mazarguil 	struct priv *priv = dev->data->dev_private;
326e60fbd5bSAdrien Mazarguil 	unsigned int rxqs_n = dev->data->nb_rx_queues;
327e60fbd5bSAdrien Mazarguil 	unsigned int txqs_n = dev->data->nb_tx_queues;
328634efbc2SNelio Laranjeiro 	unsigned int i;
329634efbc2SNelio Laranjeiro 	unsigned int j;
330634efbc2SNelio Laranjeiro 	unsigned int reta_idx_n;
33129c1d8bbSNélio Laranjeiro 	const uint8_t use_app_rss_key =
33221e3a974SShahaf Shuler 		!!dev->data->dev_conf.rx_adv_conf.rss_conf.rss_key;
333af4f09f2SNélio Laranjeiro 	uint64_t supp_tx_offloads = mlx5_get_tx_port_offloads(dev);
334dbccb4cdSShahaf Shuler 	uint64_t tx_offloads = dev->data->dev_conf.txmode.offloads;
33517b843ebSShahaf Shuler 	uint64_t supp_rx_offloads =
336af4f09f2SNélio Laranjeiro 		(mlx5_get_rx_port_offloads() |
337af4f09f2SNélio Laranjeiro 		 mlx5_get_rx_queue_offloads(dev));
33817b843ebSShahaf Shuler 	uint64_t rx_offloads = dev->data->dev_conf.rxmode.offloads;
339a6d83b6aSNélio Laranjeiro 	int ret = 0;
340e60fbd5bSAdrien Mazarguil 
341dbccb4cdSShahaf Shuler 	if ((tx_offloads & supp_tx_offloads) != tx_offloads) {
342a170a30dSNélio Laranjeiro 		DRV_LOG(ERR,
343a170a30dSNélio Laranjeiro 			"port %u some Tx offloads are not supported requested"
344a170a30dSNélio Laranjeiro 			" 0x%" PRIx64 " supported 0x%" PRIx64,
3450f99970bSNélio Laranjeiro 			dev->data->port_id, tx_offloads, supp_tx_offloads);
346a6d83b6aSNélio Laranjeiro 		rte_errno = ENOTSUP;
347a6d83b6aSNélio Laranjeiro 		return -rte_errno;
348dbccb4cdSShahaf Shuler 	}
34917b843ebSShahaf Shuler 	if ((rx_offloads & supp_rx_offloads) != rx_offloads) {
350a170a30dSNélio Laranjeiro 		DRV_LOG(ERR,
351a170a30dSNélio Laranjeiro 			"port %u some Rx offloads are not supported requested"
352a170a30dSNélio Laranjeiro 			" 0x%" PRIx64 " supported 0x%" PRIx64,
3530f99970bSNélio Laranjeiro 			dev->data->port_id, rx_offloads, supp_rx_offloads);
354a6d83b6aSNélio Laranjeiro 		rte_errno = ENOTSUP;
355a6d83b6aSNélio Laranjeiro 		return -rte_errno;
35617b843ebSShahaf Shuler 	}
35729c1d8bbSNélio Laranjeiro 	if (use_app_rss_key &&
35829c1d8bbSNélio Laranjeiro 	    (dev->data->dev_conf.rx_adv_conf.rss_conf.rss_key_len !=
35929c1d8bbSNélio Laranjeiro 	     rss_hash_default_key_len)) {
360a1572312SShahaf Shuler 		DRV_LOG(ERR, "port %u RSS key len must be %zu Bytes long",
361a1572312SShahaf Shuler 			dev->data->port_id, rss_hash_default_key_len);
362a6d83b6aSNélio Laranjeiro 		rte_errno = EINVAL;
363a6d83b6aSNélio Laranjeiro 		return -rte_errno;
36429c1d8bbSNélio Laranjeiro 	}
36529c1d8bbSNélio Laranjeiro 	priv->rss_conf.rss_key =
36629c1d8bbSNélio Laranjeiro 		rte_realloc(priv->rss_conf.rss_key,
36729c1d8bbSNélio Laranjeiro 			    rss_hash_default_key_len, 0);
36829c1d8bbSNélio Laranjeiro 	if (!priv->rss_conf.rss_key) {
369a170a30dSNélio Laranjeiro 		DRV_LOG(ERR, "port %u cannot allocate RSS hash key memory (%u)",
3700f99970bSNélio Laranjeiro 			dev->data->port_id, rxqs_n);
371a6d83b6aSNélio Laranjeiro 		rte_errno = ENOMEM;
372a6d83b6aSNélio Laranjeiro 		return -rte_errno;
37329c1d8bbSNélio Laranjeiro 	}
37429c1d8bbSNélio Laranjeiro 	memcpy(priv->rss_conf.rss_key,
37529c1d8bbSNélio Laranjeiro 	       use_app_rss_key ?
37629c1d8bbSNélio Laranjeiro 	       dev->data->dev_conf.rx_adv_conf.rss_conf.rss_key :
37729c1d8bbSNélio Laranjeiro 	       rss_hash_default_key,
37829c1d8bbSNélio Laranjeiro 	       rss_hash_default_key_len);
37929c1d8bbSNélio Laranjeiro 	priv->rss_conf.rss_key_len = rss_hash_default_key_len;
38029c1d8bbSNélio Laranjeiro 	priv->rss_conf.rss_hf = dev->data->dev_conf.rx_adv_conf.rss_conf.rss_hf;
381e60fbd5bSAdrien Mazarguil 	priv->rxqs = (void *)dev->data->rx_queues;
382e60fbd5bSAdrien Mazarguil 	priv->txqs = (void *)dev->data->tx_queues;
383e60fbd5bSAdrien Mazarguil 	if (txqs_n != priv->txqs_n) {
384a170a30dSNélio Laranjeiro 		DRV_LOG(INFO, "port %u Tx queues number update: %u -> %u",
3850f99970bSNélio Laranjeiro 			dev->data->port_id, priv->txqs_n, txqs_n);
386e60fbd5bSAdrien Mazarguil 		priv->txqs_n = txqs_n;
387e60fbd5bSAdrien Mazarguil 	}
3887fe24446SShahaf Shuler 	if (rxqs_n > priv->config.ind_table_max_size) {
389a170a30dSNélio Laranjeiro 		DRV_LOG(ERR, "port %u cannot handle this many Rx queues (%u)",
3900f99970bSNélio Laranjeiro 			dev->data->port_id, rxqs_n);
391a6d83b6aSNélio Laranjeiro 		rte_errno = EINVAL;
392a6d83b6aSNélio Laranjeiro 		return -rte_errno;
393634efbc2SNelio Laranjeiro 	}
394e60fbd5bSAdrien Mazarguil 	if (rxqs_n == priv->rxqs_n)
395e60fbd5bSAdrien Mazarguil 		return 0;
396a170a30dSNélio Laranjeiro 	DRV_LOG(INFO, "port %u Rx queues number update: %u -> %u",
3970f99970bSNélio Laranjeiro 		dev->data->port_id, priv->rxqs_n, rxqs_n);
398e60fbd5bSAdrien Mazarguil 	priv->rxqs_n = rxqs_n;
399634efbc2SNelio Laranjeiro 	/* If the requested number of RX queues is not a power of two, use the
400634efbc2SNelio Laranjeiro 	 * maximum indirection table size for better balancing.
401634efbc2SNelio Laranjeiro 	 * The result is always rounded to the next power of two. */
402634efbc2SNelio Laranjeiro 	reta_idx_n = (1 << log2above((rxqs_n & (rxqs_n - 1)) ?
4037fe24446SShahaf Shuler 				     priv->config.ind_table_max_size :
404634efbc2SNelio Laranjeiro 				     rxqs_n));
405a6d83b6aSNélio Laranjeiro 	ret = mlx5_rss_reta_index_resize(dev, reta_idx_n);
406a6d83b6aSNélio Laranjeiro 	if (ret)
407a6d83b6aSNélio Laranjeiro 		return ret;
408634efbc2SNelio Laranjeiro 	/* When the number of RX queues is not a power of two, the remaining
409634efbc2SNelio Laranjeiro 	 * table entries are padded with reused WQs and hashes are not spread
410634efbc2SNelio Laranjeiro 	 * uniformly. */
411634efbc2SNelio Laranjeiro 	for (i = 0, j = 0; (i != reta_idx_n); ++i) {
412634efbc2SNelio Laranjeiro 		(*priv->reta_idx)[i] = j;
413634efbc2SNelio Laranjeiro 		if (++j == rxqs_n)
414634efbc2SNelio Laranjeiro 			j = 0;
415634efbc2SNelio Laranjeiro 	}
416e60fbd5bSAdrien Mazarguil 	return 0;
417e60fbd5bSAdrien Mazarguil }
418e60fbd5bSAdrien Mazarguil 
419e60fbd5bSAdrien Mazarguil /**
420*d11d651fSShahaf Shuler  * Sets default tuning parameters.
421*d11d651fSShahaf Shuler  *
422*d11d651fSShahaf Shuler  * @param dev
423*d11d651fSShahaf Shuler  *   Pointer to Ethernet device.
424*d11d651fSShahaf Shuler  * @param[out] info
425*d11d651fSShahaf Shuler  *   Info structure output buffer.
426*d11d651fSShahaf Shuler  */
427*d11d651fSShahaf Shuler static void
428*d11d651fSShahaf Shuler mlx5_set_default_params(struct rte_eth_dev *dev, struct rte_eth_dev_info *info)
429*d11d651fSShahaf Shuler {
430*d11d651fSShahaf Shuler 	struct priv *priv = dev->data->dev_private;
431*d11d651fSShahaf Shuler 
432*d11d651fSShahaf Shuler 	/* Minimum CPU utilization. */
433*d11d651fSShahaf Shuler 	info->default_rxportconf.ring_size = 256;
434*d11d651fSShahaf Shuler 	info->default_txportconf.ring_size = 256;
435*d11d651fSShahaf Shuler 	info->default_rxportconf.burst_size = 64;
436*d11d651fSShahaf Shuler 	info->default_txportconf.burst_size = 64;
437*d11d651fSShahaf Shuler 	if (priv->link_speed_capa & ETH_LINK_SPEED_100G) {
438*d11d651fSShahaf Shuler 		info->default_rxportconf.nb_queues = 16;
439*d11d651fSShahaf Shuler 		info->default_txportconf.nb_queues = 16;
440*d11d651fSShahaf Shuler 		if (dev->data->nb_rx_queues > 2 ||
441*d11d651fSShahaf Shuler 		    dev->data->nb_tx_queues > 2) {
442*d11d651fSShahaf Shuler 			/* Max Throughput. */
443*d11d651fSShahaf Shuler 			info->default_rxportconf.ring_size = 2048;
444*d11d651fSShahaf Shuler 			info->default_txportconf.ring_size = 2048;
445*d11d651fSShahaf Shuler 		}
446*d11d651fSShahaf Shuler 	} else {
447*d11d651fSShahaf Shuler 		info->default_rxportconf.nb_queues = 8;
448*d11d651fSShahaf Shuler 		info->default_txportconf.nb_queues = 8;
449*d11d651fSShahaf Shuler 		if (dev->data->nb_rx_queues > 2 ||
450*d11d651fSShahaf Shuler 		    dev->data->nb_tx_queues > 2) {
451*d11d651fSShahaf Shuler 			/* Max Throughput. */
452*d11d651fSShahaf Shuler 			info->default_rxportconf.ring_size = 4096;
453*d11d651fSShahaf Shuler 			info->default_txportconf.ring_size = 4096;
454*d11d651fSShahaf Shuler 		}
455*d11d651fSShahaf Shuler 	}
456*d11d651fSShahaf Shuler }
457*d11d651fSShahaf Shuler 
458*d11d651fSShahaf Shuler /**
459e60fbd5bSAdrien Mazarguil  * DPDK callback to get information about the device.
460e60fbd5bSAdrien Mazarguil  *
461e60fbd5bSAdrien Mazarguil  * @param dev
462e60fbd5bSAdrien Mazarguil  *   Pointer to Ethernet device structure.
463e60fbd5bSAdrien Mazarguil  * @param[out] info
464e60fbd5bSAdrien Mazarguil  *   Info structure output buffer.
465e60fbd5bSAdrien Mazarguil  */
466e60fbd5bSAdrien Mazarguil void
467e60fbd5bSAdrien Mazarguil mlx5_dev_infos_get(struct rte_eth_dev *dev, struct rte_eth_dev_info *info)
468e60fbd5bSAdrien Mazarguil {
46901d79216SNélio Laranjeiro 	struct priv *priv = dev->data->dev_private;
4707fe24446SShahaf Shuler 	struct mlx5_dev_config *config = &priv->config;
471e60fbd5bSAdrien Mazarguil 	unsigned int max;
472e60fbd5bSAdrien Mazarguil 	char ifname[IF_NAMESIZE];
473e60fbd5bSAdrien Mazarguil 
474e60fbd5bSAdrien Mazarguil 	/* FIXME: we should ask the device for these values. */
475e60fbd5bSAdrien Mazarguil 	info->min_rx_bufsize = 32;
476e60fbd5bSAdrien Mazarguil 	info->max_rx_pktlen = 65536;
477e60fbd5bSAdrien Mazarguil 	/*
478e60fbd5bSAdrien Mazarguil 	 * Since we need one CQ per QP, the limit is the minimum number
479e60fbd5bSAdrien Mazarguil 	 * between the two values.
480e60fbd5bSAdrien Mazarguil 	 */
48143e9d979SShachar Beiser 	max = RTE_MIN(priv->device_attr.orig_attr.max_cq,
48243e9d979SShachar Beiser 		      priv->device_attr.orig_attr.max_qp);
483e60fbd5bSAdrien Mazarguil 	/* If max >= 65535 then max = 0, max_rx_queues is uint16_t. */
484e60fbd5bSAdrien Mazarguil 	if (max >= 65535)
485e60fbd5bSAdrien Mazarguil 		max = 65535;
486e60fbd5bSAdrien Mazarguil 	info->max_rx_queues = max;
487e60fbd5bSAdrien Mazarguil 	info->max_tx_queues = max;
48818c01b98SNélio Laranjeiro 	info->max_mac_addrs = MLX5_MAX_UC_MAC_ADDRESSES;
489af4f09f2SNélio Laranjeiro 	info->rx_queue_offload_capa = mlx5_get_rx_queue_offloads(dev);
490af4f09f2SNélio Laranjeiro 	info->rx_offload_capa = (mlx5_get_rx_port_offloads() |
49117b843ebSShahaf Shuler 				 info->rx_queue_offload_capa);
492af4f09f2SNélio Laranjeiro 	info->tx_offload_capa = mlx5_get_tx_port_offloads(dev);
493af4f09f2SNélio Laranjeiro 	if (mlx5_get_ifname(dev, &ifname) == 0)
494e60fbd5bSAdrien Mazarguil 		info->if_index = if_nametoindex(ifname);
495d365210eSYongseok Koh 	info->reta_size = priv->reta_idx_n ?
4967fe24446SShahaf Shuler 		priv->reta_idx_n : config->ind_table_max_size;
497e7041f55SShahaf Shuler 	info->hash_key_size = rss_hash_default_key_len;
49875ef62a9SNélio Laranjeiro 	info->speed_capa = priv->link_speed_capa;
499b233b027SShahaf Shuler 	info->flow_type_rss_offloads = ~MLX5_RSS_HF_MASK;
500*d11d651fSShahaf Shuler 	mlx5_set_default_params(dev, info);
501e60fbd5bSAdrien Mazarguil }
502e60fbd5bSAdrien Mazarguil 
503fb732b0aSNélio Laranjeiro /**
504fb732b0aSNélio Laranjeiro  * Get supported packet types.
505fb732b0aSNélio Laranjeiro  *
506fb732b0aSNélio Laranjeiro  * @param dev
507fb732b0aSNélio Laranjeiro  *   Pointer to Ethernet device structure.
508fb732b0aSNélio Laranjeiro  *
509fb732b0aSNélio Laranjeiro  * @return
510fb732b0aSNélio Laranjeiro  *   A pointer to the supported Packet types array.
511fb732b0aSNélio Laranjeiro  */
51278a38edfSJianfeng Tan const uint32_t *
51378a38edfSJianfeng Tan mlx5_dev_supported_ptypes_get(struct rte_eth_dev *dev)
51478a38edfSJianfeng Tan {
51578a38edfSJianfeng Tan 	static const uint32_t ptypes[] = {
51678a38edfSJianfeng Tan 		/* refers to rxq_cq_to_pkt_type() */
517ea16068cSYongseok Koh 		RTE_PTYPE_L2_ETHER,
518c4ba5434SNélio Laranjeiro 		RTE_PTYPE_L3_IPV4_EXT_UNKNOWN,
519c4ba5434SNélio Laranjeiro 		RTE_PTYPE_L3_IPV6_EXT_UNKNOWN,
520ea16068cSYongseok Koh 		RTE_PTYPE_L4_NONFRAG,
521ea16068cSYongseok Koh 		RTE_PTYPE_L4_FRAG,
522ea16068cSYongseok Koh 		RTE_PTYPE_L4_TCP,
523ea16068cSYongseok Koh 		RTE_PTYPE_L4_UDP,
524c4ba5434SNélio Laranjeiro 		RTE_PTYPE_INNER_L3_IPV4_EXT_UNKNOWN,
525c4ba5434SNélio Laranjeiro 		RTE_PTYPE_INNER_L3_IPV6_EXT_UNKNOWN,
526ea16068cSYongseok Koh 		RTE_PTYPE_INNER_L4_NONFRAG,
527ea16068cSYongseok Koh 		RTE_PTYPE_INNER_L4_FRAG,
528ea16068cSYongseok Koh 		RTE_PTYPE_INNER_L4_TCP,
529ea16068cSYongseok Koh 		RTE_PTYPE_INNER_L4_UDP,
53078a38edfSJianfeng Tan 		RTE_PTYPE_UNKNOWN
53178a38edfSJianfeng Tan 	};
53278a38edfSJianfeng Tan 
5336cb559d6SYongseok Koh 	if (dev->rx_pkt_burst == mlx5_rx_burst ||
5346cb559d6SYongseok Koh 	    dev->rx_pkt_burst == mlx5_rx_burst_vec)
53578a38edfSJianfeng Tan 		return ptypes;
53678a38edfSJianfeng Tan 	return NULL;
53778a38edfSJianfeng Tan }
53878a38edfSJianfeng Tan 
539e60fbd5bSAdrien Mazarguil /**
5402c960a51SMatthieu Ternisien d'Ouville  * DPDK callback to retrieve physical link information.
541cb8faed7SAdrien Mazarguil  *
542cb8faed7SAdrien Mazarguil  * @param dev
543cb8faed7SAdrien Mazarguil  *   Pointer to Ethernet device structure.
544cfee9475SNélio Laranjeiro  * @param[out] link
545cfee9475SNélio Laranjeiro  *   Storage for current link status.
546fb732b0aSNélio Laranjeiro  *
547fb732b0aSNélio Laranjeiro  * @return
548a6d83b6aSNélio Laranjeiro  *   0 on success, a negative errno value otherwise and rte_errno is set.
549cb8faed7SAdrien Mazarguil  */
55018840871SNélio Laranjeiro static int
551cfee9475SNélio Laranjeiro mlx5_link_update_unlocked_gset(struct rte_eth_dev *dev,
552cfee9475SNélio Laranjeiro 			       struct rte_eth_link *link)
553cb8faed7SAdrien Mazarguil {
55401d79216SNélio Laranjeiro 	struct priv *priv = dev->data->dev_private;
555cb8faed7SAdrien Mazarguil 	struct ethtool_cmd edata = {
55675ef62a9SNélio Laranjeiro 		.cmd = ETHTOOL_GSET /* Deprecated since Linux v4.5. */
557cb8faed7SAdrien Mazarguil 	};
558cb8faed7SAdrien Mazarguil 	struct ifreq ifr;
559cb8faed7SAdrien Mazarguil 	struct rte_eth_link dev_link;
560cb8faed7SAdrien Mazarguil 	int link_speed = 0;
561a6d83b6aSNélio Laranjeiro 	int ret;
562cb8faed7SAdrien Mazarguil 
563a6d83b6aSNélio Laranjeiro 	ret = mlx5_ifreq(dev, SIOCGIFFLAGS, &ifr);
564a6d83b6aSNélio Laranjeiro 	if (ret) {
565a170a30dSNélio Laranjeiro 		DRV_LOG(WARNING, "port %u ioctl(SIOCGIFFLAGS) failed: %s",
5660f99970bSNélio Laranjeiro 			dev->data->port_id, strerror(rte_errno));
567a6d83b6aSNélio Laranjeiro 		return ret;
568cb8faed7SAdrien Mazarguil 	}
569cb8faed7SAdrien Mazarguil 	memset(&dev_link, 0, sizeof(dev_link));
570cb8faed7SAdrien Mazarguil 	dev_link.link_status = ((ifr.ifr_flags & IFF_UP) &&
571cb8faed7SAdrien Mazarguil 				(ifr.ifr_flags & IFF_RUNNING));
572d06c608cSAdrien Mazarguil 	ifr.ifr_data = (void *)&edata;
573a6d83b6aSNélio Laranjeiro 	ret = mlx5_ifreq(dev, SIOCETHTOOL, &ifr);
574a6d83b6aSNélio Laranjeiro 	if (ret) {
575a170a30dSNélio Laranjeiro 		DRV_LOG(WARNING,
576a170a30dSNélio Laranjeiro 			"port %u ioctl(SIOCETHTOOL, ETHTOOL_GSET) failed: %s",
5770f99970bSNélio Laranjeiro 			dev->data->port_id, strerror(rte_errno));
578a6d83b6aSNélio Laranjeiro 		return ret;
579cb8faed7SAdrien Mazarguil 	}
580cb8faed7SAdrien Mazarguil 	link_speed = ethtool_cmd_speed(&edata);
581cb8faed7SAdrien Mazarguil 	if (link_speed == -1)
5823fef0822SFerruh Yigit 		dev_link.link_speed = ETH_SPEED_NUM_NONE;
583cb8faed7SAdrien Mazarguil 	else
584cb8faed7SAdrien Mazarguil 		dev_link.link_speed = link_speed;
58575ef62a9SNélio Laranjeiro 	priv->link_speed_capa = 0;
58675ef62a9SNélio Laranjeiro 	if (edata.supported & SUPPORTED_Autoneg)
58775ef62a9SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_AUTONEG;
58875ef62a9SNélio Laranjeiro 	if (edata.supported & (SUPPORTED_1000baseT_Full |
58975ef62a9SNélio Laranjeiro 			       SUPPORTED_1000baseKX_Full))
59075ef62a9SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_1G;
59175ef62a9SNélio Laranjeiro 	if (edata.supported & SUPPORTED_10000baseKR_Full)
59275ef62a9SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_10G;
59375ef62a9SNélio Laranjeiro 	if (edata.supported & (SUPPORTED_40000baseKR4_Full |
59475ef62a9SNélio Laranjeiro 			       SUPPORTED_40000baseCR4_Full |
59575ef62a9SNélio Laranjeiro 			       SUPPORTED_40000baseSR4_Full |
59675ef62a9SNélio Laranjeiro 			       SUPPORTED_40000baseLR4_Full))
59775ef62a9SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_40G;
598cb8faed7SAdrien Mazarguil 	dev_link.link_duplex = ((edata.duplex == DUPLEX_HALF) ?
599cb8faed7SAdrien Mazarguil 				ETH_LINK_HALF_DUPLEX : ETH_LINK_FULL_DUPLEX);
60082113036SMarc Sune 	dev_link.link_autoneg = !(dev->data->dev_conf.link_speeds &
60182113036SMarc Sune 			ETH_LINK_SPEED_FIXED);
602cfee9475SNélio Laranjeiro 	if ((dev_link.link_speed && !dev_link.link_status) ||
603cfee9475SNélio Laranjeiro 	    (!dev_link.link_speed && dev_link.link_status)) {
604a6d83b6aSNélio Laranjeiro 		rte_errno = EAGAIN;
605a6d83b6aSNélio Laranjeiro 		return -rte_errno;
606cb8faed7SAdrien Mazarguil 	}
607cfee9475SNélio Laranjeiro 	*link = dev_link;
608cfee9475SNélio Laranjeiro 	return 0;
609cfee9475SNélio Laranjeiro }
610cb8faed7SAdrien Mazarguil 
611cb8faed7SAdrien Mazarguil /**
6123a49ffe3SShahaf Shuler  * Retrieve physical link information (unlocked version using new ioctl).
61318840871SNélio Laranjeiro  *
61418840871SNélio Laranjeiro  * @param dev
61518840871SNélio Laranjeiro  *   Pointer to Ethernet device structure.
616cfee9475SNélio Laranjeiro  * @param[out] link
617cfee9475SNélio Laranjeiro  *   Storage for current link status.
618fb732b0aSNélio Laranjeiro  *
619fb732b0aSNélio Laranjeiro  * @return
620a6d83b6aSNélio Laranjeiro  *   0 on success, a negative errno value otherwise and rte_errno is set.
62118840871SNélio Laranjeiro  */
62218840871SNélio Laranjeiro static int
623cfee9475SNélio Laranjeiro mlx5_link_update_unlocked_gs(struct rte_eth_dev *dev,
624cfee9475SNélio Laranjeiro 			     struct rte_eth_link *link)
625cfee9475SNélio Laranjeiro 
62618840871SNélio Laranjeiro {
62701d79216SNélio Laranjeiro 	struct priv *priv = dev->data->dev_private;
62837a4406cSNélio Laranjeiro 	struct ethtool_link_settings gcmd = { .cmd = ETHTOOL_GLINKSETTINGS };
62918840871SNélio Laranjeiro 	struct ifreq ifr;
63018840871SNélio Laranjeiro 	struct rte_eth_link dev_link;
63118840871SNélio Laranjeiro 	uint64_t sc;
632a6d83b6aSNélio Laranjeiro 	int ret;
63318840871SNélio Laranjeiro 
634a6d83b6aSNélio Laranjeiro 	ret = mlx5_ifreq(dev, SIOCGIFFLAGS, &ifr);
635a6d83b6aSNélio Laranjeiro 	if (ret) {
636a170a30dSNélio Laranjeiro 		DRV_LOG(WARNING, "port %u ioctl(SIOCGIFFLAGS) failed: %s",
6370f99970bSNélio Laranjeiro 			dev->data->port_id, strerror(rte_errno));
638a6d83b6aSNélio Laranjeiro 		return ret;
63918840871SNélio Laranjeiro 	}
64018840871SNélio Laranjeiro 	memset(&dev_link, 0, sizeof(dev_link));
64118840871SNélio Laranjeiro 	dev_link.link_status = ((ifr.ifr_flags & IFF_UP) &&
64218840871SNélio Laranjeiro 				(ifr.ifr_flags & IFF_RUNNING));
64337a4406cSNélio Laranjeiro 	ifr.ifr_data = (void *)&gcmd;
644a6d83b6aSNélio Laranjeiro 	ret = mlx5_ifreq(dev, SIOCETHTOOL, &ifr);
645a6d83b6aSNélio Laranjeiro 	if (ret) {
646a170a30dSNélio Laranjeiro 		DRV_LOG(DEBUG,
647a170a30dSNélio Laranjeiro 			"port %u ioctl(SIOCETHTOOL, ETHTOOL_GLINKSETTINGS)"
648a170a30dSNélio Laranjeiro 			" failed: %s",
649a170a30dSNélio Laranjeiro 			dev->data->port_id, strerror(rte_errno));
650a6d83b6aSNélio Laranjeiro 		return ret;
65118840871SNélio Laranjeiro 	}
65237a4406cSNélio Laranjeiro 	gcmd.link_mode_masks_nwords = -gcmd.link_mode_masks_nwords;
65337a4406cSNélio Laranjeiro 
65437a4406cSNélio Laranjeiro 	alignas(struct ethtool_link_settings)
65537a4406cSNélio Laranjeiro 	uint8_t data[offsetof(struct ethtool_link_settings, link_mode_masks) +
65637a4406cSNélio Laranjeiro 		     sizeof(uint32_t) * gcmd.link_mode_masks_nwords * 3];
65737a4406cSNélio Laranjeiro 	struct ethtool_link_settings *ecmd = (void *)data;
65837a4406cSNélio Laranjeiro 
65937a4406cSNélio Laranjeiro 	*ecmd = gcmd;
66037a4406cSNélio Laranjeiro 	ifr.ifr_data = (void *)ecmd;
661a6d83b6aSNélio Laranjeiro 	ret = mlx5_ifreq(dev, SIOCETHTOOL, &ifr);
662a6d83b6aSNélio Laranjeiro 	if (ret) {
663a170a30dSNélio Laranjeiro 		DRV_LOG(DEBUG,
664a170a30dSNélio Laranjeiro 			"port %u ioctl(SIOCETHTOOL, ETHTOOL_GLINKSETTINGS)"
665a170a30dSNélio Laranjeiro 			" failed: %s",
666a170a30dSNélio Laranjeiro 			dev->data->port_id, strerror(rte_errno));
667a6d83b6aSNélio Laranjeiro 		return ret;
668ef09a7fcSGowrishankar Muthukrishnan 	}
66990260d57SNélio Laranjeiro 	dev_link.link_speed = ecmd->speed;
67090260d57SNélio Laranjeiro 	sc = ecmd->link_mode_masks[0] |
67190260d57SNélio Laranjeiro 		((uint64_t)ecmd->link_mode_masks[1] << 32);
67218840871SNélio Laranjeiro 	priv->link_speed_capa = 0;
673b113cb5eSEdward Makarov 	if (sc & MLX5_BITSHIFT(ETHTOOL_LINK_MODE_Autoneg_BIT))
67418840871SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_AUTONEG;
675b113cb5eSEdward Makarov 	if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_1000baseT_Full_BIT) |
676b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_1000baseKX_Full_BIT)))
67718840871SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_1G;
678b113cb5eSEdward Makarov 	if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_10000baseKX4_Full_BIT) |
679b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_10000baseKR_Full_BIT) |
680b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_10000baseR_FEC_BIT)))
68118840871SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_10G;
682b113cb5eSEdward Makarov 	if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_20000baseMLD2_Full_BIT) |
683b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_20000baseKR2_Full_BIT)))
68418840871SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_20G;
685b113cb5eSEdward Makarov 	if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_40000baseKR4_Full_BIT) |
686b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_40000baseCR4_Full_BIT) |
687b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_40000baseSR4_Full_BIT) |
688b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_40000baseLR4_Full_BIT)))
68918840871SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_40G;
690b113cb5eSEdward Makarov 	if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_56000baseKR4_Full_BIT) |
691b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_56000baseCR4_Full_BIT) |
692b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_56000baseSR4_Full_BIT) |
693b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_56000baseLR4_Full_BIT)))
69418840871SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_56G;
695b113cb5eSEdward Makarov 	if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_25000baseCR_Full_BIT) |
696b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_25000baseKR_Full_BIT) |
697b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_25000baseSR_Full_BIT)))
69818840871SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_25G;
699b113cb5eSEdward Makarov 	if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_50000baseCR2_Full_BIT) |
700b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_50000baseKR2_Full_BIT)))
70118840871SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_50G;
702b113cb5eSEdward Makarov 	if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_100000baseKR4_Full_BIT) |
703b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_100000baseSR4_Full_BIT) |
704b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_100000baseCR4_Full_BIT) |
705b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_100000baseLR4_ER4_Full_BIT)))
70618840871SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_100G;
70790260d57SNélio Laranjeiro 	dev_link.link_duplex = ((ecmd->duplex == DUPLEX_HALF) ?
70818840871SNélio Laranjeiro 				ETH_LINK_HALF_DUPLEX : ETH_LINK_FULL_DUPLEX);
70918840871SNélio Laranjeiro 	dev_link.link_autoneg = !(dev->data->dev_conf.link_speeds &
71018840871SNélio Laranjeiro 				  ETH_LINK_SPEED_FIXED);
711cfee9475SNélio Laranjeiro 	if ((dev_link.link_speed && !dev_link.link_status) ||
712cfee9475SNélio Laranjeiro 	    (!dev_link.link_speed && dev_link.link_status)) {
713a6d83b6aSNélio Laranjeiro 		rte_errno = EAGAIN;
714a6d83b6aSNélio Laranjeiro 		return -rte_errno;
71518840871SNélio Laranjeiro 	}
716cfee9475SNélio Laranjeiro 	*link = dev_link;
717cfee9475SNélio Laranjeiro 	return 0;
718cfee9475SNélio Laranjeiro }
71918840871SNélio Laranjeiro 
72018840871SNélio Laranjeiro /**
721cb8faed7SAdrien Mazarguil  * DPDK callback to retrieve physical link information.
722cb8faed7SAdrien Mazarguil  *
723cb8faed7SAdrien Mazarguil  * @param dev
724cb8faed7SAdrien Mazarguil  *   Pointer to Ethernet device structure.
725cb8faed7SAdrien Mazarguil  * @param wait_to_complete
726cfee9475SNélio Laranjeiro  *   Wait for request completion.
727fb732b0aSNélio Laranjeiro  *
728fb732b0aSNélio Laranjeiro  * @return
729cfee9475SNélio Laranjeiro  *   0 if link status was not updated, positive if it was, a negative errno
730cfee9475SNélio Laranjeiro  *   value otherwise and rte_errno is set.
731cb8faed7SAdrien Mazarguil  */
732cb8faed7SAdrien Mazarguil int
733cfee9475SNélio Laranjeiro mlx5_link_update(struct rte_eth_dev *dev, int wait_to_complete)
734cb8faed7SAdrien Mazarguil {
735c7bf6225SYongseok Koh 	int ret;
736cfee9475SNélio Laranjeiro 	struct rte_eth_link dev_link;
737cfee9475SNélio Laranjeiro 	time_t start_time = time(NULL);
738cb8faed7SAdrien Mazarguil 
739cfee9475SNélio Laranjeiro 	do {
740cfee9475SNélio Laranjeiro 		ret = mlx5_link_update_unlocked_gs(dev, &dev_link);
7417d2e32f7SShahaf Shuler 		if (ret)
7427d2e32f7SShahaf Shuler 			ret = mlx5_link_update_unlocked_gset(dev, &dev_link);
743cfee9475SNélio Laranjeiro 		if (ret == 0)
744cfee9475SNélio Laranjeiro 			break;
745cfee9475SNélio Laranjeiro 		/* Handle wait to complete situation. */
746cfee9475SNélio Laranjeiro 		if (wait_to_complete && ret == -EAGAIN) {
747cfee9475SNélio Laranjeiro 			if (abs((int)difftime(time(NULL), start_time)) <
748cfee9475SNélio Laranjeiro 			    MLX5_LINK_STATUS_TIMEOUT) {
749cfee9475SNélio Laranjeiro 				usleep(0);
750cfee9475SNélio Laranjeiro 				continue;
751cfee9475SNélio Laranjeiro 			} else {
752cfee9475SNélio Laranjeiro 				rte_errno = EBUSY;
753cfee9475SNélio Laranjeiro 				return -rte_errno;
754cfee9475SNélio Laranjeiro 			}
755cfee9475SNélio Laranjeiro 		} else if (ret < 0) {
756cfee9475SNélio Laranjeiro 			return ret;
757cfee9475SNélio Laranjeiro 		}
758cfee9475SNélio Laranjeiro 	} while (wait_to_complete);
759cfee9475SNélio Laranjeiro 	ret = !!memcmp(&dev->data->dev_link, &dev_link,
760cfee9475SNélio Laranjeiro 		       sizeof(struct rte_eth_link));
761cfee9475SNélio Laranjeiro 	dev->data->dev_link = dev_link;
762cfee9475SNélio Laranjeiro 	return ret;
763cb8faed7SAdrien Mazarguil }
764cb8faed7SAdrien Mazarguil 
765cb8faed7SAdrien Mazarguil /**
766cf37ca95SAdrien Mazarguil  * DPDK callback to change the MTU.
767cf37ca95SAdrien Mazarguil  *
768cf37ca95SAdrien Mazarguil  * @param dev
769cf37ca95SAdrien Mazarguil  *   Pointer to Ethernet device structure.
770cf37ca95SAdrien Mazarguil  * @param in_mtu
771cf37ca95SAdrien Mazarguil  *   New MTU.
772cf37ca95SAdrien Mazarguil  *
773cf37ca95SAdrien Mazarguil  * @return
774a6d83b6aSNélio Laranjeiro  *   0 on success, a negative errno value otherwise and rte_errno is set.
775cf37ca95SAdrien Mazarguil  */
776cf37ca95SAdrien Mazarguil int
777cf37ca95SAdrien Mazarguil mlx5_dev_set_mtu(struct rte_eth_dev *dev, uint16_t mtu)
778cf37ca95SAdrien Mazarguil {
779cf37ca95SAdrien Mazarguil 	struct priv *priv = dev->data->dev_private;
780a6d83b6aSNélio Laranjeiro 	uint16_t kern_mtu = 0;
781a6d83b6aSNélio Laranjeiro 	int ret;
782cf37ca95SAdrien Mazarguil 
783af4f09f2SNélio Laranjeiro 	ret = mlx5_get_mtu(dev, &kern_mtu);
784a0edafe4SNelio Laranjeiro 	if (ret)
785a6d83b6aSNélio Laranjeiro 		return ret;
786cf37ca95SAdrien Mazarguil 	/* Set kernel interface MTU first. */
787af4f09f2SNélio Laranjeiro 	ret = mlx5_set_mtu(dev, mtu);
788a0edafe4SNelio Laranjeiro 	if (ret)
789a6d83b6aSNélio Laranjeiro 		return ret;
790af4f09f2SNélio Laranjeiro 	ret = mlx5_get_mtu(dev, &kern_mtu);
791a0edafe4SNelio Laranjeiro 	if (ret)
792a6d83b6aSNélio Laranjeiro 		return ret;
793a0edafe4SNelio Laranjeiro 	if (kern_mtu == mtu) {
794a0edafe4SNelio Laranjeiro 		priv->mtu = mtu;
795a170a30dSNélio Laranjeiro 		DRV_LOG(DEBUG, "port %u adapter MTU set to %u",
796a170a30dSNélio Laranjeiro 			dev->data->port_id, mtu);
797a0edafe4SNelio Laranjeiro 		return 0;
798a6d83b6aSNélio Laranjeiro 	}
799a6d83b6aSNélio Laranjeiro 	rte_errno = EAGAIN;
800a6d83b6aSNélio Laranjeiro 	return -rte_errno;
801cf37ca95SAdrien Mazarguil }
802cf37ca95SAdrien Mazarguil 
803cf37ca95SAdrien Mazarguil /**
80402d75430SAdrien Mazarguil  * DPDK callback to get flow control status.
80502d75430SAdrien Mazarguil  *
80602d75430SAdrien Mazarguil  * @param dev
80702d75430SAdrien Mazarguil  *   Pointer to Ethernet device structure.
80802d75430SAdrien Mazarguil  * @param[out] fc_conf
80902d75430SAdrien Mazarguil  *   Flow control output buffer.
81002d75430SAdrien Mazarguil  *
81102d75430SAdrien Mazarguil  * @return
812a6d83b6aSNélio Laranjeiro  *   0 on success, a negative errno value otherwise and rte_errno is set.
81302d75430SAdrien Mazarguil  */
81402d75430SAdrien Mazarguil int
81502d75430SAdrien Mazarguil mlx5_dev_get_flow_ctrl(struct rte_eth_dev *dev, struct rte_eth_fc_conf *fc_conf)
81602d75430SAdrien Mazarguil {
81702d75430SAdrien Mazarguil 	struct ifreq ifr;
81802d75430SAdrien Mazarguil 	struct ethtool_pauseparam ethpause = {
81902d75430SAdrien Mazarguil 		.cmd = ETHTOOL_GPAUSEPARAM
82002d75430SAdrien Mazarguil 	};
82102d75430SAdrien Mazarguil 	int ret;
82202d75430SAdrien Mazarguil 
823d06c608cSAdrien Mazarguil 	ifr.ifr_data = (void *)&ethpause;
824a6d83b6aSNélio Laranjeiro 	ret = mlx5_ifreq(dev, SIOCETHTOOL, &ifr);
825a6d83b6aSNélio Laranjeiro 	if (ret) {
826a170a30dSNélio Laranjeiro 		DRV_LOG(WARNING,
827a170a30dSNélio Laranjeiro 			"port %u ioctl(SIOCETHTOOL, ETHTOOL_GPAUSEPARAM) failed:"
828a170a30dSNélio Laranjeiro 			" %s",
829a170a30dSNélio Laranjeiro 			dev->data->port_id, strerror(rte_errno));
830a6d83b6aSNélio Laranjeiro 		return ret;
83102d75430SAdrien Mazarguil 	}
83202d75430SAdrien Mazarguil 	fc_conf->autoneg = ethpause.autoneg;
83302d75430SAdrien Mazarguil 	if (ethpause.rx_pause && ethpause.tx_pause)
83402d75430SAdrien Mazarguil 		fc_conf->mode = RTE_FC_FULL;
83502d75430SAdrien Mazarguil 	else if (ethpause.rx_pause)
83602d75430SAdrien Mazarguil 		fc_conf->mode = RTE_FC_RX_PAUSE;
83702d75430SAdrien Mazarguil 	else if (ethpause.tx_pause)
83802d75430SAdrien Mazarguil 		fc_conf->mode = RTE_FC_TX_PAUSE;
83902d75430SAdrien Mazarguil 	else
84002d75430SAdrien Mazarguil 		fc_conf->mode = RTE_FC_NONE;
841a6d83b6aSNélio Laranjeiro 	return 0;
84202d75430SAdrien Mazarguil }
84302d75430SAdrien Mazarguil 
84402d75430SAdrien Mazarguil /**
84502d75430SAdrien Mazarguil  * DPDK callback to modify flow control parameters.
84602d75430SAdrien Mazarguil  *
84702d75430SAdrien Mazarguil  * @param dev
84802d75430SAdrien Mazarguil  *   Pointer to Ethernet device structure.
84902d75430SAdrien Mazarguil  * @param[in] fc_conf
85002d75430SAdrien Mazarguil  *   Flow control parameters.
85102d75430SAdrien Mazarguil  *
85202d75430SAdrien Mazarguil  * @return
853a6d83b6aSNélio Laranjeiro  *   0 on success, a negative errno value otherwise and rte_errno is set.
85402d75430SAdrien Mazarguil  */
85502d75430SAdrien Mazarguil int
85602d75430SAdrien Mazarguil mlx5_dev_set_flow_ctrl(struct rte_eth_dev *dev, struct rte_eth_fc_conf *fc_conf)
85702d75430SAdrien Mazarguil {
85802d75430SAdrien Mazarguil 	struct ifreq ifr;
85902d75430SAdrien Mazarguil 	struct ethtool_pauseparam ethpause = {
86002d75430SAdrien Mazarguil 		.cmd = ETHTOOL_SPAUSEPARAM
86102d75430SAdrien Mazarguil 	};
86202d75430SAdrien Mazarguil 	int ret;
86302d75430SAdrien Mazarguil 
864d06c608cSAdrien Mazarguil 	ifr.ifr_data = (void *)&ethpause;
86502d75430SAdrien Mazarguil 	ethpause.autoneg = fc_conf->autoneg;
86602d75430SAdrien Mazarguil 	if (((fc_conf->mode & RTE_FC_FULL) == RTE_FC_FULL) ||
86702d75430SAdrien Mazarguil 	    (fc_conf->mode & RTE_FC_RX_PAUSE))
86802d75430SAdrien Mazarguil 		ethpause.rx_pause = 1;
86902d75430SAdrien Mazarguil 	else
87002d75430SAdrien Mazarguil 		ethpause.rx_pause = 0;
87102d75430SAdrien Mazarguil 
87202d75430SAdrien Mazarguil 	if (((fc_conf->mode & RTE_FC_FULL) == RTE_FC_FULL) ||
87302d75430SAdrien Mazarguil 	    (fc_conf->mode & RTE_FC_TX_PAUSE))
87402d75430SAdrien Mazarguil 		ethpause.tx_pause = 1;
87502d75430SAdrien Mazarguil 	else
87602d75430SAdrien Mazarguil 		ethpause.tx_pause = 0;
877a6d83b6aSNélio Laranjeiro 	ret = mlx5_ifreq(dev, SIOCETHTOOL, &ifr);
878a6d83b6aSNélio Laranjeiro 	if (ret) {
879a170a30dSNélio Laranjeiro 		DRV_LOG(WARNING,
880a170a30dSNélio Laranjeiro 			"port %u ioctl(SIOCETHTOOL, ETHTOOL_SPAUSEPARAM)"
881a170a30dSNélio Laranjeiro 			" failed: %s",
882a170a30dSNélio Laranjeiro 			dev->data->port_id, strerror(rte_errno));
883a6d83b6aSNélio Laranjeiro 		return ret;
88402d75430SAdrien Mazarguil 	}
885a6d83b6aSNélio Laranjeiro 	return 0;
88602d75430SAdrien Mazarguil }
88702d75430SAdrien Mazarguil 
88802d75430SAdrien Mazarguil /**
889771fa900SAdrien Mazarguil  * Get PCI information from struct ibv_device.
890771fa900SAdrien Mazarguil  *
891771fa900SAdrien Mazarguil  * @param device
892771fa900SAdrien Mazarguil  *   Pointer to Ethernet device structure.
893771fa900SAdrien Mazarguil  * @param[out] pci_addr
894771fa900SAdrien Mazarguil  *   PCI bus address output buffer.
895771fa900SAdrien Mazarguil  *
896771fa900SAdrien Mazarguil  * @return
897a6d83b6aSNélio Laranjeiro  *   0 on success, a negative errno value otherwise and rte_errno is set.
898771fa900SAdrien Mazarguil  */
899771fa900SAdrien Mazarguil int
900771fa900SAdrien Mazarguil mlx5_ibv_device_to_pci_addr(const struct ibv_device *device,
901771fa900SAdrien Mazarguil 			    struct rte_pci_addr *pci_addr)
902771fa900SAdrien Mazarguil {
903771fa900SAdrien Mazarguil 	FILE *file;
904771fa900SAdrien Mazarguil 	char line[32];
905771fa900SAdrien Mazarguil 	MKSTR(path, "%s/device/uevent", device->ibdev_path);
906771fa900SAdrien Mazarguil 
907771fa900SAdrien Mazarguil 	file = fopen(path, "rb");
908a6d83b6aSNélio Laranjeiro 	if (file == NULL) {
909a6d83b6aSNélio Laranjeiro 		rte_errno = errno;
910a6d83b6aSNélio Laranjeiro 		return -rte_errno;
911a6d83b6aSNélio Laranjeiro 	}
912771fa900SAdrien Mazarguil 	while (fgets(line, sizeof(line), file) == line) {
913771fa900SAdrien Mazarguil 		size_t len = strlen(line);
914771fa900SAdrien Mazarguil 		int ret;
915771fa900SAdrien Mazarguil 
916771fa900SAdrien Mazarguil 		/* Truncate long lines. */
917771fa900SAdrien Mazarguil 		if (len == (sizeof(line) - 1))
918771fa900SAdrien Mazarguil 			while (line[(len - 1)] != '\n') {
919771fa900SAdrien Mazarguil 				ret = fgetc(file);
920771fa900SAdrien Mazarguil 				if (ret == EOF)
921771fa900SAdrien Mazarguil 					break;
922771fa900SAdrien Mazarguil 				line[(len - 1)] = ret;
923771fa900SAdrien Mazarguil 			}
924771fa900SAdrien Mazarguil 		/* Extract information. */
925771fa900SAdrien Mazarguil 		if (sscanf(line,
926771fa900SAdrien Mazarguil 			   "PCI_SLOT_NAME="
927463ced95SStephen Hemminger 			   "%" SCNx32 ":%" SCNx8 ":%" SCNx8 ".%" SCNx8 "\n",
928771fa900SAdrien Mazarguil 			   &pci_addr->domain,
929771fa900SAdrien Mazarguil 			   &pci_addr->bus,
930771fa900SAdrien Mazarguil 			   &pci_addr->devid,
931771fa900SAdrien Mazarguil 			   &pci_addr->function) == 4) {
932771fa900SAdrien Mazarguil 			ret = 0;
933771fa900SAdrien Mazarguil 			break;
934771fa900SAdrien Mazarguil 		}
935771fa900SAdrien Mazarguil 	}
936771fa900SAdrien Mazarguil 	fclose(file);
937771fa900SAdrien Mazarguil 	return 0;
938771fa900SAdrien Mazarguil }
939198a3c33SNelio Laranjeiro 
940198a3c33SNelio Laranjeiro /**
941c26ae069SMatan Azrad  * Device status handler.
942c26ae069SMatan Azrad  *
943af4f09f2SNélio Laranjeiro  * @param dev
944af4f09f2SNélio Laranjeiro  *   Pointer to Ethernet device.
945c26ae069SMatan Azrad  * @param events
946c26ae069SMatan Azrad  *   Pointer to event flags holder.
947c26ae069SMatan Azrad  *
948c26ae069SMatan Azrad  * @return
949c26ae069SMatan Azrad  *   Events bitmap of callback process which can be called immediately.
950c26ae069SMatan Azrad  */
951c26ae069SMatan Azrad static uint32_t
952af4f09f2SNélio Laranjeiro mlx5_dev_status_handler(struct rte_eth_dev *dev)
953198a3c33SNelio Laranjeiro {
954af4f09f2SNélio Laranjeiro 	struct priv *priv = dev->data->dev_private;
955198a3c33SNelio Laranjeiro 	struct ibv_async_event event;
956c26ae069SMatan Azrad 	uint32_t ret = 0;
957198a3c33SNelio Laranjeiro 
958cfee9475SNélio Laranjeiro 	if (mlx5_link_update(dev, 0) == -EAGAIN) {
959cfee9475SNélio Laranjeiro 		usleep(0);
960cfee9475SNélio Laranjeiro 		return 0;
961cfee9475SNélio Laranjeiro 	}
962198a3c33SNelio Laranjeiro 	/* Read all message and acknowledge them. */
963198a3c33SNelio Laranjeiro 	for (;;) {
9640e83b8e5SNelio Laranjeiro 		if (mlx5_glue->get_async_event(priv->ctx, &event))
965198a3c33SNelio Laranjeiro 			break;
966c26ae069SMatan Azrad 		if ((event.event_type == IBV_EVENT_PORT_ACTIVE ||
967c26ae069SMatan Azrad 			event.event_type == IBV_EVENT_PORT_ERR) &&
968af4f09f2SNélio Laranjeiro 			(dev->data->dev_conf.intr_conf.lsc == 1))
969c26ae069SMatan Azrad 			ret |= (1 << RTE_ETH_EVENT_INTR_LSC);
9707d7d7ad1SMatan Azrad 		else if (event.event_type == IBV_EVENT_DEVICE_FATAL &&
971af4f09f2SNélio Laranjeiro 			dev->data->dev_conf.intr_conf.rmv == 1)
9727d7d7ad1SMatan Azrad 			ret |= (1 << RTE_ETH_EVENT_INTR_RMV);
973c26ae069SMatan Azrad 		else
974a170a30dSNélio Laranjeiro 			DRV_LOG(DEBUG,
975a170a30dSNélio Laranjeiro 				"port %u event type %d on not handled",
9760f99970bSNélio Laranjeiro 				dev->data->port_id, event.event_type);
9770e83b8e5SNelio Laranjeiro 		mlx5_glue->ack_async_event(&event);
978198a3c33SNelio Laranjeiro 	}
979198a3c33SNelio Laranjeiro 	return ret;
980198a3c33SNelio Laranjeiro }
981198a3c33SNelio Laranjeiro 
982198a3c33SNelio Laranjeiro /**
983198a3c33SNelio Laranjeiro  * Handle interrupts from the NIC.
984198a3c33SNelio Laranjeiro  *
985198a3c33SNelio Laranjeiro  * @param[in] intr_handle
986198a3c33SNelio Laranjeiro  *   Interrupt handler.
987198a3c33SNelio Laranjeiro  * @param cb_arg
988198a3c33SNelio Laranjeiro  *   Callback argument.
989198a3c33SNelio Laranjeiro  */
990198a3c33SNelio Laranjeiro void
991c23a1a30SQi Zhang mlx5_dev_interrupt_handler(void *cb_arg)
992198a3c33SNelio Laranjeiro {
993198a3c33SNelio Laranjeiro 	struct rte_eth_dev *dev = cb_arg;
994c26ae069SMatan Azrad 	uint32_t events;
995198a3c33SNelio Laranjeiro 
996af4f09f2SNélio Laranjeiro 	events = mlx5_dev_status_handler(dev);
997c26ae069SMatan Azrad 	if (events & (1 << RTE_ETH_EVENT_INTR_LSC))
998cebe3d7bSThomas Monjalon 		_rte_eth_dev_callback_process(dev, RTE_ETH_EVENT_INTR_LSC, NULL);
9997d7d7ad1SMatan Azrad 	if (events & (1 << RTE_ETH_EVENT_INTR_RMV))
1000cebe3d7bSThomas Monjalon 		_rte_eth_dev_callback_process(dev, RTE_ETH_EVENT_INTR_RMV, NULL);
1001198a3c33SNelio Laranjeiro }
1002198a3c33SNelio Laranjeiro 
/**
 * Handle interrupts from the socket.
 *
 * @param cb_arg
 *   Callback argument, the Ethernet device owning the socket.
 */
static void
mlx5_dev_handler_socket(void *cb_arg)
{
	/* The callback argument is the device itself, pass it straight on. */
	mlx5_socket_handle((struct rte_eth_dev *)cb_arg);
}
1016f8b9a3baSXueming Li 
1017f8b9a3baSXueming Li /**
1018198a3c33SNelio Laranjeiro  * Uninstall interrupt handler.
1019198a3c33SNelio Laranjeiro  *
1020198a3c33SNelio Laranjeiro  * @param dev
1021af4f09f2SNélio Laranjeiro  *   Pointer to Ethernet device.
1022198a3c33SNelio Laranjeiro  */
1023198a3c33SNelio Laranjeiro void
1024af4f09f2SNélio Laranjeiro mlx5_dev_interrupt_handler_uninstall(struct rte_eth_dev *dev)
1025198a3c33SNelio Laranjeiro {
1026af4f09f2SNélio Laranjeiro 	struct priv *priv = dev->data->dev_private;
1027af4f09f2SNélio Laranjeiro 
1028f8b9a3baSXueming Li 	if (dev->data->dev_conf.intr_conf.lsc ||
1029f8b9a3baSXueming Li 	    dev->data->dev_conf.intr_conf.rmv)
1030198a3c33SNelio Laranjeiro 		rte_intr_callback_unregister(&priv->intr_handle,
1031f8b9a3baSXueming Li 					     mlx5_dev_interrupt_handler, dev);
1032f8b9a3baSXueming Li 	if (priv->primary_socket)
1033f8b9a3baSXueming Li 		rte_intr_callback_unregister(&priv->intr_handle_socket,
1034f8b9a3baSXueming Li 					     mlx5_dev_handler_socket, dev);
1035198a3c33SNelio Laranjeiro 	priv->intr_handle.fd = 0;
103636351ea3SFerruh Yigit 	priv->intr_handle.type = RTE_INTR_HANDLE_UNKNOWN;
1037f8b9a3baSXueming Li 	priv->intr_handle_socket.fd = 0;
1038f8b9a3baSXueming Li 	priv->intr_handle_socket.type = RTE_INTR_HANDLE_UNKNOWN;
1039198a3c33SNelio Laranjeiro }
1040198a3c33SNelio Laranjeiro 
1041198a3c33SNelio Laranjeiro /**
1042198a3c33SNelio Laranjeiro  * Install interrupt handler.
1043198a3c33SNelio Laranjeiro  *
1044198a3c33SNelio Laranjeiro  * @param dev
1045af4f09f2SNélio Laranjeiro  *   Pointer to Ethernet device.
1046198a3c33SNelio Laranjeiro  */
1047198a3c33SNelio Laranjeiro void
1048af4f09f2SNélio Laranjeiro mlx5_dev_interrupt_handler_install(struct rte_eth_dev *dev)
1049198a3c33SNelio Laranjeiro {
1050af4f09f2SNélio Laranjeiro 	struct priv *priv = dev->data->dev_private;
1051a6d83b6aSNélio Laranjeiro 	int ret;
1052a6d83b6aSNélio Laranjeiro 	int flags;
1053198a3c33SNelio Laranjeiro 
1054198a3c33SNelio Laranjeiro 	assert(priv->ctx->async_fd > 0);
1055198a3c33SNelio Laranjeiro 	flags = fcntl(priv->ctx->async_fd, F_GETFL);
1056a6d83b6aSNélio Laranjeiro 	ret = fcntl(priv->ctx->async_fd, F_SETFL, flags | O_NONBLOCK);
1057a6d83b6aSNélio Laranjeiro 	if (ret) {
1058a170a30dSNélio Laranjeiro 		DRV_LOG(INFO,
1059a170a30dSNélio Laranjeiro 			"port %u failed to change file descriptor async event"
1060a170a30dSNélio Laranjeiro 			" queue",
1061a170a30dSNélio Laranjeiro 			dev->data->port_id);
1062198a3c33SNelio Laranjeiro 		dev->data->dev_conf.intr_conf.lsc = 0;
10637d7d7ad1SMatan Azrad 		dev->data->dev_conf.intr_conf.rmv = 0;
1064f8b9a3baSXueming Li 	}
1065f8b9a3baSXueming Li 	if (dev->data->dev_conf.intr_conf.lsc ||
1066f8b9a3baSXueming Li 	    dev->data->dev_conf.intr_conf.rmv) {
1067198a3c33SNelio Laranjeiro 		priv->intr_handle.fd = priv->ctx->async_fd;
1068198a3c33SNelio Laranjeiro 		priv->intr_handle.type = RTE_INTR_HANDLE_EXT;
1069198a3c33SNelio Laranjeiro 		rte_intr_callback_register(&priv->intr_handle,
1070f8b9a3baSXueming Li 					   mlx5_dev_interrupt_handler, dev);
1071f8b9a3baSXueming Li 	}
1072a6d83b6aSNélio Laranjeiro 	ret = mlx5_socket_init(dev);
1073a6d83b6aSNélio Laranjeiro 	if (ret)
1074a170a30dSNélio Laranjeiro 		DRV_LOG(ERR, "port %u cannot initialise socket: %s",
10750f99970bSNélio Laranjeiro 			dev->data->port_id, strerror(rte_errno));
1076a6d83b6aSNélio Laranjeiro 	else if (priv->primary_socket) {
1077f8b9a3baSXueming Li 		priv->intr_handle_socket.fd = priv->primary_socket;
1078f8b9a3baSXueming Li 		priv->intr_handle_socket.type = RTE_INTR_HANDLE_EXT;
1079f8b9a3baSXueming Li 		rte_intr_callback_register(&priv->intr_handle_socket,
1080f8b9a3baSXueming Li 					   mlx5_dev_handler_socket, dev);
1081198a3c33SNelio Laranjeiro 	}
1082198a3c33SNelio Laranjeiro }
108362072098SOr Ami 
108462072098SOr Ami /**
108562072098SOr Ami  * DPDK callback to bring the link DOWN.
108662072098SOr Ami  *
108762072098SOr Ami  * @param dev
108862072098SOr Ami  *   Pointer to Ethernet device structure.
108962072098SOr Ami  *
109062072098SOr Ami  * @return
1091a6d83b6aSNélio Laranjeiro  *   0 on success, a negative errno value otherwise and rte_errno is set.
109262072098SOr Ami  */
109362072098SOr Ami int
109462072098SOr Ami mlx5_set_link_down(struct rte_eth_dev *dev)
109562072098SOr Ami {
1096af4f09f2SNélio Laranjeiro 	return mlx5_set_flags(dev, ~IFF_UP, ~IFF_UP);
109762072098SOr Ami }
109862072098SOr Ami 
109962072098SOr Ami /**
110062072098SOr Ami  * DPDK callback to bring the link UP.
110162072098SOr Ami  *
110262072098SOr Ami  * @param dev
110362072098SOr Ami  *   Pointer to Ethernet device structure.
110462072098SOr Ami  *
110562072098SOr Ami  * @return
1106a6d83b6aSNélio Laranjeiro  *   0 on success, a negative errno value otherwise and rte_errno is set.
110762072098SOr Ami  */
110862072098SOr Ami int
110962072098SOr Ami mlx5_set_link_up(struct rte_eth_dev *dev)
111062072098SOr Ami {
1111af4f09f2SNélio Laranjeiro 	return mlx5_set_flags(dev, ~IFF_UP, IFF_UP);
111262072098SOr Ami }
1113a48deadaSOr Ami 
1114a48deadaSOr Ami /**
1115cdab90cbSNélio Laranjeiro  * Configure the TX function to use.
1116cdab90cbSNélio Laranjeiro  *
1117aee1b165SXueming Li  * @param dev
1118af4f09f2SNélio Laranjeiro  *   Pointer to private data structure.
11191cfa649bSShahaf Shuler  *
11201cfa649bSShahaf Shuler  * @return
11211cfa649bSShahaf Shuler  *   Pointer to selected Tx burst function.
1122cdab90cbSNélio Laranjeiro  */
11231cfa649bSShahaf Shuler eth_tx_burst_t
1124af4f09f2SNélio Laranjeiro mlx5_select_tx_function(struct rte_eth_dev *dev)
1125cdab90cbSNélio Laranjeiro {
1126af4f09f2SNélio Laranjeiro 	struct priv *priv = dev->data->dev_private;
11271cfa649bSShahaf Shuler 	eth_tx_burst_t tx_pkt_burst = mlx5_tx_burst;
11287fe24446SShahaf Shuler 	struct mlx5_dev_config *config = &priv->config;
1129dbccb4cdSShahaf Shuler 	uint64_t tx_offloads = dev->data->dev_conf.txmode.offloads;
1130dbccb4cdSShahaf Shuler 	int tso = !!(tx_offloads & (DEV_TX_OFFLOAD_TCP_TSO |
1131dbccb4cdSShahaf Shuler 				    DEV_TX_OFFLOAD_VXLAN_TNL_TSO |
1132dbccb4cdSShahaf Shuler 				    DEV_TX_OFFLOAD_GRE_TNL_TSO));
11335f8ba81cSXueming Li 	int swp = !!(tx_offloads & (DEV_TX_OFFLOAD_IP_TNL_TSO |
11345f8ba81cSXueming Li 				    DEV_TX_OFFLOAD_UDP_TNL_TSO |
11355f8ba81cSXueming Li 				    DEV_TX_OFFLOAD_OUTER_IPV4_CKSUM));
1136dbccb4cdSShahaf Shuler 	int vlan_insert = !!(tx_offloads & DEV_TX_OFFLOAD_VLAN_INSERT);
11371cfa649bSShahaf Shuler 
1138aee1b165SXueming Li 	assert(priv != NULL);
1139230189d9SNélio Laranjeiro 	/* Select appropriate TX function. */
11405f8ba81cSXueming Li 	if (vlan_insert || tso || swp)
1141dbccb4cdSShahaf Shuler 		return tx_pkt_burst;
11427fe24446SShahaf Shuler 	if (config->mps == MLX5_MPW_ENHANCED) {
1143af4f09f2SNélio Laranjeiro 		if (mlx5_check_vec_tx_support(dev) > 0) {
1144af4f09f2SNélio Laranjeiro 			if (mlx5_check_raw_vec_tx_support(dev) > 0)
11451cfa649bSShahaf Shuler 				tx_pkt_burst = mlx5_tx_burst_raw_vec;
11466cb559d6SYongseok Koh 			else
11471cfa649bSShahaf Shuler 				tx_pkt_burst = mlx5_tx_burst_vec;
1148a170a30dSNélio Laranjeiro 			DRV_LOG(DEBUG,
1149a170a30dSNélio Laranjeiro 				"port %u selected enhanced MPW Tx vectorized"
1150a170a30dSNélio Laranjeiro 				" function",
1151a170a30dSNélio Laranjeiro 				dev->data->port_id);
11526cb559d6SYongseok Koh 		} else {
11531cfa649bSShahaf Shuler 			tx_pkt_burst = mlx5_tx_burst_empw;
1154a170a30dSNélio Laranjeiro 			DRV_LOG(DEBUG,
1155a170a30dSNélio Laranjeiro 				"port %u selected enhanced MPW Tx function",
11560f99970bSNélio Laranjeiro 				dev->data->port_id);
11576cb559d6SYongseok Koh 		}
11587fe24446SShahaf Shuler 	} else if (config->mps && (config->txq_inline > 0)) {
11591cfa649bSShahaf Shuler 		tx_pkt_burst = mlx5_tx_burst_mpw_inline;
1160a170a30dSNélio Laranjeiro 		DRV_LOG(DEBUG, "port %u selected MPW inline Tx function",
11610f99970bSNélio Laranjeiro 			dev->data->port_id);
11627fe24446SShahaf Shuler 	} else if (config->mps) {
11631cfa649bSShahaf Shuler 		tx_pkt_burst = mlx5_tx_burst_mpw;
1164a170a30dSNélio Laranjeiro 		DRV_LOG(DEBUG, "port %u selected MPW Tx function",
1165a170a30dSNélio Laranjeiro 			dev->data->port_id);
11662a66cf37SYaacov Hazan 	}
11671cfa649bSShahaf Shuler 	return tx_pkt_burst;
1168cdab90cbSNélio Laranjeiro }
1169cdab90cbSNélio Laranjeiro 
1170cdab90cbSNélio Laranjeiro /**
1171cdab90cbSNélio Laranjeiro  * Configure the RX function to use.
1172cdab90cbSNélio Laranjeiro  *
1173aee1b165SXueming Li  * @param dev
1174af4f09f2SNélio Laranjeiro  *   Pointer to private data structure.
11751cfa649bSShahaf Shuler  *
11761cfa649bSShahaf Shuler  * @return
11771cfa649bSShahaf Shuler  *   Pointer to selected Rx burst function.
1178cdab90cbSNélio Laranjeiro  */
11791cfa649bSShahaf Shuler eth_rx_burst_t
1180af4f09f2SNélio Laranjeiro mlx5_select_rx_function(struct rte_eth_dev *dev)
1181cdab90cbSNélio Laranjeiro {
11821cfa649bSShahaf Shuler 	eth_rx_burst_t rx_pkt_burst = mlx5_rx_burst;
11831cfa649bSShahaf Shuler 
1184af4f09f2SNélio Laranjeiro 	assert(dev != NULL);
1185af4f09f2SNélio Laranjeiro 	if (mlx5_check_vec_rx_support(dev) > 0) {
11861cfa649bSShahaf Shuler 		rx_pkt_burst = mlx5_rx_burst_vec;
1187a170a30dSNélio Laranjeiro 		DRV_LOG(DEBUG, "port %u selected Rx vectorized function",
11880f99970bSNélio Laranjeiro 			dev->data->port_id);
1189cdab90cbSNélio Laranjeiro 	}
11901cfa649bSShahaf Shuler 	return rx_pkt_burst;
11916cb559d6SYongseok Koh }
1192d3e0f392SMatan Azrad 
1193d3e0f392SMatan Azrad /**
1194d3e0f392SMatan Azrad  * Check if mlx5 device was removed.
1195d3e0f392SMatan Azrad  *
1196d3e0f392SMatan Azrad  * @param dev
1197d3e0f392SMatan Azrad  *   Pointer to Ethernet device structure.
1198d3e0f392SMatan Azrad  *
1199d3e0f392SMatan Azrad  * @return
1200d3e0f392SMatan Azrad  *   1 when device is removed, otherwise 0.
1201d3e0f392SMatan Azrad  */
1202d3e0f392SMatan Azrad int
1203d3e0f392SMatan Azrad mlx5_is_removed(struct rte_eth_dev *dev)
1204d3e0f392SMatan Azrad {
1205d3e0f392SMatan Azrad 	struct ibv_device_attr device_attr;
1206d3e0f392SMatan Azrad 	struct priv *priv = dev->data->dev_private;
1207d3e0f392SMatan Azrad 
12080e83b8e5SNelio Laranjeiro 	if (mlx5_glue->query_device(priv->ctx, &device_attr) == EIO)
1209d3e0f392SMatan Azrad 		return 1;
1210d3e0f392SMatan Azrad 	return 0;
1211d3e0f392SMatan Azrad }
1212