xref: /dpdk/drivers/net/mlx5/mlx5_ethdev.c (revision 7b2423cd2e84c61d3052147cea7643d15d49d1e9)
18fd92a66SOlivier Matz /* SPDX-License-Identifier: BSD-3-Clause
2771fa900SAdrien Mazarguil  * Copyright 2015 6WIND S.A.
3771fa900SAdrien Mazarguil  * Copyright 2015 Mellanox.
4771fa900SAdrien Mazarguil  */
5771fa900SAdrien Mazarguil 
6f8b9a3baSXueming Li #define _GNU_SOURCE
7f8b9a3baSXueming Li 
8771fa900SAdrien Mazarguil #include <stddef.h>
9e60fbd5bSAdrien Mazarguil #include <assert.h>
10fc40db99SAdrien Mazarguil #include <inttypes.h>
11771fa900SAdrien Mazarguil #include <unistd.h>
12771fa900SAdrien Mazarguil #include <stdint.h>
13771fa900SAdrien Mazarguil #include <stdio.h>
14771fa900SAdrien Mazarguil #include <string.h>
15771fa900SAdrien Mazarguil #include <stdlib.h>
16771fa900SAdrien Mazarguil #include <errno.h>
17771fa900SAdrien Mazarguil #include <dirent.h>
18771fa900SAdrien Mazarguil #include <net/if.h>
19771fa900SAdrien Mazarguil #include <sys/ioctl.h>
20771fa900SAdrien Mazarguil #include <sys/socket.h>
213a49ffe3SShahaf Shuler #include <sys/utsname.h>
22771fa900SAdrien Mazarguil #include <netinet/in.h>
23cb8faed7SAdrien Mazarguil #include <linux/ethtool.h>
24cb8faed7SAdrien Mazarguil #include <linux/sockios.h>
253a49ffe3SShahaf Shuler #include <linux/version.h>
26198a3c33SNelio Laranjeiro #include <fcntl.h>
2790260d57SNélio Laranjeiro #include <stdalign.h>
28f8b9a3baSXueming Li #include <sys/un.h>
29771fa900SAdrien Mazarguil 
30771fa900SAdrien Mazarguil #include <rte_atomic.h>
31ffc905f3SFerruh Yigit #include <rte_ethdev_driver.h>
32c752998bSGaetan Rivet #include <rte_bus_pci.h>
33771fa900SAdrien Mazarguil #include <rte_mbuf.h>
34771fa900SAdrien Mazarguil #include <rte_common.h>
35198a3c33SNelio Laranjeiro #include <rte_interrupts.h>
36198a3c33SNelio Laranjeiro #include <rte_alarm.h>
37a48deadaSOr Ami #include <rte_malloc.h>
38771fa900SAdrien Mazarguil 
39771fa900SAdrien Mazarguil #include "mlx5.h"
400e83b8e5SNelio Laranjeiro #include "mlx5_glue.h"
41e60fbd5bSAdrien Mazarguil #include "mlx5_rxtx.h"
42771fa900SAdrien Mazarguil #include "mlx5_utils.h"
43771fa900SAdrien Mazarguil 
/*
 * Fallback definitions used when the user-space kernel headers this file is
 * built against do not provide the ETHTOOL_GLINKSETTINGS API (the running
 * kernel may still support it).
 */
#ifndef ETHTOOL_GLINKSETTINGS
/* Local copy of the kernel's ETHTOOL_GLINKSETTINGS request/reply layout. */
struct ethtool_link_settings {
	uint32_t cmd;
	uint32_t speed;
	uint8_t duplex;
	uint8_t port;
	uint8_t phy_address;
	uint8_t autoneg;
	uint8_t mdio_support;
	uint8_t eth_tp_mdix; /* Named as in the kernel UAPI header. */
	uint8_t eth_tp_mdix_ctrl;
	int8_t link_mode_masks_nwords;
	uint32_t reserved[8];
	uint32_t link_mode_masks[];
};

#define ETHTOOL_GLINKSETTINGS 0x0000004c
/* Bit positions inside the link mode masks returned by the ioctl. */
#define ETHTOOL_LINK_MODE_1000baseT_Full_BIT 5
#define ETHTOOL_LINK_MODE_Autoneg_BIT 6
#define ETHTOOL_LINK_MODE_1000baseKX_Full_BIT 17
#define ETHTOOL_LINK_MODE_10000baseKX4_Full_BIT 18
#define ETHTOOL_LINK_MODE_10000baseKR_Full_BIT 19
#define ETHTOOL_LINK_MODE_10000baseR_FEC_BIT 20
#define ETHTOOL_LINK_MODE_20000baseMLD2_Full_BIT 21
#define ETHTOOL_LINK_MODE_20000baseKR2_Full_BIT 22
#define ETHTOOL_LINK_MODE_40000baseKR4_Full_BIT 23
#define ETHTOOL_LINK_MODE_40000baseCR4_Full_BIT 24
#define ETHTOOL_LINK_MODE_40000baseSR4_Full_BIT 25
#define ETHTOOL_LINK_MODE_40000baseLR4_Full_BIT 26
#define ETHTOOL_LINK_MODE_56000baseKR4_Full_BIT 27
#define ETHTOOL_LINK_MODE_56000baseCR4_Full_BIT 28
#define ETHTOOL_LINK_MODE_56000baseSR4_Full_BIT 29
#define ETHTOOL_LINK_MODE_56000baseLR4_Full_BIT 30
#endif
/* 25G link modes, for headers that lack them. */
#ifndef HAVE_ETHTOOL_LINK_MODE_25G
#define ETHTOOL_LINK_MODE_25000baseCR_Full_BIT 31
#define ETHTOOL_LINK_MODE_25000baseKR_Full_BIT 32
#define ETHTOOL_LINK_MODE_25000baseSR_Full_BIT 33
#endif
/* 50G link modes, for headers that lack them. */
#ifndef HAVE_ETHTOOL_LINK_MODE_50G
#define ETHTOOL_LINK_MODE_50000baseCR2_Full_BIT 34
#define ETHTOOL_LINK_MODE_50000baseKR2_Full_BIT 35
#endif
/* 100G link modes, for headers that lack them. */
#ifndef HAVE_ETHTOOL_LINK_MODE_100G
#define ETHTOOL_LINK_MODE_100000baseKR4_Full_BIT 36
#define ETHTOOL_LINK_MODE_100000baseSR4_Full_BIT 37
#define ETHTOOL_LINK_MODE_100000baseCR4_Full_BIT 38
#define ETHTOOL_LINK_MODE_100000baseLR4_ER4_Full_BIT 39
#endif
943a49ffe3SShahaf Shuler 
95771fa900SAdrien Mazarguil /**
96771fa900SAdrien Mazarguil  * Get interface name from private structure.
97771fa900SAdrien Mazarguil  *
98771fa900SAdrien Mazarguil  * @param[in] priv
99771fa900SAdrien Mazarguil  *   Pointer to private structure.
100771fa900SAdrien Mazarguil  * @param[out] ifname
101771fa900SAdrien Mazarguil  *   Interface name output buffer.
102771fa900SAdrien Mazarguil  *
103771fa900SAdrien Mazarguil  * @return
104771fa900SAdrien Mazarguil  *   0 on success, -1 on failure and errno is set.
105771fa900SAdrien Mazarguil  */
106771fa900SAdrien Mazarguil int
107771fa900SAdrien Mazarguil priv_get_ifname(const struct priv *priv, char (*ifname)[IF_NAMESIZE])
108771fa900SAdrien Mazarguil {
109771fa900SAdrien Mazarguil 	DIR *dir;
110771fa900SAdrien Mazarguil 	struct dirent *dent;
111771fa900SAdrien Mazarguil 	unsigned int dev_type = 0;
112771fa900SAdrien Mazarguil 	unsigned int dev_port_prev = ~0u;
113771fa900SAdrien Mazarguil 	char match[IF_NAMESIZE] = "";
114771fa900SAdrien Mazarguil 
115771fa900SAdrien Mazarguil 	{
11687ec44ceSXueming Li 		MKSTR(path, "%s/device/net", priv->ibdev_path);
117771fa900SAdrien Mazarguil 
118771fa900SAdrien Mazarguil 		dir = opendir(path);
119771fa900SAdrien Mazarguil 		if (dir == NULL)
120771fa900SAdrien Mazarguil 			return -1;
121771fa900SAdrien Mazarguil 	}
122771fa900SAdrien Mazarguil 	while ((dent = readdir(dir)) != NULL) {
123771fa900SAdrien Mazarguil 		char *name = dent->d_name;
124771fa900SAdrien Mazarguil 		FILE *file;
125771fa900SAdrien Mazarguil 		unsigned int dev_port;
126771fa900SAdrien Mazarguil 		int r;
127771fa900SAdrien Mazarguil 
128771fa900SAdrien Mazarguil 		if ((name[0] == '.') &&
129771fa900SAdrien Mazarguil 		    ((name[1] == '\0') ||
130771fa900SAdrien Mazarguil 		     ((name[1] == '.') && (name[2] == '\0'))))
131771fa900SAdrien Mazarguil 			continue;
132771fa900SAdrien Mazarguil 
133771fa900SAdrien Mazarguil 		MKSTR(path, "%s/device/net/%s/%s",
13487ec44ceSXueming Li 		      priv->ibdev_path, name,
135771fa900SAdrien Mazarguil 		      (dev_type ? "dev_id" : "dev_port"));
136771fa900SAdrien Mazarguil 
137771fa900SAdrien Mazarguil 		file = fopen(path, "rb");
138771fa900SAdrien Mazarguil 		if (file == NULL) {
139771fa900SAdrien Mazarguil 			if (errno != ENOENT)
140771fa900SAdrien Mazarguil 				continue;
141771fa900SAdrien Mazarguil 			/*
142771fa900SAdrien Mazarguil 			 * Switch to dev_id when dev_port does not exist as
143771fa900SAdrien Mazarguil 			 * is the case with Linux kernel versions < 3.15.
144771fa900SAdrien Mazarguil 			 */
145771fa900SAdrien Mazarguil try_dev_id:
146771fa900SAdrien Mazarguil 			match[0] = '\0';
147771fa900SAdrien Mazarguil 			if (dev_type)
148771fa900SAdrien Mazarguil 				break;
149771fa900SAdrien Mazarguil 			dev_type = 1;
150771fa900SAdrien Mazarguil 			dev_port_prev = ~0u;
151771fa900SAdrien Mazarguil 			rewinddir(dir);
152771fa900SAdrien Mazarguil 			continue;
153771fa900SAdrien Mazarguil 		}
154771fa900SAdrien Mazarguil 		r = fscanf(file, (dev_type ? "%x" : "%u"), &dev_port);
155771fa900SAdrien Mazarguil 		fclose(file);
156771fa900SAdrien Mazarguil 		if (r != 1)
157771fa900SAdrien Mazarguil 			continue;
158771fa900SAdrien Mazarguil 		/*
159771fa900SAdrien Mazarguil 		 * Switch to dev_id when dev_port returns the same value for
160771fa900SAdrien Mazarguil 		 * all ports. May happen when using a MOFED release older than
161771fa900SAdrien Mazarguil 		 * 3.0 with a Linux kernel >= 3.15.
162771fa900SAdrien Mazarguil 		 */
163771fa900SAdrien Mazarguil 		if (dev_port == dev_port_prev)
164771fa900SAdrien Mazarguil 			goto try_dev_id;
165771fa900SAdrien Mazarguil 		dev_port_prev = dev_port;
166771fa900SAdrien Mazarguil 		if (dev_port == (priv->port - 1u))
167771fa900SAdrien Mazarguil 			snprintf(match, sizeof(match), "%s", name);
168771fa900SAdrien Mazarguil 	}
169771fa900SAdrien Mazarguil 	closedir(dir);
170771fa900SAdrien Mazarguil 	if (match[0] == '\0')
171771fa900SAdrien Mazarguil 		return -1;
172771fa900SAdrien Mazarguil 	strncpy(*ifname, match, sizeof(*ifname));
173771fa900SAdrien Mazarguil 	return 0;
174771fa900SAdrien Mazarguil }
175771fa900SAdrien Mazarguil 
176771fa900SAdrien Mazarguil /**
177771fa900SAdrien Mazarguil  * Perform ifreq ioctl() on associated Ethernet device.
178771fa900SAdrien Mazarguil  *
179771fa900SAdrien Mazarguil  * @param[in] priv
180771fa900SAdrien Mazarguil  *   Pointer to private structure.
181771fa900SAdrien Mazarguil  * @param req
182771fa900SAdrien Mazarguil  *   Request number to pass to ioctl().
183771fa900SAdrien Mazarguil  * @param[out] ifr
184771fa900SAdrien Mazarguil  *   Interface request structure output buffer.
185771fa900SAdrien Mazarguil  *
186771fa900SAdrien Mazarguil  * @return
187771fa900SAdrien Mazarguil  *   0 on success, -1 on failure and errno is set.
188771fa900SAdrien Mazarguil  */
189771fa900SAdrien Mazarguil int
190771fa900SAdrien Mazarguil priv_ifreq(const struct priv *priv, int req, struct ifreq *ifr)
191771fa900SAdrien Mazarguil {
192771fa900SAdrien Mazarguil 	int sock = socket(PF_INET, SOCK_DGRAM, IPPROTO_IP);
193771fa900SAdrien Mazarguil 	int ret = -1;
194771fa900SAdrien Mazarguil 
195771fa900SAdrien Mazarguil 	if (sock == -1)
196771fa900SAdrien Mazarguil 		return ret;
197771fa900SAdrien Mazarguil 	if (priv_get_ifname(priv, &ifr->ifr_name) == 0)
198771fa900SAdrien Mazarguil 		ret = ioctl(sock, req, ifr);
199771fa900SAdrien Mazarguil 	close(sock);
200771fa900SAdrien Mazarguil 	return ret;
201771fa900SAdrien Mazarguil }
202771fa900SAdrien Mazarguil 
203771fa900SAdrien Mazarguil /**
204771fa900SAdrien Mazarguil  * Get device MTU.
205771fa900SAdrien Mazarguil  *
206771fa900SAdrien Mazarguil  * @param priv
207771fa900SAdrien Mazarguil  *   Pointer to private structure.
208771fa900SAdrien Mazarguil  * @param[out] mtu
209771fa900SAdrien Mazarguil  *   MTU value output buffer.
210771fa900SAdrien Mazarguil  *
211771fa900SAdrien Mazarguil  * @return
212771fa900SAdrien Mazarguil  *   0 on success, -1 on failure and errno is set.
213771fa900SAdrien Mazarguil  */
214771fa900SAdrien Mazarguil int
215771fa900SAdrien Mazarguil priv_get_mtu(struct priv *priv, uint16_t *mtu)
216771fa900SAdrien Mazarguil {
217fc40db99SAdrien Mazarguil 	struct ifreq request;
218fc40db99SAdrien Mazarguil 	int ret = priv_ifreq(priv, SIOCGIFMTU, &request);
219771fa900SAdrien Mazarguil 
220fc40db99SAdrien Mazarguil 	if (ret)
221fc40db99SAdrien Mazarguil 		return ret;
222fc40db99SAdrien Mazarguil 	*mtu = request.ifr_mtu;
223859081d3SShahaf Shuler 	return 0;
224859081d3SShahaf Shuler }
225859081d3SShahaf Shuler 
226859081d3SShahaf Shuler /**
227cf37ca95SAdrien Mazarguil  * Set device MTU.
228cf37ca95SAdrien Mazarguil  *
229cf37ca95SAdrien Mazarguil  * @param priv
230cf37ca95SAdrien Mazarguil  *   Pointer to private structure.
231cf37ca95SAdrien Mazarguil  * @param mtu
232cf37ca95SAdrien Mazarguil  *   MTU value to set.
233cf37ca95SAdrien Mazarguil  *
234cf37ca95SAdrien Mazarguil  * @return
235cf37ca95SAdrien Mazarguil  *   0 on success, -1 on failure and errno is set.
236cf37ca95SAdrien Mazarguil  */
237cf37ca95SAdrien Mazarguil static int
238cf37ca95SAdrien Mazarguil priv_set_mtu(struct priv *priv, uint16_t mtu)
239cf37ca95SAdrien Mazarguil {
240fc40db99SAdrien Mazarguil 	struct ifreq request = { .ifr_mtu = mtu, };
241f3b492d7SAdrien Mazarguil 
242fc40db99SAdrien Mazarguil 	return priv_ifreq(priv, SIOCSIFMTU, &request);
243cf37ca95SAdrien Mazarguil }
244cf37ca95SAdrien Mazarguil 
245cf37ca95SAdrien Mazarguil /**
246771fa900SAdrien Mazarguil  * Set device flags.
247771fa900SAdrien Mazarguil  *
248771fa900SAdrien Mazarguil  * @param priv
249771fa900SAdrien Mazarguil  *   Pointer to private structure.
250771fa900SAdrien Mazarguil  * @param keep
251771fa900SAdrien Mazarguil  *   Bitmask for flags that must remain untouched.
252771fa900SAdrien Mazarguil  * @param flags
253771fa900SAdrien Mazarguil  *   Bitmask for flags to modify.
254771fa900SAdrien Mazarguil  *
255771fa900SAdrien Mazarguil  * @return
256771fa900SAdrien Mazarguil  *   0 on success, -1 on failure and errno is set.
257771fa900SAdrien Mazarguil  */
258771fa900SAdrien Mazarguil int
259771fa900SAdrien Mazarguil priv_set_flags(struct priv *priv, unsigned int keep, unsigned int flags)
260771fa900SAdrien Mazarguil {
261fc40db99SAdrien Mazarguil 	struct ifreq request;
262fc40db99SAdrien Mazarguil 	int ret = priv_ifreq(priv, SIOCGIFFLAGS, &request);
263771fa900SAdrien Mazarguil 
264fc40db99SAdrien Mazarguil 	if (ret)
265fc40db99SAdrien Mazarguil 		return ret;
266fc40db99SAdrien Mazarguil 	request.ifr_flags &= keep;
267fc40db99SAdrien Mazarguil 	request.ifr_flags |= flags & ~keep;
268fc40db99SAdrien Mazarguil 	return priv_ifreq(priv, SIOCSIFFLAGS, &request);
269771fa900SAdrien Mazarguil }
270771fa900SAdrien Mazarguil 
271771fa900SAdrien Mazarguil /**
272*7b2423cdSNélio Laranjeiro  * DPDK callback for Ethernet device configuration.
273e60fbd5bSAdrien Mazarguil  *
274e60fbd5bSAdrien Mazarguil  * @param dev
275e60fbd5bSAdrien Mazarguil  *   Pointer to Ethernet device structure.
276e60fbd5bSAdrien Mazarguil  *
277e60fbd5bSAdrien Mazarguil  * @return
278*7b2423cdSNélio Laranjeiro  *   0 on success, negative errno value on failure.
279e60fbd5bSAdrien Mazarguil  */
280*7b2423cdSNélio Laranjeiro int
281*7b2423cdSNélio Laranjeiro mlx5_dev_configure(struct rte_eth_dev *dev)
282e60fbd5bSAdrien Mazarguil {
283e60fbd5bSAdrien Mazarguil 	struct priv *priv = dev->data->dev_private;
284e60fbd5bSAdrien Mazarguil 	unsigned int rxqs_n = dev->data->nb_rx_queues;
285e60fbd5bSAdrien Mazarguil 	unsigned int txqs_n = dev->data->nb_tx_queues;
286634efbc2SNelio Laranjeiro 	unsigned int i;
287634efbc2SNelio Laranjeiro 	unsigned int j;
288634efbc2SNelio Laranjeiro 	unsigned int reta_idx_n;
28929c1d8bbSNélio Laranjeiro 	const uint8_t use_app_rss_key =
29021e3a974SShahaf Shuler 		!!dev->data->dev_conf.rx_adv_conf.rss_conf.rss_key;
291dbccb4cdSShahaf Shuler 	uint64_t supp_tx_offloads = mlx5_priv_get_tx_port_offloads(priv);
292dbccb4cdSShahaf Shuler 	uint64_t tx_offloads = dev->data->dev_conf.txmode.offloads;
29317b843ebSShahaf Shuler 	uint64_t supp_rx_offloads =
29417b843ebSShahaf Shuler 		(mlx5_priv_get_rx_port_offloads(priv) |
29517b843ebSShahaf Shuler 		 mlx5_priv_get_rx_queue_offloads(priv));
29617b843ebSShahaf Shuler 	uint64_t rx_offloads = dev->data->dev_conf.rxmode.offloads;
297e60fbd5bSAdrien Mazarguil 
298dbccb4cdSShahaf Shuler 	if ((tx_offloads & supp_tx_offloads) != tx_offloads) {
299dbccb4cdSShahaf Shuler 		ERROR("Some Tx offloads are not supported "
300dbccb4cdSShahaf Shuler 		      "requested 0x%" PRIx64 " supported 0x%" PRIx64,
301dbccb4cdSShahaf Shuler 		      tx_offloads, supp_tx_offloads);
302dbccb4cdSShahaf Shuler 		return ENOTSUP;
303dbccb4cdSShahaf Shuler 	}
30417b843ebSShahaf Shuler 	if ((rx_offloads & supp_rx_offloads) != rx_offloads) {
30517b843ebSShahaf Shuler 		ERROR("Some Rx offloads are not supported "
30617b843ebSShahaf Shuler 		      "requested 0x%" PRIx64 " supported 0x%" PRIx64,
30717b843ebSShahaf Shuler 		      rx_offloads, supp_rx_offloads);
30817b843ebSShahaf Shuler 		return ENOTSUP;
30917b843ebSShahaf Shuler 	}
31029c1d8bbSNélio Laranjeiro 	if (use_app_rss_key &&
31129c1d8bbSNélio Laranjeiro 	    (dev->data->dev_conf.rx_adv_conf.rss_conf.rss_key_len !=
31229c1d8bbSNélio Laranjeiro 	     rss_hash_default_key_len)) {
31329c1d8bbSNélio Laranjeiro 		/* MLX5 RSS only support 40bytes key. */
31429c1d8bbSNélio Laranjeiro 		return EINVAL;
31529c1d8bbSNélio Laranjeiro 	}
31629c1d8bbSNélio Laranjeiro 	priv->rss_conf.rss_key =
31729c1d8bbSNélio Laranjeiro 		rte_realloc(priv->rss_conf.rss_key,
31829c1d8bbSNélio Laranjeiro 			    rss_hash_default_key_len, 0);
31929c1d8bbSNélio Laranjeiro 	if (!priv->rss_conf.rss_key) {
32029c1d8bbSNélio Laranjeiro 		ERROR("cannot allocate RSS hash key memory (%u)", rxqs_n);
32129c1d8bbSNélio Laranjeiro 		return ENOMEM;
32229c1d8bbSNélio Laranjeiro 	}
32329c1d8bbSNélio Laranjeiro 	memcpy(priv->rss_conf.rss_key,
32429c1d8bbSNélio Laranjeiro 	       use_app_rss_key ?
32529c1d8bbSNélio Laranjeiro 	       dev->data->dev_conf.rx_adv_conf.rss_conf.rss_key :
32629c1d8bbSNélio Laranjeiro 	       rss_hash_default_key,
32729c1d8bbSNélio Laranjeiro 	       rss_hash_default_key_len);
32829c1d8bbSNélio Laranjeiro 	priv->rss_conf.rss_key_len = rss_hash_default_key_len;
32929c1d8bbSNélio Laranjeiro 	priv->rss_conf.rss_hf = dev->data->dev_conf.rx_adv_conf.rss_conf.rss_hf;
330e60fbd5bSAdrien Mazarguil 	priv->rxqs = (void *)dev->data->rx_queues;
331e60fbd5bSAdrien Mazarguil 	priv->txqs = (void *)dev->data->tx_queues;
332e60fbd5bSAdrien Mazarguil 	if (txqs_n != priv->txqs_n) {
333e60fbd5bSAdrien Mazarguil 		INFO("%p: TX queues number update: %u -> %u",
334e60fbd5bSAdrien Mazarguil 		     (void *)dev, priv->txqs_n, txqs_n);
335e60fbd5bSAdrien Mazarguil 		priv->txqs_n = txqs_n;
336e60fbd5bSAdrien Mazarguil 	}
3377fe24446SShahaf Shuler 	if (rxqs_n > priv->config.ind_table_max_size) {
338634efbc2SNelio Laranjeiro 		ERROR("cannot handle this many RX queues (%u)", rxqs_n);
339634efbc2SNelio Laranjeiro 		return EINVAL;
340634efbc2SNelio Laranjeiro 	}
341e60fbd5bSAdrien Mazarguil 	if (rxqs_n == priv->rxqs_n)
342e60fbd5bSAdrien Mazarguil 		return 0;
343e60fbd5bSAdrien Mazarguil 	INFO("%p: RX queues number update: %u -> %u",
344e60fbd5bSAdrien Mazarguil 	     (void *)dev, priv->rxqs_n, rxqs_n);
345e60fbd5bSAdrien Mazarguil 	priv->rxqs_n = rxqs_n;
346634efbc2SNelio Laranjeiro 	/* If the requested number of RX queues is not a power of two, use the
347634efbc2SNelio Laranjeiro 	 * maximum indirection table size for better balancing.
348634efbc2SNelio Laranjeiro 	 * The result is always rounded to the next power of two. */
349634efbc2SNelio Laranjeiro 	reta_idx_n = (1 << log2above((rxqs_n & (rxqs_n - 1)) ?
3507fe24446SShahaf Shuler 				     priv->config.ind_table_max_size :
351634efbc2SNelio Laranjeiro 				     rxqs_n));
352634efbc2SNelio Laranjeiro 	if (priv_rss_reta_index_resize(priv, reta_idx_n))
353634efbc2SNelio Laranjeiro 		return ENOMEM;
354634efbc2SNelio Laranjeiro 	/* When the number of RX queues is not a power of two, the remaining
355634efbc2SNelio Laranjeiro 	 * table entries are padded with reused WQs and hashes are not spread
356634efbc2SNelio Laranjeiro 	 * uniformly. */
357634efbc2SNelio Laranjeiro 	for (i = 0, j = 0; (i != reta_idx_n); ++i) {
358634efbc2SNelio Laranjeiro 		(*priv->reta_idx)[i] = j;
359634efbc2SNelio Laranjeiro 		if (++j == rxqs_n)
360634efbc2SNelio Laranjeiro 			j = 0;
361634efbc2SNelio Laranjeiro 	}
362e60fbd5bSAdrien Mazarguil 	return 0;
363e60fbd5bSAdrien Mazarguil 
364e60fbd5bSAdrien Mazarguil }
365e60fbd5bSAdrien Mazarguil 
366e60fbd5bSAdrien Mazarguil /**
367e60fbd5bSAdrien Mazarguil  * DPDK callback to get information about the device.
368e60fbd5bSAdrien Mazarguil  *
369e60fbd5bSAdrien Mazarguil  * @param dev
370e60fbd5bSAdrien Mazarguil  *   Pointer to Ethernet device structure.
371e60fbd5bSAdrien Mazarguil  * @param[out] info
372e60fbd5bSAdrien Mazarguil  *   Info structure output buffer.
373e60fbd5bSAdrien Mazarguil  */
374e60fbd5bSAdrien Mazarguil void
375e60fbd5bSAdrien Mazarguil mlx5_dev_infos_get(struct rte_eth_dev *dev, struct rte_eth_dev_info *info)
376e60fbd5bSAdrien Mazarguil {
37701d79216SNélio Laranjeiro 	struct priv *priv = dev->data->dev_private;
3787fe24446SShahaf Shuler 	struct mlx5_dev_config *config = &priv->config;
379e60fbd5bSAdrien Mazarguil 	unsigned int max;
380e60fbd5bSAdrien Mazarguil 	char ifname[IF_NAMESIZE];
381e60fbd5bSAdrien Mazarguil 
382c0802544SFerruh Yigit 	info->pci_dev = RTE_ETH_DEV_TO_PCI(dev);
383e60fbd5bSAdrien Mazarguil 	/* FIXME: we should ask the device for these values. */
384e60fbd5bSAdrien Mazarguil 	info->min_rx_bufsize = 32;
385e60fbd5bSAdrien Mazarguil 	info->max_rx_pktlen = 65536;
386e60fbd5bSAdrien Mazarguil 	/*
387e60fbd5bSAdrien Mazarguil 	 * Since we need one CQ per QP, the limit is the minimum number
388e60fbd5bSAdrien Mazarguil 	 * between the two values.
389e60fbd5bSAdrien Mazarguil 	 */
39043e9d979SShachar Beiser 	max = RTE_MIN(priv->device_attr.orig_attr.max_cq,
39143e9d979SShachar Beiser 		      priv->device_attr.orig_attr.max_qp);
392e60fbd5bSAdrien Mazarguil 	/* If max >= 65535 then max = 0, max_rx_queues is uint16_t. */
393e60fbd5bSAdrien Mazarguil 	if (max >= 65535)
394e60fbd5bSAdrien Mazarguil 		max = 65535;
395e60fbd5bSAdrien Mazarguil 	info->max_rx_queues = max;
396e60fbd5bSAdrien Mazarguil 	info->max_tx_queues = max;
3970497ddaaSYaacov Hazan 	info->max_mac_addrs = RTE_DIM(priv->mac);
39817b843ebSShahaf Shuler 	info->rx_queue_offload_capa =
39917b843ebSShahaf Shuler 		mlx5_priv_get_rx_queue_offloads(priv);
40017b843ebSShahaf Shuler 	info->rx_offload_capa = (mlx5_priv_get_rx_port_offloads(priv) |
40117b843ebSShahaf Shuler 				 info->rx_queue_offload_capa);
402dbccb4cdSShahaf Shuler 	info->tx_offload_capa = mlx5_priv_get_tx_port_offloads(priv);
403e60fbd5bSAdrien Mazarguil 	if (priv_get_ifname(priv, &ifname) == 0)
404e60fbd5bSAdrien Mazarguil 		info->if_index = if_nametoindex(ifname);
405d365210eSYongseok Koh 	info->reta_size = priv->reta_idx_n ?
4067fe24446SShahaf Shuler 		priv->reta_idx_n : config->ind_table_max_size;
40729c1d8bbSNélio Laranjeiro 	info->hash_key_size = priv->rss_conf.rss_key_len;
40875ef62a9SNélio Laranjeiro 	info->speed_capa = priv->link_speed_capa;
409b233b027SShahaf Shuler 	info->flow_type_rss_offloads = ~MLX5_RSS_HF_MASK;
410e60fbd5bSAdrien Mazarguil }
411e60fbd5bSAdrien Mazarguil 
412fb732b0aSNélio Laranjeiro /**
413fb732b0aSNélio Laranjeiro  * Get supported packet types.
414fb732b0aSNélio Laranjeiro  *
415fb732b0aSNélio Laranjeiro  * @param dev
416fb732b0aSNélio Laranjeiro  *   Pointer to Ethernet device structure.
417fb732b0aSNélio Laranjeiro  *
418fb732b0aSNélio Laranjeiro  * @return
419fb732b0aSNélio Laranjeiro  *   A pointer to the supported Packet types array.
420fb732b0aSNélio Laranjeiro  */
42178a38edfSJianfeng Tan const uint32_t *
42278a38edfSJianfeng Tan mlx5_dev_supported_ptypes_get(struct rte_eth_dev *dev)
42378a38edfSJianfeng Tan {
42478a38edfSJianfeng Tan 	static const uint32_t ptypes[] = {
42578a38edfSJianfeng Tan 		/* refers to rxq_cq_to_pkt_type() */
426ea16068cSYongseok Koh 		RTE_PTYPE_L2_ETHER,
427c4ba5434SNélio Laranjeiro 		RTE_PTYPE_L3_IPV4_EXT_UNKNOWN,
428c4ba5434SNélio Laranjeiro 		RTE_PTYPE_L3_IPV6_EXT_UNKNOWN,
429ea16068cSYongseok Koh 		RTE_PTYPE_L4_NONFRAG,
430ea16068cSYongseok Koh 		RTE_PTYPE_L4_FRAG,
431ea16068cSYongseok Koh 		RTE_PTYPE_L4_TCP,
432ea16068cSYongseok Koh 		RTE_PTYPE_L4_UDP,
433c4ba5434SNélio Laranjeiro 		RTE_PTYPE_INNER_L3_IPV4_EXT_UNKNOWN,
434c4ba5434SNélio Laranjeiro 		RTE_PTYPE_INNER_L3_IPV6_EXT_UNKNOWN,
435ea16068cSYongseok Koh 		RTE_PTYPE_INNER_L4_NONFRAG,
436ea16068cSYongseok Koh 		RTE_PTYPE_INNER_L4_FRAG,
437ea16068cSYongseok Koh 		RTE_PTYPE_INNER_L4_TCP,
438ea16068cSYongseok Koh 		RTE_PTYPE_INNER_L4_UDP,
43978a38edfSJianfeng Tan 		RTE_PTYPE_UNKNOWN
44078a38edfSJianfeng Tan 	};
44178a38edfSJianfeng Tan 
4426cb559d6SYongseok Koh 	if (dev->rx_pkt_burst == mlx5_rx_burst ||
4436cb559d6SYongseok Koh 	    dev->rx_pkt_burst == mlx5_rx_burst_vec)
44478a38edfSJianfeng Tan 		return ptypes;
44578a38edfSJianfeng Tan 	return NULL;
44678a38edfSJianfeng Tan }
44778a38edfSJianfeng Tan 
448e60fbd5bSAdrien Mazarguil /**
4492c960a51SMatthieu Ternisien d'Ouville  * DPDK callback to retrieve physical link information.
450cb8faed7SAdrien Mazarguil  *
451cb8faed7SAdrien Mazarguil  * @param dev
452cb8faed7SAdrien Mazarguil  *   Pointer to Ethernet device structure.
453fb732b0aSNélio Laranjeiro  *
454fb732b0aSNélio Laranjeiro  * @return
455fb732b0aSNélio Laranjeiro  *   0 on success, -1 on error.
456cb8faed7SAdrien Mazarguil  */
45718840871SNélio Laranjeiro static int
45856f08e16SNélio Laranjeiro mlx5_link_update_unlocked_gset(struct rte_eth_dev *dev)
459cb8faed7SAdrien Mazarguil {
46001d79216SNélio Laranjeiro 	struct priv *priv = dev->data->dev_private;
461cb8faed7SAdrien Mazarguil 	struct ethtool_cmd edata = {
46275ef62a9SNélio Laranjeiro 		.cmd = ETHTOOL_GSET /* Deprecated since Linux v4.5. */
463cb8faed7SAdrien Mazarguil 	};
464cb8faed7SAdrien Mazarguil 	struct ifreq ifr;
465cb8faed7SAdrien Mazarguil 	struct rte_eth_link dev_link;
466cb8faed7SAdrien Mazarguil 	int link_speed = 0;
467cb8faed7SAdrien Mazarguil 
468cb8faed7SAdrien Mazarguil 	if (priv_ifreq(priv, SIOCGIFFLAGS, &ifr)) {
469cb8faed7SAdrien Mazarguil 		WARN("ioctl(SIOCGIFFLAGS) failed: %s", strerror(errno));
470cb8faed7SAdrien Mazarguil 		return -1;
471cb8faed7SAdrien Mazarguil 	}
472cb8faed7SAdrien Mazarguil 	memset(&dev_link, 0, sizeof(dev_link));
473cb8faed7SAdrien Mazarguil 	dev_link.link_status = ((ifr.ifr_flags & IFF_UP) &&
474cb8faed7SAdrien Mazarguil 				(ifr.ifr_flags & IFF_RUNNING));
475d06c608cSAdrien Mazarguil 	ifr.ifr_data = (void *)&edata;
476cb8faed7SAdrien Mazarguil 	if (priv_ifreq(priv, SIOCETHTOOL, &ifr)) {
477cb8faed7SAdrien Mazarguil 		WARN("ioctl(SIOCETHTOOL, ETHTOOL_GSET) failed: %s",
478cb8faed7SAdrien Mazarguil 		     strerror(errno));
479cb8faed7SAdrien Mazarguil 		return -1;
480cb8faed7SAdrien Mazarguil 	}
481cb8faed7SAdrien Mazarguil 	link_speed = ethtool_cmd_speed(&edata);
482cb8faed7SAdrien Mazarguil 	if (link_speed == -1)
483cb8faed7SAdrien Mazarguil 		dev_link.link_speed = 0;
484cb8faed7SAdrien Mazarguil 	else
485cb8faed7SAdrien Mazarguil 		dev_link.link_speed = link_speed;
48675ef62a9SNélio Laranjeiro 	priv->link_speed_capa = 0;
48775ef62a9SNélio Laranjeiro 	if (edata.supported & SUPPORTED_Autoneg)
48875ef62a9SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_AUTONEG;
48975ef62a9SNélio Laranjeiro 	if (edata.supported & (SUPPORTED_1000baseT_Full |
49075ef62a9SNélio Laranjeiro 			       SUPPORTED_1000baseKX_Full))
49175ef62a9SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_1G;
49275ef62a9SNélio Laranjeiro 	if (edata.supported & SUPPORTED_10000baseKR_Full)
49375ef62a9SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_10G;
49475ef62a9SNélio Laranjeiro 	if (edata.supported & (SUPPORTED_40000baseKR4_Full |
49575ef62a9SNélio Laranjeiro 			       SUPPORTED_40000baseCR4_Full |
49675ef62a9SNélio Laranjeiro 			       SUPPORTED_40000baseSR4_Full |
49775ef62a9SNélio Laranjeiro 			       SUPPORTED_40000baseLR4_Full))
49875ef62a9SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_40G;
499cb8faed7SAdrien Mazarguil 	dev_link.link_duplex = ((edata.duplex == DUPLEX_HALF) ?
500cb8faed7SAdrien Mazarguil 				ETH_LINK_HALF_DUPLEX : ETH_LINK_FULL_DUPLEX);
50182113036SMarc Sune 	dev_link.link_autoneg = !(dev->data->dev_conf.link_speeds &
50282113036SMarc Sune 			ETH_LINK_SPEED_FIXED);
503cb8faed7SAdrien Mazarguil 	if (memcmp(&dev_link, &dev->data->dev_link, sizeof(dev_link))) {
504cb8faed7SAdrien Mazarguil 		/* Link status changed. */
505cb8faed7SAdrien Mazarguil 		dev->data->dev_link = dev_link;
506cb8faed7SAdrien Mazarguil 		return 0;
507cb8faed7SAdrien Mazarguil 	}
508cb8faed7SAdrien Mazarguil 	/* Link status is still the same. */
509cb8faed7SAdrien Mazarguil 	return -1;
510cb8faed7SAdrien Mazarguil }
511cb8faed7SAdrien Mazarguil 
512cb8faed7SAdrien Mazarguil /**
5133a49ffe3SShahaf Shuler  * Retrieve physical link information (unlocked version using new ioctl).
51418840871SNélio Laranjeiro  *
51518840871SNélio Laranjeiro  * @param dev
51618840871SNélio Laranjeiro  *   Pointer to Ethernet device structure.
517fb732b0aSNélio Laranjeiro  *
518fb732b0aSNélio Laranjeiro  * @return
519fb732b0aSNélio Laranjeiro  *   0 on success, -1 on error.
52018840871SNélio Laranjeiro  */
52118840871SNélio Laranjeiro static int
52256f08e16SNélio Laranjeiro mlx5_link_update_unlocked_gs(struct rte_eth_dev *dev)
52318840871SNélio Laranjeiro {
52401d79216SNélio Laranjeiro 	struct priv *priv = dev->data->dev_private;
52537a4406cSNélio Laranjeiro 	struct ethtool_link_settings gcmd = { .cmd = ETHTOOL_GLINKSETTINGS };
52618840871SNélio Laranjeiro 	struct ifreq ifr;
52718840871SNélio Laranjeiro 	struct rte_eth_link dev_link;
52818840871SNélio Laranjeiro 	uint64_t sc;
52918840871SNélio Laranjeiro 
53018840871SNélio Laranjeiro 	if (priv_ifreq(priv, SIOCGIFFLAGS, &ifr)) {
53118840871SNélio Laranjeiro 		WARN("ioctl(SIOCGIFFLAGS) failed: %s", strerror(errno));
53218840871SNélio Laranjeiro 		return -1;
53318840871SNélio Laranjeiro 	}
53418840871SNélio Laranjeiro 	memset(&dev_link, 0, sizeof(dev_link));
53518840871SNélio Laranjeiro 	dev_link.link_status = ((ifr.ifr_flags & IFF_UP) &&
53618840871SNélio Laranjeiro 				(ifr.ifr_flags & IFF_RUNNING));
53737a4406cSNélio Laranjeiro 	ifr.ifr_data = (void *)&gcmd;
53818840871SNélio Laranjeiro 	if (priv_ifreq(priv, SIOCETHTOOL, &ifr)) {
53918840871SNélio Laranjeiro 		DEBUG("ioctl(SIOCETHTOOL, ETHTOOL_GLINKSETTINGS) failed: %s",
54018840871SNélio Laranjeiro 		      strerror(errno));
54118840871SNélio Laranjeiro 		return -1;
54218840871SNélio Laranjeiro 	}
54337a4406cSNélio Laranjeiro 	gcmd.link_mode_masks_nwords = -gcmd.link_mode_masks_nwords;
54437a4406cSNélio Laranjeiro 
54537a4406cSNélio Laranjeiro 	alignas(struct ethtool_link_settings)
54637a4406cSNélio Laranjeiro 	uint8_t data[offsetof(struct ethtool_link_settings, link_mode_masks) +
54737a4406cSNélio Laranjeiro 		     sizeof(uint32_t) * gcmd.link_mode_masks_nwords * 3];
54837a4406cSNélio Laranjeiro 	struct ethtool_link_settings *ecmd = (void *)data;
54937a4406cSNélio Laranjeiro 
55037a4406cSNélio Laranjeiro 	*ecmd = gcmd;
55137a4406cSNélio Laranjeiro 	ifr.ifr_data = (void *)ecmd;
552ef09a7fcSGowrishankar Muthukrishnan 	if (priv_ifreq(priv, SIOCETHTOOL, &ifr)) {
553ef09a7fcSGowrishankar Muthukrishnan 		DEBUG("ioctl(SIOCETHTOOL, ETHTOOL_GLINKSETTINGS) failed: %s",
554ef09a7fcSGowrishankar Muthukrishnan 		      strerror(errno));
555ef09a7fcSGowrishankar Muthukrishnan 		return -1;
556ef09a7fcSGowrishankar Muthukrishnan 	}
55790260d57SNélio Laranjeiro 	dev_link.link_speed = ecmd->speed;
55890260d57SNélio Laranjeiro 	sc = ecmd->link_mode_masks[0] |
55990260d57SNélio Laranjeiro 		((uint64_t)ecmd->link_mode_masks[1] << 32);
56018840871SNélio Laranjeiro 	priv->link_speed_capa = 0;
561b113cb5eSEdward Makarov 	if (sc & MLX5_BITSHIFT(ETHTOOL_LINK_MODE_Autoneg_BIT))
56218840871SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_AUTONEG;
563b113cb5eSEdward Makarov 	if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_1000baseT_Full_BIT) |
564b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_1000baseKX_Full_BIT)))
56518840871SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_1G;
566b113cb5eSEdward Makarov 	if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_10000baseKX4_Full_BIT) |
567b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_10000baseKR_Full_BIT) |
568b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_10000baseR_FEC_BIT)))
56918840871SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_10G;
570b113cb5eSEdward Makarov 	if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_20000baseMLD2_Full_BIT) |
571b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_20000baseKR2_Full_BIT)))
57218840871SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_20G;
573b113cb5eSEdward Makarov 	if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_40000baseKR4_Full_BIT) |
574b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_40000baseCR4_Full_BIT) |
575b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_40000baseSR4_Full_BIT) |
576b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_40000baseLR4_Full_BIT)))
57718840871SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_40G;
578b113cb5eSEdward Makarov 	if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_56000baseKR4_Full_BIT) |
579b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_56000baseCR4_Full_BIT) |
580b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_56000baseSR4_Full_BIT) |
581b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_56000baseLR4_Full_BIT)))
58218840871SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_56G;
583b113cb5eSEdward Makarov 	if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_25000baseCR_Full_BIT) |
584b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_25000baseKR_Full_BIT) |
585b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_25000baseSR_Full_BIT)))
58618840871SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_25G;
587b113cb5eSEdward Makarov 	if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_50000baseCR2_Full_BIT) |
588b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_50000baseKR2_Full_BIT)))
58918840871SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_50G;
590b113cb5eSEdward Makarov 	if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_100000baseKR4_Full_BIT) |
591b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_100000baseSR4_Full_BIT) |
592b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_100000baseCR4_Full_BIT) |
593b113cb5eSEdward Makarov 		  MLX5_BITSHIFT(ETHTOOL_LINK_MODE_100000baseLR4_ER4_Full_BIT)))
59418840871SNélio Laranjeiro 		priv->link_speed_capa |= ETH_LINK_SPEED_100G;
59590260d57SNélio Laranjeiro 	dev_link.link_duplex = ((ecmd->duplex == DUPLEX_HALF) ?
59618840871SNélio Laranjeiro 				ETH_LINK_HALF_DUPLEX : ETH_LINK_FULL_DUPLEX);
59718840871SNélio Laranjeiro 	dev_link.link_autoneg = !(dev->data->dev_conf.link_speeds &
59818840871SNélio Laranjeiro 				  ETH_LINK_SPEED_FIXED);
59918840871SNélio Laranjeiro 	if (memcmp(&dev_link, &dev->data->dev_link, sizeof(dev_link))) {
60018840871SNélio Laranjeiro 		/* Link status changed. */
60118840871SNélio Laranjeiro 		dev->data->dev_link = dev_link;
60218840871SNélio Laranjeiro 		return 0;
60318840871SNélio Laranjeiro 	}
60418840871SNélio Laranjeiro 	/* Link status is still the same. */
60518840871SNélio Laranjeiro 	return -1;
60618840871SNélio Laranjeiro }
60718840871SNélio Laranjeiro 
60818840871SNélio Laranjeiro /**
609c7bf6225SYongseok Koh  * Enable receiving and transmitting traffic.
610c7bf6225SYongseok Koh  *
611c7bf6225SYongseok Koh  * @param priv
612c7bf6225SYongseok Koh  *   Pointer to private structure.
613c7bf6225SYongseok Koh  */
614c7bf6225SYongseok Koh static void
615c7bf6225SYongseok Koh priv_link_start(struct priv *priv)
616c7bf6225SYongseok Koh {
617c7bf6225SYongseok Koh 	struct rte_eth_dev *dev = priv->dev;
618c7bf6225SYongseok Koh 	int err;
619c7bf6225SYongseok Koh 
620c7bf6225SYongseok Koh 	dev->tx_pkt_burst = priv_select_tx_function(priv, dev);
621c7bf6225SYongseok Koh 	dev->rx_pkt_burst = priv_select_rx_function(priv, dev);
622c7bf6225SYongseok Koh 	err = priv_dev_traffic_enable(priv, dev);
623c7bf6225SYongseok Koh 	if (err)
624c7bf6225SYongseok Koh 		ERROR("%p: error occurred while configuring control flows: %s",
625c7bf6225SYongseok Koh 		      (void *)priv, strerror(err));
626c7bf6225SYongseok Koh 	err = priv_flow_start(priv, &priv->flows);
627c7bf6225SYongseok Koh 	if (err)
628c7bf6225SYongseok Koh 		ERROR("%p: error occurred while configuring flows: %s",
629c7bf6225SYongseok Koh 		      (void *)priv, strerror(err));
630c7bf6225SYongseok Koh }
631c7bf6225SYongseok Koh 
632c7bf6225SYongseok Koh /**
633c7bf6225SYongseok Koh  * Disable receiving and transmitting traffic.
634c7bf6225SYongseok Koh  *
635c7bf6225SYongseok Koh  * @param priv
636c7bf6225SYongseok Koh  *   Pointer to private structure.
637c7bf6225SYongseok Koh  */
638c7bf6225SYongseok Koh static void
639c7bf6225SYongseok Koh priv_link_stop(struct priv *priv)
640c7bf6225SYongseok Koh {
641c7bf6225SYongseok Koh 	struct rte_eth_dev *dev = priv->dev;
642c7bf6225SYongseok Koh 
643c7bf6225SYongseok Koh 	priv_flow_stop(priv, &priv->flows);
644c7bf6225SYongseok Koh 	priv_dev_traffic_disable(priv, dev);
645c7bf6225SYongseok Koh 	dev->rx_pkt_burst = removed_rx_burst;
646c7bf6225SYongseok Koh 	dev->tx_pkt_burst = removed_tx_burst;
647c7bf6225SYongseok Koh }
648c7bf6225SYongseok Koh 
649c7bf6225SYongseok Koh /**
650c7bf6225SYongseok Koh  * Retrieve physical link information and update rx/tx_pkt_burst callbacks
651c7bf6225SYongseok Koh  * accordingly.
652c7bf6225SYongseok Koh  *
653c7bf6225SYongseok Koh  * @param priv
654c7bf6225SYongseok Koh  *   Pointer to private structure.
655c7bf6225SYongseok Koh  * @param wait_to_complete
656c7bf6225SYongseok Koh  *   Wait for request completion (ignored).
657c7bf6225SYongseok Koh  */
658c7bf6225SYongseok Koh int
65956f08e16SNélio Laranjeiro priv_link_update(struct priv *priv, int wait_to_complete __rte_unused)
660c7bf6225SYongseok Koh {
661c7bf6225SYongseok Koh 	struct rte_eth_dev *dev = priv->dev;
662c7bf6225SYongseok Koh 	struct utsname utsname;
663c7bf6225SYongseok Koh 	int ver[3];
664c7bf6225SYongseok Koh 	int ret;
665c7bf6225SYongseok Koh 	struct rte_eth_link dev_link = dev->data->dev_link;
666c7bf6225SYongseok Koh 
667c7bf6225SYongseok Koh 	if (uname(&utsname) == -1 ||
668c7bf6225SYongseok Koh 	    sscanf(utsname.release, "%d.%d.%d",
669c7bf6225SYongseok Koh 		   &ver[0], &ver[1], &ver[2]) != 3 ||
670c7bf6225SYongseok Koh 	    KERNEL_VERSION(ver[0], ver[1], ver[2]) < KERNEL_VERSION(4, 9, 0))
67156f08e16SNélio Laranjeiro 		ret = mlx5_link_update_unlocked_gset(dev);
672c7bf6225SYongseok Koh 	else
67356f08e16SNélio Laranjeiro 		ret = mlx5_link_update_unlocked_gs(dev);
674c7bf6225SYongseok Koh 	/* If lsc interrupt is disabled, should always be ready for traffic. */
675c7bf6225SYongseok Koh 	if (!dev->data->dev_conf.intr_conf.lsc) {
676c7bf6225SYongseok Koh 		priv_link_start(priv);
677c7bf6225SYongseok Koh 		return ret;
678c7bf6225SYongseok Koh 	}
679c7bf6225SYongseok Koh 	/* Re-select burst callbacks only if link status has been changed. */
680c7bf6225SYongseok Koh 	if (!ret && dev_link.link_status != dev->data->dev_link.link_status) {
681c7bf6225SYongseok Koh 		if (dev->data->dev_link.link_status == ETH_LINK_UP)
682c7bf6225SYongseok Koh 			priv_link_start(priv);
683c7bf6225SYongseok Koh 		else
684c7bf6225SYongseok Koh 			priv_link_stop(priv);
685c7bf6225SYongseok Koh 	}
686c7bf6225SYongseok Koh 	return ret;
687c7bf6225SYongseok Koh }
688c7bf6225SYongseok Koh 
689c7bf6225SYongseok Koh /**
690e313ef4cSShahaf Shuler  * Querying the link status till it changes to the desired state.
691e313ef4cSShahaf Shuler  * Number of query attempts is bounded by MLX5_MAX_LINK_QUERY_ATTEMPTS.
692e313ef4cSShahaf Shuler  *
693e313ef4cSShahaf Shuler  * @param priv
694e313ef4cSShahaf Shuler  *   Pointer to private structure.
695e313ef4cSShahaf Shuler  * @param status
696e313ef4cSShahaf Shuler  *   Link desired status.
697e313ef4cSShahaf Shuler  *
698e313ef4cSShahaf Shuler  * @return
699e313ef4cSShahaf Shuler  *   0 on success, negative errno value on failure.
700e313ef4cSShahaf Shuler  */
701e313ef4cSShahaf Shuler int
702e313ef4cSShahaf Shuler priv_force_link_status_change(struct priv *priv, int status)
703e313ef4cSShahaf Shuler {
704e313ef4cSShahaf Shuler 	int try = 0;
705e313ef4cSShahaf Shuler 
706e313ef4cSShahaf Shuler 	while (try < MLX5_MAX_LINK_QUERY_ATTEMPTS) {
707e313ef4cSShahaf Shuler 		priv_link_update(priv, 0);
708e313ef4cSShahaf Shuler 		if (priv->dev->data->dev_link.link_status == status)
709e313ef4cSShahaf Shuler 			return 0;
710e313ef4cSShahaf Shuler 		try++;
711e313ef4cSShahaf Shuler 		sleep(1);
712e313ef4cSShahaf Shuler 	}
713e313ef4cSShahaf Shuler 	return -EAGAIN;
714e313ef4cSShahaf Shuler }
715e313ef4cSShahaf Shuler 
716e313ef4cSShahaf Shuler /**
717cb8faed7SAdrien Mazarguil  * DPDK callback to retrieve physical link information.
718cb8faed7SAdrien Mazarguil  *
719cb8faed7SAdrien Mazarguil  * @param dev
720cb8faed7SAdrien Mazarguil  *   Pointer to Ethernet device structure.
721cb8faed7SAdrien Mazarguil  * @param wait_to_complete
722cb8faed7SAdrien Mazarguil  *   Wait for request completion (ignored).
723fb732b0aSNélio Laranjeiro  *
724fb732b0aSNélio Laranjeiro  * @return
725fb732b0aSNélio Laranjeiro  *   0 on success, -1 on error.
726cb8faed7SAdrien Mazarguil  */
727cb8faed7SAdrien Mazarguil int
72856f08e16SNélio Laranjeiro mlx5_link_update(struct rte_eth_dev *dev, int wait_to_complete __rte_unused)
729cb8faed7SAdrien Mazarguil {
730c7bf6225SYongseok Koh 	struct priv *priv = dev->data->dev_private;
731c7bf6225SYongseok Koh 	int ret;
732cb8faed7SAdrien Mazarguil 
733c7bf6225SYongseok Koh 	ret = priv_link_update(priv, wait_to_complete);
734c7bf6225SYongseok Koh 	return ret;
735cb8faed7SAdrien Mazarguil }
736cb8faed7SAdrien Mazarguil 
737cb8faed7SAdrien Mazarguil /**
738cf37ca95SAdrien Mazarguil  * DPDK callback to change the MTU.
739cf37ca95SAdrien Mazarguil  *
740cf37ca95SAdrien Mazarguil  * @param dev
741cf37ca95SAdrien Mazarguil  *   Pointer to Ethernet device structure.
742cf37ca95SAdrien Mazarguil  * @param in_mtu
743cf37ca95SAdrien Mazarguil  *   New MTU.
744cf37ca95SAdrien Mazarguil  *
745cf37ca95SAdrien Mazarguil  * @return
746cf37ca95SAdrien Mazarguil  *   0 on success, negative errno value on failure.
747cf37ca95SAdrien Mazarguil  */
748cf37ca95SAdrien Mazarguil int
749cf37ca95SAdrien Mazarguil mlx5_dev_set_mtu(struct rte_eth_dev *dev, uint16_t mtu)
750cf37ca95SAdrien Mazarguil {
751cf37ca95SAdrien Mazarguil 	struct priv *priv = dev->data->dev_private;
752a0edafe4SNelio Laranjeiro 	uint16_t kern_mtu;
753cf37ca95SAdrien Mazarguil 	int ret = 0;
754cf37ca95SAdrien Mazarguil 
755a0edafe4SNelio Laranjeiro 	ret = priv_get_mtu(priv, &kern_mtu);
756a0edafe4SNelio Laranjeiro 	if (ret)
757a0edafe4SNelio Laranjeiro 		goto out;
758cf37ca95SAdrien Mazarguil 	/* Set kernel interface MTU first. */
759a0edafe4SNelio Laranjeiro 	ret = priv_set_mtu(priv, mtu);
760a0edafe4SNelio Laranjeiro 	if (ret)
761a0edafe4SNelio Laranjeiro 		goto out;
762a0edafe4SNelio Laranjeiro 	ret = priv_get_mtu(priv, &kern_mtu);
763a0edafe4SNelio Laranjeiro 	if (ret)
764a0edafe4SNelio Laranjeiro 		goto out;
765a0edafe4SNelio Laranjeiro 	if (kern_mtu == mtu) {
766a0edafe4SNelio Laranjeiro 		priv->mtu = mtu;
767a0edafe4SNelio Laranjeiro 		DEBUG("adapter port %u MTU set to %u", priv->port, mtu);
768a0edafe4SNelio Laranjeiro 	}
769a0edafe4SNelio Laranjeiro 	return 0;
770a0edafe4SNelio Laranjeiro out:
771cf37ca95SAdrien Mazarguil 	ret = errno;
772cf37ca95SAdrien Mazarguil 	WARN("cannot set port %u MTU to %u: %s", priv->port, mtu,
773cf37ca95SAdrien Mazarguil 	     strerror(ret));
774cf37ca95SAdrien Mazarguil 	assert(ret >= 0);
775cf37ca95SAdrien Mazarguil 	return -ret;
776cf37ca95SAdrien Mazarguil }
777cf37ca95SAdrien Mazarguil 
778cf37ca95SAdrien Mazarguil /**
77902d75430SAdrien Mazarguil  * DPDK callback to get flow control status.
78002d75430SAdrien Mazarguil  *
78102d75430SAdrien Mazarguil  * @param dev
78202d75430SAdrien Mazarguil  *   Pointer to Ethernet device structure.
78302d75430SAdrien Mazarguil  * @param[out] fc_conf
78402d75430SAdrien Mazarguil  *   Flow control output buffer.
78502d75430SAdrien Mazarguil  *
78602d75430SAdrien Mazarguil  * @return
78702d75430SAdrien Mazarguil  *   0 on success, negative errno value on failure.
78802d75430SAdrien Mazarguil  */
78902d75430SAdrien Mazarguil int
79002d75430SAdrien Mazarguil mlx5_dev_get_flow_ctrl(struct rte_eth_dev *dev, struct rte_eth_fc_conf *fc_conf)
79102d75430SAdrien Mazarguil {
79202d75430SAdrien Mazarguil 	struct priv *priv = dev->data->dev_private;
79302d75430SAdrien Mazarguil 	struct ifreq ifr;
79402d75430SAdrien Mazarguil 	struct ethtool_pauseparam ethpause = {
79502d75430SAdrien Mazarguil 		.cmd = ETHTOOL_GPAUSEPARAM
79602d75430SAdrien Mazarguil 	};
79702d75430SAdrien Mazarguil 	int ret;
79802d75430SAdrien Mazarguil 
799d06c608cSAdrien Mazarguil 	ifr.ifr_data = (void *)&ethpause;
80002d75430SAdrien Mazarguil 	if (priv_ifreq(priv, SIOCETHTOOL, &ifr)) {
80102d75430SAdrien Mazarguil 		ret = errno;
80202d75430SAdrien Mazarguil 		WARN("ioctl(SIOCETHTOOL, ETHTOOL_GPAUSEPARAM)"
80302d75430SAdrien Mazarguil 		     " failed: %s",
80402d75430SAdrien Mazarguil 		     strerror(ret));
80502d75430SAdrien Mazarguil 		goto out;
80602d75430SAdrien Mazarguil 	}
80702d75430SAdrien Mazarguil 	fc_conf->autoneg = ethpause.autoneg;
80802d75430SAdrien Mazarguil 	if (ethpause.rx_pause && ethpause.tx_pause)
80902d75430SAdrien Mazarguil 		fc_conf->mode = RTE_FC_FULL;
81002d75430SAdrien Mazarguil 	else if (ethpause.rx_pause)
81102d75430SAdrien Mazarguil 		fc_conf->mode = RTE_FC_RX_PAUSE;
81202d75430SAdrien Mazarguil 	else if (ethpause.tx_pause)
81302d75430SAdrien Mazarguil 		fc_conf->mode = RTE_FC_TX_PAUSE;
81402d75430SAdrien Mazarguil 	else
81502d75430SAdrien Mazarguil 		fc_conf->mode = RTE_FC_NONE;
81602d75430SAdrien Mazarguil 	ret = 0;
81702d75430SAdrien Mazarguil out:
81802d75430SAdrien Mazarguil 	assert(ret >= 0);
81902d75430SAdrien Mazarguil 	return -ret;
82002d75430SAdrien Mazarguil }
82102d75430SAdrien Mazarguil 
82202d75430SAdrien Mazarguil /**
82302d75430SAdrien Mazarguil  * DPDK callback to modify flow control parameters.
82402d75430SAdrien Mazarguil  *
82502d75430SAdrien Mazarguil  * @param dev
82602d75430SAdrien Mazarguil  *   Pointer to Ethernet device structure.
82702d75430SAdrien Mazarguil  * @param[in] fc_conf
82802d75430SAdrien Mazarguil  *   Flow control parameters.
82902d75430SAdrien Mazarguil  *
83002d75430SAdrien Mazarguil  * @return
83102d75430SAdrien Mazarguil  *   0 on success, negative errno value on failure.
83202d75430SAdrien Mazarguil  */
83302d75430SAdrien Mazarguil int
83402d75430SAdrien Mazarguil mlx5_dev_set_flow_ctrl(struct rte_eth_dev *dev, struct rte_eth_fc_conf *fc_conf)
83502d75430SAdrien Mazarguil {
83602d75430SAdrien Mazarguil 	struct priv *priv = dev->data->dev_private;
83702d75430SAdrien Mazarguil 	struct ifreq ifr;
83802d75430SAdrien Mazarguil 	struct ethtool_pauseparam ethpause = {
83902d75430SAdrien Mazarguil 		.cmd = ETHTOOL_SPAUSEPARAM
84002d75430SAdrien Mazarguil 	};
84102d75430SAdrien Mazarguil 	int ret;
84202d75430SAdrien Mazarguil 
843d06c608cSAdrien Mazarguil 	ifr.ifr_data = (void *)&ethpause;
84402d75430SAdrien Mazarguil 	ethpause.autoneg = fc_conf->autoneg;
84502d75430SAdrien Mazarguil 	if (((fc_conf->mode & RTE_FC_FULL) == RTE_FC_FULL) ||
84602d75430SAdrien Mazarguil 	    (fc_conf->mode & RTE_FC_RX_PAUSE))
84702d75430SAdrien Mazarguil 		ethpause.rx_pause = 1;
84802d75430SAdrien Mazarguil 	else
84902d75430SAdrien Mazarguil 		ethpause.rx_pause = 0;
85002d75430SAdrien Mazarguil 
85102d75430SAdrien Mazarguil 	if (((fc_conf->mode & RTE_FC_FULL) == RTE_FC_FULL) ||
85202d75430SAdrien Mazarguil 	    (fc_conf->mode & RTE_FC_TX_PAUSE))
85302d75430SAdrien Mazarguil 		ethpause.tx_pause = 1;
85402d75430SAdrien Mazarguil 	else
85502d75430SAdrien Mazarguil 		ethpause.tx_pause = 0;
85602d75430SAdrien Mazarguil 	if (priv_ifreq(priv, SIOCETHTOOL, &ifr)) {
85702d75430SAdrien Mazarguil 		ret = errno;
85802d75430SAdrien Mazarguil 		WARN("ioctl(SIOCETHTOOL, ETHTOOL_SPAUSEPARAM)"
85902d75430SAdrien Mazarguil 		     " failed: %s",
86002d75430SAdrien Mazarguil 		     strerror(ret));
86102d75430SAdrien Mazarguil 		goto out;
86202d75430SAdrien Mazarguil 	}
86302d75430SAdrien Mazarguil 	ret = 0;
86402d75430SAdrien Mazarguil out:
86502d75430SAdrien Mazarguil 	assert(ret >= 0);
86602d75430SAdrien Mazarguil 	return -ret;
86702d75430SAdrien Mazarguil }
86802d75430SAdrien Mazarguil 
86902d75430SAdrien Mazarguil /**
870771fa900SAdrien Mazarguil  * Get PCI information from struct ibv_device.
871771fa900SAdrien Mazarguil  *
872771fa900SAdrien Mazarguil  * @param device
873771fa900SAdrien Mazarguil  *   Pointer to Ethernet device structure.
874771fa900SAdrien Mazarguil  * @param[out] pci_addr
875771fa900SAdrien Mazarguil  *   PCI bus address output buffer.
876771fa900SAdrien Mazarguil  *
877771fa900SAdrien Mazarguil  * @return
878771fa900SAdrien Mazarguil  *   0 on success, -1 on failure and errno is set.
879771fa900SAdrien Mazarguil  */
880771fa900SAdrien Mazarguil int
881771fa900SAdrien Mazarguil mlx5_ibv_device_to_pci_addr(const struct ibv_device *device,
882771fa900SAdrien Mazarguil 			    struct rte_pci_addr *pci_addr)
883771fa900SAdrien Mazarguil {
884771fa900SAdrien Mazarguil 	FILE *file;
885771fa900SAdrien Mazarguil 	char line[32];
886771fa900SAdrien Mazarguil 	MKSTR(path, "%s/device/uevent", device->ibdev_path);
887771fa900SAdrien Mazarguil 
888771fa900SAdrien Mazarguil 	file = fopen(path, "rb");
889771fa900SAdrien Mazarguil 	if (file == NULL)
890771fa900SAdrien Mazarguil 		return -1;
891771fa900SAdrien Mazarguil 	while (fgets(line, sizeof(line), file) == line) {
892771fa900SAdrien Mazarguil 		size_t len = strlen(line);
893771fa900SAdrien Mazarguil 		int ret;
894771fa900SAdrien Mazarguil 
895771fa900SAdrien Mazarguil 		/* Truncate long lines. */
896771fa900SAdrien Mazarguil 		if (len == (sizeof(line) - 1))
897771fa900SAdrien Mazarguil 			while (line[(len - 1)] != '\n') {
898771fa900SAdrien Mazarguil 				ret = fgetc(file);
899771fa900SAdrien Mazarguil 				if (ret == EOF)
900771fa900SAdrien Mazarguil 					break;
901771fa900SAdrien Mazarguil 				line[(len - 1)] = ret;
902771fa900SAdrien Mazarguil 			}
903771fa900SAdrien Mazarguil 		/* Extract information. */
904771fa900SAdrien Mazarguil 		if (sscanf(line,
905771fa900SAdrien Mazarguil 			   "PCI_SLOT_NAME="
906463ced95SStephen Hemminger 			   "%" SCNx32 ":%" SCNx8 ":%" SCNx8 ".%" SCNx8 "\n",
907771fa900SAdrien Mazarguil 			   &pci_addr->domain,
908771fa900SAdrien Mazarguil 			   &pci_addr->bus,
909771fa900SAdrien Mazarguil 			   &pci_addr->devid,
910771fa900SAdrien Mazarguil 			   &pci_addr->function) == 4) {
911771fa900SAdrien Mazarguil 			ret = 0;
912771fa900SAdrien Mazarguil 			break;
913771fa900SAdrien Mazarguil 		}
914771fa900SAdrien Mazarguil 	}
915771fa900SAdrien Mazarguil 	fclose(file);
916771fa900SAdrien Mazarguil 	return 0;
917771fa900SAdrien Mazarguil }
918198a3c33SNelio Laranjeiro 
919198a3c33SNelio Laranjeiro /**
920c26ae069SMatan Azrad  * Update the link status.
921198a3c33SNelio Laranjeiro  *
922198a3c33SNelio Laranjeiro  * @param priv
923198a3c33SNelio Laranjeiro  *   Pointer to private structure.
924198a3c33SNelio Laranjeiro  *
925198a3c33SNelio Laranjeiro  * @return
926c26ae069SMatan Azrad  *   Zero if the callback process can be called immediately.
927198a3c33SNelio Laranjeiro  */
928198a3c33SNelio Laranjeiro static int
929c26ae069SMatan Azrad priv_link_status_update(struct priv *priv)
930c26ae069SMatan Azrad {
931c26ae069SMatan Azrad 	struct rte_eth_link *link = &priv->dev->data->dev_link;
932c26ae069SMatan Azrad 
933c7bf6225SYongseok Koh 	priv_link_update(priv, 0);
934c26ae069SMatan Azrad 	if (((link->link_speed == 0) && link->link_status) ||
935c26ae069SMatan Azrad 		((link->link_speed != 0) && !link->link_status)) {
936c26ae069SMatan Azrad 		/*
937c26ae069SMatan Azrad 		 * Inconsistent status. Event likely occurred before the
938c26ae069SMatan Azrad 		 * kernel netdevice exposes the new status.
939c26ae069SMatan Azrad 		 */
940c26ae069SMatan Azrad 		if (!priv->pending_alarm) {
941c26ae069SMatan Azrad 			priv->pending_alarm = 1;
942c26ae069SMatan Azrad 			rte_eal_alarm_set(MLX5_ALARM_TIMEOUT_US,
943c26ae069SMatan Azrad 					  mlx5_dev_link_status_handler,
944c26ae069SMatan Azrad 					  priv->dev);
945c26ae069SMatan Azrad 		}
946c26ae069SMatan Azrad 		return 1;
947c26ae069SMatan Azrad 	} else if (unlikely(priv->pending_alarm)) {
948c26ae069SMatan Azrad 		/* Link interrupt occurred while alarm is already scheduled. */
949c26ae069SMatan Azrad 		priv->pending_alarm = 0;
950c26ae069SMatan Azrad 		rte_eal_alarm_cancel(mlx5_dev_link_status_handler, priv->dev);
951c26ae069SMatan Azrad 	}
952c26ae069SMatan Azrad 	return 0;
953c26ae069SMatan Azrad }
954c26ae069SMatan Azrad 
955c26ae069SMatan Azrad /**
956c26ae069SMatan Azrad  * Device status handler.
957c26ae069SMatan Azrad  *
958c26ae069SMatan Azrad  * @param priv
959c26ae069SMatan Azrad  *   Pointer to private structure.
960c26ae069SMatan Azrad  * @param events
961c26ae069SMatan Azrad  *   Pointer to event flags holder.
962c26ae069SMatan Azrad  *
963c26ae069SMatan Azrad  * @return
964c26ae069SMatan Azrad  *   Events bitmap of callback process which can be called immediately.
965c26ae069SMatan Azrad  */
966c26ae069SMatan Azrad static uint32_t
967c26ae069SMatan Azrad priv_dev_status_handler(struct priv *priv)
968198a3c33SNelio Laranjeiro {
969198a3c33SNelio Laranjeiro 	struct ibv_async_event event;
970c26ae069SMatan Azrad 	uint32_t ret = 0;
971198a3c33SNelio Laranjeiro 
972198a3c33SNelio Laranjeiro 	/* Read all message and acknowledge them. */
973198a3c33SNelio Laranjeiro 	for (;;) {
9740e83b8e5SNelio Laranjeiro 		if (mlx5_glue->get_async_event(priv->ctx, &event))
975198a3c33SNelio Laranjeiro 			break;
976c26ae069SMatan Azrad 		if ((event.event_type == IBV_EVENT_PORT_ACTIVE ||
977c26ae069SMatan Azrad 			event.event_type == IBV_EVENT_PORT_ERR) &&
978c26ae069SMatan Azrad 			(priv->dev->data->dev_conf.intr_conf.lsc == 1))
979c26ae069SMatan Azrad 			ret |= (1 << RTE_ETH_EVENT_INTR_LSC);
9807d7d7ad1SMatan Azrad 		else if (event.event_type == IBV_EVENT_DEVICE_FATAL &&
9817d7d7ad1SMatan Azrad 			priv->dev->data->dev_conf.intr_conf.rmv == 1)
9827d7d7ad1SMatan Azrad 			ret |= (1 << RTE_ETH_EVENT_INTR_RMV);
983c26ae069SMatan Azrad 		else
984198a3c33SNelio Laranjeiro 			DEBUG("event type %d on port %d not handled",
985198a3c33SNelio Laranjeiro 			      event.event_type, event.element.port_num);
9860e83b8e5SNelio Laranjeiro 		mlx5_glue->ack_async_event(&event);
987198a3c33SNelio Laranjeiro 	}
988c26ae069SMatan Azrad 	if (ret & (1 << RTE_ETH_EVENT_INTR_LSC))
989c26ae069SMatan Azrad 		if (priv_link_status_update(priv))
990c26ae069SMatan Azrad 			ret &= ~(1 << RTE_ETH_EVENT_INTR_LSC);
991198a3c33SNelio Laranjeiro 	return ret;
992198a3c33SNelio Laranjeiro }
993198a3c33SNelio Laranjeiro 
994198a3c33SNelio Laranjeiro /**
995198a3c33SNelio Laranjeiro  * Handle delayed link status event.
996198a3c33SNelio Laranjeiro  *
997198a3c33SNelio Laranjeiro  * @param arg
998198a3c33SNelio Laranjeiro  *   Registered argument.
999198a3c33SNelio Laranjeiro  */
1000198a3c33SNelio Laranjeiro void
1001198a3c33SNelio Laranjeiro mlx5_dev_link_status_handler(void *arg)
1002198a3c33SNelio Laranjeiro {
1003198a3c33SNelio Laranjeiro 	struct rte_eth_dev *dev = arg;
1004198a3c33SNelio Laranjeiro 	struct priv *priv = dev->data->dev_private;
1005198a3c33SNelio Laranjeiro 	int ret;
1006198a3c33SNelio Laranjeiro 
1007a9f2fbc4SShahaf Shuler 	priv->pending_alarm = 0;
1008c26ae069SMatan Azrad 	ret = priv_link_status_update(priv);
1009c26ae069SMatan Azrad 	if (!ret)
1010cebe3d7bSThomas Monjalon 		_rte_eth_dev_callback_process(dev, RTE_ETH_EVENT_INTR_LSC, NULL);
1011198a3c33SNelio Laranjeiro }
1012198a3c33SNelio Laranjeiro 
1013198a3c33SNelio Laranjeiro /**
1014198a3c33SNelio Laranjeiro  * Handle interrupts from the NIC.
1015198a3c33SNelio Laranjeiro  *
1016198a3c33SNelio Laranjeiro  * @param[in] intr_handle
1017198a3c33SNelio Laranjeiro  *   Interrupt handler.
1018198a3c33SNelio Laranjeiro  * @param cb_arg
1019198a3c33SNelio Laranjeiro  *   Callback argument.
1020198a3c33SNelio Laranjeiro  */
1021198a3c33SNelio Laranjeiro void
1022c23a1a30SQi Zhang mlx5_dev_interrupt_handler(void *cb_arg)
1023198a3c33SNelio Laranjeiro {
1024198a3c33SNelio Laranjeiro 	struct rte_eth_dev *dev = cb_arg;
1025198a3c33SNelio Laranjeiro 	struct priv *priv = dev->data->dev_private;
1026c26ae069SMatan Azrad 	uint32_t events;
1027198a3c33SNelio Laranjeiro 
1028c26ae069SMatan Azrad 	events = priv_dev_status_handler(priv);
1029c26ae069SMatan Azrad 	if (events & (1 << RTE_ETH_EVENT_INTR_LSC))
1030cebe3d7bSThomas Monjalon 		_rte_eth_dev_callback_process(dev, RTE_ETH_EVENT_INTR_LSC, NULL);
10317d7d7ad1SMatan Azrad 	if (events & (1 << RTE_ETH_EVENT_INTR_RMV))
1032cebe3d7bSThomas Monjalon 		_rte_eth_dev_callback_process(dev, RTE_ETH_EVENT_INTR_RMV, NULL);
1033198a3c33SNelio Laranjeiro }
1034198a3c33SNelio Laranjeiro 
1035198a3c33SNelio Laranjeiro /**
1036f8b9a3baSXueming Li  * Handle interrupts from the socket.
1037f8b9a3baSXueming Li  *
1038f8b9a3baSXueming Li  * @param cb_arg
1039f8b9a3baSXueming Li  *   Callback argument.
1040f8b9a3baSXueming Li  */
1041f8b9a3baSXueming Li static void
1042f8b9a3baSXueming Li mlx5_dev_handler_socket(void *cb_arg)
1043f8b9a3baSXueming Li {
1044f8b9a3baSXueming Li 	struct rte_eth_dev *dev = cb_arg;
1045f8b9a3baSXueming Li 	struct priv *priv = dev->data->dev_private;
1046f8b9a3baSXueming Li 
1047f8b9a3baSXueming Li 	priv_socket_handle(priv);
1048f8b9a3baSXueming Li }
1049f8b9a3baSXueming Li 
1050f8b9a3baSXueming Li /**
1051198a3c33SNelio Laranjeiro  * Uninstall interrupt handler.
1052198a3c33SNelio Laranjeiro  *
1053198a3c33SNelio Laranjeiro  * @param priv
1054198a3c33SNelio Laranjeiro  *   Pointer to private structure.
1055198a3c33SNelio Laranjeiro  * @param dev
1056198a3c33SNelio Laranjeiro  *   Pointer to the rte_eth_dev structure.
1057198a3c33SNelio Laranjeiro  */
1058198a3c33SNelio Laranjeiro void
1059198a3c33SNelio Laranjeiro priv_dev_interrupt_handler_uninstall(struct priv *priv, struct rte_eth_dev *dev)
1060198a3c33SNelio Laranjeiro {
1061f8b9a3baSXueming Li 	if (dev->data->dev_conf.intr_conf.lsc ||
1062f8b9a3baSXueming Li 	    dev->data->dev_conf.intr_conf.rmv)
1063198a3c33SNelio Laranjeiro 		rte_intr_callback_unregister(&priv->intr_handle,
1064f8b9a3baSXueming Li 					     mlx5_dev_interrupt_handler, dev);
1065f8b9a3baSXueming Li 	if (priv->primary_socket)
1066f8b9a3baSXueming Li 		rte_intr_callback_unregister(&priv->intr_handle_socket,
1067f8b9a3baSXueming Li 					     mlx5_dev_handler_socket, dev);
10686817ad38SYongseok Koh 	if (priv->pending_alarm) {
1069198a3c33SNelio Laranjeiro 		priv->pending_alarm = 0;
10706817ad38SYongseok Koh 		rte_eal_alarm_cancel(mlx5_dev_link_status_handler, dev);
10716817ad38SYongseok Koh 	}
1072198a3c33SNelio Laranjeiro 	priv->intr_handle.fd = 0;
107336351ea3SFerruh Yigit 	priv->intr_handle.type = RTE_INTR_HANDLE_UNKNOWN;
1074f8b9a3baSXueming Li 	priv->intr_handle_socket.fd = 0;
1075f8b9a3baSXueming Li 	priv->intr_handle_socket.type = RTE_INTR_HANDLE_UNKNOWN;
1076198a3c33SNelio Laranjeiro }
1077198a3c33SNelio Laranjeiro 
1078198a3c33SNelio Laranjeiro /**
1079198a3c33SNelio Laranjeiro  * Install interrupt handler.
1080198a3c33SNelio Laranjeiro  *
1081198a3c33SNelio Laranjeiro  * @param priv
1082198a3c33SNelio Laranjeiro  *   Pointer to private structure.
1083198a3c33SNelio Laranjeiro  * @param dev
1084198a3c33SNelio Laranjeiro  *   Pointer to the rte_eth_dev structure.
1085198a3c33SNelio Laranjeiro  */
1086198a3c33SNelio Laranjeiro void
1087198a3c33SNelio Laranjeiro priv_dev_interrupt_handler_install(struct priv *priv, struct rte_eth_dev *dev)
1088198a3c33SNelio Laranjeiro {
1089198a3c33SNelio Laranjeiro 	int rc, flags;
1090198a3c33SNelio Laranjeiro 
1091198a3c33SNelio Laranjeiro 	assert(priv->ctx->async_fd > 0);
1092198a3c33SNelio Laranjeiro 	flags = fcntl(priv->ctx->async_fd, F_GETFL);
1093198a3c33SNelio Laranjeiro 	rc = fcntl(priv->ctx->async_fd, F_SETFL, flags | O_NONBLOCK);
1094198a3c33SNelio Laranjeiro 	if (rc < 0) {
1095198a3c33SNelio Laranjeiro 		INFO("failed to change file descriptor async event queue");
1096198a3c33SNelio Laranjeiro 		dev->data->dev_conf.intr_conf.lsc = 0;
10977d7d7ad1SMatan Azrad 		dev->data->dev_conf.intr_conf.rmv = 0;
1098f8b9a3baSXueming Li 	}
1099f8b9a3baSXueming Li 	if (dev->data->dev_conf.intr_conf.lsc ||
1100f8b9a3baSXueming Li 	    dev->data->dev_conf.intr_conf.rmv) {
1101198a3c33SNelio Laranjeiro 		priv->intr_handle.fd = priv->ctx->async_fd;
1102198a3c33SNelio Laranjeiro 		priv->intr_handle.type = RTE_INTR_HANDLE_EXT;
1103198a3c33SNelio Laranjeiro 		rte_intr_callback_register(&priv->intr_handle,
1104f8b9a3baSXueming Li 					   mlx5_dev_interrupt_handler, dev);
1105f8b9a3baSXueming Li 	}
1106f8b9a3baSXueming Li 	rc = priv_socket_init(priv);
1107f8b9a3baSXueming Li 	if (!rc && priv->primary_socket) {
1108f8b9a3baSXueming Li 		priv->intr_handle_socket.fd = priv->primary_socket;
1109f8b9a3baSXueming Li 		priv->intr_handle_socket.type = RTE_INTR_HANDLE_EXT;
1110f8b9a3baSXueming Li 		rte_intr_callback_register(&priv->intr_handle_socket,
1111f8b9a3baSXueming Li 					   mlx5_dev_handler_socket, dev);
1112198a3c33SNelio Laranjeiro 	}
1113198a3c33SNelio Laranjeiro }
111462072098SOr Ami 
111562072098SOr Ami /**
111662072098SOr Ami  * Change the link state (UP / DOWN).
111762072098SOr Ami  *
11183d04e050SOlivier Matz  * @param priv
1119aee1b165SXueming Li  *   Pointer to private data structure.
112062072098SOr Ami  * @param up
112162072098SOr Ami  *   Nonzero for link up, otherwise link down.
112262072098SOr Ami  *
112362072098SOr Ami  * @return
112462072098SOr Ami  *   0 on success, errno value on failure.
112562072098SOr Ami  */
112662072098SOr Ami static int
1127c7bf6225SYongseok Koh priv_dev_set_link(struct priv *priv, int up)
112862072098SOr Ami {
1129c7bf6225SYongseok Koh 	return priv_set_flags(priv, ~IFF_UP, up ? IFF_UP : ~IFF_UP);
113062072098SOr Ami }
113162072098SOr Ami 
113262072098SOr Ami /**
113362072098SOr Ami  * DPDK callback to bring the link DOWN.
113462072098SOr Ami  *
113562072098SOr Ami  * @param dev
113662072098SOr Ami  *   Pointer to Ethernet device structure.
113762072098SOr Ami  *
113862072098SOr Ami  * @return
113962072098SOr Ami  *   0 on success, errno value on failure.
114062072098SOr Ami  */
114162072098SOr Ami int
114262072098SOr Ami mlx5_set_link_down(struct rte_eth_dev *dev)
114362072098SOr Ami {
114462072098SOr Ami 	struct priv *priv = dev->data->dev_private;
114562072098SOr Ami 	int err;
114662072098SOr Ami 
1147c7bf6225SYongseok Koh 	err = priv_dev_set_link(priv, 0);
114862072098SOr Ami 	return err;
114962072098SOr Ami }
115062072098SOr Ami 
115162072098SOr Ami /**
115262072098SOr Ami  * DPDK callback to bring the link UP.
115362072098SOr Ami  *
115462072098SOr Ami  * @param dev
115562072098SOr Ami  *   Pointer to Ethernet device structure.
115662072098SOr Ami  *
115762072098SOr Ami  * @return
115862072098SOr Ami  *   0 on success, errno value on failure.
115962072098SOr Ami  */
116062072098SOr Ami int
116162072098SOr Ami mlx5_set_link_up(struct rte_eth_dev *dev)
116262072098SOr Ami {
116362072098SOr Ami 	struct priv *priv = dev->data->dev_private;
116462072098SOr Ami 	int err;
116562072098SOr Ami 
1166c7bf6225SYongseok Koh 	err = priv_dev_set_link(priv, 1);
116762072098SOr Ami 	return err;
116862072098SOr Ami }
1169a48deadaSOr Ami 
1170a48deadaSOr Ami /**
1171cdab90cbSNélio Laranjeiro  * Configure the TX function to use.
1172cdab90cbSNélio Laranjeiro  *
1173cdab90cbSNélio Laranjeiro  * @param priv
1174aee1b165SXueming Li  *   Pointer to private data structure.
1175aee1b165SXueming Li  * @param dev
1176aee1b165SXueming Li  *   Pointer to rte_eth_dev structure.
11771cfa649bSShahaf Shuler  *
11781cfa649bSShahaf Shuler  * @return
11791cfa649bSShahaf Shuler  *   Pointer to selected Tx burst function.
1180cdab90cbSNélio Laranjeiro  */
11811cfa649bSShahaf Shuler eth_tx_burst_t
1182dbccb4cdSShahaf Shuler priv_select_tx_function(struct priv *priv, struct rte_eth_dev *dev)
1183cdab90cbSNélio Laranjeiro {
11841cfa649bSShahaf Shuler 	eth_tx_burst_t tx_pkt_burst = mlx5_tx_burst;
11857fe24446SShahaf Shuler 	struct mlx5_dev_config *config = &priv->config;
1186dbccb4cdSShahaf Shuler 	uint64_t tx_offloads = dev->data->dev_conf.txmode.offloads;
1187dbccb4cdSShahaf Shuler 	int tso = !!(tx_offloads & (DEV_TX_OFFLOAD_TCP_TSO |
1188dbccb4cdSShahaf Shuler 				    DEV_TX_OFFLOAD_VXLAN_TNL_TSO |
1189dbccb4cdSShahaf Shuler 				    DEV_TX_OFFLOAD_GRE_TNL_TSO));
1190dbccb4cdSShahaf Shuler 	int vlan_insert = !!(tx_offloads & DEV_TX_OFFLOAD_VLAN_INSERT);
11911cfa649bSShahaf Shuler 
1192aee1b165SXueming Li 	assert(priv != NULL);
1193230189d9SNélio Laranjeiro 	/* Select appropriate TX function. */
1194dbccb4cdSShahaf Shuler 	if (vlan_insert || tso)
1195dbccb4cdSShahaf Shuler 		return tx_pkt_burst;
11967fe24446SShahaf Shuler 	if (config->mps == MLX5_MPW_ENHANCED) {
1197dbccb4cdSShahaf Shuler 		if (priv_check_vec_tx_support(priv, dev) > 0) {
1198dbccb4cdSShahaf Shuler 			if (priv_check_raw_vec_tx_support(priv, dev) > 0)
11991cfa649bSShahaf Shuler 				tx_pkt_burst = mlx5_tx_burst_raw_vec;
12006cb559d6SYongseok Koh 			else
12011cfa649bSShahaf Shuler 				tx_pkt_burst = mlx5_tx_burst_vec;
12026cb559d6SYongseok Koh 			DEBUG("selected Enhanced MPW TX vectorized function");
12036cb559d6SYongseok Koh 		} else {
12041cfa649bSShahaf Shuler 			tx_pkt_burst = mlx5_tx_burst_empw;
12056ce84bd8SYongseok Koh 			DEBUG("selected Enhanced MPW TX function");
12066cb559d6SYongseok Koh 		}
12077fe24446SShahaf Shuler 	} else if (config->mps && (config->txq_inline > 0)) {
12081cfa649bSShahaf Shuler 		tx_pkt_burst = mlx5_tx_burst_mpw_inline;
1209230189d9SNélio Laranjeiro 		DEBUG("selected MPW inline TX function");
12107fe24446SShahaf Shuler 	} else if (config->mps) {
12111cfa649bSShahaf Shuler 		tx_pkt_burst = mlx5_tx_burst_mpw;
1212230189d9SNélio Laranjeiro 		DEBUG("selected MPW TX function");
12132a66cf37SYaacov Hazan 	}
12141cfa649bSShahaf Shuler 	return tx_pkt_burst;
1215cdab90cbSNélio Laranjeiro }
1216cdab90cbSNélio Laranjeiro 
1217cdab90cbSNélio Laranjeiro /**
1218cdab90cbSNélio Laranjeiro  * Configure the RX function to use.
1219cdab90cbSNélio Laranjeiro  *
1220cdab90cbSNélio Laranjeiro  * @param priv
1221aee1b165SXueming Li  *   Pointer to private data structure.
1222aee1b165SXueming Li  * @param dev
1223aee1b165SXueming Li  *   Pointer to rte_eth_dev structure.
12241cfa649bSShahaf Shuler  *
12251cfa649bSShahaf Shuler  * @return
12261cfa649bSShahaf Shuler  *   Pointer to selected Rx burst function.
1227cdab90cbSNélio Laranjeiro  */
12281cfa649bSShahaf Shuler eth_rx_burst_t
12291cfa649bSShahaf Shuler priv_select_rx_function(struct priv *priv, __rte_unused struct rte_eth_dev *dev)
1230cdab90cbSNélio Laranjeiro {
12311cfa649bSShahaf Shuler 	eth_rx_burst_t rx_pkt_burst = mlx5_rx_burst;
12321cfa649bSShahaf Shuler 
1233aee1b165SXueming Li 	assert(priv != NULL);
12346cb559d6SYongseok Koh 	if (priv_check_vec_rx_support(priv) > 0) {
12351cfa649bSShahaf Shuler 		rx_pkt_burst = mlx5_rx_burst_vec;
12366cb559d6SYongseok Koh 		DEBUG("selected RX vectorized function");
1237cdab90cbSNélio Laranjeiro 	}
12381cfa649bSShahaf Shuler 	return rx_pkt_burst;
12396cb559d6SYongseok Koh }
1240d3e0f392SMatan Azrad 
1241d3e0f392SMatan Azrad /**
1242d3e0f392SMatan Azrad  * Check if mlx5 device was removed.
1243d3e0f392SMatan Azrad  *
1244d3e0f392SMatan Azrad  * @param dev
1245d3e0f392SMatan Azrad  *   Pointer to Ethernet device structure.
1246d3e0f392SMatan Azrad  *
1247d3e0f392SMatan Azrad  * @return
1248d3e0f392SMatan Azrad  *   1 when device is removed, otherwise 0.
1249d3e0f392SMatan Azrad  */
1250d3e0f392SMatan Azrad int
1251d3e0f392SMatan Azrad mlx5_is_removed(struct rte_eth_dev *dev)
1252d3e0f392SMatan Azrad {
1253d3e0f392SMatan Azrad 	struct ibv_device_attr device_attr;
1254d3e0f392SMatan Azrad 	struct priv *priv = dev->data->dev_private;
1255d3e0f392SMatan Azrad 
12560e83b8e5SNelio Laranjeiro 	if (mlx5_glue->query_device(priv->ctx, &device_attr) == EIO)
1257d3e0f392SMatan Azrad 		return 1;
1258d3e0f392SMatan Azrad 	return 0;
1259d3e0f392SMatan Azrad }
1260