18fd92a66SOlivier Matz /* SPDX-License-Identifier: BSD-3-Clause 2771fa900SAdrien Mazarguil * Copyright 2015 6WIND S.A. 3771fa900SAdrien Mazarguil * Copyright 2015 Mellanox. 4771fa900SAdrien Mazarguil */ 5771fa900SAdrien Mazarguil 6f8b9a3baSXueming Li #define _GNU_SOURCE 7f8b9a3baSXueming Li 8771fa900SAdrien Mazarguil #include <stddef.h> 9e60fbd5bSAdrien Mazarguil #include <assert.h> 10*fc40db99SAdrien Mazarguil #include <inttypes.h> 11771fa900SAdrien Mazarguil #include <unistd.h> 12771fa900SAdrien Mazarguil #include <stdint.h> 13771fa900SAdrien Mazarguil #include <stdio.h> 14771fa900SAdrien Mazarguil #include <string.h> 15771fa900SAdrien Mazarguil #include <stdlib.h> 16771fa900SAdrien Mazarguil #include <errno.h> 17771fa900SAdrien Mazarguil #include <dirent.h> 18771fa900SAdrien Mazarguil #include <net/if.h> 19771fa900SAdrien Mazarguil #include <sys/ioctl.h> 20771fa900SAdrien Mazarguil #include <sys/socket.h> 213a49ffe3SShahaf Shuler #include <sys/utsname.h> 22771fa900SAdrien Mazarguil #include <netinet/in.h> 23cb8faed7SAdrien Mazarguil #include <linux/ethtool.h> 24cb8faed7SAdrien Mazarguil #include <linux/sockios.h> 253a49ffe3SShahaf Shuler #include <linux/version.h> 26198a3c33SNelio Laranjeiro #include <fcntl.h> 2790260d57SNélio Laranjeiro #include <stdalign.h> 28f8b9a3baSXueming Li #include <sys/un.h> 29771fa900SAdrien Mazarguil 30771fa900SAdrien Mazarguil #include <rte_atomic.h> 31ffc905f3SFerruh Yigit #include <rte_ethdev_driver.h> 32c752998bSGaetan Rivet #include <rte_bus_pci.h> 33771fa900SAdrien Mazarguil #include <rte_mbuf.h> 34771fa900SAdrien Mazarguil #include <rte_common.h> 35198a3c33SNelio Laranjeiro #include <rte_interrupts.h> 36198a3c33SNelio Laranjeiro #include <rte_alarm.h> 37a48deadaSOr Ami #include <rte_malloc.h> 38771fa900SAdrien Mazarguil 39771fa900SAdrien Mazarguil #include "mlx5.h" 400e83b8e5SNelio Laranjeiro #include "mlx5_glue.h" 41e60fbd5bSAdrien Mazarguil #include "mlx5_rxtx.h" 42771fa900SAdrien Mazarguil #include "mlx5_utils.h" 43771fa900SAdrien Mazarguil 443a49ffe3SShahaf Shuler /* Add defines in case the running kernel is not the same as user headers. */ 453a49ffe3SShahaf Shuler #ifndef ETHTOOL_GLINKSETTINGS 463a49ffe3SShahaf Shuler struct ethtool_link_settings { 473a49ffe3SShahaf Shuler uint32_t cmd; 483a49ffe3SShahaf Shuler uint32_t speed; 493a49ffe3SShahaf Shuler uint8_t duplex; 503a49ffe3SShahaf Shuler uint8_t port; 513a49ffe3SShahaf Shuler uint8_t phy_address; 523a49ffe3SShahaf Shuler uint8_t autoneg; 533a49ffe3SShahaf Shuler uint8_t mdio_support; 543a49ffe3SShahaf Shuler uint8_t eth_to_mdix; 553a49ffe3SShahaf Shuler uint8_t eth_tp_mdix_ctrl; 563a49ffe3SShahaf Shuler int8_t link_mode_masks_nwords; 573a49ffe3SShahaf Shuler uint32_t reserved[8]; 583a49ffe3SShahaf Shuler uint32_t link_mode_masks[]; 593a49ffe3SShahaf Shuler }; 603a49ffe3SShahaf Shuler 613a49ffe3SShahaf Shuler #define ETHTOOL_GLINKSETTINGS 0x0000004c 623a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_1000baseT_Full_BIT 5 633a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_Autoneg_BIT 6 643a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_1000baseKX_Full_BIT 17 653a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_10000baseKX4_Full_BIT 18 663a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_10000baseKR_Full_BIT 19 673a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_10000baseR_FEC_BIT 20 683a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_20000baseMLD2_Full_BIT 21 693a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_20000baseKR2_Full_BIT 22 703a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_40000baseKR4_Full_BIT 23 713a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_40000baseCR4_Full_BIT 24 723a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_40000baseSR4_Full_BIT 25 733a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_40000baseLR4_Full_BIT 26 743a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_56000baseKR4_Full_BIT 27 753a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_56000baseCR4_Full_BIT 28 763a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_56000baseSR4_Full_BIT 29 773a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_56000baseLR4_Full_BIT 30 783a49ffe3SShahaf Shuler #endif 793a49ffe3SShahaf Shuler #ifndef HAVE_ETHTOOL_LINK_MODE_25G 803a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_25000baseCR_Full_BIT 31 813a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_25000baseKR_Full_BIT 32 823a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_25000baseSR_Full_BIT 33 833a49ffe3SShahaf Shuler #endif 843a49ffe3SShahaf Shuler #ifndef HAVE_ETHTOOL_LINK_MODE_50G 853a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_50000baseCR2_Full_BIT 34 863a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_50000baseKR2_Full_BIT 35 873a49ffe3SShahaf Shuler #endif 883a49ffe3SShahaf Shuler #ifndef HAVE_ETHTOOL_LINK_MODE_100G 893a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_100000baseKR4_Full_BIT 36 903a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_100000baseSR4_Full_BIT 37 913a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_100000baseCR4_Full_BIT 38 923a49ffe3SShahaf Shuler #define ETHTOOL_LINK_MODE_100000baseLR4_ER4_Full_BIT 39 933a49ffe3SShahaf Shuler #endif 943a49ffe3SShahaf Shuler 95771fa900SAdrien Mazarguil /** 96771fa900SAdrien Mazarguil * Get interface name from private structure. 97771fa900SAdrien Mazarguil * 98771fa900SAdrien Mazarguil * @param[in] priv 99771fa900SAdrien Mazarguil * Pointer to private structure. 100771fa900SAdrien Mazarguil * @param[out] ifname 101771fa900SAdrien Mazarguil * Interface name output buffer. 102771fa900SAdrien Mazarguil * 103771fa900SAdrien Mazarguil * @return 104771fa900SAdrien Mazarguil * 0 on success, -1 on failure and errno is set. 105771fa900SAdrien Mazarguil */ 106771fa900SAdrien Mazarguil int 107771fa900SAdrien Mazarguil priv_get_ifname(const struct priv *priv, char (*ifname)[IF_NAMESIZE]) 108771fa900SAdrien Mazarguil { 109771fa900SAdrien Mazarguil DIR *dir; 110771fa900SAdrien Mazarguil struct dirent *dent; 111771fa900SAdrien Mazarguil unsigned int dev_type = 0; 112771fa900SAdrien Mazarguil unsigned int dev_port_prev = ~0u; 113771fa900SAdrien Mazarguil char match[IF_NAMESIZE] = ""; 114771fa900SAdrien Mazarguil 115771fa900SAdrien Mazarguil { 11687ec44ceSXueming Li MKSTR(path, "%s/device/net", priv->ibdev_path); 117771fa900SAdrien Mazarguil 118771fa900SAdrien Mazarguil dir = opendir(path); 119771fa900SAdrien Mazarguil if (dir == NULL) 120771fa900SAdrien Mazarguil return -1; 121771fa900SAdrien Mazarguil } 122771fa900SAdrien Mazarguil while ((dent = readdir(dir)) != NULL) { 123771fa900SAdrien Mazarguil char *name = dent->d_name; 124771fa900SAdrien Mazarguil FILE *file; 125771fa900SAdrien Mazarguil unsigned int dev_port; 126771fa900SAdrien Mazarguil int r; 127771fa900SAdrien Mazarguil 128771fa900SAdrien Mazarguil if ((name[0] == '.') && 129771fa900SAdrien Mazarguil ((name[1] == '\0') || 130771fa900SAdrien Mazarguil ((name[1] == '.') && (name[2] == '\0')))) 131771fa900SAdrien Mazarguil continue; 132771fa900SAdrien Mazarguil 133771fa900SAdrien Mazarguil MKSTR(path, "%s/device/net/%s/%s", 13487ec44ceSXueming Li priv->ibdev_path, name, 135771fa900SAdrien Mazarguil (dev_type ? "dev_id" : "dev_port")); 136771fa900SAdrien Mazarguil 137771fa900SAdrien Mazarguil file = fopen(path, "rb"); 138771fa900SAdrien Mazarguil if (file == NULL) { 139771fa900SAdrien Mazarguil if (errno != ENOENT) 140771fa900SAdrien Mazarguil continue; 141771fa900SAdrien Mazarguil /* 142771fa900SAdrien Mazarguil * Switch to dev_id when dev_port does not exist as 143771fa900SAdrien Mazarguil * is the case with Linux kernel versions < 3.15. 144771fa900SAdrien Mazarguil */ 145771fa900SAdrien Mazarguil try_dev_id: 146771fa900SAdrien Mazarguil match[0] = '\0'; 147771fa900SAdrien Mazarguil if (dev_type) 148771fa900SAdrien Mazarguil break; 149771fa900SAdrien Mazarguil dev_type = 1; 150771fa900SAdrien Mazarguil dev_port_prev = ~0u; 151771fa900SAdrien Mazarguil rewinddir(dir); 152771fa900SAdrien Mazarguil continue; 153771fa900SAdrien Mazarguil } 154771fa900SAdrien Mazarguil r = fscanf(file, (dev_type ? "%x" : "%u"), &dev_port); 155771fa900SAdrien Mazarguil fclose(file); 156771fa900SAdrien Mazarguil if (r != 1) 157771fa900SAdrien Mazarguil continue; 158771fa900SAdrien Mazarguil /* 159771fa900SAdrien Mazarguil * Switch to dev_id when dev_port returns the same value for 160771fa900SAdrien Mazarguil * all ports. May happen when using a MOFED release older than 161771fa900SAdrien Mazarguil * 3.0 with a Linux kernel >= 3.15. 162771fa900SAdrien Mazarguil */ 163771fa900SAdrien Mazarguil if (dev_port == dev_port_prev) 164771fa900SAdrien Mazarguil goto try_dev_id; 165771fa900SAdrien Mazarguil dev_port_prev = dev_port; 166771fa900SAdrien Mazarguil if (dev_port == (priv->port - 1u)) 167771fa900SAdrien Mazarguil snprintf(match, sizeof(match), "%s", name); 168771fa900SAdrien Mazarguil } 169771fa900SAdrien Mazarguil closedir(dir); 170771fa900SAdrien Mazarguil if (match[0] == '\0') 171771fa900SAdrien Mazarguil return -1; 172771fa900SAdrien Mazarguil strncpy(*ifname, match, sizeof(*ifname)); 173771fa900SAdrien Mazarguil return 0; 174771fa900SAdrien Mazarguil } 175771fa900SAdrien Mazarguil 176771fa900SAdrien Mazarguil /** 177771fa900SAdrien Mazarguil * Perform ifreq ioctl() on associated Ethernet device. 178771fa900SAdrien Mazarguil * 179771fa900SAdrien Mazarguil * @param[in] priv 180771fa900SAdrien Mazarguil * Pointer to private structure. 181771fa900SAdrien Mazarguil * @param req 182771fa900SAdrien Mazarguil * Request number to pass to ioctl(). 183771fa900SAdrien Mazarguil * @param[out] ifr 184771fa900SAdrien Mazarguil * Interface request structure output buffer. 185771fa900SAdrien Mazarguil * 186771fa900SAdrien Mazarguil * @return 187771fa900SAdrien Mazarguil * 0 on success, -1 on failure and errno is set. 188771fa900SAdrien Mazarguil */ 189771fa900SAdrien Mazarguil int 190771fa900SAdrien Mazarguil priv_ifreq(const struct priv *priv, int req, struct ifreq *ifr) 191771fa900SAdrien Mazarguil { 192771fa900SAdrien Mazarguil int sock = socket(PF_INET, SOCK_DGRAM, IPPROTO_IP); 193771fa900SAdrien Mazarguil int ret = -1; 194771fa900SAdrien Mazarguil 195771fa900SAdrien Mazarguil if (sock == -1) 196771fa900SAdrien Mazarguil return ret; 197771fa900SAdrien Mazarguil if (priv_get_ifname(priv, &ifr->ifr_name) == 0) 198771fa900SAdrien Mazarguil ret = ioctl(sock, req, ifr); 199771fa900SAdrien Mazarguil close(sock); 200771fa900SAdrien Mazarguil return ret; 201771fa900SAdrien Mazarguil } 202771fa900SAdrien Mazarguil 203771fa900SAdrien Mazarguil /** 20485e347dbSNélio Laranjeiro * Return the number of active VFs for the current device. 20585e347dbSNélio Laranjeiro * 20685e347dbSNélio Laranjeiro * @param[in] priv 20785e347dbSNélio Laranjeiro * Pointer to private structure. 20885e347dbSNélio Laranjeiro * @param[out] num_vfs 20985e347dbSNélio Laranjeiro * Number of active VFs. 21085e347dbSNélio Laranjeiro * 21185e347dbSNélio Laranjeiro * @return 21285e347dbSNélio Laranjeiro * 0 on success, -1 on failure and errno is set. 21385e347dbSNélio Laranjeiro */ 21485e347dbSNélio Laranjeiro int 21585e347dbSNélio Laranjeiro priv_get_num_vfs(struct priv *priv, uint16_t *num_vfs) 21685e347dbSNélio Laranjeiro { 21785e347dbSNélio Laranjeiro /* The sysfs entry name depends on the operating system. */ 21885e347dbSNélio Laranjeiro const char **name = (const char *[]){ 219*fc40db99SAdrien Mazarguil "sriov_numvfs", 220*fc40db99SAdrien Mazarguil "mlx5_num_vfs", 22185e347dbSNélio Laranjeiro NULL, 22285e347dbSNélio Laranjeiro }; 22385e347dbSNélio Laranjeiro 22485e347dbSNélio Laranjeiro do { 225*fc40db99SAdrien Mazarguil int n; 226*fc40db99SAdrien Mazarguil FILE *file; 227*fc40db99SAdrien Mazarguil MKSTR(path, "%s/device/%s", priv->ibdev_path, *name); 22885e347dbSNélio Laranjeiro 229*fc40db99SAdrien Mazarguil file = fopen(path, "rb"); 230*fc40db99SAdrien Mazarguil if (!file) 231*fc40db99SAdrien Mazarguil continue; 232*fc40db99SAdrien Mazarguil n = fscanf(file, "%" SCNu16, num_vfs); 233*fc40db99SAdrien Mazarguil fclose(file); 234*fc40db99SAdrien Mazarguil if (n == 1) 235*fc40db99SAdrien Mazarguil return 0; 236*fc40db99SAdrien Mazarguil } while (*(++name)); 237*fc40db99SAdrien Mazarguil return -1; 23885e347dbSNélio Laranjeiro } 23985e347dbSNélio Laranjeiro 24085e347dbSNélio Laranjeiro /** 241771fa900SAdrien Mazarguil * Get device MTU. 242771fa900SAdrien Mazarguil * 243771fa900SAdrien Mazarguil * @param priv 244771fa900SAdrien Mazarguil * Pointer to private structure. 245771fa900SAdrien Mazarguil * @param[out] mtu 246771fa900SAdrien Mazarguil * MTU value output buffer. 247771fa900SAdrien Mazarguil * 248771fa900SAdrien Mazarguil * @return 249771fa900SAdrien Mazarguil * 0 on success, -1 on failure and errno is set. 250771fa900SAdrien Mazarguil */ 251771fa900SAdrien Mazarguil int 252771fa900SAdrien Mazarguil priv_get_mtu(struct priv *priv, uint16_t *mtu) 253771fa900SAdrien Mazarguil { 254*fc40db99SAdrien Mazarguil struct ifreq request; 255*fc40db99SAdrien Mazarguil int ret = priv_ifreq(priv, SIOCGIFMTU, &request); 256771fa900SAdrien Mazarguil 257*fc40db99SAdrien Mazarguil if (ret) 258*fc40db99SAdrien Mazarguil return ret; 259*fc40db99SAdrien Mazarguil *mtu = request.ifr_mtu; 260859081d3SShahaf Shuler return 0; 261859081d3SShahaf Shuler } 262859081d3SShahaf Shuler 263859081d3SShahaf Shuler /** 264cf37ca95SAdrien Mazarguil * Set device MTU. 265cf37ca95SAdrien Mazarguil * 266cf37ca95SAdrien Mazarguil * @param priv 267cf37ca95SAdrien Mazarguil * Pointer to private structure. 268cf37ca95SAdrien Mazarguil * @param mtu 269cf37ca95SAdrien Mazarguil * MTU value to set. 270cf37ca95SAdrien Mazarguil * 271cf37ca95SAdrien Mazarguil * @return 272cf37ca95SAdrien Mazarguil * 0 on success, -1 on failure and errno is set. 273cf37ca95SAdrien Mazarguil */ 274cf37ca95SAdrien Mazarguil static int 275cf37ca95SAdrien Mazarguil priv_set_mtu(struct priv *priv, uint16_t mtu) 276cf37ca95SAdrien Mazarguil { 277*fc40db99SAdrien Mazarguil struct ifreq request = { .ifr_mtu = mtu, }; 278f3b492d7SAdrien Mazarguil 279*fc40db99SAdrien Mazarguil return priv_ifreq(priv, SIOCSIFMTU, &request); 280cf37ca95SAdrien Mazarguil } 281cf37ca95SAdrien Mazarguil 282cf37ca95SAdrien Mazarguil /** 283771fa900SAdrien Mazarguil * Set device flags. 284771fa900SAdrien Mazarguil * 285771fa900SAdrien Mazarguil * @param priv 286771fa900SAdrien Mazarguil * Pointer to private structure. 287771fa900SAdrien Mazarguil * @param keep 288771fa900SAdrien Mazarguil * Bitmask for flags that must remain untouched. 289771fa900SAdrien Mazarguil * @param flags 290771fa900SAdrien Mazarguil * Bitmask for flags to modify. 291771fa900SAdrien Mazarguil * 292771fa900SAdrien Mazarguil * @return 293771fa900SAdrien Mazarguil * 0 on success, -1 on failure and errno is set. 294771fa900SAdrien Mazarguil */ 295771fa900SAdrien Mazarguil int 296771fa900SAdrien Mazarguil priv_set_flags(struct priv *priv, unsigned int keep, unsigned int flags) 297771fa900SAdrien Mazarguil { 298*fc40db99SAdrien Mazarguil struct ifreq request; 299*fc40db99SAdrien Mazarguil int ret = priv_ifreq(priv, SIOCGIFFLAGS, &request); 300771fa900SAdrien Mazarguil 301*fc40db99SAdrien Mazarguil if (ret) 302*fc40db99SAdrien Mazarguil return ret; 303*fc40db99SAdrien Mazarguil request.ifr_flags &= keep; 304*fc40db99SAdrien Mazarguil request.ifr_flags |= flags & ~keep; 305*fc40db99SAdrien Mazarguil return priv_ifreq(priv, SIOCSIFFLAGS, &request); 306771fa900SAdrien Mazarguil } 307771fa900SAdrien Mazarguil 308771fa900SAdrien Mazarguil /** 309e60fbd5bSAdrien Mazarguil * Ethernet device configuration. 310e60fbd5bSAdrien Mazarguil * 311e60fbd5bSAdrien Mazarguil * Prepare the driver for a given number of TX and RX queues. 312e60fbd5bSAdrien Mazarguil * 313e60fbd5bSAdrien Mazarguil * @param dev 314e60fbd5bSAdrien Mazarguil * Pointer to Ethernet device structure. 315e60fbd5bSAdrien Mazarguil * 316e60fbd5bSAdrien Mazarguil * @return 317e60fbd5bSAdrien Mazarguil * 0 on success, errno value on failure. 318e60fbd5bSAdrien Mazarguil */ 319e60fbd5bSAdrien Mazarguil static int 320e60fbd5bSAdrien Mazarguil dev_configure(struct rte_eth_dev *dev) 321e60fbd5bSAdrien Mazarguil { 322e60fbd5bSAdrien Mazarguil struct priv *priv = dev->data->dev_private; 323e60fbd5bSAdrien Mazarguil unsigned int rxqs_n = dev->data->nb_rx_queues; 324e60fbd5bSAdrien Mazarguil unsigned int txqs_n = dev->data->nb_tx_queues; 325634efbc2SNelio Laranjeiro unsigned int i; 326634efbc2SNelio Laranjeiro unsigned int j; 327634efbc2SNelio Laranjeiro unsigned int reta_idx_n; 32829c1d8bbSNélio Laranjeiro const uint8_t use_app_rss_key = 32921e3a974SShahaf Shuler !!dev->data->dev_conf.rx_adv_conf.rss_conf.rss_key; 330dbccb4cdSShahaf Shuler uint64_t supp_tx_offloads = mlx5_priv_get_tx_port_offloads(priv); 331dbccb4cdSShahaf Shuler uint64_t tx_offloads = dev->data->dev_conf.txmode.offloads; 33217b843ebSShahaf Shuler uint64_t supp_rx_offloads = 33317b843ebSShahaf Shuler (mlx5_priv_get_rx_port_offloads(priv) | 33417b843ebSShahaf Shuler mlx5_priv_get_rx_queue_offloads(priv)); 33517b843ebSShahaf Shuler uint64_t rx_offloads = dev->data->dev_conf.rxmode.offloads; 336e60fbd5bSAdrien Mazarguil 337dbccb4cdSShahaf Shuler if ((tx_offloads & supp_tx_offloads) != tx_offloads) { 338dbccb4cdSShahaf Shuler ERROR("Some Tx offloads are not supported " 339dbccb4cdSShahaf Shuler "requested 0x%" PRIx64 " supported 0x%" PRIx64, 340dbccb4cdSShahaf Shuler tx_offloads, supp_tx_offloads); 341dbccb4cdSShahaf Shuler return ENOTSUP; 342dbccb4cdSShahaf Shuler } 34317b843ebSShahaf Shuler if ((rx_offloads & supp_rx_offloads) != rx_offloads) { 34417b843ebSShahaf Shuler ERROR("Some Rx offloads are not supported " 34517b843ebSShahaf Shuler "requested 0x%" PRIx64 " supported 0x%" PRIx64, 34617b843ebSShahaf Shuler rx_offloads, supp_rx_offloads); 34717b843ebSShahaf Shuler return ENOTSUP; 34817b843ebSShahaf Shuler } 34929c1d8bbSNélio Laranjeiro if (use_app_rss_key && 35029c1d8bbSNélio Laranjeiro (dev->data->dev_conf.rx_adv_conf.rss_conf.rss_key_len != 35129c1d8bbSNélio Laranjeiro rss_hash_default_key_len)) { 35229c1d8bbSNélio Laranjeiro /* MLX5 RSS only support 40bytes key. */ 35329c1d8bbSNélio Laranjeiro return EINVAL; 35429c1d8bbSNélio Laranjeiro } 35529c1d8bbSNélio Laranjeiro priv->rss_conf.rss_key = 35629c1d8bbSNélio Laranjeiro rte_realloc(priv->rss_conf.rss_key, 35729c1d8bbSNélio Laranjeiro rss_hash_default_key_len, 0); 35829c1d8bbSNélio Laranjeiro if (!priv->rss_conf.rss_key) { 35929c1d8bbSNélio Laranjeiro ERROR("cannot allocate RSS hash key memory (%u)", rxqs_n); 36029c1d8bbSNélio Laranjeiro return ENOMEM; 36129c1d8bbSNélio Laranjeiro } 36229c1d8bbSNélio Laranjeiro memcpy(priv->rss_conf.rss_key, 36329c1d8bbSNélio Laranjeiro use_app_rss_key ? 36429c1d8bbSNélio Laranjeiro dev->data->dev_conf.rx_adv_conf.rss_conf.rss_key : 36529c1d8bbSNélio Laranjeiro rss_hash_default_key, 36629c1d8bbSNélio Laranjeiro rss_hash_default_key_len); 36729c1d8bbSNélio Laranjeiro priv->rss_conf.rss_key_len = rss_hash_default_key_len; 36829c1d8bbSNélio Laranjeiro priv->rss_conf.rss_hf = dev->data->dev_conf.rx_adv_conf.rss_conf.rss_hf; 369e60fbd5bSAdrien Mazarguil priv->rxqs = (void *)dev->data->rx_queues; 370e60fbd5bSAdrien Mazarguil priv->txqs = (void *)dev->data->tx_queues; 371e60fbd5bSAdrien Mazarguil if (txqs_n != priv->txqs_n) { 372e60fbd5bSAdrien Mazarguil INFO("%p: TX queues number update: %u -> %u", 373e60fbd5bSAdrien Mazarguil (void *)dev, priv->txqs_n, txqs_n); 374e60fbd5bSAdrien Mazarguil priv->txqs_n = txqs_n; 375e60fbd5bSAdrien Mazarguil } 3767fe24446SShahaf Shuler if (rxqs_n > priv->config.ind_table_max_size) { 377634efbc2SNelio Laranjeiro ERROR("cannot handle this many RX queues (%u)", rxqs_n); 378634efbc2SNelio Laranjeiro return EINVAL; 379634efbc2SNelio Laranjeiro } 380e60fbd5bSAdrien Mazarguil if (rxqs_n == priv->rxqs_n) 381e60fbd5bSAdrien Mazarguil return 0; 382e60fbd5bSAdrien Mazarguil INFO("%p: RX queues number update: %u -> %u", 383e60fbd5bSAdrien Mazarguil (void *)dev, priv->rxqs_n, rxqs_n); 384e60fbd5bSAdrien Mazarguil priv->rxqs_n = rxqs_n; 385634efbc2SNelio Laranjeiro /* If the requested number of RX queues is not a power of two, use the 386634efbc2SNelio Laranjeiro * maximum indirection table size for better balancing. 387634efbc2SNelio Laranjeiro * The result is always rounded to the next power of two. */ 388634efbc2SNelio Laranjeiro reta_idx_n = (1 << log2above((rxqs_n & (rxqs_n - 1)) ? 3897fe24446SShahaf Shuler priv->config.ind_table_max_size : 390634efbc2SNelio Laranjeiro rxqs_n)); 391634efbc2SNelio Laranjeiro if (priv_rss_reta_index_resize(priv, reta_idx_n)) 392634efbc2SNelio Laranjeiro return ENOMEM; 393634efbc2SNelio Laranjeiro /* When the number of RX queues is not a power of two, the remaining 394634efbc2SNelio Laranjeiro * table entries are padded with reused WQs and hashes are not spread 395634efbc2SNelio Laranjeiro * uniformly. */ 396634efbc2SNelio Laranjeiro for (i = 0, j = 0; (i != reta_idx_n); ++i) { 397634efbc2SNelio Laranjeiro (*priv->reta_idx)[i] = j; 398634efbc2SNelio Laranjeiro if (++j == rxqs_n) 399634efbc2SNelio Laranjeiro j = 0; 400634efbc2SNelio Laranjeiro } 401e60fbd5bSAdrien Mazarguil return 0; 402e60fbd5bSAdrien Mazarguil } 403e60fbd5bSAdrien Mazarguil 404e60fbd5bSAdrien Mazarguil /** 405e60fbd5bSAdrien Mazarguil * DPDK callback for Ethernet device configuration. 406e60fbd5bSAdrien Mazarguil * 407e60fbd5bSAdrien Mazarguil * @param dev 408e60fbd5bSAdrien Mazarguil * Pointer to Ethernet device structure. 409e60fbd5bSAdrien Mazarguil * 410e60fbd5bSAdrien Mazarguil * @return 411e60fbd5bSAdrien Mazarguil * 0 on success, negative errno value on failure. 412e60fbd5bSAdrien Mazarguil */ 413e60fbd5bSAdrien Mazarguil int 414e60fbd5bSAdrien Mazarguil mlx5_dev_configure(struct rte_eth_dev *dev) 415e60fbd5bSAdrien Mazarguil { 416e60fbd5bSAdrien Mazarguil struct priv *priv = dev->data->dev_private; 417e60fbd5bSAdrien Mazarguil int ret; 418e60fbd5bSAdrien Mazarguil 419e60fbd5bSAdrien Mazarguil priv_lock(priv); 420e60fbd5bSAdrien Mazarguil ret = dev_configure(dev); 421e60fbd5bSAdrien Mazarguil assert(ret >= 0); 422e60fbd5bSAdrien Mazarguil priv_unlock(priv); 423e60fbd5bSAdrien Mazarguil return -ret; 424e60fbd5bSAdrien Mazarguil } 425e60fbd5bSAdrien Mazarguil 426e60fbd5bSAdrien Mazarguil /** 427e60fbd5bSAdrien Mazarguil * DPDK callback to get information about the device. 428e60fbd5bSAdrien Mazarguil * 429e60fbd5bSAdrien Mazarguil * @param dev 430e60fbd5bSAdrien Mazarguil * Pointer to Ethernet device structure. 431e60fbd5bSAdrien Mazarguil * @param[out] info 432e60fbd5bSAdrien Mazarguil * Info structure output buffer. 433e60fbd5bSAdrien Mazarguil */ 434e60fbd5bSAdrien Mazarguil void 435e60fbd5bSAdrien Mazarguil mlx5_dev_infos_get(struct rte_eth_dev *dev, struct rte_eth_dev_info *info) 436e60fbd5bSAdrien Mazarguil { 43701d79216SNélio Laranjeiro struct priv *priv = dev->data->dev_private; 4387fe24446SShahaf Shuler struct mlx5_dev_config *config = &priv->config; 439e60fbd5bSAdrien Mazarguil unsigned int max; 440e60fbd5bSAdrien Mazarguil char ifname[IF_NAMESIZE]; 441e60fbd5bSAdrien Mazarguil 442c0802544SFerruh Yigit info->pci_dev = RTE_ETH_DEV_TO_PCI(dev); 443ae34410aSJan Blunck 444e60fbd5bSAdrien Mazarguil priv_lock(priv); 445e60fbd5bSAdrien Mazarguil /* FIXME: we should ask the device for these values. */ 446e60fbd5bSAdrien Mazarguil info->min_rx_bufsize = 32; 447e60fbd5bSAdrien Mazarguil info->max_rx_pktlen = 65536; 448e60fbd5bSAdrien Mazarguil /* 449e60fbd5bSAdrien Mazarguil * Since we need one CQ per QP, the limit is the minimum number 450e60fbd5bSAdrien Mazarguil * between the two values. 451e60fbd5bSAdrien Mazarguil */ 45243e9d979SShachar Beiser max = RTE_MIN(priv->device_attr.orig_attr.max_cq, 45343e9d979SShachar Beiser priv->device_attr.orig_attr.max_qp); 454e60fbd5bSAdrien Mazarguil /* If max >= 65535 then max = 0, max_rx_queues is uint16_t. */ 455e60fbd5bSAdrien Mazarguil if (max >= 65535) 456e60fbd5bSAdrien Mazarguil max = 65535; 457e60fbd5bSAdrien Mazarguil info->max_rx_queues = max; 458e60fbd5bSAdrien Mazarguil info->max_tx_queues = max; 4590497ddaaSYaacov Hazan info->max_mac_addrs = RTE_DIM(priv->mac); 46017b843ebSShahaf Shuler info->rx_queue_offload_capa = 46117b843ebSShahaf Shuler mlx5_priv_get_rx_queue_offloads(priv); 46217b843ebSShahaf Shuler info->rx_offload_capa = (mlx5_priv_get_rx_port_offloads(priv) | 46317b843ebSShahaf Shuler info->rx_queue_offload_capa); 464dbccb4cdSShahaf Shuler info->tx_offload_capa = mlx5_priv_get_tx_port_offloads(priv); 465e60fbd5bSAdrien Mazarguil if (priv_get_ifname(priv, &ifname) == 0) 466e60fbd5bSAdrien Mazarguil info->if_index = if_nametoindex(ifname); 467d365210eSYongseok Koh info->reta_size = priv->reta_idx_n ? 4687fe24446SShahaf Shuler priv->reta_idx_n : config->ind_table_max_size; 46929c1d8bbSNélio Laranjeiro info->hash_key_size = priv->rss_conf.rss_key_len; 47075ef62a9SNélio Laranjeiro info->speed_capa = priv->link_speed_capa; 471b233b027SShahaf Shuler info->flow_type_rss_offloads = ~MLX5_RSS_HF_MASK; 472e60fbd5bSAdrien Mazarguil priv_unlock(priv); 473e60fbd5bSAdrien Mazarguil } 474e60fbd5bSAdrien Mazarguil 47578a38edfSJianfeng Tan const uint32_t * 47678a38edfSJianfeng Tan mlx5_dev_supported_ptypes_get(struct rte_eth_dev *dev) 47778a38edfSJianfeng Tan { 47878a38edfSJianfeng Tan static const uint32_t ptypes[] = { 47978a38edfSJianfeng Tan /* refers to rxq_cq_to_pkt_type() */ 480ea16068cSYongseok Koh RTE_PTYPE_L2_ETHER, 481c4ba5434SNélio Laranjeiro RTE_PTYPE_L3_IPV4_EXT_UNKNOWN, 482c4ba5434SNélio Laranjeiro RTE_PTYPE_L3_IPV6_EXT_UNKNOWN, 483ea16068cSYongseok Koh RTE_PTYPE_L4_NONFRAG, 484ea16068cSYongseok Koh RTE_PTYPE_L4_FRAG, 485ea16068cSYongseok Koh RTE_PTYPE_L4_TCP, 486ea16068cSYongseok Koh RTE_PTYPE_L4_UDP, 487c4ba5434SNélio Laranjeiro RTE_PTYPE_INNER_L3_IPV4_EXT_UNKNOWN, 488c4ba5434SNélio Laranjeiro RTE_PTYPE_INNER_L3_IPV6_EXT_UNKNOWN, 489ea16068cSYongseok Koh RTE_PTYPE_INNER_L4_NONFRAG, 490ea16068cSYongseok Koh RTE_PTYPE_INNER_L4_FRAG, 491ea16068cSYongseok Koh RTE_PTYPE_INNER_L4_TCP, 492ea16068cSYongseok Koh RTE_PTYPE_INNER_L4_UDP, 49378a38edfSJianfeng Tan RTE_PTYPE_UNKNOWN 49478a38edfSJianfeng Tan }; 49578a38edfSJianfeng Tan 4966cb559d6SYongseok Koh if (dev->rx_pkt_burst == mlx5_rx_burst || 4976cb559d6SYongseok Koh dev->rx_pkt_burst == mlx5_rx_burst_vec) 49878a38edfSJianfeng Tan return ptypes; 49978a38edfSJianfeng Tan return NULL; 50078a38edfSJianfeng Tan } 50178a38edfSJianfeng Tan 502e60fbd5bSAdrien Mazarguil /** 5032c960a51SMatthieu Ternisien d'Ouville * DPDK callback to retrieve physical link information. 504cb8faed7SAdrien Mazarguil * 505cb8faed7SAdrien Mazarguil * @param dev 506cb8faed7SAdrien Mazarguil * Pointer to Ethernet device structure. 507cb8faed7SAdrien Mazarguil * @param wait_to_complete 508cb8faed7SAdrien Mazarguil * Wait for request completion (ignored). 509cb8faed7SAdrien Mazarguil */ 51018840871SNélio Laranjeiro static int 51118840871SNélio Laranjeiro mlx5_link_update_unlocked_gset(struct rte_eth_dev *dev, int wait_to_complete) 512cb8faed7SAdrien Mazarguil { 51301d79216SNélio Laranjeiro struct priv *priv = dev->data->dev_private; 514cb8faed7SAdrien Mazarguil struct ethtool_cmd edata = { 51575ef62a9SNélio Laranjeiro .cmd = ETHTOOL_GSET /* Deprecated since Linux v4.5. */ 516cb8faed7SAdrien Mazarguil }; 517cb8faed7SAdrien Mazarguil struct ifreq ifr; 518cb8faed7SAdrien Mazarguil struct rte_eth_link dev_link; 519cb8faed7SAdrien Mazarguil int link_speed = 0; 520cb8faed7SAdrien Mazarguil 5212c960a51SMatthieu Ternisien d'Ouville /* priv_lock() is not taken to allow concurrent calls. */ 5222c960a51SMatthieu Ternisien d'Ouville 523cb8faed7SAdrien Mazarguil (void)wait_to_complete; 524cb8faed7SAdrien Mazarguil if (priv_ifreq(priv, SIOCGIFFLAGS, &ifr)) { 525cb8faed7SAdrien Mazarguil WARN("ioctl(SIOCGIFFLAGS) failed: %s", strerror(errno)); 526cb8faed7SAdrien Mazarguil return -1; 527cb8faed7SAdrien Mazarguil } 528cb8faed7SAdrien Mazarguil memset(&dev_link, 0, sizeof(dev_link)); 529cb8faed7SAdrien Mazarguil dev_link.link_status = ((ifr.ifr_flags & IFF_UP) && 530cb8faed7SAdrien Mazarguil (ifr.ifr_flags & IFF_RUNNING)); 531d06c608cSAdrien Mazarguil ifr.ifr_data = (void *)&edata; 532cb8faed7SAdrien Mazarguil if (priv_ifreq(priv, SIOCETHTOOL, &ifr)) { 533cb8faed7SAdrien Mazarguil WARN("ioctl(SIOCETHTOOL, ETHTOOL_GSET) failed: %s", 534cb8faed7SAdrien Mazarguil strerror(errno)); 535cb8faed7SAdrien Mazarguil return -1; 536cb8faed7SAdrien Mazarguil } 537cb8faed7SAdrien Mazarguil link_speed = ethtool_cmd_speed(&edata); 538cb8faed7SAdrien Mazarguil if (link_speed == -1) 539cb8faed7SAdrien Mazarguil dev_link.link_speed = 0; 540cb8faed7SAdrien Mazarguil else 541cb8faed7SAdrien Mazarguil dev_link.link_speed = link_speed; 54275ef62a9SNélio Laranjeiro priv->link_speed_capa = 0; 54375ef62a9SNélio Laranjeiro if (edata.supported & SUPPORTED_Autoneg) 54475ef62a9SNélio Laranjeiro priv->link_speed_capa |= ETH_LINK_SPEED_AUTONEG; 54575ef62a9SNélio Laranjeiro if (edata.supported & (SUPPORTED_1000baseT_Full | 54675ef62a9SNélio Laranjeiro SUPPORTED_1000baseKX_Full)) 54775ef62a9SNélio Laranjeiro priv->link_speed_capa |= ETH_LINK_SPEED_1G; 54875ef62a9SNélio Laranjeiro if (edata.supported & SUPPORTED_10000baseKR_Full) 54975ef62a9SNélio Laranjeiro priv->link_speed_capa |= ETH_LINK_SPEED_10G; 55075ef62a9SNélio Laranjeiro if (edata.supported & (SUPPORTED_40000baseKR4_Full | 55175ef62a9SNélio Laranjeiro SUPPORTED_40000baseCR4_Full | 55275ef62a9SNélio Laranjeiro SUPPORTED_40000baseSR4_Full | 55375ef62a9SNélio Laranjeiro SUPPORTED_40000baseLR4_Full)) 55475ef62a9SNélio Laranjeiro priv->link_speed_capa |= ETH_LINK_SPEED_40G; 555cb8faed7SAdrien Mazarguil dev_link.link_duplex = ((edata.duplex == DUPLEX_HALF) ? 556cb8faed7SAdrien Mazarguil ETH_LINK_HALF_DUPLEX : ETH_LINK_FULL_DUPLEX); 55782113036SMarc Sune dev_link.link_autoneg = !(dev->data->dev_conf.link_speeds & 55882113036SMarc Sune ETH_LINK_SPEED_FIXED); 559cb8faed7SAdrien Mazarguil if (memcmp(&dev_link, &dev->data->dev_link, sizeof(dev_link))) { 560cb8faed7SAdrien Mazarguil /* Link status changed. */ 561cb8faed7SAdrien Mazarguil dev->data->dev_link = dev_link; 562cb8faed7SAdrien Mazarguil return 0; 563cb8faed7SAdrien Mazarguil } 564cb8faed7SAdrien Mazarguil /* Link status is still the same. */ 565cb8faed7SAdrien Mazarguil return -1; 566cb8faed7SAdrien Mazarguil } 567cb8faed7SAdrien Mazarguil 568cb8faed7SAdrien Mazarguil /** 5693a49ffe3SShahaf Shuler * Retrieve physical link information (unlocked version using new ioctl). 57018840871SNélio Laranjeiro * 57118840871SNélio Laranjeiro * @param dev 57218840871SNélio Laranjeiro * Pointer to Ethernet device structure. 57318840871SNélio Laranjeiro * @param wait_to_complete 57418840871SNélio Laranjeiro * Wait for request completion (ignored). 57518840871SNélio Laranjeiro */ 57618840871SNélio Laranjeiro static int 57718840871SNélio Laranjeiro mlx5_link_update_unlocked_gs(struct rte_eth_dev *dev, int wait_to_complete) 57818840871SNélio Laranjeiro { 57901d79216SNélio Laranjeiro struct priv *priv = dev->data->dev_private; 58037a4406cSNélio Laranjeiro struct ethtool_link_settings gcmd = { .cmd = ETHTOOL_GLINKSETTINGS }; 58118840871SNélio Laranjeiro struct ifreq ifr; 58218840871SNélio Laranjeiro struct rte_eth_link dev_link; 58318840871SNélio Laranjeiro uint64_t sc; 58418840871SNélio Laranjeiro 58518840871SNélio Laranjeiro (void)wait_to_complete; 58618840871SNélio Laranjeiro if (priv_ifreq(priv, SIOCGIFFLAGS, &ifr)) { 58718840871SNélio Laranjeiro WARN("ioctl(SIOCGIFFLAGS) failed: %s", strerror(errno)); 58818840871SNélio Laranjeiro return -1; 58918840871SNélio Laranjeiro } 59018840871SNélio Laranjeiro memset(&dev_link, 0, sizeof(dev_link)); 59118840871SNélio Laranjeiro dev_link.link_status = ((ifr.ifr_flags & IFF_UP) && 59218840871SNélio Laranjeiro (ifr.ifr_flags & IFF_RUNNING)); 59337a4406cSNélio Laranjeiro ifr.ifr_data = (void *)&gcmd; 59418840871SNélio Laranjeiro if (priv_ifreq(priv, SIOCETHTOOL, &ifr)) { 59518840871SNélio Laranjeiro DEBUG("ioctl(SIOCETHTOOL, ETHTOOL_GLINKSETTINGS) failed: %s", 59618840871SNélio Laranjeiro strerror(errno)); 59718840871SNélio Laranjeiro return -1; 59818840871SNélio Laranjeiro } 59937a4406cSNélio Laranjeiro gcmd.link_mode_masks_nwords = -gcmd.link_mode_masks_nwords; 60037a4406cSNélio Laranjeiro 60137a4406cSNélio Laranjeiro alignas(struct ethtool_link_settings) 60237a4406cSNélio Laranjeiro uint8_t data[offsetof(struct ethtool_link_settings, link_mode_masks) + 60337a4406cSNélio Laranjeiro sizeof(uint32_t) * gcmd.link_mode_masks_nwords * 3]; 60437a4406cSNélio Laranjeiro struct ethtool_link_settings *ecmd = (void *)data; 60537a4406cSNélio Laranjeiro 60637a4406cSNélio Laranjeiro *ecmd = gcmd; 60737a4406cSNélio Laranjeiro ifr.ifr_data = (void *)ecmd; 608ef09a7fcSGowrishankar Muthukrishnan if (priv_ifreq(priv, SIOCETHTOOL, &ifr)) { 609ef09a7fcSGowrishankar Muthukrishnan DEBUG("ioctl(SIOCETHTOOL, ETHTOOL_GLINKSETTINGS) failed: %s", 610ef09a7fcSGowrishankar Muthukrishnan strerror(errno)); 611ef09a7fcSGowrishankar Muthukrishnan return -1; 612ef09a7fcSGowrishankar Muthukrishnan } 61390260d57SNélio Laranjeiro dev_link.link_speed = ecmd->speed; 61490260d57SNélio Laranjeiro sc = ecmd->link_mode_masks[0] | 61590260d57SNélio Laranjeiro ((uint64_t)ecmd->link_mode_masks[1] << 32); 61618840871SNélio Laranjeiro priv->link_speed_capa = 0; 617b113cb5eSEdward Makarov if (sc & MLX5_BITSHIFT(ETHTOOL_LINK_MODE_Autoneg_BIT)) 61818840871SNélio Laranjeiro priv->link_speed_capa |= ETH_LINK_SPEED_AUTONEG; 619b113cb5eSEdward Makarov if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_1000baseT_Full_BIT) | 620b113cb5eSEdward Makarov MLX5_BITSHIFT(ETHTOOL_LINK_MODE_1000baseKX_Full_BIT))) 62118840871SNélio Laranjeiro priv->link_speed_capa |= ETH_LINK_SPEED_1G; 622b113cb5eSEdward Makarov if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_10000baseKX4_Full_BIT) | 623b113cb5eSEdward Makarov MLX5_BITSHIFT(ETHTOOL_LINK_MODE_10000baseKR_Full_BIT) | 624b113cb5eSEdward Makarov MLX5_BITSHIFT(ETHTOOL_LINK_MODE_10000baseR_FEC_BIT))) 62518840871SNélio Laranjeiro priv->link_speed_capa |= ETH_LINK_SPEED_10G; 626b113cb5eSEdward Makarov if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_20000baseMLD2_Full_BIT) | 627b113cb5eSEdward Makarov MLX5_BITSHIFT(ETHTOOL_LINK_MODE_20000baseKR2_Full_BIT))) 62818840871SNélio Laranjeiro priv->link_speed_capa |= ETH_LINK_SPEED_20G; 629b113cb5eSEdward Makarov if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_40000baseKR4_Full_BIT) | 630b113cb5eSEdward Makarov MLX5_BITSHIFT(ETHTOOL_LINK_MODE_40000baseCR4_Full_BIT) | 631b113cb5eSEdward Makarov MLX5_BITSHIFT(ETHTOOL_LINK_MODE_40000baseSR4_Full_BIT) | 632b113cb5eSEdward Makarov MLX5_BITSHIFT(ETHTOOL_LINK_MODE_40000baseLR4_Full_BIT))) 63318840871SNélio Laranjeiro priv->link_speed_capa |= ETH_LINK_SPEED_40G; 634b113cb5eSEdward Makarov if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_56000baseKR4_Full_BIT) | 635b113cb5eSEdward Makarov MLX5_BITSHIFT(ETHTOOL_LINK_MODE_56000baseCR4_Full_BIT) | 636b113cb5eSEdward Makarov MLX5_BITSHIFT(ETHTOOL_LINK_MODE_56000baseSR4_Full_BIT) | 637b113cb5eSEdward Makarov MLX5_BITSHIFT(ETHTOOL_LINK_MODE_56000baseLR4_Full_BIT))) 63818840871SNélio Laranjeiro priv->link_speed_capa |= ETH_LINK_SPEED_56G; 639b113cb5eSEdward Makarov if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_25000baseCR_Full_BIT) | 640b113cb5eSEdward Makarov MLX5_BITSHIFT(ETHTOOL_LINK_MODE_25000baseKR_Full_BIT) | 641b113cb5eSEdward Makarov MLX5_BITSHIFT(ETHTOOL_LINK_MODE_25000baseSR_Full_BIT))) 64218840871SNélio Laranjeiro priv->link_speed_capa |= ETH_LINK_SPEED_25G; 643b113cb5eSEdward Makarov if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_50000baseCR2_Full_BIT) | 644b113cb5eSEdward Makarov MLX5_BITSHIFT(ETHTOOL_LINK_MODE_50000baseKR2_Full_BIT))) 64518840871SNélio Laranjeiro priv->link_speed_capa |= ETH_LINK_SPEED_50G; 646b113cb5eSEdward Makarov if (sc & (MLX5_BITSHIFT(ETHTOOL_LINK_MODE_100000baseKR4_Full_BIT) | 647b113cb5eSEdward Makarov MLX5_BITSHIFT(ETHTOOL_LINK_MODE_100000baseSR4_Full_BIT) | 648b113cb5eSEdward Makarov MLX5_BITSHIFT(ETHTOOL_LINK_MODE_100000baseCR4_Full_BIT) | 649b113cb5eSEdward Makarov MLX5_BITSHIFT(ETHTOOL_LINK_MODE_100000baseLR4_ER4_Full_BIT))) 65018840871SNélio Laranjeiro priv->link_speed_capa |= ETH_LINK_SPEED_100G; 65190260d57SNélio Laranjeiro dev_link.link_duplex = ((ecmd->duplex == DUPLEX_HALF) ? 65218840871SNélio Laranjeiro ETH_LINK_HALF_DUPLEX : ETH_LINK_FULL_DUPLEX); 65318840871SNélio Laranjeiro dev_link.link_autoneg = !(dev->data->dev_conf.link_speeds & 65418840871SNélio Laranjeiro ETH_LINK_SPEED_FIXED); 65518840871SNélio Laranjeiro if (memcmp(&dev_link, &dev->data->dev_link, sizeof(dev_link))) { 65618840871SNélio Laranjeiro /* Link status changed. */ 65718840871SNélio Laranjeiro dev->data->dev_link = dev_link; 65818840871SNélio Laranjeiro return 0; 65918840871SNélio Laranjeiro } 66018840871SNélio Laranjeiro /* Link status is still the same. */ 66118840871SNélio Laranjeiro return -1; 66218840871SNélio Laranjeiro } 66318840871SNélio Laranjeiro 66418840871SNélio Laranjeiro /** 665c7bf6225SYongseok Koh * Enable receiving and transmitting traffic. 666c7bf6225SYongseok Koh * 667c7bf6225SYongseok Koh * @param priv 668c7bf6225SYongseok Koh * Pointer to private structure. 669c7bf6225SYongseok Koh */ 670c7bf6225SYongseok Koh static void 671c7bf6225SYongseok Koh priv_link_start(struct priv *priv) 672c7bf6225SYongseok Koh { 673c7bf6225SYongseok Koh struct rte_eth_dev *dev = priv->dev; 674c7bf6225SYongseok Koh int err; 675c7bf6225SYongseok Koh 676c7bf6225SYongseok Koh dev->tx_pkt_burst = priv_select_tx_function(priv, dev); 677c7bf6225SYongseok Koh dev->rx_pkt_burst = priv_select_rx_function(priv, dev); 678c7bf6225SYongseok Koh err = priv_dev_traffic_enable(priv, dev); 679c7bf6225SYongseok Koh if (err) 680c7bf6225SYongseok Koh ERROR("%p: error occurred while configuring control flows: %s", 681c7bf6225SYongseok Koh (void *)priv, strerror(err)); 682c7bf6225SYongseok Koh err = priv_flow_start(priv, &priv->flows); 683c7bf6225SYongseok Koh if (err) 684c7bf6225SYongseok Koh ERROR("%p: error occurred while configuring flows: %s", 685c7bf6225SYongseok Koh (void *)priv, strerror(err)); 686c7bf6225SYongseok Koh } 687c7bf6225SYongseok Koh 688c7bf6225SYongseok Koh /** 689c7bf6225SYongseok Koh * Disable receiving and transmitting traffic. 690c7bf6225SYongseok Koh * 691c7bf6225SYongseok Koh * @param priv 692c7bf6225SYongseok Koh * Pointer to private structure. 693c7bf6225SYongseok Koh */ 694c7bf6225SYongseok Koh static void 695c7bf6225SYongseok Koh priv_link_stop(struct priv *priv) 696c7bf6225SYongseok Koh { 697c7bf6225SYongseok Koh struct rte_eth_dev *dev = priv->dev; 698c7bf6225SYongseok Koh 699c7bf6225SYongseok Koh priv_flow_stop(priv, &priv->flows); 700c7bf6225SYongseok Koh priv_dev_traffic_disable(priv, dev); 701c7bf6225SYongseok Koh dev->rx_pkt_burst = removed_rx_burst; 702c7bf6225SYongseok Koh dev->tx_pkt_burst = removed_tx_burst; 703c7bf6225SYongseok Koh } 704c7bf6225SYongseok Koh 705c7bf6225SYongseok Koh /** 706c7bf6225SYongseok Koh * Retrieve physical link information and update rx/tx_pkt_burst callbacks 707c7bf6225SYongseok Koh * accordingly. 708c7bf6225SYongseok Koh * 709c7bf6225SYongseok Koh * @param priv 710c7bf6225SYongseok Koh * Pointer to private structure. 711c7bf6225SYongseok Koh * @param wait_to_complete 712c7bf6225SYongseok Koh * Wait for request completion (ignored). 713c7bf6225SYongseok Koh */ 714c7bf6225SYongseok Koh int 715c7bf6225SYongseok Koh priv_link_update(struct priv *priv, int wait_to_complete) 716c7bf6225SYongseok Koh { 717c7bf6225SYongseok Koh struct rte_eth_dev *dev = priv->dev; 718c7bf6225SYongseok Koh struct utsname utsname; 719c7bf6225SYongseok Koh int ver[3]; 720c7bf6225SYongseok Koh int ret; 721c7bf6225SYongseok Koh struct rte_eth_link dev_link = dev->data->dev_link; 722c7bf6225SYongseok Koh 723c7bf6225SYongseok Koh if (uname(&utsname) == -1 || 724c7bf6225SYongseok Koh sscanf(utsname.release, "%d.%d.%d", 725c7bf6225SYongseok Koh &ver[0], &ver[1], &ver[2]) != 3 || 726c7bf6225SYongseok Koh KERNEL_VERSION(ver[0], ver[1], ver[2]) < KERNEL_VERSION(4, 9, 0)) 727c7bf6225SYongseok Koh ret = mlx5_link_update_unlocked_gset(dev, wait_to_complete); 728c7bf6225SYongseok Koh else 729c7bf6225SYongseok Koh ret = mlx5_link_update_unlocked_gs(dev, wait_to_complete); 730c7bf6225SYongseok Koh /* If lsc interrupt is disabled, should always be ready for traffic. */ 731c7bf6225SYongseok Koh if (!dev->data->dev_conf.intr_conf.lsc) { 732c7bf6225SYongseok Koh priv_link_start(priv); 733c7bf6225SYongseok Koh return ret; 734c7bf6225SYongseok Koh } 735c7bf6225SYongseok Koh /* Re-select burst callbacks only if link status has been changed. */ 736c7bf6225SYongseok Koh if (!ret && dev_link.link_status != dev->data->dev_link.link_status) { 737c7bf6225SYongseok Koh if (dev->data->dev_link.link_status == ETH_LINK_UP) 738c7bf6225SYongseok Koh priv_link_start(priv); 739c7bf6225SYongseok Koh else 740c7bf6225SYongseok Koh priv_link_stop(priv); 741c7bf6225SYongseok Koh } 742c7bf6225SYongseok Koh return ret; 743c7bf6225SYongseok Koh } 744c7bf6225SYongseok Koh 745c7bf6225SYongseok Koh /** 746e313ef4cSShahaf Shuler * Querying the link status till it changes to the desired state. 747e313ef4cSShahaf Shuler * Number of query attempts is bounded by MLX5_MAX_LINK_QUERY_ATTEMPTS. 748e313ef4cSShahaf Shuler * 749e313ef4cSShahaf Shuler * @param priv 750e313ef4cSShahaf Shuler * Pointer to private structure. 751e313ef4cSShahaf Shuler * @param status 752e313ef4cSShahaf Shuler * Link desired status. 753e313ef4cSShahaf Shuler * 754e313ef4cSShahaf Shuler * @return 755e313ef4cSShahaf Shuler * 0 on success, negative errno value on failure. 756e313ef4cSShahaf Shuler */ 757e313ef4cSShahaf Shuler int 758e313ef4cSShahaf Shuler priv_force_link_status_change(struct priv *priv, int status) 759e313ef4cSShahaf Shuler { 760e313ef4cSShahaf Shuler int try = 0; 761e313ef4cSShahaf Shuler 762e313ef4cSShahaf Shuler while (try < MLX5_MAX_LINK_QUERY_ATTEMPTS) { 763e313ef4cSShahaf Shuler priv_link_update(priv, 0); 764e313ef4cSShahaf Shuler if (priv->dev->data->dev_link.link_status == status) 765e313ef4cSShahaf Shuler return 0; 766e313ef4cSShahaf Shuler try++; 767e313ef4cSShahaf Shuler sleep(1); 768e313ef4cSShahaf Shuler } 769e313ef4cSShahaf Shuler return -EAGAIN; 770e313ef4cSShahaf Shuler } 771e313ef4cSShahaf Shuler 772e313ef4cSShahaf Shuler /** 773cb8faed7SAdrien Mazarguil * DPDK callback to retrieve physical link information. 774cb8faed7SAdrien Mazarguil * 775cb8faed7SAdrien Mazarguil * @param dev 776cb8faed7SAdrien Mazarguil * Pointer to Ethernet device structure. 777cb8faed7SAdrien Mazarguil * @param wait_to_complete 778cb8faed7SAdrien Mazarguil * Wait for request completion (ignored). 779cb8faed7SAdrien Mazarguil */ 780cb8faed7SAdrien Mazarguil int 781cb8faed7SAdrien Mazarguil mlx5_link_update(struct rte_eth_dev *dev, int wait_to_complete) 782cb8faed7SAdrien Mazarguil { 783c7bf6225SYongseok Koh struct priv *priv = dev->data->dev_private; 784c7bf6225SYongseok Koh int ret; 785cb8faed7SAdrien Mazarguil 786c7bf6225SYongseok Koh priv_lock(priv); 787c7bf6225SYongseok Koh ret = priv_link_update(priv, wait_to_complete); 788c7bf6225SYongseok Koh priv_unlock(priv); 789c7bf6225SYongseok Koh return ret; 790cb8faed7SAdrien Mazarguil } 791cb8faed7SAdrien Mazarguil 792cb8faed7SAdrien Mazarguil /** 793cf37ca95SAdrien Mazarguil * DPDK callback to change the MTU. 794cf37ca95SAdrien Mazarguil * 795cf37ca95SAdrien Mazarguil * @param dev 796cf37ca95SAdrien Mazarguil * Pointer to Ethernet device structure. 797cf37ca95SAdrien Mazarguil * @param in_mtu 798cf37ca95SAdrien Mazarguil * New MTU. 799cf37ca95SAdrien Mazarguil * 800cf37ca95SAdrien Mazarguil * @return 801cf37ca95SAdrien Mazarguil * 0 on success, negative errno value on failure. 802cf37ca95SAdrien Mazarguil */ 803cf37ca95SAdrien Mazarguil int 804cf37ca95SAdrien Mazarguil mlx5_dev_set_mtu(struct rte_eth_dev *dev, uint16_t mtu) 805cf37ca95SAdrien Mazarguil { 806cf37ca95SAdrien Mazarguil struct priv *priv = dev->data->dev_private; 807a0edafe4SNelio Laranjeiro uint16_t kern_mtu; 808cf37ca95SAdrien Mazarguil int ret = 0; 809cf37ca95SAdrien Mazarguil 810cf37ca95SAdrien Mazarguil priv_lock(priv); 811a0edafe4SNelio Laranjeiro ret = priv_get_mtu(priv, &kern_mtu); 812a0edafe4SNelio Laranjeiro if (ret) 813a0edafe4SNelio Laranjeiro goto out; 814cf37ca95SAdrien Mazarguil /* Set kernel interface MTU first. */ 815a0edafe4SNelio Laranjeiro ret = priv_set_mtu(priv, mtu); 816a0edafe4SNelio Laranjeiro if (ret) 817a0edafe4SNelio Laranjeiro goto out; 818a0edafe4SNelio Laranjeiro ret = priv_get_mtu(priv, &kern_mtu); 819a0edafe4SNelio Laranjeiro if (ret) 820a0edafe4SNelio Laranjeiro goto out; 821a0edafe4SNelio Laranjeiro if (kern_mtu == mtu) { 822a0edafe4SNelio Laranjeiro priv->mtu = mtu; 823a0edafe4SNelio Laranjeiro DEBUG("adapter port %u MTU set to %u", priv->port, mtu); 824a0edafe4SNelio Laranjeiro } 825a0edafe4SNelio Laranjeiro priv_unlock(priv); 826a0edafe4SNelio Laranjeiro return 0; 827a0edafe4SNelio Laranjeiro out: 828cf37ca95SAdrien Mazarguil ret = errno; 829cf37ca95SAdrien Mazarguil WARN("cannot set port %u MTU to %u: %s", priv->port, mtu, 830cf37ca95SAdrien Mazarguil strerror(ret)); 831cf37ca95SAdrien Mazarguil priv_unlock(priv); 832cf37ca95SAdrien Mazarguil assert(ret >= 0); 833cf37ca95SAdrien Mazarguil return -ret; 834cf37ca95SAdrien Mazarguil } 835cf37ca95SAdrien Mazarguil 836cf37ca95SAdrien Mazarguil /** 83702d75430SAdrien Mazarguil * DPDK callback to get flow control status. 83802d75430SAdrien Mazarguil * 83902d75430SAdrien Mazarguil * @param dev 84002d75430SAdrien Mazarguil * Pointer to Ethernet device structure. 84102d75430SAdrien Mazarguil * @param[out] fc_conf 84202d75430SAdrien Mazarguil * Flow control output buffer. 84302d75430SAdrien Mazarguil * 84402d75430SAdrien Mazarguil * @return 84502d75430SAdrien Mazarguil * 0 on success, negative errno value on failure. 84602d75430SAdrien Mazarguil */ 84702d75430SAdrien Mazarguil int 84802d75430SAdrien Mazarguil mlx5_dev_get_flow_ctrl(struct rte_eth_dev *dev, struct rte_eth_fc_conf *fc_conf) 84902d75430SAdrien Mazarguil { 85002d75430SAdrien Mazarguil struct priv *priv = dev->data->dev_private; 85102d75430SAdrien Mazarguil struct ifreq ifr; 85202d75430SAdrien Mazarguil struct ethtool_pauseparam ethpause = { 85302d75430SAdrien Mazarguil .cmd = ETHTOOL_GPAUSEPARAM 85402d75430SAdrien Mazarguil }; 85502d75430SAdrien Mazarguil int ret; 85602d75430SAdrien Mazarguil 857d06c608cSAdrien Mazarguil ifr.ifr_data = (void *)ðpause; 85802d75430SAdrien Mazarguil priv_lock(priv); 85902d75430SAdrien Mazarguil if (priv_ifreq(priv, SIOCETHTOOL, &ifr)) { 86002d75430SAdrien Mazarguil ret = errno; 86102d75430SAdrien Mazarguil WARN("ioctl(SIOCETHTOOL, ETHTOOL_GPAUSEPARAM)" 86202d75430SAdrien Mazarguil " failed: %s", 86302d75430SAdrien Mazarguil strerror(ret)); 86402d75430SAdrien Mazarguil goto out; 86502d75430SAdrien Mazarguil } 86602d75430SAdrien Mazarguil 86702d75430SAdrien Mazarguil fc_conf->autoneg = ethpause.autoneg; 86802d75430SAdrien Mazarguil if (ethpause.rx_pause && ethpause.tx_pause) 86902d75430SAdrien Mazarguil fc_conf->mode = RTE_FC_FULL; 87002d75430SAdrien Mazarguil else if (ethpause.rx_pause) 87102d75430SAdrien Mazarguil fc_conf->mode = RTE_FC_RX_PAUSE; 87202d75430SAdrien Mazarguil else if (ethpause.tx_pause) 87302d75430SAdrien Mazarguil fc_conf->mode = RTE_FC_TX_PAUSE; 87402d75430SAdrien Mazarguil else 87502d75430SAdrien Mazarguil fc_conf->mode = RTE_FC_NONE; 87602d75430SAdrien Mazarguil ret = 0; 87702d75430SAdrien Mazarguil 87802d75430SAdrien Mazarguil out: 87902d75430SAdrien Mazarguil priv_unlock(priv); 88002d75430SAdrien Mazarguil assert(ret >= 0); 88102d75430SAdrien Mazarguil return -ret; 88202d75430SAdrien Mazarguil } 88302d75430SAdrien Mazarguil 88402d75430SAdrien Mazarguil /** 88502d75430SAdrien Mazarguil * DPDK callback to modify flow control parameters. 88602d75430SAdrien Mazarguil * 88702d75430SAdrien Mazarguil * @param dev 88802d75430SAdrien Mazarguil * Pointer to Ethernet device structure. 88902d75430SAdrien Mazarguil * @param[in] fc_conf 89002d75430SAdrien Mazarguil * Flow control parameters. 89102d75430SAdrien Mazarguil * 89202d75430SAdrien Mazarguil * @return 89302d75430SAdrien Mazarguil * 0 on success, negative errno value on failure. 89402d75430SAdrien Mazarguil */ 89502d75430SAdrien Mazarguil int 89602d75430SAdrien Mazarguil mlx5_dev_set_flow_ctrl(struct rte_eth_dev *dev, struct rte_eth_fc_conf *fc_conf) 89702d75430SAdrien Mazarguil { 89802d75430SAdrien Mazarguil struct priv *priv = dev->data->dev_private; 89902d75430SAdrien Mazarguil struct ifreq ifr; 90002d75430SAdrien Mazarguil struct ethtool_pauseparam ethpause = { 90102d75430SAdrien Mazarguil .cmd = ETHTOOL_SPAUSEPARAM 90202d75430SAdrien Mazarguil }; 90302d75430SAdrien Mazarguil int ret; 90402d75430SAdrien Mazarguil 905d06c608cSAdrien Mazarguil ifr.ifr_data = (void *)ðpause; 90602d75430SAdrien Mazarguil ethpause.autoneg = fc_conf->autoneg; 90702d75430SAdrien Mazarguil if (((fc_conf->mode & RTE_FC_FULL) == RTE_FC_FULL) || 90802d75430SAdrien Mazarguil (fc_conf->mode & RTE_FC_RX_PAUSE)) 90902d75430SAdrien Mazarguil ethpause.rx_pause = 1; 91002d75430SAdrien Mazarguil else 91102d75430SAdrien Mazarguil ethpause.rx_pause = 0; 91202d75430SAdrien Mazarguil 91302d75430SAdrien Mazarguil if (((fc_conf->mode & RTE_FC_FULL) == RTE_FC_FULL) || 91402d75430SAdrien Mazarguil (fc_conf->mode & RTE_FC_TX_PAUSE)) 91502d75430SAdrien Mazarguil ethpause.tx_pause = 1; 91602d75430SAdrien Mazarguil else 91702d75430SAdrien Mazarguil ethpause.tx_pause = 0; 91802d75430SAdrien Mazarguil 91902d75430SAdrien Mazarguil priv_lock(priv); 92002d75430SAdrien Mazarguil if (priv_ifreq(priv, SIOCETHTOOL, &ifr)) { 92102d75430SAdrien Mazarguil ret = errno; 92202d75430SAdrien Mazarguil WARN("ioctl(SIOCETHTOOL, ETHTOOL_SPAUSEPARAM)" 92302d75430SAdrien Mazarguil " failed: %s", 92402d75430SAdrien Mazarguil strerror(ret)); 92502d75430SAdrien Mazarguil goto out; 92602d75430SAdrien Mazarguil } 92702d75430SAdrien Mazarguil ret = 0; 92802d75430SAdrien Mazarguil 92902d75430SAdrien Mazarguil out: 93002d75430SAdrien Mazarguil priv_unlock(priv); 93102d75430SAdrien Mazarguil assert(ret >= 0); 93202d75430SAdrien Mazarguil return -ret; 93302d75430SAdrien Mazarguil } 93402d75430SAdrien Mazarguil 93502d75430SAdrien Mazarguil /** 936771fa900SAdrien Mazarguil * Get PCI information from struct ibv_device. 937771fa900SAdrien Mazarguil * 938771fa900SAdrien Mazarguil * @param device 939771fa900SAdrien Mazarguil * Pointer to Ethernet device structure. 940771fa900SAdrien Mazarguil * @param[out] pci_addr 941771fa900SAdrien Mazarguil * PCI bus address output buffer. 942771fa900SAdrien Mazarguil * 943771fa900SAdrien Mazarguil * @return 944771fa900SAdrien Mazarguil * 0 on success, -1 on failure and errno is set. 945771fa900SAdrien Mazarguil */ 946771fa900SAdrien Mazarguil int 947771fa900SAdrien Mazarguil mlx5_ibv_device_to_pci_addr(const struct ibv_device *device, 948771fa900SAdrien Mazarguil struct rte_pci_addr *pci_addr) 949771fa900SAdrien Mazarguil { 950771fa900SAdrien Mazarguil FILE *file; 951771fa900SAdrien Mazarguil char line[32]; 952771fa900SAdrien Mazarguil MKSTR(path, "%s/device/uevent", device->ibdev_path); 953771fa900SAdrien Mazarguil 954771fa900SAdrien Mazarguil file = fopen(path, "rb"); 955771fa900SAdrien Mazarguil if (file == NULL) 956771fa900SAdrien Mazarguil return -1; 957771fa900SAdrien Mazarguil while (fgets(line, sizeof(line), file) == line) { 958771fa900SAdrien Mazarguil size_t len = strlen(line); 959771fa900SAdrien Mazarguil int ret; 960771fa900SAdrien Mazarguil 961771fa900SAdrien Mazarguil /* Truncate long lines. */ 962771fa900SAdrien Mazarguil if (len == (sizeof(line) - 1)) 963771fa900SAdrien Mazarguil while (line[(len - 1)] != '\n') { 964771fa900SAdrien Mazarguil ret = fgetc(file); 965771fa900SAdrien Mazarguil if (ret == EOF) 966771fa900SAdrien Mazarguil break; 967771fa900SAdrien Mazarguil line[(len - 1)] = ret; 968771fa900SAdrien Mazarguil } 969771fa900SAdrien Mazarguil /* Extract information. */ 970771fa900SAdrien Mazarguil if (sscanf(line, 971771fa900SAdrien Mazarguil "PCI_SLOT_NAME=" 972463ced95SStephen Hemminger "%" SCNx32 ":%" SCNx8 ":%" SCNx8 ".%" SCNx8 "\n", 973771fa900SAdrien Mazarguil &pci_addr->domain, 974771fa900SAdrien Mazarguil &pci_addr->bus, 975771fa900SAdrien Mazarguil &pci_addr->devid, 976771fa900SAdrien Mazarguil &pci_addr->function) == 4) { 977771fa900SAdrien Mazarguil ret = 0; 978771fa900SAdrien Mazarguil break; 979771fa900SAdrien Mazarguil } 980771fa900SAdrien Mazarguil } 981771fa900SAdrien Mazarguil fclose(file); 982771fa900SAdrien Mazarguil return 0; 983771fa900SAdrien Mazarguil } 984198a3c33SNelio Laranjeiro 985198a3c33SNelio Laranjeiro /** 986c26ae069SMatan Azrad * Update the link status. 987198a3c33SNelio Laranjeiro * 988198a3c33SNelio Laranjeiro * @param priv 989198a3c33SNelio Laranjeiro * Pointer to private structure. 990198a3c33SNelio Laranjeiro * 991198a3c33SNelio Laranjeiro * @return 992c26ae069SMatan Azrad * Zero if the callback process can be called immediately. 993198a3c33SNelio Laranjeiro */ 994198a3c33SNelio Laranjeiro static int 995c26ae069SMatan Azrad priv_link_status_update(struct priv *priv) 996c26ae069SMatan Azrad { 997c26ae069SMatan Azrad struct rte_eth_link *link = &priv->dev->data->dev_link; 998c26ae069SMatan Azrad 999c7bf6225SYongseok Koh priv_link_update(priv, 0); 1000c26ae069SMatan Azrad if (((link->link_speed == 0) && link->link_status) || 1001c26ae069SMatan Azrad ((link->link_speed != 0) && !link->link_status)) { 1002c26ae069SMatan Azrad /* 1003c26ae069SMatan Azrad * Inconsistent status. Event likely occurred before the 1004c26ae069SMatan Azrad * kernel netdevice exposes the new status. 1005c26ae069SMatan Azrad */ 1006c26ae069SMatan Azrad if (!priv->pending_alarm) { 1007c26ae069SMatan Azrad priv->pending_alarm = 1; 1008c26ae069SMatan Azrad rte_eal_alarm_set(MLX5_ALARM_TIMEOUT_US, 1009c26ae069SMatan Azrad mlx5_dev_link_status_handler, 1010c26ae069SMatan Azrad priv->dev); 1011c26ae069SMatan Azrad } 1012c26ae069SMatan Azrad return 1; 1013c26ae069SMatan Azrad } else if (unlikely(priv->pending_alarm)) { 1014c26ae069SMatan Azrad /* Link interrupt occurred while alarm is already scheduled. */ 1015c26ae069SMatan Azrad priv->pending_alarm = 0; 1016c26ae069SMatan Azrad rte_eal_alarm_cancel(mlx5_dev_link_status_handler, priv->dev); 1017c26ae069SMatan Azrad } 1018c26ae069SMatan Azrad return 0; 1019c26ae069SMatan Azrad } 1020c26ae069SMatan Azrad 1021c26ae069SMatan Azrad /** 1022c26ae069SMatan Azrad * Device status handler. 1023c26ae069SMatan Azrad * 1024c26ae069SMatan Azrad * @param priv 1025c26ae069SMatan Azrad * Pointer to private structure. 1026c26ae069SMatan Azrad * @param events 1027c26ae069SMatan Azrad * Pointer to event flags holder. 1028c26ae069SMatan Azrad * 1029c26ae069SMatan Azrad * @return 1030c26ae069SMatan Azrad * Events bitmap of callback process which can be called immediately. 1031c26ae069SMatan Azrad */ 1032c26ae069SMatan Azrad static uint32_t 1033c26ae069SMatan Azrad priv_dev_status_handler(struct priv *priv) 1034198a3c33SNelio Laranjeiro { 1035198a3c33SNelio Laranjeiro struct ibv_async_event event; 1036c26ae069SMatan Azrad uint32_t ret = 0; 1037198a3c33SNelio Laranjeiro 1038198a3c33SNelio Laranjeiro /* Read all message and acknowledge them. */ 1039198a3c33SNelio Laranjeiro for (;;) { 10400e83b8e5SNelio Laranjeiro if (mlx5_glue->get_async_event(priv->ctx, &event)) 1041198a3c33SNelio Laranjeiro break; 1042c26ae069SMatan Azrad if ((event.event_type == IBV_EVENT_PORT_ACTIVE || 1043c26ae069SMatan Azrad event.event_type == IBV_EVENT_PORT_ERR) && 1044c26ae069SMatan Azrad (priv->dev->data->dev_conf.intr_conf.lsc == 1)) 1045c26ae069SMatan Azrad ret |= (1 << RTE_ETH_EVENT_INTR_LSC); 10467d7d7ad1SMatan Azrad else if (event.event_type == IBV_EVENT_DEVICE_FATAL && 10477d7d7ad1SMatan Azrad priv->dev->data->dev_conf.intr_conf.rmv == 1) 10487d7d7ad1SMatan Azrad ret |= (1 << RTE_ETH_EVENT_INTR_RMV); 1049c26ae069SMatan Azrad else 1050198a3c33SNelio Laranjeiro DEBUG("event type %d on port %d not handled", 1051198a3c33SNelio Laranjeiro event.event_type, event.element.port_num); 10520e83b8e5SNelio Laranjeiro mlx5_glue->ack_async_event(&event); 1053198a3c33SNelio Laranjeiro } 1054c26ae069SMatan Azrad if (ret & (1 << RTE_ETH_EVENT_INTR_LSC)) 1055c26ae069SMatan Azrad if (priv_link_status_update(priv)) 1056c26ae069SMatan Azrad ret &= ~(1 << RTE_ETH_EVENT_INTR_LSC); 1057198a3c33SNelio Laranjeiro return ret; 1058198a3c33SNelio Laranjeiro } 1059198a3c33SNelio Laranjeiro 1060198a3c33SNelio Laranjeiro /** 1061198a3c33SNelio Laranjeiro * Handle delayed link status event. 1062198a3c33SNelio Laranjeiro * 1063198a3c33SNelio Laranjeiro * @param arg 1064198a3c33SNelio Laranjeiro * Registered argument. 1065198a3c33SNelio Laranjeiro */ 1066198a3c33SNelio Laranjeiro void 1067198a3c33SNelio Laranjeiro mlx5_dev_link_status_handler(void *arg) 1068198a3c33SNelio Laranjeiro { 1069198a3c33SNelio Laranjeiro struct rte_eth_dev *dev = arg; 1070198a3c33SNelio Laranjeiro struct priv *priv = dev->data->dev_private; 1071198a3c33SNelio Laranjeiro int ret; 1072198a3c33SNelio Laranjeiro 10736817ad38SYongseok Koh while (!priv_trylock(priv)) { 10746817ad38SYongseok Koh /* Alarm is being canceled. */ 10756817ad38SYongseok Koh if (priv->pending_alarm == 0) 10766817ad38SYongseok Koh return; 10776817ad38SYongseok Koh rte_pause(); 10786817ad38SYongseok Koh } 1079a9f2fbc4SShahaf Shuler priv->pending_alarm = 0; 1080c26ae069SMatan Azrad ret = priv_link_status_update(priv); 1081198a3c33SNelio Laranjeiro priv_unlock(priv); 1082c26ae069SMatan Azrad if (!ret) 1083cebe3d7bSThomas Monjalon _rte_eth_dev_callback_process(dev, RTE_ETH_EVENT_INTR_LSC, NULL); 1084198a3c33SNelio Laranjeiro } 1085198a3c33SNelio Laranjeiro 1086198a3c33SNelio Laranjeiro /** 1087198a3c33SNelio Laranjeiro * Handle interrupts from the NIC. 1088198a3c33SNelio Laranjeiro * 1089198a3c33SNelio Laranjeiro * @param[in] intr_handle 1090198a3c33SNelio Laranjeiro * Interrupt handler. 1091198a3c33SNelio Laranjeiro * @param cb_arg 1092198a3c33SNelio Laranjeiro * Callback argument. 1093198a3c33SNelio Laranjeiro */ 1094198a3c33SNelio Laranjeiro void 1095c23a1a30SQi Zhang mlx5_dev_interrupt_handler(void *cb_arg) 1096198a3c33SNelio Laranjeiro { 1097198a3c33SNelio Laranjeiro struct rte_eth_dev *dev = cb_arg; 1098198a3c33SNelio Laranjeiro struct priv *priv = dev->data->dev_private; 1099c26ae069SMatan Azrad uint32_t events; 1100198a3c33SNelio Laranjeiro 1101198a3c33SNelio Laranjeiro priv_lock(priv); 1102c26ae069SMatan Azrad events = priv_dev_status_handler(priv); 1103198a3c33SNelio Laranjeiro priv_unlock(priv); 1104c26ae069SMatan Azrad if (events & (1 << RTE_ETH_EVENT_INTR_LSC)) 1105cebe3d7bSThomas Monjalon _rte_eth_dev_callback_process(dev, RTE_ETH_EVENT_INTR_LSC, NULL); 11067d7d7ad1SMatan Azrad if (events & (1 << RTE_ETH_EVENT_INTR_RMV)) 1107cebe3d7bSThomas Monjalon _rte_eth_dev_callback_process(dev, RTE_ETH_EVENT_INTR_RMV, NULL); 1108198a3c33SNelio Laranjeiro } 1109198a3c33SNelio Laranjeiro 1110198a3c33SNelio Laranjeiro /** 1111f8b9a3baSXueming Li * Handle interrupts from the socket. 1112f8b9a3baSXueming Li * 1113f8b9a3baSXueming Li * @param cb_arg 1114f8b9a3baSXueming Li * Callback argument. 1115f8b9a3baSXueming Li */ 1116f8b9a3baSXueming Li static void 1117f8b9a3baSXueming Li mlx5_dev_handler_socket(void *cb_arg) 1118f8b9a3baSXueming Li { 1119f8b9a3baSXueming Li struct rte_eth_dev *dev = cb_arg; 1120f8b9a3baSXueming Li struct priv *priv = dev->data->dev_private; 1121f8b9a3baSXueming Li 1122f8b9a3baSXueming Li priv_lock(priv); 1123f8b9a3baSXueming Li priv_socket_handle(priv); 1124f8b9a3baSXueming Li priv_unlock(priv); 1125f8b9a3baSXueming Li } 1126f8b9a3baSXueming Li 1127f8b9a3baSXueming Li /** 1128198a3c33SNelio Laranjeiro * Uninstall interrupt handler. 1129198a3c33SNelio Laranjeiro * 1130198a3c33SNelio Laranjeiro * @param priv 1131198a3c33SNelio Laranjeiro * Pointer to private structure. 1132198a3c33SNelio Laranjeiro * @param dev 1133198a3c33SNelio Laranjeiro * Pointer to the rte_eth_dev structure. 1134198a3c33SNelio Laranjeiro */ 1135198a3c33SNelio Laranjeiro void 1136198a3c33SNelio Laranjeiro priv_dev_interrupt_handler_uninstall(struct priv *priv, struct rte_eth_dev *dev) 1137198a3c33SNelio Laranjeiro { 1138f8b9a3baSXueming Li if (dev->data->dev_conf.intr_conf.lsc || 1139f8b9a3baSXueming Li dev->data->dev_conf.intr_conf.rmv) 1140198a3c33SNelio Laranjeiro rte_intr_callback_unregister(&priv->intr_handle, 1141f8b9a3baSXueming Li mlx5_dev_interrupt_handler, dev); 1142f8b9a3baSXueming Li if (priv->primary_socket) 1143f8b9a3baSXueming Li rte_intr_callback_unregister(&priv->intr_handle_socket, 1144f8b9a3baSXueming Li mlx5_dev_handler_socket, dev); 11456817ad38SYongseok Koh if (priv->pending_alarm) { 1146198a3c33SNelio Laranjeiro priv->pending_alarm = 0; 11476817ad38SYongseok Koh rte_eal_alarm_cancel(mlx5_dev_link_status_handler, dev); 11486817ad38SYongseok Koh } 1149198a3c33SNelio Laranjeiro priv->intr_handle.fd = 0; 115036351ea3SFerruh Yigit priv->intr_handle.type = RTE_INTR_HANDLE_UNKNOWN; 1151f8b9a3baSXueming Li priv->intr_handle_socket.fd = 0; 1152f8b9a3baSXueming Li priv->intr_handle_socket.type = RTE_INTR_HANDLE_UNKNOWN; 1153198a3c33SNelio Laranjeiro } 1154198a3c33SNelio Laranjeiro 1155198a3c33SNelio Laranjeiro /** 1156198a3c33SNelio Laranjeiro * Install interrupt handler. 1157198a3c33SNelio Laranjeiro * 1158198a3c33SNelio Laranjeiro * @param priv 1159198a3c33SNelio Laranjeiro * Pointer to private structure. 1160198a3c33SNelio Laranjeiro * @param dev 1161198a3c33SNelio Laranjeiro * Pointer to the rte_eth_dev structure. 1162198a3c33SNelio Laranjeiro */ 1163198a3c33SNelio Laranjeiro void 1164198a3c33SNelio Laranjeiro priv_dev_interrupt_handler_install(struct priv *priv, struct rte_eth_dev *dev) 1165198a3c33SNelio Laranjeiro { 1166198a3c33SNelio Laranjeiro int rc, flags; 1167198a3c33SNelio Laranjeiro 1168198a3c33SNelio Laranjeiro assert(priv->ctx->async_fd > 0); 1169198a3c33SNelio Laranjeiro flags = fcntl(priv->ctx->async_fd, F_GETFL); 1170198a3c33SNelio Laranjeiro rc = fcntl(priv->ctx->async_fd, F_SETFL, flags | O_NONBLOCK); 1171198a3c33SNelio Laranjeiro if (rc < 0) { 1172198a3c33SNelio Laranjeiro INFO("failed to change file descriptor async event queue"); 1173198a3c33SNelio Laranjeiro dev->data->dev_conf.intr_conf.lsc = 0; 11747d7d7ad1SMatan Azrad dev->data->dev_conf.intr_conf.rmv = 0; 1175f8b9a3baSXueming Li } 1176f8b9a3baSXueming Li if (dev->data->dev_conf.intr_conf.lsc || 1177f8b9a3baSXueming Li dev->data->dev_conf.intr_conf.rmv) { 1178198a3c33SNelio Laranjeiro priv->intr_handle.fd = priv->ctx->async_fd; 1179198a3c33SNelio Laranjeiro priv->intr_handle.type = RTE_INTR_HANDLE_EXT; 1180198a3c33SNelio Laranjeiro rte_intr_callback_register(&priv->intr_handle, 1181f8b9a3baSXueming Li mlx5_dev_interrupt_handler, dev); 1182f8b9a3baSXueming Li } 1183f8b9a3baSXueming Li 1184f8b9a3baSXueming Li rc = priv_socket_init(priv); 1185f8b9a3baSXueming Li if (!rc && priv->primary_socket) { 1186f8b9a3baSXueming Li priv->intr_handle_socket.fd = priv->primary_socket; 1187f8b9a3baSXueming Li priv->intr_handle_socket.type = RTE_INTR_HANDLE_EXT; 1188f8b9a3baSXueming Li rte_intr_callback_register(&priv->intr_handle_socket, 1189f8b9a3baSXueming Li mlx5_dev_handler_socket, dev); 1190198a3c33SNelio Laranjeiro } 1191198a3c33SNelio Laranjeiro } 119262072098SOr Ami 119362072098SOr Ami /** 119462072098SOr Ami * Change the link state (UP / DOWN). 119562072098SOr Ami * 11963d04e050SOlivier Matz * @param priv 1197aee1b165SXueming Li * Pointer to private data structure. 119862072098SOr Ami * @param up 119962072098SOr Ami * Nonzero for link up, otherwise link down. 120062072098SOr Ami * 120162072098SOr Ami * @return 120262072098SOr Ami * 0 on success, errno value on failure. 120362072098SOr Ami */ 120462072098SOr Ami static int 1205c7bf6225SYongseok Koh priv_dev_set_link(struct priv *priv, int up) 120662072098SOr Ami { 1207c7bf6225SYongseok Koh return priv_set_flags(priv, ~IFF_UP, up ? IFF_UP : ~IFF_UP); 120862072098SOr Ami } 120962072098SOr Ami 121062072098SOr Ami /** 121162072098SOr Ami * DPDK callback to bring the link DOWN. 121262072098SOr Ami * 121362072098SOr Ami * @param dev 121462072098SOr Ami * Pointer to Ethernet device structure. 121562072098SOr Ami * 121662072098SOr Ami * @return 121762072098SOr Ami * 0 on success, errno value on failure. 121862072098SOr Ami */ 121962072098SOr Ami int 122062072098SOr Ami mlx5_set_link_down(struct rte_eth_dev *dev) 122162072098SOr Ami { 122262072098SOr Ami struct priv *priv = dev->data->dev_private; 122362072098SOr Ami int err; 122462072098SOr Ami 122562072098SOr Ami priv_lock(priv); 1226c7bf6225SYongseok Koh err = priv_dev_set_link(priv, 0); 122762072098SOr Ami priv_unlock(priv); 122862072098SOr Ami return err; 122962072098SOr Ami } 123062072098SOr Ami 123162072098SOr Ami /** 123262072098SOr Ami * DPDK callback to bring the link UP. 123362072098SOr Ami * 123462072098SOr Ami * @param dev 123562072098SOr Ami * Pointer to Ethernet device structure. 123662072098SOr Ami * 123762072098SOr Ami * @return 123862072098SOr Ami * 0 on success, errno value on failure. 123962072098SOr Ami */ 124062072098SOr Ami int 124162072098SOr Ami mlx5_set_link_up(struct rte_eth_dev *dev) 124262072098SOr Ami { 124362072098SOr Ami struct priv *priv = dev->data->dev_private; 124462072098SOr Ami int err; 124562072098SOr Ami 124662072098SOr Ami priv_lock(priv); 1247c7bf6225SYongseok Koh err = priv_dev_set_link(priv, 1); 124862072098SOr Ami priv_unlock(priv); 124962072098SOr Ami return err; 125062072098SOr Ami } 1251a48deadaSOr Ami 1252a48deadaSOr Ami /** 1253cdab90cbSNélio Laranjeiro * Configure the TX function to use. 1254cdab90cbSNélio Laranjeiro * 1255cdab90cbSNélio Laranjeiro * @param priv 1256aee1b165SXueming Li * Pointer to private data structure. 1257aee1b165SXueming Li * @param dev 1258aee1b165SXueming Li * Pointer to rte_eth_dev structure. 12591cfa649bSShahaf Shuler * 12601cfa649bSShahaf Shuler * @return 12611cfa649bSShahaf Shuler * Pointer to selected Tx burst function. 1262cdab90cbSNélio Laranjeiro */ 12631cfa649bSShahaf Shuler eth_tx_burst_t 1264dbccb4cdSShahaf Shuler priv_select_tx_function(struct priv *priv, struct rte_eth_dev *dev) 1265cdab90cbSNélio Laranjeiro { 12661cfa649bSShahaf Shuler eth_tx_burst_t tx_pkt_burst = mlx5_tx_burst; 12677fe24446SShahaf Shuler struct mlx5_dev_config *config = &priv->config; 1268dbccb4cdSShahaf Shuler uint64_t tx_offloads = dev->data->dev_conf.txmode.offloads; 1269dbccb4cdSShahaf Shuler int tso = !!(tx_offloads & (DEV_TX_OFFLOAD_TCP_TSO | 1270dbccb4cdSShahaf Shuler DEV_TX_OFFLOAD_VXLAN_TNL_TSO | 1271dbccb4cdSShahaf Shuler DEV_TX_OFFLOAD_GRE_TNL_TSO)); 1272dbccb4cdSShahaf Shuler int vlan_insert = !!(tx_offloads & DEV_TX_OFFLOAD_VLAN_INSERT); 12731cfa649bSShahaf Shuler 1274aee1b165SXueming Li assert(priv != NULL); 1275230189d9SNélio Laranjeiro /* Select appropriate TX function. */ 1276dbccb4cdSShahaf Shuler if (vlan_insert || tso) 1277dbccb4cdSShahaf Shuler return tx_pkt_burst; 12787fe24446SShahaf Shuler if (config->mps == MLX5_MPW_ENHANCED) { 1279dbccb4cdSShahaf Shuler if (priv_check_vec_tx_support(priv, dev) > 0) { 1280dbccb4cdSShahaf Shuler if (priv_check_raw_vec_tx_support(priv, dev) > 0) 12811cfa649bSShahaf Shuler tx_pkt_burst = mlx5_tx_burst_raw_vec; 12826cb559d6SYongseok Koh else 12831cfa649bSShahaf Shuler tx_pkt_burst = mlx5_tx_burst_vec; 12846cb559d6SYongseok Koh DEBUG("selected Enhanced MPW TX vectorized function"); 12856cb559d6SYongseok Koh } else { 12861cfa649bSShahaf Shuler tx_pkt_burst = mlx5_tx_burst_empw; 12876ce84bd8SYongseok Koh DEBUG("selected Enhanced MPW TX function"); 12886cb559d6SYongseok Koh } 12897fe24446SShahaf Shuler } else if (config->mps && (config->txq_inline > 0)) { 12901cfa649bSShahaf Shuler tx_pkt_burst = mlx5_tx_burst_mpw_inline; 1291230189d9SNélio Laranjeiro DEBUG("selected MPW inline TX function"); 12927fe24446SShahaf Shuler } else if (config->mps) { 12931cfa649bSShahaf Shuler tx_pkt_burst = mlx5_tx_burst_mpw; 1294230189d9SNélio Laranjeiro DEBUG("selected MPW TX function"); 12952a66cf37SYaacov Hazan } 12961cfa649bSShahaf Shuler return tx_pkt_burst; 1297cdab90cbSNélio Laranjeiro } 1298cdab90cbSNélio Laranjeiro 1299cdab90cbSNélio Laranjeiro /** 1300cdab90cbSNélio Laranjeiro * Configure the RX function to use. 1301cdab90cbSNélio Laranjeiro * 1302cdab90cbSNélio Laranjeiro * @param priv 1303aee1b165SXueming Li * Pointer to private data structure. 1304aee1b165SXueming Li * @param dev 1305aee1b165SXueming Li * Pointer to rte_eth_dev structure. 13061cfa649bSShahaf Shuler * 13071cfa649bSShahaf Shuler * @return 13081cfa649bSShahaf Shuler * Pointer to selected Rx burst function. 1309cdab90cbSNélio Laranjeiro */ 13101cfa649bSShahaf Shuler eth_rx_burst_t 13111cfa649bSShahaf Shuler priv_select_rx_function(struct priv *priv, __rte_unused struct rte_eth_dev *dev) 1312cdab90cbSNélio Laranjeiro { 13131cfa649bSShahaf Shuler eth_rx_burst_t rx_pkt_burst = mlx5_rx_burst; 13141cfa649bSShahaf Shuler 1315aee1b165SXueming Li assert(priv != NULL); 13166cb559d6SYongseok Koh if (priv_check_vec_rx_support(priv) > 0) { 13171cfa649bSShahaf Shuler rx_pkt_burst = mlx5_rx_burst_vec; 13186cb559d6SYongseok Koh DEBUG("selected RX vectorized function"); 1319cdab90cbSNélio Laranjeiro } 13201cfa649bSShahaf Shuler return rx_pkt_burst; 13216cb559d6SYongseok Koh } 1322d3e0f392SMatan Azrad 1323d3e0f392SMatan Azrad /** 1324d3e0f392SMatan Azrad * Check if mlx5 device was removed. 1325d3e0f392SMatan Azrad * 1326d3e0f392SMatan Azrad * @param dev 1327d3e0f392SMatan Azrad * Pointer to Ethernet device structure. 1328d3e0f392SMatan Azrad * 1329d3e0f392SMatan Azrad * @return 1330d3e0f392SMatan Azrad * 1 when device is removed, otherwise 0. 1331d3e0f392SMatan Azrad */ 1332d3e0f392SMatan Azrad int 1333d3e0f392SMatan Azrad mlx5_is_removed(struct rte_eth_dev *dev) 1334d3e0f392SMatan Azrad { 1335d3e0f392SMatan Azrad struct ibv_device_attr device_attr; 1336d3e0f392SMatan Azrad struct priv *priv = dev->data->dev_private; 1337d3e0f392SMatan Azrad 13380e83b8e5SNelio Laranjeiro if (mlx5_glue->query_device(priv->ctx, &device_attr) == EIO) 1339d3e0f392SMatan Azrad return 1; 1340d3e0f392SMatan Azrad return 0; 1341d3e0f392SMatan Azrad } 1342