1771fa900SAdrien Mazarguil /*- 2771fa900SAdrien Mazarguil * BSD LICENSE 3771fa900SAdrien Mazarguil * 4771fa900SAdrien Mazarguil * Copyright 2015 6WIND S.A. 5771fa900SAdrien Mazarguil * Copyright 2015 Mellanox. 6771fa900SAdrien Mazarguil * 7771fa900SAdrien Mazarguil * Redistribution and use in source and binary forms, with or without 8771fa900SAdrien Mazarguil * modification, are permitted provided that the following conditions 9771fa900SAdrien Mazarguil * are met: 10771fa900SAdrien Mazarguil * 11771fa900SAdrien Mazarguil * * Redistributions of source code must retain the above copyright 12771fa900SAdrien Mazarguil * notice, this list of conditions and the following disclaimer. 13771fa900SAdrien Mazarguil * * Redistributions in binary form must reproduce the above copyright 14771fa900SAdrien Mazarguil * notice, this list of conditions and the following disclaimer in 15771fa900SAdrien Mazarguil * the documentation and/or other materials provided with the 16771fa900SAdrien Mazarguil * distribution. 17771fa900SAdrien Mazarguil * * Neither the name of 6WIND S.A. nor the names of its 18771fa900SAdrien Mazarguil * contributors may be used to endorse or promote products derived 19771fa900SAdrien Mazarguil * from this software without specific prior written permission. 20771fa900SAdrien Mazarguil * 21771fa900SAdrien Mazarguil * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 22771fa900SAdrien Mazarguil * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 23771fa900SAdrien Mazarguil * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 24771fa900SAdrien Mazarguil * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT 25771fa900SAdrien Mazarguil * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 26771fa900SAdrien Mazarguil * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT 27771fa900SAdrien Mazarguil * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 28771fa900SAdrien Mazarguil * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 29771fa900SAdrien Mazarguil * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 30771fa900SAdrien Mazarguil * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 31771fa900SAdrien Mazarguil * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 32771fa900SAdrien Mazarguil */ 33771fa900SAdrien Mazarguil 34771fa900SAdrien Mazarguil #include <stddef.h> 35e60fbd5bSAdrien Mazarguil #include <assert.h> 36771fa900SAdrien Mazarguil #include <unistd.h> 37771fa900SAdrien Mazarguil #include <stdint.h> 38771fa900SAdrien Mazarguil #include <stdio.h> 39771fa900SAdrien Mazarguil #include <string.h> 40771fa900SAdrien Mazarguil #include <stdlib.h> 41771fa900SAdrien Mazarguil #include <errno.h> 42771fa900SAdrien Mazarguil #include <dirent.h> 43771fa900SAdrien Mazarguil #include <net/if.h> 44771fa900SAdrien Mazarguil #include <sys/ioctl.h> 45771fa900SAdrien Mazarguil #include <sys/socket.h> 46771fa900SAdrien Mazarguil #include <netinet/in.h> 47cb8faed7SAdrien Mazarguil #include <linux/ethtool.h> 48cb8faed7SAdrien Mazarguil #include <linux/sockios.h> 49198a3c33SNelio Laranjeiro #include <fcntl.h> 50771fa900SAdrien Mazarguil 51771fa900SAdrien Mazarguil /* DPDK headers don't like -pedantic. */ 52771fa900SAdrien Mazarguil #ifdef PEDANTIC 53fc5b160fSBruce Richardson #pragma GCC diagnostic ignored "-Wpedantic" 54771fa900SAdrien Mazarguil #endif 55771fa900SAdrien Mazarguil #include <rte_atomic.h> 56771fa900SAdrien Mazarguil #include <rte_ethdev.h> 57771fa900SAdrien Mazarguil #include <rte_mbuf.h> 58771fa900SAdrien Mazarguil #include <rte_common.h> 59198a3c33SNelio Laranjeiro #include <rte_interrupts.h> 60198a3c33SNelio Laranjeiro #include <rte_alarm.h> 61a48deadaSOr Ami #include <rte_malloc.h> 62771fa900SAdrien Mazarguil #ifdef PEDANTIC 63fc5b160fSBruce Richardson #pragma GCC diagnostic error "-Wpedantic" 64771fa900SAdrien Mazarguil #endif 65771fa900SAdrien Mazarguil 66771fa900SAdrien Mazarguil #include "mlx5.h" 67e60fbd5bSAdrien Mazarguil #include "mlx5_rxtx.h" 68771fa900SAdrien Mazarguil #include "mlx5_utils.h" 69771fa900SAdrien Mazarguil 70771fa900SAdrien Mazarguil /** 71a48deadaSOr Ami * Return private structure associated with an Ethernet device. 72a48deadaSOr Ami * 73a48deadaSOr Ami * @param dev 74a48deadaSOr Ami * Pointer to Ethernet device structure. 75a48deadaSOr Ami * 76a48deadaSOr Ami * @return 77a48deadaSOr Ami * Pointer to private structure. 78a48deadaSOr Ami */ 79a48deadaSOr Ami struct priv * 80a48deadaSOr Ami mlx5_get_priv(struct rte_eth_dev *dev) 81a48deadaSOr Ami { 82a48deadaSOr Ami struct mlx5_secondary_data *sd; 83a48deadaSOr Ami 84a48deadaSOr Ami if (!mlx5_is_secondary()) 85a48deadaSOr Ami return dev->data->dev_private; 86a48deadaSOr Ami sd = &mlx5_secondary_data[dev->data->port_id]; 87a48deadaSOr Ami return sd->data.dev_private; 88a48deadaSOr Ami } 89a48deadaSOr Ami 90a48deadaSOr Ami /** 91a48deadaSOr Ami * Check if running as a secondary process. 92a48deadaSOr Ami * 93a48deadaSOr Ami * @return 94a48deadaSOr Ami * Nonzero if running as a secondary process. 95a48deadaSOr Ami */ 96a48deadaSOr Ami inline int 97a48deadaSOr Ami mlx5_is_secondary(void) 98a48deadaSOr Ami { 99a48deadaSOr Ami return rte_eal_process_type() != RTE_PROC_PRIMARY; 100a48deadaSOr Ami } 101a48deadaSOr Ami 102a48deadaSOr Ami /** 103771fa900SAdrien Mazarguil * Get interface name from private structure. 104771fa900SAdrien Mazarguil * 105771fa900SAdrien Mazarguil * @param[in] priv 106771fa900SAdrien Mazarguil * Pointer to private structure. 107771fa900SAdrien Mazarguil * @param[out] ifname 108771fa900SAdrien Mazarguil * Interface name output buffer. 109771fa900SAdrien Mazarguil * 110771fa900SAdrien Mazarguil * @return 111771fa900SAdrien Mazarguil * 0 on success, -1 on failure and errno is set. 112771fa900SAdrien Mazarguil */ 113771fa900SAdrien Mazarguil int 114771fa900SAdrien Mazarguil priv_get_ifname(const struct priv *priv, char (*ifname)[IF_NAMESIZE]) 115771fa900SAdrien Mazarguil { 116771fa900SAdrien Mazarguil DIR *dir; 117771fa900SAdrien Mazarguil struct dirent *dent; 118771fa900SAdrien Mazarguil unsigned int dev_type = 0; 119771fa900SAdrien Mazarguil unsigned int dev_port_prev = ~0u; 120771fa900SAdrien Mazarguil char match[IF_NAMESIZE] = ""; 121771fa900SAdrien Mazarguil 122771fa900SAdrien Mazarguil { 123771fa900SAdrien Mazarguil MKSTR(path, "%s/device/net", priv->ctx->device->ibdev_path); 124771fa900SAdrien Mazarguil 125771fa900SAdrien Mazarguil dir = opendir(path); 126771fa900SAdrien Mazarguil if (dir == NULL) 127771fa900SAdrien Mazarguil return -1; 128771fa900SAdrien Mazarguil } 129771fa900SAdrien Mazarguil while ((dent = readdir(dir)) != NULL) { 130771fa900SAdrien Mazarguil char *name = dent->d_name; 131771fa900SAdrien Mazarguil FILE *file; 132771fa900SAdrien Mazarguil unsigned int dev_port; 133771fa900SAdrien Mazarguil int r; 134771fa900SAdrien Mazarguil 135771fa900SAdrien Mazarguil if ((name[0] == '.') && 136771fa900SAdrien Mazarguil ((name[1] == '\0') || 137771fa900SAdrien Mazarguil ((name[1] == '.') && (name[2] == '\0')))) 138771fa900SAdrien Mazarguil continue; 139771fa900SAdrien Mazarguil 140771fa900SAdrien Mazarguil MKSTR(path, "%s/device/net/%s/%s", 141771fa900SAdrien Mazarguil priv->ctx->device->ibdev_path, name, 142771fa900SAdrien Mazarguil (dev_type ? "dev_id" : "dev_port")); 143771fa900SAdrien Mazarguil 144771fa900SAdrien Mazarguil file = fopen(path, "rb"); 145771fa900SAdrien Mazarguil if (file == NULL) { 146771fa900SAdrien Mazarguil if (errno != ENOENT) 147771fa900SAdrien Mazarguil continue; 148771fa900SAdrien Mazarguil /* 149771fa900SAdrien Mazarguil * Switch to dev_id when dev_port does not exist as 150771fa900SAdrien Mazarguil * is the case with Linux kernel versions < 3.15. 151771fa900SAdrien Mazarguil */ 152771fa900SAdrien Mazarguil try_dev_id: 153771fa900SAdrien Mazarguil match[0] = '\0'; 154771fa900SAdrien Mazarguil if (dev_type) 155771fa900SAdrien Mazarguil break; 156771fa900SAdrien Mazarguil dev_type = 1; 157771fa900SAdrien Mazarguil dev_port_prev = ~0u; 158771fa900SAdrien Mazarguil rewinddir(dir); 159771fa900SAdrien Mazarguil continue; 160771fa900SAdrien Mazarguil } 161771fa900SAdrien Mazarguil r = fscanf(file, (dev_type ? "%x" : "%u"), &dev_port); 162771fa900SAdrien Mazarguil fclose(file); 163771fa900SAdrien Mazarguil if (r != 1) 164771fa900SAdrien Mazarguil continue; 165771fa900SAdrien Mazarguil /* 166771fa900SAdrien Mazarguil * Switch to dev_id when dev_port returns the same value for 167771fa900SAdrien Mazarguil * all ports. May happen when using a MOFED release older than 168771fa900SAdrien Mazarguil * 3.0 with a Linux kernel >= 3.15. 169771fa900SAdrien Mazarguil */ 170771fa900SAdrien Mazarguil if (dev_port == dev_port_prev) 171771fa900SAdrien Mazarguil goto try_dev_id; 172771fa900SAdrien Mazarguil dev_port_prev = dev_port; 173771fa900SAdrien Mazarguil if (dev_port == (priv->port - 1u)) 174771fa900SAdrien Mazarguil snprintf(match, sizeof(match), "%s", name); 175771fa900SAdrien Mazarguil } 176771fa900SAdrien Mazarguil closedir(dir); 177771fa900SAdrien Mazarguil if (match[0] == '\0') 178771fa900SAdrien Mazarguil return -1; 179771fa900SAdrien Mazarguil strncpy(*ifname, match, sizeof(*ifname)); 180771fa900SAdrien Mazarguil return 0; 181771fa900SAdrien Mazarguil } 182771fa900SAdrien Mazarguil 183771fa900SAdrien Mazarguil /** 184771fa900SAdrien Mazarguil * Read from sysfs entry. 185771fa900SAdrien Mazarguil * 186771fa900SAdrien Mazarguil * @param[in] priv 187771fa900SAdrien Mazarguil * Pointer to private structure. 188771fa900SAdrien Mazarguil * @param[in] entry 189771fa900SAdrien Mazarguil * Entry name relative to sysfs path. 190771fa900SAdrien Mazarguil * @param[out] buf 191771fa900SAdrien Mazarguil * Data output buffer. 192771fa900SAdrien Mazarguil * @param size 193771fa900SAdrien Mazarguil * Buffer size. 194771fa900SAdrien Mazarguil * 195771fa900SAdrien Mazarguil * @return 196771fa900SAdrien Mazarguil * 0 on success, -1 on failure and errno is set. 197771fa900SAdrien Mazarguil */ 198771fa900SAdrien Mazarguil static int 199771fa900SAdrien Mazarguil priv_sysfs_read(const struct priv *priv, const char *entry, 200771fa900SAdrien Mazarguil char *buf, size_t size) 201771fa900SAdrien Mazarguil { 202771fa900SAdrien Mazarguil char ifname[IF_NAMESIZE]; 203771fa900SAdrien Mazarguil FILE *file; 204771fa900SAdrien Mazarguil int ret; 205771fa900SAdrien Mazarguil int err; 206771fa900SAdrien Mazarguil 207771fa900SAdrien Mazarguil if (priv_get_ifname(priv, &ifname)) 208771fa900SAdrien Mazarguil return -1; 209771fa900SAdrien Mazarguil 210771fa900SAdrien Mazarguil MKSTR(path, "%s/device/net/%s/%s", priv->ctx->device->ibdev_path, 211771fa900SAdrien Mazarguil ifname, entry); 212771fa900SAdrien Mazarguil 213771fa900SAdrien Mazarguil file = fopen(path, "rb"); 214771fa900SAdrien Mazarguil if (file == NULL) 215771fa900SAdrien Mazarguil return -1; 216771fa900SAdrien Mazarguil ret = fread(buf, 1, size, file); 217771fa900SAdrien Mazarguil err = errno; 218771fa900SAdrien Mazarguil if (((size_t)ret < size) && (ferror(file))) 219771fa900SAdrien Mazarguil ret = -1; 220771fa900SAdrien Mazarguil else 221771fa900SAdrien Mazarguil ret = size; 222771fa900SAdrien Mazarguil fclose(file); 223771fa900SAdrien Mazarguil errno = err; 224771fa900SAdrien Mazarguil return ret; 225771fa900SAdrien Mazarguil } 226771fa900SAdrien Mazarguil 227771fa900SAdrien Mazarguil /** 228771fa900SAdrien Mazarguil * Write to sysfs entry. 229771fa900SAdrien Mazarguil * 230771fa900SAdrien Mazarguil * @param[in] priv 231771fa900SAdrien Mazarguil * Pointer to private structure. 232771fa900SAdrien Mazarguil * @param[in] entry 233771fa900SAdrien Mazarguil * Entry name relative to sysfs path. 234771fa900SAdrien Mazarguil * @param[in] buf 235771fa900SAdrien Mazarguil * Data buffer. 236771fa900SAdrien Mazarguil * @param size 237771fa900SAdrien Mazarguil * Buffer size. 238771fa900SAdrien Mazarguil * 239771fa900SAdrien Mazarguil * @return 240771fa900SAdrien Mazarguil * 0 on success, -1 on failure and errno is set. 241771fa900SAdrien Mazarguil */ 242771fa900SAdrien Mazarguil static int 243771fa900SAdrien Mazarguil priv_sysfs_write(const struct priv *priv, const char *entry, 244771fa900SAdrien Mazarguil char *buf, size_t size) 245771fa900SAdrien Mazarguil { 246771fa900SAdrien Mazarguil char ifname[IF_NAMESIZE]; 247771fa900SAdrien Mazarguil FILE *file; 248771fa900SAdrien Mazarguil int ret; 249771fa900SAdrien Mazarguil int err; 250771fa900SAdrien Mazarguil 251771fa900SAdrien Mazarguil if (priv_get_ifname(priv, &ifname)) 252771fa900SAdrien Mazarguil return -1; 253771fa900SAdrien Mazarguil 254771fa900SAdrien Mazarguil MKSTR(path, "%s/device/net/%s/%s", priv->ctx->device->ibdev_path, 255771fa900SAdrien Mazarguil ifname, entry); 256771fa900SAdrien Mazarguil 257771fa900SAdrien Mazarguil file = fopen(path, "wb"); 258771fa900SAdrien Mazarguil if (file == NULL) 259771fa900SAdrien Mazarguil return -1; 260771fa900SAdrien Mazarguil ret = fwrite(buf, 1, size, file); 261771fa900SAdrien Mazarguil err = errno; 262771fa900SAdrien Mazarguil if (((size_t)ret < size) || (ferror(file))) 263771fa900SAdrien Mazarguil ret = -1; 264771fa900SAdrien Mazarguil else 265771fa900SAdrien Mazarguil ret = size; 266771fa900SAdrien Mazarguil fclose(file); 267771fa900SAdrien Mazarguil errno = err; 268771fa900SAdrien Mazarguil return ret; 269771fa900SAdrien Mazarguil } 270771fa900SAdrien Mazarguil 271771fa900SAdrien Mazarguil /** 272771fa900SAdrien Mazarguil * Get unsigned long sysfs property. 273771fa900SAdrien Mazarguil * 274771fa900SAdrien Mazarguil * @param priv 275771fa900SAdrien Mazarguil * Pointer to private structure. 276771fa900SAdrien Mazarguil * @param[in] name 277771fa900SAdrien Mazarguil * Entry name relative to sysfs path. 278771fa900SAdrien Mazarguil * @param[out] value 279771fa900SAdrien Mazarguil * Value output buffer. 280771fa900SAdrien Mazarguil * 281771fa900SAdrien Mazarguil * @return 282771fa900SAdrien Mazarguil * 0 on success, -1 on failure and errno is set. 283771fa900SAdrien Mazarguil */ 284771fa900SAdrien Mazarguil static int 285771fa900SAdrien Mazarguil priv_get_sysfs_ulong(struct priv *priv, const char *name, unsigned long *value) 286771fa900SAdrien Mazarguil { 287771fa900SAdrien Mazarguil int ret; 288771fa900SAdrien Mazarguil unsigned long value_ret; 289771fa900SAdrien Mazarguil char value_str[32]; 290771fa900SAdrien Mazarguil 291771fa900SAdrien Mazarguil ret = priv_sysfs_read(priv, name, value_str, (sizeof(value_str) - 1)); 292771fa900SAdrien Mazarguil if (ret == -1) { 293771fa900SAdrien Mazarguil DEBUG("cannot read %s value from sysfs: %s", 294771fa900SAdrien Mazarguil name, strerror(errno)); 295771fa900SAdrien Mazarguil return -1; 296771fa900SAdrien Mazarguil } 297771fa900SAdrien Mazarguil value_str[ret] = '\0'; 298771fa900SAdrien Mazarguil errno = 0; 299771fa900SAdrien Mazarguil value_ret = strtoul(value_str, NULL, 0); 300771fa900SAdrien Mazarguil if (errno) { 301771fa900SAdrien Mazarguil DEBUG("invalid %s value `%s': %s", name, value_str, 302771fa900SAdrien Mazarguil strerror(errno)); 303771fa900SAdrien Mazarguil return -1; 304771fa900SAdrien Mazarguil } 305771fa900SAdrien Mazarguil *value = value_ret; 306771fa900SAdrien Mazarguil return 0; 307771fa900SAdrien Mazarguil } 308771fa900SAdrien Mazarguil 309771fa900SAdrien Mazarguil /** 310771fa900SAdrien Mazarguil * Set unsigned long sysfs property. 311771fa900SAdrien Mazarguil * 312771fa900SAdrien Mazarguil * @param priv 313771fa900SAdrien Mazarguil * Pointer to private structure. 314771fa900SAdrien Mazarguil * @param[in] name 315771fa900SAdrien Mazarguil * Entry name relative to sysfs path. 316771fa900SAdrien Mazarguil * @param value 317771fa900SAdrien Mazarguil * Value to set. 318771fa900SAdrien Mazarguil * 319771fa900SAdrien Mazarguil * @return 320771fa900SAdrien Mazarguil * 0 on success, -1 on failure and errno is set. 321771fa900SAdrien Mazarguil */ 322771fa900SAdrien Mazarguil static int 323771fa900SAdrien Mazarguil priv_set_sysfs_ulong(struct priv *priv, const char *name, unsigned long value) 324771fa900SAdrien Mazarguil { 325771fa900SAdrien Mazarguil int ret; 326771fa900SAdrien Mazarguil MKSTR(value_str, "%lu", value); 327771fa900SAdrien Mazarguil 328771fa900SAdrien Mazarguil ret = priv_sysfs_write(priv, name, value_str, (sizeof(value_str) - 1)); 329771fa900SAdrien Mazarguil if (ret == -1) { 330771fa900SAdrien Mazarguil DEBUG("cannot write %s `%s' (%lu) to sysfs: %s", 331771fa900SAdrien Mazarguil name, value_str, value, strerror(errno)); 332771fa900SAdrien Mazarguil return -1; 333771fa900SAdrien Mazarguil } 334771fa900SAdrien Mazarguil return 0; 335771fa900SAdrien Mazarguil } 336771fa900SAdrien Mazarguil 337771fa900SAdrien Mazarguil /** 338771fa900SAdrien Mazarguil * Perform ifreq ioctl() on associated Ethernet device. 339771fa900SAdrien Mazarguil * 340771fa900SAdrien Mazarguil * @param[in] priv 341771fa900SAdrien Mazarguil * Pointer to private structure. 342771fa900SAdrien Mazarguil * @param req 343771fa900SAdrien Mazarguil * Request number to pass to ioctl(). 344771fa900SAdrien Mazarguil * @param[out] ifr 345771fa900SAdrien Mazarguil * Interface request structure output buffer. 346771fa900SAdrien Mazarguil * 347771fa900SAdrien Mazarguil * @return 348771fa900SAdrien Mazarguil * 0 on success, -1 on failure and errno is set. 349771fa900SAdrien Mazarguil */ 350771fa900SAdrien Mazarguil int 351771fa900SAdrien Mazarguil priv_ifreq(const struct priv *priv, int req, struct ifreq *ifr) 352771fa900SAdrien Mazarguil { 353771fa900SAdrien Mazarguil int sock = socket(PF_INET, SOCK_DGRAM, IPPROTO_IP); 354771fa900SAdrien Mazarguil int ret = -1; 355771fa900SAdrien Mazarguil 356771fa900SAdrien Mazarguil if (sock == -1) 357771fa900SAdrien Mazarguil return ret; 358771fa900SAdrien Mazarguil if (priv_get_ifname(priv, &ifr->ifr_name) == 0) 359771fa900SAdrien Mazarguil ret = ioctl(sock, req, ifr); 360771fa900SAdrien Mazarguil close(sock); 361771fa900SAdrien Mazarguil return ret; 362771fa900SAdrien Mazarguil } 363771fa900SAdrien Mazarguil 364771fa900SAdrien Mazarguil /** 36585e347dbSNélio Laranjeiro * Return the number of active VFs for the current device. 36685e347dbSNélio Laranjeiro * 36785e347dbSNélio Laranjeiro * @param[in] priv 36885e347dbSNélio Laranjeiro * Pointer to private structure. 36985e347dbSNélio Laranjeiro * @param[out] num_vfs 37085e347dbSNélio Laranjeiro * Number of active VFs. 37185e347dbSNélio Laranjeiro * 37285e347dbSNélio Laranjeiro * @return 37385e347dbSNélio Laranjeiro * 0 on success, -1 on failure and errno is set. 37485e347dbSNélio Laranjeiro */ 37585e347dbSNélio Laranjeiro int 37685e347dbSNélio Laranjeiro priv_get_num_vfs(struct priv *priv, uint16_t *num_vfs) 37785e347dbSNélio Laranjeiro { 37885e347dbSNélio Laranjeiro /* The sysfs entry name depends on the operating system. */ 37985e347dbSNélio Laranjeiro const char **name = (const char *[]){ 38085e347dbSNélio Laranjeiro "device/sriov_numvfs", 38185e347dbSNélio Laranjeiro "device/mlx5_num_vfs", 38285e347dbSNélio Laranjeiro NULL, 38385e347dbSNélio Laranjeiro }; 38485e347dbSNélio Laranjeiro int ret; 38585e347dbSNélio Laranjeiro 38685e347dbSNélio Laranjeiro do { 38785e347dbSNélio Laranjeiro unsigned long ulong_num_vfs; 38885e347dbSNélio Laranjeiro 38985e347dbSNélio Laranjeiro ret = priv_get_sysfs_ulong(priv, *name, &ulong_num_vfs); 39085e347dbSNélio Laranjeiro if (!ret) 39185e347dbSNélio Laranjeiro *num_vfs = ulong_num_vfs; 39285e347dbSNélio Laranjeiro } while (*(++name) && ret); 39385e347dbSNélio Laranjeiro return ret; 39485e347dbSNélio Laranjeiro } 39585e347dbSNélio Laranjeiro 39685e347dbSNélio Laranjeiro /** 397771fa900SAdrien Mazarguil * Get device MTU. 398771fa900SAdrien Mazarguil * 399771fa900SAdrien Mazarguil * @param priv 400771fa900SAdrien Mazarguil * Pointer to private structure. 401771fa900SAdrien Mazarguil * @param[out] mtu 402771fa900SAdrien Mazarguil * MTU value output buffer. 403771fa900SAdrien Mazarguil * 404771fa900SAdrien Mazarguil * @return 405771fa900SAdrien Mazarguil * 0 on success, -1 on failure and errno is set. 406771fa900SAdrien Mazarguil */ 407771fa900SAdrien Mazarguil int 408771fa900SAdrien Mazarguil priv_get_mtu(struct priv *priv, uint16_t *mtu) 409771fa900SAdrien Mazarguil { 410771fa900SAdrien Mazarguil unsigned long ulong_mtu; 411771fa900SAdrien Mazarguil 412771fa900SAdrien Mazarguil if (priv_get_sysfs_ulong(priv, "mtu", &ulong_mtu) == -1) 413771fa900SAdrien Mazarguil return -1; 414771fa900SAdrien Mazarguil *mtu = ulong_mtu; 415771fa900SAdrien Mazarguil return 0; 416771fa900SAdrien Mazarguil } 417771fa900SAdrien Mazarguil 418771fa900SAdrien Mazarguil /** 419cf37ca95SAdrien Mazarguil * Set device MTU. 420cf37ca95SAdrien Mazarguil * 421cf37ca95SAdrien Mazarguil * @param priv 422cf37ca95SAdrien Mazarguil * Pointer to private structure. 423cf37ca95SAdrien Mazarguil * @param mtu 424cf37ca95SAdrien Mazarguil * MTU value to set. 425cf37ca95SAdrien Mazarguil * 426cf37ca95SAdrien Mazarguil * @return 427cf37ca95SAdrien Mazarguil * 0 on success, -1 on failure and errno is set. 428cf37ca95SAdrien Mazarguil */ 429cf37ca95SAdrien Mazarguil static int 430cf37ca95SAdrien Mazarguil priv_set_mtu(struct priv *priv, uint16_t mtu) 431cf37ca95SAdrien Mazarguil { 432f3b492d7SAdrien Mazarguil uint16_t new_mtu; 433f3b492d7SAdrien Mazarguil 434f3b492d7SAdrien Mazarguil if (priv_set_sysfs_ulong(priv, "mtu", mtu) || 435f3b492d7SAdrien Mazarguil priv_get_mtu(priv, &new_mtu)) 436f3b492d7SAdrien Mazarguil return -1; 437f3b492d7SAdrien Mazarguil if (new_mtu == mtu) 438f3b492d7SAdrien Mazarguil return 0; 439f3b492d7SAdrien Mazarguil errno = EINVAL; 440f3b492d7SAdrien Mazarguil return -1; 441cf37ca95SAdrien Mazarguil } 442cf37ca95SAdrien Mazarguil 443cf37ca95SAdrien Mazarguil /** 444771fa900SAdrien Mazarguil * Set device flags. 445771fa900SAdrien Mazarguil * 446771fa900SAdrien Mazarguil * @param priv 447771fa900SAdrien Mazarguil * Pointer to private structure. 448771fa900SAdrien Mazarguil * @param keep 449771fa900SAdrien Mazarguil * Bitmask for flags that must remain untouched. 450771fa900SAdrien Mazarguil * @param flags 451771fa900SAdrien Mazarguil * Bitmask for flags to modify. 452771fa900SAdrien Mazarguil * 453771fa900SAdrien Mazarguil * @return 454771fa900SAdrien Mazarguil * 0 on success, -1 on failure and errno is set. 455771fa900SAdrien Mazarguil */ 456771fa900SAdrien Mazarguil int 457771fa900SAdrien Mazarguil priv_set_flags(struct priv *priv, unsigned int keep, unsigned int flags) 458771fa900SAdrien Mazarguil { 459771fa900SAdrien Mazarguil unsigned long tmp; 460771fa900SAdrien Mazarguil 461771fa900SAdrien Mazarguil if (priv_get_sysfs_ulong(priv, "flags", &tmp) == -1) 462771fa900SAdrien Mazarguil return -1; 463771fa900SAdrien Mazarguil tmp &= keep; 46433242e3eSOlivier Matz tmp |= (flags & (~keep)); 465771fa900SAdrien Mazarguil return priv_set_sysfs_ulong(priv, "flags", tmp); 466771fa900SAdrien Mazarguil } 467771fa900SAdrien Mazarguil 468771fa900SAdrien Mazarguil /** 469e60fbd5bSAdrien Mazarguil * Ethernet device configuration. 470e60fbd5bSAdrien Mazarguil * 471e60fbd5bSAdrien Mazarguil * Prepare the driver for a given number of TX and RX queues. 472e60fbd5bSAdrien Mazarguil * 473e60fbd5bSAdrien Mazarguil * @param dev 474e60fbd5bSAdrien Mazarguil * Pointer to Ethernet device structure. 475e60fbd5bSAdrien Mazarguil * 476e60fbd5bSAdrien Mazarguil * @return 477e60fbd5bSAdrien Mazarguil * 0 on success, errno value on failure. 478e60fbd5bSAdrien Mazarguil */ 479e60fbd5bSAdrien Mazarguil static int 480e60fbd5bSAdrien Mazarguil dev_configure(struct rte_eth_dev *dev) 481e60fbd5bSAdrien Mazarguil { 482e60fbd5bSAdrien Mazarguil struct priv *priv = dev->data->dev_private; 483e60fbd5bSAdrien Mazarguil unsigned int rxqs_n = dev->data->nb_rx_queues; 484e60fbd5bSAdrien Mazarguil unsigned int txqs_n = dev->data->nb_tx_queues; 485634efbc2SNelio Laranjeiro unsigned int i; 486634efbc2SNelio Laranjeiro unsigned int j; 487634efbc2SNelio Laranjeiro unsigned int reta_idx_n; 488e60fbd5bSAdrien Mazarguil 489c64ccc0eSNélio Laranjeiro priv->rss_hf = dev->data->dev_conf.rx_adv_conf.rss_conf.rss_hf; 490e60fbd5bSAdrien Mazarguil priv->rxqs = (void *)dev->data->rx_queues; 491e60fbd5bSAdrien Mazarguil priv->txqs = (void *)dev->data->tx_queues; 492e60fbd5bSAdrien Mazarguil if (txqs_n != priv->txqs_n) { 493e60fbd5bSAdrien Mazarguil INFO("%p: TX queues number update: %u -> %u", 494e60fbd5bSAdrien Mazarguil (void *)dev, priv->txqs_n, txqs_n); 495e60fbd5bSAdrien Mazarguil priv->txqs_n = txqs_n; 496e60fbd5bSAdrien Mazarguil } 497634efbc2SNelio Laranjeiro if (rxqs_n > priv->ind_table_max_size) { 498634efbc2SNelio Laranjeiro ERROR("cannot handle this many RX queues (%u)", rxqs_n); 499634efbc2SNelio Laranjeiro return EINVAL; 500634efbc2SNelio Laranjeiro } 501e60fbd5bSAdrien Mazarguil if (rxqs_n == priv->rxqs_n) 502e60fbd5bSAdrien Mazarguil return 0; 503e60fbd5bSAdrien Mazarguil INFO("%p: RX queues number update: %u -> %u", 504e60fbd5bSAdrien Mazarguil (void *)dev, priv->rxqs_n, rxqs_n); 505e60fbd5bSAdrien Mazarguil priv->rxqs_n = rxqs_n; 506634efbc2SNelio Laranjeiro /* If the requested number of RX queues is not a power of two, use the 507634efbc2SNelio Laranjeiro * maximum indirection table size for better balancing. 508634efbc2SNelio Laranjeiro * The result is always rounded to the next power of two. */ 509634efbc2SNelio Laranjeiro reta_idx_n = (1 << log2above((rxqs_n & (rxqs_n - 1)) ? 510634efbc2SNelio Laranjeiro priv->ind_table_max_size : 511634efbc2SNelio Laranjeiro rxqs_n)); 512634efbc2SNelio Laranjeiro if (priv_rss_reta_index_resize(priv, reta_idx_n)) 513634efbc2SNelio Laranjeiro return ENOMEM; 514634efbc2SNelio Laranjeiro /* When the number of RX queues is not a power of two, the remaining 515634efbc2SNelio Laranjeiro * table entries are padded with reused WQs and hashes are not spread 516634efbc2SNelio Laranjeiro * uniformly. */ 517634efbc2SNelio Laranjeiro for (i = 0, j = 0; (i != reta_idx_n); ++i) { 518634efbc2SNelio Laranjeiro (*priv->reta_idx)[i] = j; 519634efbc2SNelio Laranjeiro if (++j == rxqs_n) 520634efbc2SNelio Laranjeiro j = 0; 521634efbc2SNelio Laranjeiro } 522e60fbd5bSAdrien Mazarguil return 0; 523e60fbd5bSAdrien Mazarguil } 524e60fbd5bSAdrien Mazarguil 525e60fbd5bSAdrien Mazarguil /** 526e60fbd5bSAdrien Mazarguil * DPDK callback for Ethernet device configuration. 527e60fbd5bSAdrien Mazarguil * 528e60fbd5bSAdrien Mazarguil * @param dev 529e60fbd5bSAdrien Mazarguil * Pointer to Ethernet device structure. 530e60fbd5bSAdrien Mazarguil * 531e60fbd5bSAdrien Mazarguil * @return 532e60fbd5bSAdrien Mazarguil * 0 on success, negative errno value on failure. 533e60fbd5bSAdrien Mazarguil */ 534e60fbd5bSAdrien Mazarguil int 535e60fbd5bSAdrien Mazarguil mlx5_dev_configure(struct rte_eth_dev *dev) 536e60fbd5bSAdrien Mazarguil { 537e60fbd5bSAdrien Mazarguil struct priv *priv = dev->data->dev_private; 538e60fbd5bSAdrien Mazarguil int ret; 539e60fbd5bSAdrien Mazarguil 540a48deadaSOr Ami if (mlx5_is_secondary()) 541a48deadaSOr Ami return -E_RTE_SECONDARY; 542a48deadaSOr Ami 543e60fbd5bSAdrien Mazarguil priv_lock(priv); 544e60fbd5bSAdrien Mazarguil ret = dev_configure(dev); 545e60fbd5bSAdrien Mazarguil assert(ret >= 0); 546e60fbd5bSAdrien Mazarguil priv_unlock(priv); 547e60fbd5bSAdrien Mazarguil return -ret; 548e60fbd5bSAdrien Mazarguil } 549e60fbd5bSAdrien Mazarguil 550e60fbd5bSAdrien Mazarguil /** 551e60fbd5bSAdrien Mazarguil * DPDK callback to get information about the device. 552e60fbd5bSAdrien Mazarguil * 553e60fbd5bSAdrien Mazarguil * @param dev 554e60fbd5bSAdrien Mazarguil * Pointer to Ethernet device structure. 555e60fbd5bSAdrien Mazarguil * @param[out] info 556e60fbd5bSAdrien Mazarguil * Info structure output buffer. 557e60fbd5bSAdrien Mazarguil */ 558e60fbd5bSAdrien Mazarguil void 559e60fbd5bSAdrien Mazarguil mlx5_dev_infos_get(struct rte_eth_dev *dev, struct rte_eth_dev_info *info) 560e60fbd5bSAdrien Mazarguil { 561a48deadaSOr Ami struct priv *priv = mlx5_get_priv(dev); 562e60fbd5bSAdrien Mazarguil unsigned int max; 563e60fbd5bSAdrien Mazarguil char ifname[IF_NAMESIZE]; 564e60fbd5bSAdrien Mazarguil 565e60fbd5bSAdrien Mazarguil priv_lock(priv); 566e60fbd5bSAdrien Mazarguil /* FIXME: we should ask the device for these values. */ 567e60fbd5bSAdrien Mazarguil info->min_rx_bufsize = 32; 568e60fbd5bSAdrien Mazarguil info->max_rx_pktlen = 65536; 569e60fbd5bSAdrien Mazarguil /* 570e60fbd5bSAdrien Mazarguil * Since we need one CQ per QP, the limit is the minimum number 571e60fbd5bSAdrien Mazarguil * between the two values. 572e60fbd5bSAdrien Mazarguil */ 573e60fbd5bSAdrien Mazarguil max = ((priv->device_attr.max_cq > priv->device_attr.max_qp) ? 574e60fbd5bSAdrien Mazarguil priv->device_attr.max_qp : priv->device_attr.max_cq); 575e60fbd5bSAdrien Mazarguil /* If max >= 65535 then max = 0, max_rx_queues is uint16_t. */ 576e60fbd5bSAdrien Mazarguil if (max >= 65535) 577e60fbd5bSAdrien Mazarguil max = 65535; 578e60fbd5bSAdrien Mazarguil info->max_rx_queues = max; 579e60fbd5bSAdrien Mazarguil info->max_tx_queues = max; 5800497ddaaSYaacov Hazan info->max_mac_addrs = RTE_DIM(priv->mac); 581e60fbd5bSAdrien Mazarguil info->rx_offload_capa = 582e60fbd5bSAdrien Mazarguil (priv->hw_csum ? 583e60fbd5bSAdrien Mazarguil (DEV_RX_OFFLOAD_IPV4_CKSUM | 584e60fbd5bSAdrien Mazarguil DEV_RX_OFFLOAD_UDP_CKSUM | 585e60fbd5bSAdrien Mazarguil DEV_RX_OFFLOAD_TCP_CKSUM) : 586f08b6e71SAdrien Mazarguil 0) | 587f08b6e71SAdrien Mazarguil (priv->hw_vlan_strip ? DEV_RX_OFFLOAD_VLAN_STRIP : 0); 588230189d9SNélio Laranjeiro if (!priv->mps) 589e192ef80SYaacov Hazan info->tx_offload_capa = DEV_TX_OFFLOAD_VLAN_INSERT; 590e192ef80SYaacov Hazan if (priv->hw_csum) 591e192ef80SYaacov Hazan info->tx_offload_capa |= 592e60fbd5bSAdrien Mazarguil (DEV_TX_OFFLOAD_IPV4_CKSUM | 593e60fbd5bSAdrien Mazarguil DEV_TX_OFFLOAD_UDP_CKSUM | 594e192ef80SYaacov Hazan DEV_TX_OFFLOAD_TCP_CKSUM); 595e60fbd5bSAdrien Mazarguil if (priv_get_ifname(priv, &ifname) == 0) 596e60fbd5bSAdrien Mazarguil info->if_index = if_nametoindex(ifname); 597634efbc2SNelio Laranjeiro /* FIXME: RETA update/query API expects the callee to know the size of 598634efbc2SNelio Laranjeiro * the indirection table, for this PMD the size varies depending on 599634efbc2SNelio Laranjeiro * the number of RX queues, it becomes impossible to find the correct 600634efbc2SNelio Laranjeiro * size if it is not fixed. 601634efbc2SNelio Laranjeiro * The API should be updated to solve this problem. */ 602634efbc2SNelio Laranjeiro info->reta_size = priv->ind_table_max_size; 603e274f573SMarc Sune info->speed_capa = 604e274f573SMarc Sune ETH_LINK_SPEED_1G | 605e274f573SMarc Sune ETH_LINK_SPEED_10G | 606e274f573SMarc Sune ETH_LINK_SPEED_20G | 607e274f573SMarc Sune ETH_LINK_SPEED_25G | 608e274f573SMarc Sune ETH_LINK_SPEED_40G | 609e274f573SMarc Sune ETH_LINK_SPEED_50G | 610b2feed01SThomas Monjalon ETH_LINK_SPEED_56G | 611b2feed01SThomas Monjalon ETH_LINK_SPEED_100G; 612e60fbd5bSAdrien Mazarguil priv_unlock(priv); 613e60fbd5bSAdrien Mazarguil } 614e60fbd5bSAdrien Mazarguil 61578a38edfSJianfeng Tan const uint32_t * 61678a38edfSJianfeng Tan mlx5_dev_supported_ptypes_get(struct rte_eth_dev *dev) 61778a38edfSJianfeng Tan { 61878a38edfSJianfeng Tan static const uint32_t ptypes[] = { 61978a38edfSJianfeng Tan /* refers to rxq_cq_to_pkt_type() */ 62078a38edfSJianfeng Tan RTE_PTYPE_L3_IPV4, 62178a38edfSJianfeng Tan RTE_PTYPE_L3_IPV6, 62278a38edfSJianfeng Tan RTE_PTYPE_INNER_L3_IPV4, 62378a38edfSJianfeng Tan RTE_PTYPE_INNER_L3_IPV6, 62478a38edfSJianfeng Tan RTE_PTYPE_UNKNOWN 62578a38edfSJianfeng Tan 62678a38edfSJianfeng Tan }; 62778a38edfSJianfeng Tan 6283f5ac8f2SNélio Laranjeiro if (dev->rx_pkt_burst == mlx5_rx_burst) 62978a38edfSJianfeng Tan return ptypes; 63078a38edfSJianfeng Tan return NULL; 63178a38edfSJianfeng Tan } 63278a38edfSJianfeng Tan 633e60fbd5bSAdrien Mazarguil /** 634cb8faed7SAdrien Mazarguil * DPDK callback to retrieve physical link information (unlocked version). 635cb8faed7SAdrien Mazarguil * 636cb8faed7SAdrien Mazarguil * @param dev 637cb8faed7SAdrien Mazarguil * Pointer to Ethernet device structure. 638cb8faed7SAdrien Mazarguil * @param wait_to_complete 639cb8faed7SAdrien Mazarguil * Wait for request completion (ignored). 640cb8faed7SAdrien Mazarguil */ 641cb8faed7SAdrien Mazarguil static int 642cb8faed7SAdrien Mazarguil mlx5_link_update_unlocked(struct rte_eth_dev *dev, int wait_to_complete) 643cb8faed7SAdrien Mazarguil { 644a48deadaSOr Ami struct priv *priv = mlx5_get_priv(dev); 645cb8faed7SAdrien Mazarguil struct ethtool_cmd edata = { 646cb8faed7SAdrien Mazarguil .cmd = ETHTOOL_GSET 647cb8faed7SAdrien Mazarguil }; 648cb8faed7SAdrien Mazarguil struct ifreq ifr; 649cb8faed7SAdrien Mazarguil struct rte_eth_link dev_link; 650cb8faed7SAdrien Mazarguil int link_speed = 0; 651cb8faed7SAdrien Mazarguil 652cb8faed7SAdrien Mazarguil (void)wait_to_complete; 653cb8faed7SAdrien Mazarguil if (priv_ifreq(priv, SIOCGIFFLAGS, &ifr)) { 654cb8faed7SAdrien Mazarguil WARN("ioctl(SIOCGIFFLAGS) failed: %s", strerror(errno)); 655cb8faed7SAdrien Mazarguil return -1; 656cb8faed7SAdrien Mazarguil } 657cb8faed7SAdrien Mazarguil memset(&dev_link, 0, sizeof(dev_link)); 658cb8faed7SAdrien Mazarguil dev_link.link_status = ((ifr.ifr_flags & IFF_UP) && 659cb8faed7SAdrien Mazarguil (ifr.ifr_flags & IFF_RUNNING)); 660d06c608cSAdrien Mazarguil ifr.ifr_data = (void *)&edata; 661cb8faed7SAdrien Mazarguil if (priv_ifreq(priv, SIOCETHTOOL, &ifr)) { 662cb8faed7SAdrien Mazarguil WARN("ioctl(SIOCETHTOOL, ETHTOOL_GSET) failed: %s", 663cb8faed7SAdrien Mazarguil strerror(errno)); 664cb8faed7SAdrien Mazarguil return -1; 665cb8faed7SAdrien Mazarguil } 666cb8faed7SAdrien Mazarguil link_speed = ethtool_cmd_speed(&edata); 667cb8faed7SAdrien Mazarguil if (link_speed == -1) 668cb8faed7SAdrien Mazarguil dev_link.link_speed = 0; 669cb8faed7SAdrien Mazarguil else 670cb8faed7SAdrien Mazarguil dev_link.link_speed = link_speed; 671cb8faed7SAdrien Mazarguil dev_link.link_duplex = ((edata.duplex == DUPLEX_HALF) ? 672cb8faed7SAdrien Mazarguil ETH_LINK_HALF_DUPLEX : ETH_LINK_FULL_DUPLEX); 67382113036SMarc Sune dev_link.link_autoneg = !(dev->data->dev_conf.link_speeds & 67482113036SMarc Sune ETH_LINK_SPEED_FIXED); 675cb8faed7SAdrien Mazarguil if (memcmp(&dev_link, &dev->data->dev_link, sizeof(dev_link))) { 676cb8faed7SAdrien Mazarguil /* Link status changed. */ 677cb8faed7SAdrien Mazarguil dev->data->dev_link = dev_link; 678cb8faed7SAdrien Mazarguil return 0; 679cb8faed7SAdrien Mazarguil } 680cb8faed7SAdrien Mazarguil /* Link status is still the same. */ 681cb8faed7SAdrien Mazarguil return -1; 682cb8faed7SAdrien Mazarguil } 683cb8faed7SAdrien Mazarguil 684cb8faed7SAdrien Mazarguil /** 685cb8faed7SAdrien Mazarguil * DPDK callback to retrieve physical link information. 686cb8faed7SAdrien Mazarguil * 687cb8faed7SAdrien Mazarguil * @param dev 688cb8faed7SAdrien Mazarguil * Pointer to Ethernet device structure. 689cb8faed7SAdrien Mazarguil * @param wait_to_complete 690cb8faed7SAdrien Mazarguil * Wait for request completion (ignored). 691cb8faed7SAdrien Mazarguil */ 692cb8faed7SAdrien Mazarguil int 693cb8faed7SAdrien Mazarguil mlx5_link_update(struct rte_eth_dev *dev, int wait_to_complete) 694cb8faed7SAdrien Mazarguil { 695a48deadaSOr Ami struct priv *priv = mlx5_get_priv(dev); 696cb8faed7SAdrien Mazarguil int ret; 697cb8faed7SAdrien Mazarguil 698cb8faed7SAdrien Mazarguil priv_lock(priv); 699cb8faed7SAdrien Mazarguil ret = mlx5_link_update_unlocked(dev, wait_to_complete); 700cb8faed7SAdrien Mazarguil priv_unlock(priv); 701cb8faed7SAdrien Mazarguil return ret; 702cb8faed7SAdrien Mazarguil } 703cb8faed7SAdrien Mazarguil 704cb8faed7SAdrien Mazarguil /** 705cf37ca95SAdrien Mazarguil * DPDK callback to change the MTU. 706cf37ca95SAdrien Mazarguil * 707cf37ca95SAdrien Mazarguil * Setting the MTU affects hardware MRU (packets larger than the MTU cannot be 708cf37ca95SAdrien Mazarguil * received). Use this as a hint to enable/disable scattered packets support 709cf37ca95SAdrien Mazarguil * and improve performance when not needed. 710cf37ca95SAdrien Mazarguil * Since failure is not an option, reconfiguring queues on the fly is not 711cf37ca95SAdrien Mazarguil * recommended. 712cf37ca95SAdrien Mazarguil * 713cf37ca95SAdrien Mazarguil * @param dev 714cf37ca95SAdrien Mazarguil * Pointer to Ethernet device structure. 715cf37ca95SAdrien Mazarguil * @param in_mtu 716cf37ca95SAdrien Mazarguil * New MTU. 717cf37ca95SAdrien Mazarguil * 718cf37ca95SAdrien Mazarguil * @return 719cf37ca95SAdrien Mazarguil * 0 on success, negative errno value on failure. 720cf37ca95SAdrien Mazarguil */ 721cf37ca95SAdrien Mazarguil int 722cf37ca95SAdrien Mazarguil mlx5_dev_set_mtu(struct rte_eth_dev *dev, uint16_t mtu) 723cf37ca95SAdrien Mazarguil { 724cf37ca95SAdrien Mazarguil struct priv *priv = dev->data->dev_private; 725cf37ca95SAdrien Mazarguil int ret = 0; 726cf37ca95SAdrien Mazarguil unsigned int i; 727cf37ca95SAdrien Mazarguil uint16_t (*rx_func)(void *, struct rte_mbuf **, uint16_t) = 728cf37ca95SAdrien Mazarguil mlx5_rx_burst; 7299964b965SNélio Laranjeiro unsigned int max_frame_len; 7309964b965SNélio Laranjeiro int rehash; 7319964b965SNélio Laranjeiro int restart = priv->started; 732cf37ca95SAdrien Mazarguil 733a48deadaSOr Ami if (mlx5_is_secondary()) 734a48deadaSOr Ami return -E_RTE_SECONDARY; 735a48deadaSOr Ami 736cf37ca95SAdrien Mazarguil priv_lock(priv); 737cf37ca95SAdrien Mazarguil /* Set kernel interface MTU first. */ 738cf37ca95SAdrien Mazarguil if (priv_set_mtu(priv, mtu)) { 739cf37ca95SAdrien Mazarguil ret = errno; 740cf37ca95SAdrien Mazarguil WARN("cannot set port %u MTU to %u: %s", priv->port, mtu, 741cf37ca95SAdrien Mazarguil strerror(ret)); 742cf37ca95SAdrien Mazarguil goto out; 743cf37ca95SAdrien Mazarguil } else 744cf37ca95SAdrien Mazarguil DEBUG("adapter port %u MTU set to %u", priv->port, mtu); 745cf37ca95SAdrien Mazarguil /* Temporarily replace RX handler with a fake one, assuming it has not 746cf37ca95SAdrien Mazarguil * been copied elsewhere. */ 747cf37ca95SAdrien Mazarguil dev->rx_pkt_burst = removed_rx_burst; 748cf37ca95SAdrien Mazarguil /* Make sure everyone has left mlx5_rx_burst() and uses 749cf37ca95SAdrien Mazarguil * removed_rx_burst() instead. */ 750cf37ca95SAdrien Mazarguil rte_wmb(); 751cf37ca95SAdrien Mazarguil usleep(1000); 7529964b965SNélio Laranjeiro /* MTU does not include header and CRC. */ 7539964b965SNélio Laranjeiro max_frame_len = ETHER_HDR_LEN + mtu + ETHER_CRC_LEN; 7549964b965SNélio Laranjeiro /* Check if at least one queue is going to need a SGE update. */ 7559964b965SNélio Laranjeiro for (i = 0; i != priv->rxqs_n; ++i) { 756cf37ca95SAdrien Mazarguil struct rxq *rxq = (*priv->rxqs)[i]; 75778d9c95dSAdrien Mazarguil unsigned int mb_len; 7589964b965SNélio Laranjeiro unsigned int size = RTE_PKTMBUF_HEADROOM + max_frame_len; 7599964b965SNélio Laranjeiro unsigned int sges_n; 760cf37ca95SAdrien Mazarguil 761cf37ca95SAdrien Mazarguil if (rxq == NULL) 762cf37ca95SAdrien Mazarguil continue; 76378d9c95dSAdrien Mazarguil mb_len = rte_pktmbuf_data_room_size(rxq->mp); 76478d9c95dSAdrien Mazarguil assert(mb_len >= RTE_PKTMBUF_HEADROOM); 7659964b965SNélio Laranjeiro /* 7669964b965SNélio Laranjeiro * Determine the number of SGEs needed for a full packet 7679964b965SNélio Laranjeiro * and round it to the next power of two. 7689964b965SNélio Laranjeiro */ 7699964b965SNélio Laranjeiro sges_n = log2above((size / mb_len) + !!(size % mb_len)); 7709964b965SNélio Laranjeiro if (sges_n != rxq->sges_n) 7719964b965SNélio Laranjeiro break; 7729964b965SNélio Laranjeiro } 7739964b965SNélio Laranjeiro /* 7749964b965SNélio Laranjeiro * If all queues have the right number of SGEs, a simple rehash 7759964b965SNélio Laranjeiro * of their buffers is enough, otherwise SGE information can only 7769964b965SNélio Laranjeiro * be updated in a queue by recreating it. All resources that depend 7779964b965SNélio Laranjeiro * on queues (flows, indirection tables) must be recreated as well in 7789964b965SNélio Laranjeiro * that case. 7799964b965SNélio Laranjeiro */ 7809964b965SNélio Laranjeiro rehash = (i == priv->rxqs_n); 7819964b965SNélio Laranjeiro if (!rehash) { 7829964b965SNélio Laranjeiro /* Clean up everything as with mlx5_dev_stop(). */ 7839964b965SNélio Laranjeiro priv_special_flow_disable_all(priv); 7849964b965SNélio Laranjeiro priv_mac_addrs_disable(priv); 7859964b965SNélio Laranjeiro priv_destroy_hash_rxqs(priv); 7869964b965SNélio Laranjeiro priv_fdir_disable(priv); 7879964b965SNélio Laranjeiro priv_dev_interrupt_handler_uninstall(priv, dev); 7889964b965SNélio Laranjeiro } 7899964b965SNélio Laranjeiro recover: 7909964b965SNélio Laranjeiro /* Reconfigure each RX queue. */ 7919964b965SNélio Laranjeiro for (i = 0; (i != priv->rxqs_n); ++i) { 7929964b965SNélio Laranjeiro struct rxq *rxq = (*priv->rxqs)[i]; 7939964b965SNélio Laranjeiro struct rxq_ctrl *rxq_ctrl = 7949964b965SNélio Laranjeiro container_of(rxq, struct rxq_ctrl, rxq); 7959964b965SNélio Laranjeiro int sp; 7969964b965SNélio Laranjeiro unsigned int mb_len; 7979964b965SNélio Laranjeiro unsigned int tmp; 7989964b965SNélio Laranjeiro 7999964b965SNélio Laranjeiro if (rxq == NULL) 8009964b965SNélio Laranjeiro continue; 8019964b965SNélio Laranjeiro mb_len = rte_pktmbuf_data_room_size(rxq->mp); 8029964b965SNélio Laranjeiro assert(mb_len >= RTE_PKTMBUF_HEADROOM); 8039964b965SNélio Laranjeiro /* Toggle scattered support (sp) if necessary. */ 80478d9c95dSAdrien Mazarguil sp = (max_frame_len > (mb_len - RTE_PKTMBUF_HEADROOM)); 8059964b965SNélio Laranjeiro /* Provide new values to rxq_setup(). */ 8069964b965SNélio Laranjeiro dev->data->dev_conf.rxmode.jumbo_frame = sp; 8079964b965SNélio Laranjeiro dev->data->dev_conf.rxmode.max_rx_pkt_len = max_frame_len; 8089964b965SNélio Laranjeiro if (rehash) 8099964b965SNélio Laranjeiro ret = rxq_rehash(dev, rxq_ctrl); 8109964b965SNélio Laranjeiro else 811*b4b12e55SNélio Laranjeiro ret = rxq_ctrl_setup(dev, rxq_ctrl, 1 << rxq->elts_n, 8129964b965SNélio Laranjeiro rxq_ctrl->socket, NULL, rxq->mp); 8139964b965SNélio Laranjeiro if (!ret) 8149964b965SNélio Laranjeiro continue; 8159964b965SNélio Laranjeiro /* Attempt to roll back in case of error. */ 8169964b965SNélio Laranjeiro tmp = (mb_len << rxq->sges_n) - RTE_PKTMBUF_HEADROOM; 8179964b965SNélio Laranjeiro if (max_frame_len != tmp) { 8189964b965SNélio Laranjeiro max_frame_len = tmp; 8199964b965SNélio Laranjeiro goto recover; 820cf37ca95SAdrien Mazarguil } 8219964b965SNélio Laranjeiro /* Double fault, disable RX. */ 8229964b965SNélio Laranjeiro break; 823cf37ca95SAdrien Mazarguil } 8249964b965SNélio Laranjeiro /* 8259964b965SNélio Laranjeiro * Use a safe RX burst function in case of error, otherwise mimic 8269964b965SNélio Laranjeiro * mlx5_dev_start(). 8279964b965SNélio Laranjeiro */ 8289964b965SNélio Laranjeiro if (ret) { 8299964b965SNélio Laranjeiro ERROR("unable to reconfigure RX queues, RX disabled"); 8309964b965SNélio Laranjeiro rx_func = removed_rx_burst; 8319964b965SNélio Laranjeiro } else if (restart && 8329964b965SNélio Laranjeiro !rehash && 8339964b965SNélio Laranjeiro !priv_create_hash_rxqs(priv) && 8349964b965SNélio Laranjeiro !priv_rehash_flows(priv)) { 8359964b965SNélio Laranjeiro if (dev->data->dev_conf.fdir_conf.mode == RTE_FDIR_MODE_NONE) 8369964b965SNélio Laranjeiro priv_fdir_enable(priv); 8379964b965SNélio Laranjeiro priv_dev_interrupt_handler_install(priv, dev); 8389964b965SNélio Laranjeiro } 8399964b965SNélio Laranjeiro priv->mtu = mtu; 840cf37ca95SAdrien Mazarguil /* Burst functions can now be called again. */ 841cf37ca95SAdrien Mazarguil rte_wmb(); 842cf37ca95SAdrien Mazarguil dev->rx_pkt_burst = rx_func; 843cf37ca95SAdrien Mazarguil out: 844cf37ca95SAdrien Mazarguil priv_unlock(priv); 845cf37ca95SAdrien Mazarguil assert(ret >= 0); 846cf37ca95SAdrien Mazarguil return -ret; 847cf37ca95SAdrien Mazarguil } 848cf37ca95SAdrien Mazarguil 849cf37ca95SAdrien Mazarguil /** 85002d75430SAdrien Mazarguil * DPDK callback to get flow control status. 85102d75430SAdrien Mazarguil * 85202d75430SAdrien Mazarguil * @param dev 85302d75430SAdrien Mazarguil * Pointer to Ethernet device structure. 85402d75430SAdrien Mazarguil * @param[out] fc_conf 85502d75430SAdrien Mazarguil * Flow control output buffer. 85602d75430SAdrien Mazarguil * 85702d75430SAdrien Mazarguil * @return 85802d75430SAdrien Mazarguil * 0 on success, negative errno value on failure. 85902d75430SAdrien Mazarguil */ 86002d75430SAdrien Mazarguil int 86102d75430SAdrien Mazarguil mlx5_dev_get_flow_ctrl(struct rte_eth_dev *dev, struct rte_eth_fc_conf *fc_conf) 86202d75430SAdrien Mazarguil { 86302d75430SAdrien Mazarguil struct priv *priv = dev->data->dev_private; 86402d75430SAdrien Mazarguil struct ifreq ifr; 86502d75430SAdrien Mazarguil struct ethtool_pauseparam ethpause = { 86602d75430SAdrien Mazarguil .cmd = ETHTOOL_GPAUSEPARAM 86702d75430SAdrien Mazarguil }; 86802d75430SAdrien Mazarguil int ret; 86902d75430SAdrien Mazarguil 870a48deadaSOr Ami if (mlx5_is_secondary()) 871a48deadaSOr Ami return -E_RTE_SECONDARY; 872a48deadaSOr Ami 873d06c608cSAdrien Mazarguil ifr.ifr_data = (void *)ðpause; 87402d75430SAdrien Mazarguil priv_lock(priv); 87502d75430SAdrien Mazarguil if (priv_ifreq(priv, SIOCETHTOOL, &ifr)) { 87602d75430SAdrien Mazarguil ret = errno; 87702d75430SAdrien Mazarguil WARN("ioctl(SIOCETHTOOL, ETHTOOL_GPAUSEPARAM)" 87802d75430SAdrien Mazarguil " failed: %s", 87902d75430SAdrien Mazarguil strerror(ret)); 88002d75430SAdrien Mazarguil goto out; 88102d75430SAdrien Mazarguil } 88202d75430SAdrien Mazarguil 88302d75430SAdrien Mazarguil fc_conf->autoneg = ethpause.autoneg; 88402d75430SAdrien Mazarguil if (ethpause.rx_pause && ethpause.tx_pause) 88502d75430SAdrien Mazarguil fc_conf->mode = RTE_FC_FULL; 88602d75430SAdrien Mazarguil else if (ethpause.rx_pause) 88702d75430SAdrien Mazarguil fc_conf->mode = RTE_FC_RX_PAUSE; 88802d75430SAdrien Mazarguil else if (ethpause.tx_pause) 88902d75430SAdrien Mazarguil fc_conf->mode = RTE_FC_TX_PAUSE; 89002d75430SAdrien Mazarguil else 89102d75430SAdrien Mazarguil fc_conf->mode = RTE_FC_NONE; 89202d75430SAdrien Mazarguil ret = 0; 89302d75430SAdrien Mazarguil 89402d75430SAdrien Mazarguil out: 89502d75430SAdrien Mazarguil priv_unlock(priv); 89602d75430SAdrien Mazarguil assert(ret >= 0); 89702d75430SAdrien Mazarguil return -ret; 89802d75430SAdrien Mazarguil } 89902d75430SAdrien Mazarguil 90002d75430SAdrien Mazarguil /** 90102d75430SAdrien Mazarguil * DPDK callback to modify flow control parameters. 90202d75430SAdrien Mazarguil * 90302d75430SAdrien Mazarguil * @param dev 90402d75430SAdrien Mazarguil * Pointer to Ethernet device structure. 90502d75430SAdrien Mazarguil * @param[in] fc_conf 90602d75430SAdrien Mazarguil * Flow control parameters. 90702d75430SAdrien Mazarguil * 90802d75430SAdrien Mazarguil * @return 90902d75430SAdrien Mazarguil * 0 on success, negative errno value on failure. 91002d75430SAdrien Mazarguil */ 91102d75430SAdrien Mazarguil int 91202d75430SAdrien Mazarguil mlx5_dev_set_flow_ctrl(struct rte_eth_dev *dev, struct rte_eth_fc_conf *fc_conf) 91302d75430SAdrien Mazarguil { 91402d75430SAdrien Mazarguil struct priv *priv = dev->data->dev_private; 91502d75430SAdrien Mazarguil struct ifreq ifr; 91602d75430SAdrien Mazarguil struct ethtool_pauseparam ethpause = { 91702d75430SAdrien Mazarguil .cmd = ETHTOOL_SPAUSEPARAM 91802d75430SAdrien Mazarguil }; 91902d75430SAdrien Mazarguil int ret; 92002d75430SAdrien Mazarguil 921a48deadaSOr Ami if (mlx5_is_secondary()) 922a48deadaSOr Ami return -E_RTE_SECONDARY; 923a48deadaSOr Ami 924d06c608cSAdrien Mazarguil ifr.ifr_data = (void *)ðpause; 92502d75430SAdrien Mazarguil ethpause.autoneg = fc_conf->autoneg; 92602d75430SAdrien Mazarguil if (((fc_conf->mode & RTE_FC_FULL) == RTE_FC_FULL) || 92702d75430SAdrien Mazarguil (fc_conf->mode & RTE_FC_RX_PAUSE)) 92802d75430SAdrien Mazarguil ethpause.rx_pause = 1; 92902d75430SAdrien Mazarguil else 93002d75430SAdrien Mazarguil ethpause.rx_pause = 0; 93102d75430SAdrien Mazarguil 93202d75430SAdrien Mazarguil if (((fc_conf->mode & RTE_FC_FULL) == RTE_FC_FULL) || 93302d75430SAdrien Mazarguil (fc_conf->mode & RTE_FC_TX_PAUSE)) 93402d75430SAdrien Mazarguil ethpause.tx_pause = 1; 93502d75430SAdrien Mazarguil else 93602d75430SAdrien Mazarguil ethpause.tx_pause = 0; 93702d75430SAdrien Mazarguil 93802d75430SAdrien Mazarguil priv_lock(priv); 93902d75430SAdrien Mazarguil if (priv_ifreq(priv, SIOCETHTOOL, &ifr)) { 94002d75430SAdrien Mazarguil ret = errno; 94102d75430SAdrien Mazarguil WARN("ioctl(SIOCETHTOOL, ETHTOOL_SPAUSEPARAM)" 94202d75430SAdrien Mazarguil " failed: %s", 94302d75430SAdrien Mazarguil strerror(ret)); 94402d75430SAdrien Mazarguil goto out; 94502d75430SAdrien Mazarguil } 94602d75430SAdrien Mazarguil ret = 0; 94702d75430SAdrien Mazarguil 94802d75430SAdrien Mazarguil out: 94902d75430SAdrien Mazarguil priv_unlock(priv); 95002d75430SAdrien Mazarguil assert(ret >= 0); 95102d75430SAdrien Mazarguil return -ret; 95202d75430SAdrien Mazarguil } 95302d75430SAdrien Mazarguil 95402d75430SAdrien Mazarguil /** 955771fa900SAdrien Mazarguil * Get PCI information from struct ibv_device. 956771fa900SAdrien Mazarguil * 957771fa900SAdrien Mazarguil * @param device 958771fa900SAdrien Mazarguil * Pointer to Ethernet device structure. 959771fa900SAdrien Mazarguil * @param[out] pci_addr 960771fa900SAdrien Mazarguil * PCI bus address output buffer. 961771fa900SAdrien Mazarguil * 962771fa900SAdrien Mazarguil * @return 963771fa900SAdrien Mazarguil * 0 on success, -1 on failure and errno is set. 964771fa900SAdrien Mazarguil */ 965771fa900SAdrien Mazarguil int 966771fa900SAdrien Mazarguil mlx5_ibv_device_to_pci_addr(const struct ibv_device *device, 967771fa900SAdrien Mazarguil struct rte_pci_addr *pci_addr) 968771fa900SAdrien Mazarguil { 969771fa900SAdrien Mazarguil FILE *file; 970771fa900SAdrien Mazarguil char line[32]; 971771fa900SAdrien Mazarguil MKSTR(path, "%s/device/uevent", device->ibdev_path); 972771fa900SAdrien Mazarguil 973771fa900SAdrien Mazarguil file = fopen(path, "rb"); 974771fa900SAdrien Mazarguil if (file == NULL) 975771fa900SAdrien Mazarguil return -1; 976771fa900SAdrien Mazarguil while (fgets(line, sizeof(line), file) == line) { 977771fa900SAdrien Mazarguil size_t len = strlen(line); 978771fa900SAdrien Mazarguil int ret; 979771fa900SAdrien Mazarguil 980771fa900SAdrien Mazarguil /* Truncate long lines. */ 981771fa900SAdrien Mazarguil if (len == (sizeof(line) - 1)) 982771fa900SAdrien Mazarguil while (line[(len - 1)] != '\n') { 983771fa900SAdrien Mazarguil ret = fgetc(file); 984771fa900SAdrien Mazarguil if (ret == EOF) 985771fa900SAdrien Mazarguil break; 986771fa900SAdrien Mazarguil line[(len - 1)] = ret; 987771fa900SAdrien Mazarguil } 988771fa900SAdrien Mazarguil /* Extract information. */ 989771fa900SAdrien Mazarguil if (sscanf(line, 990771fa900SAdrien Mazarguil "PCI_SLOT_NAME=" 991771fa900SAdrien Mazarguil "%" SCNx16 ":%" SCNx8 ":%" SCNx8 ".%" SCNx8 "\n", 992771fa900SAdrien Mazarguil &pci_addr->domain, 993771fa900SAdrien Mazarguil &pci_addr->bus, 994771fa900SAdrien Mazarguil &pci_addr->devid, 995771fa900SAdrien Mazarguil &pci_addr->function) == 4) { 996771fa900SAdrien Mazarguil ret = 0; 997771fa900SAdrien Mazarguil break; 998771fa900SAdrien Mazarguil } 999771fa900SAdrien Mazarguil } 1000771fa900SAdrien Mazarguil fclose(file); 1001771fa900SAdrien Mazarguil return 0; 1002771fa900SAdrien Mazarguil } 1003198a3c33SNelio Laranjeiro 1004198a3c33SNelio Laranjeiro /** 1005198a3c33SNelio Laranjeiro * Link status handler. 1006198a3c33SNelio Laranjeiro * 1007198a3c33SNelio Laranjeiro * @param priv 1008198a3c33SNelio Laranjeiro * Pointer to private structure. 1009198a3c33SNelio Laranjeiro * @param dev 1010198a3c33SNelio Laranjeiro * Pointer to the rte_eth_dev structure. 1011198a3c33SNelio Laranjeiro * 1012198a3c33SNelio Laranjeiro * @return 1013198a3c33SNelio Laranjeiro * Nonzero if the callback process can be called immediately. 1014198a3c33SNelio Laranjeiro */ 1015198a3c33SNelio Laranjeiro static int 1016198a3c33SNelio Laranjeiro priv_dev_link_status_handler(struct priv *priv, struct rte_eth_dev *dev) 1017198a3c33SNelio Laranjeiro { 1018198a3c33SNelio Laranjeiro struct ibv_async_event event; 1019198a3c33SNelio Laranjeiro int port_change = 0; 1020198a3c33SNelio Laranjeiro int ret = 0; 1021198a3c33SNelio Laranjeiro 1022198a3c33SNelio Laranjeiro /* Read all message and acknowledge them. */ 1023198a3c33SNelio Laranjeiro for (;;) { 1024198a3c33SNelio Laranjeiro if (ibv_get_async_event(priv->ctx, &event)) 1025198a3c33SNelio Laranjeiro break; 1026198a3c33SNelio Laranjeiro 1027198a3c33SNelio Laranjeiro if (event.event_type == IBV_EVENT_PORT_ACTIVE || 1028198a3c33SNelio Laranjeiro event.event_type == IBV_EVENT_PORT_ERR) 1029198a3c33SNelio Laranjeiro port_change = 1; 1030198a3c33SNelio Laranjeiro else 1031198a3c33SNelio Laranjeiro DEBUG("event type %d on port %d not handled", 1032198a3c33SNelio Laranjeiro event.event_type, event.element.port_num); 1033198a3c33SNelio Laranjeiro ibv_ack_async_event(&event); 1034198a3c33SNelio Laranjeiro } 1035198a3c33SNelio Laranjeiro 1036198a3c33SNelio Laranjeiro if (port_change ^ priv->pending_alarm) { 1037198a3c33SNelio Laranjeiro struct rte_eth_link *link = &dev->data->dev_link; 1038198a3c33SNelio Laranjeiro 1039198a3c33SNelio Laranjeiro priv->pending_alarm = 0; 1040198a3c33SNelio Laranjeiro mlx5_link_update_unlocked(dev, 0); 1041198a3c33SNelio Laranjeiro if (((link->link_speed == 0) && link->link_status) || 1042198a3c33SNelio Laranjeiro ((link->link_speed != 0) && !link->link_status)) { 1043198a3c33SNelio Laranjeiro /* Inconsistent status, check again later. */ 1044198a3c33SNelio Laranjeiro priv->pending_alarm = 1; 1045198a3c33SNelio Laranjeiro rte_eal_alarm_set(MLX5_ALARM_TIMEOUT_US, 1046198a3c33SNelio Laranjeiro mlx5_dev_link_status_handler, 1047198a3c33SNelio Laranjeiro dev); 1048198a3c33SNelio Laranjeiro } else 1049198a3c33SNelio Laranjeiro ret = 1; 1050198a3c33SNelio Laranjeiro } 1051198a3c33SNelio Laranjeiro return ret; 1052198a3c33SNelio Laranjeiro } 1053198a3c33SNelio Laranjeiro 1054198a3c33SNelio Laranjeiro /** 1055198a3c33SNelio Laranjeiro * Handle delayed link status event. 1056198a3c33SNelio Laranjeiro * 1057198a3c33SNelio Laranjeiro * @param arg 1058198a3c33SNelio Laranjeiro * Registered argument. 1059198a3c33SNelio Laranjeiro */ 1060198a3c33SNelio Laranjeiro void 1061198a3c33SNelio Laranjeiro mlx5_dev_link_status_handler(void *arg) 1062198a3c33SNelio Laranjeiro { 1063198a3c33SNelio Laranjeiro struct rte_eth_dev *dev = arg; 1064198a3c33SNelio Laranjeiro struct priv *priv = dev->data->dev_private; 1065198a3c33SNelio Laranjeiro int ret; 1066198a3c33SNelio Laranjeiro 1067198a3c33SNelio Laranjeiro priv_lock(priv); 1068198a3c33SNelio Laranjeiro assert(priv->pending_alarm == 1); 1069198a3c33SNelio Laranjeiro ret = priv_dev_link_status_handler(priv, dev); 1070198a3c33SNelio Laranjeiro priv_unlock(priv); 1071198a3c33SNelio Laranjeiro if (ret) 1072198a3c33SNelio Laranjeiro _rte_eth_dev_callback_process(dev, RTE_ETH_EVENT_INTR_LSC); 1073198a3c33SNelio Laranjeiro } 1074198a3c33SNelio Laranjeiro 1075198a3c33SNelio Laranjeiro /** 1076198a3c33SNelio Laranjeiro * Handle interrupts from the NIC. 1077198a3c33SNelio Laranjeiro * 1078198a3c33SNelio Laranjeiro * @param[in] intr_handle 1079198a3c33SNelio Laranjeiro * Interrupt handler. 1080198a3c33SNelio Laranjeiro * @param cb_arg 1081198a3c33SNelio Laranjeiro * Callback argument. 1082198a3c33SNelio Laranjeiro */ 1083198a3c33SNelio Laranjeiro void 1084198a3c33SNelio Laranjeiro mlx5_dev_interrupt_handler(struct rte_intr_handle *intr_handle, void *cb_arg) 1085198a3c33SNelio Laranjeiro { 1086198a3c33SNelio Laranjeiro struct rte_eth_dev *dev = cb_arg; 1087198a3c33SNelio Laranjeiro struct priv *priv = dev->data->dev_private; 1088198a3c33SNelio Laranjeiro int ret; 1089198a3c33SNelio Laranjeiro 1090198a3c33SNelio Laranjeiro (void)intr_handle; 1091198a3c33SNelio Laranjeiro priv_lock(priv); 1092198a3c33SNelio Laranjeiro ret = priv_dev_link_status_handler(priv, dev); 1093198a3c33SNelio Laranjeiro priv_unlock(priv); 1094198a3c33SNelio Laranjeiro if (ret) 1095198a3c33SNelio Laranjeiro _rte_eth_dev_callback_process(dev, RTE_ETH_EVENT_INTR_LSC); 1096198a3c33SNelio Laranjeiro } 1097198a3c33SNelio Laranjeiro 1098198a3c33SNelio Laranjeiro /** 1099198a3c33SNelio Laranjeiro * Uninstall interrupt handler. 1100198a3c33SNelio Laranjeiro * 1101198a3c33SNelio Laranjeiro * @param priv 1102198a3c33SNelio Laranjeiro * Pointer to private structure. 1103198a3c33SNelio Laranjeiro * @param dev 1104198a3c33SNelio Laranjeiro * Pointer to the rte_eth_dev structure. 1105198a3c33SNelio Laranjeiro */ 1106198a3c33SNelio Laranjeiro void 1107198a3c33SNelio Laranjeiro priv_dev_interrupt_handler_uninstall(struct priv *priv, struct rte_eth_dev *dev) 1108198a3c33SNelio Laranjeiro { 1109198a3c33SNelio Laranjeiro if (!dev->data->dev_conf.intr_conf.lsc) 1110198a3c33SNelio Laranjeiro return; 1111198a3c33SNelio Laranjeiro rte_intr_callback_unregister(&priv->intr_handle, 1112198a3c33SNelio Laranjeiro mlx5_dev_interrupt_handler, 1113198a3c33SNelio Laranjeiro dev); 1114198a3c33SNelio Laranjeiro if (priv->pending_alarm) 1115198a3c33SNelio Laranjeiro rte_eal_alarm_cancel(mlx5_dev_link_status_handler, dev); 1116198a3c33SNelio Laranjeiro priv->pending_alarm = 0; 1117198a3c33SNelio Laranjeiro priv->intr_handle.fd = 0; 111836351ea3SFerruh Yigit priv->intr_handle.type = RTE_INTR_HANDLE_UNKNOWN; 1119198a3c33SNelio Laranjeiro } 1120198a3c33SNelio Laranjeiro 1121198a3c33SNelio Laranjeiro /** 1122198a3c33SNelio Laranjeiro * Install interrupt handler. 1123198a3c33SNelio Laranjeiro * 1124198a3c33SNelio Laranjeiro * @param priv 1125198a3c33SNelio Laranjeiro * Pointer to private structure. 1126198a3c33SNelio Laranjeiro * @param dev 1127198a3c33SNelio Laranjeiro * Pointer to the rte_eth_dev structure. 1128198a3c33SNelio Laranjeiro */ 1129198a3c33SNelio Laranjeiro void 1130198a3c33SNelio Laranjeiro priv_dev_interrupt_handler_install(struct priv *priv, struct rte_eth_dev *dev) 1131198a3c33SNelio Laranjeiro { 1132198a3c33SNelio Laranjeiro int rc, flags; 1133198a3c33SNelio Laranjeiro 1134198a3c33SNelio Laranjeiro if (!dev->data->dev_conf.intr_conf.lsc) 1135198a3c33SNelio Laranjeiro return; 1136198a3c33SNelio Laranjeiro assert(priv->ctx->async_fd > 0); 1137198a3c33SNelio Laranjeiro flags = fcntl(priv->ctx->async_fd, F_GETFL); 1138198a3c33SNelio Laranjeiro rc = fcntl(priv->ctx->async_fd, F_SETFL, flags | O_NONBLOCK); 1139198a3c33SNelio Laranjeiro if (rc < 0) { 1140198a3c33SNelio Laranjeiro INFO("failed to change file descriptor async event queue"); 1141198a3c33SNelio Laranjeiro dev->data->dev_conf.intr_conf.lsc = 0; 1142198a3c33SNelio Laranjeiro } else { 1143198a3c33SNelio Laranjeiro priv->intr_handle.fd = priv->ctx->async_fd; 1144198a3c33SNelio Laranjeiro priv->intr_handle.type = RTE_INTR_HANDLE_EXT; 1145198a3c33SNelio Laranjeiro rte_intr_callback_register(&priv->intr_handle, 1146198a3c33SNelio Laranjeiro mlx5_dev_interrupt_handler, 1147198a3c33SNelio Laranjeiro dev); 1148198a3c33SNelio Laranjeiro } 1149198a3c33SNelio Laranjeiro } 115062072098SOr Ami 115162072098SOr Ami /** 115262072098SOr Ami * Change the link state (UP / DOWN). 115362072098SOr Ami * 11543d04e050SOlivier Matz * @param priv 115562072098SOr Ami * Pointer to Ethernet device structure. 115662072098SOr Ami * @param up 115762072098SOr Ami * Nonzero for link up, otherwise link down. 115862072098SOr Ami * 115962072098SOr Ami * @return 116062072098SOr Ami * 0 on success, errno value on failure. 116162072098SOr Ami */ 116262072098SOr Ami static int 116362072098SOr Ami priv_set_link(struct priv *priv, int up) 116462072098SOr Ami { 116562072098SOr Ami struct rte_eth_dev *dev = priv->dev; 116662072098SOr Ami int err; 116762072098SOr Ami 116862072098SOr Ami if (up) { 116962072098SOr Ami err = priv_set_flags(priv, ~IFF_UP, IFF_UP); 117062072098SOr Ami if (err) 117162072098SOr Ami return err; 1172cdab90cbSNélio Laranjeiro priv_select_tx_function(priv); 1173cdab90cbSNélio Laranjeiro priv_select_rx_function(priv); 117462072098SOr Ami } else { 117562072098SOr Ami err = priv_set_flags(priv, ~IFF_UP, ~IFF_UP); 117662072098SOr Ami if (err) 117762072098SOr Ami return err; 117862072098SOr Ami dev->rx_pkt_burst = removed_rx_burst; 117962072098SOr Ami dev->tx_pkt_burst = removed_tx_burst; 118062072098SOr Ami } 118162072098SOr Ami return 0; 118262072098SOr Ami } 118362072098SOr Ami 118462072098SOr Ami /** 118562072098SOr Ami * DPDK callback to bring the link DOWN. 118662072098SOr Ami * 118762072098SOr Ami * @param dev 118862072098SOr Ami * Pointer to Ethernet device structure. 118962072098SOr Ami * 119062072098SOr Ami * @return 119162072098SOr Ami * 0 on success, errno value on failure. 119262072098SOr Ami */ 119362072098SOr Ami int 119462072098SOr Ami mlx5_set_link_down(struct rte_eth_dev *dev) 119562072098SOr Ami { 119662072098SOr Ami struct priv *priv = dev->data->dev_private; 119762072098SOr Ami int err; 119862072098SOr Ami 119962072098SOr Ami priv_lock(priv); 120062072098SOr Ami err = priv_set_link(priv, 0); 120162072098SOr Ami priv_unlock(priv); 120262072098SOr Ami return err; 120362072098SOr Ami } 120462072098SOr Ami 120562072098SOr Ami /** 120662072098SOr Ami * DPDK callback to bring the link UP. 120762072098SOr Ami * 120862072098SOr Ami * @param dev 120962072098SOr Ami * Pointer to Ethernet device structure. 121062072098SOr Ami * 121162072098SOr Ami * @return 121262072098SOr Ami * 0 on success, errno value on failure. 121362072098SOr Ami */ 121462072098SOr Ami int 121562072098SOr Ami mlx5_set_link_up(struct rte_eth_dev *dev) 121662072098SOr Ami { 121762072098SOr Ami struct priv *priv = dev->data->dev_private; 121862072098SOr Ami int err; 121962072098SOr Ami 122062072098SOr Ami priv_lock(priv); 122162072098SOr Ami err = priv_set_link(priv, 1); 122262072098SOr Ami priv_unlock(priv); 122362072098SOr Ami return err; 122462072098SOr Ami } 1225a48deadaSOr Ami 1226a48deadaSOr Ami /** 1227a48deadaSOr Ami * Configure secondary process queues from a private data pointer (primary 1228a48deadaSOr Ami * or secondary) and update burst callbacks. Can take place only once. 1229a48deadaSOr Ami * 1230a48deadaSOr Ami * All queues must have been previously created by the primary process to 1231a48deadaSOr Ami * avoid undefined behavior. 1232a48deadaSOr Ami * 1233a48deadaSOr Ami * @param priv 1234a48deadaSOr Ami * Private data pointer from either primary or secondary process. 1235a48deadaSOr Ami * 1236a48deadaSOr Ami * @return 1237a48deadaSOr Ami * Private data pointer from secondary process, NULL in case of error. 1238a48deadaSOr Ami */ 1239a48deadaSOr Ami struct priv * 1240a48deadaSOr Ami mlx5_secondary_data_setup(struct priv *priv) 1241a48deadaSOr Ami { 1242a48deadaSOr Ami unsigned int port_id = 0; 1243a48deadaSOr Ami struct mlx5_secondary_data *sd; 1244a48deadaSOr Ami void **tx_queues; 1245a48deadaSOr Ami void **rx_queues; 1246a48deadaSOr Ami unsigned int nb_tx_queues; 1247a48deadaSOr Ami unsigned int nb_rx_queues; 1248a48deadaSOr Ami unsigned int i; 1249a48deadaSOr Ami 1250a48deadaSOr Ami /* priv must be valid at this point. */ 1251a48deadaSOr Ami assert(priv != NULL); 1252a48deadaSOr Ami /* priv->dev must also be valid but may point to local memory from 1253a48deadaSOr Ami * another process, possibly with the same address and must not 1254a48deadaSOr Ami * be dereferenced yet. */ 1255a48deadaSOr Ami assert(priv->dev != NULL); 1256a48deadaSOr Ami /* Determine port ID by finding out where priv comes from. */ 1257a48deadaSOr Ami while (1) { 1258a48deadaSOr Ami sd = &mlx5_secondary_data[port_id]; 1259a48deadaSOr Ami rte_spinlock_lock(&sd->lock); 1260a48deadaSOr Ami /* Primary process? */ 1261a48deadaSOr Ami if (sd->primary_priv == priv) 1262a48deadaSOr Ami break; 1263a48deadaSOr Ami /* Secondary process? */ 1264a48deadaSOr Ami if (sd->data.dev_private == priv) 1265a48deadaSOr Ami break; 1266a48deadaSOr Ami rte_spinlock_unlock(&sd->lock); 1267a48deadaSOr Ami if (++port_id == RTE_DIM(mlx5_secondary_data)) 1268a48deadaSOr Ami port_id = 0; 1269a48deadaSOr Ami } 1270a48deadaSOr Ami /* Switch to secondary private structure. If private data has already 1271a48deadaSOr Ami * been updated by another thread, there is nothing else to do. */ 1272a48deadaSOr Ami priv = sd->data.dev_private; 1273a48deadaSOr Ami if (priv->dev->data == &sd->data) 1274a48deadaSOr Ami goto end; 1275a48deadaSOr Ami /* Sanity checks. Secondary private structure is supposed to point 1276a48deadaSOr Ami * to local eth_dev, itself still pointing to the shared device data 1277a48deadaSOr Ami * structure allocated by the primary process. */ 1278a48deadaSOr Ami assert(sd->shared_dev_data != &sd->data); 1279a48deadaSOr Ami assert(sd->data.nb_tx_queues == 0); 1280a48deadaSOr Ami assert(sd->data.tx_queues == NULL); 1281a48deadaSOr Ami assert(sd->data.nb_rx_queues == 0); 1282a48deadaSOr Ami assert(sd->data.rx_queues == NULL); 1283a48deadaSOr Ami assert(priv != sd->primary_priv); 1284a48deadaSOr Ami assert(priv->dev->data == sd->shared_dev_data); 1285a48deadaSOr Ami assert(priv->txqs_n == 0); 1286a48deadaSOr Ami assert(priv->txqs == NULL); 1287a48deadaSOr Ami assert(priv->rxqs_n == 0); 1288a48deadaSOr Ami assert(priv->rxqs == NULL); 1289a48deadaSOr Ami nb_tx_queues = sd->shared_dev_data->nb_tx_queues; 1290a48deadaSOr Ami nb_rx_queues = sd->shared_dev_data->nb_rx_queues; 1291a48deadaSOr Ami /* Allocate local storage for queues. */ 1292a48deadaSOr Ami tx_queues = rte_zmalloc("secondary ethdev->tx_queues", 1293a48deadaSOr Ami sizeof(sd->data.tx_queues[0]) * nb_tx_queues, 1294a48deadaSOr Ami RTE_CACHE_LINE_SIZE); 1295a48deadaSOr Ami rx_queues = rte_zmalloc("secondary ethdev->rx_queues", 1296a48deadaSOr Ami sizeof(sd->data.rx_queues[0]) * nb_rx_queues, 1297a48deadaSOr Ami RTE_CACHE_LINE_SIZE); 1298a48deadaSOr Ami if (tx_queues == NULL || rx_queues == NULL) 1299a48deadaSOr Ami goto error; 1300a48deadaSOr Ami /* Lock to prevent control operations during setup. */ 1301a48deadaSOr Ami priv_lock(priv); 1302a48deadaSOr Ami /* TX queues. */ 1303a48deadaSOr Ami for (i = 0; i != nb_tx_queues; ++i) { 1304a48deadaSOr Ami struct txq *primary_txq = (*sd->primary_priv->txqs)[i]; 130521c8bb49SNélio Laranjeiro struct txq_ctrl *primary_txq_ctrl; 130621c8bb49SNélio Laranjeiro struct txq_ctrl *txq_ctrl; 1307a48deadaSOr Ami 1308a48deadaSOr Ami if (primary_txq == NULL) 1309a48deadaSOr Ami continue; 131021c8bb49SNélio Laranjeiro primary_txq_ctrl = container_of(primary_txq, 131121c8bb49SNélio Laranjeiro struct txq_ctrl, txq); 131221c8bb49SNélio Laranjeiro txq_ctrl = rte_calloc_socket("TXQ", 1, sizeof(*txq_ctrl), 0, 131321c8bb49SNélio Laranjeiro primary_txq_ctrl->socket); 131421c8bb49SNélio Laranjeiro if (txq_ctrl != NULL) { 13151d88ba17SNélio Laranjeiro if (txq_ctrl_setup(priv->dev, 131621c8bb49SNélio Laranjeiro primary_txq_ctrl, 1317*b4b12e55SNélio Laranjeiro 1 << primary_txq->elts_n, 131821c8bb49SNélio Laranjeiro primary_txq_ctrl->socket, 1319a48deadaSOr Ami NULL) == 0) { 132021c8bb49SNélio Laranjeiro txq_ctrl->txq.stats.idx = 132121c8bb49SNélio Laranjeiro primary_txq->stats.idx; 132221c8bb49SNélio Laranjeiro tx_queues[i] = &txq_ctrl->txq; 1323a48deadaSOr Ami continue; 1324a48deadaSOr Ami } 132521c8bb49SNélio Laranjeiro rte_free(txq_ctrl); 1326a48deadaSOr Ami } 1327a48deadaSOr Ami while (i) { 132821c8bb49SNélio Laranjeiro txq_ctrl = tx_queues[--i]; 132921c8bb49SNélio Laranjeiro txq_cleanup(txq_ctrl); 133021c8bb49SNélio Laranjeiro rte_free(txq_ctrl); 1331a48deadaSOr Ami } 1332a48deadaSOr Ami goto error; 1333a48deadaSOr Ami } 1334a48deadaSOr Ami /* RX queues. */ 1335a48deadaSOr Ami for (i = 0; i != nb_rx_queues; ++i) { 13366218063bSNélio Laranjeiro struct rxq_ctrl *primary_rxq = 13376218063bSNélio Laranjeiro container_of((*sd->primary_priv->rxqs)[i], 13386218063bSNélio Laranjeiro struct rxq_ctrl, rxq); 1339a48deadaSOr Ami 1340a48deadaSOr Ami if (primary_rxq == NULL) 1341a48deadaSOr Ami continue; 1342a48deadaSOr Ami /* Not supported yet. */ 1343a48deadaSOr Ami rx_queues[i] = NULL; 1344a48deadaSOr Ami } 1345a48deadaSOr Ami /* Update everything. */ 1346a48deadaSOr Ami priv->txqs = (void *)tx_queues; 1347a48deadaSOr Ami priv->txqs_n = nb_tx_queues; 1348a48deadaSOr Ami priv->rxqs = (void *)rx_queues; 1349a48deadaSOr Ami priv->rxqs_n = nb_rx_queues; 1350a48deadaSOr Ami sd->data.rx_queues = rx_queues; 1351a48deadaSOr Ami sd->data.tx_queues = tx_queues; 1352a48deadaSOr Ami sd->data.nb_rx_queues = nb_rx_queues; 1353a48deadaSOr Ami sd->data.nb_tx_queues = nb_tx_queues; 1354a48deadaSOr Ami sd->data.dev_link = sd->shared_dev_data->dev_link; 1355a48deadaSOr Ami sd->data.mtu = sd->shared_dev_data->mtu; 1356a48deadaSOr Ami memcpy(sd->data.rx_queue_state, sd->shared_dev_data->rx_queue_state, 1357a48deadaSOr Ami sizeof(sd->data.rx_queue_state)); 1358a48deadaSOr Ami memcpy(sd->data.tx_queue_state, sd->shared_dev_data->tx_queue_state, 1359a48deadaSOr Ami sizeof(sd->data.tx_queue_state)); 1360a48deadaSOr Ami sd->data.dev_flags = sd->shared_dev_data->dev_flags; 1361a48deadaSOr Ami /* Use local data from now on. */ 1362a48deadaSOr Ami rte_mb(); 1363a48deadaSOr Ami priv->dev->data = &sd->data; 1364a48deadaSOr Ami rte_mb(); 1365cdab90cbSNélio Laranjeiro priv_select_tx_function(priv); 1366cdab90cbSNélio Laranjeiro priv_select_rx_function(priv); 1367a48deadaSOr Ami priv_unlock(priv); 1368a48deadaSOr Ami end: 1369a48deadaSOr Ami /* More sanity checks. */ 1370a48deadaSOr Ami assert(priv->dev->data == &sd->data); 1371a48deadaSOr Ami rte_spinlock_unlock(&sd->lock); 1372a48deadaSOr Ami return priv; 1373a48deadaSOr Ami error: 1374a48deadaSOr Ami priv_unlock(priv); 1375a48deadaSOr Ami rte_free(tx_queues); 1376a48deadaSOr Ami rte_free(rx_queues); 1377a48deadaSOr Ami rte_spinlock_unlock(&sd->lock); 1378a48deadaSOr Ami return NULL; 1379a48deadaSOr Ami } 1380cdab90cbSNélio Laranjeiro 1381cdab90cbSNélio Laranjeiro /** 1382cdab90cbSNélio Laranjeiro * Configure the TX function to use. 1383cdab90cbSNélio Laranjeiro * 1384cdab90cbSNélio Laranjeiro * @param priv 1385cdab90cbSNélio Laranjeiro * Pointer to private structure. 1386cdab90cbSNélio Laranjeiro */ 1387cdab90cbSNélio Laranjeiro void 1388cdab90cbSNélio Laranjeiro priv_select_tx_function(struct priv *priv) 1389cdab90cbSNélio Laranjeiro { 1390cdab90cbSNélio Laranjeiro priv->dev->tx_pkt_burst = mlx5_tx_burst; 1391230189d9SNélio Laranjeiro /* Display warning for unsupported configurations. */ 1392230189d9SNélio Laranjeiro if (priv->sriov && priv->mps) 1393230189d9SNélio Laranjeiro WARN("multi-packet send WQE cannot be used on a SR-IOV setup"); 1394230189d9SNélio Laranjeiro /* Select appropriate TX function. */ 1395230189d9SNélio Laranjeiro if ((priv->sriov == 0) && priv->mps && priv->txq_inline) { 1396230189d9SNélio Laranjeiro priv->dev->tx_pkt_burst = mlx5_tx_burst_mpw_inline; 1397230189d9SNélio Laranjeiro DEBUG("selected MPW inline TX function"); 1398230189d9SNélio Laranjeiro } else if ((priv->sriov == 0) && priv->mps) { 1399230189d9SNélio Laranjeiro priv->dev->tx_pkt_burst = mlx5_tx_burst_mpw; 1400230189d9SNélio Laranjeiro DEBUG("selected MPW TX function"); 14012a66cf37SYaacov Hazan } 1402cdab90cbSNélio Laranjeiro } 1403cdab90cbSNélio Laranjeiro 1404cdab90cbSNélio Laranjeiro /** 1405cdab90cbSNélio Laranjeiro * Configure the RX function to use. 1406cdab90cbSNélio Laranjeiro * 1407cdab90cbSNélio Laranjeiro * @param priv 1408cdab90cbSNélio Laranjeiro * Pointer to private structure. 1409cdab90cbSNélio Laranjeiro */ 1410cdab90cbSNélio Laranjeiro void 1411cdab90cbSNélio Laranjeiro priv_select_rx_function(struct priv *priv) 1412cdab90cbSNélio Laranjeiro { 1413cdab90cbSNélio Laranjeiro priv->dev->rx_pkt_burst = mlx5_rx_burst; 1414cdab90cbSNélio Laranjeiro } 1415