179aa4307SOphir Munk /* SPDX-License-Identifier: BSD-3-Clause 279aa4307SOphir Munk * Copyright 2020 Mellanox Technologies, Ltd 379aa4307SOphir Munk */ 479aa4307SOphir Munk 579aa4307SOphir Munk #include <unistd.h> 679aa4307SOphir Munk #include <string.h> 779aa4307SOphir Munk #include <stdio.h> 879aa4307SOphir Munk #ifdef RTE_IBVERBS_LINK_DLOPEN 979aa4307SOphir Munk #include <dlfcn.h> 1079aa4307SOphir Munk #endif 11*aec086c9SMatan Azrad #include <dirent.h> 12*aec086c9SMatan Azrad #include <net/if.h> 1379aa4307SOphir Munk 1479aa4307SOphir Munk #include <rte_errno.h> 15*aec086c9SMatan Azrad #include <rte_string_fns.h> 1679aa4307SOphir Munk 1779aa4307SOphir Munk #include "mlx5_common.h" 1879aa4307SOphir Munk #include "mlx5_common_utils.h" 1979aa4307SOphir Munk #include "mlx5_glue.h" 2079aa4307SOphir Munk 2179aa4307SOphir Munk #ifdef MLX5_GLUE 2279aa4307SOphir Munk const struct mlx5_glue *mlx5_glue; 2379aa4307SOphir Munk #endif 2479aa4307SOphir Munk 2579aa4307SOphir Munk /** 2679aa4307SOphir Munk * Get PCI information by sysfs device path. 2779aa4307SOphir Munk * 2879aa4307SOphir Munk * @param dev_path 2979aa4307SOphir Munk * Pointer to device sysfs folder name. 3079aa4307SOphir Munk * @param[out] pci_addr 3179aa4307SOphir Munk * PCI bus address output buffer. 3279aa4307SOphir Munk * 3379aa4307SOphir Munk * @return 3479aa4307SOphir Munk * 0 on success, a negative errno value otherwise and rte_errno is set. 3579aa4307SOphir Munk */ 3679aa4307SOphir Munk int 3779aa4307SOphir Munk mlx5_dev_to_pci_addr(const char *dev_path, 3879aa4307SOphir Munk struct rte_pci_addr *pci_addr) 3979aa4307SOphir Munk { 4079aa4307SOphir Munk FILE *file; 4179aa4307SOphir Munk char line[32]; 4279aa4307SOphir Munk MKSTR(path, "%s/device/uevent", dev_path); 4379aa4307SOphir Munk 4479aa4307SOphir Munk file = fopen(path, "rb"); 4579aa4307SOphir Munk if (file == NULL) { 4679aa4307SOphir Munk rte_errno = errno; 4779aa4307SOphir Munk return -rte_errno; 4879aa4307SOphir Munk } 4979aa4307SOphir Munk while (fgets(line, sizeof(line), file) == line) { 5079aa4307SOphir Munk size_t len = strlen(line); 5179aa4307SOphir Munk int ret; 5279aa4307SOphir Munk 5379aa4307SOphir Munk /* Truncate long lines. */ 5479aa4307SOphir Munk if (len == (sizeof(line) - 1)) 5579aa4307SOphir Munk while (line[(len - 1)] != '\n') { 5679aa4307SOphir Munk ret = fgetc(file); 5779aa4307SOphir Munk if (ret == EOF) 5879aa4307SOphir Munk break; 5979aa4307SOphir Munk line[(len - 1)] = ret; 6079aa4307SOphir Munk } 6179aa4307SOphir Munk /* Extract information. */ 6279aa4307SOphir Munk if (sscanf(line, 6379aa4307SOphir Munk "PCI_SLOT_NAME=" 6479aa4307SOphir Munk "%" SCNx32 ":%" SCNx8 ":%" SCNx8 ".%" SCNx8 "\n", 6579aa4307SOphir Munk &pci_addr->domain, 6679aa4307SOphir Munk &pci_addr->bus, 6779aa4307SOphir Munk &pci_addr->devid, 6879aa4307SOphir Munk &pci_addr->function) == 4) { 6979aa4307SOphir Munk ret = 0; 7079aa4307SOphir Munk break; 7179aa4307SOphir Munk } 7279aa4307SOphir Munk } 7379aa4307SOphir Munk fclose(file); 7479aa4307SOphir Munk return 0; 7579aa4307SOphir Munk } 7679aa4307SOphir Munk 7779aa4307SOphir Munk /** 7879aa4307SOphir Munk * Extract port name, as a number, from sysfs or netlink information. 7979aa4307SOphir Munk * 8079aa4307SOphir Munk * @param[in] port_name_in 8179aa4307SOphir Munk * String representing the port name. 8279aa4307SOphir Munk * @param[out] port_info_out 8379aa4307SOphir Munk * Port information, including port name as a number and port name 8479aa4307SOphir Munk * type if recognized 8579aa4307SOphir Munk * 8679aa4307SOphir Munk * @return 8779aa4307SOphir Munk * port_name field set according to recognized name format. 8879aa4307SOphir Munk */ 8979aa4307SOphir Munk void 9079aa4307SOphir Munk mlx5_translate_port_name(const char *port_name_in, 9179aa4307SOphir Munk struct mlx5_switch_info *port_info_out) 9279aa4307SOphir Munk { 9379aa4307SOphir Munk char pf_c1, pf_c2, vf_c1, vf_c2; 9479aa4307SOphir Munk char *end; 9579aa4307SOphir Munk int sc_items; 9679aa4307SOphir Munk 9779aa4307SOphir Munk /* 9879aa4307SOphir Munk * Check for port-name as a string of the form pf0vf0 9979aa4307SOphir Munk * (support kernel ver >= 5.0 or OFED ver >= 4.6). 10079aa4307SOphir Munk */ 10179aa4307SOphir Munk sc_items = sscanf(port_name_in, "%c%c%d%c%c%d", 10279aa4307SOphir Munk &pf_c1, &pf_c2, &port_info_out->pf_num, 10379aa4307SOphir Munk &vf_c1, &vf_c2, &port_info_out->port_name); 10479aa4307SOphir Munk if (sc_items == 6 && 10579aa4307SOphir Munk pf_c1 == 'p' && pf_c2 == 'f' && 10679aa4307SOphir Munk vf_c1 == 'v' && vf_c2 == 'f') { 10779aa4307SOphir Munk port_info_out->name_type = MLX5_PHYS_PORT_NAME_TYPE_PFVF; 10879aa4307SOphir Munk return; 10979aa4307SOphir Munk } 11079aa4307SOphir Munk /* 11179aa4307SOphir Munk * Check for port-name as a string of the form p0 11279aa4307SOphir Munk * (support kernel ver >= 5.0, or OFED ver >= 4.6). 11379aa4307SOphir Munk */ 11479aa4307SOphir Munk sc_items = sscanf(port_name_in, "%c%d", 11579aa4307SOphir Munk &pf_c1, &port_info_out->port_name); 11679aa4307SOphir Munk if (sc_items == 2 && pf_c1 == 'p') { 11779aa4307SOphir Munk port_info_out->name_type = MLX5_PHYS_PORT_NAME_TYPE_UPLINK; 11879aa4307SOphir Munk return; 11979aa4307SOphir Munk } 12079aa4307SOphir Munk /* Check for port-name as a number (support kernel ver < 5.0 */ 12179aa4307SOphir Munk errno = 0; 12279aa4307SOphir Munk port_info_out->port_name = strtol(port_name_in, &end, 0); 12379aa4307SOphir Munk if (!errno && 12479aa4307SOphir Munk (size_t)(end - port_name_in) == strlen(port_name_in)) { 12579aa4307SOphir Munk port_info_out->name_type = MLX5_PHYS_PORT_NAME_TYPE_LEGACY; 12679aa4307SOphir Munk return; 12779aa4307SOphir Munk } 12879aa4307SOphir Munk port_info_out->name_type = MLX5_PHYS_PORT_NAME_TYPE_UNKNOWN; 12979aa4307SOphir Munk } 13079aa4307SOphir Munk 131*aec086c9SMatan Azrad /** 132*aec086c9SMatan Azrad * Get kernel interface name from IB device path. 133*aec086c9SMatan Azrad * 134*aec086c9SMatan Azrad * @param[in] ibdev_path 135*aec086c9SMatan Azrad * Pointer to IB device path. 136*aec086c9SMatan Azrad * @param[out] ifname 137*aec086c9SMatan Azrad * Interface name output buffer. 138*aec086c9SMatan Azrad * 139*aec086c9SMatan Azrad * @return 140*aec086c9SMatan Azrad * 0 on success, a negative errno value otherwise and rte_errno is set. 141*aec086c9SMatan Azrad */ 142*aec086c9SMatan Azrad int 143*aec086c9SMatan Azrad mlx5_get_ifname_sysfs(const char *ibdev_path, char *ifname) 144*aec086c9SMatan Azrad { 145*aec086c9SMatan Azrad DIR *dir; 146*aec086c9SMatan Azrad struct dirent *dent; 147*aec086c9SMatan Azrad unsigned int dev_type = 0; 148*aec086c9SMatan Azrad unsigned int dev_port_prev = ~0u; 149*aec086c9SMatan Azrad char match[IF_NAMESIZE] = ""; 150*aec086c9SMatan Azrad 151*aec086c9SMatan Azrad MLX5_ASSERT(ibdev_path); 152*aec086c9SMatan Azrad { 153*aec086c9SMatan Azrad MKSTR(path, "%s/device/net", ibdev_path); 154*aec086c9SMatan Azrad 155*aec086c9SMatan Azrad dir = opendir(path); 156*aec086c9SMatan Azrad if (dir == NULL) { 157*aec086c9SMatan Azrad rte_errno = errno; 158*aec086c9SMatan Azrad return -rte_errno; 159*aec086c9SMatan Azrad } 160*aec086c9SMatan Azrad } 161*aec086c9SMatan Azrad while ((dent = readdir(dir)) != NULL) { 162*aec086c9SMatan Azrad char *name = dent->d_name; 163*aec086c9SMatan Azrad FILE *file; 164*aec086c9SMatan Azrad unsigned int dev_port; 165*aec086c9SMatan Azrad int r; 166*aec086c9SMatan Azrad 167*aec086c9SMatan Azrad if ((name[0] == '.') && 168*aec086c9SMatan Azrad ((name[1] == '\0') || 169*aec086c9SMatan Azrad ((name[1] == '.') && (name[2] == '\0')))) 170*aec086c9SMatan Azrad continue; 171*aec086c9SMatan Azrad 172*aec086c9SMatan Azrad MKSTR(path, "%s/device/net/%s/%s", 173*aec086c9SMatan Azrad ibdev_path, name, 174*aec086c9SMatan Azrad (dev_type ? "dev_id" : "dev_port")); 175*aec086c9SMatan Azrad 176*aec086c9SMatan Azrad file = fopen(path, "rb"); 177*aec086c9SMatan Azrad if (file == NULL) { 178*aec086c9SMatan Azrad if (errno != ENOENT) 179*aec086c9SMatan Azrad continue; 180*aec086c9SMatan Azrad /* 181*aec086c9SMatan Azrad * Switch to dev_id when dev_port does not exist as 182*aec086c9SMatan Azrad * is the case with Linux kernel versions < 3.15. 183*aec086c9SMatan Azrad */ 184*aec086c9SMatan Azrad try_dev_id: 185*aec086c9SMatan Azrad match[0] = '\0'; 186*aec086c9SMatan Azrad if (dev_type) 187*aec086c9SMatan Azrad break; 188*aec086c9SMatan Azrad dev_type = 1; 189*aec086c9SMatan Azrad dev_port_prev = ~0u; 190*aec086c9SMatan Azrad rewinddir(dir); 191*aec086c9SMatan Azrad continue; 192*aec086c9SMatan Azrad } 193*aec086c9SMatan Azrad r = fscanf(file, (dev_type ? "%x" : "%u"), &dev_port); 194*aec086c9SMatan Azrad fclose(file); 195*aec086c9SMatan Azrad if (r != 1) 196*aec086c9SMatan Azrad continue; 197*aec086c9SMatan Azrad /* 198*aec086c9SMatan Azrad * Switch to dev_id when dev_port returns the same value for 199*aec086c9SMatan Azrad * all ports. May happen when using a MOFED release older than 200*aec086c9SMatan Azrad * 3.0 with a Linux kernel >= 3.15. 201*aec086c9SMatan Azrad */ 202*aec086c9SMatan Azrad if (dev_port == dev_port_prev) 203*aec086c9SMatan Azrad goto try_dev_id; 204*aec086c9SMatan Azrad dev_port_prev = dev_port; 205*aec086c9SMatan Azrad if (dev_port == 0) 206*aec086c9SMatan Azrad strlcpy(match, name, IF_NAMESIZE); 207*aec086c9SMatan Azrad } 208*aec086c9SMatan Azrad closedir(dir); 209*aec086c9SMatan Azrad if (match[0] == '\0') { 210*aec086c9SMatan Azrad rte_errno = ENOENT; 211*aec086c9SMatan Azrad return -rte_errno; 212*aec086c9SMatan Azrad } 213*aec086c9SMatan Azrad strncpy(ifname, match, IF_NAMESIZE); 214*aec086c9SMatan Azrad return 0; 215*aec086c9SMatan Azrad } 216*aec086c9SMatan Azrad 21779aa4307SOphir Munk #ifdef MLX5_GLUE 21879aa4307SOphir Munk 21979aa4307SOphir Munk /** 22079aa4307SOphir Munk * Suffix RTE_EAL_PMD_PATH with "-glue". 22179aa4307SOphir Munk * 22279aa4307SOphir Munk * This function performs a sanity check on RTE_EAL_PMD_PATH before 22379aa4307SOphir Munk * suffixing its last component. 22479aa4307SOphir Munk * 22579aa4307SOphir Munk * @param buf[out] 22679aa4307SOphir Munk * Output buffer, should be large enough otherwise NULL is returned. 22779aa4307SOphir Munk * @param size 22879aa4307SOphir Munk * Size of @p out. 22979aa4307SOphir Munk * 23079aa4307SOphir Munk * @return 23179aa4307SOphir Munk * Pointer to @p buf or @p NULL in case suffix cannot be appended. 23279aa4307SOphir Munk */ 23379aa4307SOphir Munk static char * 23479aa4307SOphir Munk mlx5_glue_path(char *buf, size_t size) 23579aa4307SOphir Munk { 23679aa4307SOphir Munk static const char *const bad[] = { "/", ".", "..", NULL }; 23779aa4307SOphir Munk const char *path = RTE_EAL_PMD_PATH; 23879aa4307SOphir Munk size_t len = strlen(path); 23979aa4307SOphir Munk size_t off; 24079aa4307SOphir Munk int i; 24179aa4307SOphir Munk 24279aa4307SOphir Munk while (len && path[len - 1] == '/') 24379aa4307SOphir Munk --len; 24479aa4307SOphir Munk for (off = len; off && path[off - 1] != '/'; --off) 24579aa4307SOphir Munk ; 24679aa4307SOphir Munk for (i = 0; bad[i]; ++i) 24779aa4307SOphir Munk if (!strncmp(path + off, bad[i], (int)(len - off))) 24879aa4307SOphir Munk goto error; 24979aa4307SOphir Munk i = snprintf(buf, size, "%.*s-glue", (int)len, path); 25079aa4307SOphir Munk if (i == -1 || (size_t)i >= size) 25179aa4307SOphir Munk goto error; 25279aa4307SOphir Munk return buf; 25379aa4307SOphir Munk error: 25479aa4307SOphir Munk RTE_LOG(ERR, PMD, "unable to append \"-glue\" to last component of" 25579aa4307SOphir Munk " RTE_EAL_PMD_PATH (\"" RTE_EAL_PMD_PATH "\"), please" 25679aa4307SOphir Munk " re-configure DPDK"); 25779aa4307SOphir Munk return NULL; 25879aa4307SOphir Munk } 25979aa4307SOphir Munk 26079aa4307SOphir Munk static int 26179aa4307SOphir Munk mlx5_glue_dlopen(void) 26279aa4307SOphir Munk { 26379aa4307SOphir Munk char glue_path[sizeof(RTE_EAL_PMD_PATH) - 1 + sizeof("-glue")]; 26479aa4307SOphir Munk void *handle = NULL; 26579aa4307SOphir Munk 26679aa4307SOphir Munk char const *path[] = { 26779aa4307SOphir Munk /* 26879aa4307SOphir Munk * A basic security check is necessary before trusting 26979aa4307SOphir Munk * MLX5_GLUE_PATH, which may override RTE_EAL_PMD_PATH. 27079aa4307SOphir Munk */ 27179aa4307SOphir Munk (geteuid() == getuid() && getegid() == getgid() ? 27279aa4307SOphir Munk getenv("MLX5_GLUE_PATH") : NULL), 27379aa4307SOphir Munk /* 27479aa4307SOphir Munk * When RTE_EAL_PMD_PATH is set, use its glue-suffixed 27579aa4307SOphir Munk * variant, otherwise let dlopen() look up libraries on its 27679aa4307SOphir Munk * own. 27779aa4307SOphir Munk */ 27879aa4307SOphir Munk (*RTE_EAL_PMD_PATH ? 27979aa4307SOphir Munk mlx5_glue_path(glue_path, sizeof(glue_path)) : ""), 28079aa4307SOphir Munk }; 28179aa4307SOphir Munk unsigned int i = 0; 28279aa4307SOphir Munk void **sym; 28379aa4307SOphir Munk const char *dlmsg; 28479aa4307SOphir Munk 28579aa4307SOphir Munk while (!handle && i != RTE_DIM(path)) { 28679aa4307SOphir Munk const char *end; 28779aa4307SOphir Munk size_t len; 28879aa4307SOphir Munk int ret; 28979aa4307SOphir Munk 29079aa4307SOphir Munk if (!path[i]) { 29179aa4307SOphir Munk ++i; 29279aa4307SOphir Munk continue; 29379aa4307SOphir Munk } 29479aa4307SOphir Munk end = strpbrk(path[i], ":;"); 29579aa4307SOphir Munk if (!end) 29679aa4307SOphir Munk end = path[i] + strlen(path[i]); 29779aa4307SOphir Munk len = end - path[i]; 29879aa4307SOphir Munk ret = 0; 29979aa4307SOphir Munk do { 30079aa4307SOphir Munk char name[ret + 1]; 30179aa4307SOphir Munk 30279aa4307SOphir Munk ret = snprintf(name, sizeof(name), "%.*s%s" MLX5_GLUE, 30379aa4307SOphir Munk (int)len, path[i], 30479aa4307SOphir Munk (!len || *(end - 1) == '/') ? "" : "/"); 30579aa4307SOphir Munk if (ret == -1) 30679aa4307SOphir Munk break; 30779aa4307SOphir Munk if (sizeof(name) != (size_t)ret + 1) 30879aa4307SOphir Munk continue; 30979aa4307SOphir Munk DRV_LOG(DEBUG, "Looking for rdma-core glue as " 31079aa4307SOphir Munk "\"%s\"", name); 31179aa4307SOphir Munk handle = dlopen(name, RTLD_LAZY); 31279aa4307SOphir Munk break; 31379aa4307SOphir Munk } while (1); 31479aa4307SOphir Munk path[i] = end + 1; 31579aa4307SOphir Munk if (!*end) 31679aa4307SOphir Munk ++i; 31779aa4307SOphir Munk } 31879aa4307SOphir Munk if (!handle) { 31979aa4307SOphir Munk rte_errno = EINVAL; 32079aa4307SOphir Munk dlmsg = dlerror(); 32179aa4307SOphir Munk if (dlmsg) 32279aa4307SOphir Munk DRV_LOG(WARNING, "Cannot load glue library: %s", dlmsg); 32379aa4307SOphir Munk goto glue_error; 32479aa4307SOphir Munk } 32579aa4307SOphir Munk sym = dlsym(handle, "mlx5_glue"); 32679aa4307SOphir Munk if (!sym || !*sym) { 32779aa4307SOphir Munk rte_errno = EINVAL; 32879aa4307SOphir Munk dlmsg = dlerror(); 32979aa4307SOphir Munk if (dlmsg) 33079aa4307SOphir Munk DRV_LOG(ERR, "Cannot resolve glue symbol: %s", dlmsg); 33179aa4307SOphir Munk goto glue_error; 33279aa4307SOphir Munk } 33379aa4307SOphir Munk mlx5_glue = *sym; 33479aa4307SOphir Munk return 0; 33579aa4307SOphir Munk 33679aa4307SOphir Munk glue_error: 33779aa4307SOphir Munk if (handle) 33879aa4307SOphir Munk dlclose(handle); 33979aa4307SOphir Munk return -1; 34079aa4307SOphir Munk } 34179aa4307SOphir Munk 34279aa4307SOphir Munk #endif 34379aa4307SOphir Munk 34479aa4307SOphir Munk /** 34579aa4307SOphir Munk * Initialization routine for run-time dependency on rdma-core. 34679aa4307SOphir Munk */ 34779aa4307SOphir Munk void 34879aa4307SOphir Munk mlx5_glue_constructor(void) 34979aa4307SOphir Munk { 35079aa4307SOphir Munk /* 35179aa4307SOphir Munk * RDMAV_HUGEPAGES_SAFE tells ibv_fork_init() we intend to use 35279aa4307SOphir Munk * huge pages. Calling ibv_fork_init() during init allows 35379aa4307SOphir Munk * applications to use fork() safely for purposes other than 35479aa4307SOphir Munk * using this PMD, which is not supported in forked processes. 35579aa4307SOphir Munk */ 35679aa4307SOphir Munk setenv("RDMAV_HUGEPAGES_SAFE", "1", 1); 35779aa4307SOphir Munk /* Match the size of Rx completion entry to the size of a cacheline. */ 35879aa4307SOphir Munk if (RTE_CACHE_LINE_SIZE == 128) 35979aa4307SOphir Munk setenv("MLX5_CQE_SIZE", "128", 0); 36079aa4307SOphir Munk /* 36179aa4307SOphir Munk * MLX5_DEVICE_FATAL_CLEANUP tells ibv_destroy functions to 36279aa4307SOphir Munk * cleanup all the Verbs resources even when the device was removed. 36379aa4307SOphir Munk */ 36479aa4307SOphir Munk setenv("MLX5_DEVICE_FATAL_CLEANUP", "1", 1); 36579aa4307SOphir Munk 36679aa4307SOphir Munk #ifdef MLX5_GLUE 36779aa4307SOphir Munk if (mlx5_glue_dlopen() != 0) 36879aa4307SOphir Munk goto glue_error; 36979aa4307SOphir Munk #endif 37079aa4307SOphir Munk 37179aa4307SOphir Munk #ifdef RTE_LIBRTE_MLX5_DEBUG 37279aa4307SOphir Munk /* Glue structure must not contain any NULL pointers. */ 37379aa4307SOphir Munk { 37479aa4307SOphir Munk unsigned int i; 37579aa4307SOphir Munk 37679aa4307SOphir Munk for (i = 0; i != sizeof(*mlx5_glue) / sizeof(void *); ++i) 37779aa4307SOphir Munk MLX5_ASSERT(((const void *const *)mlx5_glue)[i]); 37879aa4307SOphir Munk } 37979aa4307SOphir Munk #endif 38079aa4307SOphir Munk if (strcmp(mlx5_glue->version, MLX5_GLUE_VERSION)) { 38179aa4307SOphir Munk rte_errno = EINVAL; 38279aa4307SOphir Munk DRV_LOG(ERR, "rdma-core glue \"%s\" mismatch: \"%s\" is " 38379aa4307SOphir Munk "required", mlx5_glue->version, MLX5_GLUE_VERSION); 38479aa4307SOphir Munk goto glue_error; 38579aa4307SOphir Munk } 38679aa4307SOphir Munk mlx5_glue->fork_init(); 38779aa4307SOphir Munk return; 38879aa4307SOphir Munk 38979aa4307SOphir Munk glue_error: 39079aa4307SOphir Munk DRV_LOG(WARNING, "Cannot initialize MLX5 common due to missing" 39179aa4307SOphir Munk " run-time dependency on rdma-core libraries (libibverbs," 39279aa4307SOphir Munk " libmlx5)"); 39379aa4307SOphir Munk mlx5_glue = NULL; 39479aa4307SOphir Munk } 395