17b4f1e6bSMatan Azrad /* SPDX-License-Identifier: BSD-3-Clause 27b4f1e6bSMatan Azrad * Copyright 2019 Mellanox Technologies, Ltd 37b4f1e6bSMatan Azrad */ 47b4f1e6bSMatan Azrad 57b4f1e6bSMatan Azrad #include <unistd.h> 67b4f1e6bSMatan Azrad #include <string.h> 793e30982SMatan Azrad #include <stdio.h> 87b4f1e6bSMatan Azrad 97b4f1e6bSMatan Azrad #include <rte_errno.h> 10262c7ad0SOri Kam #include <rte_mempool.h> 11ad435d32SXueming Li #include <rte_class.h> 12ad435d32SXueming Li #include <rte_malloc.h> 137b4f1e6bSMatan Azrad 147b4f1e6bSMatan Azrad #include "mlx5_common.h" 15262c7ad0SOri Kam #include "mlx5_common_os.h" 1625245d5dSShiri Kuzin #include "mlx5_common_log.h" 178a41f4deSParav Pandit #include "mlx5_common_pci.h" 18ad435d32SXueming Li #include "mlx5_common_private.h" 197b4f1e6bSMatan Azrad 204c204fe5SShiri Kuzin uint8_t haswell_broadwell_cpu; 214c204fe5SShiri Kuzin 224c204fe5SShiri Kuzin /* In case this is an x86_64 intel processor to check if 234c204fe5SShiri Kuzin * we should use relaxed ordering. 244c204fe5SShiri Kuzin */ 254c204fe5SShiri Kuzin #ifdef RTE_ARCH_X86_64 264c204fe5SShiri Kuzin /** 274c204fe5SShiri Kuzin * This function returns processor identification and feature information 284c204fe5SShiri Kuzin * into the registers. 294c204fe5SShiri Kuzin * 304c204fe5SShiri Kuzin * @param eax, ebx, ecx, edx 314c204fe5SShiri Kuzin * Pointers to the registers that will hold cpu information. 324c204fe5SShiri Kuzin * @param level 334c204fe5SShiri Kuzin * The main category of information returned. 344c204fe5SShiri Kuzin */ 354c204fe5SShiri Kuzin static inline void mlx5_cpu_id(unsigned int level, 364c204fe5SShiri Kuzin unsigned int *eax, unsigned int *ebx, 374c204fe5SShiri Kuzin unsigned int *ecx, unsigned int *edx) 384c204fe5SShiri Kuzin { 394c204fe5SShiri Kuzin __asm__("cpuid\n\t" 404c204fe5SShiri Kuzin : "=a" (*eax), "=b" (*ebx), "=c" (*ecx), "=d" (*edx) 414c204fe5SShiri Kuzin : "0" (level)); 424c204fe5SShiri Kuzin } 434c204fe5SShiri Kuzin #endif 444c204fe5SShiri Kuzin 45eeded204SDavid Marchand RTE_LOG_REGISTER_DEFAULT(mlx5_common_logtype, NOTICE) 4683c99c36SThomas Monjalon 47ad435d32SXueming Li /* Head of list of drivers. */ 48ad435d32SXueming Li static TAILQ_HEAD(mlx5_drivers, mlx5_class_driver) drivers_list = 49ad435d32SXueming Li TAILQ_HEAD_INITIALIZER(drivers_list); 50ad435d32SXueming Li 51ad435d32SXueming Li /* Head of devices. */ 52ad435d32SXueming Li static TAILQ_HEAD(mlx5_devices, mlx5_common_device) devices_list = 53ad435d32SXueming Li TAILQ_HEAD_INITIALIZER(devices_list); 54ad435d32SXueming Li 55ad435d32SXueming Li static const struct { 56ad435d32SXueming Li const char *name; 57ad435d32SXueming Li unsigned int drv_class; 58ad435d32SXueming Li } mlx5_classes[] = { 59ad435d32SXueming Li { .name = "vdpa", .drv_class = MLX5_CLASS_VDPA }, 60ad435d32SXueming Li { .name = "eth", .drv_class = MLX5_CLASS_ETH }, 61ad435d32SXueming Li /* Keep class "net" for backward compatibility. */ 62ad435d32SXueming Li { .name = "net", .drv_class = MLX5_CLASS_ETH }, 63ad435d32SXueming Li { .name = "regex", .drv_class = MLX5_CLASS_REGEX }, 64ad435d32SXueming Li { .name = "compress", .drv_class = MLX5_CLASS_COMPRESS }, 65ad435d32SXueming Li { .name = "crypto", .drv_class = MLX5_CLASS_CRYPTO }, 66ad435d32SXueming Li }; 67ad435d32SXueming Li 68ad435d32SXueming Li static int 69ad435d32SXueming Li class_name_to_value(const char *class_name) 70ad435d32SXueming Li { 71ad435d32SXueming Li unsigned int i; 72ad435d32SXueming Li 73ad435d32SXueming Li for (i = 0; i < RTE_DIM(mlx5_classes); i++) { 74ad435d32SXueming Li if (strcmp(class_name, mlx5_classes[i].name) == 0) 75ad435d32SXueming Li return mlx5_classes[i].drv_class; 76ad435d32SXueming Li } 77ad435d32SXueming Li return -EINVAL; 78ad435d32SXueming Li } 79ad435d32SXueming Li 80ad435d32SXueming Li static struct mlx5_class_driver * 81ad435d32SXueming Li driver_get(uint32_t class) 82ad435d32SXueming Li { 83ad435d32SXueming Li struct mlx5_class_driver *driver; 84ad435d32SXueming Li 85ad435d32SXueming Li TAILQ_FOREACH(driver, &drivers_list, next) { 86ad435d32SXueming Li if ((uint32_t)driver->drv_class == class) 87ad435d32SXueming Li return driver; 88ad435d32SXueming Li } 89ad435d32SXueming Li return NULL; 90ad435d32SXueming Li } 91ad435d32SXueming Li 92ad435d32SXueming Li static int 93ad435d32SXueming Li devargs_class_handler(__rte_unused const char *key, 94ad435d32SXueming Li const char *class_names, void *opaque) 95ad435d32SXueming Li { 96ad435d32SXueming Li int *ret = opaque; 97ad435d32SXueming Li int class_val; 98ad435d32SXueming Li char *scratch; 99ad435d32SXueming Li char *found; 100ad435d32SXueming Li char *refstr = NULL; 101ad435d32SXueming Li 102ad435d32SXueming Li *ret = 0; 103ad435d32SXueming Li scratch = strdup(class_names); 104ad435d32SXueming Li if (scratch == NULL) { 105ad435d32SXueming Li *ret = -ENOMEM; 106ad435d32SXueming Li return *ret; 107ad435d32SXueming Li } 108ad435d32SXueming Li found = strtok_r(scratch, ":", &refstr); 109ad435d32SXueming Li if (found == NULL) 110ad435d32SXueming Li /* Empty string. */ 111ad435d32SXueming Li goto err; 112ad435d32SXueming Li do { 113ad435d32SXueming Li /* Extract each individual class name. Multiple 114ad435d32SXueming Li * classes can be supplied as class=net:regex:foo:bar. 115ad435d32SXueming Li */ 116ad435d32SXueming Li class_val = class_name_to_value(found); 117ad435d32SXueming Li /* Check if its a valid class. */ 118ad435d32SXueming Li if (class_val < 0) { 119ad435d32SXueming Li *ret = -EINVAL; 120ad435d32SXueming Li goto err; 121ad435d32SXueming Li } 122ad435d32SXueming Li *ret |= class_val; 123ad435d32SXueming Li found = strtok_r(NULL, ":", &refstr); 124ad435d32SXueming Li } while (found != NULL); 125ad435d32SXueming Li err: 126ad435d32SXueming Li free(scratch); 127ad435d32SXueming Li if (*ret < 0) 128ad435d32SXueming Li DRV_LOG(ERR, "Invalid mlx5 class options: %s.\n", class_names); 129ad435d32SXueming Li return *ret; 130ad435d32SXueming Li } 131ad435d32SXueming Li 132ad435d32SXueming Li static int 133ad435d32SXueming Li parse_class_options(const struct rte_devargs *devargs) 134ad435d32SXueming Li { 135ad435d32SXueming Li struct rte_kvargs *kvlist; 136ad435d32SXueming Li int ret = 0; 137ad435d32SXueming Li 138ad435d32SXueming Li if (devargs == NULL) 139ad435d32SXueming Li return 0; 140ad435d32SXueming Li if (devargs->cls != NULL && devargs->cls->name != NULL) 141ad435d32SXueming Li /* Global syntax, only one class type. */ 142ad435d32SXueming Li return class_name_to_value(devargs->cls->name); 143ad435d32SXueming Li /* Legacy devargs support multiple classes. */ 144ad435d32SXueming Li kvlist = rte_kvargs_parse(devargs->args, NULL); 145ad435d32SXueming Li if (kvlist == NULL) 146ad435d32SXueming Li return 0; 147ad435d32SXueming Li rte_kvargs_process(kvlist, RTE_DEVARGS_KEY_CLASS, 148ad435d32SXueming Li devargs_class_handler, &ret); 149ad435d32SXueming Li rte_kvargs_free(kvlist); 150ad435d32SXueming Li return ret; 151ad435d32SXueming Li } 152ad435d32SXueming Li 153ad435d32SXueming Li static const unsigned int mlx5_class_invalid_combinations[] = { 154ad435d32SXueming Li MLX5_CLASS_ETH | MLX5_CLASS_VDPA, 155ad435d32SXueming Li /* New class combination should be added here. */ 156ad435d32SXueming Li }; 157ad435d32SXueming Li 158ad435d32SXueming Li static int 159ad435d32SXueming Li is_valid_class_combination(uint32_t user_classes) 160ad435d32SXueming Li { 161ad435d32SXueming Li unsigned int i; 162ad435d32SXueming Li 163ad435d32SXueming Li /* Verify if user specified unsupported combination. */ 164ad435d32SXueming Li for (i = 0; i < RTE_DIM(mlx5_class_invalid_combinations); i++) { 165ad435d32SXueming Li if ((mlx5_class_invalid_combinations[i] & user_classes) == 166ad435d32SXueming Li mlx5_class_invalid_combinations[i]) 167ad435d32SXueming Li return -EINVAL; 168ad435d32SXueming Li } 169ad435d32SXueming Li /* Not found any invalid class combination. */ 170ad435d32SXueming Li return 0; 171ad435d32SXueming Li } 172ad435d32SXueming Li 173ad435d32SXueming Li static bool 174ad435d32SXueming Li device_class_enabled(const struct mlx5_common_device *device, uint32_t class) 175ad435d32SXueming Li { 176ad435d32SXueming Li return (device->classes_loaded & class) > 0; 177ad435d32SXueming Li } 178ad435d32SXueming Li 179ad435d32SXueming Li static bool 180ad435d32SXueming Li mlx5_bus_match(const struct mlx5_class_driver *drv, 181ad435d32SXueming Li const struct rte_device *dev) 182ad435d32SXueming Li { 183ad435d32SXueming Li if (mlx5_dev_is_pci(dev)) 184ad435d32SXueming Li return mlx5_dev_pci_match(drv, dev); 185ad435d32SXueming Li return true; 186ad435d32SXueming Li } 187ad435d32SXueming Li 188ad435d32SXueming Li static struct mlx5_common_device * 189ad435d32SXueming Li to_mlx5_device(const struct rte_device *rte_dev) 190ad435d32SXueming Li { 191ad435d32SXueming Li struct mlx5_common_device *dev; 192ad435d32SXueming Li 193ad435d32SXueming Li TAILQ_FOREACH(dev, &devices_list, next) { 194ad435d32SXueming Li if (rte_dev == dev->dev) 195ad435d32SXueming Li return dev; 196ad435d32SXueming Li } 197ad435d32SXueming Li return NULL; 198ad435d32SXueming Li } 199ad435d32SXueming Li 200*4d567938SThomas Monjalon int 201*4d567938SThomas Monjalon mlx5_dev_to_pci_str(const struct rte_device *dev, char *addr, size_t size) 202*4d567938SThomas Monjalon { 203*4d567938SThomas Monjalon struct rte_pci_addr pci_addr = { 0 }; 204*4d567938SThomas Monjalon int ret; 205*4d567938SThomas Monjalon 206*4d567938SThomas Monjalon if (mlx5_dev_is_pci(dev)) { 207*4d567938SThomas Monjalon /* Input might be <BDF>, format PCI address to <DBDF>. */ 208*4d567938SThomas Monjalon ret = rte_pci_addr_parse(dev->name, &pci_addr); 209*4d567938SThomas Monjalon if (ret != 0) 210*4d567938SThomas Monjalon return -ENODEV; 211*4d567938SThomas Monjalon rte_pci_device_name(&pci_addr, addr, size); 212*4d567938SThomas Monjalon return 0; 213*4d567938SThomas Monjalon } 214*4d567938SThomas Monjalon #ifdef RTE_EXEC_ENV_LINUX 215*4d567938SThomas Monjalon return mlx5_auxiliary_get_pci_str(RTE_DEV_TO_AUXILIARY_CONST(dev), 216*4d567938SThomas Monjalon addr, size); 217*4d567938SThomas Monjalon #else 218*4d567938SThomas Monjalon rte_errno = ENODEV; 219*4d567938SThomas Monjalon return -rte_errno; 220*4d567938SThomas Monjalon #endif 221*4d567938SThomas Monjalon } 222*4d567938SThomas Monjalon 223ad435d32SXueming Li static void 224ad435d32SXueming Li dev_release(struct mlx5_common_device *dev) 225ad435d32SXueming Li { 226ad435d32SXueming Li TAILQ_REMOVE(&devices_list, dev, next); 227ad435d32SXueming Li rte_free(dev); 228ad435d32SXueming Li } 229ad435d32SXueming Li 230ad435d32SXueming Li static int 231ad435d32SXueming Li drivers_remove(struct mlx5_common_device *dev, uint32_t enabled_classes) 232ad435d32SXueming Li { 233ad435d32SXueming Li struct mlx5_class_driver *driver; 234ad435d32SXueming Li int local_ret = -ENODEV; 235ad435d32SXueming Li unsigned int i = 0; 236ad435d32SXueming Li int ret = 0; 237ad435d32SXueming Li 238ad435d32SXueming Li enabled_classes &= dev->classes_loaded; 239ad435d32SXueming Li while (enabled_classes) { 240ad435d32SXueming Li driver = driver_get(RTE_BIT64(i)); 241ad435d32SXueming Li if (driver != NULL) { 242ad435d32SXueming Li local_ret = driver->remove(dev->dev); 243ad435d32SXueming Li if (local_ret == 0) 244ad435d32SXueming Li dev->classes_loaded &= ~RTE_BIT64(i); 245ad435d32SXueming Li else if (ret == 0) 246ad435d32SXueming Li ret = local_ret; 247ad435d32SXueming Li } 248ad435d32SXueming Li enabled_classes &= ~RTE_BIT64(i); 249ad435d32SXueming Li i++; 250ad435d32SXueming Li } 251ad435d32SXueming Li if (local_ret != 0 && ret == 0) 252ad435d32SXueming Li ret = local_ret; 253ad435d32SXueming Li return ret; 254ad435d32SXueming Li } 255ad435d32SXueming Li 256ad435d32SXueming Li static int 257ad435d32SXueming Li drivers_probe(struct mlx5_common_device *dev, uint32_t user_classes) 258ad435d32SXueming Li { 259ad435d32SXueming Li struct mlx5_class_driver *driver; 260ad435d32SXueming Li uint32_t enabled_classes = 0; 261ad435d32SXueming Li bool already_loaded; 262ad435d32SXueming Li int ret; 263ad435d32SXueming Li 264ad435d32SXueming Li TAILQ_FOREACH(driver, &drivers_list, next) { 265ad435d32SXueming Li if ((driver->drv_class & user_classes) == 0) 266ad435d32SXueming Li continue; 267ad435d32SXueming Li if (!mlx5_bus_match(driver, dev->dev)) 268ad435d32SXueming Li continue; 269ad435d32SXueming Li already_loaded = dev->classes_loaded & driver->drv_class; 270ad435d32SXueming Li if (already_loaded && driver->probe_again == 0) { 271ad435d32SXueming Li DRV_LOG(ERR, "Device %s is already probed", 272ad435d32SXueming Li dev->dev->name); 273ad435d32SXueming Li ret = -EEXIST; 274ad435d32SXueming Li goto probe_err; 275ad435d32SXueming Li } 276ad435d32SXueming Li ret = driver->probe(dev->dev); 277ad435d32SXueming Li if (ret < 0) { 278ad435d32SXueming Li DRV_LOG(ERR, "Failed to load driver %s", 279ad435d32SXueming Li driver->name); 280ad435d32SXueming Li goto probe_err; 281ad435d32SXueming Li } 282ad435d32SXueming Li enabled_classes |= driver->drv_class; 283ad435d32SXueming Li } 284ad435d32SXueming Li dev->classes_loaded |= enabled_classes; 285ad435d32SXueming Li return 0; 286ad435d32SXueming Li probe_err: 287ad435d32SXueming Li /* Only unload drivers which are enabled which were enabled 288ad435d32SXueming Li * in this probe instance. 289ad435d32SXueming Li */ 290ad435d32SXueming Li drivers_remove(dev, enabled_classes); 291ad435d32SXueming Li return ret; 292ad435d32SXueming Li } 293ad435d32SXueming Li 294ad435d32SXueming Li int 295ad435d32SXueming Li mlx5_common_dev_probe(struct rte_device *eal_dev) 296ad435d32SXueming Li { 297ad435d32SXueming Li struct mlx5_common_device *dev; 298ad435d32SXueming Li uint32_t classes = 0; 299ad435d32SXueming Li bool new_device = false; 300ad435d32SXueming Li int ret; 301ad435d32SXueming Li 302ad435d32SXueming Li DRV_LOG(INFO, "probe device \"%s\".", eal_dev->name); 303ad435d32SXueming Li ret = parse_class_options(eal_dev->devargs); 304ad435d32SXueming Li if (ret < 0) { 305ad435d32SXueming Li DRV_LOG(ERR, "Unsupported mlx5 class type: %s", 306ad435d32SXueming Li eal_dev->devargs->args); 307ad435d32SXueming Li return ret; 308ad435d32SXueming Li } 309ad435d32SXueming Li classes = ret; 310ad435d32SXueming Li if (classes == 0) 311ad435d32SXueming Li /* Default to net class. */ 312ad435d32SXueming Li classes = MLX5_CLASS_ETH; 313ad435d32SXueming Li dev = to_mlx5_device(eal_dev); 314ad435d32SXueming Li if (!dev) { 315ad435d32SXueming Li dev = rte_zmalloc("mlx5_common_device", sizeof(*dev), 0); 316ad435d32SXueming Li if (!dev) 317ad435d32SXueming Li return -ENOMEM; 318ad435d32SXueming Li dev->dev = eal_dev; 319ad435d32SXueming Li TAILQ_INSERT_HEAD(&devices_list, dev, next); 320ad435d32SXueming Li new_device = true; 321ad435d32SXueming Li } else { 322ad435d32SXueming Li /* Validate combination here. */ 323ad435d32SXueming Li ret = is_valid_class_combination(classes | 324ad435d32SXueming Li dev->classes_loaded); 325ad435d32SXueming Li if (ret != 0) { 326ad435d32SXueming Li DRV_LOG(ERR, "Unsupported mlx5 classes combination."); 327ad435d32SXueming Li return ret; 328ad435d32SXueming Li } 329ad435d32SXueming Li } 330ad435d32SXueming Li ret = drivers_probe(dev, classes); 331ad435d32SXueming Li if (ret) 332ad435d32SXueming Li goto class_err; 333ad435d32SXueming Li return 0; 334ad435d32SXueming Li class_err: 335ad435d32SXueming Li if (new_device) 336ad435d32SXueming Li dev_release(dev); 337ad435d32SXueming Li return ret; 338ad435d32SXueming Li } 339ad435d32SXueming Li 340ad435d32SXueming Li int 341ad435d32SXueming Li mlx5_common_dev_remove(struct rte_device *eal_dev) 342ad435d32SXueming Li { 343ad435d32SXueming Li struct mlx5_common_device *dev; 344ad435d32SXueming Li int ret; 345ad435d32SXueming Li 346ad435d32SXueming Li dev = to_mlx5_device(eal_dev); 347ad435d32SXueming Li if (!dev) 348ad435d32SXueming Li return -ENODEV; 349ad435d32SXueming Li /* Matching device found, cleanup and unload drivers. */ 350ad435d32SXueming Li ret = drivers_remove(dev, dev->classes_loaded); 351ad435d32SXueming Li if (ret != 0) 352ad435d32SXueming Li dev_release(dev); 353ad435d32SXueming Li return ret; 354ad435d32SXueming Li } 355ad435d32SXueming Li 356ad435d32SXueming Li int 357ad435d32SXueming Li mlx5_common_dev_dma_map(struct rte_device *dev, void *addr, uint64_t iova, 358ad435d32SXueming Li size_t len) 359ad435d32SXueming Li { 360ad435d32SXueming Li struct mlx5_class_driver *driver = NULL; 361ad435d32SXueming Li struct mlx5_class_driver *temp; 362ad435d32SXueming Li struct mlx5_common_device *mdev; 363ad435d32SXueming Li int ret = -EINVAL; 364ad435d32SXueming Li 365ad435d32SXueming Li mdev = to_mlx5_device(dev); 366ad435d32SXueming Li if (!mdev) 367ad435d32SXueming Li return -ENODEV; 368ad435d32SXueming Li TAILQ_FOREACH(driver, &drivers_list, next) { 369ad435d32SXueming Li if (!device_class_enabled(mdev, driver->drv_class) || 370ad435d32SXueming Li driver->dma_map == NULL) 371ad435d32SXueming Li continue; 372ad435d32SXueming Li ret = driver->dma_map(dev, addr, iova, len); 373ad435d32SXueming Li if (ret) 374ad435d32SXueming Li goto map_err; 375ad435d32SXueming Li } 376ad435d32SXueming Li return ret; 377ad435d32SXueming Li map_err: 378ad435d32SXueming Li TAILQ_FOREACH(temp, &drivers_list, next) { 379ad435d32SXueming Li if (temp == driver) 380ad435d32SXueming Li break; 381ad435d32SXueming Li if (device_class_enabled(mdev, temp->drv_class) && 382ad435d32SXueming Li temp->dma_map && temp->dma_unmap) 383ad435d32SXueming Li temp->dma_unmap(dev, addr, iova, len); 384ad435d32SXueming Li } 385ad435d32SXueming Li return ret; 386ad435d32SXueming Li } 387ad435d32SXueming Li 388ad435d32SXueming Li int 389ad435d32SXueming Li mlx5_common_dev_dma_unmap(struct rte_device *dev, void *addr, uint64_t iova, 390ad435d32SXueming Li size_t len) 391ad435d32SXueming Li { 392ad435d32SXueming Li struct mlx5_class_driver *driver; 393ad435d32SXueming Li struct mlx5_common_device *mdev; 394ad435d32SXueming Li int local_ret = -EINVAL; 395ad435d32SXueming Li int ret = 0; 396ad435d32SXueming Li 397ad435d32SXueming Li mdev = to_mlx5_device(dev); 398ad435d32SXueming Li if (!mdev) 399ad435d32SXueming Li return -ENODEV; 400ad435d32SXueming Li /* There is no unmap error recovery in current implementation. */ 401ad435d32SXueming Li TAILQ_FOREACH_REVERSE(driver, &drivers_list, mlx5_drivers, next) { 402ad435d32SXueming Li if (!device_class_enabled(mdev, driver->drv_class) || 403ad435d32SXueming Li driver->dma_unmap == NULL) 404ad435d32SXueming Li continue; 405ad435d32SXueming Li local_ret = driver->dma_unmap(dev, addr, iova, len); 406ad435d32SXueming Li if (local_ret && (ret == 0)) 407ad435d32SXueming Li ret = local_ret; 408ad435d32SXueming Li } 409ad435d32SXueming Li if (local_ret) 410ad435d32SXueming Li ret = local_ret; 411ad435d32SXueming Li return ret; 412ad435d32SXueming Li } 413ad435d32SXueming Li 414ad435d32SXueming Li void 415ad435d32SXueming Li mlx5_class_driver_register(struct mlx5_class_driver *driver) 416ad435d32SXueming Li { 417ad435d32SXueming Li mlx5_common_driver_on_register_pci(driver); 418ad435d32SXueming Li TAILQ_INSERT_TAIL(&drivers_list, driver, next); 419ad435d32SXueming Li } 420ad435d32SXueming Li 421ad435d32SXueming Li static void mlx5_common_driver_init(void) 422ad435d32SXueming Li { 423ad435d32SXueming Li mlx5_common_pci_init(); 424777b72a9SXueming Li #ifdef RTE_EXEC_ENV_LINUX 425777b72a9SXueming Li mlx5_common_auxiliary_init(); 426777b72a9SXueming Li #endif 427ad435d32SXueming Li } 428ad435d32SXueming Li 42982088001SParav Pandit static bool mlx5_common_initialized; 43082088001SParav Pandit 43183c99c36SThomas Monjalon /** 43282088001SParav Pandit * One time innitialization routine for run-time dependency on glue library 43382088001SParav Pandit * for multiple PMDs. Each mlx5 PMD that depends on mlx5_common module, 43482088001SParav Pandit * must invoke in its constructor. 43583c99c36SThomas Monjalon */ 43682088001SParav Pandit void 43782088001SParav Pandit mlx5_common_init(void) 43883c99c36SThomas Monjalon { 43982088001SParav Pandit if (mlx5_common_initialized) 44082088001SParav Pandit return; 44182088001SParav Pandit 44279aa4307SOphir Munk mlx5_glue_constructor(); 443ad435d32SXueming Li mlx5_common_driver_init(); 44482088001SParav Pandit mlx5_common_initialized = true; 4457b4f1e6bSMatan Azrad } 4464c204fe5SShiri Kuzin 4474c204fe5SShiri Kuzin /** 4484c204fe5SShiri Kuzin * This function is responsible of initializing the variable 4494c204fe5SShiri Kuzin * haswell_broadwell_cpu by checking if the cpu is intel 4504c204fe5SShiri Kuzin * and reading the data returned from mlx5_cpu_id(). 4514c204fe5SShiri Kuzin * since haswell and broadwell cpus don't have improved performance 4524c204fe5SShiri Kuzin * when using relaxed ordering we want to check the cpu type before 4534c204fe5SShiri Kuzin * before deciding whether to enable RO or not. 4544c204fe5SShiri Kuzin * if the cpu is haswell or broadwell the variable will be set to 1 4554c204fe5SShiri Kuzin * otherwise it will be 0. 4564c204fe5SShiri Kuzin */ 4574c204fe5SShiri Kuzin RTE_INIT_PRIO(mlx5_is_haswell_broadwell_cpu, LOG) 4584c204fe5SShiri Kuzin { 4594c204fe5SShiri Kuzin #ifdef RTE_ARCH_X86_64 4604c204fe5SShiri Kuzin unsigned int broadwell_models[4] = {0x3d, 0x47, 0x4F, 0x56}; 4614c204fe5SShiri Kuzin unsigned int haswell_models[4] = {0x3c, 0x3f, 0x45, 0x46}; 4624c204fe5SShiri Kuzin unsigned int i, model, family, brand_id, vendor; 4634c204fe5SShiri Kuzin unsigned int signature_intel_ebx = 0x756e6547; 4644c204fe5SShiri Kuzin unsigned int extended_model; 4654c204fe5SShiri Kuzin unsigned int eax = 0; 4664c204fe5SShiri Kuzin unsigned int ebx = 0; 4674c204fe5SShiri Kuzin unsigned int ecx = 0; 4684c204fe5SShiri Kuzin unsigned int edx = 0; 4694c204fe5SShiri Kuzin int max_level; 4704c204fe5SShiri Kuzin 4714c204fe5SShiri Kuzin mlx5_cpu_id(0, &eax, &ebx, &ecx, &edx); 4724c204fe5SShiri Kuzin vendor = ebx; 4734c204fe5SShiri Kuzin max_level = eax; 4744c204fe5SShiri Kuzin if (max_level < 1) { 4754c204fe5SShiri Kuzin haswell_broadwell_cpu = 0; 4764c204fe5SShiri Kuzin return; 4774c204fe5SShiri Kuzin } 4784c204fe5SShiri Kuzin mlx5_cpu_id(1, &eax, &ebx, &ecx, &edx); 4794c204fe5SShiri Kuzin model = (eax >> 4) & 0x0f; 4804c204fe5SShiri Kuzin family = (eax >> 8) & 0x0f; 4814c204fe5SShiri Kuzin brand_id = ebx & 0xff; 4824c204fe5SShiri Kuzin extended_model = (eax >> 12) & 0xf0; 4834c204fe5SShiri Kuzin /* Check if the processor is Haswell or Broadwell */ 4844c204fe5SShiri Kuzin if (vendor == signature_intel_ebx) { 4854c204fe5SShiri Kuzin if (family == 0x06) 4864c204fe5SShiri Kuzin model += extended_model; 4874c204fe5SShiri Kuzin if (brand_id == 0 && family == 0x6) { 4884c204fe5SShiri Kuzin for (i = 0; i < RTE_DIM(broadwell_models); i++) 4894c204fe5SShiri Kuzin if (model == broadwell_models[i]) { 4904c204fe5SShiri Kuzin haswell_broadwell_cpu = 1; 4914c204fe5SShiri Kuzin return; 4924c204fe5SShiri Kuzin } 4934c204fe5SShiri Kuzin for (i = 0; i < RTE_DIM(haswell_models); i++) 4944c204fe5SShiri Kuzin if (model == haswell_models[i]) { 4954c204fe5SShiri Kuzin haswell_broadwell_cpu = 1; 4964c204fe5SShiri Kuzin return; 4974c204fe5SShiri Kuzin } 4984c204fe5SShiri Kuzin } 4994c204fe5SShiri Kuzin } 5004c204fe5SShiri Kuzin #endif 5014c204fe5SShiri Kuzin haswell_broadwell_cpu = 0; 5024c204fe5SShiri Kuzin } 503262c7ad0SOri Kam 504262c7ad0SOri Kam /** 5059cc0e99cSViacheslav Ovsiienko * Allocate the User Access Region with DevX on specified device. 5069cc0e99cSViacheslav Ovsiienko * 5079cc0e99cSViacheslav Ovsiienko * @param [in] ctx 5089cc0e99cSViacheslav Ovsiienko * Infiniband device context to perform allocation on. 5099cc0e99cSViacheslav Ovsiienko * @param [in] mapping 5109cc0e99cSViacheslav Ovsiienko * MLX5DV_UAR_ALLOC_TYPE_BF - allocate as cached memory with write-combining 5119cc0e99cSViacheslav Ovsiienko * attributes (if supported by the host), the 5129cc0e99cSViacheslav Ovsiienko * writes to the UAR registers must be followed 5139cc0e99cSViacheslav Ovsiienko * by write memory barrier. 5149cc0e99cSViacheslav Ovsiienko * MLX5DV_UAR_ALLOC_TYPE_NC - allocate as non-cached nenory, all writes are 5159cc0e99cSViacheslav Ovsiienko * promoted to the registers immediately, no 5169cc0e99cSViacheslav Ovsiienko * memory barriers needed. 5179cc0e99cSViacheslav Ovsiienko * mapping < 0 - the first attempt is performed with MLX5DV_UAR_ALLOC_TYPE_BF, 5189cc0e99cSViacheslav Ovsiienko * if this fails the next attempt with MLX5DV_UAR_ALLOC_TYPE_NC 5199cc0e99cSViacheslav Ovsiienko * is performed. The drivers specifying negative values should 5209cc0e99cSViacheslav Ovsiienko * always provide the write memory barrier operation after UAR 5219cc0e99cSViacheslav Ovsiienko * register writings. 5229cc0e99cSViacheslav Ovsiienko * If there is no definitions for the MLX5DV_UAR_ALLOC_TYPE_xx (older rdma 5239cc0e99cSViacheslav Ovsiienko * library headers), the caller can specify 0. 5249cc0e99cSViacheslav Ovsiienko * 5259cc0e99cSViacheslav Ovsiienko * @return 5269cc0e99cSViacheslav Ovsiienko * UAR object pointer on success, NULL otherwise and rte_errno is set. 5279cc0e99cSViacheslav Ovsiienko */ 5289cc0e99cSViacheslav Ovsiienko void * 5299cc0e99cSViacheslav Ovsiienko mlx5_devx_alloc_uar(void *ctx, int mapping) 5309cc0e99cSViacheslav Ovsiienko { 5319cc0e99cSViacheslav Ovsiienko void *uar; 5329cc0e99cSViacheslav Ovsiienko uint32_t retry, uar_mapping; 5339cc0e99cSViacheslav Ovsiienko void *base_addr; 5349cc0e99cSViacheslav Ovsiienko 5359cc0e99cSViacheslav Ovsiienko for (retry = 0; retry < MLX5_ALLOC_UAR_RETRY; ++retry) { 5369cc0e99cSViacheslav Ovsiienko #ifdef MLX5DV_UAR_ALLOC_TYPE_NC 5379cc0e99cSViacheslav Ovsiienko /* Control the mapping type according to the settings. */ 5389cc0e99cSViacheslav Ovsiienko uar_mapping = (mapping < 0) ? 5399cc0e99cSViacheslav Ovsiienko MLX5DV_UAR_ALLOC_TYPE_NC : mapping; 5409cc0e99cSViacheslav Ovsiienko #else 5419cc0e99cSViacheslav Ovsiienko /* 5429cc0e99cSViacheslav Ovsiienko * It seems we have no way to control the memory mapping type 5439cc0e99cSViacheslav Ovsiienko * for the UAR, the default "Write-Combining" type is supposed. 5449cc0e99cSViacheslav Ovsiienko */ 5459cc0e99cSViacheslav Ovsiienko uar_mapping = 0; 5469cc0e99cSViacheslav Ovsiienko RTE_SET_USED(mapping); 5479cc0e99cSViacheslav Ovsiienko #endif 5489cc0e99cSViacheslav Ovsiienko uar = mlx5_glue->devx_alloc_uar(ctx, uar_mapping); 5499cc0e99cSViacheslav Ovsiienko #ifdef MLX5DV_UAR_ALLOC_TYPE_NC 5509cc0e99cSViacheslav Ovsiienko if (!uar && 5519cc0e99cSViacheslav Ovsiienko mapping < 0 && 5529cc0e99cSViacheslav Ovsiienko uar_mapping == MLX5DV_UAR_ALLOC_TYPE_BF) { 5539cc0e99cSViacheslav Ovsiienko /* 5549cc0e99cSViacheslav Ovsiienko * In some environments like virtual machine the 5559cc0e99cSViacheslav Ovsiienko * Write Combining mapped might be not supported and 5569cc0e99cSViacheslav Ovsiienko * UAR allocation fails. We tried "Non-Cached" mapping 5579cc0e99cSViacheslav Ovsiienko * for the case. 5589cc0e99cSViacheslav Ovsiienko */ 5599cc0e99cSViacheslav Ovsiienko DRV_LOG(WARNING, "Failed to allocate DevX UAR (BF)"); 5609cc0e99cSViacheslav Ovsiienko uar_mapping = MLX5DV_UAR_ALLOC_TYPE_NC; 5619cc0e99cSViacheslav Ovsiienko uar = mlx5_glue->devx_alloc_uar(ctx, uar_mapping); 5629cc0e99cSViacheslav Ovsiienko } else if (!uar && 5639cc0e99cSViacheslav Ovsiienko mapping < 0 && 5649cc0e99cSViacheslav Ovsiienko uar_mapping == MLX5DV_UAR_ALLOC_TYPE_NC) { 5659cc0e99cSViacheslav Ovsiienko /* 5669cc0e99cSViacheslav Ovsiienko * If Verbs/kernel does not support "Non-Cached" 5679cc0e99cSViacheslav Ovsiienko * try the "Write-Combining". 5689cc0e99cSViacheslav Ovsiienko */ 5699cc0e99cSViacheslav Ovsiienko DRV_LOG(WARNING, "Failed to allocate DevX UAR (NC)"); 5709cc0e99cSViacheslav Ovsiienko uar_mapping = MLX5DV_UAR_ALLOC_TYPE_BF; 5719cc0e99cSViacheslav Ovsiienko uar = mlx5_glue->devx_alloc_uar(ctx, uar_mapping); 5729cc0e99cSViacheslav Ovsiienko } 5739cc0e99cSViacheslav Ovsiienko #endif 5749cc0e99cSViacheslav Ovsiienko if (!uar) { 5759cc0e99cSViacheslav Ovsiienko DRV_LOG(ERR, "Failed to allocate DevX UAR (BF/NC)"); 5769cc0e99cSViacheslav Ovsiienko rte_errno = ENOMEM; 5779cc0e99cSViacheslav Ovsiienko goto exit; 5789cc0e99cSViacheslav Ovsiienko } 5799cc0e99cSViacheslav Ovsiienko base_addr = mlx5_os_get_devx_uar_base_addr(uar); 5809cc0e99cSViacheslav Ovsiienko if (base_addr) 5819cc0e99cSViacheslav Ovsiienko break; 5829cc0e99cSViacheslav Ovsiienko /* 5839cc0e99cSViacheslav Ovsiienko * The UARs are allocated by rdma_core within the 5849cc0e99cSViacheslav Ovsiienko * IB device context, on context closure all UARs 5859cc0e99cSViacheslav Ovsiienko * will be freed, should be no memory/object leakage. 5869cc0e99cSViacheslav Ovsiienko */ 5879cc0e99cSViacheslav Ovsiienko DRV_LOG(WARNING, "Retrying to allocate DevX UAR"); 5889cc0e99cSViacheslav Ovsiienko uar = NULL; 5899cc0e99cSViacheslav Ovsiienko } 5909cc0e99cSViacheslav Ovsiienko /* Check whether we finally succeeded with valid UAR allocation. */ 5919cc0e99cSViacheslav Ovsiienko if (!uar) { 5929cc0e99cSViacheslav Ovsiienko DRV_LOG(ERR, "Failed to allocate DevX UAR (NULL base)"); 5939cc0e99cSViacheslav Ovsiienko rte_errno = ENOMEM; 5949cc0e99cSViacheslav Ovsiienko } 5959cc0e99cSViacheslav Ovsiienko /* 5969cc0e99cSViacheslav Ovsiienko * Return void * instead of struct mlx5dv_devx_uar * 5979cc0e99cSViacheslav Ovsiienko * is for compatibility with older rdma-core library headers. 5989cc0e99cSViacheslav Ovsiienko */ 5999cc0e99cSViacheslav Ovsiienko exit: 6009cc0e99cSViacheslav Ovsiienko return uar; 6019cc0e99cSViacheslav Ovsiienko } 602ad435d32SXueming Li 603ad435d32SXueming Li RTE_PMD_EXPORT_NAME(mlx5_common_driver, __COUNTER__); 604