17b4f1e6bSMatan Azrad /* SPDX-License-Identifier: BSD-3-Clause 27b4f1e6bSMatan Azrad * Copyright 2019 Mellanox Technologies, Ltd 37b4f1e6bSMatan Azrad */ 47b4f1e6bSMatan Azrad 57b4f1e6bSMatan Azrad #include <unistd.h> 67b4f1e6bSMatan Azrad #include <string.h> 793e30982SMatan Azrad #include <stdio.h> 87b4f1e6bSMatan Azrad 97b4f1e6bSMatan Azrad #include <rte_errno.h> 10262c7ad0SOri Kam #include <rte_mempool.h> 11*ad435d32SXueming Li #include <rte_class.h> 12*ad435d32SXueming Li #include <rte_malloc.h> 137b4f1e6bSMatan Azrad 147b4f1e6bSMatan Azrad #include "mlx5_common.h" 15262c7ad0SOri Kam #include "mlx5_common_os.h" 1625245d5dSShiri Kuzin #include "mlx5_common_log.h" 178a41f4deSParav Pandit #include "mlx5_common_pci.h" 18*ad435d32SXueming Li #include "mlx5_common_private.h" 197b4f1e6bSMatan Azrad 204c204fe5SShiri Kuzin uint8_t haswell_broadwell_cpu; 214c204fe5SShiri Kuzin 224c204fe5SShiri Kuzin /* In case this is an x86_64 intel processor to check if 234c204fe5SShiri Kuzin * we should use relaxed ordering. 244c204fe5SShiri Kuzin */ 254c204fe5SShiri Kuzin #ifdef RTE_ARCH_X86_64 264c204fe5SShiri Kuzin /** 274c204fe5SShiri Kuzin * This function returns processor identification and feature information 284c204fe5SShiri Kuzin * into the registers. 294c204fe5SShiri Kuzin * 304c204fe5SShiri Kuzin * @param eax, ebx, ecx, edx 314c204fe5SShiri Kuzin * Pointers to the registers that will hold cpu information. 324c204fe5SShiri Kuzin * @param level 334c204fe5SShiri Kuzin * The main category of information returned. 344c204fe5SShiri Kuzin */ 354c204fe5SShiri Kuzin static inline void mlx5_cpu_id(unsigned int level, 364c204fe5SShiri Kuzin unsigned int *eax, unsigned int *ebx, 374c204fe5SShiri Kuzin unsigned int *ecx, unsigned int *edx) 384c204fe5SShiri Kuzin { 394c204fe5SShiri Kuzin __asm__("cpuid\n\t" 404c204fe5SShiri Kuzin : "=a" (*eax), "=b" (*ebx), "=c" (*ecx), "=d" (*edx) 414c204fe5SShiri Kuzin : "0" (level)); 424c204fe5SShiri Kuzin } 434c204fe5SShiri Kuzin #endif 444c204fe5SShiri Kuzin 45eeded204SDavid Marchand RTE_LOG_REGISTER_DEFAULT(mlx5_common_logtype, NOTICE) 4683c99c36SThomas Monjalon 47*ad435d32SXueming Li /* Head of list of drivers. */ 48*ad435d32SXueming Li static TAILQ_HEAD(mlx5_drivers, mlx5_class_driver) drivers_list = 49*ad435d32SXueming Li TAILQ_HEAD_INITIALIZER(drivers_list); 50*ad435d32SXueming Li 51*ad435d32SXueming Li /* Head of devices. */ 52*ad435d32SXueming Li static TAILQ_HEAD(mlx5_devices, mlx5_common_device) devices_list = 53*ad435d32SXueming Li TAILQ_HEAD_INITIALIZER(devices_list); 54*ad435d32SXueming Li 55*ad435d32SXueming Li static const struct { 56*ad435d32SXueming Li const char *name; 57*ad435d32SXueming Li unsigned int drv_class; 58*ad435d32SXueming Li } mlx5_classes[] = { 59*ad435d32SXueming Li { .name = "vdpa", .drv_class = MLX5_CLASS_VDPA }, 60*ad435d32SXueming Li { .name = "eth", .drv_class = MLX5_CLASS_ETH }, 61*ad435d32SXueming Li /* Keep class "net" for backward compatibility. */ 62*ad435d32SXueming Li { .name = "net", .drv_class = MLX5_CLASS_ETH }, 63*ad435d32SXueming Li { .name = "regex", .drv_class = MLX5_CLASS_REGEX }, 64*ad435d32SXueming Li { .name = "compress", .drv_class = MLX5_CLASS_COMPRESS }, 65*ad435d32SXueming Li { .name = "crypto", .drv_class = MLX5_CLASS_CRYPTO }, 66*ad435d32SXueming Li }; 67*ad435d32SXueming Li 68*ad435d32SXueming Li static int 69*ad435d32SXueming Li class_name_to_value(const char *class_name) 70*ad435d32SXueming Li { 71*ad435d32SXueming Li unsigned int i; 72*ad435d32SXueming Li 73*ad435d32SXueming Li for (i = 0; i < RTE_DIM(mlx5_classes); i++) { 74*ad435d32SXueming Li if (strcmp(class_name, mlx5_classes[i].name) == 0) 75*ad435d32SXueming Li return mlx5_classes[i].drv_class; 76*ad435d32SXueming Li } 77*ad435d32SXueming Li return -EINVAL; 78*ad435d32SXueming Li } 79*ad435d32SXueming Li 80*ad435d32SXueming Li static struct mlx5_class_driver * 81*ad435d32SXueming Li driver_get(uint32_t class) 82*ad435d32SXueming Li { 83*ad435d32SXueming Li struct mlx5_class_driver *driver; 84*ad435d32SXueming Li 85*ad435d32SXueming Li TAILQ_FOREACH(driver, &drivers_list, next) { 86*ad435d32SXueming Li if ((uint32_t)driver->drv_class == class) 87*ad435d32SXueming Li return driver; 88*ad435d32SXueming Li } 89*ad435d32SXueming Li return NULL; 90*ad435d32SXueming Li } 91*ad435d32SXueming Li 92*ad435d32SXueming Li static int 93*ad435d32SXueming Li devargs_class_handler(__rte_unused const char *key, 94*ad435d32SXueming Li const char *class_names, void *opaque) 95*ad435d32SXueming Li { 96*ad435d32SXueming Li int *ret = opaque; 97*ad435d32SXueming Li int class_val; 98*ad435d32SXueming Li char *scratch; 99*ad435d32SXueming Li char *found; 100*ad435d32SXueming Li char *refstr = NULL; 101*ad435d32SXueming Li 102*ad435d32SXueming Li *ret = 0; 103*ad435d32SXueming Li scratch = strdup(class_names); 104*ad435d32SXueming Li if (scratch == NULL) { 105*ad435d32SXueming Li *ret = -ENOMEM; 106*ad435d32SXueming Li return *ret; 107*ad435d32SXueming Li } 108*ad435d32SXueming Li found = strtok_r(scratch, ":", &refstr); 109*ad435d32SXueming Li if (found == NULL) 110*ad435d32SXueming Li /* Empty string. */ 111*ad435d32SXueming Li goto err; 112*ad435d32SXueming Li do { 113*ad435d32SXueming Li /* Extract each individual class name. Multiple 114*ad435d32SXueming Li * classes can be supplied as class=net:regex:foo:bar. 115*ad435d32SXueming Li */ 116*ad435d32SXueming Li class_val = class_name_to_value(found); 117*ad435d32SXueming Li /* Check if its a valid class. */ 118*ad435d32SXueming Li if (class_val < 0) { 119*ad435d32SXueming Li *ret = -EINVAL; 120*ad435d32SXueming Li goto err; 121*ad435d32SXueming Li } 122*ad435d32SXueming Li *ret |= class_val; 123*ad435d32SXueming Li found = strtok_r(NULL, ":", &refstr); 124*ad435d32SXueming Li } while (found != NULL); 125*ad435d32SXueming Li err: 126*ad435d32SXueming Li free(scratch); 127*ad435d32SXueming Li if (*ret < 0) 128*ad435d32SXueming Li DRV_LOG(ERR, "Invalid mlx5 class options: %s.\n", class_names); 129*ad435d32SXueming Li return *ret; 130*ad435d32SXueming Li } 131*ad435d32SXueming Li 132*ad435d32SXueming Li static int 133*ad435d32SXueming Li parse_class_options(const struct rte_devargs *devargs) 134*ad435d32SXueming Li { 135*ad435d32SXueming Li struct rte_kvargs *kvlist; 136*ad435d32SXueming Li int ret = 0; 137*ad435d32SXueming Li 138*ad435d32SXueming Li if (devargs == NULL) 139*ad435d32SXueming Li return 0; 140*ad435d32SXueming Li if (devargs->cls != NULL && devargs->cls->name != NULL) 141*ad435d32SXueming Li /* Global syntax, only one class type. */ 142*ad435d32SXueming Li return class_name_to_value(devargs->cls->name); 143*ad435d32SXueming Li /* Legacy devargs support multiple classes. */ 144*ad435d32SXueming Li kvlist = rte_kvargs_parse(devargs->args, NULL); 145*ad435d32SXueming Li if (kvlist == NULL) 146*ad435d32SXueming Li return 0; 147*ad435d32SXueming Li rte_kvargs_process(kvlist, RTE_DEVARGS_KEY_CLASS, 148*ad435d32SXueming Li devargs_class_handler, &ret); 149*ad435d32SXueming Li rte_kvargs_free(kvlist); 150*ad435d32SXueming Li return ret; 151*ad435d32SXueming Li } 152*ad435d32SXueming Li 153*ad435d32SXueming Li static const unsigned int mlx5_class_invalid_combinations[] = { 154*ad435d32SXueming Li MLX5_CLASS_ETH | MLX5_CLASS_VDPA, 155*ad435d32SXueming Li /* New class combination should be added here. */ 156*ad435d32SXueming Li }; 157*ad435d32SXueming Li 158*ad435d32SXueming Li static int 159*ad435d32SXueming Li is_valid_class_combination(uint32_t user_classes) 160*ad435d32SXueming Li { 161*ad435d32SXueming Li unsigned int i; 162*ad435d32SXueming Li 163*ad435d32SXueming Li /* Verify if user specified unsupported combination. */ 164*ad435d32SXueming Li for (i = 0; i < RTE_DIM(mlx5_class_invalid_combinations); i++) { 165*ad435d32SXueming Li if ((mlx5_class_invalid_combinations[i] & user_classes) == 166*ad435d32SXueming Li mlx5_class_invalid_combinations[i]) 167*ad435d32SXueming Li return -EINVAL; 168*ad435d32SXueming Li } 169*ad435d32SXueming Li /* Not found any invalid class combination. */ 170*ad435d32SXueming Li return 0; 171*ad435d32SXueming Li } 172*ad435d32SXueming Li 173*ad435d32SXueming Li static bool 174*ad435d32SXueming Li device_class_enabled(const struct mlx5_common_device *device, uint32_t class) 175*ad435d32SXueming Li { 176*ad435d32SXueming Li return (device->classes_loaded & class) > 0; 177*ad435d32SXueming Li } 178*ad435d32SXueming Li 179*ad435d32SXueming Li static bool 180*ad435d32SXueming Li mlx5_bus_match(const struct mlx5_class_driver *drv, 181*ad435d32SXueming Li const struct rte_device *dev) 182*ad435d32SXueming Li { 183*ad435d32SXueming Li if (mlx5_dev_is_pci(dev)) 184*ad435d32SXueming Li return mlx5_dev_pci_match(drv, dev); 185*ad435d32SXueming Li return true; 186*ad435d32SXueming Li } 187*ad435d32SXueming Li 188*ad435d32SXueming Li static struct mlx5_common_device * 189*ad435d32SXueming Li to_mlx5_device(const struct rte_device *rte_dev) 190*ad435d32SXueming Li { 191*ad435d32SXueming Li struct mlx5_common_device *dev; 192*ad435d32SXueming Li 193*ad435d32SXueming Li TAILQ_FOREACH(dev, &devices_list, next) { 194*ad435d32SXueming Li if (rte_dev == dev->dev) 195*ad435d32SXueming Li return dev; 196*ad435d32SXueming Li } 197*ad435d32SXueming Li return NULL; 198*ad435d32SXueming Li } 199*ad435d32SXueming Li 200*ad435d32SXueming Li static void 201*ad435d32SXueming Li dev_release(struct mlx5_common_device *dev) 202*ad435d32SXueming Li { 203*ad435d32SXueming Li TAILQ_REMOVE(&devices_list, dev, next); 204*ad435d32SXueming Li rte_free(dev); 205*ad435d32SXueming Li } 206*ad435d32SXueming Li 207*ad435d32SXueming Li static int 208*ad435d32SXueming Li drivers_remove(struct mlx5_common_device *dev, uint32_t enabled_classes) 209*ad435d32SXueming Li { 210*ad435d32SXueming Li struct mlx5_class_driver *driver; 211*ad435d32SXueming Li int local_ret = -ENODEV; 212*ad435d32SXueming Li unsigned int i = 0; 213*ad435d32SXueming Li int ret = 0; 214*ad435d32SXueming Li 215*ad435d32SXueming Li enabled_classes &= dev->classes_loaded; 216*ad435d32SXueming Li while (enabled_classes) { 217*ad435d32SXueming Li driver = driver_get(RTE_BIT64(i)); 218*ad435d32SXueming Li if (driver != NULL) { 219*ad435d32SXueming Li local_ret = driver->remove(dev->dev); 220*ad435d32SXueming Li if (local_ret == 0) 221*ad435d32SXueming Li dev->classes_loaded &= ~RTE_BIT64(i); 222*ad435d32SXueming Li else if (ret == 0) 223*ad435d32SXueming Li ret = local_ret; 224*ad435d32SXueming Li } 225*ad435d32SXueming Li enabled_classes &= ~RTE_BIT64(i); 226*ad435d32SXueming Li i++; 227*ad435d32SXueming Li } 228*ad435d32SXueming Li if (local_ret != 0 && ret == 0) 229*ad435d32SXueming Li ret = local_ret; 230*ad435d32SXueming Li return ret; 231*ad435d32SXueming Li } 232*ad435d32SXueming Li 233*ad435d32SXueming Li static int 234*ad435d32SXueming Li drivers_probe(struct mlx5_common_device *dev, uint32_t user_classes) 235*ad435d32SXueming Li { 236*ad435d32SXueming Li struct mlx5_class_driver *driver; 237*ad435d32SXueming Li uint32_t enabled_classes = 0; 238*ad435d32SXueming Li bool already_loaded; 239*ad435d32SXueming Li int ret; 240*ad435d32SXueming Li 241*ad435d32SXueming Li TAILQ_FOREACH(driver, &drivers_list, next) { 242*ad435d32SXueming Li if ((driver->drv_class & user_classes) == 0) 243*ad435d32SXueming Li continue; 244*ad435d32SXueming Li if (!mlx5_bus_match(driver, dev->dev)) 245*ad435d32SXueming Li continue; 246*ad435d32SXueming Li already_loaded = dev->classes_loaded & driver->drv_class; 247*ad435d32SXueming Li if (already_loaded && driver->probe_again == 0) { 248*ad435d32SXueming Li DRV_LOG(ERR, "Device %s is already probed", 249*ad435d32SXueming Li dev->dev->name); 250*ad435d32SXueming Li ret = -EEXIST; 251*ad435d32SXueming Li goto probe_err; 252*ad435d32SXueming Li } 253*ad435d32SXueming Li ret = driver->probe(dev->dev); 254*ad435d32SXueming Li if (ret < 0) { 255*ad435d32SXueming Li DRV_LOG(ERR, "Failed to load driver %s", 256*ad435d32SXueming Li driver->name); 257*ad435d32SXueming Li goto probe_err; 258*ad435d32SXueming Li } 259*ad435d32SXueming Li enabled_classes |= driver->drv_class; 260*ad435d32SXueming Li } 261*ad435d32SXueming Li dev->classes_loaded |= enabled_classes; 262*ad435d32SXueming Li return 0; 263*ad435d32SXueming Li probe_err: 264*ad435d32SXueming Li /* Only unload drivers which are enabled which were enabled 265*ad435d32SXueming Li * in this probe instance. 266*ad435d32SXueming Li */ 267*ad435d32SXueming Li drivers_remove(dev, enabled_classes); 268*ad435d32SXueming Li return ret; 269*ad435d32SXueming Li } 270*ad435d32SXueming Li 271*ad435d32SXueming Li int 272*ad435d32SXueming Li mlx5_common_dev_probe(struct rte_device *eal_dev) 273*ad435d32SXueming Li { 274*ad435d32SXueming Li struct mlx5_common_device *dev; 275*ad435d32SXueming Li uint32_t classes = 0; 276*ad435d32SXueming Li bool new_device = false; 277*ad435d32SXueming Li int ret; 278*ad435d32SXueming Li 279*ad435d32SXueming Li DRV_LOG(INFO, "probe device \"%s\".", eal_dev->name); 280*ad435d32SXueming Li ret = parse_class_options(eal_dev->devargs); 281*ad435d32SXueming Li if (ret < 0) { 282*ad435d32SXueming Li DRV_LOG(ERR, "Unsupported mlx5 class type: %s", 283*ad435d32SXueming Li eal_dev->devargs->args); 284*ad435d32SXueming Li return ret; 285*ad435d32SXueming Li } 286*ad435d32SXueming Li classes = ret; 287*ad435d32SXueming Li if (classes == 0) 288*ad435d32SXueming Li /* Default to net class. */ 289*ad435d32SXueming Li classes = MLX5_CLASS_ETH; 290*ad435d32SXueming Li dev = to_mlx5_device(eal_dev); 291*ad435d32SXueming Li if (!dev) { 292*ad435d32SXueming Li dev = rte_zmalloc("mlx5_common_device", sizeof(*dev), 0); 293*ad435d32SXueming Li if (!dev) 294*ad435d32SXueming Li return -ENOMEM; 295*ad435d32SXueming Li dev->dev = eal_dev; 296*ad435d32SXueming Li TAILQ_INSERT_HEAD(&devices_list, dev, next); 297*ad435d32SXueming Li new_device = true; 298*ad435d32SXueming Li } else { 299*ad435d32SXueming Li /* Validate combination here. */ 300*ad435d32SXueming Li ret = is_valid_class_combination(classes | 301*ad435d32SXueming Li dev->classes_loaded); 302*ad435d32SXueming Li if (ret != 0) { 303*ad435d32SXueming Li DRV_LOG(ERR, "Unsupported mlx5 classes combination."); 304*ad435d32SXueming Li return ret; 305*ad435d32SXueming Li } 306*ad435d32SXueming Li } 307*ad435d32SXueming Li ret = drivers_probe(dev, classes); 308*ad435d32SXueming Li if (ret) 309*ad435d32SXueming Li goto class_err; 310*ad435d32SXueming Li return 0; 311*ad435d32SXueming Li class_err: 312*ad435d32SXueming Li if (new_device) 313*ad435d32SXueming Li dev_release(dev); 314*ad435d32SXueming Li return ret; 315*ad435d32SXueming Li } 316*ad435d32SXueming Li 317*ad435d32SXueming Li int 318*ad435d32SXueming Li mlx5_common_dev_remove(struct rte_device *eal_dev) 319*ad435d32SXueming Li { 320*ad435d32SXueming Li struct mlx5_common_device *dev; 321*ad435d32SXueming Li int ret; 322*ad435d32SXueming Li 323*ad435d32SXueming Li dev = to_mlx5_device(eal_dev); 324*ad435d32SXueming Li if (!dev) 325*ad435d32SXueming Li return -ENODEV; 326*ad435d32SXueming Li /* Matching device found, cleanup and unload drivers. */ 327*ad435d32SXueming Li ret = drivers_remove(dev, dev->classes_loaded); 328*ad435d32SXueming Li if (ret != 0) 329*ad435d32SXueming Li dev_release(dev); 330*ad435d32SXueming Li return ret; 331*ad435d32SXueming Li } 332*ad435d32SXueming Li 333*ad435d32SXueming Li int 334*ad435d32SXueming Li mlx5_common_dev_dma_map(struct rte_device *dev, void *addr, uint64_t iova, 335*ad435d32SXueming Li size_t len) 336*ad435d32SXueming Li { 337*ad435d32SXueming Li struct mlx5_class_driver *driver = NULL; 338*ad435d32SXueming Li struct mlx5_class_driver *temp; 339*ad435d32SXueming Li struct mlx5_common_device *mdev; 340*ad435d32SXueming Li int ret = -EINVAL; 341*ad435d32SXueming Li 342*ad435d32SXueming Li mdev = to_mlx5_device(dev); 343*ad435d32SXueming Li if (!mdev) 344*ad435d32SXueming Li return -ENODEV; 345*ad435d32SXueming Li TAILQ_FOREACH(driver, &drivers_list, next) { 346*ad435d32SXueming Li if (!device_class_enabled(mdev, driver->drv_class) || 347*ad435d32SXueming Li driver->dma_map == NULL) 348*ad435d32SXueming Li continue; 349*ad435d32SXueming Li ret = driver->dma_map(dev, addr, iova, len); 350*ad435d32SXueming Li if (ret) 351*ad435d32SXueming Li goto map_err; 352*ad435d32SXueming Li } 353*ad435d32SXueming Li return ret; 354*ad435d32SXueming Li map_err: 355*ad435d32SXueming Li TAILQ_FOREACH(temp, &drivers_list, next) { 356*ad435d32SXueming Li if (temp == driver) 357*ad435d32SXueming Li break; 358*ad435d32SXueming Li if (device_class_enabled(mdev, temp->drv_class) && 359*ad435d32SXueming Li temp->dma_map && temp->dma_unmap) 360*ad435d32SXueming Li temp->dma_unmap(dev, addr, iova, len); 361*ad435d32SXueming Li } 362*ad435d32SXueming Li return ret; 363*ad435d32SXueming Li } 364*ad435d32SXueming Li 365*ad435d32SXueming Li int 366*ad435d32SXueming Li mlx5_common_dev_dma_unmap(struct rte_device *dev, void *addr, uint64_t iova, 367*ad435d32SXueming Li size_t len) 368*ad435d32SXueming Li { 369*ad435d32SXueming Li struct mlx5_class_driver *driver; 370*ad435d32SXueming Li struct mlx5_common_device *mdev; 371*ad435d32SXueming Li int local_ret = -EINVAL; 372*ad435d32SXueming Li int ret = 0; 373*ad435d32SXueming Li 374*ad435d32SXueming Li mdev = to_mlx5_device(dev); 375*ad435d32SXueming Li if (!mdev) 376*ad435d32SXueming Li return -ENODEV; 377*ad435d32SXueming Li /* There is no unmap error recovery in current implementation. */ 378*ad435d32SXueming Li TAILQ_FOREACH_REVERSE(driver, &drivers_list, mlx5_drivers, next) { 379*ad435d32SXueming Li if (!device_class_enabled(mdev, driver->drv_class) || 380*ad435d32SXueming Li driver->dma_unmap == NULL) 381*ad435d32SXueming Li continue; 382*ad435d32SXueming Li local_ret = driver->dma_unmap(dev, addr, iova, len); 383*ad435d32SXueming Li if (local_ret && (ret == 0)) 384*ad435d32SXueming Li ret = local_ret; 385*ad435d32SXueming Li } 386*ad435d32SXueming Li if (local_ret) 387*ad435d32SXueming Li ret = local_ret; 388*ad435d32SXueming Li return ret; 389*ad435d32SXueming Li } 390*ad435d32SXueming Li 391*ad435d32SXueming Li void 392*ad435d32SXueming Li mlx5_class_driver_register(struct mlx5_class_driver *driver) 393*ad435d32SXueming Li { 394*ad435d32SXueming Li mlx5_common_driver_on_register_pci(driver); 395*ad435d32SXueming Li TAILQ_INSERT_TAIL(&drivers_list, driver, next); 396*ad435d32SXueming Li } 397*ad435d32SXueming Li 398*ad435d32SXueming Li static void mlx5_common_driver_init(void) 399*ad435d32SXueming Li { 400*ad435d32SXueming Li mlx5_common_pci_init(); 401*ad435d32SXueming Li } 402*ad435d32SXueming Li 40382088001SParav Pandit static bool mlx5_common_initialized; 40482088001SParav Pandit 40583c99c36SThomas Monjalon /** 40682088001SParav Pandit * One time innitialization routine for run-time dependency on glue library 40782088001SParav Pandit * for multiple PMDs. Each mlx5 PMD that depends on mlx5_common module, 40882088001SParav Pandit * must invoke in its constructor. 40983c99c36SThomas Monjalon */ 41082088001SParav Pandit void 41182088001SParav Pandit mlx5_common_init(void) 41283c99c36SThomas Monjalon { 41382088001SParav Pandit if (mlx5_common_initialized) 41482088001SParav Pandit return; 41582088001SParav Pandit 41679aa4307SOphir Munk mlx5_glue_constructor(); 417*ad435d32SXueming Li mlx5_common_driver_init(); 41882088001SParav Pandit mlx5_common_initialized = true; 4197b4f1e6bSMatan Azrad } 4204c204fe5SShiri Kuzin 4214c204fe5SShiri Kuzin /** 4224c204fe5SShiri Kuzin * This function is responsible of initializing the variable 4234c204fe5SShiri Kuzin * haswell_broadwell_cpu by checking if the cpu is intel 4244c204fe5SShiri Kuzin * and reading the data returned from mlx5_cpu_id(). 4254c204fe5SShiri Kuzin * since haswell and broadwell cpus don't have improved performance 4264c204fe5SShiri Kuzin * when using relaxed ordering we want to check the cpu type before 4274c204fe5SShiri Kuzin * before deciding whether to enable RO or not. 4284c204fe5SShiri Kuzin * if the cpu is haswell or broadwell the variable will be set to 1 4294c204fe5SShiri Kuzin * otherwise it will be 0. 4304c204fe5SShiri Kuzin */ 4314c204fe5SShiri Kuzin RTE_INIT_PRIO(mlx5_is_haswell_broadwell_cpu, LOG) 4324c204fe5SShiri Kuzin { 4334c204fe5SShiri Kuzin #ifdef RTE_ARCH_X86_64 4344c204fe5SShiri Kuzin unsigned int broadwell_models[4] = {0x3d, 0x47, 0x4F, 0x56}; 4354c204fe5SShiri Kuzin unsigned int haswell_models[4] = {0x3c, 0x3f, 0x45, 0x46}; 4364c204fe5SShiri Kuzin unsigned int i, model, family, brand_id, vendor; 4374c204fe5SShiri Kuzin unsigned int signature_intel_ebx = 0x756e6547; 4384c204fe5SShiri Kuzin unsigned int extended_model; 4394c204fe5SShiri Kuzin unsigned int eax = 0; 4404c204fe5SShiri Kuzin unsigned int ebx = 0; 4414c204fe5SShiri Kuzin unsigned int ecx = 0; 4424c204fe5SShiri Kuzin unsigned int edx = 0; 4434c204fe5SShiri Kuzin int max_level; 4444c204fe5SShiri Kuzin 4454c204fe5SShiri Kuzin mlx5_cpu_id(0, &eax, &ebx, &ecx, &edx); 4464c204fe5SShiri Kuzin vendor = ebx; 4474c204fe5SShiri Kuzin max_level = eax; 4484c204fe5SShiri Kuzin if (max_level < 1) { 4494c204fe5SShiri Kuzin haswell_broadwell_cpu = 0; 4504c204fe5SShiri Kuzin return; 4514c204fe5SShiri Kuzin } 4524c204fe5SShiri Kuzin mlx5_cpu_id(1, &eax, &ebx, &ecx, &edx); 4534c204fe5SShiri Kuzin model = (eax >> 4) & 0x0f; 4544c204fe5SShiri Kuzin family = (eax >> 8) & 0x0f; 4554c204fe5SShiri Kuzin brand_id = ebx & 0xff; 4564c204fe5SShiri Kuzin extended_model = (eax >> 12) & 0xf0; 4574c204fe5SShiri Kuzin /* Check if the processor is Haswell or Broadwell */ 4584c204fe5SShiri Kuzin if (vendor == signature_intel_ebx) { 4594c204fe5SShiri Kuzin if (family == 0x06) 4604c204fe5SShiri Kuzin model += extended_model; 4614c204fe5SShiri Kuzin if (brand_id == 0 && family == 0x6) { 4624c204fe5SShiri Kuzin for (i = 0; i < RTE_DIM(broadwell_models); i++) 4634c204fe5SShiri Kuzin if (model == broadwell_models[i]) { 4644c204fe5SShiri Kuzin haswell_broadwell_cpu = 1; 4654c204fe5SShiri Kuzin return; 4664c204fe5SShiri Kuzin } 4674c204fe5SShiri Kuzin for (i = 0; i < RTE_DIM(haswell_models); i++) 4684c204fe5SShiri Kuzin if (model == haswell_models[i]) { 4694c204fe5SShiri Kuzin haswell_broadwell_cpu = 1; 4704c204fe5SShiri Kuzin return; 4714c204fe5SShiri Kuzin } 4724c204fe5SShiri Kuzin } 4734c204fe5SShiri Kuzin } 4744c204fe5SShiri Kuzin #endif 4754c204fe5SShiri Kuzin haswell_broadwell_cpu = 0; 4764c204fe5SShiri Kuzin } 477262c7ad0SOri Kam 478262c7ad0SOri Kam /** 4799cc0e99cSViacheslav Ovsiienko * Allocate the User Access Region with DevX on specified device. 4809cc0e99cSViacheslav Ovsiienko * 4819cc0e99cSViacheslav Ovsiienko * @param [in] ctx 4829cc0e99cSViacheslav Ovsiienko * Infiniband device context to perform allocation on. 4839cc0e99cSViacheslav Ovsiienko * @param [in] mapping 4849cc0e99cSViacheslav Ovsiienko * MLX5DV_UAR_ALLOC_TYPE_BF - allocate as cached memory with write-combining 4859cc0e99cSViacheslav Ovsiienko * attributes (if supported by the host), the 4869cc0e99cSViacheslav Ovsiienko * writes to the UAR registers must be followed 4879cc0e99cSViacheslav Ovsiienko * by write memory barrier. 4889cc0e99cSViacheslav Ovsiienko * MLX5DV_UAR_ALLOC_TYPE_NC - allocate as non-cached nenory, all writes are 4899cc0e99cSViacheslav Ovsiienko * promoted to the registers immediately, no 4909cc0e99cSViacheslav Ovsiienko * memory barriers needed. 4919cc0e99cSViacheslav Ovsiienko * mapping < 0 - the first attempt is performed with MLX5DV_UAR_ALLOC_TYPE_BF, 4929cc0e99cSViacheslav Ovsiienko * if this fails the next attempt with MLX5DV_UAR_ALLOC_TYPE_NC 4939cc0e99cSViacheslav Ovsiienko * is performed. The drivers specifying negative values should 4949cc0e99cSViacheslav Ovsiienko * always provide the write memory barrier operation after UAR 4959cc0e99cSViacheslav Ovsiienko * register writings. 4969cc0e99cSViacheslav Ovsiienko * If there is no definitions for the MLX5DV_UAR_ALLOC_TYPE_xx (older rdma 4979cc0e99cSViacheslav Ovsiienko * library headers), the caller can specify 0. 4989cc0e99cSViacheslav Ovsiienko * 4999cc0e99cSViacheslav Ovsiienko * @return 5009cc0e99cSViacheslav Ovsiienko * UAR object pointer on success, NULL otherwise and rte_errno is set. 5019cc0e99cSViacheslav Ovsiienko */ 5029cc0e99cSViacheslav Ovsiienko void * 5039cc0e99cSViacheslav Ovsiienko mlx5_devx_alloc_uar(void *ctx, int mapping) 5049cc0e99cSViacheslav Ovsiienko { 5059cc0e99cSViacheslav Ovsiienko void *uar; 5069cc0e99cSViacheslav Ovsiienko uint32_t retry, uar_mapping; 5079cc0e99cSViacheslav Ovsiienko void *base_addr; 5089cc0e99cSViacheslav Ovsiienko 5099cc0e99cSViacheslav Ovsiienko for (retry = 0; retry < MLX5_ALLOC_UAR_RETRY; ++retry) { 5109cc0e99cSViacheslav Ovsiienko #ifdef MLX5DV_UAR_ALLOC_TYPE_NC 5119cc0e99cSViacheslav Ovsiienko /* Control the mapping type according to the settings. */ 5129cc0e99cSViacheslav Ovsiienko uar_mapping = (mapping < 0) ? 5139cc0e99cSViacheslav Ovsiienko MLX5DV_UAR_ALLOC_TYPE_NC : mapping; 5149cc0e99cSViacheslav Ovsiienko #else 5159cc0e99cSViacheslav Ovsiienko /* 5169cc0e99cSViacheslav Ovsiienko * It seems we have no way to control the memory mapping type 5179cc0e99cSViacheslav Ovsiienko * for the UAR, the default "Write-Combining" type is supposed. 5189cc0e99cSViacheslav Ovsiienko */ 5199cc0e99cSViacheslav Ovsiienko uar_mapping = 0; 5209cc0e99cSViacheslav Ovsiienko RTE_SET_USED(mapping); 5219cc0e99cSViacheslav Ovsiienko #endif 5229cc0e99cSViacheslav Ovsiienko uar = mlx5_glue->devx_alloc_uar(ctx, uar_mapping); 5239cc0e99cSViacheslav Ovsiienko #ifdef MLX5DV_UAR_ALLOC_TYPE_NC 5249cc0e99cSViacheslav Ovsiienko if (!uar && 5259cc0e99cSViacheslav Ovsiienko mapping < 0 && 5269cc0e99cSViacheslav Ovsiienko uar_mapping == MLX5DV_UAR_ALLOC_TYPE_BF) { 5279cc0e99cSViacheslav Ovsiienko /* 5289cc0e99cSViacheslav Ovsiienko * In some environments like virtual machine the 5299cc0e99cSViacheslav Ovsiienko * Write Combining mapped might be not supported and 5309cc0e99cSViacheslav Ovsiienko * UAR allocation fails. We tried "Non-Cached" mapping 5319cc0e99cSViacheslav Ovsiienko * for the case. 5329cc0e99cSViacheslav Ovsiienko */ 5339cc0e99cSViacheslav Ovsiienko DRV_LOG(WARNING, "Failed to allocate DevX UAR (BF)"); 5349cc0e99cSViacheslav Ovsiienko uar_mapping = MLX5DV_UAR_ALLOC_TYPE_NC; 5359cc0e99cSViacheslav Ovsiienko uar = mlx5_glue->devx_alloc_uar(ctx, uar_mapping); 5369cc0e99cSViacheslav Ovsiienko } else if (!uar && 5379cc0e99cSViacheslav Ovsiienko mapping < 0 && 5389cc0e99cSViacheslav Ovsiienko uar_mapping == MLX5DV_UAR_ALLOC_TYPE_NC) { 5399cc0e99cSViacheslav Ovsiienko /* 5409cc0e99cSViacheslav Ovsiienko * If Verbs/kernel does not support "Non-Cached" 5419cc0e99cSViacheslav Ovsiienko * try the "Write-Combining". 5429cc0e99cSViacheslav Ovsiienko */ 5439cc0e99cSViacheslav Ovsiienko DRV_LOG(WARNING, "Failed to allocate DevX UAR (NC)"); 5449cc0e99cSViacheslav Ovsiienko uar_mapping = MLX5DV_UAR_ALLOC_TYPE_BF; 5459cc0e99cSViacheslav Ovsiienko uar = mlx5_glue->devx_alloc_uar(ctx, uar_mapping); 5469cc0e99cSViacheslav Ovsiienko } 5479cc0e99cSViacheslav Ovsiienko #endif 5489cc0e99cSViacheslav Ovsiienko if (!uar) { 5499cc0e99cSViacheslav Ovsiienko DRV_LOG(ERR, "Failed to allocate DevX UAR (BF/NC)"); 5509cc0e99cSViacheslav Ovsiienko rte_errno = ENOMEM; 5519cc0e99cSViacheslav Ovsiienko goto exit; 5529cc0e99cSViacheslav Ovsiienko } 5539cc0e99cSViacheslav Ovsiienko base_addr = mlx5_os_get_devx_uar_base_addr(uar); 5549cc0e99cSViacheslav Ovsiienko if (base_addr) 5559cc0e99cSViacheslav Ovsiienko break; 5569cc0e99cSViacheslav Ovsiienko /* 5579cc0e99cSViacheslav Ovsiienko * The UARs are allocated by rdma_core within the 5589cc0e99cSViacheslav Ovsiienko * IB device context, on context closure all UARs 5599cc0e99cSViacheslav Ovsiienko * will be freed, should be no memory/object leakage. 5609cc0e99cSViacheslav Ovsiienko */ 5619cc0e99cSViacheslav Ovsiienko DRV_LOG(WARNING, "Retrying to allocate DevX UAR"); 5629cc0e99cSViacheslav Ovsiienko uar = NULL; 5639cc0e99cSViacheslav Ovsiienko } 5649cc0e99cSViacheslav Ovsiienko /* Check whether we finally succeeded with valid UAR allocation. */ 5659cc0e99cSViacheslav Ovsiienko if (!uar) { 5669cc0e99cSViacheslav Ovsiienko DRV_LOG(ERR, "Failed to allocate DevX UAR (NULL base)"); 5679cc0e99cSViacheslav Ovsiienko rte_errno = ENOMEM; 5689cc0e99cSViacheslav Ovsiienko } 5699cc0e99cSViacheslav Ovsiienko /* 5709cc0e99cSViacheslav Ovsiienko * Return void * instead of struct mlx5dv_devx_uar * 5719cc0e99cSViacheslav Ovsiienko * is for compatibility with older rdma-core library headers. 5729cc0e99cSViacheslav Ovsiienko */ 5739cc0e99cSViacheslav Ovsiienko exit: 5749cc0e99cSViacheslav Ovsiienko return uar; 5759cc0e99cSViacheslav Ovsiienko } 576*ad435d32SXueming Li 577*ad435d32SXueming Li RTE_PMD_EXPORT_NAME(mlx5_common_driver, __COUNTER__); 578