18b8036a6SElena Agostini /* SPDX-License-Identifier: BSD-3-Clause 28b8036a6SElena Agostini * Copyright (c) 2021 NVIDIA Corporation & Affiliates 38b8036a6SElena Agostini */ 48b8036a6SElena Agostini 58b8036a6SElena Agostini #include <rte_eal.h> 618cb0756SThomas Monjalon #include <rte_tailq.h> 718cb0756SThomas Monjalon #include <rte_rwlock.h> 88b8036a6SElena Agostini #include <rte_string_fns.h> 9a9af048aSThomas Monjalon #include <rte_memzone.h> 10e818c4e2SElena Agostini #include <rte_malloc.h> 118b8036a6SElena Agostini #include <rte_errno.h> 128b8036a6SElena Agostini #include <rte_log.h> 138b8036a6SElena Agostini 148b8036a6SElena Agostini #include "rte_gpudev.h" 158b8036a6SElena Agostini #include "gpudev_driver.h" 168b8036a6SElena Agostini 178b8036a6SElena Agostini /* Logging */ 188b8036a6SElena Agostini RTE_LOG_REGISTER_DEFAULT(gpu_logtype, NOTICE); 198b8036a6SElena Agostini #define GPU_LOG(level, ...) \ 208b8036a6SElena Agostini rte_log(RTE_LOG_ ## level, gpu_logtype, RTE_FMT("gpu: " \ 218b8036a6SElena Agostini RTE_FMT_HEAD(__VA_ARGS__, ) "\n", RTE_FMT_TAIL(__VA_ARGS__, ))) 228b8036a6SElena Agostini 238b8036a6SElena Agostini /* Set any driver error as EPERM */ 248b8036a6SElena Agostini #define GPU_DRV_RET(function) \ 258b8036a6SElena Agostini ((function != 0) ? -(rte_errno = EPERM) : (rte_errno = 0)) 268b8036a6SElena Agostini 278b8036a6SElena Agostini /* Array of devices */ 288b8036a6SElena Agostini static struct rte_gpu *gpus; 298b8036a6SElena Agostini /* Number of currently valid devices */ 308b8036a6SElena Agostini static int16_t gpu_max; 318b8036a6SElena Agostini /* Number of currently valid devices */ 328b8036a6SElena Agostini static int16_t gpu_count; 338b8036a6SElena Agostini 34a9af048aSThomas Monjalon /* Shared memory between processes. */ 35a9af048aSThomas Monjalon static const char *GPU_MEMZONE = "rte_gpu_shared"; 36a9af048aSThomas Monjalon static struct { 37a9af048aSThomas Monjalon __extension__ struct rte_gpu_mpshared gpus[0]; 38a9af048aSThomas Monjalon } *gpu_shared_mem; 39a9af048aSThomas Monjalon 4018cb0756SThomas Monjalon /* Event callback object */ 4118cb0756SThomas Monjalon struct rte_gpu_callback { 4218cb0756SThomas Monjalon TAILQ_ENTRY(rte_gpu_callback) next; 4318cb0756SThomas Monjalon rte_gpu_callback_t *function; 4418cb0756SThomas Monjalon void *user_data; 4518cb0756SThomas Monjalon enum rte_gpu_event event; 4618cb0756SThomas Monjalon }; 4718cb0756SThomas Monjalon static rte_rwlock_t gpu_callback_lock = RTE_RWLOCK_INITIALIZER; 4818cb0756SThomas Monjalon static void gpu_free_callbacks(struct rte_gpu *dev); 4918cb0756SThomas Monjalon 508b8036a6SElena Agostini int 518b8036a6SElena Agostini rte_gpu_init(size_t dev_max) 528b8036a6SElena Agostini { 538b8036a6SElena Agostini if (dev_max == 0 || dev_max > INT16_MAX) { 548b8036a6SElena Agostini GPU_LOG(ERR, "invalid array size"); 558b8036a6SElena Agostini rte_errno = EINVAL; 568b8036a6SElena Agostini return -rte_errno; 578b8036a6SElena Agostini } 588b8036a6SElena Agostini 598b8036a6SElena Agostini /* No lock, it must be called before or during first probing. */ 608b8036a6SElena Agostini if (gpus != NULL) { 618b8036a6SElena Agostini GPU_LOG(ERR, "already initialized"); 628b8036a6SElena Agostini rte_errno = EBUSY; 638b8036a6SElena Agostini return -rte_errno; 648b8036a6SElena Agostini } 658b8036a6SElena Agostini 668b8036a6SElena Agostini gpus = calloc(dev_max, sizeof(struct rte_gpu)); 678b8036a6SElena Agostini if (gpus == NULL) { 688b8036a6SElena Agostini GPU_LOG(ERR, "cannot initialize library"); 698b8036a6SElena Agostini rte_errno = ENOMEM; 708b8036a6SElena Agostini return -rte_errno; 718b8036a6SElena Agostini } 728b8036a6SElena Agostini 738b8036a6SElena Agostini gpu_max = dev_max; 748b8036a6SElena Agostini return 0; 758b8036a6SElena Agostini } 768b8036a6SElena Agostini 778b8036a6SElena Agostini uint16_t 788b8036a6SElena Agostini rte_gpu_count_avail(void) 798b8036a6SElena Agostini { 808b8036a6SElena Agostini return gpu_count; 818b8036a6SElena Agostini } 828b8036a6SElena Agostini 838b8036a6SElena Agostini bool 848b8036a6SElena Agostini rte_gpu_is_valid(int16_t dev_id) 858b8036a6SElena Agostini { 868b8036a6SElena Agostini if (dev_id >= 0 && dev_id < gpu_max && 87a9af048aSThomas Monjalon gpus[dev_id].process_state == RTE_GPU_STATE_INITIALIZED) 888b8036a6SElena Agostini return true; 898b8036a6SElena Agostini return false; 908b8036a6SElena Agostini } 918b8036a6SElena Agostini 9282e5f6b6SThomas Monjalon static bool 9382e5f6b6SThomas Monjalon gpu_match_parent(int16_t dev_id, int16_t parent) 9482e5f6b6SThomas Monjalon { 9582e5f6b6SThomas Monjalon if (parent == RTE_GPU_ID_ANY) 9682e5f6b6SThomas Monjalon return true; 97a9af048aSThomas Monjalon return gpus[dev_id].mpshared->info.parent == parent; 9882e5f6b6SThomas Monjalon } 9982e5f6b6SThomas Monjalon 1008b8036a6SElena Agostini int16_t 10182e5f6b6SThomas Monjalon rte_gpu_find_next(int16_t dev_id, int16_t parent) 1028b8036a6SElena Agostini { 1038b8036a6SElena Agostini if (dev_id < 0) 1048b8036a6SElena Agostini dev_id = 0; 1058b8036a6SElena Agostini while (dev_id < gpu_max && 106a9af048aSThomas Monjalon (gpus[dev_id].process_state == RTE_GPU_STATE_UNUSED || 10782e5f6b6SThomas Monjalon !gpu_match_parent(dev_id, parent))) 1088b8036a6SElena Agostini dev_id++; 1098b8036a6SElena Agostini 1108b8036a6SElena Agostini if (dev_id >= gpu_max) 1118b8036a6SElena Agostini return RTE_GPU_ID_NONE; 1128b8036a6SElena Agostini return dev_id; 1138b8036a6SElena Agostini } 1148b8036a6SElena Agostini 1158b8036a6SElena Agostini static int16_t 1168b8036a6SElena Agostini gpu_find_free_id(void) 1178b8036a6SElena Agostini { 1188b8036a6SElena Agostini int16_t dev_id; 1198b8036a6SElena Agostini 1208b8036a6SElena Agostini for (dev_id = 0; dev_id < gpu_max; dev_id++) { 121a9af048aSThomas Monjalon if (gpus[dev_id].process_state == RTE_GPU_STATE_UNUSED) 1228b8036a6SElena Agostini return dev_id; 1238b8036a6SElena Agostini } 1248b8036a6SElena Agostini return RTE_GPU_ID_NONE; 1258b8036a6SElena Agostini } 1268b8036a6SElena Agostini 1278b8036a6SElena Agostini static struct rte_gpu * 1288b8036a6SElena Agostini gpu_get_by_id(int16_t dev_id) 1298b8036a6SElena Agostini { 1308b8036a6SElena Agostini if (!rte_gpu_is_valid(dev_id)) 1318b8036a6SElena Agostini return NULL; 1328b8036a6SElena Agostini return &gpus[dev_id]; 1338b8036a6SElena Agostini } 1348b8036a6SElena Agostini 1358b8036a6SElena Agostini struct rte_gpu * 1368b8036a6SElena Agostini rte_gpu_get_by_name(const char *name) 1378b8036a6SElena Agostini { 1388b8036a6SElena Agostini int16_t dev_id; 1398b8036a6SElena Agostini struct rte_gpu *dev; 1408b8036a6SElena Agostini 1418b8036a6SElena Agostini if (name == NULL) { 1428b8036a6SElena Agostini rte_errno = EINVAL; 1438b8036a6SElena Agostini return NULL; 1448b8036a6SElena Agostini } 1458b8036a6SElena Agostini 1468b8036a6SElena Agostini RTE_GPU_FOREACH(dev_id) { 1478b8036a6SElena Agostini dev = &gpus[dev_id]; 148a9af048aSThomas Monjalon if (strncmp(name, dev->mpshared->name, RTE_DEV_NAME_MAX_LEN) == 0) 1498b8036a6SElena Agostini return dev; 1508b8036a6SElena Agostini } 1518b8036a6SElena Agostini return NULL; 1528b8036a6SElena Agostini } 1538b8036a6SElena Agostini 154a9af048aSThomas Monjalon static int 155a9af048aSThomas Monjalon gpu_shared_mem_init(void) 156a9af048aSThomas Monjalon { 157a9af048aSThomas Monjalon const struct rte_memzone *memzone; 158a9af048aSThomas Monjalon 159a9af048aSThomas Monjalon if (rte_eal_process_type() == RTE_PROC_PRIMARY) { 160a9af048aSThomas Monjalon memzone = rte_memzone_reserve(GPU_MEMZONE, 161a9af048aSThomas Monjalon sizeof(*gpu_shared_mem) + 162a9af048aSThomas Monjalon sizeof(*gpu_shared_mem->gpus) * gpu_max, 163a9af048aSThomas Monjalon SOCKET_ID_ANY, 0); 164a9af048aSThomas Monjalon } else { 165a9af048aSThomas Monjalon memzone = rte_memzone_lookup(GPU_MEMZONE); 166a9af048aSThomas Monjalon } 167a9af048aSThomas Monjalon if (memzone == NULL) { 168a9af048aSThomas Monjalon GPU_LOG(ERR, "cannot initialize shared memory"); 169a9af048aSThomas Monjalon rte_errno = ENOMEM; 170a9af048aSThomas Monjalon return -rte_errno; 171a9af048aSThomas Monjalon } 172a9af048aSThomas Monjalon 173a9af048aSThomas Monjalon gpu_shared_mem = memzone->addr; 174a9af048aSThomas Monjalon return 0; 175a9af048aSThomas Monjalon } 176a9af048aSThomas Monjalon 1778b8036a6SElena Agostini struct rte_gpu * 1788b8036a6SElena Agostini rte_gpu_allocate(const char *name) 1798b8036a6SElena Agostini { 1808b8036a6SElena Agostini int16_t dev_id; 1818b8036a6SElena Agostini struct rte_gpu *dev; 1828b8036a6SElena Agostini 1838b8036a6SElena Agostini if (rte_eal_process_type() != RTE_PROC_PRIMARY) { 1848b8036a6SElena Agostini GPU_LOG(ERR, "only primary process can allocate device"); 1858b8036a6SElena Agostini rte_errno = EPERM; 1868b8036a6SElena Agostini return NULL; 1878b8036a6SElena Agostini } 1888b8036a6SElena Agostini if (name == NULL) { 1898b8036a6SElena Agostini GPU_LOG(ERR, "allocate device without a name"); 1908b8036a6SElena Agostini rte_errno = EINVAL; 1918b8036a6SElena Agostini return NULL; 1928b8036a6SElena Agostini } 1938b8036a6SElena Agostini 1948b8036a6SElena Agostini /* implicit initialization of library before adding first device */ 1958b8036a6SElena Agostini if (gpus == NULL && rte_gpu_init(RTE_GPU_DEFAULT_MAX) < 0) 1968b8036a6SElena Agostini return NULL; 1978b8036a6SElena Agostini 198a9af048aSThomas Monjalon /* initialize shared memory before adding first device */ 199a9af048aSThomas Monjalon if (gpu_shared_mem == NULL && gpu_shared_mem_init() < 0) 200a9af048aSThomas Monjalon return NULL; 201a9af048aSThomas Monjalon 2028b8036a6SElena Agostini if (rte_gpu_get_by_name(name) != NULL) { 2038b8036a6SElena Agostini GPU_LOG(ERR, "device with name %s already exists", name); 2048b8036a6SElena Agostini rte_errno = EEXIST; 2058b8036a6SElena Agostini return NULL; 2068b8036a6SElena Agostini } 2078b8036a6SElena Agostini dev_id = gpu_find_free_id(); 2088b8036a6SElena Agostini if (dev_id == RTE_GPU_ID_NONE) { 2098b8036a6SElena Agostini GPU_LOG(ERR, "reached maximum number of devices"); 2108b8036a6SElena Agostini rte_errno = ENOENT; 2118b8036a6SElena Agostini return NULL; 2128b8036a6SElena Agostini } 2138b8036a6SElena Agostini 2148b8036a6SElena Agostini dev = &gpus[dev_id]; 2158b8036a6SElena Agostini memset(dev, 0, sizeof(*dev)); 2168b8036a6SElena Agostini 217a9af048aSThomas Monjalon dev->mpshared = &gpu_shared_mem->gpus[dev_id]; 218a9af048aSThomas Monjalon memset(dev->mpshared, 0, sizeof(*dev->mpshared)); 219a9af048aSThomas Monjalon 220a9af048aSThomas Monjalon if (rte_strscpy(dev->mpshared->name, name, RTE_DEV_NAME_MAX_LEN) < 0) { 2218b8036a6SElena Agostini GPU_LOG(ERR, "device name too long: %s", name); 2228b8036a6SElena Agostini rte_errno = ENAMETOOLONG; 2238b8036a6SElena Agostini return NULL; 2248b8036a6SElena Agostini } 225a9af048aSThomas Monjalon dev->mpshared->info.name = dev->mpshared->name; 226a9af048aSThomas Monjalon dev->mpshared->info.dev_id = dev_id; 227a9af048aSThomas Monjalon dev->mpshared->info.numa_node = -1; 228a9af048aSThomas Monjalon dev->mpshared->info.parent = RTE_GPU_ID_NONE; 22918cb0756SThomas Monjalon TAILQ_INIT(&dev->callbacks); 230a9af048aSThomas Monjalon __atomic_fetch_add(&dev->mpshared->process_refcnt, 1, __ATOMIC_RELAXED); 2318b8036a6SElena Agostini 2328b8036a6SElena Agostini gpu_count++; 2338b8036a6SElena Agostini GPU_LOG(DEBUG, "new device %s (id %d) of total %d", 2348b8036a6SElena Agostini name, dev_id, gpu_count); 2358b8036a6SElena Agostini return dev; 2368b8036a6SElena Agostini } 2378b8036a6SElena Agostini 238a9af048aSThomas Monjalon struct rte_gpu * 239a9af048aSThomas Monjalon rte_gpu_attach(const char *name) 240a9af048aSThomas Monjalon { 241a9af048aSThomas Monjalon int16_t dev_id; 242a9af048aSThomas Monjalon struct rte_gpu *dev; 243a9af048aSThomas Monjalon struct rte_gpu_mpshared *shared_dev; 244a9af048aSThomas Monjalon 245a9af048aSThomas Monjalon if (rte_eal_process_type() != RTE_PROC_SECONDARY) { 246a9af048aSThomas Monjalon GPU_LOG(ERR, "only secondary process can attach device"); 247a9af048aSThomas Monjalon rte_errno = EPERM; 248a9af048aSThomas Monjalon return NULL; 249a9af048aSThomas Monjalon } 250a9af048aSThomas Monjalon if (name == NULL) { 251a9af048aSThomas Monjalon GPU_LOG(ERR, "attach device without a name"); 252a9af048aSThomas Monjalon rte_errno = EINVAL; 253a9af048aSThomas Monjalon return NULL; 254a9af048aSThomas Monjalon } 255a9af048aSThomas Monjalon 256a9af048aSThomas Monjalon /* implicit initialization of library before adding first device */ 257a9af048aSThomas Monjalon if (gpus == NULL && rte_gpu_init(RTE_GPU_DEFAULT_MAX) < 0) 258a9af048aSThomas Monjalon return NULL; 259a9af048aSThomas Monjalon 260a9af048aSThomas Monjalon /* initialize shared memory before adding first device */ 261a9af048aSThomas Monjalon if (gpu_shared_mem == NULL && gpu_shared_mem_init() < 0) 262a9af048aSThomas Monjalon return NULL; 263a9af048aSThomas Monjalon 264a9af048aSThomas Monjalon for (dev_id = 0; dev_id < gpu_max; dev_id++) { 265a9af048aSThomas Monjalon shared_dev = &gpu_shared_mem->gpus[dev_id]; 266a9af048aSThomas Monjalon if (strncmp(name, shared_dev->name, RTE_DEV_NAME_MAX_LEN) == 0) 267a9af048aSThomas Monjalon break; 268a9af048aSThomas Monjalon } 269a9af048aSThomas Monjalon if (dev_id >= gpu_max) { 270a9af048aSThomas Monjalon GPU_LOG(ERR, "device with name %s not found", name); 271a9af048aSThomas Monjalon rte_errno = ENOENT; 272a9af048aSThomas Monjalon return NULL; 273a9af048aSThomas Monjalon } 274a9af048aSThomas Monjalon dev = &gpus[dev_id]; 275a9af048aSThomas Monjalon memset(dev, 0, sizeof(*dev)); 276a9af048aSThomas Monjalon 277a9af048aSThomas Monjalon TAILQ_INIT(&dev->callbacks); 278a9af048aSThomas Monjalon dev->mpshared = shared_dev; 279a9af048aSThomas Monjalon __atomic_fetch_add(&dev->mpshared->process_refcnt, 1, __ATOMIC_RELAXED); 280a9af048aSThomas Monjalon 281a9af048aSThomas Monjalon gpu_count++; 282a9af048aSThomas Monjalon GPU_LOG(DEBUG, "attached device %s (id %d) of total %d", 283a9af048aSThomas Monjalon name, dev_id, gpu_count); 284a9af048aSThomas Monjalon return dev; 285a9af048aSThomas Monjalon } 286a9af048aSThomas Monjalon 28782e5f6b6SThomas Monjalon int16_t 28882e5f6b6SThomas Monjalon rte_gpu_add_child(const char *name, int16_t parent, uint64_t child_context) 28982e5f6b6SThomas Monjalon { 29082e5f6b6SThomas Monjalon struct rte_gpu *dev; 29182e5f6b6SThomas Monjalon 29282e5f6b6SThomas Monjalon if (!rte_gpu_is_valid(parent)) { 29382e5f6b6SThomas Monjalon GPU_LOG(ERR, "add child to invalid parent ID %d", parent); 29482e5f6b6SThomas Monjalon rte_errno = ENODEV; 29582e5f6b6SThomas Monjalon return -rte_errno; 29682e5f6b6SThomas Monjalon } 29782e5f6b6SThomas Monjalon 29882e5f6b6SThomas Monjalon dev = rte_gpu_allocate(name); 29982e5f6b6SThomas Monjalon if (dev == NULL) 30082e5f6b6SThomas Monjalon return -rte_errno; 30182e5f6b6SThomas Monjalon 302a9af048aSThomas Monjalon dev->mpshared->info.parent = parent; 303a9af048aSThomas Monjalon dev->mpshared->info.context = child_context; 30482e5f6b6SThomas Monjalon 30582e5f6b6SThomas Monjalon rte_gpu_complete_new(dev); 306a9af048aSThomas Monjalon return dev->mpshared->info.dev_id; 30782e5f6b6SThomas Monjalon } 30882e5f6b6SThomas Monjalon 3098b8036a6SElena Agostini void 3108b8036a6SElena Agostini rte_gpu_complete_new(struct rte_gpu *dev) 3118b8036a6SElena Agostini { 3128b8036a6SElena Agostini if (dev == NULL) 3138b8036a6SElena Agostini return; 3148b8036a6SElena Agostini 315a9af048aSThomas Monjalon dev->process_state = RTE_GPU_STATE_INITIALIZED; 31618cb0756SThomas Monjalon rte_gpu_notify(dev, RTE_GPU_EVENT_NEW); 3178b8036a6SElena Agostini } 3188b8036a6SElena Agostini 3198b8036a6SElena Agostini int 3208b8036a6SElena Agostini rte_gpu_release(struct rte_gpu *dev) 3218b8036a6SElena Agostini { 32282e5f6b6SThomas Monjalon int16_t dev_id, child; 32382e5f6b6SThomas Monjalon 3248b8036a6SElena Agostini if (dev == NULL) { 3258b8036a6SElena Agostini rte_errno = ENODEV; 3268b8036a6SElena Agostini return -rte_errno; 3278b8036a6SElena Agostini } 328a9af048aSThomas Monjalon dev_id = dev->mpshared->info.dev_id; 32982e5f6b6SThomas Monjalon RTE_GPU_FOREACH_CHILD(child, dev_id) { 33082e5f6b6SThomas Monjalon GPU_LOG(ERR, "cannot release device %d with child %d", 33182e5f6b6SThomas Monjalon dev_id, child); 33282e5f6b6SThomas Monjalon rte_errno = EBUSY; 33382e5f6b6SThomas Monjalon return -rte_errno; 33482e5f6b6SThomas Monjalon } 3358b8036a6SElena Agostini 3368b8036a6SElena Agostini GPU_LOG(DEBUG, "free device %s (id %d)", 337a9af048aSThomas Monjalon dev->mpshared->info.name, dev->mpshared->info.dev_id); 33818cb0756SThomas Monjalon rte_gpu_notify(dev, RTE_GPU_EVENT_DEL); 33918cb0756SThomas Monjalon 34018cb0756SThomas Monjalon gpu_free_callbacks(dev); 341a9af048aSThomas Monjalon dev->process_state = RTE_GPU_STATE_UNUSED; 342a9af048aSThomas Monjalon __atomic_fetch_sub(&dev->mpshared->process_refcnt, 1, __ATOMIC_RELAXED); 3438b8036a6SElena Agostini gpu_count--; 3448b8036a6SElena Agostini 3458b8036a6SElena Agostini return 0; 3468b8036a6SElena Agostini } 3478b8036a6SElena Agostini 3488b8036a6SElena Agostini int 3498b8036a6SElena Agostini rte_gpu_close(int16_t dev_id) 3508b8036a6SElena Agostini { 3518b8036a6SElena Agostini int firsterr, binerr; 3528b8036a6SElena Agostini int *lasterr = &firsterr; 3538b8036a6SElena Agostini struct rte_gpu *dev; 3548b8036a6SElena Agostini 3558b8036a6SElena Agostini dev = gpu_get_by_id(dev_id); 3568b8036a6SElena Agostini if (dev == NULL) { 3578b8036a6SElena Agostini GPU_LOG(ERR, "close invalid device ID %d", dev_id); 3588b8036a6SElena Agostini rte_errno = ENODEV; 3598b8036a6SElena Agostini return -rte_errno; 3608b8036a6SElena Agostini } 3618b8036a6SElena Agostini 3628b8036a6SElena Agostini if (dev->ops.dev_close != NULL) { 3638b8036a6SElena Agostini *lasterr = GPU_DRV_RET(dev->ops.dev_close(dev)); 3648b8036a6SElena Agostini if (*lasterr != 0) 3658b8036a6SElena Agostini lasterr = &binerr; 3668b8036a6SElena Agostini } 3678b8036a6SElena Agostini 3688b8036a6SElena Agostini *lasterr = rte_gpu_release(dev); 3698b8036a6SElena Agostini 3708b8036a6SElena Agostini rte_errno = -firsterr; 3718b8036a6SElena Agostini return firsterr; 3728b8036a6SElena Agostini } 3738b8036a6SElena Agostini 3748b8036a6SElena Agostini int 37518cb0756SThomas Monjalon rte_gpu_callback_register(int16_t dev_id, enum rte_gpu_event event, 37618cb0756SThomas Monjalon rte_gpu_callback_t *function, void *user_data) 37718cb0756SThomas Monjalon { 37818cb0756SThomas Monjalon int16_t next_dev, last_dev; 37918cb0756SThomas Monjalon struct rte_gpu_callback_list *callbacks; 38018cb0756SThomas Monjalon struct rte_gpu_callback *callback; 38118cb0756SThomas Monjalon 38218cb0756SThomas Monjalon if (!rte_gpu_is_valid(dev_id) && dev_id != RTE_GPU_ID_ANY) { 38318cb0756SThomas Monjalon GPU_LOG(ERR, "register callback of invalid ID %d", dev_id); 38418cb0756SThomas Monjalon rte_errno = ENODEV; 38518cb0756SThomas Monjalon return -rte_errno; 38618cb0756SThomas Monjalon } 38718cb0756SThomas Monjalon if (function == NULL) { 38818cb0756SThomas Monjalon GPU_LOG(ERR, "cannot register callback without function"); 38918cb0756SThomas Monjalon rte_errno = EINVAL; 39018cb0756SThomas Monjalon return -rte_errno; 39118cb0756SThomas Monjalon } 39218cb0756SThomas Monjalon 39318cb0756SThomas Monjalon if (dev_id == RTE_GPU_ID_ANY) { 39418cb0756SThomas Monjalon next_dev = 0; 39518cb0756SThomas Monjalon last_dev = gpu_max - 1; 39618cb0756SThomas Monjalon } else { 39718cb0756SThomas Monjalon next_dev = last_dev = dev_id; 39818cb0756SThomas Monjalon } 39918cb0756SThomas Monjalon 40018cb0756SThomas Monjalon rte_rwlock_write_lock(&gpu_callback_lock); 40118cb0756SThomas Monjalon do { 40218cb0756SThomas Monjalon callbacks = &gpus[next_dev].callbacks; 40318cb0756SThomas Monjalon 40418cb0756SThomas Monjalon /* check if not already registered */ 40518cb0756SThomas Monjalon TAILQ_FOREACH(callback, callbacks, next) { 40618cb0756SThomas Monjalon if (callback->event == event && 40718cb0756SThomas Monjalon callback->function == function && 40818cb0756SThomas Monjalon callback->user_data == user_data) { 40918cb0756SThomas Monjalon GPU_LOG(INFO, "callback already registered"); 41018cb0756SThomas Monjalon return 0; 41118cb0756SThomas Monjalon } 41218cb0756SThomas Monjalon } 41318cb0756SThomas Monjalon 41418cb0756SThomas Monjalon callback = malloc(sizeof(*callback)); 41518cb0756SThomas Monjalon if (callback == NULL) { 41618cb0756SThomas Monjalon GPU_LOG(ERR, "cannot allocate callback"); 41718cb0756SThomas Monjalon return -ENOMEM; 41818cb0756SThomas Monjalon } 41918cb0756SThomas Monjalon callback->function = function; 42018cb0756SThomas Monjalon callback->user_data = user_data; 42118cb0756SThomas Monjalon callback->event = event; 42218cb0756SThomas Monjalon TAILQ_INSERT_TAIL(callbacks, callback, next); 42318cb0756SThomas Monjalon 42418cb0756SThomas Monjalon } while (++next_dev <= last_dev); 42518cb0756SThomas Monjalon rte_rwlock_write_unlock(&gpu_callback_lock); 42618cb0756SThomas Monjalon 42718cb0756SThomas Monjalon return 0; 42818cb0756SThomas Monjalon } 42918cb0756SThomas Monjalon 43018cb0756SThomas Monjalon int 43118cb0756SThomas Monjalon rte_gpu_callback_unregister(int16_t dev_id, enum rte_gpu_event event, 43218cb0756SThomas Monjalon rte_gpu_callback_t *function, void *user_data) 43318cb0756SThomas Monjalon { 43418cb0756SThomas Monjalon int16_t next_dev, last_dev; 43518cb0756SThomas Monjalon struct rte_gpu_callback_list *callbacks; 43618cb0756SThomas Monjalon struct rte_gpu_callback *callback, *nextcb; 43718cb0756SThomas Monjalon 43818cb0756SThomas Monjalon if (!rte_gpu_is_valid(dev_id) && dev_id != RTE_GPU_ID_ANY) { 43918cb0756SThomas Monjalon GPU_LOG(ERR, "unregister callback of invalid ID %d", dev_id); 44018cb0756SThomas Monjalon rte_errno = ENODEV; 44118cb0756SThomas Monjalon return -rte_errno; 44218cb0756SThomas Monjalon } 44318cb0756SThomas Monjalon if (function == NULL) { 44418cb0756SThomas Monjalon GPU_LOG(ERR, "cannot unregister callback without function"); 44518cb0756SThomas Monjalon rte_errno = EINVAL; 44618cb0756SThomas Monjalon return -rte_errno; 44718cb0756SThomas Monjalon } 44818cb0756SThomas Monjalon 44918cb0756SThomas Monjalon if (dev_id == RTE_GPU_ID_ANY) { 45018cb0756SThomas Monjalon next_dev = 0; 45118cb0756SThomas Monjalon last_dev = gpu_max - 1; 45218cb0756SThomas Monjalon } else { 45318cb0756SThomas Monjalon next_dev = last_dev = dev_id; 45418cb0756SThomas Monjalon } 45518cb0756SThomas Monjalon 45618cb0756SThomas Monjalon rte_rwlock_write_lock(&gpu_callback_lock); 45718cb0756SThomas Monjalon do { 45818cb0756SThomas Monjalon callbacks = &gpus[next_dev].callbacks; 45918cb0756SThomas Monjalon RTE_TAILQ_FOREACH_SAFE(callback, callbacks, next, nextcb) { 46018cb0756SThomas Monjalon if (callback->event != event || 46118cb0756SThomas Monjalon callback->function != function || 46218cb0756SThomas Monjalon (callback->user_data != user_data && 46318cb0756SThomas Monjalon user_data != (void *)-1)) 46418cb0756SThomas Monjalon continue; 46518cb0756SThomas Monjalon TAILQ_REMOVE(callbacks, callback, next); 46618cb0756SThomas Monjalon free(callback); 46718cb0756SThomas Monjalon } 46818cb0756SThomas Monjalon } while (++next_dev <= last_dev); 46918cb0756SThomas Monjalon rte_rwlock_write_unlock(&gpu_callback_lock); 47018cb0756SThomas Monjalon 47118cb0756SThomas Monjalon return 0; 47218cb0756SThomas Monjalon } 47318cb0756SThomas Monjalon 47418cb0756SThomas Monjalon static void 47518cb0756SThomas Monjalon gpu_free_callbacks(struct rte_gpu *dev) 47618cb0756SThomas Monjalon { 47718cb0756SThomas Monjalon struct rte_gpu_callback_list *callbacks; 47818cb0756SThomas Monjalon struct rte_gpu_callback *callback, *nextcb; 47918cb0756SThomas Monjalon 48018cb0756SThomas Monjalon callbacks = &dev->callbacks; 48118cb0756SThomas Monjalon rte_rwlock_write_lock(&gpu_callback_lock); 48218cb0756SThomas Monjalon RTE_TAILQ_FOREACH_SAFE(callback, callbacks, next, nextcb) { 48318cb0756SThomas Monjalon TAILQ_REMOVE(callbacks, callback, next); 48418cb0756SThomas Monjalon free(callback); 48518cb0756SThomas Monjalon } 48618cb0756SThomas Monjalon rte_rwlock_write_unlock(&gpu_callback_lock); 48718cb0756SThomas Monjalon } 48818cb0756SThomas Monjalon 48918cb0756SThomas Monjalon void 49018cb0756SThomas Monjalon rte_gpu_notify(struct rte_gpu *dev, enum rte_gpu_event event) 49118cb0756SThomas Monjalon { 49218cb0756SThomas Monjalon int16_t dev_id; 49318cb0756SThomas Monjalon struct rte_gpu_callback *callback; 49418cb0756SThomas Monjalon 495a9af048aSThomas Monjalon dev_id = dev->mpshared->info.dev_id; 49618cb0756SThomas Monjalon rte_rwlock_read_lock(&gpu_callback_lock); 49718cb0756SThomas Monjalon TAILQ_FOREACH(callback, &dev->callbacks, next) { 49818cb0756SThomas Monjalon if (callback->event != event || callback->function == NULL) 49918cb0756SThomas Monjalon continue; 50018cb0756SThomas Monjalon callback->function(dev_id, event, callback->user_data); 50118cb0756SThomas Monjalon } 50218cb0756SThomas Monjalon rte_rwlock_read_unlock(&gpu_callback_lock); 50318cb0756SThomas Monjalon } 50418cb0756SThomas Monjalon 50518cb0756SThomas Monjalon int 5068b8036a6SElena Agostini rte_gpu_info_get(int16_t dev_id, struct rte_gpu_info *info) 5078b8036a6SElena Agostini { 5088b8036a6SElena Agostini struct rte_gpu *dev; 5098b8036a6SElena Agostini 5108b8036a6SElena Agostini dev = gpu_get_by_id(dev_id); 5118b8036a6SElena Agostini if (dev == NULL) { 5128b8036a6SElena Agostini GPU_LOG(ERR, "query invalid device ID %d", dev_id); 5138b8036a6SElena Agostini rte_errno = ENODEV; 5148b8036a6SElena Agostini return -rte_errno; 5158b8036a6SElena Agostini } 5168b8036a6SElena Agostini if (info == NULL) { 5178b8036a6SElena Agostini GPU_LOG(ERR, "query without storage"); 5188b8036a6SElena Agostini rte_errno = EINVAL; 5198b8036a6SElena Agostini return -rte_errno; 5208b8036a6SElena Agostini } 5218b8036a6SElena Agostini 5228b8036a6SElena Agostini if (dev->ops.dev_info_get == NULL) { 523a9af048aSThomas Monjalon *info = dev->mpshared->info; 5248b8036a6SElena Agostini return 0; 5258b8036a6SElena Agostini } 5268b8036a6SElena Agostini return GPU_DRV_RET(dev->ops.dev_info_get(dev, info)); 5278b8036a6SElena Agostini } 528e818c4e2SElena Agostini 529e818c4e2SElena Agostini void * 530e818c4e2SElena Agostini rte_gpu_mem_alloc(int16_t dev_id, size_t size) 531e818c4e2SElena Agostini { 532e818c4e2SElena Agostini struct rte_gpu *dev; 533e818c4e2SElena Agostini void *ptr; 534e818c4e2SElena Agostini int ret; 535e818c4e2SElena Agostini 536e818c4e2SElena Agostini dev = gpu_get_by_id(dev_id); 537e818c4e2SElena Agostini if (dev == NULL) { 538e818c4e2SElena Agostini GPU_LOG(ERR, "alloc mem for invalid device ID %d", dev_id); 539e818c4e2SElena Agostini rte_errno = ENODEV; 540e818c4e2SElena Agostini return NULL; 541e818c4e2SElena Agostini } 542e818c4e2SElena Agostini 543e818c4e2SElena Agostini if (dev->ops.mem_alloc == NULL) { 544e818c4e2SElena Agostini GPU_LOG(ERR, "mem allocation not supported"); 545e818c4e2SElena Agostini rte_errno = ENOTSUP; 546e818c4e2SElena Agostini return NULL; 547e818c4e2SElena Agostini } 548e818c4e2SElena Agostini 549e818c4e2SElena Agostini if (size == 0) /* dry-run */ 550e818c4e2SElena Agostini return NULL; 551e818c4e2SElena Agostini 552e818c4e2SElena Agostini ret = dev->ops.mem_alloc(dev, size, &ptr); 553e818c4e2SElena Agostini 554e818c4e2SElena Agostini switch (ret) { 555e818c4e2SElena Agostini case 0: 556e818c4e2SElena Agostini return ptr; 557e818c4e2SElena Agostini case -ENOMEM: 558e818c4e2SElena Agostini case -E2BIG: 559e818c4e2SElena Agostini rte_errno = -ret; 560e818c4e2SElena Agostini return NULL; 561e818c4e2SElena Agostini default: 562e818c4e2SElena Agostini rte_errno = -EPERM; 563e818c4e2SElena Agostini return NULL; 564e818c4e2SElena Agostini } 565e818c4e2SElena Agostini } 566e818c4e2SElena Agostini 567e818c4e2SElena Agostini int 568e818c4e2SElena Agostini rte_gpu_mem_free(int16_t dev_id, void *ptr) 569e818c4e2SElena Agostini { 570e818c4e2SElena Agostini struct rte_gpu *dev; 571e818c4e2SElena Agostini 572e818c4e2SElena Agostini dev = gpu_get_by_id(dev_id); 573e818c4e2SElena Agostini if (dev == NULL) { 574e818c4e2SElena Agostini GPU_LOG(ERR, "free mem for invalid device ID %d", dev_id); 575e818c4e2SElena Agostini rte_errno = ENODEV; 576e818c4e2SElena Agostini return -rte_errno; 577e818c4e2SElena Agostini } 578e818c4e2SElena Agostini 579e818c4e2SElena Agostini if (dev->ops.mem_free == NULL) { 580e818c4e2SElena Agostini rte_errno = ENOTSUP; 581e818c4e2SElena Agostini return -rte_errno; 582e818c4e2SElena Agostini } 583e818c4e2SElena Agostini return GPU_DRV_RET(dev->ops.mem_free(dev, ptr)); 584e818c4e2SElena Agostini } 585e818c4e2SElena Agostini 586e818c4e2SElena Agostini int 587e818c4e2SElena Agostini rte_gpu_mem_register(int16_t dev_id, size_t size, void *ptr) 588e818c4e2SElena Agostini { 589e818c4e2SElena Agostini struct rte_gpu *dev; 590e818c4e2SElena Agostini 591e818c4e2SElena Agostini dev = gpu_get_by_id(dev_id); 592e818c4e2SElena Agostini if (dev == NULL) { 593e818c4e2SElena Agostini GPU_LOG(ERR, "alloc mem for invalid device ID %d", dev_id); 594e818c4e2SElena Agostini rte_errno = ENODEV; 595e818c4e2SElena Agostini return -rte_errno; 596e818c4e2SElena Agostini } 597e818c4e2SElena Agostini 598e818c4e2SElena Agostini if (dev->ops.mem_register == NULL) { 599e818c4e2SElena Agostini GPU_LOG(ERR, "mem registration not supported"); 600e818c4e2SElena Agostini rte_errno = ENOTSUP; 601e818c4e2SElena Agostini return -rte_errno; 602e818c4e2SElena Agostini } 603e818c4e2SElena Agostini 604e818c4e2SElena Agostini if (size == 0 || ptr == NULL) /* dry-run */ 605e818c4e2SElena Agostini return -EINVAL; 606e818c4e2SElena Agostini 607e818c4e2SElena Agostini return GPU_DRV_RET(dev->ops.mem_register(dev, size, ptr)); 608e818c4e2SElena Agostini } 609e818c4e2SElena Agostini 610e818c4e2SElena Agostini int 611e818c4e2SElena Agostini rte_gpu_mem_unregister(int16_t dev_id, void *ptr) 612e818c4e2SElena Agostini { 613e818c4e2SElena Agostini struct rte_gpu *dev; 614e818c4e2SElena Agostini 615e818c4e2SElena Agostini dev = gpu_get_by_id(dev_id); 616e818c4e2SElena Agostini if (dev == NULL) { 617e818c4e2SElena Agostini GPU_LOG(ERR, "unregister mem for invalid device ID %d", dev_id); 618e818c4e2SElena Agostini rte_errno = ENODEV; 619e818c4e2SElena Agostini return -rte_errno; 620e818c4e2SElena Agostini } 621e818c4e2SElena Agostini 622e818c4e2SElena Agostini if (dev->ops.mem_unregister == NULL) { 623e818c4e2SElena Agostini rte_errno = ENOTSUP; 624e818c4e2SElena Agostini return -rte_errno; 625e818c4e2SElena Agostini } 626e818c4e2SElena Agostini return GPU_DRV_RET(dev->ops.mem_unregister(dev, ptr)); 627e818c4e2SElena Agostini } 628*2d61b429SElena Agostini 629*2d61b429SElena Agostini int 630*2d61b429SElena Agostini rte_gpu_wmb(int16_t dev_id) 631*2d61b429SElena Agostini { 632*2d61b429SElena Agostini struct rte_gpu *dev; 633*2d61b429SElena Agostini 634*2d61b429SElena Agostini dev = gpu_get_by_id(dev_id); 635*2d61b429SElena Agostini if (dev == NULL) { 636*2d61b429SElena Agostini GPU_LOG(ERR, "memory barrier for invalid device ID %d", dev_id); 637*2d61b429SElena Agostini rte_errno = ENODEV; 638*2d61b429SElena Agostini return -rte_errno; 639*2d61b429SElena Agostini } 640*2d61b429SElena Agostini 641*2d61b429SElena Agostini if (dev->ops.wmb == NULL) { 642*2d61b429SElena Agostini rte_errno = ENOTSUP; 643*2d61b429SElena Agostini return -rte_errno; 644*2d61b429SElena Agostini } 645*2d61b429SElena Agostini return GPU_DRV_RET(dev->ops.wmb(dev)); 646*2d61b429SElena Agostini } 647