18b8036a6SElena Agostini /* SPDX-License-Identifier: BSD-3-Clause 28b8036a6SElena Agostini * Copyright (c) 2021 NVIDIA Corporation & Affiliates 38b8036a6SElena Agostini */ 48b8036a6SElena Agostini 58b8036a6SElena Agostini #include <rte_eal.h> 618cb0756SThomas Monjalon #include <rte_tailq.h> 718cb0756SThomas Monjalon #include <rte_rwlock.h> 88b8036a6SElena Agostini #include <rte_string_fns.h> 9a9af048aSThomas Monjalon #include <rte_memzone.h> 10e818c4e2SElena Agostini #include <rte_malloc.h> 118b8036a6SElena Agostini #include <rte_errno.h> 128b8036a6SElena Agostini #include <rte_log.h> 138b8036a6SElena Agostini 148b8036a6SElena Agostini #include "rte_gpudev.h" 158b8036a6SElena Agostini #include "gpudev_driver.h" 168b8036a6SElena Agostini 178b8036a6SElena Agostini /* Logging */ 188b8036a6SElena Agostini RTE_LOG_REGISTER_DEFAULT(gpu_logtype, NOTICE); 198b8036a6SElena Agostini #define GPU_LOG(level, ...) \ 208b8036a6SElena Agostini rte_log(RTE_LOG_ ## level, gpu_logtype, RTE_FMT("gpu: " \ 218b8036a6SElena Agostini RTE_FMT_HEAD(__VA_ARGS__, ) "\n", RTE_FMT_TAIL(__VA_ARGS__, ))) 228b8036a6SElena Agostini 238b8036a6SElena Agostini /* Set any driver error as EPERM */ 248b8036a6SElena Agostini #define GPU_DRV_RET(function) \ 258b8036a6SElena Agostini ((function != 0) ? -(rte_errno = EPERM) : (rte_errno = 0)) 268b8036a6SElena Agostini 278b8036a6SElena Agostini /* Array of devices */ 288b8036a6SElena Agostini static struct rte_gpu *gpus; 298b8036a6SElena Agostini /* Number of currently valid devices */ 308b8036a6SElena Agostini static int16_t gpu_max; 318b8036a6SElena Agostini /* Number of currently valid devices */ 328b8036a6SElena Agostini static int16_t gpu_count; 338b8036a6SElena Agostini 34a9af048aSThomas Monjalon /* Shared memory between processes. */ 35a9af048aSThomas Monjalon static const char *GPU_MEMZONE = "rte_gpu_shared"; 36a9af048aSThomas Monjalon static struct { 37a9af048aSThomas Monjalon __extension__ struct rte_gpu_mpshared gpus[0]; 38a9af048aSThomas Monjalon } *gpu_shared_mem; 39a9af048aSThomas Monjalon 4018cb0756SThomas Monjalon /* Event callback object */ 4118cb0756SThomas Monjalon struct rte_gpu_callback { 4218cb0756SThomas Monjalon TAILQ_ENTRY(rte_gpu_callback) next; 4318cb0756SThomas Monjalon rte_gpu_callback_t *function; 4418cb0756SThomas Monjalon void *user_data; 4518cb0756SThomas Monjalon enum rte_gpu_event event; 4618cb0756SThomas Monjalon }; 4718cb0756SThomas Monjalon static rte_rwlock_t gpu_callback_lock = RTE_RWLOCK_INITIALIZER; 4818cb0756SThomas Monjalon static void gpu_free_callbacks(struct rte_gpu *dev); 4918cb0756SThomas Monjalon 508b8036a6SElena Agostini int 518b8036a6SElena Agostini rte_gpu_init(size_t dev_max) 528b8036a6SElena Agostini { 538b8036a6SElena Agostini if (dev_max == 0 || dev_max > INT16_MAX) { 548b8036a6SElena Agostini GPU_LOG(ERR, "invalid array size"); 558b8036a6SElena Agostini rte_errno = EINVAL; 568b8036a6SElena Agostini return -rte_errno; 578b8036a6SElena Agostini } 588b8036a6SElena Agostini 598b8036a6SElena Agostini /* No lock, it must be called before or during first probing. */ 608b8036a6SElena Agostini if (gpus != NULL) { 618b8036a6SElena Agostini GPU_LOG(ERR, "already initialized"); 628b8036a6SElena Agostini rte_errno = EBUSY; 638b8036a6SElena Agostini return -rte_errno; 648b8036a6SElena Agostini } 658b8036a6SElena Agostini 668b8036a6SElena Agostini gpus = calloc(dev_max, sizeof(struct rte_gpu)); 678b8036a6SElena Agostini if (gpus == NULL) { 688b8036a6SElena Agostini GPU_LOG(ERR, "cannot initialize library"); 698b8036a6SElena Agostini rte_errno = ENOMEM; 708b8036a6SElena Agostini return -rte_errno; 718b8036a6SElena Agostini } 728b8036a6SElena Agostini 738b8036a6SElena Agostini gpu_max = dev_max; 748b8036a6SElena Agostini return 0; 758b8036a6SElena Agostini } 768b8036a6SElena Agostini 778b8036a6SElena Agostini uint16_t 788b8036a6SElena Agostini rte_gpu_count_avail(void) 798b8036a6SElena Agostini { 808b8036a6SElena Agostini return gpu_count; 818b8036a6SElena Agostini } 828b8036a6SElena Agostini 838b8036a6SElena Agostini bool 848b8036a6SElena Agostini rte_gpu_is_valid(int16_t dev_id) 858b8036a6SElena Agostini { 868b8036a6SElena Agostini if (dev_id >= 0 && dev_id < gpu_max && 87a9af048aSThomas Monjalon gpus[dev_id].process_state == RTE_GPU_STATE_INITIALIZED) 888b8036a6SElena Agostini return true; 898b8036a6SElena Agostini return false; 908b8036a6SElena Agostini } 918b8036a6SElena Agostini 9282e5f6b6SThomas Monjalon static bool 9382e5f6b6SThomas Monjalon gpu_match_parent(int16_t dev_id, int16_t parent) 9482e5f6b6SThomas Monjalon { 9582e5f6b6SThomas Monjalon if (parent == RTE_GPU_ID_ANY) 9682e5f6b6SThomas Monjalon return true; 97a9af048aSThomas Monjalon return gpus[dev_id].mpshared->info.parent == parent; 9882e5f6b6SThomas Monjalon } 9982e5f6b6SThomas Monjalon 1008b8036a6SElena Agostini int16_t 10182e5f6b6SThomas Monjalon rte_gpu_find_next(int16_t dev_id, int16_t parent) 1028b8036a6SElena Agostini { 1038b8036a6SElena Agostini if (dev_id < 0) 1048b8036a6SElena Agostini dev_id = 0; 1058b8036a6SElena Agostini while (dev_id < gpu_max && 106a9af048aSThomas Monjalon (gpus[dev_id].process_state == RTE_GPU_STATE_UNUSED || 10782e5f6b6SThomas Monjalon !gpu_match_parent(dev_id, parent))) 1088b8036a6SElena Agostini dev_id++; 1098b8036a6SElena Agostini 1108b8036a6SElena Agostini if (dev_id >= gpu_max) 1118b8036a6SElena Agostini return RTE_GPU_ID_NONE; 1128b8036a6SElena Agostini return dev_id; 1138b8036a6SElena Agostini } 1148b8036a6SElena Agostini 1158b8036a6SElena Agostini static int16_t 1168b8036a6SElena Agostini gpu_find_free_id(void) 1178b8036a6SElena Agostini { 1188b8036a6SElena Agostini int16_t dev_id; 1198b8036a6SElena Agostini 1208b8036a6SElena Agostini for (dev_id = 0; dev_id < gpu_max; dev_id++) { 121a9af048aSThomas Monjalon if (gpus[dev_id].process_state == RTE_GPU_STATE_UNUSED) 1228b8036a6SElena Agostini return dev_id; 1238b8036a6SElena Agostini } 1248b8036a6SElena Agostini return RTE_GPU_ID_NONE; 1258b8036a6SElena Agostini } 1268b8036a6SElena Agostini 1278b8036a6SElena Agostini static struct rte_gpu * 1288b8036a6SElena Agostini gpu_get_by_id(int16_t dev_id) 1298b8036a6SElena Agostini { 1308b8036a6SElena Agostini if (!rte_gpu_is_valid(dev_id)) 1318b8036a6SElena Agostini return NULL; 1328b8036a6SElena Agostini return &gpus[dev_id]; 1338b8036a6SElena Agostini } 1348b8036a6SElena Agostini 1358b8036a6SElena Agostini struct rte_gpu * 1368b8036a6SElena Agostini rte_gpu_get_by_name(const char *name) 1378b8036a6SElena Agostini { 1388b8036a6SElena Agostini int16_t dev_id; 1398b8036a6SElena Agostini struct rte_gpu *dev; 1408b8036a6SElena Agostini 1418b8036a6SElena Agostini if (name == NULL) { 1428b8036a6SElena Agostini rte_errno = EINVAL; 1438b8036a6SElena Agostini return NULL; 1448b8036a6SElena Agostini } 1458b8036a6SElena Agostini 1468b8036a6SElena Agostini RTE_GPU_FOREACH(dev_id) { 1478b8036a6SElena Agostini dev = &gpus[dev_id]; 148a9af048aSThomas Monjalon if (strncmp(name, dev->mpshared->name, RTE_DEV_NAME_MAX_LEN) == 0) 1498b8036a6SElena Agostini return dev; 1508b8036a6SElena Agostini } 1518b8036a6SElena Agostini return NULL; 1528b8036a6SElena Agostini } 1538b8036a6SElena Agostini 154a9af048aSThomas Monjalon static int 155a9af048aSThomas Monjalon gpu_shared_mem_init(void) 156a9af048aSThomas Monjalon { 157a9af048aSThomas Monjalon const struct rte_memzone *memzone; 158a9af048aSThomas Monjalon 159a9af048aSThomas Monjalon if (rte_eal_process_type() == RTE_PROC_PRIMARY) { 160a9af048aSThomas Monjalon memzone = rte_memzone_reserve(GPU_MEMZONE, 161a9af048aSThomas Monjalon sizeof(*gpu_shared_mem) + 162a9af048aSThomas Monjalon sizeof(*gpu_shared_mem->gpus) * gpu_max, 163a9af048aSThomas Monjalon SOCKET_ID_ANY, 0); 164a9af048aSThomas Monjalon } else { 165a9af048aSThomas Monjalon memzone = rte_memzone_lookup(GPU_MEMZONE); 166a9af048aSThomas Monjalon } 167a9af048aSThomas Monjalon if (memzone == NULL) { 168a9af048aSThomas Monjalon GPU_LOG(ERR, "cannot initialize shared memory"); 169a9af048aSThomas Monjalon rte_errno = ENOMEM; 170a9af048aSThomas Monjalon return -rte_errno; 171a9af048aSThomas Monjalon } 172a9af048aSThomas Monjalon 173a9af048aSThomas Monjalon gpu_shared_mem = memzone->addr; 174a9af048aSThomas Monjalon return 0; 175a9af048aSThomas Monjalon } 176a9af048aSThomas Monjalon 1778b8036a6SElena Agostini struct rte_gpu * 1788b8036a6SElena Agostini rte_gpu_allocate(const char *name) 1798b8036a6SElena Agostini { 1808b8036a6SElena Agostini int16_t dev_id; 1818b8036a6SElena Agostini struct rte_gpu *dev; 1828b8036a6SElena Agostini 1838b8036a6SElena Agostini if (rte_eal_process_type() != RTE_PROC_PRIMARY) { 1848b8036a6SElena Agostini GPU_LOG(ERR, "only primary process can allocate device"); 1858b8036a6SElena Agostini rte_errno = EPERM; 1868b8036a6SElena Agostini return NULL; 1878b8036a6SElena Agostini } 1888b8036a6SElena Agostini if (name == NULL) { 1898b8036a6SElena Agostini GPU_LOG(ERR, "allocate device without a name"); 1908b8036a6SElena Agostini rte_errno = EINVAL; 1918b8036a6SElena Agostini return NULL; 1928b8036a6SElena Agostini } 1938b8036a6SElena Agostini 1948b8036a6SElena Agostini /* implicit initialization of library before adding first device */ 1958b8036a6SElena Agostini if (gpus == NULL && rte_gpu_init(RTE_GPU_DEFAULT_MAX) < 0) 1968b8036a6SElena Agostini return NULL; 1978b8036a6SElena Agostini 198a9af048aSThomas Monjalon /* initialize shared memory before adding first device */ 199a9af048aSThomas Monjalon if (gpu_shared_mem == NULL && gpu_shared_mem_init() < 0) 200a9af048aSThomas Monjalon return NULL; 201a9af048aSThomas Monjalon 2028b8036a6SElena Agostini if (rte_gpu_get_by_name(name) != NULL) { 2038b8036a6SElena Agostini GPU_LOG(ERR, "device with name %s already exists", name); 2048b8036a6SElena Agostini rte_errno = EEXIST; 2058b8036a6SElena Agostini return NULL; 2068b8036a6SElena Agostini } 2078b8036a6SElena Agostini dev_id = gpu_find_free_id(); 2088b8036a6SElena Agostini if (dev_id == RTE_GPU_ID_NONE) { 2098b8036a6SElena Agostini GPU_LOG(ERR, "reached maximum number of devices"); 2108b8036a6SElena Agostini rte_errno = ENOENT; 2118b8036a6SElena Agostini return NULL; 2128b8036a6SElena Agostini } 2138b8036a6SElena Agostini 2148b8036a6SElena Agostini dev = &gpus[dev_id]; 2158b8036a6SElena Agostini memset(dev, 0, sizeof(*dev)); 2168b8036a6SElena Agostini 217a9af048aSThomas Monjalon dev->mpshared = &gpu_shared_mem->gpus[dev_id]; 218a9af048aSThomas Monjalon memset(dev->mpshared, 0, sizeof(*dev->mpshared)); 219a9af048aSThomas Monjalon 220a9af048aSThomas Monjalon if (rte_strscpy(dev->mpshared->name, name, RTE_DEV_NAME_MAX_LEN) < 0) { 2218b8036a6SElena Agostini GPU_LOG(ERR, "device name too long: %s", name); 2228b8036a6SElena Agostini rte_errno = ENAMETOOLONG; 2238b8036a6SElena Agostini return NULL; 2248b8036a6SElena Agostini } 225a9af048aSThomas Monjalon dev->mpshared->info.name = dev->mpshared->name; 226a9af048aSThomas Monjalon dev->mpshared->info.dev_id = dev_id; 227a9af048aSThomas Monjalon dev->mpshared->info.numa_node = -1; 228a9af048aSThomas Monjalon dev->mpshared->info.parent = RTE_GPU_ID_NONE; 22918cb0756SThomas Monjalon TAILQ_INIT(&dev->callbacks); 230a9af048aSThomas Monjalon __atomic_fetch_add(&dev->mpshared->process_refcnt, 1, __ATOMIC_RELAXED); 2318b8036a6SElena Agostini 2328b8036a6SElena Agostini gpu_count++; 2338b8036a6SElena Agostini GPU_LOG(DEBUG, "new device %s (id %d) of total %d", 2348b8036a6SElena Agostini name, dev_id, gpu_count); 2358b8036a6SElena Agostini return dev; 2368b8036a6SElena Agostini } 2378b8036a6SElena Agostini 238a9af048aSThomas Monjalon struct rte_gpu * 239a9af048aSThomas Monjalon rte_gpu_attach(const char *name) 240a9af048aSThomas Monjalon { 241a9af048aSThomas Monjalon int16_t dev_id; 242a9af048aSThomas Monjalon struct rte_gpu *dev; 243a9af048aSThomas Monjalon struct rte_gpu_mpshared *shared_dev; 244a9af048aSThomas Monjalon 245a9af048aSThomas Monjalon if (rte_eal_process_type() != RTE_PROC_SECONDARY) { 246a9af048aSThomas Monjalon GPU_LOG(ERR, "only secondary process can attach device"); 247a9af048aSThomas Monjalon rte_errno = EPERM; 248a9af048aSThomas Monjalon return NULL; 249a9af048aSThomas Monjalon } 250a9af048aSThomas Monjalon if (name == NULL) { 251a9af048aSThomas Monjalon GPU_LOG(ERR, "attach device without a name"); 252a9af048aSThomas Monjalon rte_errno = EINVAL; 253a9af048aSThomas Monjalon return NULL; 254a9af048aSThomas Monjalon } 255a9af048aSThomas Monjalon 256a9af048aSThomas Monjalon /* implicit initialization of library before adding first device */ 257a9af048aSThomas Monjalon if (gpus == NULL && rte_gpu_init(RTE_GPU_DEFAULT_MAX) < 0) 258a9af048aSThomas Monjalon return NULL; 259a9af048aSThomas Monjalon 260a9af048aSThomas Monjalon /* initialize shared memory before adding first device */ 261a9af048aSThomas Monjalon if (gpu_shared_mem == NULL && gpu_shared_mem_init() < 0) 262a9af048aSThomas Monjalon return NULL; 263a9af048aSThomas Monjalon 264a9af048aSThomas Monjalon for (dev_id = 0; dev_id < gpu_max; dev_id++) { 265a9af048aSThomas Monjalon shared_dev = &gpu_shared_mem->gpus[dev_id]; 266a9af048aSThomas Monjalon if (strncmp(name, shared_dev->name, RTE_DEV_NAME_MAX_LEN) == 0) 267a9af048aSThomas Monjalon break; 268a9af048aSThomas Monjalon } 269a9af048aSThomas Monjalon if (dev_id >= gpu_max) { 270a9af048aSThomas Monjalon GPU_LOG(ERR, "device with name %s not found", name); 271a9af048aSThomas Monjalon rte_errno = ENOENT; 272a9af048aSThomas Monjalon return NULL; 273a9af048aSThomas Monjalon } 274a9af048aSThomas Monjalon dev = &gpus[dev_id]; 275a9af048aSThomas Monjalon memset(dev, 0, sizeof(*dev)); 276a9af048aSThomas Monjalon 277a9af048aSThomas Monjalon TAILQ_INIT(&dev->callbacks); 278a9af048aSThomas Monjalon dev->mpshared = shared_dev; 279a9af048aSThomas Monjalon __atomic_fetch_add(&dev->mpshared->process_refcnt, 1, __ATOMIC_RELAXED); 280a9af048aSThomas Monjalon 281a9af048aSThomas Monjalon gpu_count++; 282a9af048aSThomas Monjalon GPU_LOG(DEBUG, "attached device %s (id %d) of total %d", 283a9af048aSThomas Monjalon name, dev_id, gpu_count); 284a9af048aSThomas Monjalon return dev; 285a9af048aSThomas Monjalon } 286a9af048aSThomas Monjalon 28782e5f6b6SThomas Monjalon int16_t 28882e5f6b6SThomas Monjalon rte_gpu_add_child(const char *name, int16_t parent, uint64_t child_context) 28982e5f6b6SThomas Monjalon { 29082e5f6b6SThomas Monjalon struct rte_gpu *dev; 29182e5f6b6SThomas Monjalon 29282e5f6b6SThomas Monjalon if (!rte_gpu_is_valid(parent)) { 29382e5f6b6SThomas Monjalon GPU_LOG(ERR, "add child to invalid parent ID %d", parent); 29482e5f6b6SThomas Monjalon rte_errno = ENODEV; 29582e5f6b6SThomas Monjalon return -rte_errno; 29682e5f6b6SThomas Monjalon } 29782e5f6b6SThomas Monjalon 29882e5f6b6SThomas Monjalon dev = rte_gpu_allocate(name); 29982e5f6b6SThomas Monjalon if (dev == NULL) 30082e5f6b6SThomas Monjalon return -rte_errno; 30182e5f6b6SThomas Monjalon 302a9af048aSThomas Monjalon dev->mpshared->info.parent = parent; 303a9af048aSThomas Monjalon dev->mpshared->info.context = child_context; 30482e5f6b6SThomas Monjalon 30582e5f6b6SThomas Monjalon rte_gpu_complete_new(dev); 306a9af048aSThomas Monjalon return dev->mpshared->info.dev_id; 30782e5f6b6SThomas Monjalon } 30882e5f6b6SThomas Monjalon 3098b8036a6SElena Agostini void 3108b8036a6SElena Agostini rte_gpu_complete_new(struct rte_gpu *dev) 3118b8036a6SElena Agostini { 3128b8036a6SElena Agostini if (dev == NULL) 3138b8036a6SElena Agostini return; 3148b8036a6SElena Agostini 315a9af048aSThomas Monjalon dev->process_state = RTE_GPU_STATE_INITIALIZED; 31618cb0756SThomas Monjalon rte_gpu_notify(dev, RTE_GPU_EVENT_NEW); 3178b8036a6SElena Agostini } 3188b8036a6SElena Agostini 3198b8036a6SElena Agostini int 3208b8036a6SElena Agostini rte_gpu_release(struct rte_gpu *dev) 3218b8036a6SElena Agostini { 32282e5f6b6SThomas Monjalon int16_t dev_id, child; 32382e5f6b6SThomas Monjalon 3248b8036a6SElena Agostini if (dev == NULL) { 3258b8036a6SElena Agostini rte_errno = ENODEV; 3268b8036a6SElena Agostini return -rte_errno; 3278b8036a6SElena Agostini } 328a9af048aSThomas Monjalon dev_id = dev->mpshared->info.dev_id; 32982e5f6b6SThomas Monjalon RTE_GPU_FOREACH_CHILD(child, dev_id) { 33082e5f6b6SThomas Monjalon GPU_LOG(ERR, "cannot release device %d with child %d", 33182e5f6b6SThomas Monjalon dev_id, child); 33282e5f6b6SThomas Monjalon rte_errno = EBUSY; 33382e5f6b6SThomas Monjalon return -rte_errno; 33482e5f6b6SThomas Monjalon } 3358b8036a6SElena Agostini 3368b8036a6SElena Agostini GPU_LOG(DEBUG, "free device %s (id %d)", 337a9af048aSThomas Monjalon dev->mpshared->info.name, dev->mpshared->info.dev_id); 33818cb0756SThomas Monjalon rte_gpu_notify(dev, RTE_GPU_EVENT_DEL); 33918cb0756SThomas Monjalon 34018cb0756SThomas Monjalon gpu_free_callbacks(dev); 341a9af048aSThomas Monjalon dev->process_state = RTE_GPU_STATE_UNUSED; 342a9af048aSThomas Monjalon __atomic_fetch_sub(&dev->mpshared->process_refcnt, 1, __ATOMIC_RELAXED); 3438b8036a6SElena Agostini gpu_count--; 3448b8036a6SElena Agostini 3458b8036a6SElena Agostini return 0; 3468b8036a6SElena Agostini } 3478b8036a6SElena Agostini 3488b8036a6SElena Agostini int 3498b8036a6SElena Agostini rte_gpu_close(int16_t dev_id) 3508b8036a6SElena Agostini { 3518b8036a6SElena Agostini int firsterr, binerr; 3528b8036a6SElena Agostini int *lasterr = &firsterr; 3538b8036a6SElena Agostini struct rte_gpu *dev; 3548b8036a6SElena Agostini 3558b8036a6SElena Agostini dev = gpu_get_by_id(dev_id); 3568b8036a6SElena Agostini if (dev == NULL) { 3578b8036a6SElena Agostini GPU_LOG(ERR, "close invalid device ID %d", dev_id); 3588b8036a6SElena Agostini rte_errno = ENODEV; 3598b8036a6SElena Agostini return -rte_errno; 3608b8036a6SElena Agostini } 3618b8036a6SElena Agostini 3628b8036a6SElena Agostini if (dev->ops.dev_close != NULL) { 3638b8036a6SElena Agostini *lasterr = GPU_DRV_RET(dev->ops.dev_close(dev)); 3648b8036a6SElena Agostini if (*lasterr != 0) 3658b8036a6SElena Agostini lasterr = &binerr; 3668b8036a6SElena Agostini } 3678b8036a6SElena Agostini 3688b8036a6SElena Agostini *lasterr = rte_gpu_release(dev); 3698b8036a6SElena Agostini 3708b8036a6SElena Agostini rte_errno = -firsterr; 3718b8036a6SElena Agostini return firsterr; 3728b8036a6SElena Agostini } 3738b8036a6SElena Agostini 3748b8036a6SElena Agostini int 37518cb0756SThomas Monjalon rte_gpu_callback_register(int16_t dev_id, enum rte_gpu_event event, 37618cb0756SThomas Monjalon rte_gpu_callback_t *function, void *user_data) 37718cb0756SThomas Monjalon { 37818cb0756SThomas Monjalon int16_t next_dev, last_dev; 37918cb0756SThomas Monjalon struct rte_gpu_callback_list *callbacks; 38018cb0756SThomas Monjalon struct rte_gpu_callback *callback; 38118cb0756SThomas Monjalon 38218cb0756SThomas Monjalon if (!rte_gpu_is_valid(dev_id) && dev_id != RTE_GPU_ID_ANY) { 38318cb0756SThomas Monjalon GPU_LOG(ERR, "register callback of invalid ID %d", dev_id); 38418cb0756SThomas Monjalon rte_errno = ENODEV; 38518cb0756SThomas Monjalon return -rte_errno; 38618cb0756SThomas Monjalon } 38718cb0756SThomas Monjalon if (function == NULL) { 38818cb0756SThomas Monjalon GPU_LOG(ERR, "cannot register callback without function"); 38918cb0756SThomas Monjalon rte_errno = EINVAL; 39018cb0756SThomas Monjalon return -rte_errno; 39118cb0756SThomas Monjalon } 39218cb0756SThomas Monjalon 39318cb0756SThomas Monjalon if (dev_id == RTE_GPU_ID_ANY) { 39418cb0756SThomas Monjalon next_dev = 0; 39518cb0756SThomas Monjalon last_dev = gpu_max - 1; 39618cb0756SThomas Monjalon } else { 39718cb0756SThomas Monjalon next_dev = last_dev = dev_id; 39818cb0756SThomas Monjalon } 39918cb0756SThomas Monjalon 40018cb0756SThomas Monjalon rte_rwlock_write_lock(&gpu_callback_lock); 40118cb0756SThomas Monjalon do { 40218cb0756SThomas Monjalon callbacks = &gpus[next_dev].callbacks; 40318cb0756SThomas Monjalon 40418cb0756SThomas Monjalon /* check if not already registered */ 40518cb0756SThomas Monjalon TAILQ_FOREACH(callback, callbacks, next) { 40618cb0756SThomas Monjalon if (callback->event == event && 40718cb0756SThomas Monjalon callback->function == function && 40818cb0756SThomas Monjalon callback->user_data == user_data) { 40918cb0756SThomas Monjalon GPU_LOG(INFO, "callback already registered"); 41018cb0756SThomas Monjalon return 0; 41118cb0756SThomas Monjalon } 41218cb0756SThomas Monjalon } 41318cb0756SThomas Monjalon 41418cb0756SThomas Monjalon callback = malloc(sizeof(*callback)); 41518cb0756SThomas Monjalon if (callback == NULL) { 41618cb0756SThomas Monjalon GPU_LOG(ERR, "cannot allocate callback"); 41718cb0756SThomas Monjalon return -ENOMEM; 41818cb0756SThomas Monjalon } 41918cb0756SThomas Monjalon callback->function = function; 42018cb0756SThomas Monjalon callback->user_data = user_data; 42118cb0756SThomas Monjalon callback->event = event; 42218cb0756SThomas Monjalon TAILQ_INSERT_TAIL(callbacks, callback, next); 42318cb0756SThomas Monjalon 42418cb0756SThomas Monjalon } while (++next_dev <= last_dev); 42518cb0756SThomas Monjalon rte_rwlock_write_unlock(&gpu_callback_lock); 42618cb0756SThomas Monjalon 42718cb0756SThomas Monjalon return 0; 42818cb0756SThomas Monjalon } 42918cb0756SThomas Monjalon 43018cb0756SThomas Monjalon int 43118cb0756SThomas Monjalon rte_gpu_callback_unregister(int16_t dev_id, enum rte_gpu_event event, 43218cb0756SThomas Monjalon rte_gpu_callback_t *function, void *user_data) 43318cb0756SThomas Monjalon { 43418cb0756SThomas Monjalon int16_t next_dev, last_dev; 43518cb0756SThomas Monjalon struct rte_gpu_callback_list *callbacks; 43618cb0756SThomas Monjalon struct rte_gpu_callback *callback, *nextcb; 43718cb0756SThomas Monjalon 43818cb0756SThomas Monjalon if (!rte_gpu_is_valid(dev_id) && dev_id != RTE_GPU_ID_ANY) { 43918cb0756SThomas Monjalon GPU_LOG(ERR, "unregister callback of invalid ID %d", dev_id); 44018cb0756SThomas Monjalon rte_errno = ENODEV; 44118cb0756SThomas Monjalon return -rte_errno; 44218cb0756SThomas Monjalon } 44318cb0756SThomas Monjalon if (function == NULL) { 44418cb0756SThomas Monjalon GPU_LOG(ERR, "cannot unregister callback without function"); 44518cb0756SThomas Monjalon rte_errno = EINVAL; 44618cb0756SThomas Monjalon return -rte_errno; 44718cb0756SThomas Monjalon } 44818cb0756SThomas Monjalon 44918cb0756SThomas Monjalon if (dev_id == RTE_GPU_ID_ANY) { 45018cb0756SThomas Monjalon next_dev = 0; 45118cb0756SThomas Monjalon last_dev = gpu_max - 1; 45218cb0756SThomas Monjalon } else { 45318cb0756SThomas Monjalon next_dev = last_dev = dev_id; 45418cb0756SThomas Monjalon } 45518cb0756SThomas Monjalon 45618cb0756SThomas Monjalon rte_rwlock_write_lock(&gpu_callback_lock); 45718cb0756SThomas Monjalon do { 45818cb0756SThomas Monjalon callbacks = &gpus[next_dev].callbacks; 45918cb0756SThomas Monjalon RTE_TAILQ_FOREACH_SAFE(callback, callbacks, next, nextcb) { 46018cb0756SThomas Monjalon if (callback->event != event || 46118cb0756SThomas Monjalon callback->function != function || 46218cb0756SThomas Monjalon (callback->user_data != user_data && 46318cb0756SThomas Monjalon user_data != (void *)-1)) 46418cb0756SThomas Monjalon continue; 46518cb0756SThomas Monjalon TAILQ_REMOVE(callbacks, callback, next); 46618cb0756SThomas Monjalon free(callback); 46718cb0756SThomas Monjalon } 46818cb0756SThomas Monjalon } while (++next_dev <= last_dev); 46918cb0756SThomas Monjalon rte_rwlock_write_unlock(&gpu_callback_lock); 47018cb0756SThomas Monjalon 47118cb0756SThomas Monjalon return 0; 47218cb0756SThomas Monjalon } 47318cb0756SThomas Monjalon 47418cb0756SThomas Monjalon static void 47518cb0756SThomas Monjalon gpu_free_callbacks(struct rte_gpu *dev) 47618cb0756SThomas Monjalon { 47718cb0756SThomas Monjalon struct rte_gpu_callback_list *callbacks; 47818cb0756SThomas Monjalon struct rte_gpu_callback *callback, *nextcb; 47918cb0756SThomas Monjalon 48018cb0756SThomas Monjalon callbacks = &dev->callbacks; 48118cb0756SThomas Monjalon rte_rwlock_write_lock(&gpu_callback_lock); 48218cb0756SThomas Monjalon RTE_TAILQ_FOREACH_SAFE(callback, callbacks, next, nextcb) { 48318cb0756SThomas Monjalon TAILQ_REMOVE(callbacks, callback, next); 48418cb0756SThomas Monjalon free(callback); 48518cb0756SThomas Monjalon } 48618cb0756SThomas Monjalon rte_rwlock_write_unlock(&gpu_callback_lock); 48718cb0756SThomas Monjalon } 48818cb0756SThomas Monjalon 48918cb0756SThomas Monjalon void 49018cb0756SThomas Monjalon rte_gpu_notify(struct rte_gpu *dev, enum rte_gpu_event event) 49118cb0756SThomas Monjalon { 49218cb0756SThomas Monjalon int16_t dev_id; 49318cb0756SThomas Monjalon struct rte_gpu_callback *callback; 49418cb0756SThomas Monjalon 495a9af048aSThomas Monjalon dev_id = dev->mpshared->info.dev_id; 49618cb0756SThomas Monjalon rte_rwlock_read_lock(&gpu_callback_lock); 49718cb0756SThomas Monjalon TAILQ_FOREACH(callback, &dev->callbacks, next) { 49818cb0756SThomas Monjalon if (callback->event != event || callback->function == NULL) 49918cb0756SThomas Monjalon continue; 50018cb0756SThomas Monjalon callback->function(dev_id, event, callback->user_data); 50118cb0756SThomas Monjalon } 50218cb0756SThomas Monjalon rte_rwlock_read_unlock(&gpu_callback_lock); 50318cb0756SThomas Monjalon } 50418cb0756SThomas Monjalon 50518cb0756SThomas Monjalon int 5068b8036a6SElena Agostini rte_gpu_info_get(int16_t dev_id, struct rte_gpu_info *info) 5078b8036a6SElena Agostini { 5088b8036a6SElena Agostini struct rte_gpu *dev; 5098b8036a6SElena Agostini 5108b8036a6SElena Agostini dev = gpu_get_by_id(dev_id); 5118b8036a6SElena Agostini if (dev == NULL) { 5128b8036a6SElena Agostini GPU_LOG(ERR, "query invalid device ID %d", dev_id); 5138b8036a6SElena Agostini rte_errno = ENODEV; 5148b8036a6SElena Agostini return -rte_errno; 5158b8036a6SElena Agostini } 5168b8036a6SElena Agostini if (info == NULL) { 5178b8036a6SElena Agostini GPU_LOG(ERR, "query without storage"); 5188b8036a6SElena Agostini rte_errno = EINVAL; 5198b8036a6SElena Agostini return -rte_errno; 5208b8036a6SElena Agostini } 5218b8036a6SElena Agostini 5228b8036a6SElena Agostini if (dev->ops.dev_info_get == NULL) { 523a9af048aSThomas Monjalon *info = dev->mpshared->info; 5248b8036a6SElena Agostini return 0; 5258b8036a6SElena Agostini } 5268b8036a6SElena Agostini return GPU_DRV_RET(dev->ops.dev_info_get(dev, info)); 5278b8036a6SElena Agostini } 528e818c4e2SElena Agostini 529e818c4e2SElena Agostini void * 530c8557ed4SElena Agostini rte_gpu_mem_alloc(int16_t dev_id, size_t size, unsigned int align) 531e818c4e2SElena Agostini { 532e818c4e2SElena Agostini struct rte_gpu *dev; 533e818c4e2SElena Agostini void *ptr; 534e818c4e2SElena Agostini int ret; 535e818c4e2SElena Agostini 536e818c4e2SElena Agostini dev = gpu_get_by_id(dev_id); 537e818c4e2SElena Agostini if (dev == NULL) { 538e818c4e2SElena Agostini GPU_LOG(ERR, "alloc mem for invalid device ID %d", dev_id); 539e818c4e2SElena Agostini rte_errno = ENODEV; 540e818c4e2SElena Agostini return NULL; 541e818c4e2SElena Agostini } 542e818c4e2SElena Agostini 543e818c4e2SElena Agostini if (dev->ops.mem_alloc == NULL) { 544e818c4e2SElena Agostini GPU_LOG(ERR, "mem allocation not supported"); 545e818c4e2SElena Agostini rte_errno = ENOTSUP; 546e818c4e2SElena Agostini return NULL; 547e818c4e2SElena Agostini } 548e818c4e2SElena Agostini 549e818c4e2SElena Agostini if (size == 0) /* dry-run */ 550e818c4e2SElena Agostini return NULL; 551e818c4e2SElena Agostini 552c8557ed4SElena Agostini if (align && !rte_is_power_of_2(align)) { 553c8557ed4SElena Agostini GPU_LOG(ERR, "requested alignment is not a power of two %u", align); 554c8557ed4SElena Agostini rte_errno = EINVAL; 555c8557ed4SElena Agostini return NULL; 556c8557ed4SElena Agostini } 557c8557ed4SElena Agostini 558c8557ed4SElena Agostini ret = dev->ops.mem_alloc(dev, size, align, &ptr); 559e818c4e2SElena Agostini 560e818c4e2SElena Agostini switch (ret) { 561e818c4e2SElena Agostini case 0: 562e818c4e2SElena Agostini return ptr; 563e818c4e2SElena Agostini case -ENOMEM: 564e818c4e2SElena Agostini case -E2BIG: 565e818c4e2SElena Agostini rte_errno = -ret; 566e818c4e2SElena Agostini return NULL; 567e818c4e2SElena Agostini default: 568e818c4e2SElena Agostini rte_errno = -EPERM; 569e818c4e2SElena Agostini return NULL; 570e818c4e2SElena Agostini } 571e818c4e2SElena Agostini } 572e818c4e2SElena Agostini 573e818c4e2SElena Agostini int 574e818c4e2SElena Agostini rte_gpu_mem_free(int16_t dev_id, void *ptr) 575e818c4e2SElena Agostini { 576e818c4e2SElena Agostini struct rte_gpu *dev; 577e818c4e2SElena Agostini 578e818c4e2SElena Agostini dev = gpu_get_by_id(dev_id); 579e818c4e2SElena Agostini if (dev == NULL) { 580e818c4e2SElena Agostini GPU_LOG(ERR, "free mem for invalid device ID %d", dev_id); 581e818c4e2SElena Agostini rte_errno = ENODEV; 582e818c4e2SElena Agostini return -rte_errno; 583e818c4e2SElena Agostini } 584e818c4e2SElena Agostini 585e818c4e2SElena Agostini if (dev->ops.mem_free == NULL) { 586e818c4e2SElena Agostini rte_errno = ENOTSUP; 587e818c4e2SElena Agostini return -rte_errno; 588e818c4e2SElena Agostini } 5891674c56dSElena Agostini 5901674c56dSElena Agostini if (ptr == NULL) /* dry-run */ 5911674c56dSElena Agostini return 0; 5921674c56dSElena Agostini 593e818c4e2SElena Agostini return GPU_DRV_RET(dev->ops.mem_free(dev, ptr)); 594e818c4e2SElena Agostini } 595e818c4e2SElena Agostini 596e818c4e2SElena Agostini int 597e818c4e2SElena Agostini rte_gpu_mem_register(int16_t dev_id, size_t size, void *ptr) 598e818c4e2SElena Agostini { 599e818c4e2SElena Agostini struct rte_gpu *dev; 600e818c4e2SElena Agostini 601e818c4e2SElena Agostini dev = gpu_get_by_id(dev_id); 602e818c4e2SElena Agostini if (dev == NULL) { 603e818c4e2SElena Agostini GPU_LOG(ERR, "alloc mem for invalid device ID %d", dev_id); 604e818c4e2SElena Agostini rte_errno = ENODEV; 605e818c4e2SElena Agostini return -rte_errno; 606e818c4e2SElena Agostini } 607e818c4e2SElena Agostini 608e818c4e2SElena Agostini if (dev->ops.mem_register == NULL) { 609e818c4e2SElena Agostini GPU_LOG(ERR, "mem registration not supported"); 610e818c4e2SElena Agostini rte_errno = ENOTSUP; 611e818c4e2SElena Agostini return -rte_errno; 612e818c4e2SElena Agostini } 613e818c4e2SElena Agostini 6141674c56dSElena Agostini if (ptr == NULL || size == 0) /* dry-run */ 6151674c56dSElena Agostini return 0; 616e818c4e2SElena Agostini 617e818c4e2SElena Agostini return GPU_DRV_RET(dev->ops.mem_register(dev, size, ptr)); 618e818c4e2SElena Agostini } 619e818c4e2SElena Agostini 620e818c4e2SElena Agostini int 621e818c4e2SElena Agostini rte_gpu_mem_unregister(int16_t dev_id, void *ptr) 622e818c4e2SElena Agostini { 623e818c4e2SElena Agostini struct rte_gpu *dev; 624e818c4e2SElena Agostini 625e818c4e2SElena Agostini dev = gpu_get_by_id(dev_id); 626e818c4e2SElena Agostini if (dev == NULL) { 627e818c4e2SElena Agostini GPU_LOG(ERR, "unregister mem for invalid device ID %d", dev_id); 628e818c4e2SElena Agostini rte_errno = ENODEV; 629e818c4e2SElena Agostini return -rte_errno; 630e818c4e2SElena Agostini } 631e818c4e2SElena Agostini 632e818c4e2SElena Agostini if (dev->ops.mem_unregister == NULL) { 633e818c4e2SElena Agostini rte_errno = ENOTSUP; 634e818c4e2SElena Agostini return -rte_errno; 635e818c4e2SElena Agostini } 6361674c56dSElena Agostini 6371674c56dSElena Agostini if (ptr == NULL) /* dry-run */ 6381674c56dSElena Agostini return 0; 6391674c56dSElena Agostini 640e818c4e2SElena Agostini return GPU_DRV_RET(dev->ops.mem_unregister(dev, ptr)); 641e818c4e2SElena Agostini } 6422d61b429SElena Agostini 643*d69bb47dSElena Agostini void * 644*d69bb47dSElena Agostini rte_gpu_mem_cpu_map(int16_t dev_id, size_t size, void *ptr) 645*d69bb47dSElena Agostini { 646*d69bb47dSElena Agostini struct rte_gpu *dev; 647*d69bb47dSElena Agostini void *ptr_out; 648*d69bb47dSElena Agostini int ret; 649*d69bb47dSElena Agostini 650*d69bb47dSElena Agostini dev = gpu_get_by_id(dev_id); 651*d69bb47dSElena Agostini if (dev == NULL) { 652*d69bb47dSElena Agostini GPU_LOG(ERR, "mem CPU map for invalid device ID %d", dev_id); 653*d69bb47dSElena Agostini rte_errno = ENODEV; 654*d69bb47dSElena Agostini return NULL; 655*d69bb47dSElena Agostini } 656*d69bb47dSElena Agostini 657*d69bb47dSElena Agostini if (dev->ops.mem_cpu_map == NULL) { 658*d69bb47dSElena Agostini GPU_LOG(ERR, "mem CPU map not supported"); 659*d69bb47dSElena Agostini rte_errno = ENOTSUP; 660*d69bb47dSElena Agostini return NULL; 661*d69bb47dSElena Agostini } 662*d69bb47dSElena Agostini 663*d69bb47dSElena Agostini if (ptr == NULL || size == 0) /* dry-run */ 664*d69bb47dSElena Agostini return NULL; 665*d69bb47dSElena Agostini 666*d69bb47dSElena Agostini ret = GPU_DRV_RET(dev->ops.mem_cpu_map(dev, size, ptr, &ptr_out)); 667*d69bb47dSElena Agostini 668*d69bb47dSElena Agostini switch (ret) { 669*d69bb47dSElena Agostini case 0: 670*d69bb47dSElena Agostini return ptr_out; 671*d69bb47dSElena Agostini case -ENOMEM: 672*d69bb47dSElena Agostini case -E2BIG: 673*d69bb47dSElena Agostini rte_errno = -ret; 674*d69bb47dSElena Agostini return NULL; 675*d69bb47dSElena Agostini default: 676*d69bb47dSElena Agostini rte_errno = -EPERM; 677*d69bb47dSElena Agostini return NULL; 678*d69bb47dSElena Agostini } 679*d69bb47dSElena Agostini } 680*d69bb47dSElena Agostini 681*d69bb47dSElena Agostini int 682*d69bb47dSElena Agostini rte_gpu_mem_cpu_unmap(int16_t dev_id, void *ptr) 683*d69bb47dSElena Agostini { 684*d69bb47dSElena Agostini struct rte_gpu *dev; 685*d69bb47dSElena Agostini 686*d69bb47dSElena Agostini dev = gpu_get_by_id(dev_id); 687*d69bb47dSElena Agostini if (dev == NULL) { 688*d69bb47dSElena Agostini GPU_LOG(ERR, "cpu_unmap mem for invalid device ID %d", dev_id); 689*d69bb47dSElena Agostini rte_errno = ENODEV; 690*d69bb47dSElena Agostini return -rte_errno; 691*d69bb47dSElena Agostini } 692*d69bb47dSElena Agostini 693*d69bb47dSElena Agostini if (dev->ops.mem_cpu_unmap == NULL) { 694*d69bb47dSElena Agostini rte_errno = ENOTSUP; 695*d69bb47dSElena Agostini return -rte_errno; 696*d69bb47dSElena Agostini } 697*d69bb47dSElena Agostini 698*d69bb47dSElena Agostini if (ptr == NULL) /* dry-run */ 699*d69bb47dSElena Agostini return 0; 700*d69bb47dSElena Agostini 701*d69bb47dSElena Agostini return GPU_DRV_RET(dev->ops.mem_cpu_unmap(dev, ptr)); 702*d69bb47dSElena Agostini } 703*d69bb47dSElena Agostini 7042d61b429SElena Agostini int 7052d61b429SElena Agostini rte_gpu_wmb(int16_t dev_id) 7062d61b429SElena Agostini { 7072d61b429SElena Agostini struct rte_gpu *dev; 7082d61b429SElena Agostini 7092d61b429SElena Agostini dev = gpu_get_by_id(dev_id); 7102d61b429SElena Agostini if (dev == NULL) { 7112d61b429SElena Agostini GPU_LOG(ERR, "memory barrier for invalid device ID %d", dev_id); 7122d61b429SElena Agostini rte_errno = ENODEV; 7132d61b429SElena Agostini return -rte_errno; 7142d61b429SElena Agostini } 7152d61b429SElena Agostini 7162d61b429SElena Agostini if (dev->ops.wmb == NULL) { 7172d61b429SElena Agostini rte_errno = ENOTSUP; 7182d61b429SElena Agostini return -rte_errno; 7192d61b429SElena Agostini } 7202d61b429SElena Agostini return GPU_DRV_RET(dev->ops.wmb(dev)); 7212d61b429SElena Agostini } 722f56160a2SElena Agostini 723f56160a2SElena Agostini int 724f56160a2SElena Agostini rte_gpu_comm_create_flag(uint16_t dev_id, struct rte_gpu_comm_flag *devflag, 725f56160a2SElena Agostini enum rte_gpu_comm_flag_type mtype) 726f56160a2SElena Agostini { 727f56160a2SElena Agostini size_t flag_size; 728f56160a2SElena Agostini int ret; 729f56160a2SElena Agostini 730f56160a2SElena Agostini if (devflag == NULL) { 731f56160a2SElena Agostini rte_errno = EINVAL; 732f56160a2SElena Agostini return -rte_errno; 733f56160a2SElena Agostini } 734f56160a2SElena Agostini if (mtype != RTE_GPU_COMM_FLAG_CPU) { 735f56160a2SElena Agostini rte_errno = EINVAL; 736f56160a2SElena Agostini return -rte_errno; 737f56160a2SElena Agostini } 738f56160a2SElena Agostini 739f56160a2SElena Agostini flag_size = sizeof(uint32_t); 740f56160a2SElena Agostini 741f56160a2SElena Agostini devflag->ptr = rte_zmalloc(NULL, flag_size, 0); 742f56160a2SElena Agostini if (devflag->ptr == NULL) { 743f56160a2SElena Agostini rte_errno = ENOMEM; 744f56160a2SElena Agostini return -rte_errno; 745f56160a2SElena Agostini } 746f56160a2SElena Agostini 747f56160a2SElena Agostini ret = rte_gpu_mem_register(dev_id, flag_size, devflag->ptr); 748f56160a2SElena Agostini if (ret < 0) { 749f56160a2SElena Agostini rte_errno = ENOMEM; 750f56160a2SElena Agostini return -rte_errno; 751f56160a2SElena Agostini } 752f56160a2SElena Agostini 753f56160a2SElena Agostini devflag->mtype = mtype; 754f56160a2SElena Agostini devflag->dev_id = dev_id; 755f56160a2SElena Agostini 756f56160a2SElena Agostini return 0; 757f56160a2SElena Agostini } 758f56160a2SElena Agostini 759f56160a2SElena Agostini int 760f56160a2SElena Agostini rte_gpu_comm_destroy_flag(struct rte_gpu_comm_flag *devflag) 761f56160a2SElena Agostini { 762f56160a2SElena Agostini int ret; 763f56160a2SElena Agostini 764f56160a2SElena Agostini if (devflag == NULL) { 765f56160a2SElena Agostini rte_errno = EINVAL; 766f56160a2SElena Agostini return -rte_errno; 767f56160a2SElena Agostini } 768f56160a2SElena Agostini 769f56160a2SElena Agostini ret = rte_gpu_mem_unregister(devflag->dev_id, devflag->ptr); 770f56160a2SElena Agostini if (ret < 0) { 771f56160a2SElena Agostini rte_errno = EINVAL; 772f56160a2SElena Agostini return -1; 773f56160a2SElena Agostini } 774f56160a2SElena Agostini 775f56160a2SElena Agostini rte_free(devflag->ptr); 776f56160a2SElena Agostini 777f56160a2SElena Agostini return 0; 778f56160a2SElena Agostini } 779f56160a2SElena Agostini 780f56160a2SElena Agostini int 781f56160a2SElena Agostini rte_gpu_comm_set_flag(struct rte_gpu_comm_flag *devflag, uint32_t val) 782f56160a2SElena Agostini { 783f56160a2SElena Agostini if (devflag == NULL) { 784f56160a2SElena Agostini rte_errno = EINVAL; 785f56160a2SElena Agostini return -rte_errno; 786f56160a2SElena Agostini } 787f56160a2SElena Agostini 788f56160a2SElena Agostini if (devflag->mtype != RTE_GPU_COMM_FLAG_CPU) { 789f56160a2SElena Agostini rte_errno = EINVAL; 790f56160a2SElena Agostini return -rte_errno; 791f56160a2SElena Agostini } 792f56160a2SElena Agostini 793f56160a2SElena Agostini RTE_GPU_VOLATILE(*devflag->ptr) = val; 794f56160a2SElena Agostini 795f56160a2SElena Agostini return 0; 796f56160a2SElena Agostini } 797f56160a2SElena Agostini 798f56160a2SElena Agostini int 799f56160a2SElena Agostini rte_gpu_comm_get_flag_value(struct rte_gpu_comm_flag *devflag, uint32_t *val) 800f56160a2SElena Agostini { 801f56160a2SElena Agostini if (devflag == NULL) { 802f56160a2SElena Agostini rte_errno = EINVAL; 803f56160a2SElena Agostini return -rte_errno; 804f56160a2SElena Agostini } 805f56160a2SElena Agostini if (devflag->mtype != RTE_GPU_COMM_FLAG_CPU) { 806f56160a2SElena Agostini rte_errno = EINVAL; 807f56160a2SElena Agostini return -rte_errno; 808f56160a2SElena Agostini } 809f56160a2SElena Agostini 810f56160a2SElena Agostini *val = RTE_GPU_VOLATILE(*devflag->ptr); 811f56160a2SElena Agostini 812f56160a2SElena Agostini return 0; 813f56160a2SElena Agostini } 814c7ebd65cSElena Agostini 815c7ebd65cSElena Agostini struct rte_gpu_comm_list * 816c7ebd65cSElena Agostini rte_gpu_comm_create_list(uint16_t dev_id, 817c7ebd65cSElena Agostini uint32_t num_comm_items) 818c7ebd65cSElena Agostini { 819c7ebd65cSElena Agostini struct rte_gpu_comm_list *comm_list; 820c7ebd65cSElena Agostini uint32_t idx_l; 821c7ebd65cSElena Agostini int ret; 822c7ebd65cSElena Agostini struct rte_gpu *dev; 823c7ebd65cSElena Agostini 824c7ebd65cSElena Agostini if (num_comm_items == 0) { 825c7ebd65cSElena Agostini rte_errno = EINVAL; 826c7ebd65cSElena Agostini return NULL; 827c7ebd65cSElena Agostini } 828c7ebd65cSElena Agostini 829c7ebd65cSElena Agostini dev = gpu_get_by_id(dev_id); 830c7ebd65cSElena Agostini if (dev == NULL) { 831c7ebd65cSElena Agostini GPU_LOG(ERR, "memory barrier for invalid device ID %d", dev_id); 832c7ebd65cSElena Agostini rte_errno = ENODEV; 833c7ebd65cSElena Agostini return NULL; 834c7ebd65cSElena Agostini } 835c7ebd65cSElena Agostini 836c7ebd65cSElena Agostini comm_list = rte_zmalloc(NULL, 837c7ebd65cSElena Agostini sizeof(struct rte_gpu_comm_list) * num_comm_items, 0); 838c7ebd65cSElena Agostini if (comm_list == NULL) { 839c7ebd65cSElena Agostini rte_errno = ENOMEM; 840c7ebd65cSElena Agostini return NULL; 841c7ebd65cSElena Agostini } 842c7ebd65cSElena Agostini 843c7ebd65cSElena Agostini ret = rte_gpu_mem_register(dev_id, 844c7ebd65cSElena Agostini sizeof(struct rte_gpu_comm_list) * num_comm_items, comm_list); 845c7ebd65cSElena Agostini if (ret < 0) { 846c7ebd65cSElena Agostini rte_errno = ENOMEM; 847c7ebd65cSElena Agostini return NULL; 848c7ebd65cSElena Agostini } 849c7ebd65cSElena Agostini 850c7ebd65cSElena Agostini for (idx_l = 0; idx_l < num_comm_items; idx_l++) { 851c7ebd65cSElena Agostini comm_list[idx_l].pkt_list = rte_zmalloc(NULL, 852c7ebd65cSElena Agostini sizeof(struct rte_gpu_comm_pkt) * RTE_GPU_COMM_LIST_PKTS_MAX, 0); 853c7ebd65cSElena Agostini if (comm_list[idx_l].pkt_list == NULL) { 854c7ebd65cSElena Agostini rte_errno = ENOMEM; 855c7ebd65cSElena Agostini return NULL; 856c7ebd65cSElena Agostini } 857c7ebd65cSElena Agostini 858c7ebd65cSElena Agostini ret = rte_gpu_mem_register(dev_id, 859c7ebd65cSElena Agostini sizeof(struct rte_gpu_comm_pkt) * RTE_GPU_COMM_LIST_PKTS_MAX, 860c7ebd65cSElena Agostini comm_list[idx_l].pkt_list); 861c7ebd65cSElena Agostini if (ret < 0) { 862c7ebd65cSElena Agostini rte_errno = ENOMEM; 863c7ebd65cSElena Agostini return NULL; 864c7ebd65cSElena Agostini } 865c7ebd65cSElena Agostini 866c7ebd65cSElena Agostini RTE_GPU_VOLATILE(comm_list[idx_l].status) = RTE_GPU_COMM_LIST_FREE; 867c7ebd65cSElena Agostini comm_list[idx_l].num_pkts = 0; 868c7ebd65cSElena Agostini comm_list[idx_l].dev_id = dev_id; 869c7ebd65cSElena Agostini 870c7ebd65cSElena Agostini comm_list[idx_l].mbufs = rte_zmalloc(NULL, 871c7ebd65cSElena Agostini sizeof(struct rte_mbuf *) * RTE_GPU_COMM_LIST_PKTS_MAX, 0); 872c7ebd65cSElena Agostini if (comm_list[idx_l].mbufs == NULL) { 873c7ebd65cSElena Agostini rte_errno = ENOMEM; 874c7ebd65cSElena Agostini return NULL; 875c7ebd65cSElena Agostini } 876c7ebd65cSElena Agostini } 877c7ebd65cSElena Agostini 878c7ebd65cSElena Agostini return comm_list; 879c7ebd65cSElena Agostini } 880c7ebd65cSElena Agostini 881c7ebd65cSElena Agostini int 882c7ebd65cSElena Agostini rte_gpu_comm_destroy_list(struct rte_gpu_comm_list *comm_list, 883c7ebd65cSElena Agostini uint32_t num_comm_items) 884c7ebd65cSElena Agostini { 885c7ebd65cSElena Agostini uint32_t idx_l; 886c7ebd65cSElena Agostini int ret; 887c7ebd65cSElena Agostini uint16_t dev_id; 888c7ebd65cSElena Agostini 889c7ebd65cSElena Agostini if (comm_list == NULL) { 890c7ebd65cSElena Agostini rte_errno = EINVAL; 891c7ebd65cSElena Agostini return -rte_errno; 892c7ebd65cSElena Agostini } 893c7ebd65cSElena Agostini 894c7ebd65cSElena Agostini dev_id = comm_list[0].dev_id; 895c7ebd65cSElena Agostini 896c7ebd65cSElena Agostini for (idx_l = 0; idx_l < num_comm_items; idx_l++) { 897c7ebd65cSElena Agostini ret = rte_gpu_mem_unregister(dev_id, comm_list[idx_l].pkt_list); 898c7ebd65cSElena Agostini if (ret < 0) { 899c7ebd65cSElena Agostini rte_errno = EINVAL; 900c7ebd65cSElena Agostini return -1; 901c7ebd65cSElena Agostini } 902c7ebd65cSElena Agostini 903c7ebd65cSElena Agostini rte_free(comm_list[idx_l].pkt_list); 904c7ebd65cSElena Agostini rte_free(comm_list[idx_l].mbufs); 905c7ebd65cSElena Agostini } 906c7ebd65cSElena Agostini 907c7ebd65cSElena Agostini ret = rte_gpu_mem_unregister(dev_id, comm_list); 908c7ebd65cSElena Agostini if (ret < 0) { 909c7ebd65cSElena Agostini rte_errno = EINVAL; 910c7ebd65cSElena Agostini return -1; 911c7ebd65cSElena Agostini } 912c7ebd65cSElena Agostini 913c7ebd65cSElena Agostini rte_free(comm_list); 914c7ebd65cSElena Agostini 915c7ebd65cSElena Agostini return 0; 916c7ebd65cSElena Agostini } 917c7ebd65cSElena Agostini 918c7ebd65cSElena Agostini int 919c7ebd65cSElena Agostini rte_gpu_comm_populate_list_pkts(struct rte_gpu_comm_list *comm_list_item, 920c7ebd65cSElena Agostini struct rte_mbuf **mbufs, uint32_t num_mbufs) 921c7ebd65cSElena Agostini { 922c7ebd65cSElena Agostini uint32_t idx; 923c7ebd65cSElena Agostini 924c7ebd65cSElena Agostini if (comm_list_item == NULL || comm_list_item->pkt_list == NULL || 925c7ebd65cSElena Agostini mbufs == NULL || num_mbufs > RTE_GPU_COMM_LIST_PKTS_MAX) { 926c7ebd65cSElena Agostini rte_errno = EINVAL; 927c7ebd65cSElena Agostini return -rte_errno; 928c7ebd65cSElena Agostini } 929c7ebd65cSElena Agostini 930c7ebd65cSElena Agostini for (idx = 0; idx < num_mbufs; idx++) { 931c7ebd65cSElena Agostini /* support only unchained mbufs */ 932c7ebd65cSElena Agostini if (unlikely((mbufs[idx]->nb_segs > 1) || 933c7ebd65cSElena Agostini (mbufs[idx]->next != NULL) || 934c7ebd65cSElena Agostini (mbufs[idx]->data_len != mbufs[idx]->pkt_len))) { 935c7ebd65cSElena Agostini rte_errno = ENOTSUP; 936c7ebd65cSElena Agostini return -rte_errno; 937c7ebd65cSElena Agostini } 938c7ebd65cSElena Agostini comm_list_item->pkt_list[idx].addr = 939c7ebd65cSElena Agostini rte_pktmbuf_mtod_offset(mbufs[idx], uintptr_t, 0); 940c7ebd65cSElena Agostini comm_list_item->pkt_list[idx].size = mbufs[idx]->pkt_len; 941c7ebd65cSElena Agostini comm_list_item->mbufs[idx] = mbufs[idx]; 942c7ebd65cSElena Agostini } 943c7ebd65cSElena Agostini 944c7ebd65cSElena Agostini RTE_GPU_VOLATILE(comm_list_item->num_pkts) = num_mbufs; 945c7ebd65cSElena Agostini rte_gpu_wmb(comm_list_item->dev_id); 946c7ebd65cSElena Agostini RTE_GPU_VOLATILE(comm_list_item->status) = RTE_GPU_COMM_LIST_READY; 947c7ebd65cSElena Agostini 948c7ebd65cSElena Agostini return 0; 949c7ebd65cSElena Agostini } 950c7ebd65cSElena Agostini 951c7ebd65cSElena Agostini int 952c7ebd65cSElena Agostini rte_gpu_comm_cleanup_list(struct rte_gpu_comm_list *comm_list_item) 953c7ebd65cSElena Agostini { 954c7ebd65cSElena Agostini uint32_t idx = 0; 955c7ebd65cSElena Agostini 956c7ebd65cSElena Agostini if (comm_list_item == NULL) { 957c7ebd65cSElena Agostini rte_errno = EINVAL; 958c7ebd65cSElena Agostini return -rte_errno; 959c7ebd65cSElena Agostini } 960c7ebd65cSElena Agostini 961c7ebd65cSElena Agostini if (RTE_GPU_VOLATILE(comm_list_item->status) == 962c7ebd65cSElena Agostini RTE_GPU_COMM_LIST_READY) { 963c7ebd65cSElena Agostini GPU_LOG(ERR, "packet list is still in progress"); 964c7ebd65cSElena Agostini rte_errno = EINVAL; 965c7ebd65cSElena Agostini return -rte_errno; 966c7ebd65cSElena Agostini } 967c7ebd65cSElena Agostini 968c7ebd65cSElena Agostini for (idx = 0; idx < RTE_GPU_COMM_LIST_PKTS_MAX; idx++) { 969c7ebd65cSElena Agostini if (comm_list_item->pkt_list[idx].addr == 0) 970c7ebd65cSElena Agostini break; 971c7ebd65cSElena Agostini 972c7ebd65cSElena Agostini comm_list_item->pkt_list[idx].addr = 0; 973c7ebd65cSElena Agostini comm_list_item->pkt_list[idx].size = 0; 974c7ebd65cSElena Agostini comm_list_item->mbufs[idx] = NULL; 975c7ebd65cSElena Agostini } 976c7ebd65cSElena Agostini 977c7ebd65cSElena Agostini RTE_GPU_VOLATILE(comm_list_item->status) = RTE_GPU_COMM_LIST_FREE; 978c7ebd65cSElena Agostini RTE_GPU_VOLATILE(comm_list_item->num_pkts) = 0; 979c7ebd65cSElena Agostini rte_mb(); 980c7ebd65cSElena Agostini 981c7ebd65cSElena Agostini return 0; 982c7ebd65cSElena Agostini } 983