18b8036a6SElena Agostini /* SPDX-License-Identifier: BSD-3-Clause 28b8036a6SElena Agostini * Copyright (c) 2021 NVIDIA Corporation & Affiliates 38b8036a6SElena Agostini */ 48b8036a6SElena Agostini 58b8036a6SElena Agostini #include <rte_eal.h> 618cb0756SThomas Monjalon #include <rte_tailq.h> 718cb0756SThomas Monjalon #include <rte_rwlock.h> 88b8036a6SElena Agostini #include <rte_string_fns.h> 9a9af048aSThomas Monjalon #include <rte_memzone.h> 10e818c4e2SElena Agostini #include <rte_malloc.h> 118b8036a6SElena Agostini #include <rte_errno.h> 128b8036a6SElena Agostini #include <rte_log.h> 138b8036a6SElena Agostini 148b8036a6SElena Agostini #include "rte_gpudev.h" 158b8036a6SElena Agostini #include "gpudev_driver.h" 168b8036a6SElena Agostini 178b8036a6SElena Agostini /* Logging */ 188b8036a6SElena Agostini RTE_LOG_REGISTER_DEFAULT(gpu_logtype, NOTICE); 198b8036a6SElena Agostini #define GPU_LOG(level, ...) \ 208b8036a6SElena Agostini rte_log(RTE_LOG_ ## level, gpu_logtype, RTE_FMT("gpu: " \ 218b8036a6SElena Agostini RTE_FMT_HEAD(__VA_ARGS__, ) "\n", RTE_FMT_TAIL(__VA_ARGS__, ))) 228b8036a6SElena Agostini 238b8036a6SElena Agostini /* Set any driver error as EPERM */ 248b8036a6SElena Agostini #define GPU_DRV_RET(function) \ 258b8036a6SElena Agostini ((function != 0) ? -(rte_errno = EPERM) : (rte_errno = 0)) 268b8036a6SElena Agostini 278b8036a6SElena Agostini /* Array of devices */ 288b8036a6SElena Agostini static struct rte_gpu *gpus; 298b8036a6SElena Agostini /* Number of currently valid devices */ 308b8036a6SElena Agostini static int16_t gpu_max; 318b8036a6SElena Agostini /* Number of currently valid devices */ 328b8036a6SElena Agostini static int16_t gpu_count; 338b8036a6SElena Agostini 34a9af048aSThomas Monjalon /* Shared memory between processes. */ 35a9af048aSThomas Monjalon static const char *GPU_MEMZONE = "rte_gpu_shared"; 36a9af048aSThomas Monjalon static struct { 37a9af048aSThomas Monjalon __extension__ struct rte_gpu_mpshared gpus[0]; 38a9af048aSThomas Monjalon } *gpu_shared_mem; 39a9af048aSThomas Monjalon 4018cb0756SThomas Monjalon /* Event callback object */ 4118cb0756SThomas Monjalon struct rte_gpu_callback { 4218cb0756SThomas Monjalon TAILQ_ENTRY(rte_gpu_callback) next; 4318cb0756SThomas Monjalon rte_gpu_callback_t *function; 4418cb0756SThomas Monjalon void *user_data; 4518cb0756SThomas Monjalon enum rte_gpu_event event; 4618cb0756SThomas Monjalon }; 4718cb0756SThomas Monjalon static rte_rwlock_t gpu_callback_lock = RTE_RWLOCK_INITIALIZER; 4818cb0756SThomas Monjalon static void gpu_free_callbacks(struct rte_gpu *dev); 4918cb0756SThomas Monjalon 508b8036a6SElena Agostini int 518b8036a6SElena Agostini rte_gpu_init(size_t dev_max) 528b8036a6SElena Agostini { 538b8036a6SElena Agostini if (dev_max == 0 || dev_max > INT16_MAX) { 548b8036a6SElena Agostini GPU_LOG(ERR, "invalid array size"); 558b8036a6SElena Agostini rte_errno = EINVAL; 568b8036a6SElena Agostini return -rte_errno; 578b8036a6SElena Agostini } 588b8036a6SElena Agostini 598b8036a6SElena Agostini /* No lock, it must be called before or during first probing. */ 608b8036a6SElena Agostini if (gpus != NULL) { 618b8036a6SElena Agostini GPU_LOG(ERR, "already initialized"); 628b8036a6SElena Agostini rte_errno = EBUSY; 638b8036a6SElena Agostini return -rte_errno; 648b8036a6SElena Agostini } 658b8036a6SElena Agostini 668b8036a6SElena Agostini gpus = calloc(dev_max, sizeof(struct rte_gpu)); 678b8036a6SElena Agostini if (gpus == NULL) { 688b8036a6SElena Agostini GPU_LOG(ERR, "cannot initialize library"); 698b8036a6SElena Agostini rte_errno = ENOMEM; 708b8036a6SElena Agostini return -rte_errno; 718b8036a6SElena Agostini } 728b8036a6SElena Agostini 738b8036a6SElena Agostini gpu_max = dev_max; 748b8036a6SElena Agostini return 0; 758b8036a6SElena Agostini } 768b8036a6SElena Agostini 778b8036a6SElena Agostini uint16_t 788b8036a6SElena Agostini rte_gpu_count_avail(void) 798b8036a6SElena Agostini { 808b8036a6SElena Agostini return gpu_count; 818b8036a6SElena Agostini } 828b8036a6SElena Agostini 838b8036a6SElena Agostini bool 848b8036a6SElena Agostini rte_gpu_is_valid(int16_t dev_id) 858b8036a6SElena Agostini { 868b8036a6SElena Agostini if (dev_id >= 0 && dev_id < gpu_max && 87a9af048aSThomas Monjalon gpus[dev_id].process_state == RTE_GPU_STATE_INITIALIZED) 888b8036a6SElena Agostini return true; 898b8036a6SElena Agostini return false; 908b8036a6SElena Agostini } 918b8036a6SElena Agostini 9282e5f6b6SThomas Monjalon static bool 9382e5f6b6SThomas Monjalon gpu_match_parent(int16_t dev_id, int16_t parent) 9482e5f6b6SThomas Monjalon { 9582e5f6b6SThomas Monjalon if (parent == RTE_GPU_ID_ANY) 9682e5f6b6SThomas Monjalon return true; 97a9af048aSThomas Monjalon return gpus[dev_id].mpshared->info.parent == parent; 9882e5f6b6SThomas Monjalon } 9982e5f6b6SThomas Monjalon 1008b8036a6SElena Agostini int16_t 10182e5f6b6SThomas Monjalon rte_gpu_find_next(int16_t dev_id, int16_t parent) 1028b8036a6SElena Agostini { 1038b8036a6SElena Agostini if (dev_id < 0) 1048b8036a6SElena Agostini dev_id = 0; 1058b8036a6SElena Agostini while (dev_id < gpu_max && 106a9af048aSThomas Monjalon (gpus[dev_id].process_state == RTE_GPU_STATE_UNUSED || 10782e5f6b6SThomas Monjalon !gpu_match_parent(dev_id, parent))) 1088b8036a6SElena Agostini dev_id++; 1098b8036a6SElena Agostini 1108b8036a6SElena Agostini if (dev_id >= gpu_max) 1118b8036a6SElena Agostini return RTE_GPU_ID_NONE; 1128b8036a6SElena Agostini return dev_id; 1138b8036a6SElena Agostini } 1148b8036a6SElena Agostini 1158b8036a6SElena Agostini static int16_t 1168b8036a6SElena Agostini gpu_find_free_id(void) 1178b8036a6SElena Agostini { 1188b8036a6SElena Agostini int16_t dev_id; 1198b8036a6SElena Agostini 1208b8036a6SElena Agostini for (dev_id = 0; dev_id < gpu_max; dev_id++) { 121a9af048aSThomas Monjalon if (gpus[dev_id].process_state == RTE_GPU_STATE_UNUSED) 1228b8036a6SElena Agostini return dev_id; 1238b8036a6SElena Agostini } 1248b8036a6SElena Agostini return RTE_GPU_ID_NONE; 1258b8036a6SElena Agostini } 1268b8036a6SElena Agostini 1278b8036a6SElena Agostini static struct rte_gpu * 1288b8036a6SElena Agostini gpu_get_by_id(int16_t dev_id) 1298b8036a6SElena Agostini { 1308b8036a6SElena Agostini if (!rte_gpu_is_valid(dev_id)) 1318b8036a6SElena Agostini return NULL; 1328b8036a6SElena Agostini return &gpus[dev_id]; 1338b8036a6SElena Agostini } 1348b8036a6SElena Agostini 1358b8036a6SElena Agostini struct rte_gpu * 1368b8036a6SElena Agostini rte_gpu_get_by_name(const char *name) 1378b8036a6SElena Agostini { 1388b8036a6SElena Agostini int16_t dev_id; 1398b8036a6SElena Agostini struct rte_gpu *dev; 1408b8036a6SElena Agostini 1418b8036a6SElena Agostini if (name == NULL) { 1428b8036a6SElena Agostini rte_errno = EINVAL; 1438b8036a6SElena Agostini return NULL; 1448b8036a6SElena Agostini } 1458b8036a6SElena Agostini 1468b8036a6SElena Agostini RTE_GPU_FOREACH(dev_id) { 1478b8036a6SElena Agostini dev = &gpus[dev_id]; 148a9af048aSThomas Monjalon if (strncmp(name, dev->mpshared->name, RTE_DEV_NAME_MAX_LEN) == 0) 1498b8036a6SElena Agostini return dev; 1508b8036a6SElena Agostini } 1518b8036a6SElena Agostini return NULL; 1528b8036a6SElena Agostini } 1538b8036a6SElena Agostini 154a9af048aSThomas Monjalon static int 155a9af048aSThomas Monjalon gpu_shared_mem_init(void) 156a9af048aSThomas Monjalon { 157a9af048aSThomas Monjalon const struct rte_memzone *memzone; 158a9af048aSThomas Monjalon 159a9af048aSThomas Monjalon if (rte_eal_process_type() == RTE_PROC_PRIMARY) { 160a9af048aSThomas Monjalon memzone = rte_memzone_reserve(GPU_MEMZONE, 161a9af048aSThomas Monjalon sizeof(*gpu_shared_mem) + 162a9af048aSThomas Monjalon sizeof(*gpu_shared_mem->gpus) * gpu_max, 163a9af048aSThomas Monjalon SOCKET_ID_ANY, 0); 164a9af048aSThomas Monjalon } else { 165a9af048aSThomas Monjalon memzone = rte_memzone_lookup(GPU_MEMZONE); 166a9af048aSThomas Monjalon } 167a9af048aSThomas Monjalon if (memzone == NULL) { 168a9af048aSThomas Monjalon GPU_LOG(ERR, "cannot initialize shared memory"); 169a9af048aSThomas Monjalon rte_errno = ENOMEM; 170a9af048aSThomas Monjalon return -rte_errno; 171a9af048aSThomas Monjalon } 172a9af048aSThomas Monjalon 173a9af048aSThomas Monjalon gpu_shared_mem = memzone->addr; 174a9af048aSThomas Monjalon return 0; 175a9af048aSThomas Monjalon } 176a9af048aSThomas Monjalon 1778b8036a6SElena Agostini struct rte_gpu * 1788b8036a6SElena Agostini rte_gpu_allocate(const char *name) 1798b8036a6SElena Agostini { 1808b8036a6SElena Agostini int16_t dev_id; 1818b8036a6SElena Agostini struct rte_gpu *dev; 1828b8036a6SElena Agostini 1838b8036a6SElena Agostini if (rte_eal_process_type() != RTE_PROC_PRIMARY) { 1848b8036a6SElena Agostini GPU_LOG(ERR, "only primary process can allocate device"); 1858b8036a6SElena Agostini rte_errno = EPERM; 1868b8036a6SElena Agostini return NULL; 1878b8036a6SElena Agostini } 1888b8036a6SElena Agostini if (name == NULL) { 1898b8036a6SElena Agostini GPU_LOG(ERR, "allocate device without a name"); 1908b8036a6SElena Agostini rte_errno = EINVAL; 1918b8036a6SElena Agostini return NULL; 1928b8036a6SElena Agostini } 1938b8036a6SElena Agostini 1948b8036a6SElena Agostini /* implicit initialization of library before adding first device */ 1958b8036a6SElena Agostini if (gpus == NULL && rte_gpu_init(RTE_GPU_DEFAULT_MAX) < 0) 1968b8036a6SElena Agostini return NULL; 1978b8036a6SElena Agostini 198a9af048aSThomas Monjalon /* initialize shared memory before adding first device */ 199a9af048aSThomas Monjalon if (gpu_shared_mem == NULL && gpu_shared_mem_init() < 0) 200a9af048aSThomas Monjalon return NULL; 201a9af048aSThomas Monjalon 2028b8036a6SElena Agostini if (rte_gpu_get_by_name(name) != NULL) { 2038b8036a6SElena Agostini GPU_LOG(ERR, "device with name %s already exists", name); 2048b8036a6SElena Agostini rte_errno = EEXIST; 2058b8036a6SElena Agostini return NULL; 2068b8036a6SElena Agostini } 2078b8036a6SElena Agostini dev_id = gpu_find_free_id(); 2088b8036a6SElena Agostini if (dev_id == RTE_GPU_ID_NONE) { 2098b8036a6SElena Agostini GPU_LOG(ERR, "reached maximum number of devices"); 2108b8036a6SElena Agostini rte_errno = ENOENT; 2118b8036a6SElena Agostini return NULL; 2128b8036a6SElena Agostini } 2138b8036a6SElena Agostini 2148b8036a6SElena Agostini dev = &gpus[dev_id]; 2158b8036a6SElena Agostini memset(dev, 0, sizeof(*dev)); 2168b8036a6SElena Agostini 217a9af048aSThomas Monjalon dev->mpshared = &gpu_shared_mem->gpus[dev_id]; 218a9af048aSThomas Monjalon memset(dev->mpshared, 0, sizeof(*dev->mpshared)); 219a9af048aSThomas Monjalon 220a9af048aSThomas Monjalon if (rte_strscpy(dev->mpshared->name, name, RTE_DEV_NAME_MAX_LEN) < 0) { 2218b8036a6SElena Agostini GPU_LOG(ERR, "device name too long: %s", name); 2228b8036a6SElena Agostini rte_errno = ENAMETOOLONG; 2238b8036a6SElena Agostini return NULL; 2248b8036a6SElena Agostini } 225a9af048aSThomas Monjalon dev->mpshared->info.name = dev->mpshared->name; 226a9af048aSThomas Monjalon dev->mpshared->info.dev_id = dev_id; 227a9af048aSThomas Monjalon dev->mpshared->info.numa_node = -1; 228a9af048aSThomas Monjalon dev->mpshared->info.parent = RTE_GPU_ID_NONE; 22918cb0756SThomas Monjalon TAILQ_INIT(&dev->callbacks); 230a9af048aSThomas Monjalon __atomic_fetch_add(&dev->mpshared->process_refcnt, 1, __ATOMIC_RELAXED); 2318b8036a6SElena Agostini 2328b8036a6SElena Agostini gpu_count++; 2338b8036a6SElena Agostini GPU_LOG(DEBUG, "new device %s (id %d) of total %d", 2348b8036a6SElena Agostini name, dev_id, gpu_count); 2358b8036a6SElena Agostini return dev; 2368b8036a6SElena Agostini } 2378b8036a6SElena Agostini 238a9af048aSThomas Monjalon struct rte_gpu * 239a9af048aSThomas Monjalon rte_gpu_attach(const char *name) 240a9af048aSThomas Monjalon { 241a9af048aSThomas Monjalon int16_t dev_id; 242a9af048aSThomas Monjalon struct rte_gpu *dev; 243a9af048aSThomas Monjalon struct rte_gpu_mpshared *shared_dev; 244a9af048aSThomas Monjalon 245a9af048aSThomas Monjalon if (rte_eal_process_type() != RTE_PROC_SECONDARY) { 246a9af048aSThomas Monjalon GPU_LOG(ERR, "only secondary process can attach device"); 247a9af048aSThomas Monjalon rte_errno = EPERM; 248a9af048aSThomas Monjalon return NULL; 249a9af048aSThomas Monjalon } 250a9af048aSThomas Monjalon if (name == NULL) { 251a9af048aSThomas Monjalon GPU_LOG(ERR, "attach device without a name"); 252a9af048aSThomas Monjalon rte_errno = EINVAL; 253a9af048aSThomas Monjalon return NULL; 254a9af048aSThomas Monjalon } 255a9af048aSThomas Monjalon 256a9af048aSThomas Monjalon /* implicit initialization of library before adding first device */ 257a9af048aSThomas Monjalon if (gpus == NULL && rte_gpu_init(RTE_GPU_DEFAULT_MAX) < 0) 258a9af048aSThomas Monjalon return NULL; 259a9af048aSThomas Monjalon 260a9af048aSThomas Monjalon /* initialize shared memory before adding first device */ 261a9af048aSThomas Monjalon if (gpu_shared_mem == NULL && gpu_shared_mem_init() < 0) 262a9af048aSThomas Monjalon return NULL; 263a9af048aSThomas Monjalon 264a9af048aSThomas Monjalon for (dev_id = 0; dev_id < gpu_max; dev_id++) { 265a9af048aSThomas Monjalon shared_dev = &gpu_shared_mem->gpus[dev_id]; 266a9af048aSThomas Monjalon if (strncmp(name, shared_dev->name, RTE_DEV_NAME_MAX_LEN) == 0) 267a9af048aSThomas Monjalon break; 268a9af048aSThomas Monjalon } 269a9af048aSThomas Monjalon if (dev_id >= gpu_max) { 270a9af048aSThomas Monjalon GPU_LOG(ERR, "device with name %s not found", name); 271a9af048aSThomas Monjalon rte_errno = ENOENT; 272a9af048aSThomas Monjalon return NULL; 273a9af048aSThomas Monjalon } 274a9af048aSThomas Monjalon dev = &gpus[dev_id]; 275a9af048aSThomas Monjalon memset(dev, 0, sizeof(*dev)); 276a9af048aSThomas Monjalon 277a9af048aSThomas Monjalon TAILQ_INIT(&dev->callbacks); 278a9af048aSThomas Monjalon dev->mpshared = shared_dev; 279a9af048aSThomas Monjalon __atomic_fetch_add(&dev->mpshared->process_refcnt, 1, __ATOMIC_RELAXED); 280a9af048aSThomas Monjalon 281a9af048aSThomas Monjalon gpu_count++; 282a9af048aSThomas Monjalon GPU_LOG(DEBUG, "attached device %s (id %d) of total %d", 283a9af048aSThomas Monjalon name, dev_id, gpu_count); 284a9af048aSThomas Monjalon return dev; 285a9af048aSThomas Monjalon } 286a9af048aSThomas Monjalon 28782e5f6b6SThomas Monjalon int16_t 28882e5f6b6SThomas Monjalon rte_gpu_add_child(const char *name, int16_t parent, uint64_t child_context) 28982e5f6b6SThomas Monjalon { 29082e5f6b6SThomas Monjalon struct rte_gpu *dev; 29182e5f6b6SThomas Monjalon 29282e5f6b6SThomas Monjalon if (!rte_gpu_is_valid(parent)) { 29382e5f6b6SThomas Monjalon GPU_LOG(ERR, "add child to invalid parent ID %d", parent); 29482e5f6b6SThomas Monjalon rte_errno = ENODEV; 29582e5f6b6SThomas Monjalon return -rte_errno; 29682e5f6b6SThomas Monjalon } 29782e5f6b6SThomas Monjalon 29882e5f6b6SThomas Monjalon dev = rte_gpu_allocate(name); 29982e5f6b6SThomas Monjalon if (dev == NULL) 30082e5f6b6SThomas Monjalon return -rte_errno; 30182e5f6b6SThomas Monjalon 302a9af048aSThomas Monjalon dev->mpshared->info.parent = parent; 303a9af048aSThomas Monjalon dev->mpshared->info.context = child_context; 30482e5f6b6SThomas Monjalon 30582e5f6b6SThomas Monjalon rte_gpu_complete_new(dev); 306a9af048aSThomas Monjalon return dev->mpshared->info.dev_id; 30782e5f6b6SThomas Monjalon } 30882e5f6b6SThomas Monjalon 3098b8036a6SElena Agostini void 3108b8036a6SElena Agostini rte_gpu_complete_new(struct rte_gpu *dev) 3118b8036a6SElena Agostini { 3128b8036a6SElena Agostini if (dev == NULL) 3138b8036a6SElena Agostini return; 3148b8036a6SElena Agostini 315a9af048aSThomas Monjalon dev->process_state = RTE_GPU_STATE_INITIALIZED; 31618cb0756SThomas Monjalon rte_gpu_notify(dev, RTE_GPU_EVENT_NEW); 3178b8036a6SElena Agostini } 3188b8036a6SElena Agostini 3198b8036a6SElena Agostini int 3208b8036a6SElena Agostini rte_gpu_release(struct rte_gpu *dev) 3218b8036a6SElena Agostini { 32282e5f6b6SThomas Monjalon int16_t dev_id, child; 32382e5f6b6SThomas Monjalon 3248b8036a6SElena Agostini if (dev == NULL) { 3258b8036a6SElena Agostini rte_errno = ENODEV; 3268b8036a6SElena Agostini return -rte_errno; 3278b8036a6SElena Agostini } 328a9af048aSThomas Monjalon dev_id = dev->mpshared->info.dev_id; 32982e5f6b6SThomas Monjalon RTE_GPU_FOREACH_CHILD(child, dev_id) { 33082e5f6b6SThomas Monjalon GPU_LOG(ERR, "cannot release device %d with child %d", 33182e5f6b6SThomas Monjalon dev_id, child); 33282e5f6b6SThomas Monjalon rte_errno = EBUSY; 33382e5f6b6SThomas Monjalon return -rte_errno; 33482e5f6b6SThomas Monjalon } 3358b8036a6SElena Agostini 3368b8036a6SElena Agostini GPU_LOG(DEBUG, "free device %s (id %d)", 337a9af048aSThomas Monjalon dev->mpshared->info.name, dev->mpshared->info.dev_id); 33818cb0756SThomas Monjalon rte_gpu_notify(dev, RTE_GPU_EVENT_DEL); 33918cb0756SThomas Monjalon 34018cb0756SThomas Monjalon gpu_free_callbacks(dev); 341a9af048aSThomas Monjalon dev->process_state = RTE_GPU_STATE_UNUSED; 342a9af048aSThomas Monjalon __atomic_fetch_sub(&dev->mpshared->process_refcnt, 1, __ATOMIC_RELAXED); 3438b8036a6SElena Agostini gpu_count--; 3448b8036a6SElena Agostini 3458b8036a6SElena Agostini return 0; 3468b8036a6SElena Agostini } 3478b8036a6SElena Agostini 3488b8036a6SElena Agostini int 3498b8036a6SElena Agostini rte_gpu_close(int16_t dev_id) 3508b8036a6SElena Agostini { 3518b8036a6SElena Agostini int firsterr, binerr; 3528b8036a6SElena Agostini int *lasterr = &firsterr; 3538b8036a6SElena Agostini struct rte_gpu *dev; 3548b8036a6SElena Agostini 3558b8036a6SElena Agostini dev = gpu_get_by_id(dev_id); 3568b8036a6SElena Agostini if (dev == NULL) { 3578b8036a6SElena Agostini GPU_LOG(ERR, "close invalid device ID %d", dev_id); 3588b8036a6SElena Agostini rte_errno = ENODEV; 3598b8036a6SElena Agostini return -rte_errno; 3608b8036a6SElena Agostini } 3618b8036a6SElena Agostini 3628b8036a6SElena Agostini if (dev->ops.dev_close != NULL) { 3638b8036a6SElena Agostini *lasterr = GPU_DRV_RET(dev->ops.dev_close(dev)); 3648b8036a6SElena Agostini if (*lasterr != 0) 3658b8036a6SElena Agostini lasterr = &binerr; 3668b8036a6SElena Agostini } 3678b8036a6SElena Agostini 3688b8036a6SElena Agostini *lasterr = rte_gpu_release(dev); 3698b8036a6SElena Agostini 3708b8036a6SElena Agostini rte_errno = -firsterr; 3718b8036a6SElena Agostini return firsterr; 3728b8036a6SElena Agostini } 3738b8036a6SElena Agostini 3748b8036a6SElena Agostini int 37518cb0756SThomas Monjalon rte_gpu_callback_register(int16_t dev_id, enum rte_gpu_event event, 37618cb0756SThomas Monjalon rte_gpu_callback_t *function, void *user_data) 37718cb0756SThomas Monjalon { 37818cb0756SThomas Monjalon int16_t next_dev, last_dev; 37918cb0756SThomas Monjalon struct rte_gpu_callback_list *callbacks; 38018cb0756SThomas Monjalon struct rte_gpu_callback *callback; 38118cb0756SThomas Monjalon 38218cb0756SThomas Monjalon if (!rte_gpu_is_valid(dev_id) && dev_id != RTE_GPU_ID_ANY) { 38318cb0756SThomas Monjalon GPU_LOG(ERR, "register callback of invalid ID %d", dev_id); 38418cb0756SThomas Monjalon rte_errno = ENODEV; 38518cb0756SThomas Monjalon return -rte_errno; 38618cb0756SThomas Monjalon } 38718cb0756SThomas Monjalon if (function == NULL) { 38818cb0756SThomas Monjalon GPU_LOG(ERR, "cannot register callback without function"); 38918cb0756SThomas Monjalon rte_errno = EINVAL; 39018cb0756SThomas Monjalon return -rte_errno; 39118cb0756SThomas Monjalon } 39218cb0756SThomas Monjalon 39318cb0756SThomas Monjalon if (dev_id == RTE_GPU_ID_ANY) { 39418cb0756SThomas Monjalon next_dev = 0; 39518cb0756SThomas Monjalon last_dev = gpu_max - 1; 39618cb0756SThomas Monjalon } else { 39718cb0756SThomas Monjalon next_dev = last_dev = dev_id; 39818cb0756SThomas Monjalon } 39918cb0756SThomas Monjalon 40018cb0756SThomas Monjalon rte_rwlock_write_lock(&gpu_callback_lock); 40118cb0756SThomas Monjalon do { 40218cb0756SThomas Monjalon callbacks = &gpus[next_dev].callbacks; 40318cb0756SThomas Monjalon 40418cb0756SThomas Monjalon /* check if not already registered */ 40518cb0756SThomas Monjalon TAILQ_FOREACH(callback, callbacks, next) { 40618cb0756SThomas Monjalon if (callback->event == event && 40718cb0756SThomas Monjalon callback->function == function && 40818cb0756SThomas Monjalon callback->user_data == user_data) { 40918cb0756SThomas Monjalon GPU_LOG(INFO, "callback already registered"); 41018cb0756SThomas Monjalon return 0; 41118cb0756SThomas Monjalon } 41218cb0756SThomas Monjalon } 41318cb0756SThomas Monjalon 41418cb0756SThomas Monjalon callback = malloc(sizeof(*callback)); 41518cb0756SThomas Monjalon if (callback == NULL) { 41618cb0756SThomas Monjalon GPU_LOG(ERR, "cannot allocate callback"); 41718cb0756SThomas Monjalon return -ENOMEM; 41818cb0756SThomas Monjalon } 41918cb0756SThomas Monjalon callback->function = function; 42018cb0756SThomas Monjalon callback->user_data = user_data; 42118cb0756SThomas Monjalon callback->event = event; 42218cb0756SThomas Monjalon TAILQ_INSERT_TAIL(callbacks, callback, next); 42318cb0756SThomas Monjalon 42418cb0756SThomas Monjalon } while (++next_dev <= last_dev); 42518cb0756SThomas Monjalon rte_rwlock_write_unlock(&gpu_callback_lock); 42618cb0756SThomas Monjalon 42718cb0756SThomas Monjalon return 0; 42818cb0756SThomas Monjalon } 42918cb0756SThomas Monjalon 43018cb0756SThomas Monjalon int 43118cb0756SThomas Monjalon rte_gpu_callback_unregister(int16_t dev_id, enum rte_gpu_event event, 43218cb0756SThomas Monjalon rte_gpu_callback_t *function, void *user_data) 43318cb0756SThomas Monjalon { 43418cb0756SThomas Monjalon int16_t next_dev, last_dev; 43518cb0756SThomas Monjalon struct rte_gpu_callback_list *callbacks; 43618cb0756SThomas Monjalon struct rte_gpu_callback *callback, *nextcb; 43718cb0756SThomas Monjalon 43818cb0756SThomas Monjalon if (!rte_gpu_is_valid(dev_id) && dev_id != RTE_GPU_ID_ANY) { 43918cb0756SThomas Monjalon GPU_LOG(ERR, "unregister callback of invalid ID %d", dev_id); 44018cb0756SThomas Monjalon rte_errno = ENODEV; 44118cb0756SThomas Monjalon return -rte_errno; 44218cb0756SThomas Monjalon } 44318cb0756SThomas Monjalon if (function == NULL) { 44418cb0756SThomas Monjalon GPU_LOG(ERR, "cannot unregister callback without function"); 44518cb0756SThomas Monjalon rte_errno = EINVAL; 44618cb0756SThomas Monjalon return -rte_errno; 44718cb0756SThomas Monjalon } 44818cb0756SThomas Monjalon 44918cb0756SThomas Monjalon if (dev_id == RTE_GPU_ID_ANY) { 45018cb0756SThomas Monjalon next_dev = 0; 45118cb0756SThomas Monjalon last_dev = gpu_max - 1; 45218cb0756SThomas Monjalon } else { 45318cb0756SThomas Monjalon next_dev = last_dev = dev_id; 45418cb0756SThomas Monjalon } 45518cb0756SThomas Monjalon 45618cb0756SThomas Monjalon rte_rwlock_write_lock(&gpu_callback_lock); 45718cb0756SThomas Monjalon do { 45818cb0756SThomas Monjalon callbacks = &gpus[next_dev].callbacks; 45918cb0756SThomas Monjalon RTE_TAILQ_FOREACH_SAFE(callback, callbacks, next, nextcb) { 46018cb0756SThomas Monjalon if (callback->event != event || 46118cb0756SThomas Monjalon callback->function != function || 46218cb0756SThomas Monjalon (callback->user_data != user_data && 46318cb0756SThomas Monjalon user_data != (void *)-1)) 46418cb0756SThomas Monjalon continue; 46518cb0756SThomas Monjalon TAILQ_REMOVE(callbacks, callback, next); 46618cb0756SThomas Monjalon free(callback); 46718cb0756SThomas Monjalon } 46818cb0756SThomas Monjalon } while (++next_dev <= last_dev); 46918cb0756SThomas Monjalon rte_rwlock_write_unlock(&gpu_callback_lock); 47018cb0756SThomas Monjalon 47118cb0756SThomas Monjalon return 0; 47218cb0756SThomas Monjalon } 47318cb0756SThomas Monjalon 47418cb0756SThomas Monjalon static void 47518cb0756SThomas Monjalon gpu_free_callbacks(struct rte_gpu *dev) 47618cb0756SThomas Monjalon { 47718cb0756SThomas Monjalon struct rte_gpu_callback_list *callbacks; 47818cb0756SThomas Monjalon struct rte_gpu_callback *callback, *nextcb; 47918cb0756SThomas Monjalon 48018cb0756SThomas Monjalon callbacks = &dev->callbacks; 48118cb0756SThomas Monjalon rte_rwlock_write_lock(&gpu_callback_lock); 48218cb0756SThomas Monjalon RTE_TAILQ_FOREACH_SAFE(callback, callbacks, next, nextcb) { 48318cb0756SThomas Monjalon TAILQ_REMOVE(callbacks, callback, next); 48418cb0756SThomas Monjalon free(callback); 48518cb0756SThomas Monjalon } 48618cb0756SThomas Monjalon rte_rwlock_write_unlock(&gpu_callback_lock); 48718cb0756SThomas Monjalon } 48818cb0756SThomas Monjalon 48918cb0756SThomas Monjalon void 49018cb0756SThomas Monjalon rte_gpu_notify(struct rte_gpu *dev, enum rte_gpu_event event) 49118cb0756SThomas Monjalon { 49218cb0756SThomas Monjalon int16_t dev_id; 49318cb0756SThomas Monjalon struct rte_gpu_callback *callback; 49418cb0756SThomas Monjalon 495a9af048aSThomas Monjalon dev_id = dev->mpshared->info.dev_id; 49618cb0756SThomas Monjalon rte_rwlock_read_lock(&gpu_callback_lock); 49718cb0756SThomas Monjalon TAILQ_FOREACH(callback, &dev->callbacks, next) { 49818cb0756SThomas Monjalon if (callback->event != event || callback->function == NULL) 49918cb0756SThomas Monjalon continue; 50018cb0756SThomas Monjalon callback->function(dev_id, event, callback->user_data); 50118cb0756SThomas Monjalon } 50218cb0756SThomas Monjalon rte_rwlock_read_unlock(&gpu_callback_lock); 50318cb0756SThomas Monjalon } 50418cb0756SThomas Monjalon 50518cb0756SThomas Monjalon int 5068b8036a6SElena Agostini rte_gpu_info_get(int16_t dev_id, struct rte_gpu_info *info) 5078b8036a6SElena Agostini { 5088b8036a6SElena Agostini struct rte_gpu *dev; 5098b8036a6SElena Agostini 5108b8036a6SElena Agostini dev = gpu_get_by_id(dev_id); 5118b8036a6SElena Agostini if (dev == NULL) { 5128b8036a6SElena Agostini GPU_LOG(ERR, "query invalid device ID %d", dev_id); 5138b8036a6SElena Agostini rte_errno = ENODEV; 5148b8036a6SElena Agostini return -rte_errno; 5158b8036a6SElena Agostini } 5168b8036a6SElena Agostini if (info == NULL) { 5178b8036a6SElena Agostini GPU_LOG(ERR, "query without storage"); 5188b8036a6SElena Agostini rte_errno = EINVAL; 5198b8036a6SElena Agostini return -rte_errno; 5208b8036a6SElena Agostini } 5218b8036a6SElena Agostini 5228b8036a6SElena Agostini if (dev->ops.dev_info_get == NULL) { 523a9af048aSThomas Monjalon *info = dev->mpshared->info; 5248b8036a6SElena Agostini return 0; 5258b8036a6SElena Agostini } 5268b8036a6SElena Agostini return GPU_DRV_RET(dev->ops.dev_info_get(dev, info)); 5278b8036a6SElena Agostini } 528e818c4e2SElena Agostini 529e818c4e2SElena Agostini void * 530e818c4e2SElena Agostini rte_gpu_mem_alloc(int16_t dev_id, size_t size) 531e818c4e2SElena Agostini { 532e818c4e2SElena Agostini struct rte_gpu *dev; 533e818c4e2SElena Agostini void *ptr; 534e818c4e2SElena Agostini int ret; 535e818c4e2SElena Agostini 536e818c4e2SElena Agostini dev = gpu_get_by_id(dev_id); 537e818c4e2SElena Agostini if (dev == NULL) { 538e818c4e2SElena Agostini GPU_LOG(ERR, "alloc mem for invalid device ID %d", dev_id); 539e818c4e2SElena Agostini rte_errno = ENODEV; 540e818c4e2SElena Agostini return NULL; 541e818c4e2SElena Agostini } 542e818c4e2SElena Agostini 543e818c4e2SElena Agostini if (dev->ops.mem_alloc == NULL) { 544e818c4e2SElena Agostini GPU_LOG(ERR, "mem allocation not supported"); 545e818c4e2SElena Agostini rte_errno = ENOTSUP; 546e818c4e2SElena Agostini return NULL; 547e818c4e2SElena Agostini } 548e818c4e2SElena Agostini 549e818c4e2SElena Agostini if (size == 0) /* dry-run */ 550e818c4e2SElena Agostini return NULL; 551e818c4e2SElena Agostini 552e818c4e2SElena Agostini ret = dev->ops.mem_alloc(dev, size, &ptr); 553e818c4e2SElena Agostini 554e818c4e2SElena Agostini switch (ret) { 555e818c4e2SElena Agostini case 0: 556e818c4e2SElena Agostini return ptr; 557e818c4e2SElena Agostini case -ENOMEM: 558e818c4e2SElena Agostini case -E2BIG: 559e818c4e2SElena Agostini rte_errno = -ret; 560e818c4e2SElena Agostini return NULL; 561e818c4e2SElena Agostini default: 562e818c4e2SElena Agostini rte_errno = -EPERM; 563e818c4e2SElena Agostini return NULL; 564e818c4e2SElena Agostini } 565e818c4e2SElena Agostini } 566e818c4e2SElena Agostini 567e818c4e2SElena Agostini int 568e818c4e2SElena Agostini rte_gpu_mem_free(int16_t dev_id, void *ptr) 569e818c4e2SElena Agostini { 570e818c4e2SElena Agostini struct rte_gpu *dev; 571e818c4e2SElena Agostini 572e818c4e2SElena Agostini dev = gpu_get_by_id(dev_id); 573e818c4e2SElena Agostini if (dev == NULL) { 574e818c4e2SElena Agostini GPU_LOG(ERR, "free mem for invalid device ID %d", dev_id); 575e818c4e2SElena Agostini rte_errno = ENODEV; 576e818c4e2SElena Agostini return -rte_errno; 577e818c4e2SElena Agostini } 578e818c4e2SElena Agostini 579e818c4e2SElena Agostini if (dev->ops.mem_free == NULL) { 580e818c4e2SElena Agostini rte_errno = ENOTSUP; 581e818c4e2SElena Agostini return -rte_errno; 582e818c4e2SElena Agostini } 583e818c4e2SElena Agostini return GPU_DRV_RET(dev->ops.mem_free(dev, ptr)); 584e818c4e2SElena Agostini } 585e818c4e2SElena Agostini 586e818c4e2SElena Agostini int 587e818c4e2SElena Agostini rte_gpu_mem_register(int16_t dev_id, size_t size, void *ptr) 588e818c4e2SElena Agostini { 589e818c4e2SElena Agostini struct rte_gpu *dev; 590e818c4e2SElena Agostini 591e818c4e2SElena Agostini dev = gpu_get_by_id(dev_id); 592e818c4e2SElena Agostini if (dev == NULL) { 593e818c4e2SElena Agostini GPU_LOG(ERR, "alloc mem for invalid device ID %d", dev_id); 594e818c4e2SElena Agostini rte_errno = ENODEV; 595e818c4e2SElena Agostini return -rte_errno; 596e818c4e2SElena Agostini } 597e818c4e2SElena Agostini 598e818c4e2SElena Agostini if (dev->ops.mem_register == NULL) { 599e818c4e2SElena Agostini GPU_LOG(ERR, "mem registration not supported"); 600e818c4e2SElena Agostini rte_errno = ENOTSUP; 601e818c4e2SElena Agostini return -rte_errno; 602e818c4e2SElena Agostini } 603e818c4e2SElena Agostini 604e818c4e2SElena Agostini if (size == 0 || ptr == NULL) /* dry-run */ 605e818c4e2SElena Agostini return -EINVAL; 606e818c4e2SElena Agostini 607e818c4e2SElena Agostini return GPU_DRV_RET(dev->ops.mem_register(dev, size, ptr)); 608e818c4e2SElena Agostini } 609e818c4e2SElena Agostini 610e818c4e2SElena Agostini int 611e818c4e2SElena Agostini rte_gpu_mem_unregister(int16_t dev_id, void *ptr) 612e818c4e2SElena Agostini { 613e818c4e2SElena Agostini struct rte_gpu *dev; 614e818c4e2SElena Agostini 615e818c4e2SElena Agostini dev = gpu_get_by_id(dev_id); 616e818c4e2SElena Agostini if (dev == NULL) { 617e818c4e2SElena Agostini GPU_LOG(ERR, "unregister mem for invalid device ID %d", dev_id); 618e818c4e2SElena Agostini rte_errno = ENODEV; 619e818c4e2SElena Agostini return -rte_errno; 620e818c4e2SElena Agostini } 621e818c4e2SElena Agostini 622e818c4e2SElena Agostini if (dev->ops.mem_unregister == NULL) { 623e818c4e2SElena Agostini rte_errno = ENOTSUP; 624e818c4e2SElena Agostini return -rte_errno; 625e818c4e2SElena Agostini } 626e818c4e2SElena Agostini return GPU_DRV_RET(dev->ops.mem_unregister(dev, ptr)); 627e818c4e2SElena Agostini } 6282d61b429SElena Agostini 6292d61b429SElena Agostini int 6302d61b429SElena Agostini rte_gpu_wmb(int16_t dev_id) 6312d61b429SElena Agostini { 6322d61b429SElena Agostini struct rte_gpu *dev; 6332d61b429SElena Agostini 6342d61b429SElena Agostini dev = gpu_get_by_id(dev_id); 6352d61b429SElena Agostini if (dev == NULL) { 6362d61b429SElena Agostini GPU_LOG(ERR, "memory barrier for invalid device ID %d", dev_id); 6372d61b429SElena Agostini rte_errno = ENODEV; 6382d61b429SElena Agostini return -rte_errno; 6392d61b429SElena Agostini } 6402d61b429SElena Agostini 6412d61b429SElena Agostini if (dev->ops.wmb == NULL) { 6422d61b429SElena Agostini rte_errno = ENOTSUP; 6432d61b429SElena Agostini return -rte_errno; 6442d61b429SElena Agostini } 6452d61b429SElena Agostini return GPU_DRV_RET(dev->ops.wmb(dev)); 6462d61b429SElena Agostini } 647f56160a2SElena Agostini 648f56160a2SElena Agostini int 649f56160a2SElena Agostini rte_gpu_comm_create_flag(uint16_t dev_id, struct rte_gpu_comm_flag *devflag, 650f56160a2SElena Agostini enum rte_gpu_comm_flag_type mtype) 651f56160a2SElena Agostini { 652f56160a2SElena Agostini size_t flag_size; 653f56160a2SElena Agostini int ret; 654f56160a2SElena Agostini 655f56160a2SElena Agostini if (devflag == NULL) { 656f56160a2SElena Agostini rte_errno = EINVAL; 657f56160a2SElena Agostini return -rte_errno; 658f56160a2SElena Agostini } 659f56160a2SElena Agostini if (mtype != RTE_GPU_COMM_FLAG_CPU) { 660f56160a2SElena Agostini rte_errno = EINVAL; 661f56160a2SElena Agostini return -rte_errno; 662f56160a2SElena Agostini } 663f56160a2SElena Agostini 664f56160a2SElena Agostini flag_size = sizeof(uint32_t); 665f56160a2SElena Agostini 666f56160a2SElena Agostini devflag->ptr = rte_zmalloc(NULL, flag_size, 0); 667f56160a2SElena Agostini if (devflag->ptr == NULL) { 668f56160a2SElena Agostini rte_errno = ENOMEM; 669f56160a2SElena Agostini return -rte_errno; 670f56160a2SElena Agostini } 671f56160a2SElena Agostini 672f56160a2SElena Agostini ret = rte_gpu_mem_register(dev_id, flag_size, devflag->ptr); 673f56160a2SElena Agostini if (ret < 0) { 674f56160a2SElena Agostini rte_errno = ENOMEM; 675f56160a2SElena Agostini return -rte_errno; 676f56160a2SElena Agostini } 677f56160a2SElena Agostini 678f56160a2SElena Agostini devflag->mtype = mtype; 679f56160a2SElena Agostini devflag->dev_id = dev_id; 680f56160a2SElena Agostini 681f56160a2SElena Agostini return 0; 682f56160a2SElena Agostini } 683f56160a2SElena Agostini 684f56160a2SElena Agostini int 685f56160a2SElena Agostini rte_gpu_comm_destroy_flag(struct rte_gpu_comm_flag *devflag) 686f56160a2SElena Agostini { 687f56160a2SElena Agostini int ret; 688f56160a2SElena Agostini 689f56160a2SElena Agostini if (devflag == NULL) { 690f56160a2SElena Agostini rte_errno = EINVAL; 691f56160a2SElena Agostini return -rte_errno; 692f56160a2SElena Agostini } 693f56160a2SElena Agostini 694f56160a2SElena Agostini ret = rte_gpu_mem_unregister(devflag->dev_id, devflag->ptr); 695f56160a2SElena Agostini if (ret < 0) { 696f56160a2SElena Agostini rte_errno = EINVAL; 697f56160a2SElena Agostini return -1; 698f56160a2SElena Agostini } 699f56160a2SElena Agostini 700f56160a2SElena Agostini rte_free(devflag->ptr); 701f56160a2SElena Agostini 702f56160a2SElena Agostini return 0; 703f56160a2SElena Agostini } 704f56160a2SElena Agostini 705f56160a2SElena Agostini int 706f56160a2SElena Agostini rte_gpu_comm_set_flag(struct rte_gpu_comm_flag *devflag, uint32_t val) 707f56160a2SElena Agostini { 708f56160a2SElena Agostini if (devflag == NULL) { 709f56160a2SElena Agostini rte_errno = EINVAL; 710f56160a2SElena Agostini return -rte_errno; 711f56160a2SElena Agostini } 712f56160a2SElena Agostini 713f56160a2SElena Agostini if (devflag->mtype != RTE_GPU_COMM_FLAG_CPU) { 714f56160a2SElena Agostini rte_errno = EINVAL; 715f56160a2SElena Agostini return -rte_errno; 716f56160a2SElena Agostini } 717f56160a2SElena Agostini 718f56160a2SElena Agostini RTE_GPU_VOLATILE(*devflag->ptr) = val; 719f56160a2SElena Agostini 720f56160a2SElena Agostini return 0; 721f56160a2SElena Agostini } 722f56160a2SElena Agostini 723f56160a2SElena Agostini int 724f56160a2SElena Agostini rte_gpu_comm_get_flag_value(struct rte_gpu_comm_flag *devflag, uint32_t *val) 725f56160a2SElena Agostini { 726f56160a2SElena Agostini if (devflag == NULL) { 727f56160a2SElena Agostini rte_errno = EINVAL; 728f56160a2SElena Agostini return -rte_errno; 729f56160a2SElena Agostini } 730f56160a2SElena Agostini if (devflag->mtype != RTE_GPU_COMM_FLAG_CPU) { 731f56160a2SElena Agostini rte_errno = EINVAL; 732f56160a2SElena Agostini return -rte_errno; 733f56160a2SElena Agostini } 734f56160a2SElena Agostini 735f56160a2SElena Agostini *val = RTE_GPU_VOLATILE(*devflag->ptr); 736f56160a2SElena Agostini 737f56160a2SElena Agostini return 0; 738f56160a2SElena Agostini } 739*c7ebd65cSElena Agostini 740*c7ebd65cSElena Agostini struct rte_gpu_comm_list * 741*c7ebd65cSElena Agostini rte_gpu_comm_create_list(uint16_t dev_id, 742*c7ebd65cSElena Agostini uint32_t num_comm_items) 743*c7ebd65cSElena Agostini { 744*c7ebd65cSElena Agostini struct rte_gpu_comm_list *comm_list; 745*c7ebd65cSElena Agostini uint32_t idx_l; 746*c7ebd65cSElena Agostini int ret; 747*c7ebd65cSElena Agostini struct rte_gpu *dev; 748*c7ebd65cSElena Agostini 749*c7ebd65cSElena Agostini if (num_comm_items == 0) { 750*c7ebd65cSElena Agostini rte_errno = EINVAL; 751*c7ebd65cSElena Agostini return NULL; 752*c7ebd65cSElena Agostini } 753*c7ebd65cSElena Agostini 754*c7ebd65cSElena Agostini dev = gpu_get_by_id(dev_id); 755*c7ebd65cSElena Agostini if (dev == NULL) { 756*c7ebd65cSElena Agostini GPU_LOG(ERR, "memory barrier for invalid device ID %d", dev_id); 757*c7ebd65cSElena Agostini rte_errno = ENODEV; 758*c7ebd65cSElena Agostini return NULL; 759*c7ebd65cSElena Agostini } 760*c7ebd65cSElena Agostini 761*c7ebd65cSElena Agostini comm_list = rte_zmalloc(NULL, 762*c7ebd65cSElena Agostini sizeof(struct rte_gpu_comm_list) * num_comm_items, 0); 763*c7ebd65cSElena Agostini if (comm_list == NULL) { 764*c7ebd65cSElena Agostini rte_errno = ENOMEM; 765*c7ebd65cSElena Agostini return NULL; 766*c7ebd65cSElena Agostini } 767*c7ebd65cSElena Agostini 768*c7ebd65cSElena Agostini ret = rte_gpu_mem_register(dev_id, 769*c7ebd65cSElena Agostini sizeof(struct rte_gpu_comm_list) * num_comm_items, comm_list); 770*c7ebd65cSElena Agostini if (ret < 0) { 771*c7ebd65cSElena Agostini rte_errno = ENOMEM; 772*c7ebd65cSElena Agostini return NULL; 773*c7ebd65cSElena Agostini } 774*c7ebd65cSElena Agostini 775*c7ebd65cSElena Agostini for (idx_l = 0; idx_l < num_comm_items; idx_l++) { 776*c7ebd65cSElena Agostini comm_list[idx_l].pkt_list = rte_zmalloc(NULL, 777*c7ebd65cSElena Agostini sizeof(struct rte_gpu_comm_pkt) * RTE_GPU_COMM_LIST_PKTS_MAX, 0); 778*c7ebd65cSElena Agostini if (comm_list[idx_l].pkt_list == NULL) { 779*c7ebd65cSElena Agostini rte_errno = ENOMEM; 780*c7ebd65cSElena Agostini return NULL; 781*c7ebd65cSElena Agostini } 782*c7ebd65cSElena Agostini 783*c7ebd65cSElena Agostini ret = rte_gpu_mem_register(dev_id, 784*c7ebd65cSElena Agostini sizeof(struct rte_gpu_comm_pkt) * RTE_GPU_COMM_LIST_PKTS_MAX, 785*c7ebd65cSElena Agostini comm_list[idx_l].pkt_list); 786*c7ebd65cSElena Agostini if (ret < 0) { 787*c7ebd65cSElena Agostini rte_errno = ENOMEM; 788*c7ebd65cSElena Agostini return NULL; 789*c7ebd65cSElena Agostini } 790*c7ebd65cSElena Agostini 791*c7ebd65cSElena Agostini RTE_GPU_VOLATILE(comm_list[idx_l].status) = RTE_GPU_COMM_LIST_FREE; 792*c7ebd65cSElena Agostini comm_list[idx_l].num_pkts = 0; 793*c7ebd65cSElena Agostini comm_list[idx_l].dev_id = dev_id; 794*c7ebd65cSElena Agostini 795*c7ebd65cSElena Agostini comm_list[idx_l].mbufs = rte_zmalloc(NULL, 796*c7ebd65cSElena Agostini sizeof(struct rte_mbuf *) * RTE_GPU_COMM_LIST_PKTS_MAX, 0); 797*c7ebd65cSElena Agostini if (comm_list[idx_l].mbufs == NULL) { 798*c7ebd65cSElena Agostini rte_errno = ENOMEM; 799*c7ebd65cSElena Agostini return NULL; 800*c7ebd65cSElena Agostini } 801*c7ebd65cSElena Agostini } 802*c7ebd65cSElena Agostini 803*c7ebd65cSElena Agostini return comm_list; 804*c7ebd65cSElena Agostini } 805*c7ebd65cSElena Agostini 806*c7ebd65cSElena Agostini int 807*c7ebd65cSElena Agostini rte_gpu_comm_destroy_list(struct rte_gpu_comm_list *comm_list, 808*c7ebd65cSElena Agostini uint32_t num_comm_items) 809*c7ebd65cSElena Agostini { 810*c7ebd65cSElena Agostini uint32_t idx_l; 811*c7ebd65cSElena Agostini int ret; 812*c7ebd65cSElena Agostini uint16_t dev_id; 813*c7ebd65cSElena Agostini 814*c7ebd65cSElena Agostini if (comm_list == NULL) { 815*c7ebd65cSElena Agostini rte_errno = EINVAL; 816*c7ebd65cSElena Agostini return -rte_errno; 817*c7ebd65cSElena Agostini } 818*c7ebd65cSElena Agostini 819*c7ebd65cSElena Agostini dev_id = comm_list[0].dev_id; 820*c7ebd65cSElena Agostini 821*c7ebd65cSElena Agostini for (idx_l = 0; idx_l < num_comm_items; idx_l++) { 822*c7ebd65cSElena Agostini ret = rte_gpu_mem_unregister(dev_id, comm_list[idx_l].pkt_list); 823*c7ebd65cSElena Agostini if (ret < 0) { 824*c7ebd65cSElena Agostini rte_errno = EINVAL; 825*c7ebd65cSElena Agostini return -1; 826*c7ebd65cSElena Agostini } 827*c7ebd65cSElena Agostini 828*c7ebd65cSElena Agostini rte_free(comm_list[idx_l].pkt_list); 829*c7ebd65cSElena Agostini rte_free(comm_list[idx_l].mbufs); 830*c7ebd65cSElena Agostini } 831*c7ebd65cSElena Agostini 832*c7ebd65cSElena Agostini ret = rte_gpu_mem_unregister(dev_id, comm_list); 833*c7ebd65cSElena Agostini if (ret < 0) { 834*c7ebd65cSElena Agostini rte_errno = EINVAL; 835*c7ebd65cSElena Agostini return -1; 836*c7ebd65cSElena Agostini } 837*c7ebd65cSElena Agostini 838*c7ebd65cSElena Agostini rte_free(comm_list); 839*c7ebd65cSElena Agostini 840*c7ebd65cSElena Agostini return 0; 841*c7ebd65cSElena Agostini } 842*c7ebd65cSElena Agostini 843*c7ebd65cSElena Agostini int 844*c7ebd65cSElena Agostini rte_gpu_comm_populate_list_pkts(struct rte_gpu_comm_list *comm_list_item, 845*c7ebd65cSElena Agostini struct rte_mbuf **mbufs, uint32_t num_mbufs) 846*c7ebd65cSElena Agostini { 847*c7ebd65cSElena Agostini uint32_t idx; 848*c7ebd65cSElena Agostini 849*c7ebd65cSElena Agostini if (comm_list_item == NULL || comm_list_item->pkt_list == NULL || 850*c7ebd65cSElena Agostini mbufs == NULL || num_mbufs > RTE_GPU_COMM_LIST_PKTS_MAX) { 851*c7ebd65cSElena Agostini rte_errno = EINVAL; 852*c7ebd65cSElena Agostini return -rte_errno; 853*c7ebd65cSElena Agostini } 854*c7ebd65cSElena Agostini 855*c7ebd65cSElena Agostini for (idx = 0; idx < num_mbufs; idx++) { 856*c7ebd65cSElena Agostini /* support only unchained mbufs */ 857*c7ebd65cSElena Agostini if (unlikely((mbufs[idx]->nb_segs > 1) || 858*c7ebd65cSElena Agostini (mbufs[idx]->next != NULL) || 859*c7ebd65cSElena Agostini (mbufs[idx]->data_len != mbufs[idx]->pkt_len))) { 860*c7ebd65cSElena Agostini rte_errno = ENOTSUP; 861*c7ebd65cSElena Agostini return -rte_errno; 862*c7ebd65cSElena Agostini } 863*c7ebd65cSElena Agostini comm_list_item->pkt_list[idx].addr = 864*c7ebd65cSElena Agostini rte_pktmbuf_mtod_offset(mbufs[idx], uintptr_t, 0); 865*c7ebd65cSElena Agostini comm_list_item->pkt_list[idx].size = mbufs[idx]->pkt_len; 866*c7ebd65cSElena Agostini comm_list_item->mbufs[idx] = mbufs[idx]; 867*c7ebd65cSElena Agostini } 868*c7ebd65cSElena Agostini 869*c7ebd65cSElena Agostini RTE_GPU_VOLATILE(comm_list_item->num_pkts) = num_mbufs; 870*c7ebd65cSElena Agostini rte_gpu_wmb(comm_list_item->dev_id); 871*c7ebd65cSElena Agostini RTE_GPU_VOLATILE(comm_list_item->status) = RTE_GPU_COMM_LIST_READY; 872*c7ebd65cSElena Agostini rte_gpu_wmb(comm_list_item->dev_id); 873*c7ebd65cSElena Agostini 874*c7ebd65cSElena Agostini return 0; 875*c7ebd65cSElena Agostini } 876*c7ebd65cSElena Agostini 877*c7ebd65cSElena Agostini int 878*c7ebd65cSElena Agostini rte_gpu_comm_cleanup_list(struct rte_gpu_comm_list *comm_list_item) 879*c7ebd65cSElena Agostini { 880*c7ebd65cSElena Agostini uint32_t idx = 0; 881*c7ebd65cSElena Agostini 882*c7ebd65cSElena Agostini if (comm_list_item == NULL) { 883*c7ebd65cSElena Agostini rte_errno = EINVAL; 884*c7ebd65cSElena Agostini return -rte_errno; 885*c7ebd65cSElena Agostini } 886*c7ebd65cSElena Agostini 887*c7ebd65cSElena Agostini if (RTE_GPU_VOLATILE(comm_list_item->status) == 888*c7ebd65cSElena Agostini RTE_GPU_COMM_LIST_READY) { 889*c7ebd65cSElena Agostini GPU_LOG(ERR, "packet list is still in progress"); 890*c7ebd65cSElena Agostini rte_errno = EINVAL; 891*c7ebd65cSElena Agostini return -rte_errno; 892*c7ebd65cSElena Agostini } 893*c7ebd65cSElena Agostini 894*c7ebd65cSElena Agostini for (idx = 0; idx < RTE_GPU_COMM_LIST_PKTS_MAX; idx++) { 895*c7ebd65cSElena Agostini if (comm_list_item->pkt_list[idx].addr == 0) 896*c7ebd65cSElena Agostini break; 897*c7ebd65cSElena Agostini 898*c7ebd65cSElena Agostini comm_list_item->pkt_list[idx].addr = 0; 899*c7ebd65cSElena Agostini comm_list_item->pkt_list[idx].size = 0; 900*c7ebd65cSElena Agostini comm_list_item->mbufs[idx] = NULL; 901*c7ebd65cSElena Agostini } 902*c7ebd65cSElena Agostini 903*c7ebd65cSElena Agostini RTE_GPU_VOLATILE(comm_list_item->status) = RTE_GPU_COMM_LIST_FREE; 904*c7ebd65cSElena Agostini RTE_GPU_VOLATILE(comm_list_item->num_pkts) = 0; 905*c7ebd65cSElena Agostini rte_mb(); 906*c7ebd65cSElena Agostini 907*c7ebd65cSElena Agostini return 0; 908*c7ebd65cSElena Agostini } 909