xref: /dpdk/drivers/bus/pci/linux/pci.c (revision ea0e711b8ae02a7bc95de732f6e64781df74b2ca)
1 /* SPDX-License-Identifier: BSD-3-Clause
2  * Copyright(c) 2010-2014 Intel Corporation
3  */
4 
5 #include <string.h>
6 #include <dirent.h>
7 
8 #include <rte_log.h>
9 #include <rte_bus.h>
10 #include <rte_pci.h>
11 #include <rte_bus_pci.h>
12 #include <rte_malloc.h>
13 #include <rte_devargs.h>
14 #include <rte_memcpy.h>
15 #include <rte_vfio.h>
16 
17 #include "eal_filesystem.h"
18 
19 #include "private.h"
20 #include "pci_init.h"
21 
22 /**
23  * @file
24  * PCI probing under linux
25  *
26  * This code is used to simulate a PCI probe by parsing information in sysfs.
27  * When a registered device matches a driver, it is then initialized with
28  * IGB_UIO driver (or doesn't initialize, if the device wasn't bound to it).
29  */
30 
31 extern struct rte_pci_bus rte_pci_bus;
32 
33 static int
34 pci_get_kernel_driver_by_path(const char *filename, char *dri_name,
35 			      size_t len)
36 {
37 	int count;
38 	char path[PATH_MAX];
39 	char *name;
40 
41 	if (!filename || !dri_name)
42 		return -1;
43 
44 	count = readlink(filename, path, PATH_MAX);
45 	if (count >= PATH_MAX)
46 		return -1;
47 
48 	/* For device does not have a driver */
49 	if (count < 0)
50 		return 1;
51 
52 	path[count] = '\0';
53 
54 	name = strrchr(path, '/');
55 	if (name) {
56 		strlcpy(dri_name, name + 1, len);
57 		return 0;
58 	}
59 
60 	return -1;
61 }
62 
63 /* Map pci device */
64 int
65 rte_pci_map_device(struct rte_pci_device *dev)
66 {
67 	int ret = -1;
68 
69 	/* try mapping the NIC resources using VFIO if it exists */
70 	switch (dev->kdrv) {
71 	case RTE_PCI_KDRV_VFIO:
72 #ifdef VFIO_PRESENT
73 		if (pci_vfio_is_enabled())
74 			ret = pci_vfio_map_resource(dev);
75 #endif
76 		break;
77 	case RTE_PCI_KDRV_IGB_UIO:
78 	case RTE_PCI_KDRV_UIO_GENERIC:
79 		if (rte_eal_using_phys_addrs()) {
80 			/* map resources for devices that use uio */
81 			ret = pci_uio_map_resource(dev);
82 		}
83 		break;
84 	default:
85 		RTE_LOG(DEBUG, EAL,
86 			"  Not managed by a supported kernel driver, skipped\n");
87 		ret = 1;
88 		break;
89 	}
90 
91 	return ret;
92 }
93 
94 /* Unmap pci device */
95 void
96 rte_pci_unmap_device(struct rte_pci_device *dev)
97 {
98 	/* try unmapping the NIC resources using VFIO if it exists */
99 	switch (dev->kdrv) {
100 	case RTE_PCI_KDRV_VFIO:
101 #ifdef VFIO_PRESENT
102 		if (pci_vfio_is_enabled())
103 			pci_vfio_unmap_resource(dev);
104 #endif
105 		break;
106 	case RTE_PCI_KDRV_IGB_UIO:
107 	case RTE_PCI_KDRV_UIO_GENERIC:
108 		/* unmap resources for devices that use uio */
109 		pci_uio_unmap_resource(dev);
110 		break;
111 	default:
112 		RTE_LOG(DEBUG, EAL,
113 			"  Not managed by a supported kernel driver, skipped\n");
114 		break;
115 	}
116 }
117 
118 static int
119 find_max_end_va(const struct rte_memseg_list *msl, void *arg)
120 {
121 	size_t sz = msl->len;
122 	void *end_va = RTE_PTR_ADD(msl->base_va, sz);
123 	void **max_va = arg;
124 
125 	if (*max_va < end_va)
126 		*max_va = end_va;
127 	return 0;
128 }
129 
130 void *
131 pci_find_max_end_va(void)
132 {
133 	void *va = NULL;
134 
135 	rte_memseg_list_walk(find_max_end_va, &va);
136 	return va;
137 }
138 
139 
140 /* parse one line of the "resource" sysfs file (note that the 'line'
141  * string is modified)
142  */
143 int
144 pci_parse_one_sysfs_resource(char *line, size_t len, uint64_t *phys_addr,
145 	uint64_t *end_addr, uint64_t *flags)
146 {
147 	union pci_resource_info {
148 		struct {
149 			char *phys_addr;
150 			char *end_addr;
151 			char *flags;
152 		};
153 		char *ptrs[PCI_RESOURCE_FMT_NVAL];
154 	} res_info;
155 
156 	if (rte_strsplit(line, len, res_info.ptrs, 3, ' ') != 3) {
157 		RTE_LOG(ERR, EAL,
158 			"%s(): bad resource format\n", __func__);
159 		return -1;
160 	}
161 	errno = 0;
162 	*phys_addr = strtoull(res_info.phys_addr, NULL, 16);
163 	*end_addr = strtoull(res_info.end_addr, NULL, 16);
164 	*flags = strtoull(res_info.flags, NULL, 16);
165 	if (errno != 0) {
166 		RTE_LOG(ERR, EAL,
167 			"%s(): bad resource format\n", __func__);
168 		return -1;
169 	}
170 
171 	return 0;
172 }
173 
174 /* parse the "resource" sysfs file */
175 static int
176 pci_parse_sysfs_resource(const char *filename, struct rte_pci_device *dev)
177 {
178 	FILE *f;
179 	char buf[BUFSIZ];
180 	int i;
181 	uint64_t phys_addr, end_addr, flags;
182 
183 	f = fopen(filename, "r");
184 	if (f == NULL) {
185 		RTE_LOG(ERR, EAL, "Cannot open sysfs resource\n");
186 		return -1;
187 	}
188 
189 	for (i = 0; i<PCI_MAX_RESOURCE; i++) {
190 
191 		if (fgets(buf, sizeof(buf), f) == NULL) {
192 			RTE_LOG(ERR, EAL,
193 				"%s(): cannot read resource\n", __func__);
194 			goto error;
195 		}
196 		if (pci_parse_one_sysfs_resource(buf, sizeof(buf), &phys_addr,
197 				&end_addr, &flags) < 0)
198 			goto error;
199 
200 		if (flags & IORESOURCE_MEM) {
201 			dev->mem_resource[i].phys_addr = phys_addr;
202 			dev->mem_resource[i].len = end_addr - phys_addr + 1;
203 			/* not mapped for now */
204 			dev->mem_resource[i].addr = NULL;
205 		}
206 	}
207 	fclose(f);
208 	return 0;
209 
210 error:
211 	fclose(f);
212 	return -1;
213 }
214 
215 /* Scan one pci sysfs entry, and fill the devices list from it. */
216 static int
217 pci_scan_one(const char *dirname, const struct rte_pci_addr *addr)
218 {
219 	char filename[PATH_MAX];
220 	unsigned long tmp;
221 	struct rte_pci_device *dev;
222 	char driver[PATH_MAX];
223 	int ret;
224 
225 	dev = malloc(sizeof(*dev));
226 	if (dev == NULL)
227 		return -1;
228 
229 	memset(dev, 0, sizeof(*dev));
230 	dev->device.bus = &rte_pci_bus.bus;
231 	dev->addr = *addr;
232 
233 	/* get vendor id */
234 	snprintf(filename, sizeof(filename), "%s/vendor", dirname);
235 	if (eal_parse_sysfs_value(filename, &tmp) < 0) {
236 		free(dev);
237 		return -1;
238 	}
239 	dev->id.vendor_id = (uint16_t)tmp;
240 
241 	/* get device id */
242 	snprintf(filename, sizeof(filename), "%s/device", dirname);
243 	if (eal_parse_sysfs_value(filename, &tmp) < 0) {
244 		free(dev);
245 		return -1;
246 	}
247 	dev->id.device_id = (uint16_t)tmp;
248 
249 	/* get subsystem_vendor id */
250 	snprintf(filename, sizeof(filename), "%s/subsystem_vendor",
251 		 dirname);
252 	if (eal_parse_sysfs_value(filename, &tmp) < 0) {
253 		free(dev);
254 		return -1;
255 	}
256 	dev->id.subsystem_vendor_id = (uint16_t)tmp;
257 
258 	/* get subsystem_device id */
259 	snprintf(filename, sizeof(filename), "%s/subsystem_device",
260 		 dirname);
261 	if (eal_parse_sysfs_value(filename, &tmp) < 0) {
262 		free(dev);
263 		return -1;
264 	}
265 	dev->id.subsystem_device_id = (uint16_t)tmp;
266 
267 	/* get class_id */
268 	snprintf(filename, sizeof(filename), "%s/class",
269 		 dirname);
270 	if (eal_parse_sysfs_value(filename, &tmp) < 0) {
271 		free(dev);
272 		return -1;
273 	}
274 	/* the least 24 bits are valid: class, subclass, program interface */
275 	dev->id.class_id = (uint32_t)tmp & RTE_CLASS_ANY_ID;
276 
277 	/* get max_vfs */
278 	dev->max_vfs = 0;
279 	snprintf(filename, sizeof(filename), "%s/max_vfs", dirname);
280 	if (!access(filename, F_OK) &&
281 	    eal_parse_sysfs_value(filename, &tmp) == 0)
282 		dev->max_vfs = (uint16_t)tmp;
283 	else {
284 		/* for non igb_uio driver, need kernel version >= 3.8 */
285 		snprintf(filename, sizeof(filename),
286 			 "%s/sriov_numvfs", dirname);
287 		if (!access(filename, F_OK) &&
288 		    eal_parse_sysfs_value(filename, &tmp) == 0)
289 			dev->max_vfs = (uint16_t)tmp;
290 	}
291 
292 	/* get numa node, default to 0 if not present */
293 	snprintf(filename, sizeof(filename), "%s/numa_node",
294 		 dirname);
295 
296 	if (access(filename, F_OK) != -1) {
297 		if (eal_parse_sysfs_value(filename, &tmp) == 0)
298 			dev->device.numa_node = tmp;
299 		else
300 			dev->device.numa_node = -1;
301 	} else {
302 		dev->device.numa_node = 0;
303 	}
304 
305 	pci_name_set(dev);
306 
307 	/* parse resources */
308 	snprintf(filename, sizeof(filename), "%s/resource", dirname);
309 	if (pci_parse_sysfs_resource(filename, dev) < 0) {
310 		RTE_LOG(ERR, EAL, "%s(): cannot parse resource\n", __func__);
311 		free(dev);
312 		return -1;
313 	}
314 
315 	/* parse driver */
316 	snprintf(filename, sizeof(filename), "%s/driver", dirname);
317 	ret = pci_get_kernel_driver_by_path(filename, driver, sizeof(driver));
318 	if (ret < 0) {
319 		RTE_LOG(ERR, EAL, "Fail to get kernel driver\n");
320 		free(dev);
321 		return -1;
322 	}
323 
324 	if (!ret) {
325 		if (!strcmp(driver, "vfio-pci"))
326 			dev->kdrv = RTE_PCI_KDRV_VFIO;
327 		else if (!strcmp(driver, "igb_uio"))
328 			dev->kdrv = RTE_PCI_KDRV_IGB_UIO;
329 		else if (!strcmp(driver, "uio_pci_generic"))
330 			dev->kdrv = RTE_PCI_KDRV_UIO_GENERIC;
331 		else
332 			dev->kdrv = RTE_PCI_KDRV_UNKNOWN;
333 	} else {
334 		dev->kdrv = RTE_PCI_KDRV_NONE;
335 		return 0;
336 	}
337 	/* device is valid, add in list (sorted) */
338 	if (TAILQ_EMPTY(&rte_pci_bus.device_list)) {
339 		rte_pci_add_device(dev);
340 	} else {
341 		struct rte_pci_device *dev2;
342 		int ret;
343 
344 		TAILQ_FOREACH(dev2, &rte_pci_bus.device_list, next) {
345 			ret = rte_pci_addr_cmp(&dev->addr, &dev2->addr);
346 			if (ret > 0)
347 				continue;
348 
349 			if (ret < 0) {
350 				rte_pci_insert_device(dev2, dev);
351 			} else { /* already registered */
352 				if (!rte_dev_is_probed(&dev2->device)) {
353 					dev2->kdrv = dev->kdrv;
354 					dev2->max_vfs = dev->max_vfs;
355 					dev2->id = dev->id;
356 					pci_name_set(dev2);
357 					memmove(dev2->mem_resource,
358 						dev->mem_resource,
359 						sizeof(dev->mem_resource));
360 				} else {
361 					/**
362 					 * If device is plugged and driver is
363 					 * probed already, (This happens when
364 					 * we call rte_dev_probe which will
365 					 * scan all device on the bus) we don't
366 					 * need to do anything here unless...
367 					 **/
368 					if (dev2->kdrv != dev->kdrv ||
369 						dev2->max_vfs != dev->max_vfs ||
370 						memcmp(&dev2->id, &dev->id, sizeof(dev2->id)))
371 						/*
372 						 * This should not happens.
373 						 * But it is still possible if
374 						 * we unbind a device from
375 						 * vfio or uio before hotplug
376 						 * remove and rebind it with
377 						 * a different configure.
378 						 * So we just print out the
379 						 * error as an alarm.
380 						 */
381 						RTE_LOG(ERR, EAL, "Unexpected device scan at %s!\n",
382 							filename);
383 					else if (dev2->device.devargs !=
384 						 dev->device.devargs) {
385 						rte_devargs_remove(dev2->device.devargs);
386 						pci_name_set(dev2);
387 					}
388 				}
389 				free(dev);
390 			}
391 			return 0;
392 		}
393 
394 		rte_pci_add_device(dev);
395 	}
396 
397 	return 0;
398 }
399 
400 int
401 pci_update_device(const struct rte_pci_addr *addr)
402 {
403 	char filename[PATH_MAX];
404 
405 	snprintf(filename, sizeof(filename), "%s/" PCI_PRI_FMT,
406 		 rte_pci_get_sysfs_path(), addr->domain, addr->bus, addr->devid,
407 		 addr->function);
408 
409 	return pci_scan_one(filename, addr);
410 }
411 
412 /*
413  * split up a pci address into its constituent parts.
414  */
415 static int
416 parse_pci_addr_format(const char *buf, int bufsize, struct rte_pci_addr *addr)
417 {
418 	/* first split on ':' */
419 	union splitaddr {
420 		struct {
421 			char *domain;
422 			char *bus;
423 			char *devid;
424 			char *function;
425 		};
426 		char *str[PCI_FMT_NVAL]; /* last element-separator is "." not ":" */
427 	} splitaddr;
428 
429 	char *buf_copy = strndup(buf, bufsize);
430 	if (buf_copy == NULL)
431 		return -1;
432 
433 	if (rte_strsplit(buf_copy, bufsize, splitaddr.str, PCI_FMT_NVAL, ':')
434 			!= PCI_FMT_NVAL - 1)
435 		goto error;
436 	/* final split is on '.' between devid and function */
437 	splitaddr.function = strchr(splitaddr.devid,'.');
438 	if (splitaddr.function == NULL)
439 		goto error;
440 	*splitaddr.function++ = '\0';
441 
442 	/* now convert to int values */
443 	errno = 0;
444 	addr->domain = strtoul(splitaddr.domain, NULL, 16);
445 	addr->bus = strtoul(splitaddr.bus, NULL, 16);
446 	addr->devid = strtoul(splitaddr.devid, NULL, 16);
447 	addr->function = strtoul(splitaddr.function, NULL, 10);
448 	if (errno != 0)
449 		goto error;
450 
451 	free(buf_copy); /* free the copy made with strdup */
452 	return 0;
453 error:
454 	free(buf_copy);
455 	return -1;
456 }
457 
458 /*
459  * Scan the content of the PCI bus, and the devices in the devices
460  * list
461  */
462 int
463 rte_pci_scan(void)
464 {
465 	struct dirent *e;
466 	DIR *dir;
467 	char dirname[PATH_MAX];
468 	struct rte_pci_addr addr;
469 
470 	/* for debug purposes, PCI can be disabled */
471 	if (!rte_eal_has_pci())
472 		return 0;
473 
474 #ifdef VFIO_PRESENT
475 	if (!pci_vfio_is_enabled())
476 		RTE_LOG(DEBUG, EAL, "VFIO PCI modules not loaded\n");
477 #endif
478 
479 	dir = opendir(rte_pci_get_sysfs_path());
480 	if (dir == NULL) {
481 		RTE_LOG(ERR, EAL, "%s(): opendir failed: %s\n",
482 			__func__, strerror(errno));
483 		return -1;
484 	}
485 
486 	while ((e = readdir(dir)) != NULL) {
487 		if (e->d_name[0] == '.')
488 			continue;
489 
490 		if (parse_pci_addr_format(e->d_name, sizeof(e->d_name), &addr) != 0)
491 			continue;
492 
493 		if (rte_pci_ignore_device(&addr))
494 			continue;
495 
496 		snprintf(dirname, sizeof(dirname), "%s/%s",
497 				rte_pci_get_sysfs_path(), e->d_name);
498 
499 		if (pci_scan_one(dirname, &addr) < 0)
500 			goto error;
501 	}
502 	closedir(dir);
503 	return 0;
504 
505 error:
506 	closedir(dir);
507 	return -1;
508 }
509 
510 #if defined(RTE_ARCH_X86)
511 bool
512 pci_device_iommu_support_va(const struct rte_pci_device *dev)
513 {
514 #define VTD_CAP_MGAW_SHIFT	16
515 #define VTD_CAP_MGAW_MASK	(0x3fULL << VTD_CAP_MGAW_SHIFT)
516 	const struct rte_pci_addr *addr = &dev->addr;
517 	char filename[PATH_MAX];
518 	FILE *fp;
519 	uint64_t mgaw, vtd_cap_reg = 0;
520 
521 	snprintf(filename, sizeof(filename),
522 		 "%s/" PCI_PRI_FMT "/iommu/intel-iommu/cap",
523 		 rte_pci_get_sysfs_path(), addr->domain, addr->bus, addr->devid,
524 		 addr->function);
525 
526 	fp = fopen(filename, "r");
527 	if (fp == NULL) {
528 		/* We don't have an Intel IOMMU, assume VA supported */
529 		if (errno == ENOENT)
530 			return true;
531 
532 		RTE_LOG(ERR, EAL, "%s(): can't open %s: %s\n",
533 			__func__, filename, strerror(errno));
534 		return false;
535 	}
536 
537 	/* We have an Intel IOMMU */
538 	if (fscanf(fp, "%" PRIx64, &vtd_cap_reg) != 1) {
539 		RTE_LOG(ERR, EAL, "%s(): can't read %s\n", __func__, filename);
540 		fclose(fp);
541 		return false;
542 	}
543 
544 	fclose(fp);
545 
546 	mgaw = ((vtd_cap_reg & VTD_CAP_MGAW_MASK) >> VTD_CAP_MGAW_SHIFT) + 1;
547 
548 	/*
549 	 * Assuming there is no limitation by now. We can not know at this point
550 	 * because the memory has not been initialized yet. Setting the dma mask
551 	 * will force a check once memory initialization is done. We can not do
552 	 * a fallback to IOVA PA now, but if the dma check fails, the error
553 	 * message should advice for using '--iova-mode pa' if IOVA VA is the
554 	 * current mode.
555 	 */
556 	rte_mem_set_dma_mask(mgaw);
557 	return true;
558 }
559 #elif defined(RTE_ARCH_PPC_64)
560 bool
561 pci_device_iommu_support_va(__rte_unused const struct rte_pci_device *dev)
562 {
563 	/*
564 	 * IOMMU is always present on a PowerNV host (IOMMUv2).
565 	 * IOMMU is also present in a KVM/QEMU VM (IOMMUv1) but is not
566 	 * currently supported by DPDK. Test for our current environment
567 	 * and report VA support as appropriate.
568 	 */
569 
570 	char *line = NULL;
571 	size_t len = 0;
572 	char filename[PATH_MAX] = "/proc/cpuinfo";
573 	FILE *fp = fopen(filename, "r");
574 	bool ret = false;
575 
576 	if (fp == NULL) {
577 		RTE_LOG(ERR, EAL, "%s(): can't open %s: %s\n",
578 			__func__, filename, strerror(errno));
579 		return ret;
580 	}
581 
582 	/* Check for a PowerNV platform */
583 	while (getline(&line, &len, fp) != -1) {
584 		if (strstr(line, "platform") != NULL)
585 			continue;
586 
587 		if (strstr(line, "PowerNV") != NULL) {
588 			RTE_LOG(DEBUG, EAL, "Running on a PowerNV system\n");
589 			ret = true;
590 			break;
591 		}
592 	}
593 
594 	free(line);
595 	fclose(fp);
596 	return ret;
597 }
598 #else
599 bool
600 pci_device_iommu_support_va(__rte_unused const struct rte_pci_device *dev)
601 {
602 	return true;
603 }
604 #endif
605 
606 enum rte_iova_mode
607 pci_device_iova_mode(const struct rte_pci_driver *pdrv,
608 		     const struct rte_pci_device *pdev)
609 {
610 	enum rte_iova_mode iova_mode = RTE_IOVA_DC;
611 
612 	switch (pdev->kdrv) {
613 	case RTE_PCI_KDRV_VFIO: {
614 #ifdef VFIO_PRESENT
615 		static int is_vfio_noiommu_enabled = -1;
616 
617 		if (is_vfio_noiommu_enabled == -1) {
618 			if (rte_vfio_noiommu_is_enabled() == 1)
619 				is_vfio_noiommu_enabled = 1;
620 			else
621 				is_vfio_noiommu_enabled = 0;
622 		}
623 		if (is_vfio_noiommu_enabled != 0)
624 			iova_mode = RTE_IOVA_PA;
625 		else if ((pdrv->drv_flags & RTE_PCI_DRV_NEED_IOVA_AS_VA) != 0)
626 			iova_mode = RTE_IOVA_VA;
627 #endif
628 		break;
629 	}
630 
631 	case RTE_PCI_KDRV_IGB_UIO:
632 	case RTE_PCI_KDRV_UIO_GENERIC:
633 		iova_mode = RTE_IOVA_PA;
634 		break;
635 
636 	default:
637 		if ((pdrv->drv_flags & RTE_PCI_DRV_NEED_IOVA_AS_VA) != 0)
638 			iova_mode = RTE_IOVA_VA;
639 		break;
640 	}
641 	return iova_mode;
642 }
643 
644 /* Read PCI config space. */
645 int rte_pci_read_config(const struct rte_pci_device *device,
646 		void *buf, size_t len, off_t offset)
647 {
648 	char devname[RTE_DEV_NAME_MAX_LEN] = "";
649 	const struct rte_intr_handle *intr_handle = &device->intr_handle;
650 
651 	switch (device->kdrv) {
652 	case RTE_PCI_KDRV_IGB_UIO:
653 	case RTE_PCI_KDRV_UIO_GENERIC:
654 		return pci_uio_read_config(intr_handle, buf, len, offset);
655 #ifdef VFIO_PRESENT
656 	case RTE_PCI_KDRV_VFIO:
657 		return pci_vfio_read_config(intr_handle, buf, len, offset);
658 #endif
659 	default:
660 		rte_pci_device_name(&device->addr, devname,
661 				    RTE_DEV_NAME_MAX_LEN);
662 		RTE_LOG(ERR, EAL,
663 			"Unknown driver type for %s\n", devname);
664 		return -1;
665 	}
666 }
667 
668 /* Write PCI config space. */
669 int rte_pci_write_config(const struct rte_pci_device *device,
670 		const void *buf, size_t len, off_t offset)
671 {
672 	char devname[RTE_DEV_NAME_MAX_LEN] = "";
673 	const struct rte_intr_handle *intr_handle = &device->intr_handle;
674 
675 	switch (device->kdrv) {
676 	case RTE_PCI_KDRV_IGB_UIO:
677 	case RTE_PCI_KDRV_UIO_GENERIC:
678 		return pci_uio_write_config(intr_handle, buf, len, offset);
679 #ifdef VFIO_PRESENT
680 	case RTE_PCI_KDRV_VFIO:
681 		return pci_vfio_write_config(intr_handle, buf, len, offset);
682 #endif
683 	default:
684 		rte_pci_device_name(&device->addr, devname,
685 				    RTE_DEV_NAME_MAX_LEN);
686 		RTE_LOG(ERR, EAL,
687 			"Unknown driver type for %s\n", devname);
688 		return -1;
689 	}
690 }
691 
692 #if defined(RTE_ARCH_X86)
693 static int
694 pci_ioport_map(struct rte_pci_device *dev, int bar __rte_unused,
695 		struct rte_pci_ioport *p)
696 {
697 	uint16_t start, end;
698 	FILE *fp;
699 	char *line = NULL;
700 	char pci_id[16];
701 	int found = 0;
702 	size_t linesz;
703 
704 	if (rte_eal_iopl_init() != 0) {
705 		RTE_LOG(ERR, EAL, "%s(): insufficient ioport permissions for PCI device %s\n",
706 			__func__, dev->name);
707 		return -1;
708 	}
709 
710 	snprintf(pci_id, sizeof(pci_id), PCI_PRI_FMT,
711 		 dev->addr.domain, dev->addr.bus,
712 		 dev->addr.devid, dev->addr.function);
713 
714 	fp = fopen("/proc/ioports", "r");
715 	if (fp == NULL) {
716 		RTE_LOG(ERR, EAL, "%s(): can't open ioports\n", __func__);
717 		return -1;
718 	}
719 
720 	while (getdelim(&line, &linesz, '\n', fp) > 0) {
721 		char *ptr = line;
722 		char *left;
723 		int n;
724 
725 		n = strcspn(ptr, ":");
726 		ptr[n] = 0;
727 		left = &ptr[n + 1];
728 
729 		while (*left && isspace(*left))
730 			left++;
731 
732 		if (!strncmp(left, pci_id, strlen(pci_id))) {
733 			found = 1;
734 
735 			while (*ptr && isspace(*ptr))
736 				ptr++;
737 
738 			sscanf(ptr, "%04hx-%04hx", &start, &end);
739 
740 			break;
741 		}
742 	}
743 
744 	free(line);
745 	fclose(fp);
746 
747 	if (!found)
748 		return -1;
749 
750 	p->base = start;
751 	RTE_LOG(DEBUG, EAL, "PCI Port IO found start=0x%x\n", start);
752 
753 	return 0;
754 }
755 #endif
756 
757 int
758 rte_pci_ioport_map(struct rte_pci_device *dev, int bar,
759 		struct rte_pci_ioport *p)
760 {
761 	int ret = -1;
762 
763 	switch (dev->kdrv) {
764 #ifdef VFIO_PRESENT
765 	case RTE_PCI_KDRV_VFIO:
766 		if (pci_vfio_is_enabled())
767 			ret = pci_vfio_ioport_map(dev, bar, p);
768 		break;
769 #endif
770 	case RTE_PCI_KDRV_IGB_UIO:
771 		ret = pci_uio_ioport_map(dev, bar, p);
772 		break;
773 	case RTE_PCI_KDRV_UIO_GENERIC:
774 #if defined(RTE_ARCH_X86)
775 		ret = pci_ioport_map(dev, bar, p);
776 #else
777 		ret = pci_uio_ioport_map(dev, bar, p);
778 #endif
779 		break;
780 	default:
781 		break;
782 	}
783 
784 	if (!ret)
785 		p->dev = dev;
786 
787 	return ret;
788 }
789 
790 void
791 rte_pci_ioport_read(struct rte_pci_ioport *p,
792 		void *data, size_t len, off_t offset)
793 {
794 	switch (p->dev->kdrv) {
795 #ifdef VFIO_PRESENT
796 	case RTE_PCI_KDRV_VFIO:
797 		pci_vfio_ioport_read(p, data, len, offset);
798 		break;
799 #endif
800 	case RTE_PCI_KDRV_IGB_UIO:
801 		pci_uio_ioport_read(p, data, len, offset);
802 		break;
803 	case RTE_PCI_KDRV_UIO_GENERIC:
804 		pci_uio_ioport_read(p, data, len, offset);
805 		break;
806 	default:
807 		break;
808 	}
809 }
810 
811 void
812 rte_pci_ioport_write(struct rte_pci_ioport *p,
813 		const void *data, size_t len, off_t offset)
814 {
815 	switch (p->dev->kdrv) {
816 #ifdef VFIO_PRESENT
817 	case RTE_PCI_KDRV_VFIO:
818 		pci_vfio_ioport_write(p, data, len, offset);
819 		break;
820 #endif
821 	case RTE_PCI_KDRV_IGB_UIO:
822 		pci_uio_ioport_write(p, data, len, offset);
823 		break;
824 	case RTE_PCI_KDRV_UIO_GENERIC:
825 		pci_uio_ioport_write(p, data, len, offset);
826 		break;
827 	default:
828 		break;
829 	}
830 }
831 
832 int
833 rte_pci_ioport_unmap(struct rte_pci_ioport *p)
834 {
835 	int ret = -1;
836 
837 	switch (p->dev->kdrv) {
838 #ifdef VFIO_PRESENT
839 	case RTE_PCI_KDRV_VFIO:
840 		if (pci_vfio_is_enabled())
841 			ret = pci_vfio_ioport_unmap(p);
842 		break;
843 #endif
844 	case RTE_PCI_KDRV_IGB_UIO:
845 		ret = pci_uio_ioport_unmap(p);
846 		break;
847 	case RTE_PCI_KDRV_UIO_GENERIC:
848 #if defined(RTE_ARCH_X86)
849 		ret = 0;
850 #else
851 		ret = pci_uio_ioport_unmap(p);
852 #endif
853 		break;
854 	default:
855 		break;
856 	}
857 
858 	return ret;
859 }
860