xref: /dpdk/drivers/net/virtio/virtio_user/vhost_kernel.c (revision 746c346d76c47c47346e7a1168a2097fe6e77e80)
15566a3e3SBruce Richardson /* SPDX-License-Identifier: BSD-3-Clause
25566a3e3SBruce Richardson  * Copyright(c) 2016 Intel Corporation
3e3b43481SJianfeng Tan  */
4e3b43481SJianfeng Tan 
5e3b43481SJianfeng Tan #include <sys/types.h>
6e3b43481SJianfeng Tan #include <sys/stat.h>
7e3b43481SJianfeng Tan #include <fcntl.h>
8e3b43481SJianfeng Tan #include <unistd.h>
9e3b43481SJianfeng Tan 
10e3b43481SJianfeng Tan #include <rte_memory.h>
11e3b43481SJianfeng Tan #include <rte_eal_memconfig.h>
12e3b43481SJianfeng Tan 
13e3b43481SJianfeng Tan #include "vhost.h"
14e3b43481SJianfeng Tan #include "virtio_user_dev.h"
15e3b43481SJianfeng Tan #include "vhost_kernel_tap.h"
16e3b43481SJianfeng Tan 
17e3b43481SJianfeng Tan struct vhost_memory_kernel {
18e3b43481SJianfeng Tan 	uint32_t nregions;
19e3b43481SJianfeng Tan 	uint32_t padding;
20e3b43481SJianfeng Tan 	struct vhost_memory_region regions[0];
21e3b43481SJianfeng Tan };
22e3b43481SJianfeng Tan 
23e3b43481SJianfeng Tan /* vhost kernel ioctls */
24e3b43481SJianfeng Tan #define VHOST_VIRTIO 0xAF
25e3b43481SJianfeng Tan #define VHOST_GET_FEATURES _IOR(VHOST_VIRTIO, 0x00, __u64)
26e3b43481SJianfeng Tan #define VHOST_SET_FEATURES _IOW(VHOST_VIRTIO, 0x00, __u64)
27e3b43481SJianfeng Tan #define VHOST_SET_OWNER _IO(VHOST_VIRTIO, 0x01)
28e3b43481SJianfeng Tan #define VHOST_RESET_OWNER _IO(VHOST_VIRTIO, 0x02)
29e3b43481SJianfeng Tan #define VHOST_SET_MEM_TABLE _IOW(VHOST_VIRTIO, 0x03, struct vhost_memory_kernel)
30e3b43481SJianfeng Tan #define VHOST_SET_LOG_BASE _IOW(VHOST_VIRTIO, 0x04, __u64)
31e3b43481SJianfeng Tan #define VHOST_SET_LOG_FD _IOW(VHOST_VIRTIO, 0x07, int)
32e3b43481SJianfeng Tan #define VHOST_SET_VRING_NUM _IOW(VHOST_VIRTIO, 0x10, struct vhost_vring_state)
33e3b43481SJianfeng Tan #define VHOST_SET_VRING_ADDR _IOW(VHOST_VIRTIO, 0x11, struct vhost_vring_addr)
34e3b43481SJianfeng Tan #define VHOST_SET_VRING_BASE _IOW(VHOST_VIRTIO, 0x12, struct vhost_vring_state)
35e3b43481SJianfeng Tan #define VHOST_GET_VRING_BASE _IOWR(VHOST_VIRTIO, 0x12, struct vhost_vring_state)
36e3b43481SJianfeng Tan #define VHOST_SET_VRING_KICK _IOW(VHOST_VIRTIO, 0x20, struct vhost_vring_file)
37e3b43481SJianfeng Tan #define VHOST_SET_VRING_CALL _IOW(VHOST_VIRTIO, 0x21, struct vhost_vring_file)
38e3b43481SJianfeng Tan #define VHOST_SET_VRING_ERR _IOW(VHOST_VIRTIO, 0x22, struct vhost_vring_file)
39e3b43481SJianfeng Tan #define VHOST_NET_SET_BACKEND _IOW(VHOST_VIRTIO, 0x30, struct vhost_vring_file)
40e3b43481SJianfeng Tan 
41e3b43481SJianfeng Tan static uint64_t max_regions = 64;
42e3b43481SJianfeng Tan 
43e3b43481SJianfeng Tan static void
44e3b43481SJianfeng Tan get_vhost_kernel_max_regions(void)
45e3b43481SJianfeng Tan {
46e3b43481SJianfeng Tan 	int fd;
47e3b43481SJianfeng Tan 	char buf[20] = {'\0'};
48e3b43481SJianfeng Tan 
49e3b43481SJianfeng Tan 	fd = open("/sys/module/vhost/parameters/max_mem_regions", O_RDONLY);
50e3b43481SJianfeng Tan 	if (fd < 0)
51e3b43481SJianfeng Tan 		return;
52e3b43481SJianfeng Tan 
53e3b43481SJianfeng Tan 	if (read(fd, buf, sizeof(buf) - 1) > 0)
54e3b43481SJianfeng Tan 		max_regions = strtoull(buf, NULL, 10);
55e3b43481SJianfeng Tan 
56e3b43481SJianfeng Tan 	close(fd);
57e3b43481SJianfeng Tan }
58e3b43481SJianfeng Tan 
59e3b43481SJianfeng Tan static uint64_t vhost_req_user_to_kernel[] = {
60e3b43481SJianfeng Tan 	[VHOST_USER_SET_OWNER] = VHOST_SET_OWNER,
61e3b43481SJianfeng Tan 	[VHOST_USER_RESET_OWNER] = VHOST_RESET_OWNER,
62e3b43481SJianfeng Tan 	[VHOST_USER_SET_FEATURES] = VHOST_SET_FEATURES,
63e3b43481SJianfeng Tan 	[VHOST_USER_GET_FEATURES] = VHOST_GET_FEATURES,
64e3b43481SJianfeng Tan 	[VHOST_USER_SET_VRING_CALL] = VHOST_SET_VRING_CALL,
65e3b43481SJianfeng Tan 	[VHOST_USER_SET_VRING_NUM] = VHOST_SET_VRING_NUM,
66e3b43481SJianfeng Tan 	[VHOST_USER_SET_VRING_BASE] = VHOST_SET_VRING_BASE,
67e3b43481SJianfeng Tan 	[VHOST_USER_GET_VRING_BASE] = VHOST_GET_VRING_BASE,
68e3b43481SJianfeng Tan 	[VHOST_USER_SET_VRING_ADDR] = VHOST_SET_VRING_ADDR,
69e3b43481SJianfeng Tan 	[VHOST_USER_SET_VRING_KICK] = VHOST_SET_VRING_KICK,
70e3b43481SJianfeng Tan 	[VHOST_USER_SET_MEM_TABLE] = VHOST_SET_MEM_TABLE,
71e3b43481SJianfeng Tan };
72e3b43481SJianfeng Tan 
73*746c346dSAnatoly Burakov struct walk_arg {
74*746c346dSAnatoly Burakov 	struct vhost_memory_kernel *vm;
75*746c346dSAnatoly Burakov 	uint32_t region_nr;
76*746c346dSAnatoly Burakov };
77*746c346dSAnatoly Burakov static int
78*746c346dSAnatoly Burakov add_memory_region(const struct rte_memseg *ms, size_t len, void *arg)
79*746c346dSAnatoly Burakov {
80*746c346dSAnatoly Burakov 	struct walk_arg *wa = arg;
81*746c346dSAnatoly Burakov 	struct vhost_memory_region *mr;
82*746c346dSAnatoly Burakov 	void *start_addr;
83*746c346dSAnatoly Burakov 
84*746c346dSAnatoly Burakov 	if (wa->region_nr >= max_regions)
85*746c346dSAnatoly Burakov 		return -1;
86*746c346dSAnatoly Burakov 
87*746c346dSAnatoly Burakov 	mr = &wa->vm->regions[wa->region_nr++];
88*746c346dSAnatoly Burakov 	start_addr = ms->addr;
89*746c346dSAnatoly Burakov 
90*746c346dSAnatoly Burakov 	mr->guest_phys_addr = (uint64_t)(uintptr_t)start_addr;
91*746c346dSAnatoly Burakov 	mr->userspace_addr = (uint64_t)(uintptr_t)start_addr;
92*746c346dSAnatoly Burakov 	mr->memory_size = len;
93*746c346dSAnatoly Burakov 	mr->mmap_offset = 0;
94*746c346dSAnatoly Burakov 
95*746c346dSAnatoly Burakov 	return 0;
96*746c346dSAnatoly Burakov }
97*746c346dSAnatoly Burakov 
98*746c346dSAnatoly Burakov 
99e3b43481SJianfeng Tan /* By default, vhost kernel module allows 64 regions, but DPDK allows
100e3b43481SJianfeng Tan  * 256 segments. As a relief, below function merges those virtually
101e3b43481SJianfeng Tan  * adjacent memsegs into one region.
102e3b43481SJianfeng Tan  */
103e3b43481SJianfeng Tan static struct vhost_memory_kernel *
104e3b43481SJianfeng Tan prepare_vhost_memory_kernel(void)
105e3b43481SJianfeng Tan {
106e3b43481SJianfeng Tan 	struct vhost_memory_kernel *vm;
107*746c346dSAnatoly Burakov 	struct walk_arg wa;
108e3b43481SJianfeng Tan 
109e3b43481SJianfeng Tan 	vm = malloc(sizeof(struct vhost_memory_kernel) +
110e3b43481SJianfeng Tan 			max_regions *
111e3b43481SJianfeng Tan 			sizeof(struct vhost_memory_region));
1121e9057a9SJianfeng Tan 	if (!vm)
1131e9057a9SJianfeng Tan 		return NULL;
114e3b43481SJianfeng Tan 
115*746c346dSAnatoly Burakov 	wa.region_nr = 0;
116*746c346dSAnatoly Burakov 	wa.vm = vm;
117e3b43481SJianfeng Tan 
118*746c346dSAnatoly Burakov 	if (rte_memseg_contig_walk(add_memory_region, &wa) < 0) {
119e3b43481SJianfeng Tan 		free(vm);
120e3b43481SJianfeng Tan 		return NULL;
121e3b43481SJianfeng Tan 	}
122e3b43481SJianfeng Tan 
123*746c346dSAnatoly Burakov 	vm->nregions = wa.region_nr;
124e3b43481SJianfeng Tan 	vm->padding = 0;
125e3b43481SJianfeng Tan 	return vm;
126e3b43481SJianfeng Tan }
127e3b43481SJianfeng Tan 
1285e97e420SJianfeng Tan /* with below features, vhost kernel does not need to do the checksum and TSO,
1295e97e420SJianfeng Tan  * these info will be passed to virtio_user through virtio net header.
1305e97e420SJianfeng Tan  */
1315e97e420SJianfeng Tan #define VHOST_KERNEL_GUEST_OFFLOADS_MASK	\
1325e97e420SJianfeng Tan 	((1ULL << VIRTIO_NET_F_GUEST_CSUM) |	\
1335e97e420SJianfeng Tan 	 (1ULL << VIRTIO_NET_F_GUEST_TSO4) |	\
1345e97e420SJianfeng Tan 	 (1ULL << VIRTIO_NET_F_GUEST_TSO6) |	\
1355e97e420SJianfeng Tan 	 (1ULL << VIRTIO_NET_F_GUEST_ECN)  |	\
1365e97e420SJianfeng Tan 	 (1ULL << VIRTIO_NET_F_GUEST_UFO))
1375e97e420SJianfeng Tan 
1385e97e420SJianfeng Tan /* with below features, when flows from virtio_user to vhost kernel
1395e97e420SJianfeng Tan  * (1) if flows goes up through the kernel networking stack, it does not need
1405e97e420SJianfeng Tan  * to verify checksum, which can save CPU cycles;
1415e97e420SJianfeng Tan  * (2) if flows goes through a Linux bridge and outside from an interface
1425e97e420SJianfeng Tan  * (kernel driver), checksum and TSO will be done by GSO in kernel or even
1435e97e420SJianfeng Tan  * offloaded into real physical device.
1445e97e420SJianfeng Tan  */
1455e97e420SJianfeng Tan #define VHOST_KERNEL_HOST_OFFLOADS_MASK		\
1465e97e420SJianfeng Tan 	((1ULL << VIRTIO_NET_F_HOST_TSO4) |	\
1475e97e420SJianfeng Tan 	 (1ULL << VIRTIO_NET_F_HOST_TSO6) |	\
1485e97e420SJianfeng Tan 	 (1ULL << VIRTIO_NET_F_CSUM))
1495e97e420SJianfeng Tan 
150e3b43481SJianfeng Tan static int
151be7a4707SJianfeng Tan tap_supporte_mq(void)
152be7a4707SJianfeng Tan {
153be7a4707SJianfeng Tan 	int tapfd;
154be7a4707SJianfeng Tan 	unsigned int tap_features;
155be7a4707SJianfeng Tan 
156be7a4707SJianfeng Tan 	tapfd = open(PATH_NET_TUN, O_RDWR);
157be7a4707SJianfeng Tan 	if (tapfd < 0) {
158be7a4707SJianfeng Tan 		PMD_DRV_LOG(ERR, "fail to open %s: %s",
159be7a4707SJianfeng Tan 			    PATH_NET_TUN, strerror(errno));
160be7a4707SJianfeng Tan 		return -1;
161be7a4707SJianfeng Tan 	}
162be7a4707SJianfeng Tan 
163be7a4707SJianfeng Tan 	if (ioctl(tapfd, TUNGETFEATURES, &tap_features) == -1) {
164be7a4707SJianfeng Tan 		PMD_DRV_LOG(ERR, "TUNGETFEATURES failed: %s", strerror(errno));
165be7a4707SJianfeng Tan 		close(tapfd);
166be7a4707SJianfeng Tan 		return -1;
167be7a4707SJianfeng Tan 	}
168be7a4707SJianfeng Tan 
169be7a4707SJianfeng Tan 	close(tapfd);
170be7a4707SJianfeng Tan 	return tap_features & IFF_MULTI_QUEUE;
171be7a4707SJianfeng Tan }
172be7a4707SJianfeng Tan 
173be7a4707SJianfeng Tan static int
174e3b43481SJianfeng Tan vhost_kernel_ioctl(struct virtio_user_dev *dev,
175e3b43481SJianfeng Tan 		   enum vhost_user_request req,
176e3b43481SJianfeng Tan 		   void *arg)
177e3b43481SJianfeng Tan {
178e3b43481SJianfeng Tan 	int ret = -1;
179e3b43481SJianfeng Tan 	unsigned int i;
180e3b43481SJianfeng Tan 	uint64_t req_kernel;
181e3b43481SJianfeng Tan 	struct vhost_memory_kernel *vm = NULL;
182be7a4707SJianfeng Tan 	int vhostfd;
183be7a4707SJianfeng Tan 	unsigned int queue_sel;
184e3b43481SJianfeng Tan 
185e3b43481SJianfeng Tan 	PMD_DRV_LOG(INFO, "%s", vhost_msg_strings[req]);
186e3b43481SJianfeng Tan 
187e3b43481SJianfeng Tan 	req_kernel = vhost_req_user_to_kernel[req];
188e3b43481SJianfeng Tan 
189e3b43481SJianfeng Tan 	if (req_kernel == VHOST_SET_MEM_TABLE) {
190e3b43481SJianfeng Tan 		vm = prepare_vhost_memory_kernel();
191e3b43481SJianfeng Tan 		if (!vm)
192e3b43481SJianfeng Tan 			return -1;
193e3b43481SJianfeng Tan 		arg = (void *)vm;
194e3b43481SJianfeng Tan 	}
195e3b43481SJianfeng Tan 
1965e97e420SJianfeng Tan 	if (req_kernel == VHOST_SET_FEATURES) {
197e3b43481SJianfeng Tan 		/* We don't need memory protection here */
198e3b43481SJianfeng Tan 		*(uint64_t *)arg &= ~(1ULL << VIRTIO_F_IOMMU_PLATFORM);
199e3b43481SJianfeng Tan 
2005e97e420SJianfeng Tan 		/* VHOST kernel does not know about below flags */
2015e97e420SJianfeng Tan 		*(uint64_t *)arg &= ~VHOST_KERNEL_GUEST_OFFLOADS_MASK;
2025e97e420SJianfeng Tan 		*(uint64_t *)arg &= ~VHOST_KERNEL_HOST_OFFLOADS_MASK;
203be7a4707SJianfeng Tan 
204be7a4707SJianfeng Tan 		*(uint64_t *)arg &= ~(1ULL << VIRTIO_NET_F_MQ);
2055e97e420SJianfeng Tan 	}
2065e97e420SJianfeng Tan 
207be7a4707SJianfeng Tan 	switch (req_kernel) {
208be7a4707SJianfeng Tan 	case VHOST_SET_VRING_NUM:
209be7a4707SJianfeng Tan 	case VHOST_SET_VRING_ADDR:
210be7a4707SJianfeng Tan 	case VHOST_SET_VRING_BASE:
211be7a4707SJianfeng Tan 	case VHOST_GET_VRING_BASE:
212be7a4707SJianfeng Tan 	case VHOST_SET_VRING_KICK:
213be7a4707SJianfeng Tan 	case VHOST_SET_VRING_CALL:
214be7a4707SJianfeng Tan 		queue_sel = *(unsigned int *)arg;
215be7a4707SJianfeng Tan 		vhostfd = dev->vhostfds[queue_sel / 2];
216be7a4707SJianfeng Tan 		*(unsigned int *)arg = queue_sel % 2;
217be7a4707SJianfeng Tan 		PMD_DRV_LOG(DEBUG, "vhostfd=%d, index=%u",
218be7a4707SJianfeng Tan 			    vhostfd, *(unsigned int *)arg);
219be7a4707SJianfeng Tan 		break;
220be7a4707SJianfeng Tan 	default:
221be7a4707SJianfeng Tan 		vhostfd = -1;
222be7a4707SJianfeng Tan 	}
223be7a4707SJianfeng Tan 	if (vhostfd == -1) {
224e3b43481SJianfeng Tan 		for (i = 0; i < dev->max_queue_pairs; ++i) {
225e3b43481SJianfeng Tan 			if (dev->vhostfds[i] < 0)
226e3b43481SJianfeng Tan 				continue;
227e3b43481SJianfeng Tan 
228e3b43481SJianfeng Tan 			ret = ioctl(dev->vhostfds[i], req_kernel, arg);
229e3b43481SJianfeng Tan 			if (ret < 0)
230e3b43481SJianfeng Tan 				break;
231e3b43481SJianfeng Tan 		}
232be7a4707SJianfeng Tan 	} else {
233be7a4707SJianfeng Tan 		ret = ioctl(vhostfd, req_kernel, arg);
234be7a4707SJianfeng Tan 	}
235e3b43481SJianfeng Tan 
2365e97e420SJianfeng Tan 	if (!ret && req_kernel == VHOST_GET_FEATURES) {
2375e97e420SJianfeng Tan 		/* with tap as the backend, all these features are supported
2385e97e420SJianfeng Tan 		 * but not claimed by vhost-net, so we add them back when
2395e97e420SJianfeng Tan 		 * reporting to upper layer.
2405e97e420SJianfeng Tan 		 */
2415e97e420SJianfeng Tan 		*((uint64_t *)arg) |= VHOST_KERNEL_GUEST_OFFLOADS_MASK;
2425e97e420SJianfeng Tan 		*((uint64_t *)arg) |= VHOST_KERNEL_HOST_OFFLOADS_MASK;
243be7a4707SJianfeng Tan 
244be7a4707SJianfeng Tan 		/* vhost_kernel will not declare this feature, but it does
245be7a4707SJianfeng Tan 		 * support multi-queue.
246be7a4707SJianfeng Tan 		 */
247be7a4707SJianfeng Tan 		if (tap_supporte_mq())
248be7a4707SJianfeng Tan 			*(uint64_t *)arg |= (1ull << VIRTIO_NET_F_MQ);
2495e97e420SJianfeng Tan 	}
2505e97e420SJianfeng Tan 
251e3b43481SJianfeng Tan 	if (vm)
252e3b43481SJianfeng Tan 		free(vm);
253e3b43481SJianfeng Tan 
254e3b43481SJianfeng Tan 	if (ret < 0)
255e3b43481SJianfeng Tan 		PMD_DRV_LOG(ERR, "%s failed: %s",
256e3b43481SJianfeng Tan 			    vhost_msg_strings[req], strerror(errno));
257e3b43481SJianfeng Tan 
258e3b43481SJianfeng Tan 	return ret;
259e3b43481SJianfeng Tan }
260e3b43481SJianfeng Tan 
261e3b43481SJianfeng Tan /**
262e3b43481SJianfeng Tan  * Set up environment to talk with a vhost kernel backend.
263e3b43481SJianfeng Tan  *
264e3b43481SJianfeng Tan  * @return
265e3b43481SJianfeng Tan  *   - (-1) if fail to set up;
266e3b43481SJianfeng Tan  *   - (>=0) if successful.
267e3b43481SJianfeng Tan  */
268e3b43481SJianfeng Tan static int
269e3b43481SJianfeng Tan vhost_kernel_setup(struct virtio_user_dev *dev)
270e3b43481SJianfeng Tan {
271e3b43481SJianfeng Tan 	int vhostfd;
272e3b43481SJianfeng Tan 	uint32_t i;
273e3b43481SJianfeng Tan 
274e3b43481SJianfeng Tan 	get_vhost_kernel_max_regions();
275e3b43481SJianfeng Tan 
276e3b43481SJianfeng Tan 	for (i = 0; i < dev->max_queue_pairs; ++i) {
277e3b43481SJianfeng Tan 		vhostfd = open(dev->path, O_RDWR);
278e3b43481SJianfeng Tan 		if (vhostfd < 0) {
279e3b43481SJianfeng Tan 			PMD_DRV_LOG(ERR, "fail to open %s, %s",
280e3b43481SJianfeng Tan 				    dev->path, strerror(errno));
281e3b43481SJianfeng Tan 			return -1;
282e3b43481SJianfeng Tan 		}
283e3b43481SJianfeng Tan 
284e3b43481SJianfeng Tan 		dev->vhostfds[i] = vhostfd;
285e3b43481SJianfeng Tan 	}
286e3b43481SJianfeng Tan 
287e3b43481SJianfeng Tan 	return 0;
288e3b43481SJianfeng Tan }
289e3b43481SJianfeng Tan 
290e3b43481SJianfeng Tan static int
291e3b43481SJianfeng Tan vhost_kernel_set_backend(int vhostfd, int tapfd)
292e3b43481SJianfeng Tan {
293e3b43481SJianfeng Tan 	struct vhost_vring_file f;
294e3b43481SJianfeng Tan 
295e3b43481SJianfeng Tan 	f.fd = tapfd;
296e3b43481SJianfeng Tan 	f.index = 0;
297e3b43481SJianfeng Tan 	if (ioctl(vhostfd, VHOST_NET_SET_BACKEND, &f) < 0) {
298e3b43481SJianfeng Tan 		PMD_DRV_LOG(ERR, "VHOST_NET_SET_BACKEND fails, %s",
299e3b43481SJianfeng Tan 				strerror(errno));
300e3b43481SJianfeng Tan 		return -1;
301e3b43481SJianfeng Tan 	}
302e3b43481SJianfeng Tan 
303e3b43481SJianfeng Tan 	f.index = 1;
304e3b43481SJianfeng Tan 	if (ioctl(vhostfd, VHOST_NET_SET_BACKEND, &f) < 0) {
305e3b43481SJianfeng Tan 		PMD_DRV_LOG(ERR, "VHOST_NET_SET_BACKEND fails, %s",
306e3b43481SJianfeng Tan 				strerror(errno));
307e3b43481SJianfeng Tan 		return -1;
308e3b43481SJianfeng Tan 	}
309e3b43481SJianfeng Tan 
310e3b43481SJianfeng Tan 	return 0;
311e3b43481SJianfeng Tan }
312e3b43481SJianfeng Tan 
313e3b43481SJianfeng Tan static int
314e3b43481SJianfeng Tan vhost_kernel_enable_queue_pair(struct virtio_user_dev *dev,
315e3b43481SJianfeng Tan 			       uint16_t pair_idx,
316e3b43481SJianfeng Tan 			       int enable)
317e3b43481SJianfeng Tan {
318e3b43481SJianfeng Tan 	int hdr_size;
319e3b43481SJianfeng Tan 	int vhostfd;
320e3b43481SJianfeng Tan 	int tapfd;
321be7a4707SJianfeng Tan 	int req_mq = (dev->max_queue_pairs > 1);
322e3b43481SJianfeng Tan 
323e3b43481SJianfeng Tan 	vhostfd = dev->vhostfds[pair_idx];
324e3b43481SJianfeng Tan 
325e3b43481SJianfeng Tan 	if (!enable) {
326250c9965SWenfeng Liu 		if (dev->tapfds[pair_idx] >= 0) {
327e3b43481SJianfeng Tan 			close(dev->tapfds[pair_idx]);
328e3b43481SJianfeng Tan 			dev->tapfds[pair_idx] = -1;
329e3b43481SJianfeng Tan 		}
330e3b43481SJianfeng Tan 		return vhost_kernel_set_backend(vhostfd, -1);
331e3b43481SJianfeng Tan 	} else if (dev->tapfds[pair_idx] >= 0) {
332e3b43481SJianfeng Tan 		return 0;
333e3b43481SJianfeng Tan 	}
334e3b43481SJianfeng Tan 
335e3b43481SJianfeng Tan 	if ((dev->features & (1ULL << VIRTIO_NET_F_MRG_RXBUF)) ||
336e3b43481SJianfeng Tan 	    (dev->features & (1ULL << VIRTIO_F_VERSION_1)))
337e3b43481SJianfeng Tan 		hdr_size = sizeof(struct virtio_net_hdr_mrg_rxbuf);
338e3b43481SJianfeng Tan 	else
339e3b43481SJianfeng Tan 		hdr_size = sizeof(struct virtio_net_hdr);
340e3b43481SJianfeng Tan 
341791b43e0SNing Li 	tapfd = vhost_kernel_open_tap(&dev->ifname, hdr_size, req_mq,
342791b43e0SNing Li 			 (char *)dev->mac_addr);
343e3b43481SJianfeng Tan 	if (tapfd < 0) {
344e3b43481SJianfeng Tan 		PMD_DRV_LOG(ERR, "fail to open tap for vhost kernel");
345e3b43481SJianfeng Tan 		return -1;
346e3b43481SJianfeng Tan 	}
347e3b43481SJianfeng Tan 
348e3b43481SJianfeng Tan 	if (vhost_kernel_set_backend(vhostfd, tapfd) < 0) {
349e3b43481SJianfeng Tan 		PMD_DRV_LOG(ERR, "fail to set backend for vhost kernel");
350e3b43481SJianfeng Tan 		close(tapfd);
351e3b43481SJianfeng Tan 		return -1;
352e3b43481SJianfeng Tan 	}
353e3b43481SJianfeng Tan 
354e3b43481SJianfeng Tan 	dev->tapfds[pair_idx] = tapfd;
355e3b43481SJianfeng Tan 	return 0;
356e3b43481SJianfeng Tan }
357e3b43481SJianfeng Tan 
358e3b43481SJianfeng Tan struct virtio_user_backend_ops ops_kernel = {
359e3b43481SJianfeng Tan 	.setup = vhost_kernel_setup,
360e3b43481SJianfeng Tan 	.send_request = vhost_kernel_ioctl,
361e3b43481SJianfeng Tan 	.enable_qp = vhost_kernel_enable_queue_pair
362e3b43481SJianfeng Tan };
363