xref: /dpdk/drivers/net/virtio/virtio_user/virtio_user_dev.c (revision bd8f50a45d0fb55cf191c3f6022a1ceb80a0b712)
15566a3e3SBruce Richardson /* SPDX-License-Identifier: BSD-3-Clause
25566a3e3SBruce Richardson  * Copyright(c) 2010-2016 Intel Corporation
337a7eb2aSJianfeng Tan  */
437a7eb2aSJianfeng Tan 
537a7eb2aSJianfeng Tan #include <stdint.h>
637a7eb2aSJianfeng Tan #include <stdio.h>
737a7eb2aSJianfeng Tan #include <fcntl.h>
837a7eb2aSJianfeng Tan #include <string.h>
937a7eb2aSJianfeng Tan #include <errno.h>
1037a7eb2aSJianfeng Tan #include <sys/mman.h>
1137a7eb2aSJianfeng Tan #include <unistd.h>
1237a7eb2aSJianfeng Tan #include <sys/eventfd.h>
1333d24d65SJianfeng Tan #include <sys/types.h>
1433d24d65SJianfeng Tan #include <sys/stat.h>
1537a7eb2aSJianfeng Tan 
1637a7eb2aSJianfeng Tan #include "vhost.h"
1737a7eb2aSJianfeng Tan #include "virtio_user_dev.h"
1837a7eb2aSJianfeng Tan #include "../virtio_ethdev.h"
1937a7eb2aSJianfeng Tan 
2037a7eb2aSJianfeng Tan static int
2157ae79a7SJianfeng Tan virtio_user_create_queue(struct virtio_user_dev *dev, uint32_t queue_sel)
2257ae79a7SJianfeng Tan {
2357ae79a7SJianfeng Tan 	/* Of all per virtqueue MSGs, make sure VHOST_SET_VRING_CALL come
2457ae79a7SJianfeng Tan 	 * firstly because vhost depends on this msg to allocate virtqueue
2557ae79a7SJianfeng Tan 	 * pair.
2657ae79a7SJianfeng Tan 	 */
2757ae79a7SJianfeng Tan 	struct vhost_vring_file file;
2857ae79a7SJianfeng Tan 
2957ae79a7SJianfeng Tan 	file.index = queue_sel;
30e6e7ad8bSJianfeng Tan 	file.fd = dev->callfds[queue_sel];
3133d24d65SJianfeng Tan 	dev->ops->send_request(dev, VHOST_USER_SET_VRING_CALL, &file);
3257ae79a7SJianfeng Tan 
3357ae79a7SJianfeng Tan 	return 0;
3457ae79a7SJianfeng Tan }
3557ae79a7SJianfeng Tan 
3657ae79a7SJianfeng Tan static int
3737a7eb2aSJianfeng Tan virtio_user_kick_queue(struct virtio_user_dev *dev, uint32_t queue_sel)
3837a7eb2aSJianfeng Tan {
3937a7eb2aSJianfeng Tan 	struct vhost_vring_file file;
4037a7eb2aSJianfeng Tan 	struct vhost_vring_state state;
4137a7eb2aSJianfeng Tan 	struct vring *vring = &dev->vrings[queue_sel];
4237a7eb2aSJianfeng Tan 	struct vhost_vring_addr addr = {
4337a7eb2aSJianfeng Tan 		.index = queue_sel,
4437a7eb2aSJianfeng Tan 		.desc_user_addr = (uint64_t)(uintptr_t)vring->desc,
4537a7eb2aSJianfeng Tan 		.avail_user_addr = (uint64_t)(uintptr_t)vring->avail,
4637a7eb2aSJianfeng Tan 		.used_user_addr = (uint64_t)(uintptr_t)vring->used,
4737a7eb2aSJianfeng Tan 		.log_guest_addr = 0,
4837a7eb2aSJianfeng Tan 		.flags = 0, /* disable log */
4937a7eb2aSJianfeng Tan 	};
5037a7eb2aSJianfeng Tan 
5137a7eb2aSJianfeng Tan 	state.index = queue_sel;
5237a7eb2aSJianfeng Tan 	state.num = vring->num;
5333d24d65SJianfeng Tan 	dev->ops->send_request(dev, VHOST_USER_SET_VRING_NUM, &state);
5437a7eb2aSJianfeng Tan 
55be7a4707SJianfeng Tan 	state.index = queue_sel;
5637a7eb2aSJianfeng Tan 	state.num = 0; /* no reservation */
5733d24d65SJianfeng Tan 	dev->ops->send_request(dev, VHOST_USER_SET_VRING_BASE, &state);
5837a7eb2aSJianfeng Tan 
5933d24d65SJianfeng Tan 	dev->ops->send_request(dev, VHOST_USER_SET_VRING_ADDR, &addr);
6037a7eb2aSJianfeng Tan 
6137a7eb2aSJianfeng Tan 	/* Of all per virtqueue MSGs, make sure VHOST_USER_SET_VRING_KICK comes
6237a7eb2aSJianfeng Tan 	 * lastly because vhost depends on this msg to judge if
6337a7eb2aSJianfeng Tan 	 * virtio is ready.
6437a7eb2aSJianfeng Tan 	 */
6557ae79a7SJianfeng Tan 	file.index = queue_sel;
66e6e7ad8bSJianfeng Tan 	file.fd = dev->kickfds[queue_sel];
6733d24d65SJianfeng Tan 	dev->ops->send_request(dev, VHOST_USER_SET_VRING_KICK, &file);
6837a7eb2aSJianfeng Tan 
6937a7eb2aSJianfeng Tan 	return 0;
7037a7eb2aSJianfeng Tan }
7137a7eb2aSJianfeng Tan 
7257ae79a7SJianfeng Tan static int
7357ae79a7SJianfeng Tan virtio_user_queue_setup(struct virtio_user_dev *dev,
7457ae79a7SJianfeng Tan 			int (*fn)(struct virtio_user_dev *, uint32_t))
7557ae79a7SJianfeng Tan {
7657ae79a7SJianfeng Tan 	uint32_t i, queue_sel;
7757ae79a7SJianfeng Tan 
7857ae79a7SJianfeng Tan 	for (i = 0; i < dev->max_queue_pairs; ++i) {
7957ae79a7SJianfeng Tan 		queue_sel = 2 * i + VTNET_SQ_RQ_QUEUE_IDX;
8057ae79a7SJianfeng Tan 		if (fn(dev, queue_sel) < 0) {
8157ae79a7SJianfeng Tan 			PMD_DRV_LOG(INFO, "setup rx vq fails: %u", i);
8257ae79a7SJianfeng Tan 			return -1;
8357ae79a7SJianfeng Tan 		}
8457ae79a7SJianfeng Tan 	}
8557ae79a7SJianfeng Tan 	for (i = 0; i < dev->max_queue_pairs; ++i) {
8657ae79a7SJianfeng Tan 		queue_sel = 2 * i + VTNET_SQ_TQ_QUEUE_IDX;
8757ae79a7SJianfeng Tan 		if (fn(dev, queue_sel) < 0) {
8857ae79a7SJianfeng Tan 			PMD_DRV_LOG(INFO, "setup tx vq fails: %u", i);
8957ae79a7SJianfeng Tan 			return -1;
9057ae79a7SJianfeng Tan 		}
9157ae79a7SJianfeng Tan 	}
9257ae79a7SJianfeng Tan 
9357ae79a7SJianfeng Tan 	return 0;
9457ae79a7SJianfeng Tan }
9557ae79a7SJianfeng Tan 
/* Tell whether @path names a socket, which is how this file recognises a
 * vhost-user backend.
 *
 * Returns the (non-zero) result of S_ISSOCK() when @path is a socket, and
 * 0 when it is anything else or when stat() fails on it.
 */
int
is_vhost_user_by_type(const char *path)
{
	struct stat st;

	return stat(path, &st) == -1 ? 0 : S_ISSOCK(st.st_mode);
}
106*bd8f50a4SZhiyong Yang 
107*bd8f50a4SZhiyong Yang int
10837a7eb2aSJianfeng Tan virtio_user_start_device(struct virtio_user_dev *dev)
10937a7eb2aSJianfeng Tan {
11037a7eb2aSJianfeng Tan 	uint64_t features;
11137a7eb2aSJianfeng Tan 	int ret;
11237a7eb2aSJianfeng Tan 
113*bd8f50a4SZhiyong Yang 	if (is_vhost_user_by_type(dev->path) && dev->vhostfd < 0)
114*bd8f50a4SZhiyong Yang 		return -1;
115*bd8f50a4SZhiyong Yang 
116bce7e905SJianfeng Tan 	/* Do not check return as already done in init, or reset in stop */
117bce7e905SJianfeng Tan 	dev->ops->send_request(dev, VHOST_USER_SET_OWNER, NULL);
118bce7e905SJianfeng Tan 
11957ae79a7SJianfeng Tan 	/* Step 0: tell vhost to create queues */
12057ae79a7SJianfeng Tan 	if (virtio_user_queue_setup(dev, virtio_user_create_queue) < 0)
12137a7eb2aSJianfeng Tan 		goto error;
12237a7eb2aSJianfeng Tan 
12333d24d65SJianfeng Tan 	/* Step 1: set features */
12437a7eb2aSJianfeng Tan 	features = dev->features;
12533d24d65SJianfeng Tan 	/* Strip VIRTIO_NET_F_MAC, as MAC address is handled in vdev init */
12637a7eb2aSJianfeng Tan 	features &= ~(1ull << VIRTIO_NET_F_MAC);
12733d24d65SJianfeng Tan 	/* Strip VIRTIO_NET_F_CTRL_VQ, as devices do not really need to know */
128142678d4SJianfeng Tan 	features &= ~(1ull << VIRTIO_NET_F_CTRL_VQ);
12935c4f855SJianfeng Tan 	features &= ~(1ull << VIRTIO_NET_F_STATUS);
13033d24d65SJianfeng Tan 	ret = dev->ops->send_request(dev, VHOST_USER_SET_FEATURES, &features);
13137a7eb2aSJianfeng Tan 	if (ret < 0)
13237a7eb2aSJianfeng Tan 		goto error;
13337a7eb2aSJianfeng Tan 	PMD_DRV_LOG(INFO, "set features: %" PRIx64, features);
13437a7eb2aSJianfeng Tan 
13557ae79a7SJianfeng Tan 	/* Step 2: share memory regions */
13633d24d65SJianfeng Tan 	ret = dev->ops->send_request(dev, VHOST_USER_SET_MEM_TABLE, NULL);
13757ae79a7SJianfeng Tan 	if (ret < 0)
13857ae79a7SJianfeng Tan 		goto error;
13957ae79a7SJianfeng Tan 
14057ae79a7SJianfeng Tan 	/* Step 3: kick queues */
14157ae79a7SJianfeng Tan 	if (virtio_user_queue_setup(dev, virtio_user_kick_queue) < 0)
14257ae79a7SJianfeng Tan 		goto error;
14357ae79a7SJianfeng Tan 
14457ae79a7SJianfeng Tan 	/* Step 4: enable queues
14557ae79a7SJianfeng Tan 	 * we enable the 1st queue pair by default.
14657ae79a7SJianfeng Tan 	 */
14733d24d65SJianfeng Tan 	dev->ops->enable_qp(dev, 0, 1);
14857ae79a7SJianfeng Tan 
14937a7eb2aSJianfeng Tan 	return 0;
15037a7eb2aSJianfeng Tan error:
15137a7eb2aSJianfeng Tan 	/* TODO: free resource here or caller to check */
15237a7eb2aSJianfeng Tan 	return -1;
15337a7eb2aSJianfeng Tan }
15437a7eb2aSJianfeng Tan 
15537a7eb2aSJianfeng Tan int virtio_user_stop_device(struct virtio_user_dev *dev)
15637a7eb2aSJianfeng Tan {
157c12a26eeSJianfeng Tan 	uint32_t i;
158c12a26eeSJianfeng Tan 
159c12a26eeSJianfeng Tan 	for (i = 0; i < dev->max_queue_pairs; ++i)
16033d24d65SJianfeng Tan 		dev->ops->enable_qp(dev, i, 0);
161c12a26eeSJianfeng Tan 
1620d6a8752SJianfeng Tan 	if (dev->ops->send_request(dev, VHOST_USER_RESET_OWNER, NULL) < 0) {
1630d6a8752SJianfeng Tan 		PMD_DRV_LOG(INFO, "Failed to reset the device\n");
1640d6a8752SJianfeng Tan 		return -1;
1650d6a8752SJianfeng Tan 	}
1660d6a8752SJianfeng Tan 
167c12a26eeSJianfeng Tan 	return 0;
16837a7eb2aSJianfeng Tan }
16937a7eb2aSJianfeng Tan 
17037a7eb2aSJianfeng Tan static inline void
17137a7eb2aSJianfeng Tan parse_mac(struct virtio_user_dev *dev, const char *mac)
17237a7eb2aSJianfeng Tan {
17337a7eb2aSJianfeng Tan 	int i, r;
17437a7eb2aSJianfeng Tan 	uint32_t tmp[ETHER_ADDR_LEN];
17537a7eb2aSJianfeng Tan 
17637a7eb2aSJianfeng Tan 	if (!mac)
17737a7eb2aSJianfeng Tan 		return;
17837a7eb2aSJianfeng Tan 
17937a7eb2aSJianfeng Tan 	r = sscanf(mac, "%x:%x:%x:%x:%x:%x", &tmp[0],
18037a7eb2aSJianfeng Tan 			&tmp[1], &tmp[2], &tmp[3], &tmp[4], &tmp[5]);
18137a7eb2aSJianfeng Tan 	if (r == ETHER_ADDR_LEN) {
18237a7eb2aSJianfeng Tan 		for (i = 0; i < ETHER_ADDR_LEN; ++i)
18337a7eb2aSJianfeng Tan 			dev->mac_addr[i] = (uint8_t)tmp[i];
18437a7eb2aSJianfeng Tan 		dev->mac_specified = 1;
18537a7eb2aSJianfeng Tan 	} else {
18637a7eb2aSJianfeng Tan 		/* ignore the wrong mac, use random mac */
18737a7eb2aSJianfeng Tan 		PMD_DRV_LOG(ERR, "wrong format of mac: %s", mac);
18837a7eb2aSJianfeng Tan 	}
18937a7eb2aSJianfeng Tan }
19037a7eb2aSJianfeng Tan 
19133d24d65SJianfeng Tan static int
192e6e7ad8bSJianfeng Tan virtio_user_dev_init_notify(struct virtio_user_dev *dev)
19333d24d65SJianfeng Tan {
194e6e7ad8bSJianfeng Tan 	uint32_t i, j;
195e6e7ad8bSJianfeng Tan 	int callfd;
196e6e7ad8bSJianfeng Tan 	int kickfd;
19733d24d65SJianfeng Tan 
1982269b9aeSWenfeng Liu 	for (i = 0; i < VIRTIO_MAX_VIRTQUEUES; ++i) {
199e6e7ad8bSJianfeng Tan 		if (i >= dev->max_queue_pairs * 2) {
20033d24d65SJianfeng Tan 			dev->kickfds[i] = -1;
20133d24d65SJianfeng Tan 			dev->callfds[i] = -1;
202e6e7ad8bSJianfeng Tan 			continue;
20333d24d65SJianfeng Tan 		}
20433d24d65SJianfeng Tan 
205e6e7ad8bSJianfeng Tan 		/* May use invalid flag, but some backend uses kickfd and
206e6e7ad8bSJianfeng Tan 		 * callfd as criteria to judge if dev is alive. so finally we
207e6e7ad8bSJianfeng Tan 		 * use real event_fd.
208e6e7ad8bSJianfeng Tan 		 */
209e6e7ad8bSJianfeng Tan 		callfd = eventfd(0, EFD_CLOEXEC | EFD_NONBLOCK);
210e6e7ad8bSJianfeng Tan 		if (callfd < 0) {
211e6e7ad8bSJianfeng Tan 			PMD_DRV_LOG(ERR, "callfd error, %s", strerror(errno));
212e6e7ad8bSJianfeng Tan 			break;
213e6e7ad8bSJianfeng Tan 		}
214e6e7ad8bSJianfeng Tan 		kickfd = eventfd(0, EFD_CLOEXEC | EFD_NONBLOCK);
215e6e7ad8bSJianfeng Tan 		if (kickfd < 0) {
216e6e7ad8bSJianfeng Tan 			PMD_DRV_LOG(ERR, "kickfd error, %s", strerror(errno));
217e6e7ad8bSJianfeng Tan 			break;
218e6e7ad8bSJianfeng Tan 		}
219e6e7ad8bSJianfeng Tan 		dev->callfds[i] = callfd;
220e6e7ad8bSJianfeng Tan 		dev->kickfds[i] = kickfd;
221e6e7ad8bSJianfeng Tan 	}
222e6e7ad8bSJianfeng Tan 
223e6e7ad8bSJianfeng Tan 	if (i < VIRTIO_MAX_VIRTQUEUES) {
224e6e7ad8bSJianfeng Tan 		for (j = 0; j <= i; ++j) {
225e6e7ad8bSJianfeng Tan 			close(dev->callfds[j]);
226e6e7ad8bSJianfeng Tan 			close(dev->kickfds[j]);
227e6e7ad8bSJianfeng Tan 		}
228e6e7ad8bSJianfeng Tan 
229e6e7ad8bSJianfeng Tan 		return -1;
230e6e7ad8bSJianfeng Tan 	}
231e6e7ad8bSJianfeng Tan 
232e6e7ad8bSJianfeng Tan 	return 0;
233e6e7ad8bSJianfeng Tan }
234e6e7ad8bSJianfeng Tan 
235e6e7ad8bSJianfeng Tan static int
2363d4fb6fdSJianfeng Tan virtio_user_fill_intr_handle(struct virtio_user_dev *dev)
2373d4fb6fdSJianfeng Tan {
2383d4fb6fdSJianfeng Tan 	uint32_t i;
2393d4fb6fdSJianfeng Tan 	struct rte_eth_dev *eth_dev = &rte_eth_devices[dev->port_id];
2403d4fb6fdSJianfeng Tan 
2413d4fb6fdSJianfeng Tan 	if (!eth_dev->intr_handle) {
2423d4fb6fdSJianfeng Tan 		eth_dev->intr_handle = malloc(sizeof(*eth_dev->intr_handle));
2433d4fb6fdSJianfeng Tan 		if (!eth_dev->intr_handle) {
2443d4fb6fdSJianfeng Tan 			PMD_DRV_LOG(ERR, "fail to allocate intr_handle");
2453d4fb6fdSJianfeng Tan 			return -1;
2463d4fb6fdSJianfeng Tan 		}
2473d4fb6fdSJianfeng Tan 		memset(eth_dev->intr_handle, 0, sizeof(*eth_dev->intr_handle));
2483d4fb6fdSJianfeng Tan 	}
2493d4fb6fdSJianfeng Tan 
2503d4fb6fdSJianfeng Tan 	for (i = 0; i < dev->max_queue_pairs; ++i)
2513d4fb6fdSJianfeng Tan 		eth_dev->intr_handle->efds[i] = dev->callfds[i];
2523d4fb6fdSJianfeng Tan 	eth_dev->intr_handle->nb_efd = dev->max_queue_pairs;
2533d4fb6fdSJianfeng Tan 	eth_dev->intr_handle->max_intr = dev->max_queue_pairs + 1;
2543d4fb6fdSJianfeng Tan 	eth_dev->intr_handle->type = RTE_INTR_HANDLE_VDEV;
25529906b97SJingjing Wu 	/* For virtio vdev, no need to read counter for clean */
25629906b97SJingjing Wu 	eth_dev->intr_handle->efd_counter_size = 0;
257eae6e70cSJianfeng Tan 	eth_dev->intr_handle->fd = -1;
258cc4690e9SJianfeng Tan 	if (dev->vhostfd >= 0)
259cc4690e9SJianfeng Tan 		eth_dev->intr_handle->fd = dev->vhostfd;
260*bd8f50a4SZhiyong Yang 	else if (dev->is_server)
261*bd8f50a4SZhiyong Yang 		eth_dev->intr_handle->fd = dev->listenfd;
2623d4fb6fdSJianfeng Tan 
2633d4fb6fdSJianfeng Tan 	return 0;
2643d4fb6fdSJianfeng Tan }
2653d4fb6fdSJianfeng Tan 
2663d4fb6fdSJianfeng Tan static int
267e6e7ad8bSJianfeng Tan virtio_user_dev_setup(struct virtio_user_dev *dev)
268e6e7ad8bSJianfeng Tan {
269e6e7ad8bSJianfeng Tan 	uint32_t q;
270e6e7ad8bSJianfeng Tan 
271e6e7ad8bSJianfeng Tan 	dev->vhostfd = -1;
272e3b43481SJianfeng Tan 	dev->vhostfds = NULL;
273e3b43481SJianfeng Tan 	dev->tapfds = NULL;
274e3b43481SJianfeng Tan 
275*bd8f50a4SZhiyong Yang 	if (dev->is_server) {
276*bd8f50a4SZhiyong Yang 		if (access(dev->path, F_OK) == 0 &&
277*bd8f50a4SZhiyong Yang 		    !is_vhost_user_by_type(dev->path)) {
278*bd8f50a4SZhiyong Yang 			PMD_DRV_LOG(ERR, "Server mode doesn't support vhost-kernel!");
279*bd8f50a4SZhiyong Yang 			return -1;
280*bd8f50a4SZhiyong Yang 		}
281*bd8f50a4SZhiyong Yang 		dev->ops = &ops_user;
282*bd8f50a4SZhiyong Yang 	} else {
28333d24d65SJianfeng Tan 		if (is_vhost_user_by_type(dev->path)) {
28433d24d65SJianfeng Tan 			dev->ops = &ops_user;
285e3b43481SJianfeng Tan 		} else {
286e3b43481SJianfeng Tan 			dev->ops = &ops_kernel;
287e3b43481SJianfeng Tan 
288*bd8f50a4SZhiyong Yang 			dev->vhostfds = malloc(dev->max_queue_pairs *
289*bd8f50a4SZhiyong Yang 					       sizeof(int));
290*bd8f50a4SZhiyong Yang 			dev->tapfds = malloc(dev->max_queue_pairs *
291*bd8f50a4SZhiyong Yang 					     sizeof(int));
292e3b43481SJianfeng Tan 			if (!dev->vhostfds || !dev->tapfds) {
293e3b43481SJianfeng Tan 				PMD_INIT_LOG(ERR, "Failed to malloc");
294e3b43481SJianfeng Tan 				return -1;
29533d24d65SJianfeng Tan 			}
29633d24d65SJianfeng Tan 
297e3b43481SJianfeng Tan 			for (q = 0; q < dev->max_queue_pairs; ++q) {
298e3b43481SJianfeng Tan 				dev->vhostfds[q] = -1;
299e3b43481SJianfeng Tan 				dev->tapfds[q] = -1;
300e3b43481SJianfeng Tan 			}
301e3b43481SJianfeng Tan 		}
302*bd8f50a4SZhiyong Yang 	}
303e3b43481SJianfeng Tan 
304cc4690e9SJianfeng Tan 	if (dev->ops->setup(dev) < 0)
305cc4690e9SJianfeng Tan 		return -1;
306cc4690e9SJianfeng Tan 
307cc4690e9SJianfeng Tan 	if (virtio_user_dev_init_notify(dev) < 0)
308cc4690e9SJianfeng Tan 		return -1;
309cc4690e9SJianfeng Tan 
310cc4690e9SJianfeng Tan 	if (virtio_user_fill_intr_handle(dev) < 0)
311cc4690e9SJianfeng Tan 		return -1;
312cc4690e9SJianfeng Tan 
313cc4690e9SJianfeng Tan 	return 0;
31433d24d65SJianfeng Tan }
31533d24d65SJianfeng Tan 
/* Feature bits virtio-user can work with. The set is used as a mask on
 * the features reported by the vhost backend, and as the advertised
 * feature set while no backend is connected yet.
 */
#define VIRTIO_USER_SUPPORTED_FEATURES			\
	((1ULL << VIRTIO_NET_F_MAC)		|	\
	 (1ULL << VIRTIO_NET_F_STATUS)		|	\
	 (1ULL << VIRTIO_NET_F_MQ)		|	\
	 (1ULL << VIRTIO_NET_F_CTRL_MAC_ADDR)	|	\
	 (1ULL << VIRTIO_NET_F_CTRL_VQ)		|	\
	 (1ULL << VIRTIO_NET_F_CTRL_RX)		|	\
	 (1ULL << VIRTIO_NET_F_CTRL_VLAN)	|	\
	 (1ULL << VIRTIO_NET_F_CSUM)		|	\
	 (1ULL << VIRTIO_NET_F_HOST_TSO4)	|	\
	 (1ULL << VIRTIO_NET_F_HOST_TSO6)	|	\
	 (1ULL << VIRTIO_NET_F_MRG_RXBUF)	|	\
	 (1ULL << VIRTIO_RING_F_INDIRECT_DESC)	|	\
	 (1ULL << VIRTIO_NET_F_GUEST_CSUM)	|	\
	 (1ULL << VIRTIO_NET_F_GUEST_TSO4)	|	\
	 (1ULL << VIRTIO_NET_F_GUEST_TSO6)	|	\
	 (1ULL << VIRTIO_F_VERSION_1))
334bed3b24cSJianfeng Tan 
33537a7eb2aSJianfeng Tan int
33637a7eb2aSJianfeng Tan virtio_user_dev_init(struct virtio_user_dev *dev, char *path, int queues,
3374214a1b4SWenfeng Liu 		     int cq, int queue_size, const char *mac, char **ifname)
33837a7eb2aSJianfeng Tan {
339542849c0SJianfeng Tan 	snprintf(dev->path, PATH_MAX, "%s", path);
34037a7eb2aSJianfeng Tan 	dev->max_queue_pairs = queues;
34137a7eb2aSJianfeng Tan 	dev->queue_pairs = 1; /* mq disabled by default */
34237a7eb2aSJianfeng Tan 	dev->queue_size = queue_size;
34337a7eb2aSJianfeng Tan 	dev->mac_specified = 0;
34437a7eb2aSJianfeng Tan 	parse_mac(dev, mac);
34537a7eb2aSJianfeng Tan 
3464214a1b4SWenfeng Liu 	if (*ifname) {
3474214a1b4SWenfeng Liu 		dev->ifname = *ifname;
3484214a1b4SWenfeng Liu 		*ifname = NULL;
3494214a1b4SWenfeng Liu 	}
3504214a1b4SWenfeng Liu 
35133d24d65SJianfeng Tan 	if (virtio_user_dev_setup(dev) < 0) {
35237a7eb2aSJianfeng Tan 		PMD_INIT_LOG(ERR, "backend set up fails");
35337a7eb2aSJianfeng Tan 		return -1;
35437a7eb2aSJianfeng Tan 	}
355bce7e905SJianfeng Tan 
356*bd8f50a4SZhiyong Yang 	if (dev->vhostfd >= 0) {
357*bd8f50a4SZhiyong Yang 		if (dev->ops->send_request(dev, VHOST_USER_SET_OWNER,
358*bd8f50a4SZhiyong Yang 					   NULL) < 0) {
359*bd8f50a4SZhiyong Yang 			PMD_INIT_LOG(ERR, "set_owner fails: %s",
360*bd8f50a4SZhiyong Yang 				     strerror(errno));
36137a7eb2aSJianfeng Tan 			return -1;
36237a7eb2aSJianfeng Tan 		}
36337a7eb2aSJianfeng Tan 
36433d24d65SJianfeng Tan 		if (dev->ops->send_request(dev, VHOST_USER_GET_FEATURES,
365142678d4SJianfeng Tan 					   &dev->device_features) < 0) {
366*bd8f50a4SZhiyong Yang 			PMD_INIT_LOG(ERR, "get_features failed: %s",
367*bd8f50a4SZhiyong Yang 				     strerror(errno));
36837a7eb2aSJianfeng Tan 			return -1;
36937a7eb2aSJianfeng Tan 		}
370*bd8f50a4SZhiyong Yang 	} else {
371*bd8f50a4SZhiyong Yang 		/* We just pretend vhost-user can support all these features.
372*bd8f50a4SZhiyong Yang 		 * Note that this could be problematic that if some feature is
373*bd8f50a4SZhiyong Yang 		 * negotiated but not supported by the vhost-user which comes
374*bd8f50a4SZhiyong Yang 		 * later.
375*bd8f50a4SZhiyong Yang 		 */
376*bd8f50a4SZhiyong Yang 		dev->device_features = VIRTIO_USER_SUPPORTED_FEATURES;
377*bd8f50a4SZhiyong Yang 	}
378*bd8f50a4SZhiyong Yang 
37937a7eb2aSJianfeng Tan 	if (dev->mac_specified)
380142678d4SJianfeng Tan 		dev->device_features |= (1ull << VIRTIO_NET_F_MAC);
381f9b9d1a5SJianfeng Tan 
382142678d4SJianfeng Tan 	if (cq) {
383142678d4SJianfeng Tan 		/* device does not really need to know anything about CQ,
384142678d4SJianfeng Tan 		 * so if necessary, we just claim to support CQ
385f9b9d1a5SJianfeng Tan 		 */
386142678d4SJianfeng Tan 		dev->device_features |= (1ull << VIRTIO_NET_F_CTRL_VQ);
387142678d4SJianfeng Tan 	} else {
388142678d4SJianfeng Tan 		dev->device_features &= ~(1ull << VIRTIO_NET_F_CTRL_VQ);
389142678d4SJianfeng Tan 		/* Also disable features depends on VIRTIO_NET_F_CTRL_VQ */
390142678d4SJianfeng Tan 		dev->device_features &= ~(1ull << VIRTIO_NET_F_CTRL_RX);
391142678d4SJianfeng Tan 		dev->device_features &= ~(1ull << VIRTIO_NET_F_CTRL_VLAN);
392142678d4SJianfeng Tan 		dev->device_features &= ~(1ull << VIRTIO_NET_F_GUEST_ANNOUNCE);
393142678d4SJianfeng Tan 		dev->device_features &= ~(1ull << VIRTIO_NET_F_MQ);
394142678d4SJianfeng Tan 		dev->device_features &= ~(1ull << VIRTIO_NET_F_CTRL_MAC_ADDR);
395f9b9d1a5SJianfeng Tan 	}
396f9b9d1a5SJianfeng Tan 
39735c4f855SJianfeng Tan 	/* The backend will not report this feature, we add it explicitly */
3984bf9e26dSJianfeng Tan 	if (is_vhost_user_by_type(dev->path))
39935c4f855SJianfeng Tan 		dev->device_features |= (1ull << VIRTIO_NET_F_STATUS);
40035c4f855SJianfeng Tan 
401bed3b24cSJianfeng Tan 	dev->device_features &= VIRTIO_USER_SUPPORTED_FEATURES;
402bed3b24cSJianfeng Tan 
40337a7eb2aSJianfeng Tan 	return 0;
40437a7eb2aSJianfeng Tan }
40537a7eb2aSJianfeng Tan 
40637a7eb2aSJianfeng Tan void
40737a7eb2aSJianfeng Tan virtio_user_dev_uninit(struct virtio_user_dev *dev)
40837a7eb2aSJianfeng Tan {
409e3b43481SJianfeng Tan 	uint32_t i;
410e3b43481SJianfeng Tan 
411e3b43481SJianfeng Tan 	virtio_user_stop_device(dev);
412e3b43481SJianfeng Tan 
413e6e7ad8bSJianfeng Tan 	for (i = 0; i < dev->max_queue_pairs * 2; ++i) {
414e6e7ad8bSJianfeng Tan 		close(dev->callfds[i]);
415e6e7ad8bSJianfeng Tan 		close(dev->kickfds[i]);
416e6e7ad8bSJianfeng Tan 	}
417e6e7ad8bSJianfeng Tan 
41837a7eb2aSJianfeng Tan 	close(dev->vhostfd);
419e3b43481SJianfeng Tan 
420*bd8f50a4SZhiyong Yang 	if (dev->is_server && dev->listenfd >= 0) {
421*bd8f50a4SZhiyong Yang 		close(dev->listenfd);
422*bd8f50a4SZhiyong Yang 		dev->listenfd = -1;
423*bd8f50a4SZhiyong Yang 	}
424*bd8f50a4SZhiyong Yang 
425e3b43481SJianfeng Tan 	if (dev->vhostfds) {
426e3b43481SJianfeng Tan 		for (i = 0; i < dev->max_queue_pairs; ++i)
427e3b43481SJianfeng Tan 			close(dev->vhostfds[i]);
428e3b43481SJianfeng Tan 		free(dev->vhostfds);
429e3b43481SJianfeng Tan 		free(dev->tapfds);
430e3b43481SJianfeng Tan 	}
4314214a1b4SWenfeng Liu 
4324214a1b4SWenfeng Liu 	free(dev->ifname);
433*bd8f50a4SZhiyong Yang 
434*bd8f50a4SZhiyong Yang 	if (dev->is_server)
435*bd8f50a4SZhiyong Yang 		unlink(dev->path);
43637a7eb2aSJianfeng Tan }
437f9b9d1a5SJianfeng Tan 
438f9b9d1a5SJianfeng Tan static uint8_t
439f9b9d1a5SJianfeng Tan virtio_user_handle_mq(struct virtio_user_dev *dev, uint16_t q_pairs)
440f9b9d1a5SJianfeng Tan {
441f9b9d1a5SJianfeng Tan 	uint16_t i;
442f9b9d1a5SJianfeng Tan 	uint8_t ret = 0;
443f9b9d1a5SJianfeng Tan 
444f9b9d1a5SJianfeng Tan 	if (q_pairs > dev->max_queue_pairs) {
445f9b9d1a5SJianfeng Tan 		PMD_INIT_LOG(ERR, "multi-q config %u, but only %u supported",
446f9b9d1a5SJianfeng Tan 			     q_pairs, dev->max_queue_pairs);
447f9b9d1a5SJianfeng Tan 		return -1;
448f9b9d1a5SJianfeng Tan 	}
449f9b9d1a5SJianfeng Tan 
450f9b9d1a5SJianfeng Tan 	for (i = 0; i < q_pairs; ++i)
45133d24d65SJianfeng Tan 		ret |= dev->ops->enable_qp(dev, i, 1);
452f9b9d1a5SJianfeng Tan 	for (i = q_pairs; i < dev->max_queue_pairs; ++i)
45333d24d65SJianfeng Tan 		ret |= dev->ops->enable_qp(dev, i, 0);
454f9b9d1a5SJianfeng Tan 
455f9b9d1a5SJianfeng Tan 	dev->queue_pairs = q_pairs;
456f9b9d1a5SJianfeng Tan 
457f9b9d1a5SJianfeng Tan 	return ret;
458f9b9d1a5SJianfeng Tan }
459f9b9d1a5SJianfeng Tan 
460f9b9d1a5SJianfeng Tan static uint32_t
461f9b9d1a5SJianfeng Tan virtio_user_handle_ctrl_msg(struct virtio_user_dev *dev, struct vring *vring,
462f9b9d1a5SJianfeng Tan 			    uint16_t idx_hdr)
463f9b9d1a5SJianfeng Tan {
464f9b9d1a5SJianfeng Tan 	struct virtio_net_ctrl_hdr *hdr;
465f9b9d1a5SJianfeng Tan 	virtio_net_ctrl_ack status = ~0;
466f9b9d1a5SJianfeng Tan 	uint16_t i, idx_data, idx_status;
467f9b9d1a5SJianfeng Tan 	uint32_t n_descs = 0;
468f9b9d1a5SJianfeng Tan 
469f9b9d1a5SJianfeng Tan 	/* locate desc for header, data, and status */
470f9b9d1a5SJianfeng Tan 	idx_data = vring->desc[idx_hdr].next;
471f9b9d1a5SJianfeng Tan 	n_descs++;
472f9b9d1a5SJianfeng Tan 
473f9b9d1a5SJianfeng Tan 	i = idx_data;
474f9b9d1a5SJianfeng Tan 	while (vring->desc[i].flags == VRING_DESC_F_NEXT) {
475f9b9d1a5SJianfeng Tan 		i = vring->desc[i].next;
476f9b9d1a5SJianfeng Tan 		n_descs++;
477f9b9d1a5SJianfeng Tan 	}
478f9b9d1a5SJianfeng Tan 
479f9b9d1a5SJianfeng Tan 	/* locate desc for status */
480f9b9d1a5SJianfeng Tan 	idx_status = i;
481f9b9d1a5SJianfeng Tan 	n_descs++;
482f9b9d1a5SJianfeng Tan 
483f9b9d1a5SJianfeng Tan 	hdr = (void *)(uintptr_t)vring->desc[idx_hdr].addr;
484f9b9d1a5SJianfeng Tan 	if (hdr->class == VIRTIO_NET_CTRL_MQ &&
485f9b9d1a5SJianfeng Tan 	    hdr->cmd == VIRTIO_NET_CTRL_MQ_VQ_PAIRS_SET) {
486f9b9d1a5SJianfeng Tan 		uint16_t queues;
487f9b9d1a5SJianfeng Tan 
488f9b9d1a5SJianfeng Tan 		queues = *(uint16_t *)(uintptr_t)vring->desc[idx_data].addr;
489f9b9d1a5SJianfeng Tan 		status = virtio_user_handle_mq(dev, queues);
490f9b9d1a5SJianfeng Tan 	}
491f9b9d1a5SJianfeng Tan 
492f9b9d1a5SJianfeng Tan 	/* Update status */
493f9b9d1a5SJianfeng Tan 	*(virtio_net_ctrl_ack *)(uintptr_t)vring->desc[idx_status].addr = status;
494f9b9d1a5SJianfeng Tan 
495f9b9d1a5SJianfeng Tan 	return n_descs;
496f9b9d1a5SJianfeng Tan }
497f9b9d1a5SJianfeng Tan 
498f9b9d1a5SJianfeng Tan void
499f9b9d1a5SJianfeng Tan virtio_user_handle_cq(struct virtio_user_dev *dev, uint16_t queue_idx)
500f9b9d1a5SJianfeng Tan {
501f9b9d1a5SJianfeng Tan 	uint16_t avail_idx, desc_idx;
502f9b9d1a5SJianfeng Tan 	struct vring_used_elem *uep;
503f9b9d1a5SJianfeng Tan 	uint32_t n_descs;
504f9b9d1a5SJianfeng Tan 	struct vring *vring = &dev->vrings[queue_idx];
505f9b9d1a5SJianfeng Tan 
506f9b9d1a5SJianfeng Tan 	/* Consume avail ring, using used ring idx as first one */
507f9b9d1a5SJianfeng Tan 	while (vring->used->idx != vring->avail->idx) {
508f9b9d1a5SJianfeng Tan 		avail_idx = (vring->used->idx) & (vring->num - 1);
509f9b9d1a5SJianfeng Tan 		desc_idx = vring->avail->ring[avail_idx];
510f9b9d1a5SJianfeng Tan 
511f9b9d1a5SJianfeng Tan 		n_descs = virtio_user_handle_ctrl_msg(dev, vring, desc_idx);
512f9b9d1a5SJianfeng Tan 
513f9b9d1a5SJianfeng Tan 		/* Update used ring */
514f9b9d1a5SJianfeng Tan 		uep = &vring->used->ring[avail_idx];
515f9b9d1a5SJianfeng Tan 		uep->id = avail_idx;
516f9b9d1a5SJianfeng Tan 		uep->len = n_descs;
517f9b9d1a5SJianfeng Tan 
518f9b9d1a5SJianfeng Tan 		vring->used->idx++;
519f9b9d1a5SJianfeng Tan 	}
520f9b9d1a5SJianfeng Tan }
521