xref: /dpdk/drivers/net/virtio/virtio_user_ethdev.c (revision d7e10ea92ee6676af1be36d9afcc008423ad099e)
15566a3e3SBruce Richardson /* SPDX-License-Identifier: BSD-3-Clause
25566a3e3SBruce Richardson  * Copyright(c) 2010-2016 Intel Corporation
3e9efa4d9SJianfeng Tan  */
4e9efa4d9SJianfeng Tan 
#include <errno.h>
#include <stdint.h>
#include <stdlib.h>
#include <sys/types.h>
#include <unistd.h>
#include <fcntl.h>
#include <sys/stat.h>
#include <sys/sysmacros.h>
#include <sys/socket.h>
#include <linux/major.h>
13e9efa4d9SJianfeng Tan 
14ce2eabddSJianfeng Tan #include <rte_malloc.h>
15ce2eabddSJianfeng Tan #include <rte_kvargs.h>
16050fe6e9SJan Blunck #include <rte_ethdev_vdev.h>
17d4a586d2SJianfeng Tan #include <rte_bus_vdev.h>
18ef53b603SJianfeng Tan #include <rte_alarm.h>
196ebbf410SXuan Ding #include <rte_cycles.h>
20ce2eabddSJianfeng Tan 
21ce2eabddSJianfeng Tan #include "virtio_ethdev.h"
22e9efa4d9SJianfeng Tan #include "virtio_logs.h"
23e9efa4d9SJianfeng Tan #include "virtio_pci.h"
24e9efa4d9SJianfeng Tan #include "virtqueue.h"
251b69528eSJianfeng Tan #include "virtio_rxtx.h"
26e9efa4d9SJianfeng Tan #include "virtio_user/virtio_user_dev.h"
277f468b2eSTiwei Bie #include "virtio_user/vhost.h"
28e9efa4d9SJianfeng Tan 
/* Retrieve the virtio-user device context attached to a struct virtio_hw. */
#define virtio_user_get_dev(hw) \
	((struct virtio_user_dev *)((hw)->virtio_user_dev))
31e9efa4d9SJianfeng Tan 
326ebbf410SXuan Ding static void
336ebbf410SXuan Ding virtio_user_reset_queues_packed(struct rte_eth_dev *dev)
346ebbf410SXuan Ding {
356ebbf410SXuan Ding 	struct virtio_hw *hw = dev->data->dev_private;
366ebbf410SXuan Ding 	struct virtnet_rx *rxvq;
376ebbf410SXuan Ding 	struct virtnet_tx *txvq;
386ebbf410SXuan Ding 	uint16_t i;
396ebbf410SXuan Ding 
406ebbf410SXuan Ding 	/* Add lock to avoid queue contention. */
416ebbf410SXuan Ding 	rte_spinlock_lock(&hw->state_lock);
426ebbf410SXuan Ding 	hw->started = 0;
436ebbf410SXuan Ding 
446ebbf410SXuan Ding 	/*
456ebbf410SXuan Ding 	 * Waitting for datapath to complete before resetting queues.
466ebbf410SXuan Ding 	 * 1 ms should be enough for the ongoing Tx/Rx function to finish.
476ebbf410SXuan Ding 	 */
486ebbf410SXuan Ding 	rte_delay_ms(1);
496ebbf410SXuan Ding 
506ebbf410SXuan Ding 	/* Vring reset for each Tx queue and Rx queue. */
516ebbf410SXuan Ding 	for (i = 0; i < dev->data->nb_rx_queues; i++) {
526ebbf410SXuan Ding 		rxvq = dev->data->rx_queues[i];
536ebbf410SXuan Ding 		virtqueue_rxvq_reset_packed(rxvq->vq);
546ebbf410SXuan Ding 		virtio_dev_rx_queue_setup_finish(dev, i);
556ebbf410SXuan Ding 	}
566ebbf410SXuan Ding 
576ebbf410SXuan Ding 	for (i = 0; i < dev->data->nb_tx_queues; i++) {
586ebbf410SXuan Ding 		txvq = dev->data->tx_queues[i];
596ebbf410SXuan Ding 		virtqueue_txvq_reset_packed(txvq->vq);
606ebbf410SXuan Ding 	}
616ebbf410SXuan Ding 
626ebbf410SXuan Ding 	hw->started = 1;
636ebbf410SXuan Ding 	rte_spinlock_unlock(&hw->state_lock);
646ebbf410SXuan Ding }
656ebbf410SXuan Ding 
666ebbf410SXuan Ding 
67bd8f50a4SZhiyong Yang static int
68bd8f50a4SZhiyong Yang virtio_user_server_reconnect(struct virtio_user_dev *dev)
69bd8f50a4SZhiyong Yang {
70bd8f50a4SZhiyong Yang 	int ret;
71bd8f50a4SZhiyong Yang 	int connectfd;
72bd8f50a4SZhiyong Yang 	struct rte_eth_dev *eth_dev = &rte_eth_devices[dev->port_id];
736ebbf410SXuan Ding 	struct virtio_hw *hw = eth_dev->data->dev_private;
748e756105SMaxime Coquelin 	uint64_t protocol_features;
75bd8f50a4SZhiyong Yang 
76bd8f50a4SZhiyong Yang 	connectfd = accept(dev->listenfd, NULL, NULL);
77bd8f50a4SZhiyong Yang 	if (connectfd < 0)
78bd8f50a4SZhiyong Yang 		return -1;
79bd8f50a4SZhiyong Yang 
80bd8f50a4SZhiyong Yang 	dev->vhostfd = connectfd;
81201a4165SZhiyong Yang 	if (dev->ops->send_request(dev, VHOST_USER_GET_FEATURES,
82201a4165SZhiyong Yang 				   &dev->device_features) < 0) {
83201a4165SZhiyong Yang 		PMD_INIT_LOG(ERR, "get_features failed: %s",
84201a4165SZhiyong Yang 			     strerror(errno));
85201a4165SZhiyong Yang 		return -1;
86201a4165SZhiyong Yang 	}
87201a4165SZhiyong Yang 
888e756105SMaxime Coquelin 	if (dev->device_features &
898e756105SMaxime Coquelin 			(1ULL << VHOST_USER_F_PROTOCOL_FEATURES)) {
908e756105SMaxime Coquelin 		if (dev->ops->send_request(dev,
918e756105SMaxime Coquelin 					VHOST_USER_GET_PROTOCOL_FEATURES,
928e756105SMaxime Coquelin 					&protocol_features))
938e756105SMaxime Coquelin 			return -1;
948e756105SMaxime Coquelin 
958e756105SMaxime Coquelin 		dev->protocol_features &= protocol_features;
968e756105SMaxime Coquelin 
978e756105SMaxime Coquelin 		if (dev->ops->send_request(dev,
988e756105SMaxime Coquelin 					VHOST_USER_SET_PROTOCOL_FEATURES,
998e756105SMaxime Coquelin 					&dev->protocol_features))
1008e756105SMaxime Coquelin 			return -1;
1018e756105SMaxime Coquelin 
1028e756105SMaxime Coquelin 		if (!(dev->protocol_features &
1038e756105SMaxime Coquelin 				(1ULL << VHOST_USER_PROTOCOL_F_MQ)))
1048e756105SMaxime Coquelin 			dev->unsupported_features |= (1ull << VIRTIO_NET_F_MQ);
1058e756105SMaxime Coquelin 	}
1068e756105SMaxime Coquelin 
107bb97d2ddSTiwei Bie 	dev->device_features |= dev->frontend_features;
108bb97d2ddSTiwei Bie 
1097c66ff61SMarvin Liu 	/* umask vhost-user unsupported features */
1107c66ff61SMarvin Liu 	dev->device_features &= ~(dev->unsupported_features);
111201a4165SZhiyong Yang 
112201a4165SZhiyong Yang 	dev->features &= dev->device_features;
113201a4165SZhiyong Yang 
1146ebbf410SXuan Ding 	/* For packed ring, resetting queues is required in reconnection. */
11501996a03SMarvin Liu 	if (vtpci_packed_queue(hw) &&
11601996a03SMarvin Liu 	   (vtpci_get_status(hw) & VIRTIO_CONFIG_STATUS_DRIVER_OK)) {
1176ebbf410SXuan Ding 		PMD_INIT_LOG(NOTICE, "Packets on the fly will be dropped"
1186ebbf410SXuan Ding 				" when packed ring reconnecting.");
1196ebbf410SXuan Ding 		virtio_user_reset_queues_packed(eth_dev);
12092771257STiwei Bie 	}
1216ebbf410SXuan Ding 
122bd8f50a4SZhiyong Yang 	ret = virtio_user_start_device(dev);
123bd8f50a4SZhiyong Yang 	if (ret < 0)
124bd8f50a4SZhiyong Yang 		return -1;
125bd8f50a4SZhiyong Yang 
126201a4165SZhiyong Yang 	if (dev->queue_pairs > 1) {
127201a4165SZhiyong Yang 		ret = virtio_user_handle_mq(dev, dev->queue_pairs);
128201a4165SZhiyong Yang 		if (ret != 0) {
129201a4165SZhiyong Yang 			PMD_INIT_LOG(ERR, "Fails to enable multi-queue pairs!");
130201a4165SZhiyong Yang 			return -1;
131201a4165SZhiyong Yang 		}
132201a4165SZhiyong Yang 	}
133bd8f50a4SZhiyong Yang 	if (eth_dev->data->dev_flags & RTE_ETH_DEV_INTR_LSC) {
134bd8f50a4SZhiyong Yang 		if (rte_intr_disable(eth_dev->intr_handle) < 0) {
135bd8f50a4SZhiyong Yang 			PMD_DRV_LOG(ERR, "interrupt disable failed");
136bd8f50a4SZhiyong Yang 			return -1;
137bd8f50a4SZhiyong Yang 		}
138bd8f50a4SZhiyong Yang 		rte_intr_callback_unregister(eth_dev->intr_handle,
139bd8f50a4SZhiyong Yang 					     virtio_interrupt_handler,
140bd8f50a4SZhiyong Yang 					     eth_dev);
141bd8f50a4SZhiyong Yang 		eth_dev->intr_handle->fd = connectfd;
142bd8f50a4SZhiyong Yang 		rte_intr_callback_register(eth_dev->intr_handle,
143bd8f50a4SZhiyong Yang 					   virtio_interrupt_handler, eth_dev);
144bd8f50a4SZhiyong Yang 
145bd8f50a4SZhiyong Yang 		if (rte_intr_enable(eth_dev->intr_handle) < 0) {
146bd8f50a4SZhiyong Yang 			PMD_DRV_LOG(ERR, "interrupt enable failed");
147bd8f50a4SZhiyong Yang 			return -1;
148bd8f50a4SZhiyong Yang 		}
149bd8f50a4SZhiyong Yang 	}
150bd8f50a4SZhiyong Yang 	PMD_INIT_LOG(NOTICE, "server mode virtio-user reconnection succeeds!");
151bd8f50a4SZhiyong Yang 	return 0;
152bd8f50a4SZhiyong Yang }
153bd8f50a4SZhiyong Yang 
154e9efa4d9SJianfeng Tan static void
155ef53b603SJianfeng Tan virtio_user_delayed_handler(void *param)
156ef53b603SJianfeng Tan {
157ef53b603SJianfeng Tan 	struct virtio_hw *hw = (struct virtio_hw *)param;
158bd8f50a4SZhiyong Yang 	struct rte_eth_dev *eth_dev = &rte_eth_devices[hw->port_id];
159bd8f50a4SZhiyong Yang 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
160ef53b603SJianfeng Tan 
161bd8f50a4SZhiyong Yang 	if (rte_intr_disable(eth_dev->intr_handle) < 0) {
162bd8f50a4SZhiyong Yang 		PMD_DRV_LOG(ERR, "interrupt disable failed");
163bd8f50a4SZhiyong Yang 		return;
164bd8f50a4SZhiyong Yang 	}
165bd8f50a4SZhiyong Yang 	rte_intr_callback_unregister(eth_dev->intr_handle,
166bd8f50a4SZhiyong Yang 				     virtio_interrupt_handler, eth_dev);
167bd8f50a4SZhiyong Yang 	if (dev->is_server) {
168bd8f50a4SZhiyong Yang 		if (dev->vhostfd >= 0) {
169bd8f50a4SZhiyong Yang 			close(dev->vhostfd);
170bd8f50a4SZhiyong Yang 			dev->vhostfd = -1;
171bd8f50a4SZhiyong Yang 		}
172bd8f50a4SZhiyong Yang 		eth_dev->intr_handle->fd = dev->listenfd;
173bd8f50a4SZhiyong Yang 		rte_intr_callback_register(eth_dev->intr_handle,
174bd8f50a4SZhiyong Yang 					   virtio_interrupt_handler, eth_dev);
175bd8f50a4SZhiyong Yang 		if (rte_intr_enable(eth_dev->intr_handle) < 0) {
176bd8f50a4SZhiyong Yang 			PMD_DRV_LOG(ERR, "interrupt enable failed");
177bd8f50a4SZhiyong Yang 			return;
178bd8f50a4SZhiyong Yang 		}
179bd8f50a4SZhiyong Yang 	}
180ef53b603SJianfeng Tan }
181ef53b603SJianfeng Tan 
182ef53b603SJianfeng Tan static void
183e9efa4d9SJianfeng Tan virtio_user_read_dev_config(struct virtio_hw *hw, size_t offset,
184e9efa4d9SJianfeng Tan 		     void *dst, int length)
185e9efa4d9SJianfeng Tan {
186e9efa4d9SJianfeng Tan 	int i;
187e9efa4d9SJianfeng Tan 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
188e9efa4d9SJianfeng Tan 
189e9efa4d9SJianfeng Tan 	if (offset == offsetof(struct virtio_net_config, mac) &&
19035b2d13fSOlivier Matz 	    length == RTE_ETHER_ADDR_LEN) {
19135b2d13fSOlivier Matz 		for (i = 0; i < RTE_ETHER_ADDR_LEN; ++i)
192e9efa4d9SJianfeng Tan 			((uint8_t *)dst)[i] = dev->mac_addr[i];
193e9efa4d9SJianfeng Tan 		return;
194e9efa4d9SJianfeng Tan 	}
195e9efa4d9SJianfeng Tan 
196ef53b603SJianfeng Tan 	if (offset == offsetof(struct virtio_net_config, status)) {
197ef53b603SJianfeng Tan 		char buf[128];
198ef53b603SJianfeng Tan 
199ef53b603SJianfeng Tan 		if (dev->vhostfd >= 0) {
200ef53b603SJianfeng Tan 			int r;
201ef53b603SJianfeng Tan 			int flags;
202ef53b603SJianfeng Tan 
203ef53b603SJianfeng Tan 			flags = fcntl(dev->vhostfd, F_GETFL);
2042fd826a3SSebastian Basierski 			if (fcntl(dev->vhostfd, F_SETFL,
2052fd826a3SSebastian Basierski 					flags | O_NONBLOCK) == -1) {
2062fd826a3SSebastian Basierski 				PMD_DRV_LOG(ERR, "error setting O_NONBLOCK flag");
2072fd826a3SSebastian Basierski 				return;
2082fd826a3SSebastian Basierski 			}
209ef53b603SJianfeng Tan 			r = recv(dev->vhostfd, buf, 128, MSG_PEEK);
210ef53b603SJianfeng Tan 			if (r == 0 || (r < 0 && errno != EAGAIN)) {
211d0131e49SXiao Wang 				dev->net_status &= (~VIRTIO_NET_S_LINK_UP);
212ef53b603SJianfeng Tan 				PMD_DRV_LOG(ERR, "virtio-user port %u is down",
213ef53b603SJianfeng Tan 					    hw->port_id);
214bd8f50a4SZhiyong Yang 
215bd8f50a4SZhiyong Yang 				/* This function could be called in the process
216bd8f50a4SZhiyong Yang 				 * of interrupt handling, callback cannot be
217bd8f50a4SZhiyong Yang 				 * unregistered here, set an alarm to do it.
218ef53b603SJianfeng Tan 				 */
219ef53b603SJianfeng Tan 				rte_eal_alarm_set(1,
220ef53b603SJianfeng Tan 						  virtio_user_delayed_handler,
221ef53b603SJianfeng Tan 						  (void *)hw);
222ef53b603SJianfeng Tan 			} else {
223d0131e49SXiao Wang 				dev->net_status |= VIRTIO_NET_S_LINK_UP;
224ef53b603SJianfeng Tan 			}
225f76ef453SSebastian Basierski 			if (fcntl(dev->vhostfd, F_SETFL,
226f76ef453SSebastian Basierski 					flags & ~O_NONBLOCK) == -1) {
227f76ef453SSebastian Basierski 				PMD_DRV_LOG(ERR, "error clearing O_NONBLOCK flag");
228f76ef453SSebastian Basierski 				return;
229f76ef453SSebastian Basierski 			}
230bd8f50a4SZhiyong Yang 		} else if (dev->is_server) {
231d0131e49SXiao Wang 			dev->net_status &= (~VIRTIO_NET_S_LINK_UP);
232bd8f50a4SZhiyong Yang 			if (virtio_user_server_reconnect(dev) >= 0)
233d0131e49SXiao Wang 				dev->net_status |= VIRTIO_NET_S_LINK_UP;
234ef53b603SJianfeng Tan 		}
235bd8f50a4SZhiyong Yang 
236d0131e49SXiao Wang 		*(uint16_t *)dst = dev->net_status;
237ef53b603SJianfeng Tan 	}
238e9efa4d9SJianfeng Tan 
239e9efa4d9SJianfeng Tan 	if (offset == offsetof(struct virtio_net_config, max_virtqueue_pairs))
240e9efa4d9SJianfeng Tan 		*(uint16_t *)dst = dev->max_queue_pairs;
241e9efa4d9SJianfeng Tan }
242e9efa4d9SJianfeng Tan 
243e9efa4d9SJianfeng Tan static void
244e9efa4d9SJianfeng Tan virtio_user_write_dev_config(struct virtio_hw *hw, size_t offset,
245e9efa4d9SJianfeng Tan 		      const void *src, int length)
246e9efa4d9SJianfeng Tan {
247e9efa4d9SJianfeng Tan 	int i;
248e9efa4d9SJianfeng Tan 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
249e9efa4d9SJianfeng Tan 
250e9efa4d9SJianfeng Tan 	if ((offset == offsetof(struct virtio_net_config, mac)) &&
25135b2d13fSOlivier Matz 	    (length == RTE_ETHER_ADDR_LEN))
25235b2d13fSOlivier Matz 		for (i = 0; i < RTE_ETHER_ADDR_LEN; ++i)
253e9efa4d9SJianfeng Tan 			dev->mac_addr[i] = ((const uint8_t *)src)[i];
254e9efa4d9SJianfeng Tan 	else
255f2462150SFerruh Yigit 		PMD_DRV_LOG(ERR, "not supported offset=%zu, len=%d",
256e9efa4d9SJianfeng Tan 			    offset, length);
257e9efa4d9SJianfeng Tan }
258e9efa4d9SJianfeng Tan 
259e9efa4d9SJianfeng Tan static void
260c12a26eeSJianfeng Tan virtio_user_reset(struct virtio_hw *hw)
261c12a26eeSJianfeng Tan {
262c12a26eeSJianfeng Tan 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
263c12a26eeSJianfeng Tan 
264c12a26eeSJianfeng Tan 	if (dev->status & VIRTIO_CONFIG_STATUS_DRIVER_OK)
265c12a26eeSJianfeng Tan 		virtio_user_stop_device(dev);
266c12a26eeSJianfeng Tan }
267c12a26eeSJianfeng Tan 
268c12a26eeSJianfeng Tan static void
269e9efa4d9SJianfeng Tan virtio_user_set_status(struct virtio_hw *hw, uint8_t status)
270e9efa4d9SJianfeng Tan {
271e9efa4d9SJianfeng Tan 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
272844e4683SMaxime Coquelin 	uint8_t old_status = dev->status;
273e9efa4d9SJianfeng Tan 
274844e4683SMaxime Coquelin 	if (status & VIRTIO_CONFIG_STATUS_FEATURES_OK &&
275844e4683SMaxime Coquelin 			~old_status & VIRTIO_CONFIG_STATUS_FEATURES_OK)
276844e4683SMaxime Coquelin 		virtio_user_dev_set_features(dev);
277e9efa4d9SJianfeng Tan 	if (status & VIRTIO_CONFIG_STATUS_DRIVER_OK)
278e9efa4d9SJianfeng Tan 		virtio_user_start_device(dev);
279c12a26eeSJianfeng Tan 	else if (status == VIRTIO_CONFIG_STATUS_RESET)
280c12a26eeSJianfeng Tan 		virtio_user_reset(hw);
281*d7e10ea9SAdrian Moreno 
282*d7e10ea9SAdrian Moreno 	virtio_user_dev_set_status(dev, status);
283e9efa4d9SJianfeng Tan }
284e9efa4d9SJianfeng Tan 
285e9efa4d9SJianfeng Tan static uint8_t
286e9efa4d9SJianfeng Tan virtio_user_get_status(struct virtio_hw *hw)
287e9efa4d9SJianfeng Tan {
288e9efa4d9SJianfeng Tan 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
289e9efa4d9SJianfeng Tan 
290*d7e10ea9SAdrian Moreno 	virtio_user_dev_update_status(dev);
2910b0dc66cSAdrian Moreno 
292e9efa4d9SJianfeng Tan 	return dev->status;
293e9efa4d9SJianfeng Tan }
294e9efa4d9SJianfeng Tan 
295e9efa4d9SJianfeng Tan static uint64_t
296e9efa4d9SJianfeng Tan virtio_user_get_features(struct virtio_hw *hw)
297e9efa4d9SJianfeng Tan {
298e9efa4d9SJianfeng Tan 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
299e9efa4d9SJianfeng Tan 
300142678d4SJianfeng Tan 	/* unmask feature bits defined in vhost user protocol */
301142678d4SJianfeng Tan 	return dev->device_features & VIRTIO_PMD_SUPPORTED_GUEST_FEATURES;
302e9efa4d9SJianfeng Tan }
303e9efa4d9SJianfeng Tan 
304e9efa4d9SJianfeng Tan static void
305e9efa4d9SJianfeng Tan virtio_user_set_features(struct virtio_hw *hw, uint64_t features)
306e9efa4d9SJianfeng Tan {
307e9efa4d9SJianfeng Tan 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
308e9efa4d9SJianfeng Tan 
309142678d4SJianfeng Tan 	dev->features = features & dev->device_features;
310e9efa4d9SJianfeng Tan }
311e9efa4d9SJianfeng Tan 
312e9efa4d9SJianfeng Tan static uint8_t
313e9efa4d9SJianfeng Tan virtio_user_get_isr(struct virtio_hw *hw __rte_unused)
314e9efa4d9SJianfeng Tan {
31535c4f855SJianfeng Tan 	/* rxq interrupts and config interrupt are separated in virtio-user,
31635c4f855SJianfeng Tan 	 * here we only report config change.
317e9efa4d9SJianfeng Tan 	 */
31835c4f855SJianfeng Tan 	return VIRTIO_PCI_ISR_CONFIG;
319e9efa4d9SJianfeng Tan }
320e9efa4d9SJianfeng Tan 
321e9efa4d9SJianfeng Tan static uint16_t
322e9efa4d9SJianfeng Tan virtio_user_set_config_irq(struct virtio_hw *hw __rte_unused,
323e9efa4d9SJianfeng Tan 		    uint16_t vec __rte_unused)
324e9efa4d9SJianfeng Tan {
32535c4f855SJianfeng Tan 	return 0;
326e9efa4d9SJianfeng Tan }
327e9efa4d9SJianfeng Tan 
3283d4fb6fdSJianfeng Tan static uint16_t
3293d4fb6fdSJianfeng Tan virtio_user_set_queue_irq(struct virtio_hw *hw __rte_unused,
3303d4fb6fdSJianfeng Tan 			  struct virtqueue *vq __rte_unused,
3313d4fb6fdSJianfeng Tan 			  uint16_t vec)
3323d4fb6fdSJianfeng Tan {
3333d4fb6fdSJianfeng Tan 	/* pretend we have done that */
3343d4fb6fdSJianfeng Tan 	return vec;
3353d4fb6fdSJianfeng Tan }
3363d4fb6fdSJianfeng Tan 
337e9efa4d9SJianfeng Tan /* This function is to get the queue size, aka, number of descs, of a specified
338e9efa4d9SJianfeng Tan  * queue. Different with the VHOST_USER_GET_QUEUE_NUM, which is used to get the
339e9efa4d9SJianfeng Tan  * max supported queues.
340e9efa4d9SJianfeng Tan  */
341e9efa4d9SJianfeng Tan static uint16_t
342e9efa4d9SJianfeng Tan virtio_user_get_queue_num(struct virtio_hw *hw, uint16_t queue_id __rte_unused)
343e9efa4d9SJianfeng Tan {
344e9efa4d9SJianfeng Tan 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
345e9efa4d9SJianfeng Tan 
346e9efa4d9SJianfeng Tan 	/* Currently, each queue has same queue size */
347e9efa4d9SJianfeng Tan 	return dev->queue_size;
348e9efa4d9SJianfeng Tan }
349e9efa4d9SJianfeng Tan 
35048a44640SJens Freimann static void
35148a44640SJens Freimann virtio_user_setup_queue_packed(struct virtqueue *vq,
35248a44640SJens Freimann 			       struct virtio_user_dev *dev)
353e9efa4d9SJianfeng Tan {
35448a44640SJens Freimann 	uint16_t queue_idx = vq->vq_queue_index;
35548a44640SJens Freimann 	struct vring_packed *vring;
35648a44640SJens Freimann 	uint64_t desc_addr;
35748a44640SJens Freimann 	uint64_t avail_addr;
35848a44640SJens Freimann 	uint64_t used_addr;
35948a44640SJens Freimann 	uint16_t i;
36048a44640SJens Freimann 
36148a44640SJens Freimann 	vring  = &dev->packed_vrings[queue_idx];
36248a44640SJens Freimann 	desc_addr = (uintptr_t)vq->vq_ring_virt_mem;
36348a44640SJens Freimann 	avail_addr = desc_addr + vq->vq_nentries *
36448a44640SJens Freimann 		sizeof(struct vring_packed_desc);
36548a44640SJens Freimann 	used_addr = RTE_ALIGN_CEIL(avail_addr +
36648a44640SJens Freimann 			   sizeof(struct vring_packed_desc_event),
36748a44640SJens Freimann 			   VIRTIO_PCI_VRING_ALIGN);
36848a44640SJens Freimann 	vring->num = vq->vq_nentries;
3694cdc4d98STiwei Bie 	vring->desc = (void *)(uintptr_t)desc_addr;
3704cdc4d98STiwei Bie 	vring->driver = (void *)(uintptr_t)avail_addr;
3714cdc4d98STiwei Bie 	vring->device = (void *)(uintptr_t)used_addr;
37248a44640SJens Freimann 	dev->packed_queues[queue_idx].avail_wrap_counter = true;
37348a44640SJens Freimann 	dev->packed_queues[queue_idx].used_wrap_counter = true;
37448a44640SJens Freimann 
37545c224e7STiwei Bie 	for (i = 0; i < vring->num; i++)
3764cdc4d98STiwei Bie 		vring->desc[i].flags = 0;
37748a44640SJens Freimann }
37848a44640SJens Freimann 
37948a44640SJens Freimann static void
38048a44640SJens Freimann virtio_user_setup_queue_split(struct virtqueue *vq, struct virtio_user_dev *dev)
38148a44640SJens Freimann {
382e9efa4d9SJianfeng Tan 	uint16_t queue_idx = vq->vq_queue_index;
383e9efa4d9SJianfeng Tan 	uint64_t desc_addr, avail_addr, used_addr;
384e9efa4d9SJianfeng Tan 
385e9efa4d9SJianfeng Tan 	desc_addr = (uintptr_t)vq->vq_ring_virt_mem;
386e9efa4d9SJianfeng Tan 	avail_addr = desc_addr + vq->vq_nentries * sizeof(struct vring_desc);
387e9efa4d9SJianfeng Tan 	used_addr = RTE_ALIGN_CEIL(avail_addr + offsetof(struct vring_avail,
388e9efa4d9SJianfeng Tan 							 ring[vq->vq_nentries]),
389e9efa4d9SJianfeng Tan 				   VIRTIO_PCI_VRING_ALIGN);
390e9efa4d9SJianfeng Tan 
391e9efa4d9SJianfeng Tan 	dev->vrings[queue_idx].num = vq->vq_nentries;
392e9efa4d9SJianfeng Tan 	dev->vrings[queue_idx].desc = (void *)(uintptr_t)desc_addr;
393e9efa4d9SJianfeng Tan 	dev->vrings[queue_idx].avail = (void *)(uintptr_t)avail_addr;
394e9efa4d9SJianfeng Tan 	dev->vrings[queue_idx].used = (void *)(uintptr_t)used_addr;
39548a44640SJens Freimann }
39648a44640SJens Freimann 
/*
 * Set up a virtqueue, dispatching on the ring layout in use
 * (packed or split). Always returns 0.
 */
static int
virtio_user_setup_queue(struct virtio_hw *hw, struct virtqueue *vq)
{
	struct virtio_user_dev *udev = virtio_user_get_dev(hw);

	if (!vtpci_packed_queue(hw))
		virtio_user_setup_queue_split(vq, udev);
	else
		virtio_user_setup_queue_packed(vq, udev);

	return 0;
}
409e9efa4d9SJianfeng Tan 
410e9efa4d9SJianfeng Tan static void
411e9efa4d9SJianfeng Tan virtio_user_del_queue(struct virtio_hw *hw, struct virtqueue *vq)
412e9efa4d9SJianfeng Tan {
413e9efa4d9SJianfeng Tan 	/* For legacy devices, write 0 to VIRTIO_PCI_QUEUE_PFN port, QEMU
414e9efa4d9SJianfeng Tan 	 * correspondingly stops the ioeventfds, and reset the status of
415e9efa4d9SJianfeng Tan 	 * the device.
416e9efa4d9SJianfeng Tan 	 * For modern devices, set queue desc, avail, used in PCI bar to 0,
417e9efa4d9SJianfeng Tan 	 * not see any more behavior in QEMU.
418e9efa4d9SJianfeng Tan 	 *
419e9efa4d9SJianfeng Tan 	 * Here we just care about what information to deliver to vhost-user
420e9efa4d9SJianfeng Tan 	 * or vhost-kernel. So we just close ioeventfd for now.
421e9efa4d9SJianfeng Tan 	 */
422e9efa4d9SJianfeng Tan 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
423e9efa4d9SJianfeng Tan 
424e9efa4d9SJianfeng Tan 	close(dev->callfds[vq->vq_queue_index]);
425e9efa4d9SJianfeng Tan 	close(dev->kickfds[vq->vq_queue_index]);
426e9efa4d9SJianfeng Tan }
427e9efa4d9SJianfeng Tan 
428e9efa4d9SJianfeng Tan static void
429e9efa4d9SJianfeng Tan virtio_user_notify_queue(struct virtio_hw *hw, struct virtqueue *vq)
430e9efa4d9SJianfeng Tan {
431e9efa4d9SJianfeng Tan 	uint64_t buf = 1;
432e9efa4d9SJianfeng Tan 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
433e9efa4d9SJianfeng Tan 
4341b69528eSJianfeng Tan 	if (hw->cvq && (hw->cvq->vq == vq)) {
43548a44640SJens Freimann 		if (vtpci_packed_queue(vq->hw))
43648a44640SJens Freimann 			virtio_user_handle_cq_packed(dev, vq->vq_queue_index);
43748a44640SJens Freimann 		else
4381b69528eSJianfeng Tan 			virtio_user_handle_cq(dev, vq->vq_queue_index);
4391b69528eSJianfeng Tan 		return;
4401b69528eSJianfeng Tan 	}
4411b69528eSJianfeng Tan 
442e9efa4d9SJianfeng Tan 	if (write(dev->kickfds[vq->vq_queue_index], &buf, sizeof(buf)) < 0)
443f2462150SFerruh Yigit 		PMD_DRV_LOG(ERR, "failed to kick backend: %s",
444e9efa4d9SJianfeng Tan 			    strerror(errno));
445e9efa4d9SJianfeng Tan }
446e9efa4d9SJianfeng Tan 
4476d890f8aSYuanhan Liu const struct virtio_pci_ops virtio_user_ops = {
448e9efa4d9SJianfeng Tan 	.read_dev_cfg	= virtio_user_read_dev_config,
449e9efa4d9SJianfeng Tan 	.write_dev_cfg	= virtio_user_write_dev_config,
450e9efa4d9SJianfeng Tan 	.get_status	= virtio_user_get_status,
451e9efa4d9SJianfeng Tan 	.set_status	= virtio_user_set_status,
452e9efa4d9SJianfeng Tan 	.get_features	= virtio_user_get_features,
453e9efa4d9SJianfeng Tan 	.set_features	= virtio_user_set_features,
454e9efa4d9SJianfeng Tan 	.get_isr	= virtio_user_get_isr,
455e9efa4d9SJianfeng Tan 	.set_config_irq	= virtio_user_set_config_irq,
4563d4fb6fdSJianfeng Tan 	.set_queue_irq	= virtio_user_set_queue_irq,
457e9efa4d9SJianfeng Tan 	.get_queue_num	= virtio_user_get_queue_num,
458e9efa4d9SJianfeng Tan 	.setup_queue	= virtio_user_setup_queue,
459e9efa4d9SJianfeng Tan 	.del_queue	= virtio_user_del_queue,
460e9efa4d9SJianfeng Tan 	.notify_queue	= virtio_user_notify_queue,
461e9efa4d9SJianfeng Tan };
462ce2eabddSJianfeng Tan 
/* Names of the devargs keys understood by the virtio-user vdev. */
#define VIRTIO_USER_ARG_QUEUES_NUM     "queues"
#define VIRTIO_USER_ARG_CQ_NUM         "cq"
#define VIRTIO_USER_ARG_MAC            "mac"
#define VIRTIO_USER_ARG_PATH           "path"
#define VIRTIO_USER_ARG_QUEUE_SIZE     "queue_size"
#define VIRTIO_USER_ARG_INTERFACE_NAME "iface"
#define VIRTIO_USER_ARG_SERVER_MODE    "server"
#define VIRTIO_USER_ARG_MRG_RXBUF      "mrg_rxbuf"
#define VIRTIO_USER_ARG_IN_ORDER       "in_order"
#define VIRTIO_USER_ARG_PACKED_VQ      "packed_vq"
#define VIRTIO_USER_ARG_SPEED          "speed"
#define VIRTIO_USER_ARG_VECTORIZED     "vectorized"

/* NULL-terminated list of the keys above. */
static const char *valid_args[] = {
	VIRTIO_USER_ARG_QUEUES_NUM,
	VIRTIO_USER_ARG_CQ_NUM,
	VIRTIO_USER_ARG_MAC,
	VIRTIO_USER_ARG_PATH,
	VIRTIO_USER_ARG_QUEUE_SIZE,
	VIRTIO_USER_ARG_INTERFACE_NAME,
	VIRTIO_USER_ARG_SERVER_MODE,
	VIRTIO_USER_ARG_MRG_RXBUF,
	VIRTIO_USER_ARG_IN_ORDER,
	VIRTIO_USER_ARG_PACKED_VQ,
	VIRTIO_USER_ARG_SPEED,
	VIRTIO_USER_ARG_VECTORIZED,
	NULL
};
490ce2eabddSJianfeng Tan 
/* Default values used when the matching devarg is not supplied. */
#define VIRTIO_USER_DEF_CQ_EN		0	/* "cq" */
#define VIRTIO_USER_DEF_Q_NUM		1	/* "queues" */
#define VIRTIO_USER_DEF_Q_SZ		256	/* "queue_size" */
#define VIRTIO_USER_DEF_SERVER_MODE	0	/* "server" */
495ce2eabddSJianfeng Tan 
/*
 * kvargs handler: duplicate 'value' and store the copy through
 * 'extra_args', which must point to a char *.
 *
 * The stored string is allocated with strdup(); releasing it is left to
 * the caller.
 *
 * Returns 0 on success, -EINVAL if 'value' or 'extra_args' is NULL, or
 * -ENOMEM if the duplication fails (in which case NULL is stored).
 */
static int
get_string_arg(const char *key __rte_unused,
	       const char *value, void *extra_args)
{
	char **out = extra_args;
	char *copy;

	if (value == NULL || out == NULL)
		return -EINVAL;

	copy = strdup(value);
	*out = copy;

	return copy != NULL ? 0 : -ENOMEM;
}
510ce2eabddSJianfeng Tan 
/*
 * kvargs handler: parse 'value' as an unsigned integer and store it
 * through 'extra_args', which must point to a uint64_t.
 *
 * The base is auto-detected by strtoull() (base 0: decimal, 0x hex,
 * leading-0 octal). The destination keeps its previous (default) value
 * unless the whole string parses successfully.
 *
 * Returns 0 on success, -EINVAL if an argument is NULL, if 'value' holds
 * no digits, or if it has trailing characters after the number, and
 * -errno (e.g. -ERANGE) if strtoull() itself reports an error.
 */
static int
get_integer_arg(const char *key __rte_unused,
		const char *value, void *extra_args)
{
	unsigned long long parsed;
	char *end = NULL;

	if (!value || !extra_args)
		return -EINVAL;

	errno = 0;
	parsed = strtoull(value, &end, 0);
	if (errno != 0)
		return -errno;

	/*
	 * strtoull() reports neither "no digits at all" nor trailing garbage
	 * through errno; both are only visible via the end pointer.
	 */
	if (end == value || *end != '\0')
		return -EINVAL;

	*(uint64_t *)extra_args = parsed;
	return 0;
}
527ce2eabddSJianfeng Tan 
5287d62bf6fSMaxime Coquelin static uint32_t
5297d62bf6fSMaxime Coquelin vdpa_dynamic_major_num(void)
5307d62bf6fSMaxime Coquelin {
5317d62bf6fSMaxime Coquelin 	FILE *fp;
5327d62bf6fSMaxime Coquelin 	char *line = NULL;
5337d62bf6fSMaxime Coquelin 	size_t size;
5347d62bf6fSMaxime Coquelin 	char name[11];
5357d62bf6fSMaxime Coquelin 	bool found = false;
5367d62bf6fSMaxime Coquelin 	uint32_t num;
5377d62bf6fSMaxime Coquelin 
5387d62bf6fSMaxime Coquelin 	fp = fopen("/proc/devices", "r");
5397d62bf6fSMaxime Coquelin 	if (fp == NULL) {
5407d62bf6fSMaxime Coquelin 		PMD_INIT_LOG(ERR, "Cannot open /proc/devices: %s",
5417d62bf6fSMaxime Coquelin 			     strerror(errno));
5427d62bf6fSMaxime Coquelin 		return UNNAMED_MAJOR;
5437d62bf6fSMaxime Coquelin 	}
5447d62bf6fSMaxime Coquelin 
5457d62bf6fSMaxime Coquelin 	while (getline(&line, &size, fp) > 0) {
5467d62bf6fSMaxime Coquelin 		char *stripped = line + strspn(line, " ");
5477d62bf6fSMaxime Coquelin 		if ((sscanf(stripped, "%u %10s", &num, name) == 2) &&
5487d62bf6fSMaxime Coquelin 		    (strncmp(name, "vhost-vdpa", 10) == 0)) {
5497d62bf6fSMaxime Coquelin 			found = true;
5507d62bf6fSMaxime Coquelin 			break;
5517d62bf6fSMaxime Coquelin 		}
5527d62bf6fSMaxime Coquelin 	}
5537d62bf6fSMaxime Coquelin 	fclose(fp);
5547d62bf6fSMaxime Coquelin 	return found ? num : UNNAMED_MAJOR;
5557d62bf6fSMaxime Coquelin }
5567d62bf6fSMaxime Coquelin 
557f908b22eSAdrian Moreno static enum virtio_user_backend_type
558f908b22eSAdrian Moreno virtio_user_backend_type(const char *path)
559f908b22eSAdrian Moreno {
560f908b22eSAdrian Moreno 	struct stat sb;
561f908b22eSAdrian Moreno 
5627d62bf6fSMaxime Coquelin 	if (stat(path, &sb) == -1) {
563b0395dc8SAdrian Moreno 		if (errno == ENOENT)
564b0395dc8SAdrian Moreno 			return VIRTIO_USER_BACKEND_VHOST_USER;
565b0395dc8SAdrian Moreno 
5667d62bf6fSMaxime Coquelin 		PMD_INIT_LOG(ERR, "Stat fails: %s (%s)\n", path,
5677d62bf6fSMaxime Coquelin 			     strerror(errno));
568f908b22eSAdrian Moreno 		return VIRTIO_USER_BACKEND_UNKNOWN;
5697d62bf6fSMaxime Coquelin 	}
570f908b22eSAdrian Moreno 
5717d62bf6fSMaxime Coquelin 	if (S_ISSOCK(sb.st_mode)) {
5727d62bf6fSMaxime Coquelin 		return VIRTIO_USER_BACKEND_VHOST_USER;
5737d62bf6fSMaxime Coquelin 	} else if (S_ISCHR(sb.st_mode)) {
5747d62bf6fSMaxime Coquelin 		if (major(sb.st_rdev) == MISC_MAJOR)
5757d62bf6fSMaxime Coquelin 			return VIRTIO_USER_BACKEND_VHOST_KERNEL;
5767d62bf6fSMaxime Coquelin 		if (major(sb.st_rdev) == vdpa_dynamic_major_num())
5777d62bf6fSMaxime Coquelin 			return VIRTIO_USER_BACKEND_VHOST_VDPA;
5787d62bf6fSMaxime Coquelin 	}
5797d62bf6fSMaxime Coquelin 	return VIRTIO_USER_BACKEND_UNKNOWN;
580f908b22eSAdrian Moreno }
581f908b22eSAdrian Moreno 
582ce2eabddSJianfeng Tan static struct rte_eth_dev *
583050fe6e9SJan Blunck virtio_user_eth_dev_alloc(struct rte_vdev_device *vdev)
584ce2eabddSJianfeng Tan {
585ce2eabddSJianfeng Tan 	struct rte_eth_dev *eth_dev;
586ce2eabddSJianfeng Tan 	struct rte_eth_dev_data *data;
587ce2eabddSJianfeng Tan 	struct virtio_hw *hw;
588ce2eabddSJianfeng Tan 	struct virtio_user_dev *dev;
589ce2eabddSJianfeng Tan 
590050fe6e9SJan Blunck 	eth_dev = rte_eth_vdev_allocate(vdev, sizeof(*hw));
591ce2eabddSJianfeng Tan 	if (!eth_dev) {
592ce2eabddSJianfeng Tan 		PMD_INIT_LOG(ERR, "cannot alloc rte_eth_dev");
593ce2eabddSJianfeng Tan 		return NULL;
594ce2eabddSJianfeng Tan 	}
595ce2eabddSJianfeng Tan 
596ce2eabddSJianfeng Tan 	data = eth_dev->data;
597050fe6e9SJan Blunck 	hw = eth_dev->data->dev_private;
598ce2eabddSJianfeng Tan 
599ce2eabddSJianfeng Tan 	dev = rte_zmalloc(NULL, sizeof(*dev), 0);
600ce2eabddSJianfeng Tan 	if (!dev) {
601ce2eabddSJianfeng Tan 		PMD_INIT_LOG(ERR, "malloc virtio_user_dev failed");
602ce2eabddSJianfeng Tan 		rte_eth_dev_release_port(eth_dev);
603ce2eabddSJianfeng Tan 		return NULL;
604ce2eabddSJianfeng Tan 	}
605ce2eabddSJianfeng Tan 
606553f4593SYuanhan Liu 	hw->port_id = data->port_id;
6073d4fb6fdSJianfeng Tan 	dev->port_id = data->port_id;
608553f4593SYuanhan Liu 	virtio_hw_internal[hw->port_id].vtpci_ops = &virtio_user_ops;
609ef53b603SJianfeng Tan 	/*
610ef53b603SJianfeng Tan 	 * MSIX is required to enable LSC (see virtio_init_device).
611ef53b603SJianfeng Tan 	 * Here just pretend that we support msix.
612ef53b603SJianfeng Tan 	 */
613ef53b603SJianfeng Tan 	hw->use_msix = 1;
614ce2eabddSJianfeng Tan 	hw->modern   = 0;
6154710e16aSMarvin Liu 	hw->use_vec_rx = 0;
61677d66da8SMarvin Liu 	hw->use_vec_tx = 0;
6179f233f54SMarvin Liu 	hw->use_inorder_rx = 0;
6189f233f54SMarvin Liu 	hw->use_inorder_tx = 0;
619ce2eabddSJianfeng Tan 	hw->virtio_user_dev = dev;
620ce2eabddSJianfeng Tan 	return eth_dev;
621ce2eabddSJianfeng Tan }
622ce2eabddSJianfeng Tan 
623ca8326a9SJianfeng Tan static void
624ca8326a9SJianfeng Tan virtio_user_eth_dev_free(struct rte_eth_dev *eth_dev)
625ca8326a9SJianfeng Tan {
626ca8326a9SJianfeng Tan 	struct rte_eth_dev_data *data = eth_dev->data;
627ca8326a9SJianfeng Tan 	struct virtio_hw *hw = data->dev_private;
628ca8326a9SJianfeng Tan 
629ca8326a9SJianfeng Tan 	rte_free(hw->virtio_user_dev);
630ca8326a9SJianfeng Tan 	rte_eth_dev_release_port(eth_dev);
631ca8326a9SJianfeng Tan }
632ca8326a9SJianfeng Tan 
633ce2eabddSJianfeng Tan /* Dev initialization routine. Invoked once for each virtio vdev at
634c3b2fdfeSYong Wang  * EAL init time, see rte_bus_probe().
635ce2eabddSJianfeng Tan  * Returns 0 on success.
636ce2eabddSJianfeng Tan  */
637ce2eabddSJianfeng Tan static int
6385d2aa461SJan Blunck virtio_user_pmd_probe(struct rte_vdev_device *dev)
639ce2eabddSJianfeng Tan {
64014f06474SJianfeng Tan 	struct rte_kvargs *kvlist = NULL;
641ce2eabddSJianfeng Tan 	struct rte_eth_dev *eth_dev;
642ce2eabddSJianfeng Tan 	struct virtio_hw *hw;
643f908b22eSAdrian Moreno 	enum virtio_user_backend_type backend_type = VIRTIO_USER_BACKEND_UNKNOWN;
644ce2eabddSJianfeng Tan 	uint64_t queues = VIRTIO_USER_DEF_Q_NUM;
645ce2eabddSJianfeng Tan 	uint64_t cq = VIRTIO_USER_DEF_CQ_EN;
646ce2eabddSJianfeng Tan 	uint64_t queue_size = VIRTIO_USER_DEF_Q_SZ;
647bd8f50a4SZhiyong Yang 	uint64_t server_mode = VIRTIO_USER_DEF_SERVER_MODE;
648488ed97aSMarvin Liu 	uint64_t mrg_rxbuf = 1;
649488ed97aSMarvin Liu 	uint64_t in_order = 1;
6509070f88bSTiwei Bie 	uint64_t packed_vq = 0;
6516b7eefbcSMarvin Liu 	uint64_t vectorized = 0;
652ce2eabddSJianfeng Tan 	char *path = NULL;
6534214a1b4SWenfeng Liu 	char *ifname = NULL;
654ce2eabddSJianfeng Tan 	char *mac_addr = NULL;
655ce2eabddSJianfeng Tan 	int ret = -1;
656ce2eabddSJianfeng Tan 
6571c8489daSTiwei Bie 	if (rte_eal_process_type() == RTE_PROC_SECONDARY) {
6581c8489daSTiwei Bie 		const char *name = rte_vdev_device_name(dev);
6591c8489daSTiwei Bie 		eth_dev = rte_eth_dev_attach_secondary(name);
6601c8489daSTiwei Bie 		if (!eth_dev) {
66188fa5bb6SStephen Hemminger 			PMD_INIT_LOG(ERR, "Failed to probe %s", name);
6621c8489daSTiwei Bie 			return -1;
6631c8489daSTiwei Bie 		}
6641c8489daSTiwei Bie 
6651c8489daSTiwei Bie 		if (eth_virtio_dev_init(eth_dev) < 0) {
6661c8489daSTiwei Bie 			PMD_INIT_LOG(ERR, "eth_virtio_dev_init fails");
6671c8489daSTiwei Bie 			rte_eth_dev_release_port(eth_dev);
6681c8489daSTiwei Bie 			return -1;
6691c8489daSTiwei Bie 		}
6701c8489daSTiwei Bie 
6711c8489daSTiwei Bie 		eth_dev->dev_ops = &virtio_user_secondary_eth_dev_ops;
6721c8489daSTiwei Bie 		eth_dev->device = &dev->device;
6731c8489daSTiwei Bie 		rte_eth_dev_probing_finish(eth_dev);
6741c8489daSTiwei Bie 		return 0;
6751c8489daSTiwei Bie 	}
6761c8489daSTiwei Bie 
6775d2aa461SJan Blunck 	kvlist = rte_kvargs_parse(rte_vdev_device_args(dev), valid_args);
678ce2eabddSJianfeng Tan 	if (!kvlist) {
679ce2eabddSJianfeng Tan 		PMD_INIT_LOG(ERR, "error when parsing param");
680ce2eabddSJianfeng Tan 		goto end;
681ce2eabddSJianfeng Tan 	}
682ce2eabddSJianfeng Tan 
6839cca159eSMaxime Coquelin 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_PATH) == 1) {
684ca8326a9SJianfeng Tan 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_PATH,
685ca8326a9SJianfeng Tan 				       &get_string_arg, &path) < 0) {
686404bd6bfSJianfeng Tan 			PMD_INIT_LOG(ERR, "error to parse %s",
687404bd6bfSJianfeng Tan 				     VIRTIO_USER_ARG_PATH);
688404bd6bfSJianfeng Tan 			goto end;
689404bd6bfSJianfeng Tan 		}
6909cca159eSMaxime Coquelin 	} else {
691f2462150SFerruh Yigit 		PMD_INIT_LOG(ERR, "arg %s is mandatory for virtio_user",
6922dac0df4STiwei Bie 			     VIRTIO_USER_ARG_PATH);
693ce2eabddSJianfeng Tan 		goto end;
694ce2eabddSJianfeng Tan 	}
695ce2eabddSJianfeng Tan 
696f908b22eSAdrian Moreno 	backend_type = virtio_user_backend_type(path);
697f908b22eSAdrian Moreno 	if (backend_type == VIRTIO_USER_BACKEND_UNKNOWN) {
698f908b22eSAdrian Moreno 		PMD_INIT_LOG(ERR,
699f908b22eSAdrian Moreno 			     "unable to determine backend type for path %s",
700f908b22eSAdrian Moreno 			path);
701f908b22eSAdrian Moreno 		goto end;
702f908b22eSAdrian Moreno 	}
703b0395dc8SAdrian Moreno 	PMD_INIT_LOG(INFO, "Backend type detected: %s",
704b0395dc8SAdrian Moreno 		     virtio_user_backend_strings[backend_type]);
705f908b22eSAdrian Moreno 
7064214a1b4SWenfeng Liu 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_INTERFACE_NAME) == 1) {
707f908b22eSAdrian Moreno 		if (backend_type != VIRTIO_USER_BACKEND_VHOST_KERNEL) {
7084214a1b4SWenfeng Liu 			PMD_INIT_LOG(ERR,
7094214a1b4SWenfeng Liu 				"arg %s applies only to vhost-kernel backend",
7104214a1b4SWenfeng Liu 				VIRTIO_USER_ARG_INTERFACE_NAME);
7114214a1b4SWenfeng Liu 			goto end;
7124214a1b4SWenfeng Liu 		}
7134214a1b4SWenfeng Liu 
7144214a1b4SWenfeng Liu 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_INTERFACE_NAME,
7154214a1b4SWenfeng Liu 				       &get_string_arg, &ifname) < 0) {
7164214a1b4SWenfeng Liu 			PMD_INIT_LOG(ERR, "error to parse %s",
7174214a1b4SWenfeng Liu 				     VIRTIO_USER_ARG_INTERFACE_NAME);
7184214a1b4SWenfeng Liu 			goto end;
7194214a1b4SWenfeng Liu 		}
7204214a1b4SWenfeng Liu 	}
7214214a1b4SWenfeng Liu 
722404bd6bfSJianfeng Tan 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_MAC) == 1) {
723ca8326a9SJianfeng Tan 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_MAC,
724ca8326a9SJianfeng Tan 				       &get_string_arg, &mac_addr) < 0) {
725404bd6bfSJianfeng Tan 			PMD_INIT_LOG(ERR, "error to parse %s",
726404bd6bfSJianfeng Tan 				     VIRTIO_USER_ARG_MAC);
727404bd6bfSJianfeng Tan 			goto end;
728404bd6bfSJianfeng Tan 		}
729404bd6bfSJianfeng Tan 	}
730ce2eabddSJianfeng Tan 
731404bd6bfSJianfeng Tan 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_QUEUE_SIZE) == 1) {
732ca8326a9SJianfeng Tan 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_QUEUE_SIZE,
733ca8326a9SJianfeng Tan 				       &get_integer_arg, &queue_size) < 0) {
734404bd6bfSJianfeng Tan 			PMD_INIT_LOG(ERR, "error to parse %s",
735404bd6bfSJianfeng Tan 				     VIRTIO_USER_ARG_QUEUE_SIZE);
736404bd6bfSJianfeng Tan 			goto end;
737404bd6bfSJianfeng Tan 		}
738404bd6bfSJianfeng Tan 	}
739ce2eabddSJianfeng Tan 
740404bd6bfSJianfeng Tan 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_QUEUES_NUM) == 1) {
741ca8326a9SJianfeng Tan 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_QUEUES_NUM,
742ca8326a9SJianfeng Tan 				       &get_integer_arg, &queues) < 0) {
743404bd6bfSJianfeng Tan 			PMD_INIT_LOG(ERR, "error to parse %s",
744404bd6bfSJianfeng Tan 				     VIRTIO_USER_ARG_QUEUES_NUM);
745404bd6bfSJianfeng Tan 			goto end;
746404bd6bfSJianfeng Tan 		}
747404bd6bfSJianfeng Tan 	}
748ce2eabddSJianfeng Tan 
749bd8f50a4SZhiyong Yang 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_SERVER_MODE) == 1) {
750bd8f50a4SZhiyong Yang 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_SERVER_MODE,
751bd8f50a4SZhiyong Yang 				       &get_integer_arg, &server_mode) < 0) {
752bd8f50a4SZhiyong Yang 			PMD_INIT_LOG(ERR, "error to parse %s",
753bd8f50a4SZhiyong Yang 				     VIRTIO_USER_ARG_SERVER_MODE);
754bd8f50a4SZhiyong Yang 			goto end;
755bd8f50a4SZhiyong Yang 		}
756bd8f50a4SZhiyong Yang 	}
757bd8f50a4SZhiyong Yang 
758404bd6bfSJianfeng Tan 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_CQ_NUM) == 1) {
759ca8326a9SJianfeng Tan 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_CQ_NUM,
760ca8326a9SJianfeng Tan 				       &get_integer_arg, &cq) < 0) {
761404bd6bfSJianfeng Tan 			PMD_INIT_LOG(ERR, "error to parse %s",
762404bd6bfSJianfeng Tan 				     VIRTIO_USER_ARG_CQ_NUM);
763404bd6bfSJianfeng Tan 			goto end;
764404bd6bfSJianfeng Tan 		}
765404bd6bfSJianfeng Tan 	} else if (queues > 1) {
7661b69528eSJianfeng Tan 		cq = 1;
767404bd6bfSJianfeng Tan 	}
7681b69528eSJianfeng Tan 
76934f3966cSYuanhan Liu 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_PACKED_VQ) == 1) {
77034f3966cSYuanhan Liu 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_PACKED_VQ,
77134f3966cSYuanhan Liu 				       &get_integer_arg, &packed_vq) < 0) {
77234f3966cSYuanhan Liu 			PMD_INIT_LOG(ERR, "error to parse %s",
77334f3966cSYuanhan Liu 				     VIRTIO_USER_ARG_PACKED_VQ);
77434f3966cSYuanhan Liu 			goto end;
77534f3966cSYuanhan Liu 		}
77634f3966cSYuanhan Liu 	}
77734f3966cSYuanhan Liu 
7786b7eefbcSMarvin Liu 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_VECTORIZED) == 1) {
7796b7eefbcSMarvin Liu 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_VECTORIZED,
7806b7eefbcSMarvin Liu 				       &get_integer_arg, &vectorized) < 0) {
7816b7eefbcSMarvin Liu 			PMD_INIT_LOG(ERR, "error to parse %s",
7826b7eefbcSMarvin Liu 				     VIRTIO_USER_ARG_VECTORIZED);
7836b7eefbcSMarvin Liu 			goto end;
7846b7eefbcSMarvin Liu 		}
7856b7eefbcSMarvin Liu 	}
7866b7eefbcSMarvin Liu 
7871b69528eSJianfeng Tan 	if (queues > 1 && cq == 0) {
7881b69528eSJianfeng Tan 		PMD_INIT_LOG(ERR, "multi-q requires ctrl-q");
7891b69528eSJianfeng Tan 		goto end;
7901b69528eSJianfeng Tan 	}
791ce2eabddSJianfeng Tan 
7922269b9aeSWenfeng Liu 	if (queues > VIRTIO_MAX_VIRTQUEUE_PAIRS) {
7932269b9aeSWenfeng Liu 		PMD_INIT_LOG(ERR, "arg %s %" PRIu64 " exceeds the limit %u",
7942269b9aeSWenfeng Liu 			VIRTIO_USER_ARG_QUEUES_NUM, queues,
7952269b9aeSWenfeng Liu 			VIRTIO_MAX_VIRTQUEUE_PAIRS);
7962269b9aeSWenfeng Liu 		goto end;
7972269b9aeSWenfeng Liu 	}
7982269b9aeSWenfeng Liu 
799488ed97aSMarvin Liu 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_MRG_RXBUF) == 1) {
800488ed97aSMarvin Liu 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_MRG_RXBUF,
801488ed97aSMarvin Liu 				       &get_integer_arg, &mrg_rxbuf) < 0) {
802488ed97aSMarvin Liu 			PMD_INIT_LOG(ERR, "error to parse %s",
803488ed97aSMarvin Liu 				     VIRTIO_USER_ARG_MRG_RXBUF);
804488ed97aSMarvin Liu 			goto end;
805488ed97aSMarvin Liu 		}
806488ed97aSMarvin Liu 	}
807488ed97aSMarvin Liu 
808488ed97aSMarvin Liu 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_IN_ORDER) == 1) {
809488ed97aSMarvin Liu 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_IN_ORDER,
810488ed97aSMarvin Liu 				       &get_integer_arg, &in_order) < 0) {
811488ed97aSMarvin Liu 			PMD_INIT_LOG(ERR, "error to parse %s",
812488ed97aSMarvin Liu 				     VIRTIO_USER_ARG_IN_ORDER);
813488ed97aSMarvin Liu 			goto end;
814488ed97aSMarvin Liu 		}
815488ed97aSMarvin Liu 	}
816488ed97aSMarvin Liu 
817050fe6e9SJan Blunck 	eth_dev = virtio_user_eth_dev_alloc(dev);
818ce2eabddSJianfeng Tan 	if (!eth_dev) {
819e8df94b8SJianfeng Tan 		PMD_INIT_LOG(ERR, "virtio_user fails to alloc device");
820ce2eabddSJianfeng Tan 		goto end;
821ce2eabddSJianfeng Tan 	}
822ce2eabddSJianfeng Tan 
823ce2eabddSJianfeng Tan 	hw = eth_dev->data->dev_private;
824ce2eabddSJianfeng Tan 	if (virtio_user_dev_init(hw->virtio_user_dev, path, queues, cq,
8251c8489daSTiwei Bie 			 queue_size, mac_addr, &ifname, server_mode,
826f908b22eSAdrian Moreno 			 mrg_rxbuf, in_order, packed_vq, backend_type) < 0) {
827ca8326a9SJianfeng Tan 		PMD_INIT_LOG(ERR, "virtio_user_dev_init fails");
828ca8326a9SJianfeng Tan 		virtio_user_eth_dev_free(eth_dev);
829ce2eabddSJianfeng Tan 		goto end;
830ca8326a9SJianfeng Tan 	}
831fbe90cddSThomas Monjalon 
83287db93e0SDavid Marchand 	/* previously called by pci probing for physical dev */
833ce2eabddSJianfeng Tan 	if (eth_virtio_dev_init(eth_dev) < 0) {
834ce2eabddSJianfeng Tan 		PMD_INIT_LOG(ERR, "eth_virtio_dev_init fails");
835ca8326a9SJianfeng Tan 		virtio_user_eth_dev_free(eth_dev);
836ce2eabddSJianfeng Tan 		goto end;
837ce2eabddSJianfeng Tan 	}
838fbe90cddSThomas Monjalon 
83977d66da8SMarvin Liu 	if (vectorized) {
84077d66da8SMarvin Liu 		if (packed_vq) {
84177d66da8SMarvin Liu #if defined(CC_AVX512_SUPPORT)
8426b7eefbcSMarvin Liu 			hw->use_vec_rx = 1;
84377d66da8SMarvin Liu 			hw->use_vec_tx = 1;
84477d66da8SMarvin Liu #else
84577d66da8SMarvin Liu 			PMD_INIT_LOG(INFO,
84677d66da8SMarvin Liu 				"building environment do not support packed ring vectorized");
84777d66da8SMarvin Liu #endif
84877d66da8SMarvin Liu 		} else {
84977d66da8SMarvin Liu 			hw->use_vec_rx = 1;
85077d66da8SMarvin Liu 		}
85177d66da8SMarvin Liu 	}
8526b7eefbcSMarvin Liu 
853fbe90cddSThomas Monjalon 	rte_eth_dev_probing_finish(eth_dev);
854ce2eabddSJianfeng Tan 	ret = 0;
855ce2eabddSJianfeng Tan 
856ce2eabddSJianfeng Tan end:
85714f06474SJianfeng Tan 	if (kvlist)
85814f06474SJianfeng Tan 		rte_kvargs_free(kvlist);
859ce2eabddSJianfeng Tan 	if (path)
860ce2eabddSJianfeng Tan 		free(path);
861ce2eabddSJianfeng Tan 	if (mac_addr)
862ce2eabddSJianfeng Tan 		free(mac_addr);
8634214a1b4SWenfeng Liu 	if (ifname)
8644214a1b4SWenfeng Liu 		free(ifname);
865ce2eabddSJianfeng Tan 	return ret;
866ce2eabddSJianfeng Tan }
867ce2eabddSJianfeng Tan 
868ce2eabddSJianfeng Tan static int
8695d2aa461SJan Blunck virtio_user_pmd_remove(struct rte_vdev_device *vdev)
870ce2eabddSJianfeng Tan {
8715d2aa461SJan Blunck 	const char *name;
872ce2eabddSJianfeng Tan 	struct rte_eth_dev *eth_dev;
873ce2eabddSJianfeng Tan 
8745d2aa461SJan Blunck 	if (!vdev)
875ce2eabddSJianfeng Tan 		return -EINVAL;
876ce2eabddSJianfeng Tan 
8775d2aa461SJan Blunck 	name = rte_vdev_device_name(vdev);
878f2462150SFerruh Yigit 	PMD_DRV_LOG(INFO, "Un-Initializing %s", name);
879ce2eabddSJianfeng Tan 	eth_dev = rte_eth_dev_allocated(name);
8807f468b2eSTiwei Bie 	/* Port has already been released by close. */
881ce2eabddSJianfeng Tan 	if (!eth_dev)
8827f468b2eSTiwei Bie 		return 0;
883ce2eabddSJianfeng Tan 
8841c8489daSTiwei Bie 	if (rte_eal_process_type() != RTE_PROC_PRIMARY)
8851c8489daSTiwei Bie 		return rte_eth_dev_release_port(eth_dev);
8861c8489daSTiwei Bie 
887ce2eabddSJianfeng Tan 	/* make sure the device is stopped, queues freed */
8888a5a0aadSThomas Monjalon 	return rte_eth_dev_close(eth_dev->data->port_id);
889ce2eabddSJianfeng Tan }
890ce2eabddSJianfeng Tan 
89186e71eb2SMaxime Coquelin static int virtio_user_pmd_dma_map(struct rte_vdev_device *vdev, void *addr,
89286e71eb2SMaxime Coquelin 		uint64_t iova, size_t len)
89386e71eb2SMaxime Coquelin {
89486e71eb2SMaxime Coquelin 	const char *name;
89586e71eb2SMaxime Coquelin 	struct rte_eth_dev *eth_dev;
89686e71eb2SMaxime Coquelin 	struct virtio_user_dev *dev;
89786e71eb2SMaxime Coquelin 	struct virtio_hw *hw;
89886e71eb2SMaxime Coquelin 
89986e71eb2SMaxime Coquelin 	if (!vdev)
90086e71eb2SMaxime Coquelin 		return -EINVAL;
90186e71eb2SMaxime Coquelin 
90286e71eb2SMaxime Coquelin 	name = rte_vdev_device_name(vdev);
90386e71eb2SMaxime Coquelin 	eth_dev = rte_eth_dev_allocated(name);
90486e71eb2SMaxime Coquelin 	/* Port has already been released by close. */
90586e71eb2SMaxime Coquelin 	if (!eth_dev)
90686e71eb2SMaxime Coquelin 		return 0;
90786e71eb2SMaxime Coquelin 
90886e71eb2SMaxime Coquelin 	hw = (struct virtio_hw *)eth_dev->data->dev_private;
90986e71eb2SMaxime Coquelin 	dev = hw->virtio_user_dev;
91086e71eb2SMaxime Coquelin 
91186e71eb2SMaxime Coquelin 	if (dev->ops->dma_map)
91286e71eb2SMaxime Coquelin 		return dev->ops->dma_map(dev, addr, iova, len);
91386e71eb2SMaxime Coquelin 
91486e71eb2SMaxime Coquelin 	return 0;
91586e71eb2SMaxime Coquelin }
91686e71eb2SMaxime Coquelin 
91786e71eb2SMaxime Coquelin static int virtio_user_pmd_dma_unmap(struct rte_vdev_device *vdev, void *addr,
91886e71eb2SMaxime Coquelin 		uint64_t iova, size_t len)
91986e71eb2SMaxime Coquelin {
92086e71eb2SMaxime Coquelin 	const char *name;
92186e71eb2SMaxime Coquelin 	struct rte_eth_dev *eth_dev;
92286e71eb2SMaxime Coquelin 	struct virtio_user_dev *dev;
92386e71eb2SMaxime Coquelin 	struct virtio_hw *hw;
92486e71eb2SMaxime Coquelin 
92586e71eb2SMaxime Coquelin 	if (!vdev)
92686e71eb2SMaxime Coquelin 		return -EINVAL;
92786e71eb2SMaxime Coquelin 
92886e71eb2SMaxime Coquelin 	name = rte_vdev_device_name(vdev);
92986e71eb2SMaxime Coquelin 	eth_dev = rte_eth_dev_allocated(name);
93086e71eb2SMaxime Coquelin 	/* Port has already been released by close. */
93186e71eb2SMaxime Coquelin 	if (!eth_dev)
93286e71eb2SMaxime Coquelin 		return 0;
93386e71eb2SMaxime Coquelin 
93486e71eb2SMaxime Coquelin 	hw = (struct virtio_hw *)eth_dev->data->dev_private;
93586e71eb2SMaxime Coquelin 	dev = hw->virtio_user_dev;
93686e71eb2SMaxime Coquelin 
93786e71eb2SMaxime Coquelin 	if (dev->ops->dma_unmap)
93886e71eb2SMaxime Coquelin 		return dev->ops->dma_unmap(dev, addr, iova, len);
93986e71eb2SMaxime Coquelin 
94086e71eb2SMaxime Coquelin 	return 0;
94186e71eb2SMaxime Coquelin }
94286e71eb2SMaxime Coquelin 
943fe363dd4SJan Viktorin static struct rte_vdev_driver virtio_user_driver = {
94450a3345fSShreyansh Jain 	.probe = virtio_user_pmd_probe,
94550a3345fSShreyansh Jain 	.remove = virtio_user_pmd_remove,
94686e71eb2SMaxime Coquelin 	.dma_map = virtio_user_pmd_dma_map,
94786e71eb2SMaxime Coquelin 	.dma_unmap = virtio_user_pmd_dma_unmap,
948ce2eabddSJianfeng Tan };
949ce2eabddSJianfeng Tan 
95001f19227SShreyansh Jain RTE_PMD_REGISTER_VDEV(net_virtio_user, virtio_user_driver);
9519fa80cb2SJan Blunck RTE_PMD_REGISTER_ALIAS(net_virtio_user, virtio_user);
95201f19227SShreyansh Jain RTE_PMD_REGISTER_PARAM_STRING(net_virtio_user,
95344e32a67SPablo de Lara 	"path=<path> "
95444e32a67SPablo de Lara 	"mac=<mac addr> "
95544e32a67SPablo de Lara 	"cq=<int> "
95644e32a67SPablo de Lara 	"queue_size=<int> "
9574214a1b4SWenfeng Liu 	"queues=<int> "
958488ed97aSMarvin Liu 	"iface=<string> "
95962758c76STiwei Bie 	"server=<0|1> "
960488ed97aSMarvin Liu 	"mrg_rxbuf=<0|1> "
9619070f88bSTiwei Bie 	"in_order=<0|1> "
962b0db4beaSIvan Dyukov 	"packed_vq=<0|1> "
9636b7eefbcSMarvin Liu 	"speed=<int> "
9646b7eefbcSMarvin Liu 	"vectorized=<0|1>");
965