xref: /dpdk/drivers/net/virtio/virtio_user_ethdev.c (revision 8a5a0aad5d3e4f4f75ca81932eb247de94765685)
15566a3e3SBruce Richardson /* SPDX-License-Identifier: BSD-3-Clause
25566a3e3SBruce Richardson  * Copyright(c) 2010-2016 Intel Corporation
3e9efa4d9SJianfeng Tan  */
4e9efa4d9SJianfeng Tan 
5e9efa4d9SJianfeng Tan #include <stdint.h>
6e9efa4d9SJianfeng Tan #include <sys/types.h>
7e9efa4d9SJianfeng Tan #include <unistd.h>
8ef53b603SJianfeng Tan #include <fcntl.h>
97d62bf6fSMaxime Coquelin #include <linux/major.h>
10f908b22eSAdrian Moreno #include <sys/stat.h>
117d62bf6fSMaxime Coquelin #include <sys/sysmacros.h>
12ef53b603SJianfeng Tan #include <sys/socket.h>
13e9efa4d9SJianfeng Tan 
14ce2eabddSJianfeng Tan #include <rte_malloc.h>
15ce2eabddSJianfeng Tan #include <rte_kvargs.h>
16050fe6e9SJan Blunck #include <rte_ethdev_vdev.h>
17d4a586d2SJianfeng Tan #include <rte_bus_vdev.h>
18ef53b603SJianfeng Tan #include <rte_alarm.h>
196ebbf410SXuan Ding #include <rte_cycles.h>
20ce2eabddSJianfeng Tan 
21ce2eabddSJianfeng Tan #include "virtio_ethdev.h"
22e9efa4d9SJianfeng Tan #include "virtio_logs.h"
23e9efa4d9SJianfeng Tan #include "virtio_pci.h"
24e9efa4d9SJianfeng Tan #include "virtqueue.h"
251b69528eSJianfeng Tan #include "virtio_rxtx.h"
26e9efa4d9SJianfeng Tan #include "virtio_user/virtio_user_dev.h"
277f468b2eSTiwei Bie #include "virtio_user/vhost.h"
28e9efa4d9SJianfeng Tan 
/* Return the virtio_user_dev stored in hw->virtio_user_dev, properly typed. */
#define virtio_user_get_dev(hw) \
	((struct virtio_user_dev *)(hw)->virtio_user_dev)
31e9efa4d9SJianfeng Tan 
326ebbf410SXuan Ding static void
336ebbf410SXuan Ding virtio_user_reset_queues_packed(struct rte_eth_dev *dev)
346ebbf410SXuan Ding {
356ebbf410SXuan Ding 	struct virtio_hw *hw = dev->data->dev_private;
366ebbf410SXuan Ding 	struct virtnet_rx *rxvq;
376ebbf410SXuan Ding 	struct virtnet_tx *txvq;
386ebbf410SXuan Ding 	uint16_t i;
396ebbf410SXuan Ding 
406ebbf410SXuan Ding 	/* Add lock to avoid queue contention. */
416ebbf410SXuan Ding 	rte_spinlock_lock(&hw->state_lock);
426ebbf410SXuan Ding 	hw->started = 0;
436ebbf410SXuan Ding 
446ebbf410SXuan Ding 	/*
456ebbf410SXuan Ding 	 * Waitting for datapath to complete before resetting queues.
466ebbf410SXuan Ding 	 * 1 ms should be enough for the ongoing Tx/Rx function to finish.
476ebbf410SXuan Ding 	 */
486ebbf410SXuan Ding 	rte_delay_ms(1);
496ebbf410SXuan Ding 
506ebbf410SXuan Ding 	/* Vring reset for each Tx queue and Rx queue. */
516ebbf410SXuan Ding 	for (i = 0; i < dev->data->nb_rx_queues; i++) {
526ebbf410SXuan Ding 		rxvq = dev->data->rx_queues[i];
536ebbf410SXuan Ding 		virtqueue_rxvq_reset_packed(rxvq->vq);
546ebbf410SXuan Ding 		virtio_dev_rx_queue_setup_finish(dev, i);
556ebbf410SXuan Ding 	}
566ebbf410SXuan Ding 
576ebbf410SXuan Ding 	for (i = 0; i < dev->data->nb_tx_queues; i++) {
586ebbf410SXuan Ding 		txvq = dev->data->tx_queues[i];
596ebbf410SXuan Ding 		virtqueue_txvq_reset_packed(txvq->vq);
606ebbf410SXuan Ding 	}
616ebbf410SXuan Ding 
626ebbf410SXuan Ding 	hw->started = 1;
636ebbf410SXuan Ding 	rte_spinlock_unlock(&hw->state_lock);
646ebbf410SXuan Ding }
656ebbf410SXuan Ding 
666ebbf410SXuan Ding 
67bd8f50a4SZhiyong Yang static int
68bd8f50a4SZhiyong Yang virtio_user_server_reconnect(struct virtio_user_dev *dev)
69bd8f50a4SZhiyong Yang {
70bd8f50a4SZhiyong Yang 	int ret;
71bd8f50a4SZhiyong Yang 	int connectfd;
72bd8f50a4SZhiyong Yang 	struct rte_eth_dev *eth_dev = &rte_eth_devices[dev->port_id];
736ebbf410SXuan Ding 	struct virtio_hw *hw = eth_dev->data->dev_private;
748e756105SMaxime Coquelin 	uint64_t protocol_features;
75bd8f50a4SZhiyong Yang 
76bd8f50a4SZhiyong Yang 	connectfd = accept(dev->listenfd, NULL, NULL);
77bd8f50a4SZhiyong Yang 	if (connectfd < 0)
78bd8f50a4SZhiyong Yang 		return -1;
79bd8f50a4SZhiyong Yang 
80bd8f50a4SZhiyong Yang 	dev->vhostfd = connectfd;
81201a4165SZhiyong Yang 	if (dev->ops->send_request(dev, VHOST_USER_GET_FEATURES,
82201a4165SZhiyong Yang 				   &dev->device_features) < 0) {
83201a4165SZhiyong Yang 		PMD_INIT_LOG(ERR, "get_features failed: %s",
84201a4165SZhiyong Yang 			     strerror(errno));
85201a4165SZhiyong Yang 		return -1;
86201a4165SZhiyong Yang 	}
87201a4165SZhiyong Yang 
888e756105SMaxime Coquelin 	if (dev->device_features &
898e756105SMaxime Coquelin 			(1ULL << VHOST_USER_F_PROTOCOL_FEATURES)) {
908e756105SMaxime Coquelin 		if (dev->ops->send_request(dev,
918e756105SMaxime Coquelin 					VHOST_USER_GET_PROTOCOL_FEATURES,
928e756105SMaxime Coquelin 					&protocol_features))
938e756105SMaxime Coquelin 			return -1;
948e756105SMaxime Coquelin 
958e756105SMaxime Coquelin 		dev->protocol_features &= protocol_features;
968e756105SMaxime Coquelin 
978e756105SMaxime Coquelin 		if (dev->ops->send_request(dev,
988e756105SMaxime Coquelin 					VHOST_USER_SET_PROTOCOL_FEATURES,
998e756105SMaxime Coquelin 					&dev->protocol_features))
1008e756105SMaxime Coquelin 			return -1;
1018e756105SMaxime Coquelin 
1028e756105SMaxime Coquelin 		if (!(dev->protocol_features &
1038e756105SMaxime Coquelin 				(1ULL << VHOST_USER_PROTOCOL_F_MQ)))
1048e756105SMaxime Coquelin 			dev->unsupported_features |= (1ull << VIRTIO_NET_F_MQ);
1058e756105SMaxime Coquelin 	}
1068e756105SMaxime Coquelin 
107bb97d2ddSTiwei Bie 	dev->device_features |= dev->frontend_features;
108bb97d2ddSTiwei Bie 
1097c66ff61SMarvin Liu 	/* umask vhost-user unsupported features */
1107c66ff61SMarvin Liu 	dev->device_features &= ~(dev->unsupported_features);
111201a4165SZhiyong Yang 
112201a4165SZhiyong Yang 	dev->features &= dev->device_features;
113201a4165SZhiyong Yang 
1146ebbf410SXuan Ding 	/* For packed ring, resetting queues is required in reconnection. */
11501996a03SMarvin Liu 	if (vtpci_packed_queue(hw) &&
11601996a03SMarvin Liu 	   (vtpci_get_status(hw) & VIRTIO_CONFIG_STATUS_DRIVER_OK)) {
1176ebbf410SXuan Ding 		PMD_INIT_LOG(NOTICE, "Packets on the fly will be dropped"
1186ebbf410SXuan Ding 				" when packed ring reconnecting.");
1196ebbf410SXuan Ding 		virtio_user_reset_queues_packed(eth_dev);
12092771257STiwei Bie 	}
1216ebbf410SXuan Ding 
122bd8f50a4SZhiyong Yang 	ret = virtio_user_start_device(dev);
123bd8f50a4SZhiyong Yang 	if (ret < 0)
124bd8f50a4SZhiyong Yang 		return -1;
125bd8f50a4SZhiyong Yang 
126201a4165SZhiyong Yang 	if (dev->queue_pairs > 1) {
127201a4165SZhiyong Yang 		ret = virtio_user_handle_mq(dev, dev->queue_pairs);
128201a4165SZhiyong Yang 		if (ret != 0) {
129201a4165SZhiyong Yang 			PMD_INIT_LOG(ERR, "Fails to enable multi-queue pairs!");
130201a4165SZhiyong Yang 			return -1;
131201a4165SZhiyong Yang 		}
132201a4165SZhiyong Yang 	}
133bd8f50a4SZhiyong Yang 	if (eth_dev->data->dev_flags & RTE_ETH_DEV_INTR_LSC) {
134bd8f50a4SZhiyong Yang 		if (rte_intr_disable(eth_dev->intr_handle) < 0) {
135bd8f50a4SZhiyong Yang 			PMD_DRV_LOG(ERR, "interrupt disable failed");
136bd8f50a4SZhiyong Yang 			return -1;
137bd8f50a4SZhiyong Yang 		}
138bd8f50a4SZhiyong Yang 		rte_intr_callback_unregister(eth_dev->intr_handle,
139bd8f50a4SZhiyong Yang 					     virtio_interrupt_handler,
140bd8f50a4SZhiyong Yang 					     eth_dev);
141bd8f50a4SZhiyong Yang 		eth_dev->intr_handle->fd = connectfd;
142bd8f50a4SZhiyong Yang 		rte_intr_callback_register(eth_dev->intr_handle,
143bd8f50a4SZhiyong Yang 					   virtio_interrupt_handler, eth_dev);
144bd8f50a4SZhiyong Yang 
145bd8f50a4SZhiyong Yang 		if (rte_intr_enable(eth_dev->intr_handle) < 0) {
146bd8f50a4SZhiyong Yang 			PMD_DRV_LOG(ERR, "interrupt enable failed");
147bd8f50a4SZhiyong Yang 			return -1;
148bd8f50a4SZhiyong Yang 		}
149bd8f50a4SZhiyong Yang 	}
150bd8f50a4SZhiyong Yang 	PMD_INIT_LOG(NOTICE, "server mode virtio-user reconnection succeeds!");
151bd8f50a4SZhiyong Yang 	return 0;
152bd8f50a4SZhiyong Yang }
153bd8f50a4SZhiyong Yang 
154e9efa4d9SJianfeng Tan static void
155ef53b603SJianfeng Tan virtio_user_delayed_handler(void *param)
156ef53b603SJianfeng Tan {
157ef53b603SJianfeng Tan 	struct virtio_hw *hw = (struct virtio_hw *)param;
158bd8f50a4SZhiyong Yang 	struct rte_eth_dev *eth_dev = &rte_eth_devices[hw->port_id];
159bd8f50a4SZhiyong Yang 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
160ef53b603SJianfeng Tan 
161bd8f50a4SZhiyong Yang 	if (rte_intr_disable(eth_dev->intr_handle) < 0) {
162bd8f50a4SZhiyong Yang 		PMD_DRV_LOG(ERR, "interrupt disable failed");
163bd8f50a4SZhiyong Yang 		return;
164bd8f50a4SZhiyong Yang 	}
165bd8f50a4SZhiyong Yang 	rte_intr_callback_unregister(eth_dev->intr_handle,
166bd8f50a4SZhiyong Yang 				     virtio_interrupt_handler, eth_dev);
167bd8f50a4SZhiyong Yang 	if (dev->is_server) {
168bd8f50a4SZhiyong Yang 		if (dev->vhostfd >= 0) {
169bd8f50a4SZhiyong Yang 			close(dev->vhostfd);
170bd8f50a4SZhiyong Yang 			dev->vhostfd = -1;
171bd8f50a4SZhiyong Yang 		}
172bd8f50a4SZhiyong Yang 		eth_dev->intr_handle->fd = dev->listenfd;
173bd8f50a4SZhiyong Yang 		rte_intr_callback_register(eth_dev->intr_handle,
174bd8f50a4SZhiyong Yang 					   virtio_interrupt_handler, eth_dev);
175bd8f50a4SZhiyong Yang 		if (rte_intr_enable(eth_dev->intr_handle) < 0) {
176bd8f50a4SZhiyong Yang 			PMD_DRV_LOG(ERR, "interrupt enable failed");
177bd8f50a4SZhiyong Yang 			return;
178bd8f50a4SZhiyong Yang 		}
179bd8f50a4SZhiyong Yang 	}
180ef53b603SJianfeng Tan }
181ef53b603SJianfeng Tan 
182ef53b603SJianfeng Tan static void
183e9efa4d9SJianfeng Tan virtio_user_read_dev_config(struct virtio_hw *hw, size_t offset,
184e9efa4d9SJianfeng Tan 		     void *dst, int length)
185e9efa4d9SJianfeng Tan {
186e9efa4d9SJianfeng Tan 	int i;
187e9efa4d9SJianfeng Tan 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
188e9efa4d9SJianfeng Tan 
189e9efa4d9SJianfeng Tan 	if (offset == offsetof(struct virtio_net_config, mac) &&
19035b2d13fSOlivier Matz 	    length == RTE_ETHER_ADDR_LEN) {
19135b2d13fSOlivier Matz 		for (i = 0; i < RTE_ETHER_ADDR_LEN; ++i)
192e9efa4d9SJianfeng Tan 			((uint8_t *)dst)[i] = dev->mac_addr[i];
193e9efa4d9SJianfeng Tan 		return;
194e9efa4d9SJianfeng Tan 	}
195e9efa4d9SJianfeng Tan 
196ef53b603SJianfeng Tan 	if (offset == offsetof(struct virtio_net_config, status)) {
197ef53b603SJianfeng Tan 		char buf[128];
198ef53b603SJianfeng Tan 
199ef53b603SJianfeng Tan 		if (dev->vhostfd >= 0) {
200ef53b603SJianfeng Tan 			int r;
201ef53b603SJianfeng Tan 			int flags;
202ef53b603SJianfeng Tan 
203ef53b603SJianfeng Tan 			flags = fcntl(dev->vhostfd, F_GETFL);
2042fd826a3SSebastian Basierski 			if (fcntl(dev->vhostfd, F_SETFL,
2052fd826a3SSebastian Basierski 					flags | O_NONBLOCK) == -1) {
2062fd826a3SSebastian Basierski 				PMD_DRV_LOG(ERR, "error setting O_NONBLOCK flag");
2072fd826a3SSebastian Basierski 				return;
2082fd826a3SSebastian Basierski 			}
209ef53b603SJianfeng Tan 			r = recv(dev->vhostfd, buf, 128, MSG_PEEK);
210ef53b603SJianfeng Tan 			if (r == 0 || (r < 0 && errno != EAGAIN)) {
211d0131e49SXiao Wang 				dev->net_status &= (~VIRTIO_NET_S_LINK_UP);
212ef53b603SJianfeng Tan 				PMD_DRV_LOG(ERR, "virtio-user port %u is down",
213ef53b603SJianfeng Tan 					    hw->port_id);
214bd8f50a4SZhiyong Yang 
215bd8f50a4SZhiyong Yang 				/* This function could be called in the process
216bd8f50a4SZhiyong Yang 				 * of interrupt handling, callback cannot be
217bd8f50a4SZhiyong Yang 				 * unregistered here, set an alarm to do it.
218ef53b603SJianfeng Tan 				 */
219ef53b603SJianfeng Tan 				rte_eal_alarm_set(1,
220ef53b603SJianfeng Tan 						  virtio_user_delayed_handler,
221ef53b603SJianfeng Tan 						  (void *)hw);
222ef53b603SJianfeng Tan 			} else {
223d0131e49SXiao Wang 				dev->net_status |= VIRTIO_NET_S_LINK_UP;
224ef53b603SJianfeng Tan 			}
225f76ef453SSebastian Basierski 			if (fcntl(dev->vhostfd, F_SETFL,
226f76ef453SSebastian Basierski 					flags & ~O_NONBLOCK) == -1) {
227f76ef453SSebastian Basierski 				PMD_DRV_LOG(ERR, "error clearing O_NONBLOCK flag");
228f76ef453SSebastian Basierski 				return;
229f76ef453SSebastian Basierski 			}
230bd8f50a4SZhiyong Yang 		} else if (dev->is_server) {
231d0131e49SXiao Wang 			dev->net_status &= (~VIRTIO_NET_S_LINK_UP);
232bd8f50a4SZhiyong Yang 			if (virtio_user_server_reconnect(dev) >= 0)
233d0131e49SXiao Wang 				dev->net_status |= VIRTIO_NET_S_LINK_UP;
234ef53b603SJianfeng Tan 		}
235bd8f50a4SZhiyong Yang 
236d0131e49SXiao Wang 		*(uint16_t *)dst = dev->net_status;
237ef53b603SJianfeng Tan 	}
238e9efa4d9SJianfeng Tan 
239e9efa4d9SJianfeng Tan 	if (offset == offsetof(struct virtio_net_config, max_virtqueue_pairs))
240e9efa4d9SJianfeng Tan 		*(uint16_t *)dst = dev->max_queue_pairs;
241e9efa4d9SJianfeng Tan }
242e9efa4d9SJianfeng Tan 
243e9efa4d9SJianfeng Tan static void
244e9efa4d9SJianfeng Tan virtio_user_write_dev_config(struct virtio_hw *hw, size_t offset,
245e9efa4d9SJianfeng Tan 		      const void *src, int length)
246e9efa4d9SJianfeng Tan {
247e9efa4d9SJianfeng Tan 	int i;
248e9efa4d9SJianfeng Tan 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
249e9efa4d9SJianfeng Tan 
250e9efa4d9SJianfeng Tan 	if ((offset == offsetof(struct virtio_net_config, mac)) &&
25135b2d13fSOlivier Matz 	    (length == RTE_ETHER_ADDR_LEN))
25235b2d13fSOlivier Matz 		for (i = 0; i < RTE_ETHER_ADDR_LEN; ++i)
253e9efa4d9SJianfeng Tan 			dev->mac_addr[i] = ((const uint8_t *)src)[i];
254e9efa4d9SJianfeng Tan 	else
255f2462150SFerruh Yigit 		PMD_DRV_LOG(ERR, "not supported offset=%zu, len=%d",
256e9efa4d9SJianfeng Tan 			    offset, length);
257e9efa4d9SJianfeng Tan }
258e9efa4d9SJianfeng Tan 
259e9efa4d9SJianfeng Tan static void
260c12a26eeSJianfeng Tan virtio_user_reset(struct virtio_hw *hw)
261c12a26eeSJianfeng Tan {
262c12a26eeSJianfeng Tan 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
263c12a26eeSJianfeng Tan 
264c12a26eeSJianfeng Tan 	if (dev->status & VIRTIO_CONFIG_STATUS_DRIVER_OK)
265c12a26eeSJianfeng Tan 		virtio_user_stop_device(dev);
266c12a26eeSJianfeng Tan }
267c12a26eeSJianfeng Tan 
268c12a26eeSJianfeng Tan static void
269e9efa4d9SJianfeng Tan virtio_user_set_status(struct virtio_hw *hw, uint8_t status)
270e9efa4d9SJianfeng Tan {
271e9efa4d9SJianfeng Tan 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
272844e4683SMaxime Coquelin 	uint8_t old_status = dev->status;
273e9efa4d9SJianfeng Tan 
274844e4683SMaxime Coquelin 	if (status & VIRTIO_CONFIG_STATUS_FEATURES_OK &&
275844e4683SMaxime Coquelin 			~old_status & VIRTIO_CONFIG_STATUS_FEATURES_OK)
276844e4683SMaxime Coquelin 		virtio_user_dev_set_features(dev);
277e9efa4d9SJianfeng Tan 	if (status & VIRTIO_CONFIG_STATUS_DRIVER_OK)
278e9efa4d9SJianfeng Tan 		virtio_user_start_device(dev);
279c12a26eeSJianfeng Tan 	else if (status == VIRTIO_CONFIG_STATUS_RESET)
280c12a26eeSJianfeng Tan 		virtio_user_reset(hw);
281e9efa4d9SJianfeng Tan 	dev->status = status;
28257912824SMaxime Coquelin 	virtio_user_send_status_update(dev, status);
283e9efa4d9SJianfeng Tan }
284e9efa4d9SJianfeng Tan 
285e9efa4d9SJianfeng Tan static uint8_t
286e9efa4d9SJianfeng Tan virtio_user_get_status(struct virtio_hw *hw)
287e9efa4d9SJianfeng Tan {
288e9efa4d9SJianfeng Tan 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
289e9efa4d9SJianfeng Tan 
2900b0dc66cSAdrian Moreno 	virtio_user_update_status(dev);
2910b0dc66cSAdrian Moreno 
292e9efa4d9SJianfeng Tan 	return dev->status;
293e9efa4d9SJianfeng Tan }
294e9efa4d9SJianfeng Tan 
295e9efa4d9SJianfeng Tan static uint64_t
296e9efa4d9SJianfeng Tan virtio_user_get_features(struct virtio_hw *hw)
297e9efa4d9SJianfeng Tan {
298e9efa4d9SJianfeng Tan 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
299e9efa4d9SJianfeng Tan 
300142678d4SJianfeng Tan 	/* unmask feature bits defined in vhost user protocol */
301142678d4SJianfeng Tan 	return dev->device_features & VIRTIO_PMD_SUPPORTED_GUEST_FEATURES;
302e9efa4d9SJianfeng Tan }
303e9efa4d9SJianfeng Tan 
304e9efa4d9SJianfeng Tan static void
305e9efa4d9SJianfeng Tan virtio_user_set_features(struct virtio_hw *hw, uint64_t features)
306e9efa4d9SJianfeng Tan {
307e9efa4d9SJianfeng Tan 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
308e9efa4d9SJianfeng Tan 
309142678d4SJianfeng Tan 	dev->features = features & dev->device_features;
310e9efa4d9SJianfeng Tan }
311e9efa4d9SJianfeng Tan 
312e9efa4d9SJianfeng Tan static uint8_t
313e9efa4d9SJianfeng Tan virtio_user_get_isr(struct virtio_hw *hw __rte_unused)
314e9efa4d9SJianfeng Tan {
31535c4f855SJianfeng Tan 	/* rxq interrupts and config interrupt are separated in virtio-user,
31635c4f855SJianfeng Tan 	 * here we only report config change.
317e9efa4d9SJianfeng Tan 	 */
31835c4f855SJianfeng Tan 	return VIRTIO_PCI_ISR_CONFIG;
319e9efa4d9SJianfeng Tan }
320e9efa4d9SJianfeng Tan 
321e9efa4d9SJianfeng Tan static uint16_t
322e9efa4d9SJianfeng Tan virtio_user_set_config_irq(struct virtio_hw *hw __rte_unused,
323e9efa4d9SJianfeng Tan 		    uint16_t vec __rte_unused)
324e9efa4d9SJianfeng Tan {
32535c4f855SJianfeng Tan 	return 0;
326e9efa4d9SJianfeng Tan }
327e9efa4d9SJianfeng Tan 
3283d4fb6fdSJianfeng Tan static uint16_t
3293d4fb6fdSJianfeng Tan virtio_user_set_queue_irq(struct virtio_hw *hw __rte_unused,
3303d4fb6fdSJianfeng Tan 			  struct virtqueue *vq __rte_unused,
3313d4fb6fdSJianfeng Tan 			  uint16_t vec)
3323d4fb6fdSJianfeng Tan {
3333d4fb6fdSJianfeng Tan 	/* pretend we have done that */
3343d4fb6fdSJianfeng Tan 	return vec;
3353d4fb6fdSJianfeng Tan }
3363d4fb6fdSJianfeng Tan 
337e9efa4d9SJianfeng Tan /* This function is to get the queue size, aka, number of descs, of a specified
338e9efa4d9SJianfeng Tan  * queue. Different with the VHOST_USER_GET_QUEUE_NUM, which is used to get the
339e9efa4d9SJianfeng Tan  * max supported queues.
340e9efa4d9SJianfeng Tan  */
341e9efa4d9SJianfeng Tan static uint16_t
342e9efa4d9SJianfeng Tan virtio_user_get_queue_num(struct virtio_hw *hw, uint16_t queue_id __rte_unused)
343e9efa4d9SJianfeng Tan {
344e9efa4d9SJianfeng Tan 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
345e9efa4d9SJianfeng Tan 
346e9efa4d9SJianfeng Tan 	/* Currently, each queue has same queue size */
347e9efa4d9SJianfeng Tan 	return dev->queue_size;
348e9efa4d9SJianfeng Tan }
349e9efa4d9SJianfeng Tan 
35048a44640SJens Freimann static void
35148a44640SJens Freimann virtio_user_setup_queue_packed(struct virtqueue *vq,
35248a44640SJens Freimann 			       struct virtio_user_dev *dev)
353e9efa4d9SJianfeng Tan {
35448a44640SJens Freimann 	uint16_t queue_idx = vq->vq_queue_index;
35548a44640SJens Freimann 	struct vring_packed *vring;
35648a44640SJens Freimann 	uint64_t desc_addr;
35748a44640SJens Freimann 	uint64_t avail_addr;
35848a44640SJens Freimann 	uint64_t used_addr;
35948a44640SJens Freimann 	uint16_t i;
36048a44640SJens Freimann 
36148a44640SJens Freimann 	vring  = &dev->packed_vrings[queue_idx];
36248a44640SJens Freimann 	desc_addr = (uintptr_t)vq->vq_ring_virt_mem;
36348a44640SJens Freimann 	avail_addr = desc_addr + vq->vq_nentries *
36448a44640SJens Freimann 		sizeof(struct vring_packed_desc);
36548a44640SJens Freimann 	used_addr = RTE_ALIGN_CEIL(avail_addr +
36648a44640SJens Freimann 			   sizeof(struct vring_packed_desc_event),
36748a44640SJens Freimann 			   VIRTIO_PCI_VRING_ALIGN);
36848a44640SJens Freimann 	vring->num = vq->vq_nentries;
3694cdc4d98STiwei Bie 	vring->desc = (void *)(uintptr_t)desc_addr;
3704cdc4d98STiwei Bie 	vring->driver = (void *)(uintptr_t)avail_addr;
3714cdc4d98STiwei Bie 	vring->device = (void *)(uintptr_t)used_addr;
37248a44640SJens Freimann 	dev->packed_queues[queue_idx].avail_wrap_counter = true;
37348a44640SJens Freimann 	dev->packed_queues[queue_idx].used_wrap_counter = true;
37448a44640SJens Freimann 
37545c224e7STiwei Bie 	for (i = 0; i < vring->num; i++)
3764cdc4d98STiwei Bie 		vring->desc[i].flags = 0;
37748a44640SJens Freimann }
37848a44640SJens Freimann 
37948a44640SJens Freimann static void
38048a44640SJens Freimann virtio_user_setup_queue_split(struct virtqueue *vq, struct virtio_user_dev *dev)
38148a44640SJens Freimann {
382e9efa4d9SJianfeng Tan 	uint16_t queue_idx = vq->vq_queue_index;
383e9efa4d9SJianfeng Tan 	uint64_t desc_addr, avail_addr, used_addr;
384e9efa4d9SJianfeng Tan 
385e9efa4d9SJianfeng Tan 	desc_addr = (uintptr_t)vq->vq_ring_virt_mem;
386e9efa4d9SJianfeng Tan 	avail_addr = desc_addr + vq->vq_nentries * sizeof(struct vring_desc);
387e9efa4d9SJianfeng Tan 	used_addr = RTE_ALIGN_CEIL(avail_addr + offsetof(struct vring_avail,
388e9efa4d9SJianfeng Tan 							 ring[vq->vq_nentries]),
389e9efa4d9SJianfeng Tan 				   VIRTIO_PCI_VRING_ALIGN);
390e9efa4d9SJianfeng Tan 
391e9efa4d9SJianfeng Tan 	dev->vrings[queue_idx].num = vq->vq_nentries;
392e9efa4d9SJianfeng Tan 	dev->vrings[queue_idx].desc = (void *)(uintptr_t)desc_addr;
393e9efa4d9SJianfeng Tan 	dev->vrings[queue_idx].avail = (void *)(uintptr_t)avail_addr;
394e9efa4d9SJianfeng Tan 	dev->vrings[queue_idx].used = (void *)(uintptr_t)used_addr;
39548a44640SJens Freimann }
39648a44640SJens Freimann 
/*
 * Record the ring layout of vq in the virtio-user device, using the packed
 * or split variant depending on vtpci_packed_queue(hw). Always returns 0.
 */
static int
virtio_user_setup_queue(struct virtio_hw *hw, struct virtqueue *vq)
{
	struct virtio_user_dev *user_dev = virtio_user_get_dev(hw);

	if (!vtpci_packed_queue(hw)) {
		virtio_user_setup_queue_split(vq, user_dev);
		return 0;
	}

	virtio_user_setup_queue_packed(vq, user_dev);
	return 0;
}
409e9efa4d9SJianfeng Tan 
410e9efa4d9SJianfeng Tan static void
411e9efa4d9SJianfeng Tan virtio_user_del_queue(struct virtio_hw *hw, struct virtqueue *vq)
412e9efa4d9SJianfeng Tan {
413e9efa4d9SJianfeng Tan 	/* For legacy devices, write 0 to VIRTIO_PCI_QUEUE_PFN port, QEMU
414e9efa4d9SJianfeng Tan 	 * correspondingly stops the ioeventfds, and reset the status of
415e9efa4d9SJianfeng Tan 	 * the device.
416e9efa4d9SJianfeng Tan 	 * For modern devices, set queue desc, avail, used in PCI bar to 0,
417e9efa4d9SJianfeng Tan 	 * not see any more behavior in QEMU.
418e9efa4d9SJianfeng Tan 	 *
419e9efa4d9SJianfeng Tan 	 * Here we just care about what information to deliver to vhost-user
420e9efa4d9SJianfeng Tan 	 * or vhost-kernel. So we just close ioeventfd for now.
421e9efa4d9SJianfeng Tan 	 */
422e9efa4d9SJianfeng Tan 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
423e9efa4d9SJianfeng Tan 
424e9efa4d9SJianfeng Tan 	close(dev->callfds[vq->vq_queue_index]);
425e9efa4d9SJianfeng Tan 	close(dev->kickfds[vq->vq_queue_index]);
426e9efa4d9SJianfeng Tan }
427e9efa4d9SJianfeng Tan 
428e9efa4d9SJianfeng Tan static void
429e9efa4d9SJianfeng Tan virtio_user_notify_queue(struct virtio_hw *hw, struct virtqueue *vq)
430e9efa4d9SJianfeng Tan {
431e9efa4d9SJianfeng Tan 	uint64_t buf = 1;
432e9efa4d9SJianfeng Tan 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
433e9efa4d9SJianfeng Tan 
4341b69528eSJianfeng Tan 	if (hw->cvq && (hw->cvq->vq == vq)) {
43548a44640SJens Freimann 		if (vtpci_packed_queue(vq->hw))
43648a44640SJens Freimann 			virtio_user_handle_cq_packed(dev, vq->vq_queue_index);
43748a44640SJens Freimann 		else
4381b69528eSJianfeng Tan 			virtio_user_handle_cq(dev, vq->vq_queue_index);
4391b69528eSJianfeng Tan 		return;
4401b69528eSJianfeng Tan 	}
4411b69528eSJianfeng Tan 
442e9efa4d9SJianfeng Tan 	if (write(dev->kickfds[vq->vq_queue_index], &buf, sizeof(buf)) < 0)
443f2462150SFerruh Yigit 		PMD_DRV_LOG(ERR, "failed to kick backend: %s",
444e9efa4d9SJianfeng Tan 			    strerror(errno));
445e9efa4d9SJianfeng Tan }
446e9efa4d9SJianfeng Tan 
/*
 * virtio_pci_ops implementation for virtio-user devices; every hook is
 * backed by one of the virtio_user_* functions defined above.
 */
const struct virtio_pci_ops virtio_user_ops = {
	.read_dev_cfg	= virtio_user_read_dev_config,
	.write_dev_cfg	= virtio_user_write_dev_config,
	.get_status	= virtio_user_get_status,
	.set_status	= virtio_user_set_status,
	.get_features	= virtio_user_get_features,
	.set_features	= virtio_user_set_features,
	.get_isr	= virtio_user_get_isr,
	.set_config_irq	= virtio_user_set_config_irq,
	.set_queue_irq	= virtio_user_set_queue_irq,
	.get_queue_num	= virtio_user_get_queue_num,
	.setup_queue	= virtio_user_setup_queue,
	.del_queue	= virtio_user_del_queue,
	.notify_queue	= virtio_user_notify_queue,
};
462ce2eabddSJianfeng Tan 
/* Device argument keys understood by the virtio-user PMD. */
#define VIRTIO_USER_ARG_QUEUES_NUM     "queues"
#define VIRTIO_USER_ARG_CQ_NUM         "cq"
#define VIRTIO_USER_ARG_MAC            "mac"
#define VIRTIO_USER_ARG_PATH           "path"
#define VIRTIO_USER_ARG_QUEUE_SIZE     "queue_size"
#define VIRTIO_USER_ARG_INTERFACE_NAME "iface"
#define VIRTIO_USER_ARG_SERVER_MODE    "server"
#define VIRTIO_USER_ARG_MRG_RXBUF      "mrg_rxbuf"
#define VIRTIO_USER_ARG_IN_ORDER       "in_order"
#define VIRTIO_USER_ARG_PACKED_VQ      "packed_vq"
#define VIRTIO_USER_ARG_SPEED          "speed"
#define VIRTIO_USER_ARG_VECTORIZED     "vectorized"

/* NULL-terminated list of the accepted argument keys. */
static const char *valid_args[] = {
	VIRTIO_USER_ARG_QUEUES_NUM,
	VIRTIO_USER_ARG_CQ_NUM,
	VIRTIO_USER_ARG_MAC,
	VIRTIO_USER_ARG_PATH,
	VIRTIO_USER_ARG_QUEUE_SIZE,
	VIRTIO_USER_ARG_INTERFACE_NAME,
	VIRTIO_USER_ARG_SERVER_MODE,
	VIRTIO_USER_ARG_MRG_RXBUF,
	VIRTIO_USER_ARG_IN_ORDER,
	VIRTIO_USER_ARG_PACKED_VQ,
	VIRTIO_USER_ARG_SPEED,
	VIRTIO_USER_ARG_VECTORIZED,
	NULL
};
490ce2eabddSJianfeng Tan 
/* Default values used when the matching device argument is not given. */
#define VIRTIO_USER_DEF_CQ_EN	0
#define VIRTIO_USER_DEF_Q_NUM	1
#define VIRTIO_USER_DEF_Q_SZ	256
#define VIRTIO_USER_DEF_SERVER_MODE	0
495ce2eabddSJianfeng Tan 
/*
 * Key/value handler storing a heap copy of a string argument.
 *
 * extra_args must point to a char *; it receives a strdup() of value,
 * which the caller owns and must free().
 *
 * Returns 0 on success, -EINVAL if value or extra_args is NULL, -ENOMEM
 * if the copy could not be allocated.
 */
static int
get_string_arg(const char *key __rte_unused,
	       const char *value, void *extra_args)
{
	char **out = extra_args;
	char *copy;

	if (value == NULL || out == NULL)
		return -EINVAL;

	copy = strdup(value);
	*out = copy;

	return copy == NULL ? -ENOMEM : 0;
}
510ce2eabddSJianfeng Tan 
/*
 * Key/value handler parsing an unsigned integer argument.
 *
 * extra_args must point to a uint64_t holding the default value; it is
 * overwritten only when value parses successfully. The base is
 * auto-detected by strtoull() (decimal, 0x hex, leading-0 octal).
 *
 * Returns 0 on success, -EINVAL if value or extra_args is NULL, if value
 * contains no digits or has trailing characters after the number, or a
 * negated errno (e.g. -ERANGE) reported by strtoull().
 */
static int
get_integer_arg(const char *key __rte_unused,
		const char *value, void *extra_args)
{
	unsigned long long parsed;
	char *end = NULL;
	int err;

	if (!value || !extra_args)
		return -EINVAL;

	errno = 0;
	parsed = strtoull(value, &end, 0);
	err = errno;

	/*
	 * strtoull() reports "no digits" and "trailing junk" only through
	 * the end pointer, not errno, so both must be checked explicitly.
	 */
	if (end == value || *end != '\0')
		return -EINVAL;
	if (err != 0)
		return -err;

	*(uint64_t *)extra_args = parsed;
	return 0;
}
527ce2eabddSJianfeng Tan 
5287d62bf6fSMaxime Coquelin static uint32_t
5297d62bf6fSMaxime Coquelin vdpa_dynamic_major_num(void)
5307d62bf6fSMaxime Coquelin {
5317d62bf6fSMaxime Coquelin 	FILE *fp;
5327d62bf6fSMaxime Coquelin 	char *line = NULL;
5337d62bf6fSMaxime Coquelin 	size_t size;
5347d62bf6fSMaxime Coquelin 	char name[11];
5357d62bf6fSMaxime Coquelin 	bool found = false;
5367d62bf6fSMaxime Coquelin 	uint32_t num;
5377d62bf6fSMaxime Coquelin 
5387d62bf6fSMaxime Coquelin 	fp = fopen("/proc/devices", "r");
5397d62bf6fSMaxime Coquelin 	if (fp == NULL) {
5407d62bf6fSMaxime Coquelin 		PMD_INIT_LOG(ERR, "Cannot open /proc/devices: %s",
5417d62bf6fSMaxime Coquelin 			     strerror(errno));
5427d62bf6fSMaxime Coquelin 		return UNNAMED_MAJOR;
5437d62bf6fSMaxime Coquelin 	}
5447d62bf6fSMaxime Coquelin 
5457d62bf6fSMaxime Coquelin 	while (getline(&line, &size, fp) > 0) {
5467d62bf6fSMaxime Coquelin 		char *stripped = line + strspn(line, " ");
5477d62bf6fSMaxime Coquelin 		if ((sscanf(stripped, "%u %10s", &num, name) == 2) &&
5487d62bf6fSMaxime Coquelin 		    (strncmp(name, "vhost-vdpa", 10) == 0)) {
5497d62bf6fSMaxime Coquelin 			found = true;
5507d62bf6fSMaxime Coquelin 			break;
5517d62bf6fSMaxime Coquelin 		}
5527d62bf6fSMaxime Coquelin 	}
5537d62bf6fSMaxime Coquelin 	fclose(fp);
5547d62bf6fSMaxime Coquelin 	return found ? num : UNNAMED_MAJOR;
5557d62bf6fSMaxime Coquelin }
5567d62bf6fSMaxime Coquelin 
557f908b22eSAdrian Moreno static enum virtio_user_backend_type
558f908b22eSAdrian Moreno virtio_user_backend_type(const char *path)
559f908b22eSAdrian Moreno {
560f908b22eSAdrian Moreno 	struct stat sb;
561f908b22eSAdrian Moreno 
5627d62bf6fSMaxime Coquelin 	if (stat(path, &sb) == -1) {
5637d62bf6fSMaxime Coquelin 		PMD_INIT_LOG(ERR, "Stat fails: %s (%s)\n", path,
5647d62bf6fSMaxime Coquelin 			     strerror(errno));
565f908b22eSAdrian Moreno 		return VIRTIO_USER_BACKEND_UNKNOWN;
5667d62bf6fSMaxime Coquelin 	}
567f908b22eSAdrian Moreno 
5687d62bf6fSMaxime Coquelin 	if (S_ISSOCK(sb.st_mode)) {
5697d62bf6fSMaxime Coquelin 		return VIRTIO_USER_BACKEND_VHOST_USER;
5707d62bf6fSMaxime Coquelin 	} else if (S_ISCHR(sb.st_mode)) {
5717d62bf6fSMaxime Coquelin 		if (major(sb.st_rdev) == MISC_MAJOR)
5727d62bf6fSMaxime Coquelin 			return VIRTIO_USER_BACKEND_VHOST_KERNEL;
5737d62bf6fSMaxime Coquelin 		if (major(sb.st_rdev) == vdpa_dynamic_major_num())
5747d62bf6fSMaxime Coquelin 			return VIRTIO_USER_BACKEND_VHOST_VDPA;
5757d62bf6fSMaxime Coquelin 	}
5767d62bf6fSMaxime Coquelin 	return VIRTIO_USER_BACKEND_UNKNOWN;
577f908b22eSAdrian Moreno }
578f908b22eSAdrian Moreno 
579ce2eabddSJianfeng Tan static struct rte_eth_dev *
580050fe6e9SJan Blunck virtio_user_eth_dev_alloc(struct rte_vdev_device *vdev)
581ce2eabddSJianfeng Tan {
582ce2eabddSJianfeng Tan 	struct rte_eth_dev *eth_dev;
583ce2eabddSJianfeng Tan 	struct rte_eth_dev_data *data;
584ce2eabddSJianfeng Tan 	struct virtio_hw *hw;
585ce2eabddSJianfeng Tan 	struct virtio_user_dev *dev;
586ce2eabddSJianfeng Tan 
587050fe6e9SJan Blunck 	eth_dev = rte_eth_vdev_allocate(vdev, sizeof(*hw));
588ce2eabddSJianfeng Tan 	if (!eth_dev) {
589ce2eabddSJianfeng Tan 		PMD_INIT_LOG(ERR, "cannot alloc rte_eth_dev");
590ce2eabddSJianfeng Tan 		return NULL;
591ce2eabddSJianfeng Tan 	}
592ce2eabddSJianfeng Tan 
593ce2eabddSJianfeng Tan 	data = eth_dev->data;
594050fe6e9SJan Blunck 	hw = eth_dev->data->dev_private;
595ce2eabddSJianfeng Tan 
596ce2eabddSJianfeng Tan 	dev = rte_zmalloc(NULL, sizeof(*dev), 0);
597ce2eabddSJianfeng Tan 	if (!dev) {
598ce2eabddSJianfeng Tan 		PMD_INIT_LOG(ERR, "malloc virtio_user_dev failed");
599ce2eabddSJianfeng Tan 		rte_eth_dev_release_port(eth_dev);
600ce2eabddSJianfeng Tan 		return NULL;
601ce2eabddSJianfeng Tan 	}
602ce2eabddSJianfeng Tan 
603553f4593SYuanhan Liu 	hw->port_id = data->port_id;
6043d4fb6fdSJianfeng Tan 	dev->port_id = data->port_id;
605553f4593SYuanhan Liu 	virtio_hw_internal[hw->port_id].vtpci_ops = &virtio_user_ops;
606ef53b603SJianfeng Tan 	/*
607ef53b603SJianfeng Tan 	 * MSIX is required to enable LSC (see virtio_init_device).
608ef53b603SJianfeng Tan 	 * Here just pretend that we support msix.
609ef53b603SJianfeng Tan 	 */
610ef53b603SJianfeng Tan 	hw->use_msix = 1;
611ce2eabddSJianfeng Tan 	hw->modern   = 0;
6124710e16aSMarvin Liu 	hw->use_vec_rx = 0;
61377d66da8SMarvin Liu 	hw->use_vec_tx = 0;
6149f233f54SMarvin Liu 	hw->use_inorder_rx = 0;
6159f233f54SMarvin Liu 	hw->use_inorder_tx = 0;
616ce2eabddSJianfeng Tan 	hw->virtio_user_dev = dev;
617ce2eabddSJianfeng Tan 	return eth_dev;
618ce2eabddSJianfeng Tan }
619ce2eabddSJianfeng Tan 
620ca8326a9SJianfeng Tan static void
621ca8326a9SJianfeng Tan virtio_user_eth_dev_free(struct rte_eth_dev *eth_dev)
622ca8326a9SJianfeng Tan {
623ca8326a9SJianfeng Tan 	struct rte_eth_dev_data *data = eth_dev->data;
624ca8326a9SJianfeng Tan 	struct virtio_hw *hw = data->dev_private;
625ca8326a9SJianfeng Tan 
626ca8326a9SJianfeng Tan 	rte_free(hw->virtio_user_dev);
627ca8326a9SJianfeng Tan 	rte_eth_dev_release_port(eth_dev);
628ca8326a9SJianfeng Tan }
629ca8326a9SJianfeng Tan 
630ce2eabddSJianfeng Tan /* Dev initialization routine. Invoked once for each virtio vdev at
631c3b2fdfeSYong Wang  * EAL init time, see rte_bus_probe().
632ce2eabddSJianfeng Tan  * Returns 0 on success.
633ce2eabddSJianfeng Tan  */
634ce2eabddSJianfeng Tan static int
6355d2aa461SJan Blunck virtio_user_pmd_probe(struct rte_vdev_device *dev)
636ce2eabddSJianfeng Tan {
63714f06474SJianfeng Tan 	struct rte_kvargs *kvlist = NULL;
638ce2eabddSJianfeng Tan 	struct rte_eth_dev *eth_dev;
639ce2eabddSJianfeng Tan 	struct virtio_hw *hw;
640f908b22eSAdrian Moreno 	enum virtio_user_backend_type backend_type = VIRTIO_USER_BACKEND_UNKNOWN;
641ce2eabddSJianfeng Tan 	uint64_t queues = VIRTIO_USER_DEF_Q_NUM;
642ce2eabddSJianfeng Tan 	uint64_t cq = VIRTIO_USER_DEF_CQ_EN;
643ce2eabddSJianfeng Tan 	uint64_t queue_size = VIRTIO_USER_DEF_Q_SZ;
644bd8f50a4SZhiyong Yang 	uint64_t server_mode = VIRTIO_USER_DEF_SERVER_MODE;
645488ed97aSMarvin Liu 	uint64_t mrg_rxbuf = 1;
646488ed97aSMarvin Liu 	uint64_t in_order = 1;
6479070f88bSTiwei Bie 	uint64_t packed_vq = 0;
6486b7eefbcSMarvin Liu 	uint64_t vectorized = 0;
649ce2eabddSJianfeng Tan 	char *path = NULL;
6504214a1b4SWenfeng Liu 	char *ifname = NULL;
651ce2eabddSJianfeng Tan 	char *mac_addr = NULL;
652ce2eabddSJianfeng Tan 	int ret = -1;
653ce2eabddSJianfeng Tan 
6541c8489daSTiwei Bie 	if (rte_eal_process_type() == RTE_PROC_SECONDARY) {
6551c8489daSTiwei Bie 		const char *name = rte_vdev_device_name(dev);
6561c8489daSTiwei Bie 		eth_dev = rte_eth_dev_attach_secondary(name);
6571c8489daSTiwei Bie 		if (!eth_dev) {
65888fa5bb6SStephen Hemminger 			PMD_INIT_LOG(ERR, "Failed to probe %s", name);
6591c8489daSTiwei Bie 			return -1;
6601c8489daSTiwei Bie 		}
6611c8489daSTiwei Bie 
6621c8489daSTiwei Bie 		if (eth_virtio_dev_init(eth_dev) < 0) {
6631c8489daSTiwei Bie 			PMD_INIT_LOG(ERR, "eth_virtio_dev_init fails");
6641c8489daSTiwei Bie 			rte_eth_dev_release_port(eth_dev);
6651c8489daSTiwei Bie 			return -1;
6661c8489daSTiwei Bie 		}
6671c8489daSTiwei Bie 
6681c8489daSTiwei Bie 		eth_dev->dev_ops = &virtio_user_secondary_eth_dev_ops;
6691c8489daSTiwei Bie 		eth_dev->device = &dev->device;
6701c8489daSTiwei Bie 		rte_eth_dev_probing_finish(eth_dev);
6711c8489daSTiwei Bie 		return 0;
6721c8489daSTiwei Bie 	}
6731c8489daSTiwei Bie 
6745d2aa461SJan Blunck 	kvlist = rte_kvargs_parse(rte_vdev_device_args(dev), valid_args);
675ce2eabddSJianfeng Tan 	if (!kvlist) {
676ce2eabddSJianfeng Tan 		PMD_INIT_LOG(ERR, "error when parsing param");
677ce2eabddSJianfeng Tan 		goto end;
678ce2eabddSJianfeng Tan 	}
679ce2eabddSJianfeng Tan 
6809cca159eSMaxime Coquelin 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_PATH) == 1) {
681ca8326a9SJianfeng Tan 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_PATH,
682ca8326a9SJianfeng Tan 				       &get_string_arg, &path) < 0) {
683404bd6bfSJianfeng Tan 			PMD_INIT_LOG(ERR, "error to parse %s",
684404bd6bfSJianfeng Tan 				     VIRTIO_USER_ARG_PATH);
685404bd6bfSJianfeng Tan 			goto end;
686404bd6bfSJianfeng Tan 		}
6879cca159eSMaxime Coquelin 	} else {
688f2462150SFerruh Yigit 		PMD_INIT_LOG(ERR, "arg %s is mandatory for virtio_user",
6892dac0df4STiwei Bie 			     VIRTIO_USER_ARG_PATH);
690ce2eabddSJianfeng Tan 		goto end;
691ce2eabddSJianfeng Tan 	}
692ce2eabddSJianfeng Tan 
693f908b22eSAdrian Moreno 	backend_type = virtio_user_backend_type(path);
694f908b22eSAdrian Moreno 	if (backend_type == VIRTIO_USER_BACKEND_UNKNOWN) {
695f908b22eSAdrian Moreno 		PMD_INIT_LOG(ERR,
696f908b22eSAdrian Moreno 			     "unable to determine backend type for path %s",
697f908b22eSAdrian Moreno 			path);
698f908b22eSAdrian Moreno 		goto end;
699f908b22eSAdrian Moreno 	}
700f908b22eSAdrian Moreno 
701f908b22eSAdrian Moreno 
7024214a1b4SWenfeng Liu 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_INTERFACE_NAME) == 1) {
703f908b22eSAdrian Moreno 		if (backend_type != VIRTIO_USER_BACKEND_VHOST_KERNEL) {
7044214a1b4SWenfeng Liu 			PMD_INIT_LOG(ERR,
7054214a1b4SWenfeng Liu 				"arg %s applies only to vhost-kernel backend",
7064214a1b4SWenfeng Liu 				VIRTIO_USER_ARG_INTERFACE_NAME);
7074214a1b4SWenfeng Liu 			goto end;
7084214a1b4SWenfeng Liu 		}
7094214a1b4SWenfeng Liu 
7104214a1b4SWenfeng Liu 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_INTERFACE_NAME,
7114214a1b4SWenfeng Liu 				       &get_string_arg, &ifname) < 0) {
7124214a1b4SWenfeng Liu 			PMD_INIT_LOG(ERR, "error to parse %s",
7134214a1b4SWenfeng Liu 				     VIRTIO_USER_ARG_INTERFACE_NAME);
7144214a1b4SWenfeng Liu 			goto end;
7154214a1b4SWenfeng Liu 		}
7164214a1b4SWenfeng Liu 	}
7174214a1b4SWenfeng Liu 
718404bd6bfSJianfeng Tan 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_MAC) == 1) {
719ca8326a9SJianfeng Tan 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_MAC,
720ca8326a9SJianfeng Tan 				       &get_string_arg, &mac_addr) < 0) {
721404bd6bfSJianfeng Tan 			PMD_INIT_LOG(ERR, "error to parse %s",
722404bd6bfSJianfeng Tan 				     VIRTIO_USER_ARG_MAC);
723404bd6bfSJianfeng Tan 			goto end;
724404bd6bfSJianfeng Tan 		}
725404bd6bfSJianfeng Tan 	}
726ce2eabddSJianfeng Tan 
727404bd6bfSJianfeng Tan 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_QUEUE_SIZE) == 1) {
728ca8326a9SJianfeng Tan 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_QUEUE_SIZE,
729ca8326a9SJianfeng Tan 				       &get_integer_arg, &queue_size) < 0) {
730404bd6bfSJianfeng Tan 			PMD_INIT_LOG(ERR, "error to parse %s",
731404bd6bfSJianfeng Tan 				     VIRTIO_USER_ARG_QUEUE_SIZE);
732404bd6bfSJianfeng Tan 			goto end;
733404bd6bfSJianfeng Tan 		}
734404bd6bfSJianfeng Tan 	}
735ce2eabddSJianfeng Tan 
736404bd6bfSJianfeng Tan 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_QUEUES_NUM) == 1) {
737ca8326a9SJianfeng Tan 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_QUEUES_NUM,
738ca8326a9SJianfeng Tan 				       &get_integer_arg, &queues) < 0) {
739404bd6bfSJianfeng Tan 			PMD_INIT_LOG(ERR, "error to parse %s",
740404bd6bfSJianfeng Tan 				     VIRTIO_USER_ARG_QUEUES_NUM);
741404bd6bfSJianfeng Tan 			goto end;
742404bd6bfSJianfeng Tan 		}
743404bd6bfSJianfeng Tan 	}
744ce2eabddSJianfeng Tan 
745bd8f50a4SZhiyong Yang 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_SERVER_MODE) == 1) {
746bd8f50a4SZhiyong Yang 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_SERVER_MODE,
747bd8f50a4SZhiyong Yang 				       &get_integer_arg, &server_mode) < 0) {
748bd8f50a4SZhiyong Yang 			PMD_INIT_LOG(ERR, "error to parse %s",
749bd8f50a4SZhiyong Yang 				     VIRTIO_USER_ARG_SERVER_MODE);
750bd8f50a4SZhiyong Yang 			goto end;
751bd8f50a4SZhiyong Yang 		}
752bd8f50a4SZhiyong Yang 	}
753bd8f50a4SZhiyong Yang 
754404bd6bfSJianfeng Tan 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_CQ_NUM) == 1) {
755ca8326a9SJianfeng Tan 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_CQ_NUM,
756ca8326a9SJianfeng Tan 				       &get_integer_arg, &cq) < 0) {
757404bd6bfSJianfeng Tan 			PMD_INIT_LOG(ERR, "error to parse %s",
758404bd6bfSJianfeng Tan 				     VIRTIO_USER_ARG_CQ_NUM);
759404bd6bfSJianfeng Tan 			goto end;
760404bd6bfSJianfeng Tan 		}
761404bd6bfSJianfeng Tan 	} else if (queues > 1) {
7621b69528eSJianfeng Tan 		cq = 1;
763404bd6bfSJianfeng Tan 	}
7641b69528eSJianfeng Tan 
76534f3966cSYuanhan Liu 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_PACKED_VQ) == 1) {
76634f3966cSYuanhan Liu 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_PACKED_VQ,
76734f3966cSYuanhan Liu 				       &get_integer_arg, &packed_vq) < 0) {
76834f3966cSYuanhan Liu 			PMD_INIT_LOG(ERR, "error to parse %s",
76934f3966cSYuanhan Liu 				     VIRTIO_USER_ARG_PACKED_VQ);
77034f3966cSYuanhan Liu 			goto end;
77134f3966cSYuanhan Liu 		}
77234f3966cSYuanhan Liu 	}
77334f3966cSYuanhan Liu 
7746b7eefbcSMarvin Liu 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_VECTORIZED) == 1) {
7756b7eefbcSMarvin Liu 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_VECTORIZED,
7766b7eefbcSMarvin Liu 				       &get_integer_arg, &vectorized) < 0) {
7776b7eefbcSMarvin Liu 			PMD_INIT_LOG(ERR, "error to parse %s",
7786b7eefbcSMarvin Liu 				     VIRTIO_USER_ARG_VECTORIZED);
7796b7eefbcSMarvin Liu 			goto end;
7806b7eefbcSMarvin Liu 		}
7816b7eefbcSMarvin Liu 	}
7826b7eefbcSMarvin Liu 
7831b69528eSJianfeng Tan 	if (queues > 1 && cq == 0) {
7841b69528eSJianfeng Tan 		PMD_INIT_LOG(ERR, "multi-q requires ctrl-q");
7851b69528eSJianfeng Tan 		goto end;
7861b69528eSJianfeng Tan 	}
787ce2eabddSJianfeng Tan 
7882269b9aeSWenfeng Liu 	if (queues > VIRTIO_MAX_VIRTQUEUE_PAIRS) {
7892269b9aeSWenfeng Liu 		PMD_INIT_LOG(ERR, "arg %s %" PRIu64 " exceeds the limit %u",
7902269b9aeSWenfeng Liu 			VIRTIO_USER_ARG_QUEUES_NUM, queues,
7912269b9aeSWenfeng Liu 			VIRTIO_MAX_VIRTQUEUE_PAIRS);
7922269b9aeSWenfeng Liu 		goto end;
7932269b9aeSWenfeng Liu 	}
7942269b9aeSWenfeng Liu 
795488ed97aSMarvin Liu 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_MRG_RXBUF) == 1) {
796488ed97aSMarvin Liu 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_MRG_RXBUF,
797488ed97aSMarvin Liu 				       &get_integer_arg, &mrg_rxbuf) < 0) {
798488ed97aSMarvin Liu 			PMD_INIT_LOG(ERR, "error to parse %s",
799488ed97aSMarvin Liu 				     VIRTIO_USER_ARG_MRG_RXBUF);
800488ed97aSMarvin Liu 			goto end;
801488ed97aSMarvin Liu 		}
802488ed97aSMarvin Liu 	}
803488ed97aSMarvin Liu 
804488ed97aSMarvin Liu 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_IN_ORDER) == 1) {
805488ed97aSMarvin Liu 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_IN_ORDER,
806488ed97aSMarvin Liu 				       &get_integer_arg, &in_order) < 0) {
807488ed97aSMarvin Liu 			PMD_INIT_LOG(ERR, "error to parse %s",
808488ed97aSMarvin Liu 				     VIRTIO_USER_ARG_IN_ORDER);
809488ed97aSMarvin Liu 			goto end;
810488ed97aSMarvin Liu 		}
811488ed97aSMarvin Liu 	}
812488ed97aSMarvin Liu 
813050fe6e9SJan Blunck 	eth_dev = virtio_user_eth_dev_alloc(dev);
814ce2eabddSJianfeng Tan 	if (!eth_dev) {
815e8df94b8SJianfeng Tan 		PMD_INIT_LOG(ERR, "virtio_user fails to alloc device");
816ce2eabddSJianfeng Tan 		goto end;
817ce2eabddSJianfeng Tan 	}
818ce2eabddSJianfeng Tan 
819ce2eabddSJianfeng Tan 	hw = eth_dev->data->dev_private;
820ce2eabddSJianfeng Tan 	if (virtio_user_dev_init(hw->virtio_user_dev, path, queues, cq,
8211c8489daSTiwei Bie 			 queue_size, mac_addr, &ifname, server_mode,
822f908b22eSAdrian Moreno 			 mrg_rxbuf, in_order, packed_vq, backend_type) < 0) {
823ca8326a9SJianfeng Tan 		PMD_INIT_LOG(ERR, "virtio_user_dev_init fails");
824ca8326a9SJianfeng Tan 		virtio_user_eth_dev_free(eth_dev);
825ce2eabddSJianfeng Tan 		goto end;
826ca8326a9SJianfeng Tan 	}
827fbe90cddSThomas Monjalon 
82887db93e0SDavid Marchand 	/* previously called by pci probing for physical dev */
829ce2eabddSJianfeng Tan 	if (eth_virtio_dev_init(eth_dev) < 0) {
830ce2eabddSJianfeng Tan 		PMD_INIT_LOG(ERR, "eth_virtio_dev_init fails");
831ca8326a9SJianfeng Tan 		virtio_user_eth_dev_free(eth_dev);
832ce2eabddSJianfeng Tan 		goto end;
833ce2eabddSJianfeng Tan 	}
834fbe90cddSThomas Monjalon 
83577d66da8SMarvin Liu 	if (vectorized) {
83677d66da8SMarvin Liu 		if (packed_vq) {
83777d66da8SMarvin Liu #if defined(CC_AVX512_SUPPORT)
8386b7eefbcSMarvin Liu 			hw->use_vec_rx = 1;
83977d66da8SMarvin Liu 			hw->use_vec_tx = 1;
84077d66da8SMarvin Liu #else
84177d66da8SMarvin Liu 			PMD_INIT_LOG(INFO,
84277d66da8SMarvin Liu 				"building environment do not support packed ring vectorized");
84377d66da8SMarvin Liu #endif
84477d66da8SMarvin Liu 		} else {
84577d66da8SMarvin Liu 			hw->use_vec_rx = 1;
84677d66da8SMarvin Liu 		}
84777d66da8SMarvin Liu 	}
8486b7eefbcSMarvin Liu 
849fbe90cddSThomas Monjalon 	rte_eth_dev_probing_finish(eth_dev);
850ce2eabddSJianfeng Tan 	ret = 0;
851ce2eabddSJianfeng Tan 
852ce2eabddSJianfeng Tan end:
85314f06474SJianfeng Tan 	if (kvlist)
85414f06474SJianfeng Tan 		rte_kvargs_free(kvlist);
855ce2eabddSJianfeng Tan 	if (path)
856ce2eabddSJianfeng Tan 		free(path);
857ce2eabddSJianfeng Tan 	if (mac_addr)
858ce2eabddSJianfeng Tan 		free(mac_addr);
8594214a1b4SWenfeng Liu 	if (ifname)
8604214a1b4SWenfeng Liu 		free(ifname);
861ce2eabddSJianfeng Tan 	return ret;
862ce2eabddSJianfeng Tan }
863ce2eabddSJianfeng Tan 
864ce2eabddSJianfeng Tan static int
8655d2aa461SJan Blunck virtio_user_pmd_remove(struct rte_vdev_device *vdev)
866ce2eabddSJianfeng Tan {
8675d2aa461SJan Blunck 	const char *name;
868ce2eabddSJianfeng Tan 	struct rte_eth_dev *eth_dev;
869ce2eabddSJianfeng Tan 
8705d2aa461SJan Blunck 	if (!vdev)
871ce2eabddSJianfeng Tan 		return -EINVAL;
872ce2eabddSJianfeng Tan 
8735d2aa461SJan Blunck 	name = rte_vdev_device_name(vdev);
874f2462150SFerruh Yigit 	PMD_DRV_LOG(INFO, "Un-Initializing %s", name);
875ce2eabddSJianfeng Tan 	eth_dev = rte_eth_dev_allocated(name);
8767f468b2eSTiwei Bie 	/* Port has already been released by close. */
877ce2eabddSJianfeng Tan 	if (!eth_dev)
8787f468b2eSTiwei Bie 		return 0;
879ce2eabddSJianfeng Tan 
8801c8489daSTiwei Bie 	if (rte_eal_process_type() != RTE_PROC_PRIMARY)
8811c8489daSTiwei Bie 		return rte_eth_dev_release_port(eth_dev);
8821c8489daSTiwei Bie 
883ce2eabddSJianfeng Tan 	/* make sure the device is stopped, queues freed */
884*8a5a0aadSThomas Monjalon 	return rte_eth_dev_close(eth_dev->data->port_id);
885ce2eabddSJianfeng Tan }
886ce2eabddSJianfeng Tan 
88786e71eb2SMaxime Coquelin static int virtio_user_pmd_dma_map(struct rte_vdev_device *vdev, void *addr,
88886e71eb2SMaxime Coquelin 		uint64_t iova, size_t len)
88986e71eb2SMaxime Coquelin {
89086e71eb2SMaxime Coquelin 	const char *name;
89186e71eb2SMaxime Coquelin 	struct rte_eth_dev *eth_dev;
89286e71eb2SMaxime Coquelin 	struct virtio_user_dev *dev;
89386e71eb2SMaxime Coquelin 	struct virtio_hw *hw;
89486e71eb2SMaxime Coquelin 
89586e71eb2SMaxime Coquelin 	if (!vdev)
89686e71eb2SMaxime Coquelin 		return -EINVAL;
89786e71eb2SMaxime Coquelin 
89886e71eb2SMaxime Coquelin 	name = rte_vdev_device_name(vdev);
89986e71eb2SMaxime Coquelin 	eth_dev = rte_eth_dev_allocated(name);
90086e71eb2SMaxime Coquelin 	/* Port has already been released by close. */
90186e71eb2SMaxime Coquelin 	if (!eth_dev)
90286e71eb2SMaxime Coquelin 		return 0;
90386e71eb2SMaxime Coquelin 
90486e71eb2SMaxime Coquelin 	hw = (struct virtio_hw *)eth_dev->data->dev_private;
90586e71eb2SMaxime Coquelin 	dev = hw->virtio_user_dev;
90686e71eb2SMaxime Coquelin 
90786e71eb2SMaxime Coquelin 	if (dev->ops->dma_map)
90886e71eb2SMaxime Coquelin 		return dev->ops->dma_map(dev, addr, iova, len);
90986e71eb2SMaxime Coquelin 
91086e71eb2SMaxime Coquelin 	return 0;
91186e71eb2SMaxime Coquelin }
91286e71eb2SMaxime Coquelin 
91386e71eb2SMaxime Coquelin static int virtio_user_pmd_dma_unmap(struct rte_vdev_device *vdev, void *addr,
91486e71eb2SMaxime Coquelin 		uint64_t iova, size_t len)
91586e71eb2SMaxime Coquelin {
91686e71eb2SMaxime Coquelin 	const char *name;
91786e71eb2SMaxime Coquelin 	struct rte_eth_dev *eth_dev;
91886e71eb2SMaxime Coquelin 	struct virtio_user_dev *dev;
91986e71eb2SMaxime Coquelin 	struct virtio_hw *hw;
92086e71eb2SMaxime Coquelin 
92186e71eb2SMaxime Coquelin 	if (!vdev)
92286e71eb2SMaxime Coquelin 		return -EINVAL;
92386e71eb2SMaxime Coquelin 
92486e71eb2SMaxime Coquelin 	name = rte_vdev_device_name(vdev);
92586e71eb2SMaxime Coquelin 	eth_dev = rte_eth_dev_allocated(name);
92686e71eb2SMaxime Coquelin 	/* Port has already been released by close. */
92786e71eb2SMaxime Coquelin 	if (!eth_dev)
92886e71eb2SMaxime Coquelin 		return 0;
92986e71eb2SMaxime Coquelin 
93086e71eb2SMaxime Coquelin 	hw = (struct virtio_hw *)eth_dev->data->dev_private;
93186e71eb2SMaxime Coquelin 	dev = hw->virtio_user_dev;
93286e71eb2SMaxime Coquelin 
93386e71eb2SMaxime Coquelin 	if (dev->ops->dma_unmap)
93486e71eb2SMaxime Coquelin 		return dev->ops->dma_unmap(dev, addr, iova, len);
93586e71eb2SMaxime Coquelin 
93686e71eb2SMaxime Coquelin 	return 0;
93786e71eb2SMaxime Coquelin }
93886e71eb2SMaxime Coquelin 
939fe363dd4SJan Viktorin static struct rte_vdev_driver virtio_user_driver = {
94050a3345fSShreyansh Jain 	.probe = virtio_user_pmd_probe,
94150a3345fSShreyansh Jain 	.remove = virtio_user_pmd_remove,
94286e71eb2SMaxime Coquelin 	.dma_map = virtio_user_pmd_dma_map,
94386e71eb2SMaxime Coquelin 	.dma_unmap = virtio_user_pmd_dma_unmap,
944ce2eabddSJianfeng Tan };
945ce2eabddSJianfeng Tan 
94601f19227SShreyansh Jain RTE_PMD_REGISTER_VDEV(net_virtio_user, virtio_user_driver);
9479fa80cb2SJan Blunck RTE_PMD_REGISTER_ALIAS(net_virtio_user, virtio_user);
94801f19227SShreyansh Jain RTE_PMD_REGISTER_PARAM_STRING(net_virtio_user,
94944e32a67SPablo de Lara 	"path=<path> "
95044e32a67SPablo de Lara 	"mac=<mac addr> "
95144e32a67SPablo de Lara 	"cq=<int> "
95244e32a67SPablo de Lara 	"queue_size=<int> "
9534214a1b4SWenfeng Liu 	"queues=<int> "
954488ed97aSMarvin Liu 	"iface=<string> "
95562758c76STiwei Bie 	"server=<0|1> "
956488ed97aSMarvin Liu 	"mrg_rxbuf=<0|1> "
9579070f88bSTiwei Bie 	"in_order=<0|1> "
958b0db4beaSIvan Dyukov 	"packed_vq=<0|1> "
9596b7eefbcSMarvin Liu 	"speed=<int> "
9606b7eefbcSMarvin Liu 	"vectorized=<0|1>");
961