xref: /dpdk/drivers/net/virtio/virtio_user_ethdev.c (revision 88fa5bb6b9807d55a3fbd34e5537fcf1ee7efb80)
15566a3e3SBruce Richardson /* SPDX-License-Identifier: BSD-3-Clause
25566a3e3SBruce Richardson  * Copyright(c) 2010-2016 Intel Corporation
3e9efa4d9SJianfeng Tan  */
4e9efa4d9SJianfeng Tan 
5e9efa4d9SJianfeng Tan #include <stdint.h>
6e9efa4d9SJianfeng Tan #include <sys/types.h>
7e9efa4d9SJianfeng Tan #include <unistd.h>
8ef53b603SJianfeng Tan #include <fcntl.h>
9ef53b603SJianfeng Tan #include <sys/socket.h>
10e9efa4d9SJianfeng Tan 
11ce2eabddSJianfeng Tan #include <rte_malloc.h>
12ce2eabddSJianfeng Tan #include <rte_kvargs.h>
13050fe6e9SJan Blunck #include <rte_ethdev_vdev.h>
14d4a586d2SJianfeng Tan #include <rte_bus_vdev.h>
15ef53b603SJianfeng Tan #include <rte_alarm.h>
166ebbf410SXuan Ding #include <rte_cycles.h>
17ce2eabddSJianfeng Tan 
18ce2eabddSJianfeng Tan #include "virtio_ethdev.h"
19e9efa4d9SJianfeng Tan #include "virtio_logs.h"
20e9efa4d9SJianfeng Tan #include "virtio_pci.h"
21e9efa4d9SJianfeng Tan #include "virtqueue.h"
221b69528eSJianfeng Tan #include "virtio_rxtx.h"
23e9efa4d9SJianfeng Tan #include "virtio_user/virtio_user_dev.h"
247f468b2eSTiwei Bie #include "virtio_user/vhost.h"
25e9efa4d9SJianfeng Tan 
/* Return the virtio_user_dev pointer stored in a virtio_hw instance. */
#define virtio_user_get_dev(hwp) \
	((struct virtio_user_dev *)(hwp)->virtio_user_dev)
28e9efa4d9SJianfeng Tan 
296ebbf410SXuan Ding static void
306ebbf410SXuan Ding virtio_user_reset_queues_packed(struct rte_eth_dev *dev)
316ebbf410SXuan Ding {
326ebbf410SXuan Ding 	struct virtio_hw *hw = dev->data->dev_private;
336ebbf410SXuan Ding 	struct virtnet_rx *rxvq;
346ebbf410SXuan Ding 	struct virtnet_tx *txvq;
356ebbf410SXuan Ding 	uint16_t i;
366ebbf410SXuan Ding 
376ebbf410SXuan Ding 	/* Add lock to avoid queue contention. */
386ebbf410SXuan Ding 	rte_spinlock_lock(&hw->state_lock);
396ebbf410SXuan Ding 	hw->started = 0;
406ebbf410SXuan Ding 
416ebbf410SXuan Ding 	/*
426ebbf410SXuan Ding 	 * Waitting for datapath to complete before resetting queues.
436ebbf410SXuan Ding 	 * 1 ms should be enough for the ongoing Tx/Rx function to finish.
446ebbf410SXuan Ding 	 */
456ebbf410SXuan Ding 	rte_delay_ms(1);
466ebbf410SXuan Ding 
476ebbf410SXuan Ding 	/* Vring reset for each Tx queue and Rx queue. */
486ebbf410SXuan Ding 	for (i = 0; i < dev->data->nb_rx_queues; i++) {
496ebbf410SXuan Ding 		rxvq = dev->data->rx_queues[i];
506ebbf410SXuan Ding 		virtqueue_rxvq_reset_packed(rxvq->vq);
516ebbf410SXuan Ding 		virtio_dev_rx_queue_setup_finish(dev, i);
526ebbf410SXuan Ding 	}
536ebbf410SXuan Ding 
546ebbf410SXuan Ding 	for (i = 0; i < dev->data->nb_tx_queues; i++) {
556ebbf410SXuan Ding 		txvq = dev->data->tx_queues[i];
566ebbf410SXuan Ding 		virtqueue_txvq_reset_packed(txvq->vq);
576ebbf410SXuan Ding 	}
586ebbf410SXuan Ding 
596ebbf410SXuan Ding 	hw->started = 1;
606ebbf410SXuan Ding 	rte_spinlock_unlock(&hw->state_lock);
616ebbf410SXuan Ding }
626ebbf410SXuan Ding 
636ebbf410SXuan Ding 
64bd8f50a4SZhiyong Yang static int
65bd8f50a4SZhiyong Yang virtio_user_server_reconnect(struct virtio_user_dev *dev)
66bd8f50a4SZhiyong Yang {
67bd8f50a4SZhiyong Yang 	int ret;
68bd8f50a4SZhiyong Yang 	int connectfd;
69bd8f50a4SZhiyong Yang 	struct rte_eth_dev *eth_dev = &rte_eth_devices[dev->port_id];
706ebbf410SXuan Ding 	struct virtio_hw *hw = eth_dev->data->dev_private;
71bd8f50a4SZhiyong Yang 
72bd8f50a4SZhiyong Yang 	connectfd = accept(dev->listenfd, NULL, NULL);
73bd8f50a4SZhiyong Yang 	if (connectfd < 0)
74bd8f50a4SZhiyong Yang 		return -1;
75bd8f50a4SZhiyong Yang 
76bd8f50a4SZhiyong Yang 	dev->vhostfd = connectfd;
77201a4165SZhiyong Yang 	if (dev->ops->send_request(dev, VHOST_USER_GET_FEATURES,
78201a4165SZhiyong Yang 				   &dev->device_features) < 0) {
79201a4165SZhiyong Yang 		PMD_INIT_LOG(ERR, "get_features failed: %s",
80201a4165SZhiyong Yang 			     strerror(errno));
81201a4165SZhiyong Yang 		return -1;
82201a4165SZhiyong Yang 	}
83201a4165SZhiyong Yang 
84bb97d2ddSTiwei Bie 	dev->device_features |= dev->frontend_features;
85bb97d2ddSTiwei Bie 
867c66ff61SMarvin Liu 	/* umask vhost-user unsupported features */
877c66ff61SMarvin Liu 	dev->device_features &= ~(dev->unsupported_features);
88201a4165SZhiyong Yang 
89201a4165SZhiyong Yang 	dev->features &= dev->device_features;
90201a4165SZhiyong Yang 
916ebbf410SXuan Ding 	/* For packed ring, resetting queues is required in reconnection. */
9292771257STiwei Bie 	if (vtpci_packed_queue(hw)) {
936ebbf410SXuan Ding 		PMD_INIT_LOG(NOTICE, "Packets on the fly will be dropped"
946ebbf410SXuan Ding 				" when packed ring reconnecting.");
956ebbf410SXuan Ding 		virtio_user_reset_queues_packed(eth_dev);
9692771257STiwei Bie 	}
976ebbf410SXuan Ding 
98bd8f50a4SZhiyong Yang 	ret = virtio_user_start_device(dev);
99bd8f50a4SZhiyong Yang 	if (ret < 0)
100bd8f50a4SZhiyong Yang 		return -1;
101bd8f50a4SZhiyong Yang 
102201a4165SZhiyong Yang 	if (dev->queue_pairs > 1) {
103201a4165SZhiyong Yang 		ret = virtio_user_handle_mq(dev, dev->queue_pairs);
104201a4165SZhiyong Yang 		if (ret != 0) {
105201a4165SZhiyong Yang 			PMD_INIT_LOG(ERR, "Fails to enable multi-queue pairs!");
106201a4165SZhiyong Yang 			return -1;
107201a4165SZhiyong Yang 		}
108201a4165SZhiyong Yang 	}
109bd8f50a4SZhiyong Yang 	if (eth_dev->data->dev_flags & RTE_ETH_DEV_INTR_LSC) {
110bd8f50a4SZhiyong Yang 		if (rte_intr_disable(eth_dev->intr_handle) < 0) {
111bd8f50a4SZhiyong Yang 			PMD_DRV_LOG(ERR, "interrupt disable failed");
112bd8f50a4SZhiyong Yang 			return -1;
113bd8f50a4SZhiyong Yang 		}
114bd8f50a4SZhiyong Yang 		rte_intr_callback_unregister(eth_dev->intr_handle,
115bd8f50a4SZhiyong Yang 					     virtio_interrupt_handler,
116bd8f50a4SZhiyong Yang 					     eth_dev);
117bd8f50a4SZhiyong Yang 		eth_dev->intr_handle->fd = connectfd;
118bd8f50a4SZhiyong Yang 		rte_intr_callback_register(eth_dev->intr_handle,
119bd8f50a4SZhiyong Yang 					   virtio_interrupt_handler, eth_dev);
120bd8f50a4SZhiyong Yang 
121bd8f50a4SZhiyong Yang 		if (rte_intr_enable(eth_dev->intr_handle) < 0) {
122bd8f50a4SZhiyong Yang 			PMD_DRV_LOG(ERR, "interrupt enable failed");
123bd8f50a4SZhiyong Yang 			return -1;
124bd8f50a4SZhiyong Yang 		}
125bd8f50a4SZhiyong Yang 	}
126bd8f50a4SZhiyong Yang 	PMD_INIT_LOG(NOTICE, "server mode virtio-user reconnection succeeds!");
127bd8f50a4SZhiyong Yang 	return 0;
128bd8f50a4SZhiyong Yang }
129bd8f50a4SZhiyong Yang 
130e9efa4d9SJianfeng Tan static void
131ef53b603SJianfeng Tan virtio_user_delayed_handler(void *param)
132ef53b603SJianfeng Tan {
133ef53b603SJianfeng Tan 	struct virtio_hw *hw = (struct virtio_hw *)param;
134bd8f50a4SZhiyong Yang 	struct rte_eth_dev *eth_dev = &rte_eth_devices[hw->port_id];
135bd8f50a4SZhiyong Yang 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
136ef53b603SJianfeng Tan 
137bd8f50a4SZhiyong Yang 	if (rte_intr_disable(eth_dev->intr_handle) < 0) {
138bd8f50a4SZhiyong Yang 		PMD_DRV_LOG(ERR, "interrupt disable failed");
139bd8f50a4SZhiyong Yang 		return;
140bd8f50a4SZhiyong Yang 	}
141bd8f50a4SZhiyong Yang 	rte_intr_callback_unregister(eth_dev->intr_handle,
142bd8f50a4SZhiyong Yang 				     virtio_interrupt_handler, eth_dev);
143bd8f50a4SZhiyong Yang 	if (dev->is_server) {
144bd8f50a4SZhiyong Yang 		if (dev->vhostfd >= 0) {
145bd8f50a4SZhiyong Yang 			close(dev->vhostfd);
146bd8f50a4SZhiyong Yang 			dev->vhostfd = -1;
147bd8f50a4SZhiyong Yang 		}
148bd8f50a4SZhiyong Yang 		eth_dev->intr_handle->fd = dev->listenfd;
149bd8f50a4SZhiyong Yang 		rte_intr_callback_register(eth_dev->intr_handle,
150bd8f50a4SZhiyong Yang 					   virtio_interrupt_handler, eth_dev);
151bd8f50a4SZhiyong Yang 		if (rte_intr_enable(eth_dev->intr_handle) < 0) {
152bd8f50a4SZhiyong Yang 			PMD_DRV_LOG(ERR, "interrupt enable failed");
153bd8f50a4SZhiyong Yang 			return;
154bd8f50a4SZhiyong Yang 		}
155bd8f50a4SZhiyong Yang 	}
156ef53b603SJianfeng Tan }
157ef53b603SJianfeng Tan 
158ef53b603SJianfeng Tan static void
159e9efa4d9SJianfeng Tan virtio_user_read_dev_config(struct virtio_hw *hw, size_t offset,
160e9efa4d9SJianfeng Tan 		     void *dst, int length)
161e9efa4d9SJianfeng Tan {
162e9efa4d9SJianfeng Tan 	int i;
163e9efa4d9SJianfeng Tan 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
164e9efa4d9SJianfeng Tan 
165e9efa4d9SJianfeng Tan 	if (offset == offsetof(struct virtio_net_config, mac) &&
16635b2d13fSOlivier Matz 	    length == RTE_ETHER_ADDR_LEN) {
16735b2d13fSOlivier Matz 		for (i = 0; i < RTE_ETHER_ADDR_LEN; ++i)
168e9efa4d9SJianfeng Tan 			((uint8_t *)dst)[i] = dev->mac_addr[i];
169e9efa4d9SJianfeng Tan 		return;
170e9efa4d9SJianfeng Tan 	}
171e9efa4d9SJianfeng Tan 
172ef53b603SJianfeng Tan 	if (offset == offsetof(struct virtio_net_config, status)) {
173ef53b603SJianfeng Tan 		char buf[128];
174ef53b603SJianfeng Tan 
175ef53b603SJianfeng Tan 		if (dev->vhostfd >= 0) {
176ef53b603SJianfeng Tan 			int r;
177ef53b603SJianfeng Tan 			int flags;
178ef53b603SJianfeng Tan 
179ef53b603SJianfeng Tan 			flags = fcntl(dev->vhostfd, F_GETFL);
1802fd826a3SSebastian Basierski 			if (fcntl(dev->vhostfd, F_SETFL,
1812fd826a3SSebastian Basierski 					flags | O_NONBLOCK) == -1) {
1822fd826a3SSebastian Basierski 				PMD_DRV_LOG(ERR, "error setting O_NONBLOCK flag");
1832fd826a3SSebastian Basierski 				return;
1842fd826a3SSebastian Basierski 			}
185ef53b603SJianfeng Tan 			r = recv(dev->vhostfd, buf, 128, MSG_PEEK);
186ef53b603SJianfeng Tan 			if (r == 0 || (r < 0 && errno != EAGAIN)) {
187ef53b603SJianfeng Tan 				dev->status &= (~VIRTIO_NET_S_LINK_UP);
188ef53b603SJianfeng Tan 				PMD_DRV_LOG(ERR, "virtio-user port %u is down",
189ef53b603SJianfeng Tan 					    hw->port_id);
190bd8f50a4SZhiyong Yang 
191bd8f50a4SZhiyong Yang 				/* This function could be called in the process
192bd8f50a4SZhiyong Yang 				 * of interrupt handling, callback cannot be
193bd8f50a4SZhiyong Yang 				 * unregistered here, set an alarm to do it.
194ef53b603SJianfeng Tan 				 */
195ef53b603SJianfeng Tan 				rte_eal_alarm_set(1,
196ef53b603SJianfeng Tan 						  virtio_user_delayed_handler,
197ef53b603SJianfeng Tan 						  (void *)hw);
198ef53b603SJianfeng Tan 			} else {
199ef53b603SJianfeng Tan 				dev->status |= VIRTIO_NET_S_LINK_UP;
200ef53b603SJianfeng Tan 			}
201f76ef453SSebastian Basierski 			if (fcntl(dev->vhostfd, F_SETFL,
202f76ef453SSebastian Basierski 					flags & ~O_NONBLOCK) == -1) {
203f76ef453SSebastian Basierski 				PMD_DRV_LOG(ERR, "error clearing O_NONBLOCK flag");
204f76ef453SSebastian Basierski 				return;
205f76ef453SSebastian Basierski 			}
206bd8f50a4SZhiyong Yang 		} else if (dev->is_server) {
207bd8f50a4SZhiyong Yang 			dev->status &= (~VIRTIO_NET_S_LINK_UP);
208bd8f50a4SZhiyong Yang 			if (virtio_user_server_reconnect(dev) >= 0)
209bd8f50a4SZhiyong Yang 				dev->status |= VIRTIO_NET_S_LINK_UP;
210ef53b603SJianfeng Tan 		}
211bd8f50a4SZhiyong Yang 
212e9efa4d9SJianfeng Tan 		*(uint16_t *)dst = dev->status;
213ef53b603SJianfeng Tan 	}
214e9efa4d9SJianfeng Tan 
215e9efa4d9SJianfeng Tan 	if (offset == offsetof(struct virtio_net_config, max_virtqueue_pairs))
216e9efa4d9SJianfeng Tan 		*(uint16_t *)dst = dev->max_queue_pairs;
217e9efa4d9SJianfeng Tan }
218e9efa4d9SJianfeng Tan 
219e9efa4d9SJianfeng Tan static void
220e9efa4d9SJianfeng Tan virtio_user_write_dev_config(struct virtio_hw *hw, size_t offset,
221e9efa4d9SJianfeng Tan 		      const void *src, int length)
222e9efa4d9SJianfeng Tan {
223e9efa4d9SJianfeng Tan 	int i;
224e9efa4d9SJianfeng Tan 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
225e9efa4d9SJianfeng Tan 
226e9efa4d9SJianfeng Tan 	if ((offset == offsetof(struct virtio_net_config, mac)) &&
22735b2d13fSOlivier Matz 	    (length == RTE_ETHER_ADDR_LEN))
22835b2d13fSOlivier Matz 		for (i = 0; i < RTE_ETHER_ADDR_LEN; ++i)
229e9efa4d9SJianfeng Tan 			dev->mac_addr[i] = ((const uint8_t *)src)[i];
230e9efa4d9SJianfeng Tan 	else
231f2462150SFerruh Yigit 		PMD_DRV_LOG(ERR, "not supported offset=%zu, len=%d",
232e9efa4d9SJianfeng Tan 			    offset, length);
233e9efa4d9SJianfeng Tan }
234e9efa4d9SJianfeng Tan 
235e9efa4d9SJianfeng Tan static void
236c12a26eeSJianfeng Tan virtio_user_reset(struct virtio_hw *hw)
237c12a26eeSJianfeng Tan {
238c12a26eeSJianfeng Tan 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
239c12a26eeSJianfeng Tan 
240c12a26eeSJianfeng Tan 	if (dev->status & VIRTIO_CONFIG_STATUS_DRIVER_OK)
241c12a26eeSJianfeng Tan 		virtio_user_stop_device(dev);
242c12a26eeSJianfeng Tan }
243c12a26eeSJianfeng Tan 
244c12a26eeSJianfeng Tan static void
245e9efa4d9SJianfeng Tan virtio_user_set_status(struct virtio_hw *hw, uint8_t status)
246e9efa4d9SJianfeng Tan {
247e9efa4d9SJianfeng Tan 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
248e9efa4d9SJianfeng Tan 
249e9efa4d9SJianfeng Tan 	if (status & VIRTIO_CONFIG_STATUS_DRIVER_OK)
250e9efa4d9SJianfeng Tan 		virtio_user_start_device(dev);
251c12a26eeSJianfeng Tan 	else if (status == VIRTIO_CONFIG_STATUS_RESET)
252c12a26eeSJianfeng Tan 		virtio_user_reset(hw);
253e9efa4d9SJianfeng Tan 	dev->status = status;
254e9efa4d9SJianfeng Tan }
255e9efa4d9SJianfeng Tan 
256e9efa4d9SJianfeng Tan static uint8_t
257e9efa4d9SJianfeng Tan virtio_user_get_status(struct virtio_hw *hw)
258e9efa4d9SJianfeng Tan {
259e9efa4d9SJianfeng Tan 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
260e9efa4d9SJianfeng Tan 
261e9efa4d9SJianfeng Tan 	return dev->status;
262e9efa4d9SJianfeng Tan }
263e9efa4d9SJianfeng Tan 
264e9efa4d9SJianfeng Tan static uint64_t
265e9efa4d9SJianfeng Tan virtio_user_get_features(struct virtio_hw *hw)
266e9efa4d9SJianfeng Tan {
267e9efa4d9SJianfeng Tan 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
268e9efa4d9SJianfeng Tan 
269142678d4SJianfeng Tan 	/* unmask feature bits defined in vhost user protocol */
270142678d4SJianfeng Tan 	return dev->device_features & VIRTIO_PMD_SUPPORTED_GUEST_FEATURES;
271e9efa4d9SJianfeng Tan }
272e9efa4d9SJianfeng Tan 
273e9efa4d9SJianfeng Tan static void
274e9efa4d9SJianfeng Tan virtio_user_set_features(struct virtio_hw *hw, uint64_t features)
275e9efa4d9SJianfeng Tan {
276e9efa4d9SJianfeng Tan 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
277e9efa4d9SJianfeng Tan 
278142678d4SJianfeng Tan 	dev->features = features & dev->device_features;
279e9efa4d9SJianfeng Tan }
280e9efa4d9SJianfeng Tan 
281e9efa4d9SJianfeng Tan static uint8_t
282e9efa4d9SJianfeng Tan virtio_user_get_isr(struct virtio_hw *hw __rte_unused)
283e9efa4d9SJianfeng Tan {
28435c4f855SJianfeng Tan 	/* rxq interrupts and config interrupt are separated in virtio-user,
28535c4f855SJianfeng Tan 	 * here we only report config change.
286e9efa4d9SJianfeng Tan 	 */
28735c4f855SJianfeng Tan 	return VIRTIO_PCI_ISR_CONFIG;
288e9efa4d9SJianfeng Tan }
289e9efa4d9SJianfeng Tan 
290e9efa4d9SJianfeng Tan static uint16_t
291e9efa4d9SJianfeng Tan virtio_user_set_config_irq(struct virtio_hw *hw __rte_unused,
292e9efa4d9SJianfeng Tan 		    uint16_t vec __rte_unused)
293e9efa4d9SJianfeng Tan {
29435c4f855SJianfeng Tan 	return 0;
295e9efa4d9SJianfeng Tan }
296e9efa4d9SJianfeng Tan 
2973d4fb6fdSJianfeng Tan static uint16_t
2983d4fb6fdSJianfeng Tan virtio_user_set_queue_irq(struct virtio_hw *hw __rte_unused,
2993d4fb6fdSJianfeng Tan 			  struct virtqueue *vq __rte_unused,
3003d4fb6fdSJianfeng Tan 			  uint16_t vec)
3013d4fb6fdSJianfeng Tan {
3023d4fb6fdSJianfeng Tan 	/* pretend we have done that */
3033d4fb6fdSJianfeng Tan 	return vec;
3043d4fb6fdSJianfeng Tan }
3053d4fb6fdSJianfeng Tan 
306e9efa4d9SJianfeng Tan /* This function is to get the queue size, aka, number of descs, of a specified
307e9efa4d9SJianfeng Tan  * queue. Different with the VHOST_USER_GET_QUEUE_NUM, which is used to get the
308e9efa4d9SJianfeng Tan  * max supported queues.
309e9efa4d9SJianfeng Tan  */
310e9efa4d9SJianfeng Tan static uint16_t
311e9efa4d9SJianfeng Tan virtio_user_get_queue_num(struct virtio_hw *hw, uint16_t queue_id __rte_unused)
312e9efa4d9SJianfeng Tan {
313e9efa4d9SJianfeng Tan 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
314e9efa4d9SJianfeng Tan 
315e9efa4d9SJianfeng Tan 	/* Currently, each queue has same queue size */
316e9efa4d9SJianfeng Tan 	return dev->queue_size;
317e9efa4d9SJianfeng Tan }
318e9efa4d9SJianfeng Tan 
31948a44640SJens Freimann static void
32048a44640SJens Freimann virtio_user_setup_queue_packed(struct virtqueue *vq,
32148a44640SJens Freimann 			       struct virtio_user_dev *dev)
322e9efa4d9SJianfeng Tan {
32348a44640SJens Freimann 	uint16_t queue_idx = vq->vq_queue_index;
32448a44640SJens Freimann 	struct vring_packed *vring;
32548a44640SJens Freimann 	uint64_t desc_addr;
32648a44640SJens Freimann 	uint64_t avail_addr;
32748a44640SJens Freimann 	uint64_t used_addr;
32848a44640SJens Freimann 	uint16_t i;
32948a44640SJens Freimann 
33048a44640SJens Freimann 	vring  = &dev->packed_vrings[queue_idx];
33148a44640SJens Freimann 	desc_addr = (uintptr_t)vq->vq_ring_virt_mem;
33248a44640SJens Freimann 	avail_addr = desc_addr + vq->vq_nentries *
33348a44640SJens Freimann 		sizeof(struct vring_packed_desc);
33448a44640SJens Freimann 	used_addr = RTE_ALIGN_CEIL(avail_addr +
33548a44640SJens Freimann 			   sizeof(struct vring_packed_desc_event),
33648a44640SJens Freimann 			   VIRTIO_PCI_VRING_ALIGN);
33748a44640SJens Freimann 	vring->num = vq->vq_nentries;
3384cdc4d98STiwei Bie 	vring->desc = (void *)(uintptr_t)desc_addr;
3394cdc4d98STiwei Bie 	vring->driver = (void *)(uintptr_t)avail_addr;
3404cdc4d98STiwei Bie 	vring->device = (void *)(uintptr_t)used_addr;
34148a44640SJens Freimann 	dev->packed_queues[queue_idx].avail_wrap_counter = true;
34248a44640SJens Freimann 	dev->packed_queues[queue_idx].used_wrap_counter = true;
34348a44640SJens Freimann 
34445c224e7STiwei Bie 	for (i = 0; i < vring->num; i++)
3454cdc4d98STiwei Bie 		vring->desc[i].flags = 0;
34648a44640SJens Freimann }
34748a44640SJens Freimann 
34848a44640SJens Freimann static void
34948a44640SJens Freimann virtio_user_setup_queue_split(struct virtqueue *vq, struct virtio_user_dev *dev)
35048a44640SJens Freimann {
351e9efa4d9SJianfeng Tan 	uint16_t queue_idx = vq->vq_queue_index;
352e9efa4d9SJianfeng Tan 	uint64_t desc_addr, avail_addr, used_addr;
353e9efa4d9SJianfeng Tan 
354e9efa4d9SJianfeng Tan 	desc_addr = (uintptr_t)vq->vq_ring_virt_mem;
355e9efa4d9SJianfeng Tan 	avail_addr = desc_addr + vq->vq_nentries * sizeof(struct vring_desc);
356e9efa4d9SJianfeng Tan 	used_addr = RTE_ALIGN_CEIL(avail_addr + offsetof(struct vring_avail,
357e9efa4d9SJianfeng Tan 							 ring[vq->vq_nentries]),
358e9efa4d9SJianfeng Tan 				   VIRTIO_PCI_VRING_ALIGN);
359e9efa4d9SJianfeng Tan 
360e9efa4d9SJianfeng Tan 	dev->vrings[queue_idx].num = vq->vq_nentries;
361e9efa4d9SJianfeng Tan 	dev->vrings[queue_idx].desc = (void *)(uintptr_t)desc_addr;
362e9efa4d9SJianfeng Tan 	dev->vrings[queue_idx].avail = (void *)(uintptr_t)avail_addr;
363e9efa4d9SJianfeng Tan 	dev->vrings[queue_idx].used = (void *)(uintptr_t)used_addr;
36448a44640SJens Freimann }
36548a44640SJens Freimann 
/*
 * Record the ring layout of a virtqueue, using the packed or the split
 * format depending on vtpci_packed_queue(hw). Always returns 0.
 */
static int
virtio_user_setup_queue(struct virtio_hw *hw, struct virtqueue *vq)
{
	struct virtio_user_dev *dev = virtio_user_get_dev(hw);

	if (vtpci_packed_queue(hw)) {
		virtio_user_setup_queue_packed(vq, dev);
		return 0;
	}

	virtio_user_setup_queue_split(vq, dev);
	return 0;
}
378e9efa4d9SJianfeng Tan 
379e9efa4d9SJianfeng Tan static void
380e9efa4d9SJianfeng Tan virtio_user_del_queue(struct virtio_hw *hw, struct virtqueue *vq)
381e9efa4d9SJianfeng Tan {
382e9efa4d9SJianfeng Tan 	/* For legacy devices, write 0 to VIRTIO_PCI_QUEUE_PFN port, QEMU
383e9efa4d9SJianfeng Tan 	 * correspondingly stops the ioeventfds, and reset the status of
384e9efa4d9SJianfeng Tan 	 * the device.
385e9efa4d9SJianfeng Tan 	 * For modern devices, set queue desc, avail, used in PCI bar to 0,
386e9efa4d9SJianfeng Tan 	 * not see any more behavior in QEMU.
387e9efa4d9SJianfeng Tan 	 *
388e9efa4d9SJianfeng Tan 	 * Here we just care about what information to deliver to vhost-user
389e9efa4d9SJianfeng Tan 	 * or vhost-kernel. So we just close ioeventfd for now.
390e9efa4d9SJianfeng Tan 	 */
391e9efa4d9SJianfeng Tan 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
392e9efa4d9SJianfeng Tan 
393e9efa4d9SJianfeng Tan 	close(dev->callfds[vq->vq_queue_index]);
394e9efa4d9SJianfeng Tan 	close(dev->kickfds[vq->vq_queue_index]);
395e9efa4d9SJianfeng Tan }
396e9efa4d9SJianfeng Tan 
397e9efa4d9SJianfeng Tan static void
398e9efa4d9SJianfeng Tan virtio_user_notify_queue(struct virtio_hw *hw, struct virtqueue *vq)
399e9efa4d9SJianfeng Tan {
400e9efa4d9SJianfeng Tan 	uint64_t buf = 1;
401e9efa4d9SJianfeng Tan 	struct virtio_user_dev *dev = virtio_user_get_dev(hw);
402e9efa4d9SJianfeng Tan 
4031b69528eSJianfeng Tan 	if (hw->cvq && (hw->cvq->vq == vq)) {
40448a44640SJens Freimann 		if (vtpci_packed_queue(vq->hw))
40548a44640SJens Freimann 			virtio_user_handle_cq_packed(dev, vq->vq_queue_index);
40648a44640SJens Freimann 		else
4071b69528eSJianfeng Tan 			virtio_user_handle_cq(dev, vq->vq_queue_index);
4081b69528eSJianfeng Tan 		return;
4091b69528eSJianfeng Tan 	}
4101b69528eSJianfeng Tan 
411e9efa4d9SJianfeng Tan 	if (write(dev->kickfds[vq->vq_queue_index], &buf, sizeof(buf)) < 0)
412f2462150SFerruh Yigit 		PMD_DRV_LOG(ERR, "failed to kick backend: %s",
413e9efa4d9SJianfeng Tan 			    strerror(errno));
414e9efa4d9SJianfeng Tan }
415e9efa4d9SJianfeng Tan 
4166d890f8aSYuanhan Liu const struct virtio_pci_ops virtio_user_ops = {
417e9efa4d9SJianfeng Tan 	.read_dev_cfg	= virtio_user_read_dev_config,
418e9efa4d9SJianfeng Tan 	.write_dev_cfg	= virtio_user_write_dev_config,
419e9efa4d9SJianfeng Tan 	.get_status	= virtio_user_get_status,
420e9efa4d9SJianfeng Tan 	.set_status	= virtio_user_set_status,
421e9efa4d9SJianfeng Tan 	.get_features	= virtio_user_get_features,
422e9efa4d9SJianfeng Tan 	.set_features	= virtio_user_set_features,
423e9efa4d9SJianfeng Tan 	.get_isr	= virtio_user_get_isr,
424e9efa4d9SJianfeng Tan 	.set_config_irq	= virtio_user_set_config_irq,
4253d4fb6fdSJianfeng Tan 	.set_queue_irq	= virtio_user_set_queue_irq,
426e9efa4d9SJianfeng Tan 	.get_queue_num	= virtio_user_get_queue_num,
427e9efa4d9SJianfeng Tan 	.setup_queue	= virtio_user_setup_queue,
428e9efa4d9SJianfeng Tan 	.del_queue	= virtio_user_del_queue,
429e9efa4d9SJianfeng Tan 	.notify_queue	= virtio_user_notify_queue,
430e9efa4d9SJianfeng Tan };
431ce2eabddSJianfeng Tan 
/* Keys of the devargs accepted by the virtio_user vdev. */
#define VIRTIO_USER_ARG_QUEUES_NUM     "queues"
#define VIRTIO_USER_ARG_CQ_NUM         "cq"
#define VIRTIO_USER_ARG_MAC            "mac"
#define VIRTIO_USER_ARG_PATH           "path"
#define VIRTIO_USER_ARG_QUEUE_SIZE     "queue_size"
#define VIRTIO_USER_ARG_INTERFACE_NAME "iface"
#define VIRTIO_USER_ARG_SERVER_MODE    "server"
#define VIRTIO_USER_ARG_MRG_RXBUF      "mrg_rxbuf"
#define VIRTIO_USER_ARG_IN_ORDER       "in_order"
#define VIRTIO_USER_ARG_PACKED_VQ      "packed_vq"

/* NULL-terminated key list passed to rte_kvargs_parse(). */
static const char *valid_args[] = {
	VIRTIO_USER_ARG_QUEUES_NUM,
	VIRTIO_USER_ARG_CQ_NUM,
	VIRTIO_USER_ARG_MAC,
	VIRTIO_USER_ARG_PATH,
	VIRTIO_USER_ARG_QUEUE_SIZE,
	VIRTIO_USER_ARG_INTERFACE_NAME,
	VIRTIO_USER_ARG_SERVER_MODE,
	VIRTIO_USER_ARG_MRG_RXBUF,
	VIRTIO_USER_ARG_IN_ORDER,
	VIRTIO_USER_ARG_PACKED_VQ,
	NULL
};

/* Values used when the corresponding devarg is not given. */
#define VIRTIO_USER_DEF_CQ_EN	0
#define VIRTIO_USER_DEF_Q_NUM	1
#define VIRTIO_USER_DEF_Q_SZ	256
#define VIRTIO_USER_DEF_SERVER_MODE	0
460ce2eabddSJianfeng Tan 
/*
 * kvargs handler that duplicates a string value.
 *
 * extra_args must point to a char * that receives the strdup()'ed copy of
 * value; the copy is owned by the caller.
 *
 * Returns 0 on success, -EINVAL when value or extra_args is NULL, and
 * -ENOMEM when the copy cannot be allocated (the destination is then NULL).
 */
static int
get_string_arg(const char *key __rte_unused,
	       const char *value, void *extra_args)
{
	char **out = extra_args;
	char *copy;

	if (value == NULL || out == NULL)
		return -EINVAL;

	copy = strdup(value);
	*out = copy;

	return copy != NULL ? 0 : -ENOMEM;
}
475ce2eabddSJianfeng Tan 
/*
 * kvargs handler that parses an unsigned integer value.
 *
 * value is parsed with strtoull() in base 0, so decimal, 0x-prefixed
 * hexadecimal and 0-prefixed octal are accepted. extra_args must point to
 * a uint64_t; it is overwritten only when parsing succeeds, so a
 * caller-provided default survives a malformed argument.
 *
 * Returns 0 on success, -EINVAL when an argument is NULL or value is not
 * entirely a number, and the negated errno reported by strtoull() (for
 * example -ERANGE on overflow) otherwise.
 */
static int
get_integer_arg(const char *key __rte_unused,
		const char *value, void *extra_args)
{
	unsigned long long parsed;
	char *end = NULL;

	if (!value || !extra_args)
		return -EINVAL;

	/* strtoull() reports failures only through errno and the end pointer. */
	errno = 0;
	parsed = strtoull(value, &end, 0);
	if (errno != 0)
		return -errno;

	/* Reject empty input and trailing garbage such as "12x". */
	if (end == value || *end != '\0')
		return -EINVAL;

	*(uint64_t *)extra_args = parsed;

	return 0;
}
487ce2eabddSJianfeng Tan 
488ce2eabddSJianfeng Tan static struct rte_eth_dev *
489050fe6e9SJan Blunck virtio_user_eth_dev_alloc(struct rte_vdev_device *vdev)
490ce2eabddSJianfeng Tan {
491ce2eabddSJianfeng Tan 	struct rte_eth_dev *eth_dev;
492ce2eabddSJianfeng Tan 	struct rte_eth_dev_data *data;
493ce2eabddSJianfeng Tan 	struct virtio_hw *hw;
494ce2eabddSJianfeng Tan 	struct virtio_user_dev *dev;
495ce2eabddSJianfeng Tan 
496050fe6e9SJan Blunck 	eth_dev = rte_eth_vdev_allocate(vdev, sizeof(*hw));
497ce2eabddSJianfeng Tan 	if (!eth_dev) {
498ce2eabddSJianfeng Tan 		PMD_INIT_LOG(ERR, "cannot alloc rte_eth_dev");
499ce2eabddSJianfeng Tan 		return NULL;
500ce2eabddSJianfeng Tan 	}
501ce2eabddSJianfeng Tan 
502ce2eabddSJianfeng Tan 	data = eth_dev->data;
503050fe6e9SJan Blunck 	hw = eth_dev->data->dev_private;
504ce2eabddSJianfeng Tan 
505ce2eabddSJianfeng Tan 	dev = rte_zmalloc(NULL, sizeof(*dev), 0);
506ce2eabddSJianfeng Tan 	if (!dev) {
507ce2eabddSJianfeng Tan 		PMD_INIT_LOG(ERR, "malloc virtio_user_dev failed");
508ce2eabddSJianfeng Tan 		rte_eth_dev_release_port(eth_dev);
509ce2eabddSJianfeng Tan 		return NULL;
510ce2eabddSJianfeng Tan 	}
511ce2eabddSJianfeng Tan 
512553f4593SYuanhan Liu 	hw->port_id = data->port_id;
5133d4fb6fdSJianfeng Tan 	dev->port_id = data->port_id;
514553f4593SYuanhan Liu 	virtio_hw_internal[hw->port_id].vtpci_ops = &virtio_user_ops;
515ef53b603SJianfeng Tan 	/*
516ef53b603SJianfeng Tan 	 * MSIX is required to enable LSC (see virtio_init_device).
517ef53b603SJianfeng Tan 	 * Here just pretend that we support msix.
518ef53b603SJianfeng Tan 	 */
519ef53b603SJianfeng Tan 	hw->use_msix = 1;
520ce2eabddSJianfeng Tan 	hw->modern   = 0;
52109649363SOlivier Matz 	hw->use_simple_rx = 0;
5229f233f54SMarvin Liu 	hw->use_inorder_rx = 0;
5239f233f54SMarvin Liu 	hw->use_inorder_tx = 0;
524ce2eabddSJianfeng Tan 	hw->virtio_user_dev = dev;
525ce2eabddSJianfeng Tan 	return eth_dev;
526ce2eabddSJianfeng Tan }
527ce2eabddSJianfeng Tan 
528ca8326a9SJianfeng Tan static void
529ca8326a9SJianfeng Tan virtio_user_eth_dev_free(struct rte_eth_dev *eth_dev)
530ca8326a9SJianfeng Tan {
531ca8326a9SJianfeng Tan 	struct rte_eth_dev_data *data = eth_dev->data;
532ca8326a9SJianfeng Tan 	struct virtio_hw *hw = data->dev_private;
533ca8326a9SJianfeng Tan 
534ca8326a9SJianfeng Tan 	rte_free(hw->virtio_user_dev);
535ca8326a9SJianfeng Tan 	rte_eth_dev_release_port(eth_dev);
536ca8326a9SJianfeng Tan }
537ca8326a9SJianfeng Tan 
538ce2eabddSJianfeng Tan /* Dev initialization routine. Invoked once for each virtio vdev at
539c3b2fdfeSYong Wang  * EAL init time, see rte_bus_probe().
540ce2eabddSJianfeng Tan  * Returns 0 on success.
541ce2eabddSJianfeng Tan  */
542ce2eabddSJianfeng Tan static int
5435d2aa461SJan Blunck virtio_user_pmd_probe(struct rte_vdev_device *dev)
544ce2eabddSJianfeng Tan {
54514f06474SJianfeng Tan 	struct rte_kvargs *kvlist = NULL;
546ce2eabddSJianfeng Tan 	struct rte_eth_dev *eth_dev;
547ce2eabddSJianfeng Tan 	struct virtio_hw *hw;
548ce2eabddSJianfeng Tan 	uint64_t queues = VIRTIO_USER_DEF_Q_NUM;
549ce2eabddSJianfeng Tan 	uint64_t cq = VIRTIO_USER_DEF_CQ_EN;
550ce2eabddSJianfeng Tan 	uint64_t queue_size = VIRTIO_USER_DEF_Q_SZ;
551bd8f50a4SZhiyong Yang 	uint64_t server_mode = VIRTIO_USER_DEF_SERVER_MODE;
552488ed97aSMarvin Liu 	uint64_t mrg_rxbuf = 1;
553488ed97aSMarvin Liu 	uint64_t in_order = 1;
5549070f88bSTiwei Bie 	uint64_t packed_vq = 0;
555ce2eabddSJianfeng Tan 	char *path = NULL;
5564214a1b4SWenfeng Liu 	char *ifname = NULL;
557ce2eabddSJianfeng Tan 	char *mac_addr = NULL;
558ce2eabddSJianfeng Tan 	int ret = -1;
559ce2eabddSJianfeng Tan 
5601c8489daSTiwei Bie 	if (rte_eal_process_type() == RTE_PROC_SECONDARY) {
5611c8489daSTiwei Bie 		const char *name = rte_vdev_device_name(dev);
5621c8489daSTiwei Bie 		eth_dev = rte_eth_dev_attach_secondary(name);
5631c8489daSTiwei Bie 		if (!eth_dev) {
564*88fa5bb6SStephen Hemminger 			PMD_INIT_LOG(ERR, "Failed to probe %s", name);
5651c8489daSTiwei Bie 			return -1;
5661c8489daSTiwei Bie 		}
5671c8489daSTiwei Bie 
5681c8489daSTiwei Bie 		if (eth_virtio_dev_init(eth_dev) < 0) {
5691c8489daSTiwei Bie 			PMD_INIT_LOG(ERR, "eth_virtio_dev_init fails");
5701c8489daSTiwei Bie 			rte_eth_dev_release_port(eth_dev);
5711c8489daSTiwei Bie 			return -1;
5721c8489daSTiwei Bie 		}
5731c8489daSTiwei Bie 
5741c8489daSTiwei Bie 		eth_dev->dev_ops = &virtio_user_secondary_eth_dev_ops;
5751c8489daSTiwei Bie 		eth_dev->device = &dev->device;
5761c8489daSTiwei Bie 		rte_eth_dev_probing_finish(eth_dev);
5771c8489daSTiwei Bie 		return 0;
5781c8489daSTiwei Bie 	}
5791c8489daSTiwei Bie 
5805d2aa461SJan Blunck 	kvlist = rte_kvargs_parse(rte_vdev_device_args(dev), valid_args);
581ce2eabddSJianfeng Tan 	if (!kvlist) {
582ce2eabddSJianfeng Tan 		PMD_INIT_LOG(ERR, "error when parsing param");
583ce2eabddSJianfeng Tan 		goto end;
584ce2eabddSJianfeng Tan 	}
585ce2eabddSJianfeng Tan 
5869cca159eSMaxime Coquelin 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_PATH) == 1) {
587ca8326a9SJianfeng Tan 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_PATH,
588ca8326a9SJianfeng Tan 				       &get_string_arg, &path) < 0) {
589404bd6bfSJianfeng Tan 			PMD_INIT_LOG(ERR, "error to parse %s",
590404bd6bfSJianfeng Tan 				     VIRTIO_USER_ARG_PATH);
591404bd6bfSJianfeng Tan 			goto end;
592404bd6bfSJianfeng Tan 		}
5939cca159eSMaxime Coquelin 	} else {
594f2462150SFerruh Yigit 		PMD_INIT_LOG(ERR, "arg %s is mandatory for virtio_user",
5952dac0df4STiwei Bie 			     VIRTIO_USER_ARG_PATH);
596ce2eabddSJianfeng Tan 		goto end;
597ce2eabddSJianfeng Tan 	}
598ce2eabddSJianfeng Tan 
5994214a1b4SWenfeng Liu 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_INTERFACE_NAME) == 1) {
6004214a1b4SWenfeng Liu 		if (is_vhost_user_by_type(path)) {
6014214a1b4SWenfeng Liu 			PMD_INIT_LOG(ERR,
6024214a1b4SWenfeng Liu 				"arg %s applies only to vhost-kernel backend",
6034214a1b4SWenfeng Liu 				VIRTIO_USER_ARG_INTERFACE_NAME);
6044214a1b4SWenfeng Liu 			goto end;
6054214a1b4SWenfeng Liu 		}
6064214a1b4SWenfeng Liu 
6074214a1b4SWenfeng Liu 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_INTERFACE_NAME,
6084214a1b4SWenfeng Liu 				       &get_string_arg, &ifname) < 0) {
6094214a1b4SWenfeng Liu 			PMD_INIT_LOG(ERR, "error to parse %s",
6104214a1b4SWenfeng Liu 				     VIRTIO_USER_ARG_INTERFACE_NAME);
6114214a1b4SWenfeng Liu 			goto end;
6124214a1b4SWenfeng Liu 		}
6134214a1b4SWenfeng Liu 	}
6144214a1b4SWenfeng Liu 
615404bd6bfSJianfeng Tan 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_MAC) == 1) {
616ca8326a9SJianfeng Tan 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_MAC,
617ca8326a9SJianfeng Tan 				       &get_string_arg, &mac_addr) < 0) {
618404bd6bfSJianfeng Tan 			PMD_INIT_LOG(ERR, "error to parse %s",
619404bd6bfSJianfeng Tan 				     VIRTIO_USER_ARG_MAC);
620404bd6bfSJianfeng Tan 			goto end;
621404bd6bfSJianfeng Tan 		}
622404bd6bfSJianfeng Tan 	}
623ce2eabddSJianfeng Tan 
624404bd6bfSJianfeng Tan 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_QUEUE_SIZE) == 1) {
625ca8326a9SJianfeng Tan 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_QUEUE_SIZE,
626ca8326a9SJianfeng Tan 				       &get_integer_arg, &queue_size) < 0) {
627404bd6bfSJianfeng Tan 			PMD_INIT_LOG(ERR, "error to parse %s",
628404bd6bfSJianfeng Tan 				     VIRTIO_USER_ARG_QUEUE_SIZE);
629404bd6bfSJianfeng Tan 			goto end;
630404bd6bfSJianfeng Tan 		}
631404bd6bfSJianfeng Tan 	}
632ce2eabddSJianfeng Tan 
633404bd6bfSJianfeng Tan 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_QUEUES_NUM) == 1) {
634ca8326a9SJianfeng Tan 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_QUEUES_NUM,
635ca8326a9SJianfeng Tan 				       &get_integer_arg, &queues) < 0) {
636404bd6bfSJianfeng Tan 			PMD_INIT_LOG(ERR, "error to parse %s",
637404bd6bfSJianfeng Tan 				     VIRTIO_USER_ARG_QUEUES_NUM);
638404bd6bfSJianfeng Tan 			goto end;
639404bd6bfSJianfeng Tan 		}
640404bd6bfSJianfeng Tan 	}
641ce2eabddSJianfeng Tan 
642bd8f50a4SZhiyong Yang 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_SERVER_MODE) == 1) {
643bd8f50a4SZhiyong Yang 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_SERVER_MODE,
644bd8f50a4SZhiyong Yang 				       &get_integer_arg, &server_mode) < 0) {
645bd8f50a4SZhiyong Yang 			PMD_INIT_LOG(ERR, "error to parse %s",
646bd8f50a4SZhiyong Yang 				     VIRTIO_USER_ARG_SERVER_MODE);
647bd8f50a4SZhiyong Yang 			goto end;
648bd8f50a4SZhiyong Yang 		}
649bd8f50a4SZhiyong Yang 	}
650bd8f50a4SZhiyong Yang 
651404bd6bfSJianfeng Tan 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_CQ_NUM) == 1) {
652ca8326a9SJianfeng Tan 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_CQ_NUM,
653ca8326a9SJianfeng Tan 				       &get_integer_arg, &cq) < 0) {
654404bd6bfSJianfeng Tan 			PMD_INIT_LOG(ERR, "error to parse %s",
655404bd6bfSJianfeng Tan 				     VIRTIO_USER_ARG_CQ_NUM);
656404bd6bfSJianfeng Tan 			goto end;
657404bd6bfSJianfeng Tan 		}
658404bd6bfSJianfeng Tan 	} else if (queues > 1) {
6591b69528eSJianfeng Tan 		cq = 1;
660404bd6bfSJianfeng Tan 	}
6611b69528eSJianfeng Tan 
66234f3966cSYuanhan Liu 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_PACKED_VQ) == 1) {
66334f3966cSYuanhan Liu 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_PACKED_VQ,
66434f3966cSYuanhan Liu 				       &get_integer_arg, &packed_vq) < 0) {
66534f3966cSYuanhan Liu 			PMD_INIT_LOG(ERR, "error to parse %s",
66634f3966cSYuanhan Liu 				     VIRTIO_USER_ARG_PACKED_VQ);
66734f3966cSYuanhan Liu 			goto end;
66834f3966cSYuanhan Liu 		}
66934f3966cSYuanhan Liu 	}
67034f3966cSYuanhan Liu 
6711b69528eSJianfeng Tan 	if (queues > 1 && cq == 0) {
6721b69528eSJianfeng Tan 		PMD_INIT_LOG(ERR, "multi-q requires ctrl-q");
6731b69528eSJianfeng Tan 		goto end;
6741b69528eSJianfeng Tan 	}
675ce2eabddSJianfeng Tan 
6762269b9aeSWenfeng Liu 	if (queues > VIRTIO_MAX_VIRTQUEUE_PAIRS) {
6772269b9aeSWenfeng Liu 		PMD_INIT_LOG(ERR, "arg %s %" PRIu64 " exceeds the limit %u",
6782269b9aeSWenfeng Liu 			VIRTIO_USER_ARG_QUEUES_NUM, queues,
6792269b9aeSWenfeng Liu 			VIRTIO_MAX_VIRTQUEUE_PAIRS);
6802269b9aeSWenfeng Liu 		goto end;
6812269b9aeSWenfeng Liu 	}
6822269b9aeSWenfeng Liu 
683488ed97aSMarvin Liu 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_MRG_RXBUF) == 1) {
684488ed97aSMarvin Liu 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_MRG_RXBUF,
685488ed97aSMarvin Liu 				       &get_integer_arg, &mrg_rxbuf) < 0) {
686488ed97aSMarvin Liu 			PMD_INIT_LOG(ERR, "error to parse %s",
687488ed97aSMarvin Liu 				     VIRTIO_USER_ARG_MRG_RXBUF);
688488ed97aSMarvin Liu 			goto end;
689488ed97aSMarvin Liu 		}
690488ed97aSMarvin Liu 	}
691488ed97aSMarvin Liu 
692488ed97aSMarvin Liu 	if (rte_kvargs_count(kvlist, VIRTIO_USER_ARG_IN_ORDER) == 1) {
693488ed97aSMarvin Liu 		if (rte_kvargs_process(kvlist, VIRTIO_USER_ARG_IN_ORDER,
694488ed97aSMarvin Liu 				       &get_integer_arg, &in_order) < 0) {
695488ed97aSMarvin Liu 			PMD_INIT_LOG(ERR, "error to parse %s",
696488ed97aSMarvin Liu 				     VIRTIO_USER_ARG_IN_ORDER);
697488ed97aSMarvin Liu 			goto end;
698488ed97aSMarvin Liu 		}
699488ed97aSMarvin Liu 	}
700488ed97aSMarvin Liu 
701050fe6e9SJan Blunck 	eth_dev = virtio_user_eth_dev_alloc(dev);
702ce2eabddSJianfeng Tan 	if (!eth_dev) {
703e8df94b8SJianfeng Tan 		PMD_INIT_LOG(ERR, "virtio_user fails to alloc device");
704ce2eabddSJianfeng Tan 		goto end;
705ce2eabddSJianfeng Tan 	}
706ce2eabddSJianfeng Tan 
707ce2eabddSJianfeng Tan 	hw = eth_dev->data->dev_private;
708ce2eabddSJianfeng Tan 	if (virtio_user_dev_init(hw->virtio_user_dev, path, queues, cq,
7091c8489daSTiwei Bie 			 queue_size, mac_addr, &ifname, server_mode,
7101c8489daSTiwei Bie 			 mrg_rxbuf, in_order, packed_vq) < 0) {
711ca8326a9SJianfeng Tan 		PMD_INIT_LOG(ERR, "virtio_user_dev_init fails");
712ca8326a9SJianfeng Tan 		virtio_user_eth_dev_free(eth_dev);
713ce2eabddSJianfeng Tan 		goto end;
714ca8326a9SJianfeng Tan 	}
715fbe90cddSThomas Monjalon 
7163dcfe039SThomas Monjalon 	/* previously called by rte_pci_probe() for physical dev */
717ce2eabddSJianfeng Tan 	if (eth_virtio_dev_init(eth_dev) < 0) {
718ce2eabddSJianfeng Tan 		PMD_INIT_LOG(ERR, "eth_virtio_dev_init fails");
719ca8326a9SJianfeng Tan 		virtio_user_eth_dev_free(eth_dev);
720ce2eabddSJianfeng Tan 		goto end;
721ce2eabddSJianfeng Tan 	}
722fbe90cddSThomas Monjalon 
723fbe90cddSThomas Monjalon 	rte_eth_dev_probing_finish(eth_dev);
724ce2eabddSJianfeng Tan 	ret = 0;
725ce2eabddSJianfeng Tan 
726ce2eabddSJianfeng Tan end:
72714f06474SJianfeng Tan 	if (kvlist)
72814f06474SJianfeng Tan 		rte_kvargs_free(kvlist);
729ce2eabddSJianfeng Tan 	if (path)
730ce2eabddSJianfeng Tan 		free(path);
731ce2eabddSJianfeng Tan 	if (mac_addr)
732ce2eabddSJianfeng Tan 		free(mac_addr);
7334214a1b4SWenfeng Liu 	if (ifname)
7344214a1b4SWenfeng Liu 		free(ifname);
735ce2eabddSJianfeng Tan 	return ret;
736ce2eabddSJianfeng Tan }
737ce2eabddSJianfeng Tan 
738ce2eabddSJianfeng Tan static int
7395d2aa461SJan Blunck virtio_user_pmd_remove(struct rte_vdev_device *vdev)
740ce2eabddSJianfeng Tan {
7415d2aa461SJan Blunck 	const char *name;
742ce2eabddSJianfeng Tan 	struct rte_eth_dev *eth_dev;
743ce2eabddSJianfeng Tan 
7445d2aa461SJan Blunck 	if (!vdev)
745ce2eabddSJianfeng Tan 		return -EINVAL;
746ce2eabddSJianfeng Tan 
7475d2aa461SJan Blunck 	name = rte_vdev_device_name(vdev);
748f2462150SFerruh Yigit 	PMD_DRV_LOG(INFO, "Un-Initializing %s", name);
749ce2eabddSJianfeng Tan 	eth_dev = rte_eth_dev_allocated(name);
7507f468b2eSTiwei Bie 	/* Port has already been released by close. */
751ce2eabddSJianfeng Tan 	if (!eth_dev)
7527f468b2eSTiwei Bie 		return 0;
753ce2eabddSJianfeng Tan 
7541c8489daSTiwei Bie 	if (rte_eal_process_type() != RTE_PROC_PRIMARY)
7551c8489daSTiwei Bie 		return rte_eth_dev_release_port(eth_dev);
7561c8489daSTiwei Bie 
757ce2eabddSJianfeng Tan 	/* make sure the device is stopped, queues freed */
758ce2eabddSJianfeng Tan 	rte_eth_dev_close(eth_dev->data->port_id);
759ce2eabddSJianfeng Tan 
760ce2eabddSJianfeng Tan 	return 0;
761ce2eabddSJianfeng Tan }
762ce2eabddSJianfeng Tan 
763fe363dd4SJan Viktorin static struct rte_vdev_driver virtio_user_driver = {
76450a3345fSShreyansh Jain 	.probe = virtio_user_pmd_probe,
76550a3345fSShreyansh Jain 	.remove = virtio_user_pmd_remove,
766ce2eabddSJianfeng Tan };
767ce2eabddSJianfeng Tan 
76801f19227SShreyansh Jain RTE_PMD_REGISTER_VDEV(net_virtio_user, virtio_user_driver);
7699fa80cb2SJan Blunck RTE_PMD_REGISTER_ALIAS(net_virtio_user, virtio_user);
77001f19227SShreyansh Jain RTE_PMD_REGISTER_PARAM_STRING(net_virtio_user,
77144e32a67SPablo de Lara 	"path=<path> "
77244e32a67SPablo de Lara 	"mac=<mac addr> "
77344e32a67SPablo de Lara 	"cq=<int> "
77444e32a67SPablo de Lara 	"queue_size=<int> "
7754214a1b4SWenfeng Liu 	"queues=<int> "
776488ed97aSMarvin Liu 	"iface=<string> "
77762758c76STiwei Bie 	"server=<0|1> "
778488ed97aSMarvin Liu 	"mrg_rxbuf=<0|1> "
7799070f88bSTiwei Bie 	"in_order=<0|1> "
7809070f88bSTiwei Bie 	"packed_vq=<0|1>");
781