xref: /dpdk/drivers/net/virtio/virtio_user/vhost_kernel_tap.c (revision 1db4d2330bc849a19b9f18479ae7a5a75bc01df2)
15566a3e3SBruce Richardson /* SPDX-License-Identifier: BSD-3-Clause
25566a3e3SBruce Richardson  * Copyright(c) 2016 Intel Corporation
3e3b43481SJianfeng Tan  */
4e3b43481SJianfeng Tan 
5e3b43481SJianfeng Tan #include <unistd.h>
6e3b43481SJianfeng Tan #include <sys/types.h>
7e3b43481SJianfeng Tan #include <sys/stat.h>
8e3b43481SJianfeng Tan #include <fcntl.h>
9e3b43481SJianfeng Tan #include <net/if.h>
10791b43e0SNing Li #include <net/if_arp.h>
11e3b43481SJianfeng Tan #include <errno.h>
12e3b43481SJianfeng Tan #include <string.h>
13e3b43481SJianfeng Tan #include <limits.h>
14e3b43481SJianfeng Tan 
15791b43e0SNing Li #include <rte_ether.h>
16791b43e0SNing Li 
17e3b43481SJianfeng Tan #include "vhost_kernel_tap.h"
18e3b43481SJianfeng Tan #include "../virtio_logs.h"
19*1db4d233SEric Zhang #include "../virtio_pci.h"
20*1db4d233SEric Zhang 
21*1db4d233SEric Zhang static int
22*1db4d233SEric Zhang vhost_kernel_tap_set_offload(int fd, uint64_t features)
23*1db4d233SEric Zhang {
24*1db4d233SEric Zhang 	unsigned int offload = 0;
25*1db4d233SEric Zhang 
26*1db4d233SEric Zhang 	if (features & (1ULL << VIRTIO_NET_F_GUEST_CSUM)) {
27*1db4d233SEric Zhang 		offload |= TUN_F_CSUM;
28*1db4d233SEric Zhang 		if (features & (1ULL << VIRTIO_NET_F_GUEST_TSO4))
29*1db4d233SEric Zhang 			offload |= TUN_F_TSO4;
30*1db4d233SEric Zhang 		if (features & (1ULL << VIRTIO_NET_F_GUEST_TSO6))
31*1db4d233SEric Zhang 			offload |= TUN_F_TSO6;
32*1db4d233SEric Zhang 		if (features & ((1ULL << VIRTIO_NET_F_GUEST_TSO4) |
33*1db4d233SEric Zhang 			(1ULL << VIRTIO_NET_F_GUEST_TSO6)) &&
34*1db4d233SEric Zhang 			(features & (1ULL << VIRTIO_NET_F_GUEST_ECN)))
35*1db4d233SEric Zhang 			offload |= TUN_F_TSO_ECN;
36*1db4d233SEric Zhang 		if (features & (1ULL << VIRTIO_NET_F_GUEST_UFO))
37*1db4d233SEric Zhang 			offload |= TUN_F_UFO;
38*1db4d233SEric Zhang 	}
39*1db4d233SEric Zhang 
40*1db4d233SEric Zhang 	if (offload != 0) {
41*1db4d233SEric Zhang 		/* Check if our kernel supports TUNSETOFFLOAD */
42*1db4d233SEric Zhang 		if (ioctl(fd, TUNSETOFFLOAD, 0) != 0 && errno == EINVAL) {
43*1db4d233SEric Zhang 			PMD_DRV_LOG(ERR, "Kernel does't support TUNSETOFFLOAD\n");
44*1db4d233SEric Zhang 			return -ENOTSUP;
45*1db4d233SEric Zhang 		}
46*1db4d233SEric Zhang 
47*1db4d233SEric Zhang 		if (ioctl(fd, TUNSETOFFLOAD, offload) != 0) {
48*1db4d233SEric Zhang 			offload &= ~TUN_F_UFO;
49*1db4d233SEric Zhang 			if (ioctl(fd, TUNSETOFFLOAD, offload) != 0) {
50*1db4d233SEric Zhang 				PMD_DRV_LOG(ERR, "TUNSETOFFLOAD ioctl() failed: %s\n",
51*1db4d233SEric Zhang 					strerror(errno));
52*1db4d233SEric Zhang 				return -1;
53*1db4d233SEric Zhang 			}
54*1db4d233SEric Zhang 		}
55*1db4d233SEric Zhang 	}
56*1db4d233SEric Zhang 
57*1db4d233SEric Zhang 	return 0;
58*1db4d233SEric Zhang }
59e3b43481SJianfeng Tan 
60e3b43481SJianfeng Tan int
61791b43e0SNing Li vhost_kernel_open_tap(char **p_ifname, int hdr_size, int req_mq,
62*1db4d233SEric Zhang 			 const char *mac, uint64_t features)
63e3b43481SJianfeng Tan {
64e3b43481SJianfeng Tan 	unsigned int tap_features;
65e3b43481SJianfeng Tan 	int sndbuf = INT_MAX;
66e3b43481SJianfeng Tan 	struct ifreq ifr;
67e3b43481SJianfeng Tan 	int tapfd;
68e3b43481SJianfeng Tan 
69e3b43481SJianfeng Tan 	/* TODO:
70e3b43481SJianfeng Tan 	 * 1. verify we can get/set vnet_hdr_len, tap_probe_vnet_hdr_len
71e3b43481SJianfeng Tan 	 * 2. get number of memory regions from vhost module parameter
72e3b43481SJianfeng Tan 	 * max_mem_regions, supported in newer version linux kernel
73e3b43481SJianfeng Tan 	 */
74e3b43481SJianfeng Tan 	tapfd = open(PATH_NET_TUN, O_RDWR);
75e3b43481SJianfeng Tan 	if (tapfd < 0) {
76e3b43481SJianfeng Tan 		PMD_DRV_LOG(ERR, "fail to open %s: %s",
77e3b43481SJianfeng Tan 			    PATH_NET_TUN, strerror(errno));
78e3b43481SJianfeng Tan 		return -1;
79e3b43481SJianfeng Tan 	}
80e3b43481SJianfeng Tan 
81e3b43481SJianfeng Tan 	/* Construct ifr */
82e3b43481SJianfeng Tan 	memset(&ifr, 0, sizeof(ifr));
83e3b43481SJianfeng Tan 	ifr.ifr_flags = IFF_TAP | IFF_NO_PI;
84e3b43481SJianfeng Tan 
85e3b43481SJianfeng Tan 	if (ioctl(tapfd, TUNGETFEATURES, &tap_features) == -1) {
86e3b43481SJianfeng Tan 		PMD_DRV_LOG(ERR, "TUNGETFEATURES failed: %s", strerror(errno));
87e3b43481SJianfeng Tan 		goto error;
88e3b43481SJianfeng Tan 	}
89e3b43481SJianfeng Tan 	if (tap_features & IFF_ONE_QUEUE)
90e3b43481SJianfeng Tan 		ifr.ifr_flags |= IFF_ONE_QUEUE;
91e3b43481SJianfeng Tan 
92e3b43481SJianfeng Tan 	/* Let tap instead of vhost-net handle vnet header, as the latter does
93e3b43481SJianfeng Tan 	 * not support offloading. And in this case, we should not set feature
94e3b43481SJianfeng Tan 	 * bit VHOST_NET_F_VIRTIO_NET_HDR.
95e3b43481SJianfeng Tan 	 */
96e3b43481SJianfeng Tan 	if (tap_features & IFF_VNET_HDR) {
97e3b43481SJianfeng Tan 		ifr.ifr_flags |= IFF_VNET_HDR;
98e3b43481SJianfeng Tan 	} else {
99e3b43481SJianfeng Tan 		PMD_DRV_LOG(ERR, "TAP does not support IFF_VNET_HDR");
100e3b43481SJianfeng Tan 		goto error;
101e3b43481SJianfeng Tan 	}
102e3b43481SJianfeng Tan 
103be7a4707SJianfeng Tan 	if (req_mq)
104be7a4707SJianfeng Tan 		ifr.ifr_flags |= IFF_MULTI_QUEUE;
105be7a4707SJianfeng Tan 
106e3b43481SJianfeng Tan 	if (*p_ifname)
107907d125eSSebastian Basierski 		strncpy(ifr.ifr_name, *p_ifname, IFNAMSIZ - 1);
108e3b43481SJianfeng Tan 	else
109907d125eSSebastian Basierski 		strncpy(ifr.ifr_name, "tap%d", IFNAMSIZ - 1);
110e3b43481SJianfeng Tan 	if (ioctl(tapfd, TUNSETIFF, (void *)&ifr) == -1) {
111e3b43481SJianfeng Tan 		PMD_DRV_LOG(ERR, "TUNSETIFF failed: %s", strerror(errno));
112e3b43481SJianfeng Tan 		goto error;
113e3b43481SJianfeng Tan 	}
114e3b43481SJianfeng Tan 
115e3b43481SJianfeng Tan 	fcntl(tapfd, F_SETFL, O_NONBLOCK);
116e3b43481SJianfeng Tan 
117e3b43481SJianfeng Tan 	if (ioctl(tapfd, TUNSETVNETHDRSZ, &hdr_size) < 0) {
118e3b43481SJianfeng Tan 		PMD_DRV_LOG(ERR, "TUNSETVNETHDRSZ failed: %s", strerror(errno));
119e3b43481SJianfeng Tan 		goto error;
120e3b43481SJianfeng Tan 	}
121e3b43481SJianfeng Tan 
122e3b43481SJianfeng Tan 	if (ioctl(tapfd, TUNSETSNDBUF, &sndbuf) < 0) {
123e3b43481SJianfeng Tan 		PMD_DRV_LOG(ERR, "TUNSETSNDBUF failed: %s", strerror(errno));
124e3b43481SJianfeng Tan 		goto error;
125e3b43481SJianfeng Tan 	}
126e3b43481SJianfeng Tan 
127*1db4d233SEric Zhang 	vhost_kernel_tap_set_offload(tapfd, features);
1285e97e420SJianfeng Tan 
129791b43e0SNing Li 	memset(&ifr, 0, sizeof(ifr));
130791b43e0SNing Li 	ifr.ifr_hwaddr.sa_family = ARPHRD_ETHER;
131791b43e0SNing Li 	memcpy(ifr.ifr_hwaddr.sa_data, mac, ETHER_ADDR_LEN);
132791b43e0SNing Li 	if (ioctl(tapfd, SIOCSIFHWADDR, (void *)&ifr) == -1) {
133791b43e0SNing Li 		PMD_DRV_LOG(ERR, "SIOCSIFHWADDR failed: %s", strerror(errno));
134791b43e0SNing Li 		goto error;
135791b43e0SNing Li 	}
136791b43e0SNing Li 
137e3b43481SJianfeng Tan 	if (!(*p_ifname))
138e3b43481SJianfeng Tan 		*p_ifname = strdup(ifr.ifr_name);
139e3b43481SJianfeng Tan 
140e3b43481SJianfeng Tan 	return tapfd;
141e3b43481SJianfeng Tan error:
142e3b43481SJianfeng Tan 	close(tapfd);
143e3b43481SJianfeng Tan 	return -1;
144e3b43481SJianfeng Tan }
145