15566a3e3SBruce Richardson /* SPDX-License-Identifier: BSD-3-Clause 25566a3e3SBruce Richardson * Copyright(c) 2016 Intel Corporation 3e3b43481SJianfeng Tan */ 4e3b43481SJianfeng Tan 5e3b43481SJianfeng Tan #include <unistd.h> 6e3b43481SJianfeng Tan #include <sys/types.h> 7e3b43481SJianfeng Tan #include <sys/stat.h> 8e3b43481SJianfeng Tan #include <fcntl.h> 9e3b43481SJianfeng Tan #include <net/if.h> 10791b43e0SNing Li #include <net/if_arp.h> 11e3b43481SJianfeng Tan #include <errno.h> 12e3b43481SJianfeng Tan #include <string.h> 13e3b43481SJianfeng Tan #include <limits.h> 14e3b43481SJianfeng Tan 15791b43e0SNing Li #include <rte_ether.h> 16791b43e0SNing Li 17e3b43481SJianfeng Tan #include "vhost_kernel_tap.h" 18e3b43481SJianfeng Tan #include "../virtio_logs.h" 19*1db4d233SEric Zhang #include "../virtio_pci.h" 20*1db4d233SEric Zhang 21*1db4d233SEric Zhang static int 22*1db4d233SEric Zhang vhost_kernel_tap_set_offload(int fd, uint64_t features) 23*1db4d233SEric Zhang { 24*1db4d233SEric Zhang unsigned int offload = 0; 25*1db4d233SEric Zhang 26*1db4d233SEric Zhang if (features & (1ULL << VIRTIO_NET_F_GUEST_CSUM)) { 27*1db4d233SEric Zhang offload |= TUN_F_CSUM; 28*1db4d233SEric Zhang if (features & (1ULL << VIRTIO_NET_F_GUEST_TSO4)) 29*1db4d233SEric Zhang offload |= TUN_F_TSO4; 30*1db4d233SEric Zhang if (features & (1ULL << VIRTIO_NET_F_GUEST_TSO6)) 31*1db4d233SEric Zhang offload |= TUN_F_TSO6; 32*1db4d233SEric Zhang if (features & ((1ULL << VIRTIO_NET_F_GUEST_TSO4) | 33*1db4d233SEric Zhang (1ULL << VIRTIO_NET_F_GUEST_TSO6)) && 34*1db4d233SEric Zhang (features & (1ULL << VIRTIO_NET_F_GUEST_ECN))) 35*1db4d233SEric Zhang offload |= TUN_F_TSO_ECN; 36*1db4d233SEric Zhang if (features & (1ULL << VIRTIO_NET_F_GUEST_UFO)) 37*1db4d233SEric Zhang offload |= TUN_F_UFO; 38*1db4d233SEric Zhang } 39*1db4d233SEric Zhang 40*1db4d233SEric Zhang if (offload != 0) { 41*1db4d233SEric Zhang /* Check if our kernel supports TUNSETOFFLOAD */ 42*1db4d233SEric Zhang if (ioctl(fd, TUNSETOFFLOAD, 0) != 0 && errno == EINVAL) { 43*1db4d233SEric Zhang PMD_DRV_LOG(ERR, "Kernel does't support TUNSETOFFLOAD\n"); 44*1db4d233SEric Zhang return -ENOTSUP; 45*1db4d233SEric Zhang } 46*1db4d233SEric Zhang 47*1db4d233SEric Zhang if (ioctl(fd, TUNSETOFFLOAD, offload) != 0) { 48*1db4d233SEric Zhang offload &= ~TUN_F_UFO; 49*1db4d233SEric Zhang if (ioctl(fd, TUNSETOFFLOAD, offload) != 0) { 50*1db4d233SEric Zhang PMD_DRV_LOG(ERR, "TUNSETOFFLOAD ioctl() failed: %s\n", 51*1db4d233SEric Zhang strerror(errno)); 52*1db4d233SEric Zhang return -1; 53*1db4d233SEric Zhang } 54*1db4d233SEric Zhang } 55*1db4d233SEric Zhang } 56*1db4d233SEric Zhang 57*1db4d233SEric Zhang return 0; 58*1db4d233SEric Zhang } 59e3b43481SJianfeng Tan 60e3b43481SJianfeng Tan int 61791b43e0SNing Li vhost_kernel_open_tap(char **p_ifname, int hdr_size, int req_mq, 62*1db4d233SEric Zhang const char *mac, uint64_t features) 63e3b43481SJianfeng Tan { 64e3b43481SJianfeng Tan unsigned int tap_features; 65e3b43481SJianfeng Tan int sndbuf = INT_MAX; 66e3b43481SJianfeng Tan struct ifreq ifr; 67e3b43481SJianfeng Tan int tapfd; 68e3b43481SJianfeng Tan 69e3b43481SJianfeng Tan /* TODO: 70e3b43481SJianfeng Tan * 1. verify we can get/set vnet_hdr_len, tap_probe_vnet_hdr_len 71e3b43481SJianfeng Tan * 2. get number of memory regions from vhost module parameter 72e3b43481SJianfeng Tan * max_mem_regions, supported in newer version linux kernel 73e3b43481SJianfeng Tan */ 74e3b43481SJianfeng Tan tapfd = open(PATH_NET_TUN, O_RDWR); 75e3b43481SJianfeng Tan if (tapfd < 0) { 76e3b43481SJianfeng Tan PMD_DRV_LOG(ERR, "fail to open %s: %s", 77e3b43481SJianfeng Tan PATH_NET_TUN, strerror(errno)); 78e3b43481SJianfeng Tan return -1; 79e3b43481SJianfeng Tan } 80e3b43481SJianfeng Tan 81e3b43481SJianfeng Tan /* Construct ifr */ 82e3b43481SJianfeng Tan memset(&ifr, 0, sizeof(ifr)); 83e3b43481SJianfeng Tan ifr.ifr_flags = IFF_TAP | IFF_NO_PI; 84e3b43481SJianfeng Tan 85e3b43481SJianfeng Tan if (ioctl(tapfd, TUNGETFEATURES, &tap_features) == -1) { 86e3b43481SJianfeng Tan PMD_DRV_LOG(ERR, "TUNGETFEATURES failed: %s", strerror(errno)); 87e3b43481SJianfeng Tan goto error; 88e3b43481SJianfeng Tan } 89e3b43481SJianfeng Tan if (tap_features & IFF_ONE_QUEUE) 90e3b43481SJianfeng Tan ifr.ifr_flags |= IFF_ONE_QUEUE; 91e3b43481SJianfeng Tan 92e3b43481SJianfeng Tan /* Let tap instead of vhost-net handle vnet header, as the latter does 93e3b43481SJianfeng Tan * not support offloading. And in this case, we should not set feature 94e3b43481SJianfeng Tan * bit VHOST_NET_F_VIRTIO_NET_HDR. 95e3b43481SJianfeng Tan */ 96e3b43481SJianfeng Tan if (tap_features & IFF_VNET_HDR) { 97e3b43481SJianfeng Tan ifr.ifr_flags |= IFF_VNET_HDR; 98e3b43481SJianfeng Tan } else { 99e3b43481SJianfeng Tan PMD_DRV_LOG(ERR, "TAP does not support IFF_VNET_HDR"); 100e3b43481SJianfeng Tan goto error; 101e3b43481SJianfeng Tan } 102e3b43481SJianfeng Tan 103be7a4707SJianfeng Tan if (req_mq) 104be7a4707SJianfeng Tan ifr.ifr_flags |= IFF_MULTI_QUEUE; 105be7a4707SJianfeng Tan 106e3b43481SJianfeng Tan if (*p_ifname) 107907d125eSSebastian Basierski strncpy(ifr.ifr_name, *p_ifname, IFNAMSIZ - 1); 108e3b43481SJianfeng Tan else 109907d125eSSebastian Basierski strncpy(ifr.ifr_name, "tap%d", IFNAMSIZ - 1); 110e3b43481SJianfeng Tan if (ioctl(tapfd, TUNSETIFF, (void *)&ifr) == -1) { 111e3b43481SJianfeng Tan PMD_DRV_LOG(ERR, "TUNSETIFF failed: %s", strerror(errno)); 112e3b43481SJianfeng Tan goto error; 113e3b43481SJianfeng Tan } 114e3b43481SJianfeng Tan 115e3b43481SJianfeng Tan fcntl(tapfd, F_SETFL, O_NONBLOCK); 116e3b43481SJianfeng Tan 117e3b43481SJianfeng Tan if (ioctl(tapfd, TUNSETVNETHDRSZ, &hdr_size) < 0) { 118e3b43481SJianfeng Tan PMD_DRV_LOG(ERR, "TUNSETVNETHDRSZ failed: %s", strerror(errno)); 119e3b43481SJianfeng Tan goto error; 120e3b43481SJianfeng Tan } 121e3b43481SJianfeng Tan 122e3b43481SJianfeng Tan if (ioctl(tapfd, TUNSETSNDBUF, &sndbuf) < 0) { 123e3b43481SJianfeng Tan PMD_DRV_LOG(ERR, "TUNSETSNDBUF failed: %s", strerror(errno)); 124e3b43481SJianfeng Tan goto error; 125e3b43481SJianfeng Tan } 126e3b43481SJianfeng Tan 127*1db4d233SEric Zhang vhost_kernel_tap_set_offload(tapfd, features); 1285e97e420SJianfeng Tan 129791b43e0SNing Li memset(&ifr, 0, sizeof(ifr)); 130791b43e0SNing Li ifr.ifr_hwaddr.sa_family = ARPHRD_ETHER; 131791b43e0SNing Li memcpy(ifr.ifr_hwaddr.sa_data, mac, ETHER_ADDR_LEN); 132791b43e0SNing Li if (ioctl(tapfd, SIOCSIFHWADDR, (void *)&ifr) == -1) { 133791b43e0SNing Li PMD_DRV_LOG(ERR, "SIOCSIFHWADDR failed: %s", strerror(errno)); 134791b43e0SNing Li goto error; 135791b43e0SNing Li } 136791b43e0SNing Li 137e3b43481SJianfeng Tan if (!(*p_ifname)) 138e3b43481SJianfeng Tan *p_ifname = strdup(ifr.ifr_name); 139e3b43481SJianfeng Tan 140e3b43481SJianfeng Tan return tapfd; 141e3b43481SJianfeng Tan error: 142e3b43481SJianfeng Tan close(tapfd); 143e3b43481SJianfeng Tan return -1; 144e3b43481SJianfeng Tan } 145