13998e2a0SBruce Richardson /* SPDX-License-Identifier: BSD-3-Clause 23998e2a0SBruce Richardson * Copyright(c) 2010-2014 Intel Corporation 3e107e82eSAnatoly Burakov */ 4e107e82eSAnatoly Burakov 5e107e82eSAnatoly Burakov #include <stdio.h> 6e107e82eSAnatoly Burakov #include <stdlib.h> 7e107e82eSAnatoly Burakov #include <stdint.h> 8e107e82eSAnatoly Burakov #include <inttypes.h> 9e107e82eSAnatoly Burakov #include <sys/types.h> 10e107e82eSAnatoly Burakov #include <sys/param.h> 11e107e82eSAnatoly Burakov #include <string.h> 12e107e82eSAnatoly Burakov #include <sys/queue.h> 13e107e82eSAnatoly Burakov #include <stdarg.h> 14e107e82eSAnatoly Burakov #include <errno.h> 15e107e82eSAnatoly Burakov #include <getopt.h> 16e107e82eSAnatoly Burakov 17e107e82eSAnatoly Burakov #include <rte_common.h> 18e107e82eSAnatoly Burakov #include <rte_byteorder.h> 19e107e82eSAnatoly Burakov #include <rte_log.h> 20e107e82eSAnatoly Burakov #include <rte_memory.h> 21e107e82eSAnatoly Burakov #include <rte_memcpy.h> 22e107e82eSAnatoly Burakov #include <rte_eal.h> 23e107e82eSAnatoly Burakov #include <rte_launch.h> 24e107e82eSAnatoly Burakov #include <rte_atomic.h> 25e107e82eSAnatoly Burakov #include <rte_cycles.h> 26e107e82eSAnatoly Burakov #include <rte_prefetch.h> 27e107e82eSAnatoly Burakov #include <rte_lcore.h> 28e107e82eSAnatoly Burakov #include <rte_per_lcore.h> 29e107e82eSAnatoly Burakov #include <rte_branch_prediction.h> 30e107e82eSAnatoly Burakov #include <rte_interrupts.h> 31e107e82eSAnatoly Burakov #include <rte_random.h> 32e107e82eSAnatoly Burakov #include <rte_debug.h> 33e107e82eSAnatoly Burakov #include <rte_ether.h> 34e107e82eSAnatoly Burakov #include <rte_ethdev.h> 35e107e82eSAnatoly Burakov #include <rte_mempool.h> 36e107e82eSAnatoly Burakov #include <rte_mbuf.h> 37e107e82eSAnatoly Burakov #include <rte_lpm.h> 3874de12b7SAnatoly Burakov #include <rte_lpm6.h> 39e107e82eSAnatoly Burakov #include <rte_ip.h> 4074de12b7SAnatoly Burakov #include <rte_string_fns.h> 41e107e82eSAnatoly Burakov 4274de12b7SAnatoly Burakov #include <rte_ip_frag.h> 4374de12b7SAnatoly Burakov 4474de12b7SAnatoly Burakov #define RTE_LOGTYPE_IP_FRAG RTE_LOGTYPE_USER1 45e107e82eSAnatoly Burakov 46e107e82eSAnatoly Burakov /* allow max jumbo frame 9.5 KB */ 47e107e82eSAnatoly Burakov #define JUMBO_FRAME_MAX_SIZE 0x2600 48e107e82eSAnatoly Burakov 49e107e82eSAnatoly Burakov #define ROUNDUP_DIV(a, b) (((a) + (b) - 1) / (b)) 50e107e82eSAnatoly Burakov 51e107e82eSAnatoly Burakov /* 5274de12b7SAnatoly Burakov * Default byte size for the IPv6 Maximum Transfer Unit (MTU). 5374de12b7SAnatoly Burakov * This value includes the size of IPv6 header. 54e107e82eSAnatoly Burakov */ 5574de12b7SAnatoly Burakov #define IPV4_MTU_DEFAULT ETHER_MTU 5674de12b7SAnatoly Burakov #define IPV6_MTU_DEFAULT ETHER_MTU 5774de12b7SAnatoly Burakov 5874de12b7SAnatoly Burakov /* 5974de12b7SAnatoly Burakov * Default payload in bytes for the IPv6 packet. 6074de12b7SAnatoly Burakov */ 6174de12b7SAnatoly Burakov #define IPV4_DEFAULT_PAYLOAD (IPV4_MTU_DEFAULT - sizeof(struct ipv4_hdr)) 6274de12b7SAnatoly Burakov #define IPV6_DEFAULT_PAYLOAD (IPV6_MTU_DEFAULT - sizeof(struct ipv6_hdr)) 6374de12b7SAnatoly Burakov 6474de12b7SAnatoly Burakov /* 6574de12b7SAnatoly Burakov * Max number of fragments per packet expected - defined by config file. 6674de12b7SAnatoly Burakov */ 6774de12b7SAnatoly Burakov #define MAX_PACKET_FRAG RTE_LIBRTE_IP_FRAG_MAX_FRAG 68e107e82eSAnatoly Burakov 69e107e82eSAnatoly Burakov #define NB_MBUF 8192 70e107e82eSAnatoly Burakov 71e107e82eSAnatoly Burakov #define MAX_PKT_BURST 32 72e107e82eSAnatoly Burakov #define BURST_TX_DRAIN_US 100 /* TX drain every ~100us */ 73e107e82eSAnatoly Burakov 74e107e82eSAnatoly Burakov /* Configure how many packets ahead to prefetch, when reading packets */ 75e107e82eSAnatoly Burakov #define PREFETCH_OFFSET 3 76e107e82eSAnatoly Burakov 77e107e82eSAnatoly Burakov /* 78e107e82eSAnatoly Burakov * Configurable number of RX/TX ring descriptors 79e107e82eSAnatoly Burakov */ 80*867a6c66SKevin Laatz #define RTE_TEST_RX_DESC_DEFAULT 1024 81*867a6c66SKevin Laatz #define RTE_TEST_TX_DESC_DEFAULT 1024 82e107e82eSAnatoly Burakov static uint16_t nb_rxd = RTE_TEST_RX_DESC_DEFAULT; 83e107e82eSAnatoly Burakov static uint16_t nb_txd = RTE_TEST_TX_DESC_DEFAULT; 84e107e82eSAnatoly Burakov 85e107e82eSAnatoly Burakov /* ethernet addresses of ports */ 86e107e82eSAnatoly Burakov static struct ether_addr ports_eth_addr[RTE_MAX_ETHPORTS]; 8774de12b7SAnatoly Burakov 8874de12b7SAnatoly Burakov #ifndef IPv4_BYTES 8974de12b7SAnatoly Burakov #define IPv4_BYTES_FMT "%" PRIu8 ".%" PRIu8 ".%" PRIu8 ".%" PRIu8 9074de12b7SAnatoly Burakov #define IPv4_BYTES(addr) \ 9174de12b7SAnatoly Burakov (uint8_t) (((addr) >> 24) & 0xFF),\ 9274de12b7SAnatoly Burakov (uint8_t) (((addr) >> 16) & 0xFF),\ 9374de12b7SAnatoly Burakov (uint8_t) (((addr) >> 8) & 0xFF),\ 9474de12b7SAnatoly Burakov (uint8_t) ((addr) & 0xFF) 9574de12b7SAnatoly Burakov #endif 9674de12b7SAnatoly Burakov 9774de12b7SAnatoly Burakov #ifndef IPv6_BYTES 9874de12b7SAnatoly Burakov #define IPv6_BYTES_FMT "%02x%02x:%02x%02x:%02x%02x:%02x%02x:"\ 9974de12b7SAnatoly Burakov "%02x%02x:%02x%02x:%02x%02x:%02x%02x" 10074de12b7SAnatoly Burakov #define IPv6_BYTES(addr) \ 10174de12b7SAnatoly Burakov addr[0], addr[1], addr[2], addr[3], \ 10274de12b7SAnatoly Burakov addr[4], addr[5], addr[6], addr[7], \ 10374de12b7SAnatoly Burakov addr[8], addr[9], addr[10], addr[11],\ 10474de12b7SAnatoly Burakov addr[12], addr[13],addr[14], addr[15] 10574de12b7SAnatoly Burakov #endif 10674de12b7SAnatoly Burakov 10774de12b7SAnatoly Burakov #define IPV6_ADDR_LEN 16 108e107e82eSAnatoly Burakov 109e107e82eSAnatoly Burakov /* mask of enabled ports */ 110e107e82eSAnatoly Burakov static int enabled_port_mask = 0; 111e107e82eSAnatoly Burakov 112e107e82eSAnatoly Burakov static int rx_queue_per_lcore = 1; 113e107e82eSAnatoly Burakov 114e107e82eSAnatoly Burakov #define MBUF_TABLE_SIZE (2 * MAX(MAX_PKT_BURST, MAX_PACKET_FRAG)) 115e107e82eSAnatoly Burakov 116e107e82eSAnatoly Burakov struct mbuf_table { 117e107e82eSAnatoly Burakov uint16_t len; 118e107e82eSAnatoly Burakov struct rte_mbuf *m_table[MBUF_TABLE_SIZE]; 119e107e82eSAnatoly Burakov }; 120e107e82eSAnatoly Burakov 12174de12b7SAnatoly Burakov struct rx_queue { 12274de12b7SAnatoly Burakov struct rte_mempool *direct_pool; 12374de12b7SAnatoly Burakov struct rte_mempool *indirect_pool; 12474de12b7SAnatoly Burakov struct rte_lpm *lpm; 12574de12b7SAnatoly Burakov struct rte_lpm6 *lpm6; 126f8244c63SZhiyong Yang uint16_t portid; 12774de12b7SAnatoly Burakov }; 12874de12b7SAnatoly Burakov 129e107e82eSAnatoly Burakov #define MAX_RX_QUEUE_PER_LCORE 16 130e107e82eSAnatoly Burakov #define MAX_TX_QUEUE_PER_PORT 16 131e107e82eSAnatoly Burakov struct lcore_queue_conf { 132e107e82eSAnatoly Burakov uint16_t n_rx_queue; 133e107e82eSAnatoly Burakov uint16_t tx_queue_id[RTE_MAX_ETHPORTS]; 13474de12b7SAnatoly Burakov struct rx_queue rx_queue_list[MAX_RX_QUEUE_PER_LCORE]; 135e107e82eSAnatoly Burakov struct mbuf_table tx_mbufs[RTE_MAX_ETHPORTS]; 136e107e82eSAnatoly Burakov } __rte_cache_aligned; 137e107e82eSAnatoly Burakov struct lcore_queue_conf lcore_queue_conf[RTE_MAX_LCORE]; 138e107e82eSAnatoly Burakov 1395e470a66SAndriy Berestovskyy static struct rte_eth_conf port_conf = { 140e107e82eSAnatoly Burakov .rxmode = { 141e107e82eSAnatoly Burakov .max_rx_pkt_len = JUMBO_FRAME_MAX_SIZE, 142e107e82eSAnatoly Burakov .split_hdr_size = 0, 143fdb9eff6SShahaf Shuler .ignore_offload_bitfield = 1, 144fdb9eff6SShahaf Shuler .offloads = (DEV_RX_OFFLOAD_CHECKSUM | 145fdb9eff6SShahaf Shuler DEV_RX_OFFLOAD_JUMBO_FRAME | 146fdb9eff6SShahaf Shuler DEV_RX_OFFLOAD_CRC_STRIP), 147e107e82eSAnatoly Burakov }, 148e107e82eSAnatoly Burakov .txmode = { 149e107e82eSAnatoly Burakov .mq_mode = ETH_MQ_TX_NONE, 150fdb9eff6SShahaf Shuler .offloads = (DEV_TX_OFFLOAD_IPV4_CKSUM | 151fdb9eff6SShahaf Shuler DEV_TX_OFFLOAD_MULTI_SEGS), 152e107e82eSAnatoly Burakov }, 153e107e82eSAnatoly Burakov }; 154e107e82eSAnatoly Burakov 15574de12b7SAnatoly Burakov /* 15674de12b7SAnatoly Burakov * IPv4 forwarding table 15774de12b7SAnatoly Burakov */ 15874de12b7SAnatoly Burakov struct l3fwd_ipv4_route { 159e107e82eSAnatoly Burakov uint32_t ip; 160e107e82eSAnatoly Burakov uint8_t depth; 161e107e82eSAnatoly Burakov uint8_t if_out; 162e107e82eSAnatoly Burakov }; 163e107e82eSAnatoly Burakov 16474de12b7SAnatoly Burakov struct l3fwd_ipv4_route l3fwd_ipv4_route_array[] = { 16574de12b7SAnatoly Burakov {IPv4(100,10,0,0), 16, 0}, 16674de12b7SAnatoly Burakov {IPv4(100,20,0,0), 16, 1}, 16774de12b7SAnatoly Burakov {IPv4(100,30,0,0), 16, 2}, 16874de12b7SAnatoly Burakov {IPv4(100,40,0,0), 16, 3}, 16974de12b7SAnatoly Burakov {IPv4(100,50,0,0), 16, 4}, 17074de12b7SAnatoly Burakov {IPv4(100,60,0,0), 16, 5}, 17174de12b7SAnatoly Burakov {IPv4(100,70,0,0), 16, 6}, 17274de12b7SAnatoly Burakov {IPv4(100,80,0,0), 16, 7}, 173e107e82eSAnatoly Burakov }; 174e107e82eSAnatoly Burakov 17574de12b7SAnatoly Burakov /* 17674de12b7SAnatoly Burakov * IPv6 forwarding table 17774de12b7SAnatoly Burakov */ 178e107e82eSAnatoly Burakov 17974de12b7SAnatoly Burakov struct l3fwd_ipv6_route { 18074de12b7SAnatoly Burakov uint8_t ip[IPV6_ADDR_LEN]; 18174de12b7SAnatoly Burakov uint8_t depth; 18274de12b7SAnatoly Burakov uint8_t if_out; 18374de12b7SAnatoly Burakov }; 184e107e82eSAnatoly Burakov 18574de12b7SAnatoly Burakov static struct l3fwd_ipv6_route l3fwd_ipv6_route_array[] = { 18674de12b7SAnatoly Burakov {{1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 0}, 18774de12b7SAnatoly Burakov {{2,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 1}, 18874de12b7SAnatoly Burakov {{3,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 2}, 18974de12b7SAnatoly Burakov {{4,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 3}, 19074de12b7SAnatoly Burakov {{5,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 4}, 19174de12b7SAnatoly Burakov {{6,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 5}, 19274de12b7SAnatoly Burakov {{7,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 6}, 19374de12b7SAnatoly Burakov {{8,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 7}, 19474de12b7SAnatoly Burakov }; 19574de12b7SAnatoly Burakov 19674de12b7SAnatoly Burakov #define LPM_MAX_RULES 1024 19774de12b7SAnatoly Burakov #define LPM6_MAX_RULES 1024 19874de12b7SAnatoly Burakov #define LPM6_NUMBER_TBL8S (1 << 16) 19974de12b7SAnatoly Burakov 20074de12b7SAnatoly Burakov struct rte_lpm6_config lpm6_config = { 20174de12b7SAnatoly Burakov .max_rules = LPM6_MAX_RULES, 20274de12b7SAnatoly Burakov .number_tbl8s = LPM6_NUMBER_TBL8S, 20374de12b7SAnatoly Burakov .flags = 0 20474de12b7SAnatoly Burakov }; 20574de12b7SAnatoly Burakov 20674de12b7SAnatoly Burakov static struct rte_mempool *socket_direct_pool[RTE_MAX_NUMA_NODES]; 20774de12b7SAnatoly Burakov static struct rte_mempool *socket_indirect_pool[RTE_MAX_NUMA_NODES]; 20874de12b7SAnatoly Burakov static struct rte_lpm *socket_lpm[RTE_MAX_NUMA_NODES]; 20974de12b7SAnatoly Burakov static struct rte_lpm6 *socket_lpm6[RTE_MAX_NUMA_NODES]; 210e107e82eSAnatoly Burakov 211e107e82eSAnatoly Burakov /* Send burst of packets on an output interface */ 212e107e82eSAnatoly Burakov static inline int 213f8244c63SZhiyong Yang send_burst(struct lcore_queue_conf *qconf, uint16_t n, uint16_t port) 214e107e82eSAnatoly Burakov { 215e107e82eSAnatoly Burakov struct rte_mbuf **m_table; 216e107e82eSAnatoly Burakov int ret; 217e107e82eSAnatoly Burakov uint16_t queueid; 218e107e82eSAnatoly Burakov 219e107e82eSAnatoly Burakov queueid = qconf->tx_queue_id[port]; 220e107e82eSAnatoly Burakov m_table = (struct rte_mbuf **)qconf->tx_mbufs[port].m_table; 221e107e82eSAnatoly Burakov 222e107e82eSAnatoly Burakov ret = rte_eth_tx_burst(port, queueid, m_table, n); 223e107e82eSAnatoly Burakov if (unlikely(ret < n)) { 224e107e82eSAnatoly Burakov do { 225e107e82eSAnatoly Burakov rte_pktmbuf_free(m_table[ret]); 226e107e82eSAnatoly Burakov } while (++ret < n); 227e107e82eSAnatoly Burakov } 228e107e82eSAnatoly Burakov 229e107e82eSAnatoly Burakov return 0; 230e107e82eSAnatoly Burakov } 231e107e82eSAnatoly Burakov 232e107e82eSAnatoly Burakov static inline void 23374de12b7SAnatoly Burakov l3fwd_simple_forward(struct rte_mbuf *m, struct lcore_queue_conf *qconf, 234f8244c63SZhiyong Yang uint8_t queueid, uint16_t port_in) 235e107e82eSAnatoly Burakov { 23674de12b7SAnatoly Burakov struct rx_queue *rxq; 237d89a5bceSVladyslav Buslov uint32_t i, len, next_hop; 238f8244c63SZhiyong Yang uint8_t ipv6; 239f8244c63SZhiyong Yang uint16_t port_out; 240e107e82eSAnatoly Burakov int32_t len2; 241e107e82eSAnatoly Burakov 24274de12b7SAnatoly Burakov ipv6 = 0; 24374de12b7SAnatoly Burakov rxq = &qconf->rx_queue_list[queueid]; 24474de12b7SAnatoly Burakov 24574de12b7SAnatoly Burakov /* by default, send everything back to the source port */ 24674de12b7SAnatoly Burakov port_out = port_in; 247e107e82eSAnatoly Burakov 248e107e82eSAnatoly Burakov /* Remove the Ethernet header and trailer from the input packet */ 249e107e82eSAnatoly Burakov rte_pktmbuf_adj(m, (uint16_t)sizeof(struct ether_hdr)); 250e107e82eSAnatoly Burakov 25174de12b7SAnatoly Burakov /* Build transmission burst */ 25274de12b7SAnatoly Burakov len = qconf->tx_mbufs[port_out].len; 25374de12b7SAnatoly Burakov 25474de12b7SAnatoly Burakov /* if this is an IPv4 packet */ 2553c0184ccSHelin Zhang if (RTE_ETH_IS_IPV4_HDR(m->packet_type)) { 25674de12b7SAnatoly Burakov struct ipv4_hdr *ip_hdr; 25774de12b7SAnatoly Burakov uint32_t ip_dst; 258e107e82eSAnatoly Burakov /* Read the lookup key (i.e. ip_dst) from the input packet */ 259e107e82eSAnatoly Burakov ip_hdr = rte_pktmbuf_mtod(m, struct ipv4_hdr *); 260e107e82eSAnatoly Burakov ip_dst = rte_be_to_cpu_32(ip_hdr->dst_addr); 261e107e82eSAnatoly Burakov 262e107e82eSAnatoly Burakov /* Find destination port */ 263d89a5bceSVladyslav Buslov if (rte_lpm_lookup(rxq->lpm, ip_dst, &next_hop) == 0 && 264d89a5bceSVladyslav Buslov (enabled_port_mask & 1 << next_hop) != 0) { 265d89a5bceSVladyslav Buslov port_out = next_hop; 266e107e82eSAnatoly Burakov 26774de12b7SAnatoly Burakov /* Build transmission burst for new port */ 268e107e82eSAnatoly Burakov len = qconf->tx_mbufs[port_out].len; 26974de12b7SAnatoly Burakov } 270e107e82eSAnatoly Burakov 271e107e82eSAnatoly Burakov /* if we don't need to do any fragmentation */ 272ea672a8bSOlivier Matz if (likely (IPV4_MTU_DEFAULT >= m->pkt_len)) { 273e107e82eSAnatoly Burakov qconf->tx_mbufs[port_out].m_table[len] = m; 274e107e82eSAnatoly Burakov len2 = 1; 275e107e82eSAnatoly Burakov } else { 276e107e82eSAnatoly Burakov len2 = rte_ipv4_fragment_packet(m, 277e107e82eSAnatoly Burakov &qconf->tx_mbufs[port_out].m_table[len], 278e107e82eSAnatoly Burakov (uint16_t)(MBUF_TABLE_SIZE - len), 279e107e82eSAnatoly Burakov IPV4_MTU_DEFAULT, 28074de12b7SAnatoly Burakov rxq->direct_pool, rxq->indirect_pool); 281e107e82eSAnatoly Burakov 282e107e82eSAnatoly Burakov /* Free input packet */ 283e107e82eSAnatoly Burakov rte_pktmbuf_free(m); 284e107e82eSAnatoly Burakov 285e107e82eSAnatoly Burakov /* If we fail to fragment the packet */ 286e107e82eSAnatoly Burakov if (unlikely (len2 < 0)) 287e107e82eSAnatoly Burakov return; 288e107e82eSAnatoly Burakov } 2893c0184ccSHelin Zhang } else if (RTE_ETH_IS_IPV6_HDR(m->packet_type)) { 2903c0184ccSHelin Zhang /* if this is an IPv6 packet */ 29174de12b7SAnatoly Burakov struct ipv6_hdr *ip_hdr; 29274de12b7SAnatoly Burakov 29374de12b7SAnatoly Burakov ipv6 = 1; 29474de12b7SAnatoly Burakov 29574de12b7SAnatoly Burakov /* Read the lookup key (i.e. ip_dst) from the input packet */ 29674de12b7SAnatoly Burakov ip_hdr = rte_pktmbuf_mtod(m, struct ipv6_hdr *); 29774de12b7SAnatoly Burakov 29874de12b7SAnatoly Burakov /* Find destination port */ 299d89a5bceSVladyslav Buslov if (rte_lpm6_lookup(rxq->lpm6, ip_hdr->dst_addr, 300d89a5bceSVladyslav Buslov &next_hop) == 0 && 301d89a5bceSVladyslav Buslov (enabled_port_mask & 1 << next_hop) != 0) { 302d89a5bceSVladyslav Buslov port_out = next_hop; 30374de12b7SAnatoly Burakov 30474de12b7SAnatoly Burakov /* Build transmission burst for new port */ 30574de12b7SAnatoly Burakov len = qconf->tx_mbufs[port_out].len; 30674de12b7SAnatoly Burakov } 30774de12b7SAnatoly Burakov 30874de12b7SAnatoly Burakov /* if we don't need to do any fragmentation */ 309ea672a8bSOlivier Matz if (likely (IPV6_MTU_DEFAULT >= m->pkt_len)) { 31074de12b7SAnatoly Burakov qconf->tx_mbufs[port_out].m_table[len] = m; 31174de12b7SAnatoly Burakov len2 = 1; 31274de12b7SAnatoly Burakov } else { 31374de12b7SAnatoly Burakov len2 = rte_ipv6_fragment_packet(m, 31474de12b7SAnatoly Burakov &qconf->tx_mbufs[port_out].m_table[len], 31574de12b7SAnatoly Burakov (uint16_t)(MBUF_TABLE_SIZE - len), 31674de12b7SAnatoly Burakov IPV6_MTU_DEFAULT, 31774de12b7SAnatoly Burakov rxq->direct_pool, rxq->indirect_pool); 31874de12b7SAnatoly Burakov 31974de12b7SAnatoly Burakov /* Free input packet */ 32074de12b7SAnatoly Burakov rte_pktmbuf_free(m); 32174de12b7SAnatoly Burakov 32274de12b7SAnatoly Burakov /* If we fail to fragment the packet */ 32374de12b7SAnatoly Burakov if (unlikely (len2 < 0)) 32474de12b7SAnatoly Burakov return; 32574de12b7SAnatoly Burakov } 32674de12b7SAnatoly Burakov } 32774de12b7SAnatoly Burakov /* else, just forward the packet */ 32874de12b7SAnatoly Burakov else { 32974de12b7SAnatoly Burakov qconf->tx_mbufs[port_out].m_table[len] = m; 33074de12b7SAnatoly Burakov len2 = 1; 33174de12b7SAnatoly Burakov } 332e107e82eSAnatoly Burakov 333e107e82eSAnatoly Burakov for (i = len; i < len + len2; i ++) { 33474de12b7SAnatoly Burakov void *d_addr_bytes; 33574de12b7SAnatoly Burakov 336e107e82eSAnatoly Burakov m = qconf->tx_mbufs[port_out].m_table[i]; 337e107e82eSAnatoly Burakov struct ether_hdr *eth_hdr = (struct ether_hdr *) 338e107e82eSAnatoly Burakov rte_pktmbuf_prepend(m, (uint16_t)sizeof(struct ether_hdr)); 339e107e82eSAnatoly Burakov if (eth_hdr == NULL) { 340e107e82eSAnatoly Burakov rte_panic("No headroom in mbuf.\n"); 341e107e82eSAnatoly Burakov } 342e107e82eSAnatoly Burakov 3437869536fSBruce Richardson m->l2_len = sizeof(struct ether_hdr); 344e107e82eSAnatoly Burakov 34574de12b7SAnatoly Burakov /* 02:00:00:00:00:xx */ 34674de12b7SAnatoly Burakov d_addr_bytes = ð_hdr->d_addr.addr_bytes[0]; 34774de12b7SAnatoly Burakov *((uint64_t *)d_addr_bytes) = 0x000000000002 + ((uint64_t)port_out << 40); 34874de12b7SAnatoly Burakov 34974de12b7SAnatoly Burakov /* src addr */ 350e107e82eSAnatoly Burakov ether_addr_copy(&ports_eth_addr[port_out], ð_hdr->s_addr); 35174de12b7SAnatoly Burakov if (ipv6) 35274de12b7SAnatoly Burakov eth_hdr->ether_type = rte_be_to_cpu_16(ETHER_TYPE_IPv6); 35374de12b7SAnatoly Burakov else 354e107e82eSAnatoly Burakov eth_hdr->ether_type = rte_be_to_cpu_16(ETHER_TYPE_IPv4); 355e107e82eSAnatoly Burakov } 356e107e82eSAnatoly Burakov 357e107e82eSAnatoly Burakov len += len2; 358e107e82eSAnatoly Burakov 359e107e82eSAnatoly Burakov if (likely(len < MAX_PKT_BURST)) { 360e107e82eSAnatoly Burakov qconf->tx_mbufs[port_out].len = (uint16_t)len; 361e107e82eSAnatoly Burakov return; 362e107e82eSAnatoly Burakov } 363e107e82eSAnatoly Burakov 364e107e82eSAnatoly Burakov /* Transmit packets */ 365e107e82eSAnatoly Burakov send_burst(qconf, (uint16_t)len, port_out); 366e107e82eSAnatoly Burakov qconf->tx_mbufs[port_out].len = 0; 367e107e82eSAnatoly Burakov } 368e107e82eSAnatoly Burakov 369e107e82eSAnatoly Burakov /* main processing loop */ 370e107e82eSAnatoly Burakov static int 371e107e82eSAnatoly Burakov main_loop(__attribute__((unused)) void *dummy) 372e107e82eSAnatoly Burakov { 373e107e82eSAnatoly Burakov struct rte_mbuf *pkts_burst[MAX_PKT_BURST]; 374e107e82eSAnatoly Burakov unsigned lcore_id; 375e107e82eSAnatoly Burakov uint64_t prev_tsc, diff_tsc, cur_tsc; 376e107e82eSAnatoly Burakov int i, j, nb_rx; 377f8244c63SZhiyong Yang uint16_t portid; 378e107e82eSAnatoly Burakov struct lcore_queue_conf *qconf; 379e107e82eSAnatoly Burakov const uint64_t drain_tsc = (rte_get_tsc_hz() + US_PER_S - 1) / US_PER_S * BURST_TX_DRAIN_US; 380e107e82eSAnatoly Burakov 381e107e82eSAnatoly Burakov prev_tsc = 0; 382e107e82eSAnatoly Burakov 383e107e82eSAnatoly Burakov lcore_id = rte_lcore_id(); 384e107e82eSAnatoly Burakov qconf = &lcore_queue_conf[lcore_id]; 385e107e82eSAnatoly Burakov 386e107e82eSAnatoly Burakov if (qconf->n_rx_queue == 0) { 38774de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "lcore %u has nothing to do\n", lcore_id); 388e107e82eSAnatoly Burakov return 0; 389e107e82eSAnatoly Burakov } 390e107e82eSAnatoly Burakov 39174de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "entering main loop on lcore %u\n", lcore_id); 392e107e82eSAnatoly Burakov 393e107e82eSAnatoly Burakov for (i = 0; i < qconf->n_rx_queue; i++) { 394e107e82eSAnatoly Burakov 39574de12b7SAnatoly Burakov portid = qconf->rx_queue_list[i].portid; 39674de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, " -- lcoreid=%u portid=%d\n", lcore_id, 397f8244c63SZhiyong Yang portid); 398e107e82eSAnatoly Burakov } 399e107e82eSAnatoly Burakov 400e107e82eSAnatoly Burakov while (1) { 401e107e82eSAnatoly Burakov 402e107e82eSAnatoly Burakov cur_tsc = rte_rdtsc(); 403e107e82eSAnatoly Burakov 404e107e82eSAnatoly Burakov /* 405e107e82eSAnatoly Burakov * TX burst queue drain 406e107e82eSAnatoly Burakov */ 407e107e82eSAnatoly Burakov diff_tsc = cur_tsc - prev_tsc; 408e107e82eSAnatoly Burakov if (unlikely(diff_tsc > drain_tsc)) { 409e107e82eSAnatoly Burakov 410e107e82eSAnatoly Burakov /* 411e107e82eSAnatoly Burakov * This could be optimized (use queueid instead of 412e107e82eSAnatoly Burakov * portid), but it is not called so often 413e107e82eSAnatoly Burakov */ 414e107e82eSAnatoly Burakov for (portid = 0; portid < RTE_MAX_ETHPORTS; portid++) { 415e107e82eSAnatoly Burakov if (qconf->tx_mbufs[portid].len == 0) 416e107e82eSAnatoly Burakov continue; 417e107e82eSAnatoly Burakov send_burst(&lcore_queue_conf[lcore_id], 418e107e82eSAnatoly Burakov qconf->tx_mbufs[portid].len, 419e107e82eSAnatoly Burakov portid); 420e107e82eSAnatoly Burakov qconf->tx_mbufs[portid].len = 0; 421e107e82eSAnatoly Burakov } 422e107e82eSAnatoly Burakov 423e107e82eSAnatoly Burakov prev_tsc = cur_tsc; 424e107e82eSAnatoly Burakov } 425e107e82eSAnatoly Burakov 426e107e82eSAnatoly Burakov /* 427e107e82eSAnatoly Burakov * Read packet from RX queues 428e107e82eSAnatoly Burakov */ 429e107e82eSAnatoly Burakov for (i = 0; i < qconf->n_rx_queue; i++) { 430e107e82eSAnatoly Burakov 43174de12b7SAnatoly Burakov portid = qconf->rx_queue_list[i].portid; 432e107e82eSAnatoly Burakov nb_rx = rte_eth_rx_burst(portid, 0, pkts_burst, 433e107e82eSAnatoly Burakov MAX_PKT_BURST); 434e107e82eSAnatoly Burakov 435e107e82eSAnatoly Burakov /* Prefetch first packets */ 436e107e82eSAnatoly Burakov for (j = 0; j < PREFETCH_OFFSET && j < nb_rx; j++) { 437e107e82eSAnatoly Burakov rte_prefetch0(rte_pktmbuf_mtod( 438e107e82eSAnatoly Burakov pkts_burst[j], void *)); 439e107e82eSAnatoly Burakov } 440e107e82eSAnatoly Burakov 441e107e82eSAnatoly Burakov /* Prefetch and forward already prefetched packets */ 442e107e82eSAnatoly Burakov for (j = 0; j < (nb_rx - PREFETCH_OFFSET); j++) { 443e107e82eSAnatoly Burakov rte_prefetch0(rte_pktmbuf_mtod(pkts_burst[ 444e107e82eSAnatoly Burakov j + PREFETCH_OFFSET], void *)); 44574de12b7SAnatoly Burakov l3fwd_simple_forward(pkts_burst[j], qconf, i, portid); 446e107e82eSAnatoly Burakov } 447e107e82eSAnatoly Burakov 448e107e82eSAnatoly Burakov /* Forward remaining prefetched packets */ 449e107e82eSAnatoly Burakov for (; j < nb_rx; j++) { 45074de12b7SAnatoly Burakov l3fwd_simple_forward(pkts_burst[j], qconf, i, portid); 451e107e82eSAnatoly Burakov } 452e107e82eSAnatoly Burakov } 453e107e82eSAnatoly Burakov } 454e107e82eSAnatoly Burakov } 455e107e82eSAnatoly Burakov 456e107e82eSAnatoly Burakov /* display usage */ 457e107e82eSAnatoly Burakov static void 458e107e82eSAnatoly Burakov print_usage(const char *prgname) 459e107e82eSAnatoly Burakov { 460e107e82eSAnatoly Burakov printf("%s [EAL options] -- -p PORTMASK [-q NQ]\n" 461e107e82eSAnatoly Burakov " -p PORTMASK: hexadecimal bitmask of ports to configure\n" 462e107e82eSAnatoly Burakov " -q NQ: number of queue (=ports) per lcore (default is 1)\n", 463e107e82eSAnatoly Burakov prgname); 464e107e82eSAnatoly Burakov } 465e107e82eSAnatoly Burakov 466e107e82eSAnatoly Burakov static int 467e107e82eSAnatoly Burakov parse_portmask(const char *portmask) 468e107e82eSAnatoly Burakov { 469e107e82eSAnatoly Burakov char *end = NULL; 470e107e82eSAnatoly Burakov unsigned long pm; 471e107e82eSAnatoly Burakov 472e107e82eSAnatoly Burakov /* parse hexadecimal string */ 473e107e82eSAnatoly Burakov pm = strtoul(portmask, &end, 16); 474e107e82eSAnatoly Burakov if ((portmask[0] == '\0') || (end == NULL) || (*end != '\0')) 475e107e82eSAnatoly Burakov return -1; 476e107e82eSAnatoly Burakov 477e107e82eSAnatoly Burakov if (pm == 0) 478e107e82eSAnatoly Burakov return -1; 479e107e82eSAnatoly Burakov 480e107e82eSAnatoly Burakov return pm; 481e107e82eSAnatoly Burakov } 482e107e82eSAnatoly Burakov 483e107e82eSAnatoly Burakov static int 484e107e82eSAnatoly Burakov parse_nqueue(const char *q_arg) 485e107e82eSAnatoly Burakov { 486e107e82eSAnatoly Burakov char *end = NULL; 487e107e82eSAnatoly Burakov unsigned long n; 488e107e82eSAnatoly Burakov 489e107e82eSAnatoly Burakov /* parse hexadecimal string */ 490e107e82eSAnatoly Burakov n = strtoul(q_arg, &end, 10); 491e107e82eSAnatoly Burakov if ((q_arg[0] == '\0') || (end == NULL) || (*end != '\0')) 492e107e82eSAnatoly Burakov return -1; 493e107e82eSAnatoly Burakov if (n == 0) 494e107e82eSAnatoly Burakov return -1; 495e107e82eSAnatoly Burakov if (n >= MAX_RX_QUEUE_PER_LCORE) 496e107e82eSAnatoly Burakov return -1; 497e107e82eSAnatoly Burakov 498e107e82eSAnatoly Burakov return n; 499e107e82eSAnatoly Burakov } 500e107e82eSAnatoly Burakov 501e107e82eSAnatoly Burakov /* Parse the argument given in the command line of the application */ 502e107e82eSAnatoly Burakov static int 503e107e82eSAnatoly Burakov parse_args(int argc, char **argv) 504e107e82eSAnatoly Burakov { 505e107e82eSAnatoly Burakov int opt, ret; 506e107e82eSAnatoly Burakov char **argvopt; 507e107e82eSAnatoly Burakov int option_index; 508e107e82eSAnatoly Burakov char *prgname = argv[0]; 509e107e82eSAnatoly Burakov static struct option lgopts[] = { 510e107e82eSAnatoly Burakov {NULL, 0, 0, 0} 511e107e82eSAnatoly Burakov }; 512e107e82eSAnatoly Burakov 513e107e82eSAnatoly Burakov argvopt = argv; 514e107e82eSAnatoly Burakov 515e107e82eSAnatoly Burakov while ((opt = getopt_long(argc, argvopt, "p:q:", 516e107e82eSAnatoly Burakov lgopts, &option_index)) != EOF) { 517e107e82eSAnatoly Burakov 518e107e82eSAnatoly Burakov switch (opt) { 519e107e82eSAnatoly Burakov /* portmask */ 520e107e82eSAnatoly Burakov case 'p': 521e107e82eSAnatoly Burakov enabled_port_mask = parse_portmask(optarg); 522e107e82eSAnatoly Burakov if (enabled_port_mask < 0) { 523e107e82eSAnatoly Burakov printf("invalid portmask\n"); 524e107e82eSAnatoly Burakov print_usage(prgname); 525e107e82eSAnatoly Burakov return -1; 526e107e82eSAnatoly Burakov } 527e107e82eSAnatoly Burakov break; 528e107e82eSAnatoly Burakov 529e107e82eSAnatoly Burakov /* nqueue */ 530e107e82eSAnatoly Burakov case 'q': 531e107e82eSAnatoly Burakov rx_queue_per_lcore = parse_nqueue(optarg); 532e107e82eSAnatoly Burakov if (rx_queue_per_lcore < 0) { 533e107e82eSAnatoly Burakov printf("invalid queue number\n"); 534e107e82eSAnatoly Burakov print_usage(prgname); 535e107e82eSAnatoly Burakov return -1; 536e107e82eSAnatoly Burakov } 537e107e82eSAnatoly Burakov break; 538e107e82eSAnatoly Burakov 539e107e82eSAnatoly Burakov /* long options */ 540e107e82eSAnatoly Burakov case 0: 541e107e82eSAnatoly Burakov print_usage(prgname); 542e107e82eSAnatoly Burakov return -1; 543e107e82eSAnatoly Burakov 544e107e82eSAnatoly Burakov default: 545e107e82eSAnatoly Burakov print_usage(prgname); 546e107e82eSAnatoly Burakov return -1; 547e107e82eSAnatoly Burakov } 548e107e82eSAnatoly Burakov } 549e107e82eSAnatoly Burakov 550e107e82eSAnatoly Burakov if (enabled_port_mask == 0) { 551e107e82eSAnatoly Burakov printf("portmask not specified\n"); 552e107e82eSAnatoly Burakov print_usage(prgname); 553e107e82eSAnatoly Burakov return -1; 554e107e82eSAnatoly Burakov } 555e107e82eSAnatoly Burakov 556e107e82eSAnatoly Burakov if (optind >= 0) 557e107e82eSAnatoly Burakov argv[optind-1] = prgname; 558e107e82eSAnatoly Burakov 559e107e82eSAnatoly Burakov ret = optind-1; 5609d5ca532SKeith Wiles optind = 1; /* reset getopt lib */ 561e107e82eSAnatoly Burakov return ret; 562e107e82eSAnatoly Burakov } 563e107e82eSAnatoly Burakov 564e107e82eSAnatoly Burakov static void 565e107e82eSAnatoly Burakov print_ethaddr(const char *name, struct ether_addr *eth_addr) 566e107e82eSAnatoly Burakov { 567ec3d82dbSCunming Liang char buf[ETHER_ADDR_FMT_SIZE]; 568ec3d82dbSCunming Liang ether_format_addr(buf, ETHER_ADDR_FMT_SIZE, eth_addr); 569ec3d82dbSCunming Liang printf("%s%s", name, buf); 570e107e82eSAnatoly Burakov } 571e107e82eSAnatoly Burakov 572e107e82eSAnatoly Burakov /* Check the link status of all ports in up to 9s, and print them finally */ 573e107e82eSAnatoly Burakov static void 574f8244c63SZhiyong Yang check_all_ports_link_status(uint16_t port_num, uint32_t port_mask) 575e107e82eSAnatoly Burakov { 576e107e82eSAnatoly Burakov #define CHECK_INTERVAL 100 /* 100ms */ 577e107e82eSAnatoly Burakov #define MAX_CHECK_TIME 90 /* 9s (90 * 100ms) in total */ 578f8244c63SZhiyong Yang uint16_t portid; 579f8244c63SZhiyong Yang uint8_t count, all_ports_up, print_flag = 0; 580e107e82eSAnatoly Burakov struct rte_eth_link link; 581e107e82eSAnatoly Burakov 582e107e82eSAnatoly Burakov printf("\nChecking link status"); 583e107e82eSAnatoly Burakov fflush(stdout); 584e107e82eSAnatoly Burakov for (count = 0; count <= MAX_CHECK_TIME; count++) { 585e107e82eSAnatoly Burakov all_ports_up = 1; 586e107e82eSAnatoly Burakov for (portid = 0; portid < port_num; portid++) { 587e107e82eSAnatoly Burakov if ((port_mask & (1 << portid)) == 0) 588e107e82eSAnatoly Burakov continue; 589e107e82eSAnatoly Burakov memset(&link, 0, sizeof(link)); 590e107e82eSAnatoly Burakov rte_eth_link_get_nowait(portid, &link); 591e107e82eSAnatoly Burakov /* print link status if flag set */ 592e107e82eSAnatoly Burakov if (print_flag == 1) { 593e107e82eSAnatoly Burakov if (link.link_status) 594f8244c63SZhiyong Yang printf( 595f8244c63SZhiyong Yang "Port%d Link Up .Speed %u Mbps - %s\n", 596f8244c63SZhiyong Yang portid, link.link_speed, 597e107e82eSAnatoly Burakov (link.link_duplex == ETH_LINK_FULL_DUPLEX) ? 598e107e82eSAnatoly Burakov ("full-duplex") : ("half-duplex\n")); 599e107e82eSAnatoly Burakov else 600f8244c63SZhiyong Yang printf("Port %d Link Down\n", portid); 601e107e82eSAnatoly Burakov continue; 602e107e82eSAnatoly Burakov } 603e107e82eSAnatoly Burakov /* clear all_ports_up flag if any link down */ 60409419f23SThomas Monjalon if (link.link_status == ETH_LINK_DOWN) { 605e107e82eSAnatoly Burakov all_ports_up = 0; 606e107e82eSAnatoly Burakov break; 607e107e82eSAnatoly Burakov } 608e107e82eSAnatoly Burakov } 609e107e82eSAnatoly Burakov /* after finally printing all link status, get out */ 610e107e82eSAnatoly Burakov if (print_flag == 1) 611e107e82eSAnatoly Burakov break; 612e107e82eSAnatoly Burakov 613e107e82eSAnatoly Burakov if (all_ports_up == 0) { 614e107e82eSAnatoly Burakov printf("."); 615e107e82eSAnatoly Burakov fflush(stdout); 616e107e82eSAnatoly Burakov rte_delay_ms(CHECK_INTERVAL); 617e107e82eSAnatoly Burakov } 618e107e82eSAnatoly Burakov 619e107e82eSAnatoly Burakov /* set the print_flag if all ports up or timeout */ 620e107e82eSAnatoly Burakov if (all_ports_up == 1 || count == (MAX_CHECK_TIME - 1)) { 621e107e82eSAnatoly Burakov print_flag = 1; 62274de12b7SAnatoly Burakov printf("\ndone\n"); 623e107e82eSAnatoly Burakov } 624e107e82eSAnatoly Burakov } 625e107e82eSAnatoly Burakov } 626e107e82eSAnatoly Burakov 627201d52bcSWei Dai /* Check L3 packet type detection capablity of the NIC port */ 628201d52bcSWei Dai static int 629201d52bcSWei Dai check_ptype(int portid) 630201d52bcSWei Dai { 631201d52bcSWei Dai int i, ret; 632201d52bcSWei Dai int ptype_l3_ipv4 = 0, ptype_l3_ipv6 = 0; 633201d52bcSWei Dai uint32_t ptype_mask = RTE_PTYPE_L3_MASK; 634201d52bcSWei Dai 635201d52bcSWei Dai ret = rte_eth_dev_get_supported_ptypes(portid, ptype_mask, NULL, 0); 636201d52bcSWei Dai if (ret <= 0) 637201d52bcSWei Dai return 0; 638201d52bcSWei Dai 639201d52bcSWei Dai uint32_t ptypes[ret]; 640201d52bcSWei Dai 641201d52bcSWei Dai ret = rte_eth_dev_get_supported_ptypes(portid, ptype_mask, ptypes, ret); 642201d52bcSWei Dai for (i = 0; i < ret; ++i) { 643201d52bcSWei Dai if (ptypes[i] & RTE_PTYPE_L3_IPV4) 644201d52bcSWei Dai ptype_l3_ipv4 = 1; 645201d52bcSWei Dai if (ptypes[i] & RTE_PTYPE_L3_IPV6) 646201d52bcSWei Dai ptype_l3_ipv6 = 1; 647201d52bcSWei Dai } 648201d52bcSWei Dai 649201d52bcSWei Dai if (ptype_l3_ipv4 == 0) 650201d52bcSWei Dai printf("port %d cannot parse RTE_PTYPE_L3_IPV4\n", portid); 651201d52bcSWei Dai 652201d52bcSWei Dai if (ptype_l3_ipv6 == 0) 653201d52bcSWei Dai printf("port %d cannot parse RTE_PTYPE_L3_IPV6\n", portid); 654201d52bcSWei Dai 655201d52bcSWei Dai if (ptype_l3_ipv4 && ptype_l3_ipv6) 656201d52bcSWei Dai return 1; 657201d52bcSWei Dai 658201d52bcSWei Dai return 0; 659201d52bcSWei Dai 660201d52bcSWei Dai } 661201d52bcSWei Dai 662201d52bcSWei Dai /* Parse packet type of a packet by SW */ 663201d52bcSWei Dai static inline void 664201d52bcSWei Dai parse_ptype(struct rte_mbuf *m) 665201d52bcSWei Dai { 666201d52bcSWei Dai struct ether_hdr *eth_hdr; 667201d52bcSWei Dai uint32_t packet_type = RTE_PTYPE_UNKNOWN; 668201d52bcSWei Dai uint16_t ether_type; 669201d52bcSWei Dai 670201d52bcSWei Dai eth_hdr = rte_pktmbuf_mtod(m, struct ether_hdr *); 671201d52bcSWei Dai ether_type = eth_hdr->ether_type; 672201d52bcSWei Dai if (ether_type == rte_cpu_to_be_16(ETHER_TYPE_IPv4)) 673201d52bcSWei Dai packet_type |= RTE_PTYPE_L3_IPV4_EXT_UNKNOWN; 674201d52bcSWei Dai else if (ether_type == rte_cpu_to_be_16(ETHER_TYPE_IPv6)) 675201d52bcSWei Dai packet_type |= RTE_PTYPE_L3_IPV6_EXT_UNKNOWN; 676201d52bcSWei Dai 677201d52bcSWei Dai m->packet_type = packet_type; 678201d52bcSWei Dai } 679201d52bcSWei Dai 680201d52bcSWei Dai /* callback function to detect packet type for a queue of a port */ 681201d52bcSWei Dai static uint16_t 682f8244c63SZhiyong Yang cb_parse_ptype(uint16_t port __rte_unused, uint16_t queue __rte_unused, 683201d52bcSWei Dai struct rte_mbuf *pkts[], uint16_t nb_pkts, 684201d52bcSWei Dai uint16_t max_pkts __rte_unused, 685201d52bcSWei Dai void *user_param __rte_unused) 686201d52bcSWei Dai { 687201d52bcSWei Dai uint16_t i; 688201d52bcSWei Dai 689201d52bcSWei Dai for (i = 0; i < nb_pkts; ++i) 690201d52bcSWei Dai parse_ptype(pkts[i]); 691201d52bcSWei Dai 692201d52bcSWei Dai return nb_pkts; 693201d52bcSWei Dai } 694201d52bcSWei Dai 69574de12b7SAnatoly Burakov static int 69674de12b7SAnatoly Burakov init_routing_table(void) 69774de12b7SAnatoly Burakov { 69874de12b7SAnatoly Burakov struct rte_lpm *lpm; 69974de12b7SAnatoly Burakov struct rte_lpm6 *lpm6; 70074de12b7SAnatoly Burakov int socket, ret; 70174de12b7SAnatoly Burakov unsigned i; 70274de12b7SAnatoly Burakov 70374de12b7SAnatoly Burakov for (socket = 0; socket < RTE_MAX_NUMA_NODES; socket++) { 70474de12b7SAnatoly Burakov if (socket_lpm[socket]) { 70574de12b7SAnatoly Burakov lpm = socket_lpm[socket]; 70674de12b7SAnatoly Burakov /* populate the LPM table */ 70774de12b7SAnatoly Burakov for (i = 0; i < RTE_DIM(l3fwd_ipv4_route_array); i++) { 70874de12b7SAnatoly Burakov ret = rte_lpm_add(lpm, 70974de12b7SAnatoly Burakov l3fwd_ipv4_route_array[i].ip, 71074de12b7SAnatoly Burakov l3fwd_ipv4_route_array[i].depth, 71174de12b7SAnatoly Burakov l3fwd_ipv4_route_array[i].if_out); 71274de12b7SAnatoly Burakov 71374de12b7SAnatoly Burakov if (ret < 0) { 71474de12b7SAnatoly Burakov RTE_LOG(ERR, IP_FRAG, "Unable to add entry %i to the l3fwd " 71574de12b7SAnatoly Burakov "LPM table\n", i); 71674de12b7SAnatoly Burakov return -1; 71774de12b7SAnatoly Burakov } 71874de12b7SAnatoly Burakov 71974de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "Socket %i: adding route " IPv4_BYTES_FMT 72074de12b7SAnatoly Burakov "/%d (port %d)\n", 72174de12b7SAnatoly Burakov socket, 72274de12b7SAnatoly Burakov IPv4_BYTES(l3fwd_ipv4_route_array[i].ip), 72374de12b7SAnatoly Burakov l3fwd_ipv4_route_array[i].depth, 72474de12b7SAnatoly Burakov l3fwd_ipv4_route_array[i].if_out); 72574de12b7SAnatoly Burakov } 72674de12b7SAnatoly Burakov } 72774de12b7SAnatoly Burakov 72874de12b7SAnatoly Burakov if (socket_lpm6[socket]) { 72974de12b7SAnatoly Burakov lpm6 = socket_lpm6[socket]; 73074de12b7SAnatoly Burakov /* populate the LPM6 table */ 73174de12b7SAnatoly Burakov for (i = 0; i < RTE_DIM(l3fwd_ipv6_route_array); i++) { 73274de12b7SAnatoly Burakov ret = rte_lpm6_add(lpm6, 73374de12b7SAnatoly Burakov l3fwd_ipv6_route_array[i].ip, 73474de12b7SAnatoly Burakov l3fwd_ipv6_route_array[i].depth, 73574de12b7SAnatoly Burakov l3fwd_ipv6_route_array[i].if_out); 73674de12b7SAnatoly Burakov 73774de12b7SAnatoly Burakov if (ret < 0) { 73874de12b7SAnatoly Burakov RTE_LOG(ERR, IP_FRAG, "Unable to add entry %i to the l3fwd " 73974de12b7SAnatoly Burakov "LPM6 table\n", i); 74074de12b7SAnatoly Burakov return -1; 74174de12b7SAnatoly Burakov } 74274de12b7SAnatoly Burakov 74374de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "Socket %i: adding route " IPv6_BYTES_FMT 74474de12b7SAnatoly Burakov "/%d (port %d)\n", 74574de12b7SAnatoly Burakov socket, 74674de12b7SAnatoly Burakov IPv6_BYTES(l3fwd_ipv6_route_array[i].ip), 74774de12b7SAnatoly Burakov l3fwd_ipv6_route_array[i].depth, 74874de12b7SAnatoly Burakov l3fwd_ipv6_route_array[i].if_out); 74974de12b7SAnatoly Burakov } 75074de12b7SAnatoly Burakov } 75174de12b7SAnatoly Burakov } 75274de12b7SAnatoly Burakov return 0; 75374de12b7SAnatoly Burakov } 75474de12b7SAnatoly Burakov 75574de12b7SAnatoly Burakov static int 75674de12b7SAnatoly Burakov init_mem(void) 75774de12b7SAnatoly Burakov { 75874de12b7SAnatoly Burakov char buf[PATH_MAX]; 75974de12b7SAnatoly Burakov struct rte_mempool *mp; 76074de12b7SAnatoly Burakov struct rte_lpm *lpm; 76174de12b7SAnatoly Burakov struct rte_lpm6 *lpm6; 762f1f72618SMichal Kobylinski struct rte_lpm_config lpm_config; 76374de12b7SAnatoly Burakov int socket; 76474de12b7SAnatoly Burakov unsigned lcore_id; 76574de12b7SAnatoly Burakov 76674de12b7SAnatoly Burakov /* traverse through lcores and initialize structures on each socket */ 76774de12b7SAnatoly Burakov 76874de12b7SAnatoly Burakov for (lcore_id = 0; lcore_id < RTE_MAX_LCORE; lcore_id++) { 76974de12b7SAnatoly Burakov 77074de12b7SAnatoly Burakov if (rte_lcore_is_enabled(lcore_id) == 0) 77174de12b7SAnatoly Burakov continue; 77274de12b7SAnatoly Burakov 77374de12b7SAnatoly Burakov socket = rte_lcore_to_socket_id(lcore_id); 77474de12b7SAnatoly Burakov 77574de12b7SAnatoly Burakov if (socket == SOCKET_ID_ANY) 77674de12b7SAnatoly Burakov socket = 0; 77774de12b7SAnatoly Burakov 77874de12b7SAnatoly Burakov if (socket_direct_pool[socket] == NULL) { 77974de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "Creating direct mempool on socket %i\n", 78074de12b7SAnatoly Burakov socket); 7816f41fe75SStephen Hemminger snprintf(buf, sizeof(buf), "pool_direct_%i", socket); 78274de12b7SAnatoly Burakov 783ea0c20eaSOlivier Matz mp = rte_pktmbuf_pool_create(buf, NB_MBUF, 32, 784824cb29cSKonstantin Ananyev 0, RTE_MBUF_DEFAULT_BUF_SIZE, socket); 78574de12b7SAnatoly Burakov if (mp == NULL) { 78674de12b7SAnatoly Burakov RTE_LOG(ERR, IP_FRAG, "Cannot create direct mempool\n"); 78774de12b7SAnatoly Burakov return -1; 78874de12b7SAnatoly Burakov } 78974de12b7SAnatoly Burakov socket_direct_pool[socket] = mp; 79074de12b7SAnatoly Burakov } 79174de12b7SAnatoly Burakov 79274de12b7SAnatoly Burakov if (socket_indirect_pool[socket] == NULL) { 79374de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "Creating indirect mempool on socket %i\n", 79474de12b7SAnatoly Burakov socket); 7956f41fe75SStephen Hemminger snprintf(buf, sizeof(buf), "pool_indirect_%i", socket); 79674de12b7SAnatoly Burakov 797ea0c20eaSOlivier Matz mp = rte_pktmbuf_pool_create(buf, NB_MBUF, 32, 0, 0, 798ea0c20eaSOlivier Matz socket); 79974de12b7SAnatoly Burakov if (mp == NULL) { 80074de12b7SAnatoly Burakov RTE_LOG(ERR, IP_FRAG, "Cannot create indirect mempool\n"); 80174de12b7SAnatoly Burakov return -1; 80274de12b7SAnatoly Burakov } 80374de12b7SAnatoly Burakov socket_indirect_pool[socket] = mp; 80474de12b7SAnatoly Burakov } 80574de12b7SAnatoly Burakov 80674de12b7SAnatoly Burakov if (socket_lpm[socket] == NULL) { 80774de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "Creating LPM table on socket %i\n", socket); 8086f41fe75SStephen Hemminger snprintf(buf, sizeof(buf), "IP_FRAG_LPM_%i", socket); 80974de12b7SAnatoly Burakov 810f1f72618SMichal Kobylinski lpm_config.max_rules = LPM_MAX_RULES; 811f1f72618SMichal Kobylinski lpm_config.number_tbl8s = 256; 812f1f72618SMichal Kobylinski lpm_config.flags = 0; 813f1f72618SMichal Kobylinski 814f1f72618SMichal Kobylinski lpm = rte_lpm_create(buf, socket, &lpm_config); 81574de12b7SAnatoly Burakov if (lpm == NULL) { 81674de12b7SAnatoly Burakov RTE_LOG(ERR, IP_FRAG, "Cannot create LPM table\n"); 81774de12b7SAnatoly Burakov return -1; 81874de12b7SAnatoly Burakov } 81974de12b7SAnatoly Burakov socket_lpm[socket] = lpm; 82074de12b7SAnatoly Burakov } 82174de12b7SAnatoly Burakov 82274de12b7SAnatoly Burakov if (socket_lpm6[socket] == NULL) { 82374de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "Creating LPM6 table on socket %i\n", socket); 8246f41fe75SStephen Hemminger snprintf(buf, sizeof(buf), "IP_FRAG_LPM_%i", socket); 82574de12b7SAnatoly Burakov 826d1082cdeSOlivier Matz lpm6 = rte_lpm6_create(buf, socket, &lpm6_config); 82774de12b7SAnatoly Burakov if (lpm6 == NULL) { 82874de12b7SAnatoly Burakov RTE_LOG(ERR, IP_FRAG, "Cannot create LPM table\n"); 82974de12b7SAnatoly Burakov return -1; 83074de12b7SAnatoly Burakov } 83174de12b7SAnatoly Burakov socket_lpm6[socket] = lpm6; 83274de12b7SAnatoly Burakov } 83374de12b7SAnatoly Burakov } 83474de12b7SAnatoly Burakov 83574de12b7SAnatoly Burakov return 0; 83674de12b7SAnatoly Burakov } 83774de12b7SAnatoly Burakov 838e107e82eSAnatoly Burakov int 83998a16481SDavid Marchand main(int argc, char **argv) 840e107e82eSAnatoly Burakov { 841e107e82eSAnatoly Burakov struct lcore_queue_conf *qconf; 84281f7ecd9SPablo de Lara struct rte_eth_dev_info dev_info; 84381f7ecd9SPablo de Lara struct rte_eth_txconf *txconf; 84474de12b7SAnatoly Burakov struct rx_queue *rxq; 84574de12b7SAnatoly Burakov int socket, ret; 84674de12b7SAnatoly Burakov unsigned nb_ports; 847e107e82eSAnatoly Burakov uint16_t queueid = 0; 848e107e82eSAnatoly Burakov unsigned lcore_id = 0, rx_lcore_id = 0; 849e107e82eSAnatoly Burakov uint32_t n_tx_queue, nb_lcores; 850f8244c63SZhiyong Yang uint16_t portid; 851e107e82eSAnatoly Burakov 852e107e82eSAnatoly Burakov /* init EAL */ 853e107e82eSAnatoly Burakov ret = rte_eal_init(argc, argv); 854e107e82eSAnatoly Burakov if (ret < 0) 855e107e82eSAnatoly Burakov rte_exit(EXIT_FAILURE, "rte_eal_init failed"); 856e107e82eSAnatoly Burakov argc -= ret; 857e107e82eSAnatoly Burakov argv += ret; 858e107e82eSAnatoly Burakov 859e107e82eSAnatoly Burakov /* parse application arguments (after the EAL ones) */ 860e107e82eSAnatoly Burakov ret = parse_args(argc, argv); 861e107e82eSAnatoly Burakov if (ret < 0) 862e107e82eSAnatoly Burakov rte_exit(EXIT_FAILURE, "Invalid arguments"); 863e107e82eSAnatoly Burakov 864e107e82eSAnatoly Burakov nb_ports = rte_eth_dev_count(); 865b4e0f64fSMauricio Vasquez B if (nb_ports == 0) 86674de12b7SAnatoly Burakov rte_exit(EXIT_FAILURE, "No ports found!\n"); 867e107e82eSAnatoly Burakov 868e107e82eSAnatoly Burakov nb_lcores = rte_lcore_count(); 869e107e82eSAnatoly Burakov 87074de12b7SAnatoly Burakov /* initialize structures (mempools, lpm etc.) */ 87174de12b7SAnatoly Burakov if (init_mem() < 0) 87274de12b7SAnatoly Burakov rte_panic("Cannot initialize memory structures!\n"); 87374de12b7SAnatoly Burakov 874eaa8d3bfSAnatoly Burakov /* check if portmask has non-existent ports */ 875eaa8d3bfSAnatoly Burakov if (enabled_port_mask & ~(RTE_LEN2MASK(nb_ports, unsigned))) 876eaa8d3bfSAnatoly Burakov rte_exit(EXIT_FAILURE, "Non-existent ports in portmask!\n"); 877eaa8d3bfSAnatoly Burakov 878e107e82eSAnatoly Burakov /* initialize all ports */ 879e107e82eSAnatoly Burakov for (portid = 0; portid < nb_ports; portid++) { 880fdb9eff6SShahaf Shuler struct rte_eth_conf local_port_conf = port_conf; 881fdb9eff6SShahaf Shuler struct rte_eth_rxconf rxq_conf; 882fdb9eff6SShahaf Shuler 883e107e82eSAnatoly Burakov /* skip ports that are not enabled */ 884e107e82eSAnatoly Burakov if ((enabled_port_mask & (1 << portid)) == 0) { 885e107e82eSAnatoly Burakov printf("Skipping disabled port %d\n", portid); 886e107e82eSAnatoly Burakov continue; 887e107e82eSAnatoly Burakov } 888e107e82eSAnatoly Burakov 889e107e82eSAnatoly Burakov qconf = &lcore_queue_conf[rx_lcore_id]; 890e107e82eSAnatoly Burakov 8915e470a66SAndriy Berestovskyy /* limit the frame size to the maximum supported by NIC */ 8925e470a66SAndriy Berestovskyy rte_eth_dev_info_get(portid, &dev_info); 893fdb9eff6SShahaf Shuler local_port_conf.rxmode.max_rx_pkt_len = RTE_MIN( 894fdb9eff6SShahaf Shuler dev_info.max_rx_pktlen, 895fdb9eff6SShahaf Shuler local_port_conf.rxmode.max_rx_pkt_len); 8965e470a66SAndriy Berestovskyy 897e107e82eSAnatoly Burakov /* get the lcore_id for this port */ 898e107e82eSAnatoly Burakov while (rte_lcore_is_enabled(rx_lcore_id) == 0 || 899e107e82eSAnatoly Burakov qconf->n_rx_queue == (unsigned)rx_queue_per_lcore) { 900e107e82eSAnatoly Burakov 901e107e82eSAnatoly Burakov rx_lcore_id ++; 902e107e82eSAnatoly Burakov if (rx_lcore_id >= RTE_MAX_LCORE) 903e107e82eSAnatoly Burakov rte_exit(EXIT_FAILURE, "Not enough cores\n"); 904e107e82eSAnatoly Burakov 905e107e82eSAnatoly Burakov qconf = &lcore_queue_conf[rx_lcore_id]; 906e107e82eSAnatoly Burakov } 90774de12b7SAnatoly Burakov 908324bcf45SAnatoly Burakov socket = (int) rte_lcore_to_socket_id(rx_lcore_id); 90974de12b7SAnatoly Burakov if (socket == SOCKET_ID_ANY) 91074de12b7SAnatoly Burakov socket = 0; 91174de12b7SAnatoly Burakov 91274de12b7SAnatoly Burakov rxq = &qconf->rx_queue_list[qconf->n_rx_queue]; 91374de12b7SAnatoly Burakov rxq->portid = portid; 91474de12b7SAnatoly Burakov rxq->direct_pool = socket_direct_pool[socket]; 91574de12b7SAnatoly Burakov rxq->indirect_pool = socket_indirect_pool[socket]; 91674de12b7SAnatoly Burakov rxq->lpm = socket_lpm[socket]; 91774de12b7SAnatoly Burakov rxq->lpm6 = socket_lpm6[socket]; 918e107e82eSAnatoly Burakov qconf->n_rx_queue++; 919e107e82eSAnatoly Burakov 920e107e82eSAnatoly Burakov /* init port */ 921e107e82eSAnatoly Burakov printf("Initializing port %d on lcore %u...", portid, 922e107e82eSAnatoly Burakov rx_lcore_id); 923e107e82eSAnatoly Burakov fflush(stdout); 924e107e82eSAnatoly Burakov 925e107e82eSAnatoly Burakov n_tx_queue = nb_lcores; 926e107e82eSAnatoly Burakov if (n_tx_queue > MAX_TX_QUEUE_PER_PORT) 927e107e82eSAnatoly Burakov n_tx_queue = MAX_TX_QUEUE_PER_PORT; 928fdb9eff6SShahaf Shuler if (dev_info.tx_offload_capa & DEV_TX_OFFLOAD_MBUF_FAST_FREE) 929fdb9eff6SShahaf Shuler local_port_conf.txmode.offloads |= 930fdb9eff6SShahaf Shuler DEV_TX_OFFLOAD_MBUF_FAST_FREE; 931e107e82eSAnatoly Burakov ret = rte_eth_dev_configure(portid, 1, (uint16_t)n_tx_queue, 932fdb9eff6SShahaf Shuler &local_port_conf); 93374de12b7SAnatoly Burakov if (ret < 0) { 93474de12b7SAnatoly Burakov printf("\n"); 935e107e82eSAnatoly Burakov rte_exit(EXIT_FAILURE, "Cannot configure device: " 936e107e82eSAnatoly Burakov "err=%d, port=%d\n", 937e107e82eSAnatoly Burakov ret, portid); 93874de12b7SAnatoly Burakov } 93974de12b7SAnatoly Burakov 94060efb44fSRoman Zhukov ret = rte_eth_dev_adjust_nb_rx_tx_desc(portid, &nb_rxd, 94160efb44fSRoman Zhukov &nb_txd); 94260efb44fSRoman Zhukov if (ret < 0) { 94360efb44fSRoman Zhukov printf("\n"); 94460efb44fSRoman Zhukov rte_exit(EXIT_FAILURE, "Cannot adjust number of " 94560efb44fSRoman Zhukov "descriptors: err=%d, port=%d\n", ret, portid); 94660efb44fSRoman Zhukov } 94760efb44fSRoman Zhukov 94874de12b7SAnatoly Burakov /* init one RX queue */ 949fdb9eff6SShahaf Shuler rxq_conf = dev_info.default_rxconf; 950fdb9eff6SShahaf Shuler rxq_conf.offloads = local_port_conf.rxmode.offloads; 95174de12b7SAnatoly Burakov ret = rte_eth_rx_queue_setup(portid, 0, nb_rxd, 952fdb9eff6SShahaf Shuler socket, &rxq_conf, 95374de12b7SAnatoly Burakov socket_direct_pool[socket]); 95474de12b7SAnatoly Burakov if (ret < 0) { 95574de12b7SAnatoly Burakov printf("\n"); 95674de12b7SAnatoly Burakov rte_exit(EXIT_FAILURE, "rte_eth_rx_queue_setup: " 95774de12b7SAnatoly Burakov "err=%d, port=%d\n", 95874de12b7SAnatoly Burakov ret, portid); 95974de12b7SAnatoly Burakov } 960e107e82eSAnatoly Burakov 961e107e82eSAnatoly Burakov rte_eth_macaddr_get(portid, &ports_eth_addr[portid]); 962e107e82eSAnatoly Burakov print_ethaddr(" Address:", &ports_eth_addr[portid]); 96374de12b7SAnatoly Burakov printf("\n"); 964e107e82eSAnatoly Burakov 965e107e82eSAnatoly Burakov /* init one TX queue per couple (lcore,port) */ 966e107e82eSAnatoly Burakov queueid = 0; 967e107e82eSAnatoly Burakov for (lcore_id = 0; lcore_id < RTE_MAX_LCORE; lcore_id++) { 968e107e82eSAnatoly Burakov if (rte_lcore_is_enabled(lcore_id) == 0) 969e107e82eSAnatoly Burakov continue; 97074de12b7SAnatoly Burakov 97174de12b7SAnatoly Burakov socket = (int) rte_lcore_to_socket_id(lcore_id); 972e107e82eSAnatoly Burakov printf("txq=%u,%d ", lcore_id, queueid); 973e107e82eSAnatoly Burakov fflush(stdout); 97481f7ecd9SPablo de Lara 97581f7ecd9SPablo de Lara txconf = &dev_info.default_txconf; 976fdb9eff6SShahaf Shuler txconf->txq_flags = ETH_TXQ_FLAGS_IGNORE; 977fdb9eff6SShahaf Shuler txconf->offloads = local_port_conf.txmode.offloads; 978e107e82eSAnatoly Burakov ret = rte_eth_tx_queue_setup(portid, queueid, nb_txd, 97981f7ecd9SPablo de Lara socket, txconf); 98074de12b7SAnatoly Burakov if (ret < 0) { 98174de12b7SAnatoly Burakov printf("\n"); 982e107e82eSAnatoly Burakov rte_exit(EXIT_FAILURE, "rte_eth_tx_queue_setup: " 983e107e82eSAnatoly Burakov "err=%d, port=%d\n", ret, portid); 98474de12b7SAnatoly Burakov } 985e107e82eSAnatoly Burakov 986e107e82eSAnatoly Burakov qconf = &lcore_queue_conf[lcore_id]; 987e107e82eSAnatoly Burakov qconf->tx_queue_id[portid] = queueid; 988e107e82eSAnatoly Burakov queueid++; 989e107e82eSAnatoly Burakov } 990e107e82eSAnatoly Burakov 99174de12b7SAnatoly Burakov printf("\n"); 99274de12b7SAnatoly Burakov } 99374de12b7SAnatoly Burakov 99474de12b7SAnatoly Burakov printf("\n"); 99574de12b7SAnatoly Burakov 99674de12b7SAnatoly Burakov /* start ports */ 99774de12b7SAnatoly Burakov for (portid = 0; portid < nb_ports; portid++) { 99874de12b7SAnatoly Burakov if ((enabled_port_mask & (1 << portid)) == 0) { 99974de12b7SAnatoly Burakov continue; 100074de12b7SAnatoly Burakov } 1001e107e82eSAnatoly Burakov /* Start device */ 1002e107e82eSAnatoly Burakov ret = rte_eth_dev_start(portid); 1003e107e82eSAnatoly Burakov if (ret < 0) 100474de12b7SAnatoly Burakov rte_exit(EXIT_FAILURE, "rte_eth_dev_start: err=%d, port=%d\n", 1005e107e82eSAnatoly Burakov ret, portid); 1006e107e82eSAnatoly Burakov 1007e107e82eSAnatoly Burakov rte_eth_promiscuous_enable(portid); 1008201d52bcSWei Dai 1009201d52bcSWei Dai if (check_ptype(portid) == 0) { 1010201d52bcSWei Dai rte_eth_add_rx_callback(portid, 0, cb_parse_ptype, NULL); 101198a7ea33SJerin Jacob printf("Add Rx callback function to detect L3 packet type by SW :" 1012201d52bcSWei Dai " port = %d\n", portid); 1013201d52bcSWei Dai } 1014e107e82eSAnatoly Burakov } 1015e107e82eSAnatoly Burakov 101674de12b7SAnatoly Burakov if (init_routing_table() < 0) 101774de12b7SAnatoly Burakov rte_exit(EXIT_FAILURE, "Cannot init routing table\n"); 101874de12b7SAnatoly Burakov 1019f8244c63SZhiyong Yang check_all_ports_link_status(nb_ports, enabled_port_mask); 1020e107e82eSAnatoly Burakov 1021e107e82eSAnatoly Burakov /* launch per-lcore init on every lcore */ 1022e107e82eSAnatoly Burakov rte_eal_mp_remote_launch(main_loop, NULL, CALL_MASTER); 1023e107e82eSAnatoly Burakov RTE_LCORE_FOREACH_SLAVE(lcore_id) { 1024e107e82eSAnatoly Burakov if (rte_eal_wait_lcore(lcore_id) < 0) 1025e107e82eSAnatoly Burakov return -1; 1026e107e82eSAnatoly Burakov } 1027e107e82eSAnatoly Burakov 1028e107e82eSAnatoly Burakov return 0; 1029e107e82eSAnatoly Burakov } 1030