13998e2a0SBruce Richardson /* SPDX-License-Identifier: BSD-3-Clause 23998e2a0SBruce Richardson * Copyright(c) 2010-2014 Intel Corporation 3e107e82eSAnatoly Burakov */ 4e107e82eSAnatoly Burakov 5e107e82eSAnatoly Burakov #include <stdio.h> 6e107e82eSAnatoly Burakov #include <stdlib.h> 7e107e82eSAnatoly Burakov #include <stdint.h> 8e107e82eSAnatoly Burakov #include <inttypes.h> 9e107e82eSAnatoly Burakov #include <sys/types.h> 10e107e82eSAnatoly Burakov #include <sys/param.h> 11e107e82eSAnatoly Burakov #include <string.h> 12e107e82eSAnatoly Burakov #include <sys/queue.h> 13e107e82eSAnatoly Burakov #include <stdarg.h> 14e107e82eSAnatoly Burakov #include <errno.h> 15e107e82eSAnatoly Burakov #include <getopt.h> 16e107e82eSAnatoly Burakov 17e107e82eSAnatoly Burakov #include <rte_common.h> 18e107e82eSAnatoly Burakov #include <rte_byteorder.h> 19e107e82eSAnatoly Burakov #include <rte_log.h> 20e107e82eSAnatoly Burakov #include <rte_memory.h> 21e107e82eSAnatoly Burakov #include <rte_memcpy.h> 22e107e82eSAnatoly Burakov #include <rte_eal.h> 23e107e82eSAnatoly Burakov #include <rte_launch.h> 24e107e82eSAnatoly Burakov #include <rte_atomic.h> 25e107e82eSAnatoly Burakov #include <rte_cycles.h> 26e107e82eSAnatoly Burakov #include <rte_prefetch.h> 27e107e82eSAnatoly Burakov #include <rte_lcore.h> 28e107e82eSAnatoly Burakov #include <rte_per_lcore.h> 29e107e82eSAnatoly Burakov #include <rte_branch_prediction.h> 30e107e82eSAnatoly Burakov #include <rte_interrupts.h> 31e107e82eSAnatoly Burakov #include <rte_random.h> 32e107e82eSAnatoly Burakov #include <rte_debug.h> 33e107e82eSAnatoly Burakov #include <rte_ether.h> 34e107e82eSAnatoly Burakov #include <rte_ethdev.h> 35e107e82eSAnatoly Burakov #include <rte_mempool.h> 36e107e82eSAnatoly Burakov #include <rte_mbuf.h> 37e107e82eSAnatoly Burakov #include <rte_lpm.h> 3874de12b7SAnatoly Burakov #include <rte_lpm6.h> 39e107e82eSAnatoly Burakov #include <rte_ip.h> 4074de12b7SAnatoly Burakov #include <rte_string_fns.h> 41e107e82eSAnatoly Burakov 4274de12b7SAnatoly Burakov #include <rte_ip_frag.h> 4374de12b7SAnatoly Burakov 4474de12b7SAnatoly Burakov #define RTE_LOGTYPE_IP_FRAG RTE_LOGTYPE_USER1 45e107e82eSAnatoly Burakov 46e107e82eSAnatoly Burakov /* allow max jumbo frame 9.5 KB */ 47e107e82eSAnatoly Burakov #define JUMBO_FRAME_MAX_SIZE 0x2600 48e107e82eSAnatoly Burakov 49e107e82eSAnatoly Burakov #define ROUNDUP_DIV(a, b) (((a) + (b) - 1) / (b)) 50e107e82eSAnatoly Burakov 51e107e82eSAnatoly Burakov /* 5274de12b7SAnatoly Burakov * Default byte size for the IPv6 Maximum Transfer Unit (MTU). 5374de12b7SAnatoly Burakov * This value includes the size of IPv6 header. 54e107e82eSAnatoly Burakov */ 5574de12b7SAnatoly Burakov #define IPV4_MTU_DEFAULT ETHER_MTU 5674de12b7SAnatoly Burakov #define IPV6_MTU_DEFAULT ETHER_MTU 5774de12b7SAnatoly Burakov 5874de12b7SAnatoly Burakov /* 5974de12b7SAnatoly Burakov * Default payload in bytes for the IPv6 packet. 6074de12b7SAnatoly Burakov */ 6174de12b7SAnatoly Burakov #define IPV4_DEFAULT_PAYLOAD (IPV4_MTU_DEFAULT - sizeof(struct ipv4_hdr)) 6274de12b7SAnatoly Burakov #define IPV6_DEFAULT_PAYLOAD (IPV6_MTU_DEFAULT - sizeof(struct ipv6_hdr)) 6374de12b7SAnatoly Burakov 6474de12b7SAnatoly Burakov /* 6574de12b7SAnatoly Burakov * Max number of fragments per packet expected - defined by config file. 6674de12b7SAnatoly Burakov */ 6774de12b7SAnatoly Burakov #define MAX_PACKET_FRAG RTE_LIBRTE_IP_FRAG_MAX_FRAG 68e107e82eSAnatoly Burakov 69e107e82eSAnatoly Burakov #define NB_MBUF 8192 70e107e82eSAnatoly Burakov 71e107e82eSAnatoly Burakov #define MAX_PKT_BURST 32 72e107e82eSAnatoly Burakov #define BURST_TX_DRAIN_US 100 /* TX drain every ~100us */ 73e107e82eSAnatoly Burakov 74e107e82eSAnatoly Burakov /* Configure how many packets ahead to prefetch, when reading packets */ 75e107e82eSAnatoly Burakov #define PREFETCH_OFFSET 3 76e107e82eSAnatoly Burakov 77e107e82eSAnatoly Burakov /* 78e107e82eSAnatoly Burakov * Configurable number of RX/TX ring descriptors 79e107e82eSAnatoly Burakov */ 80867a6c66SKevin Laatz #define RTE_TEST_RX_DESC_DEFAULT 1024 81867a6c66SKevin Laatz #define RTE_TEST_TX_DESC_DEFAULT 1024 82e107e82eSAnatoly Burakov static uint16_t nb_rxd = RTE_TEST_RX_DESC_DEFAULT; 83e107e82eSAnatoly Burakov static uint16_t nb_txd = RTE_TEST_TX_DESC_DEFAULT; 84e107e82eSAnatoly Burakov 85e107e82eSAnatoly Burakov /* ethernet addresses of ports */ 86e107e82eSAnatoly Burakov static struct ether_addr ports_eth_addr[RTE_MAX_ETHPORTS]; 8774de12b7SAnatoly Burakov 8874de12b7SAnatoly Burakov #ifndef IPv4_BYTES 8974de12b7SAnatoly Burakov #define IPv4_BYTES_FMT "%" PRIu8 ".%" PRIu8 ".%" PRIu8 ".%" PRIu8 9074de12b7SAnatoly Burakov #define IPv4_BYTES(addr) \ 9174de12b7SAnatoly Burakov (uint8_t) (((addr) >> 24) & 0xFF),\ 9274de12b7SAnatoly Burakov (uint8_t) (((addr) >> 16) & 0xFF),\ 9374de12b7SAnatoly Burakov (uint8_t) (((addr) >> 8) & 0xFF),\ 9474de12b7SAnatoly Burakov (uint8_t) ((addr) & 0xFF) 9574de12b7SAnatoly Burakov #endif 9674de12b7SAnatoly Burakov 9774de12b7SAnatoly Burakov #ifndef IPv6_BYTES 9874de12b7SAnatoly Burakov #define IPv6_BYTES_FMT "%02x%02x:%02x%02x:%02x%02x:%02x%02x:"\ 9974de12b7SAnatoly Burakov "%02x%02x:%02x%02x:%02x%02x:%02x%02x" 10074de12b7SAnatoly Burakov #define IPv6_BYTES(addr) \ 10174de12b7SAnatoly Burakov addr[0], addr[1], addr[2], addr[3], \ 10274de12b7SAnatoly Burakov addr[4], addr[5], addr[6], addr[7], \ 10374de12b7SAnatoly Burakov addr[8], addr[9], addr[10], addr[11],\ 10474de12b7SAnatoly Burakov addr[12], addr[13],addr[14], addr[15] 10574de12b7SAnatoly Burakov #endif 10674de12b7SAnatoly Burakov 10774de12b7SAnatoly Burakov #define IPV6_ADDR_LEN 16 108e107e82eSAnatoly Burakov 109e107e82eSAnatoly Burakov /* mask of enabled ports */ 110e107e82eSAnatoly Burakov static int enabled_port_mask = 0; 111e107e82eSAnatoly Burakov 112e107e82eSAnatoly Burakov static int rx_queue_per_lcore = 1; 113e107e82eSAnatoly Burakov 114e107e82eSAnatoly Burakov #define MBUF_TABLE_SIZE (2 * MAX(MAX_PKT_BURST, MAX_PACKET_FRAG)) 115e107e82eSAnatoly Burakov 116e107e82eSAnatoly Burakov struct mbuf_table { 117e107e82eSAnatoly Burakov uint16_t len; 118e107e82eSAnatoly Burakov struct rte_mbuf *m_table[MBUF_TABLE_SIZE]; 119e107e82eSAnatoly Burakov }; 120e107e82eSAnatoly Burakov 12174de12b7SAnatoly Burakov struct rx_queue { 12274de12b7SAnatoly Burakov struct rte_mempool *direct_pool; 12374de12b7SAnatoly Burakov struct rte_mempool *indirect_pool; 12474de12b7SAnatoly Burakov struct rte_lpm *lpm; 12574de12b7SAnatoly Burakov struct rte_lpm6 *lpm6; 126f8244c63SZhiyong Yang uint16_t portid; 12774de12b7SAnatoly Burakov }; 12874de12b7SAnatoly Burakov 129e107e82eSAnatoly Burakov #define MAX_RX_QUEUE_PER_LCORE 16 130e107e82eSAnatoly Burakov #define MAX_TX_QUEUE_PER_PORT 16 131e107e82eSAnatoly Burakov struct lcore_queue_conf { 132e107e82eSAnatoly Burakov uint16_t n_rx_queue; 133e107e82eSAnatoly Burakov uint16_t tx_queue_id[RTE_MAX_ETHPORTS]; 13474de12b7SAnatoly Burakov struct rx_queue rx_queue_list[MAX_RX_QUEUE_PER_LCORE]; 135e107e82eSAnatoly Burakov struct mbuf_table tx_mbufs[RTE_MAX_ETHPORTS]; 136e107e82eSAnatoly Burakov } __rte_cache_aligned; 137e107e82eSAnatoly Burakov struct lcore_queue_conf lcore_queue_conf[RTE_MAX_LCORE]; 138e107e82eSAnatoly Burakov 1395e470a66SAndriy Berestovskyy static struct rte_eth_conf port_conf = { 140e107e82eSAnatoly Burakov .rxmode = { 141e107e82eSAnatoly Burakov .max_rx_pkt_len = JUMBO_FRAME_MAX_SIZE, 142e107e82eSAnatoly Burakov .split_hdr_size = 0, 143fdb9eff6SShahaf Shuler .offloads = (DEV_RX_OFFLOAD_CHECKSUM | 144*323e7b66SFerruh Yigit DEV_RX_OFFLOAD_JUMBO_FRAME), 145e107e82eSAnatoly Burakov }, 146e107e82eSAnatoly Burakov .txmode = { 147e107e82eSAnatoly Burakov .mq_mode = ETH_MQ_TX_NONE, 148fdb9eff6SShahaf Shuler .offloads = (DEV_TX_OFFLOAD_IPV4_CKSUM | 149fdb9eff6SShahaf Shuler DEV_TX_OFFLOAD_MULTI_SEGS), 150e107e82eSAnatoly Burakov }, 151e107e82eSAnatoly Burakov }; 152e107e82eSAnatoly Burakov 15374de12b7SAnatoly Burakov /* 15474de12b7SAnatoly Burakov * IPv4 forwarding table 15574de12b7SAnatoly Burakov */ 15674de12b7SAnatoly Burakov struct l3fwd_ipv4_route { 157e107e82eSAnatoly Burakov uint32_t ip; 158e107e82eSAnatoly Burakov uint8_t depth; 159e107e82eSAnatoly Burakov uint8_t if_out; 160e107e82eSAnatoly Burakov }; 161e107e82eSAnatoly Burakov 16274de12b7SAnatoly Burakov struct l3fwd_ipv4_route l3fwd_ipv4_route_array[] = { 16374de12b7SAnatoly Burakov {IPv4(100,10,0,0), 16, 0}, 16474de12b7SAnatoly Burakov {IPv4(100,20,0,0), 16, 1}, 16574de12b7SAnatoly Burakov {IPv4(100,30,0,0), 16, 2}, 16674de12b7SAnatoly Burakov {IPv4(100,40,0,0), 16, 3}, 16774de12b7SAnatoly Burakov {IPv4(100,50,0,0), 16, 4}, 16874de12b7SAnatoly Burakov {IPv4(100,60,0,0), 16, 5}, 16974de12b7SAnatoly Burakov {IPv4(100,70,0,0), 16, 6}, 17074de12b7SAnatoly Burakov {IPv4(100,80,0,0), 16, 7}, 171e107e82eSAnatoly Burakov }; 172e107e82eSAnatoly Burakov 17374de12b7SAnatoly Burakov /* 17474de12b7SAnatoly Burakov * IPv6 forwarding table 17574de12b7SAnatoly Burakov */ 176e107e82eSAnatoly Burakov 17774de12b7SAnatoly Burakov struct l3fwd_ipv6_route { 17874de12b7SAnatoly Burakov uint8_t ip[IPV6_ADDR_LEN]; 17974de12b7SAnatoly Burakov uint8_t depth; 18074de12b7SAnatoly Burakov uint8_t if_out; 18174de12b7SAnatoly Burakov }; 182e107e82eSAnatoly Burakov 18374de12b7SAnatoly Burakov static struct l3fwd_ipv6_route l3fwd_ipv6_route_array[] = { 18474de12b7SAnatoly Burakov {{1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 0}, 18574de12b7SAnatoly Burakov {{2,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 1}, 18674de12b7SAnatoly Burakov {{3,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 2}, 18774de12b7SAnatoly Burakov {{4,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 3}, 18874de12b7SAnatoly Burakov {{5,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 4}, 18974de12b7SAnatoly Burakov {{6,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 5}, 19074de12b7SAnatoly Burakov {{7,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 6}, 19174de12b7SAnatoly Burakov {{8,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 7}, 19274de12b7SAnatoly Burakov }; 19374de12b7SAnatoly Burakov 19474de12b7SAnatoly Burakov #define LPM_MAX_RULES 1024 19574de12b7SAnatoly Burakov #define LPM6_MAX_RULES 1024 19674de12b7SAnatoly Burakov #define LPM6_NUMBER_TBL8S (1 << 16) 19774de12b7SAnatoly Burakov 19874de12b7SAnatoly Burakov struct rte_lpm6_config lpm6_config = { 19974de12b7SAnatoly Burakov .max_rules = LPM6_MAX_RULES, 20074de12b7SAnatoly Burakov .number_tbl8s = LPM6_NUMBER_TBL8S, 20174de12b7SAnatoly Burakov .flags = 0 20274de12b7SAnatoly Burakov }; 20374de12b7SAnatoly Burakov 20474de12b7SAnatoly Burakov static struct rte_mempool *socket_direct_pool[RTE_MAX_NUMA_NODES]; 20574de12b7SAnatoly Burakov static struct rte_mempool *socket_indirect_pool[RTE_MAX_NUMA_NODES]; 20674de12b7SAnatoly Burakov static struct rte_lpm *socket_lpm[RTE_MAX_NUMA_NODES]; 20774de12b7SAnatoly Burakov static struct rte_lpm6 *socket_lpm6[RTE_MAX_NUMA_NODES]; 208e107e82eSAnatoly Burakov 209e107e82eSAnatoly Burakov /* Send burst of packets on an output interface */ 210e107e82eSAnatoly Burakov static inline int 211f8244c63SZhiyong Yang send_burst(struct lcore_queue_conf *qconf, uint16_t n, uint16_t port) 212e107e82eSAnatoly Burakov { 213e107e82eSAnatoly Burakov struct rte_mbuf **m_table; 214e107e82eSAnatoly Burakov int ret; 215e107e82eSAnatoly Burakov uint16_t queueid; 216e107e82eSAnatoly Burakov 217e107e82eSAnatoly Burakov queueid = qconf->tx_queue_id[port]; 218e107e82eSAnatoly Burakov m_table = (struct rte_mbuf **)qconf->tx_mbufs[port].m_table; 219e107e82eSAnatoly Burakov 220e107e82eSAnatoly Burakov ret = rte_eth_tx_burst(port, queueid, m_table, n); 221e107e82eSAnatoly Burakov if (unlikely(ret < n)) { 222e107e82eSAnatoly Burakov do { 223e107e82eSAnatoly Burakov rte_pktmbuf_free(m_table[ret]); 224e107e82eSAnatoly Burakov } while (++ret < n); 225e107e82eSAnatoly Burakov } 226e107e82eSAnatoly Burakov 227e107e82eSAnatoly Burakov return 0; 228e107e82eSAnatoly Burakov } 229e107e82eSAnatoly Burakov 230e107e82eSAnatoly Burakov static inline void 23174de12b7SAnatoly Burakov l3fwd_simple_forward(struct rte_mbuf *m, struct lcore_queue_conf *qconf, 232f8244c63SZhiyong Yang uint8_t queueid, uint16_t port_in) 233e107e82eSAnatoly Burakov { 23474de12b7SAnatoly Burakov struct rx_queue *rxq; 235d89a5bceSVladyslav Buslov uint32_t i, len, next_hop; 236f8244c63SZhiyong Yang uint8_t ipv6; 237f8244c63SZhiyong Yang uint16_t port_out; 238e107e82eSAnatoly Burakov int32_t len2; 239e107e82eSAnatoly Burakov 24074de12b7SAnatoly Burakov ipv6 = 0; 24174de12b7SAnatoly Burakov rxq = &qconf->rx_queue_list[queueid]; 24274de12b7SAnatoly Burakov 24374de12b7SAnatoly Burakov /* by default, send everything back to the source port */ 24474de12b7SAnatoly Burakov port_out = port_in; 245e107e82eSAnatoly Burakov 246e107e82eSAnatoly Burakov /* Remove the Ethernet header and trailer from the input packet */ 247e107e82eSAnatoly Burakov rte_pktmbuf_adj(m, (uint16_t)sizeof(struct ether_hdr)); 248e107e82eSAnatoly Burakov 24974de12b7SAnatoly Burakov /* Build transmission burst */ 25074de12b7SAnatoly Burakov len = qconf->tx_mbufs[port_out].len; 25174de12b7SAnatoly Burakov 25274de12b7SAnatoly Burakov /* if this is an IPv4 packet */ 2533c0184ccSHelin Zhang if (RTE_ETH_IS_IPV4_HDR(m->packet_type)) { 25474de12b7SAnatoly Burakov struct ipv4_hdr *ip_hdr; 25574de12b7SAnatoly Burakov uint32_t ip_dst; 256e107e82eSAnatoly Burakov /* Read the lookup key (i.e. ip_dst) from the input packet */ 257e107e82eSAnatoly Burakov ip_hdr = rte_pktmbuf_mtod(m, struct ipv4_hdr *); 258e107e82eSAnatoly Burakov ip_dst = rte_be_to_cpu_32(ip_hdr->dst_addr); 259e107e82eSAnatoly Burakov 260e107e82eSAnatoly Burakov /* Find destination port */ 261d89a5bceSVladyslav Buslov if (rte_lpm_lookup(rxq->lpm, ip_dst, &next_hop) == 0 && 262d89a5bceSVladyslav Buslov (enabled_port_mask & 1 << next_hop) != 0) { 263d89a5bceSVladyslav Buslov port_out = next_hop; 264e107e82eSAnatoly Burakov 26574de12b7SAnatoly Burakov /* Build transmission burst for new port */ 266e107e82eSAnatoly Burakov len = qconf->tx_mbufs[port_out].len; 26774de12b7SAnatoly Burakov } 268e107e82eSAnatoly Burakov 269e107e82eSAnatoly Burakov /* if we don't need to do any fragmentation */ 270ea672a8bSOlivier Matz if (likely (IPV4_MTU_DEFAULT >= m->pkt_len)) { 271e107e82eSAnatoly Burakov qconf->tx_mbufs[port_out].m_table[len] = m; 272e107e82eSAnatoly Burakov len2 = 1; 273e107e82eSAnatoly Burakov } else { 274e107e82eSAnatoly Burakov len2 = rte_ipv4_fragment_packet(m, 275e107e82eSAnatoly Burakov &qconf->tx_mbufs[port_out].m_table[len], 276e107e82eSAnatoly Burakov (uint16_t)(MBUF_TABLE_SIZE - len), 277e107e82eSAnatoly Burakov IPV4_MTU_DEFAULT, 27874de12b7SAnatoly Burakov rxq->direct_pool, rxq->indirect_pool); 279e107e82eSAnatoly Burakov 280e107e82eSAnatoly Burakov /* Free input packet */ 281e107e82eSAnatoly Burakov rte_pktmbuf_free(m); 282e107e82eSAnatoly Burakov 283e107e82eSAnatoly Burakov /* If we fail to fragment the packet */ 284e107e82eSAnatoly Burakov if (unlikely (len2 < 0)) 285e107e82eSAnatoly Burakov return; 286e107e82eSAnatoly Burakov } 2873c0184ccSHelin Zhang } else if (RTE_ETH_IS_IPV6_HDR(m->packet_type)) { 2883c0184ccSHelin Zhang /* if this is an IPv6 packet */ 28974de12b7SAnatoly Burakov struct ipv6_hdr *ip_hdr; 29074de12b7SAnatoly Burakov 29174de12b7SAnatoly Burakov ipv6 = 1; 29274de12b7SAnatoly Burakov 29374de12b7SAnatoly Burakov /* Read the lookup key (i.e. ip_dst) from the input packet */ 29474de12b7SAnatoly Burakov ip_hdr = rte_pktmbuf_mtod(m, struct ipv6_hdr *); 29574de12b7SAnatoly Burakov 29674de12b7SAnatoly Burakov /* Find destination port */ 297d89a5bceSVladyslav Buslov if (rte_lpm6_lookup(rxq->lpm6, ip_hdr->dst_addr, 298d89a5bceSVladyslav Buslov &next_hop) == 0 && 299d89a5bceSVladyslav Buslov (enabled_port_mask & 1 << next_hop) != 0) { 300d89a5bceSVladyslav Buslov port_out = next_hop; 30174de12b7SAnatoly Burakov 30274de12b7SAnatoly Burakov /* Build transmission burst for new port */ 30374de12b7SAnatoly Burakov len = qconf->tx_mbufs[port_out].len; 30474de12b7SAnatoly Burakov } 30574de12b7SAnatoly Burakov 30674de12b7SAnatoly Burakov /* if we don't need to do any fragmentation */ 307ea672a8bSOlivier Matz if (likely (IPV6_MTU_DEFAULT >= m->pkt_len)) { 30874de12b7SAnatoly Burakov qconf->tx_mbufs[port_out].m_table[len] = m; 30974de12b7SAnatoly Burakov len2 = 1; 31074de12b7SAnatoly Burakov } else { 31174de12b7SAnatoly Burakov len2 = rte_ipv6_fragment_packet(m, 31274de12b7SAnatoly Burakov &qconf->tx_mbufs[port_out].m_table[len], 31374de12b7SAnatoly Burakov (uint16_t)(MBUF_TABLE_SIZE - len), 31474de12b7SAnatoly Burakov IPV6_MTU_DEFAULT, 31574de12b7SAnatoly Burakov rxq->direct_pool, rxq->indirect_pool); 31674de12b7SAnatoly Burakov 31774de12b7SAnatoly Burakov /* Free input packet */ 31874de12b7SAnatoly Burakov rte_pktmbuf_free(m); 31974de12b7SAnatoly Burakov 32074de12b7SAnatoly Burakov /* If we fail to fragment the packet */ 32174de12b7SAnatoly Burakov if (unlikely (len2 < 0)) 32274de12b7SAnatoly Burakov return; 32374de12b7SAnatoly Burakov } 32474de12b7SAnatoly Burakov } 32574de12b7SAnatoly Burakov /* else, just forward the packet */ 32674de12b7SAnatoly Burakov else { 32774de12b7SAnatoly Burakov qconf->tx_mbufs[port_out].m_table[len] = m; 32874de12b7SAnatoly Burakov len2 = 1; 32974de12b7SAnatoly Burakov } 330e107e82eSAnatoly Burakov 331e107e82eSAnatoly Burakov for (i = len; i < len + len2; i ++) { 33274de12b7SAnatoly Burakov void *d_addr_bytes; 33374de12b7SAnatoly Burakov 334e107e82eSAnatoly Burakov m = qconf->tx_mbufs[port_out].m_table[i]; 335e107e82eSAnatoly Burakov struct ether_hdr *eth_hdr = (struct ether_hdr *) 336e107e82eSAnatoly Burakov rte_pktmbuf_prepend(m, (uint16_t)sizeof(struct ether_hdr)); 337e107e82eSAnatoly Burakov if (eth_hdr == NULL) { 338e107e82eSAnatoly Burakov rte_panic("No headroom in mbuf.\n"); 339e107e82eSAnatoly Burakov } 340e107e82eSAnatoly Burakov 3417869536fSBruce Richardson m->l2_len = sizeof(struct ether_hdr); 342e107e82eSAnatoly Burakov 34374de12b7SAnatoly Burakov /* 02:00:00:00:00:xx */ 34474de12b7SAnatoly Burakov d_addr_bytes = ð_hdr->d_addr.addr_bytes[0]; 34574de12b7SAnatoly Burakov *((uint64_t *)d_addr_bytes) = 0x000000000002 + ((uint64_t)port_out << 40); 34674de12b7SAnatoly Burakov 34774de12b7SAnatoly Burakov /* src addr */ 348e107e82eSAnatoly Burakov ether_addr_copy(&ports_eth_addr[port_out], ð_hdr->s_addr); 34974de12b7SAnatoly Burakov if (ipv6) 35074de12b7SAnatoly Burakov eth_hdr->ether_type = rte_be_to_cpu_16(ETHER_TYPE_IPv6); 35174de12b7SAnatoly Burakov else 352e107e82eSAnatoly Burakov eth_hdr->ether_type = rte_be_to_cpu_16(ETHER_TYPE_IPv4); 353e107e82eSAnatoly Burakov } 354e107e82eSAnatoly Burakov 355e107e82eSAnatoly Burakov len += len2; 356e107e82eSAnatoly Burakov 357e107e82eSAnatoly Burakov if (likely(len < MAX_PKT_BURST)) { 358e107e82eSAnatoly Burakov qconf->tx_mbufs[port_out].len = (uint16_t)len; 359e107e82eSAnatoly Burakov return; 360e107e82eSAnatoly Burakov } 361e107e82eSAnatoly Burakov 362e107e82eSAnatoly Burakov /* Transmit packets */ 363e107e82eSAnatoly Burakov send_burst(qconf, (uint16_t)len, port_out); 364e107e82eSAnatoly Burakov qconf->tx_mbufs[port_out].len = 0; 365e107e82eSAnatoly Burakov } 366e107e82eSAnatoly Burakov 367e107e82eSAnatoly Burakov /* main processing loop */ 368e107e82eSAnatoly Burakov static int 369e107e82eSAnatoly Burakov main_loop(__attribute__((unused)) void *dummy) 370e107e82eSAnatoly Burakov { 371e107e82eSAnatoly Burakov struct rte_mbuf *pkts_burst[MAX_PKT_BURST]; 372e107e82eSAnatoly Burakov unsigned lcore_id; 373e107e82eSAnatoly Burakov uint64_t prev_tsc, diff_tsc, cur_tsc; 374e107e82eSAnatoly Burakov int i, j, nb_rx; 375f8244c63SZhiyong Yang uint16_t portid; 376e107e82eSAnatoly Burakov struct lcore_queue_conf *qconf; 377e107e82eSAnatoly Burakov const uint64_t drain_tsc = (rte_get_tsc_hz() + US_PER_S - 1) / US_PER_S * BURST_TX_DRAIN_US; 378e107e82eSAnatoly Burakov 379e107e82eSAnatoly Burakov prev_tsc = 0; 380e107e82eSAnatoly Burakov 381e107e82eSAnatoly Burakov lcore_id = rte_lcore_id(); 382e107e82eSAnatoly Burakov qconf = &lcore_queue_conf[lcore_id]; 383e107e82eSAnatoly Burakov 384e107e82eSAnatoly Burakov if (qconf->n_rx_queue == 0) { 38574de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "lcore %u has nothing to do\n", lcore_id); 386e107e82eSAnatoly Burakov return 0; 387e107e82eSAnatoly Burakov } 388e107e82eSAnatoly Burakov 38974de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "entering main loop on lcore %u\n", lcore_id); 390e107e82eSAnatoly Burakov 391e107e82eSAnatoly Burakov for (i = 0; i < qconf->n_rx_queue; i++) { 392e107e82eSAnatoly Burakov 39374de12b7SAnatoly Burakov portid = qconf->rx_queue_list[i].portid; 39474de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, " -- lcoreid=%u portid=%d\n", lcore_id, 395f8244c63SZhiyong Yang portid); 396e107e82eSAnatoly Burakov } 397e107e82eSAnatoly Burakov 398e107e82eSAnatoly Burakov while (1) { 399e107e82eSAnatoly Burakov 400e107e82eSAnatoly Burakov cur_tsc = rte_rdtsc(); 401e107e82eSAnatoly Burakov 402e107e82eSAnatoly Burakov /* 403e107e82eSAnatoly Burakov * TX burst queue drain 404e107e82eSAnatoly Burakov */ 405e107e82eSAnatoly Burakov diff_tsc = cur_tsc - prev_tsc; 406e107e82eSAnatoly Burakov if (unlikely(diff_tsc > drain_tsc)) { 407e107e82eSAnatoly Burakov 408e107e82eSAnatoly Burakov /* 409e107e82eSAnatoly Burakov * This could be optimized (use queueid instead of 410e107e82eSAnatoly Burakov * portid), but it is not called so often 411e107e82eSAnatoly Burakov */ 412e107e82eSAnatoly Burakov for (portid = 0; portid < RTE_MAX_ETHPORTS; portid++) { 413e107e82eSAnatoly Burakov if (qconf->tx_mbufs[portid].len == 0) 414e107e82eSAnatoly Burakov continue; 415e107e82eSAnatoly Burakov send_burst(&lcore_queue_conf[lcore_id], 416e107e82eSAnatoly Burakov qconf->tx_mbufs[portid].len, 417e107e82eSAnatoly Burakov portid); 418e107e82eSAnatoly Burakov qconf->tx_mbufs[portid].len = 0; 419e107e82eSAnatoly Burakov } 420e107e82eSAnatoly Burakov 421e107e82eSAnatoly Burakov prev_tsc = cur_tsc; 422e107e82eSAnatoly Burakov } 423e107e82eSAnatoly Burakov 424e107e82eSAnatoly Burakov /* 425e107e82eSAnatoly Burakov * Read packet from RX queues 426e107e82eSAnatoly Burakov */ 427e107e82eSAnatoly Burakov for (i = 0; i < qconf->n_rx_queue; i++) { 428e107e82eSAnatoly Burakov 42974de12b7SAnatoly Burakov portid = qconf->rx_queue_list[i].portid; 430e107e82eSAnatoly Burakov nb_rx = rte_eth_rx_burst(portid, 0, pkts_burst, 431e107e82eSAnatoly Burakov MAX_PKT_BURST); 432e107e82eSAnatoly Burakov 433e107e82eSAnatoly Burakov /* Prefetch first packets */ 434e107e82eSAnatoly Burakov for (j = 0; j < PREFETCH_OFFSET && j < nb_rx; j++) { 435e107e82eSAnatoly Burakov rte_prefetch0(rte_pktmbuf_mtod( 436e107e82eSAnatoly Burakov pkts_burst[j], void *)); 437e107e82eSAnatoly Burakov } 438e107e82eSAnatoly Burakov 439e107e82eSAnatoly Burakov /* Prefetch and forward already prefetched packets */ 440e107e82eSAnatoly Burakov for (j = 0; j < (nb_rx - PREFETCH_OFFSET); j++) { 441e107e82eSAnatoly Burakov rte_prefetch0(rte_pktmbuf_mtod(pkts_burst[ 442e107e82eSAnatoly Burakov j + PREFETCH_OFFSET], void *)); 44374de12b7SAnatoly Burakov l3fwd_simple_forward(pkts_burst[j], qconf, i, portid); 444e107e82eSAnatoly Burakov } 445e107e82eSAnatoly Burakov 446e107e82eSAnatoly Burakov /* Forward remaining prefetched packets */ 447e107e82eSAnatoly Burakov for (; j < nb_rx; j++) { 44874de12b7SAnatoly Burakov l3fwd_simple_forward(pkts_burst[j], qconf, i, portid); 449e107e82eSAnatoly Burakov } 450e107e82eSAnatoly Burakov } 451e107e82eSAnatoly Burakov } 452e107e82eSAnatoly Burakov } 453e107e82eSAnatoly Burakov 454e107e82eSAnatoly Burakov /* display usage */ 455e107e82eSAnatoly Burakov static void 456e107e82eSAnatoly Burakov print_usage(const char *prgname) 457e107e82eSAnatoly Burakov { 458e107e82eSAnatoly Burakov printf("%s [EAL options] -- -p PORTMASK [-q NQ]\n" 459e107e82eSAnatoly Burakov " -p PORTMASK: hexadecimal bitmask of ports to configure\n" 460e107e82eSAnatoly Burakov " -q NQ: number of queue (=ports) per lcore (default is 1)\n", 461e107e82eSAnatoly Burakov prgname); 462e107e82eSAnatoly Burakov } 463e107e82eSAnatoly Burakov 464e107e82eSAnatoly Burakov static int 465e107e82eSAnatoly Burakov parse_portmask(const char *portmask) 466e107e82eSAnatoly Burakov { 467e107e82eSAnatoly Burakov char *end = NULL; 468e107e82eSAnatoly Burakov unsigned long pm; 469e107e82eSAnatoly Burakov 470e107e82eSAnatoly Burakov /* parse hexadecimal string */ 471e107e82eSAnatoly Burakov pm = strtoul(portmask, &end, 16); 472e107e82eSAnatoly Burakov if ((portmask[0] == '\0') || (end == NULL) || (*end != '\0')) 473e107e82eSAnatoly Burakov return -1; 474e107e82eSAnatoly Burakov 475e107e82eSAnatoly Burakov if (pm == 0) 476e107e82eSAnatoly Burakov return -1; 477e107e82eSAnatoly Burakov 478e107e82eSAnatoly Burakov return pm; 479e107e82eSAnatoly Burakov } 480e107e82eSAnatoly Burakov 481e107e82eSAnatoly Burakov static int 482e107e82eSAnatoly Burakov parse_nqueue(const char *q_arg) 483e107e82eSAnatoly Burakov { 484e107e82eSAnatoly Burakov char *end = NULL; 485e107e82eSAnatoly Burakov unsigned long n; 486e107e82eSAnatoly Burakov 487e107e82eSAnatoly Burakov /* parse hexadecimal string */ 488e107e82eSAnatoly Burakov n = strtoul(q_arg, &end, 10); 489e107e82eSAnatoly Burakov if ((q_arg[0] == '\0') || (end == NULL) || (*end != '\0')) 490e107e82eSAnatoly Burakov return -1; 491e107e82eSAnatoly Burakov if (n == 0) 492e107e82eSAnatoly Burakov return -1; 493e107e82eSAnatoly Burakov if (n >= MAX_RX_QUEUE_PER_LCORE) 494e107e82eSAnatoly Burakov return -1; 495e107e82eSAnatoly Burakov 496e107e82eSAnatoly Burakov return n; 497e107e82eSAnatoly Burakov } 498e107e82eSAnatoly Burakov 499e107e82eSAnatoly Burakov /* Parse the argument given in the command line of the application */ 500e107e82eSAnatoly Burakov static int 501e107e82eSAnatoly Burakov parse_args(int argc, char **argv) 502e107e82eSAnatoly Burakov { 503e107e82eSAnatoly Burakov int opt, ret; 504e107e82eSAnatoly Burakov char **argvopt; 505e107e82eSAnatoly Burakov int option_index; 506e107e82eSAnatoly Burakov char *prgname = argv[0]; 507e107e82eSAnatoly Burakov static struct option lgopts[] = { 508e107e82eSAnatoly Burakov {NULL, 0, 0, 0} 509e107e82eSAnatoly Burakov }; 510e107e82eSAnatoly Burakov 511e107e82eSAnatoly Burakov argvopt = argv; 512e107e82eSAnatoly Burakov 513e107e82eSAnatoly Burakov while ((opt = getopt_long(argc, argvopt, "p:q:", 514e107e82eSAnatoly Burakov lgopts, &option_index)) != EOF) { 515e107e82eSAnatoly Burakov 516e107e82eSAnatoly Burakov switch (opt) { 517e107e82eSAnatoly Burakov /* portmask */ 518e107e82eSAnatoly Burakov case 'p': 519e107e82eSAnatoly Burakov enabled_port_mask = parse_portmask(optarg); 520e107e82eSAnatoly Burakov if (enabled_port_mask < 0) { 521e107e82eSAnatoly Burakov printf("invalid portmask\n"); 522e107e82eSAnatoly Burakov print_usage(prgname); 523e107e82eSAnatoly Burakov return -1; 524e107e82eSAnatoly Burakov } 525e107e82eSAnatoly Burakov break; 526e107e82eSAnatoly Burakov 527e107e82eSAnatoly Burakov /* nqueue */ 528e107e82eSAnatoly Burakov case 'q': 529e107e82eSAnatoly Burakov rx_queue_per_lcore = parse_nqueue(optarg); 530e107e82eSAnatoly Burakov if (rx_queue_per_lcore < 0) { 531e107e82eSAnatoly Burakov printf("invalid queue number\n"); 532e107e82eSAnatoly Burakov print_usage(prgname); 533e107e82eSAnatoly Burakov return -1; 534e107e82eSAnatoly Burakov } 535e107e82eSAnatoly Burakov break; 536e107e82eSAnatoly Burakov 537e107e82eSAnatoly Burakov /* long options */ 538e107e82eSAnatoly Burakov case 0: 539e107e82eSAnatoly Burakov print_usage(prgname); 540e107e82eSAnatoly Burakov return -1; 541e107e82eSAnatoly Burakov 542e107e82eSAnatoly Burakov default: 543e107e82eSAnatoly Burakov print_usage(prgname); 544e107e82eSAnatoly Burakov return -1; 545e107e82eSAnatoly Burakov } 546e107e82eSAnatoly Burakov } 547e107e82eSAnatoly Burakov 548e107e82eSAnatoly Burakov if (enabled_port_mask == 0) { 549e107e82eSAnatoly Burakov printf("portmask not specified\n"); 550e107e82eSAnatoly Burakov print_usage(prgname); 551e107e82eSAnatoly Burakov return -1; 552e107e82eSAnatoly Burakov } 553e107e82eSAnatoly Burakov 554e107e82eSAnatoly Burakov if (optind >= 0) 555e107e82eSAnatoly Burakov argv[optind-1] = prgname; 556e107e82eSAnatoly Burakov 557e107e82eSAnatoly Burakov ret = optind-1; 5589d5ca532SKeith Wiles optind = 1; /* reset getopt lib */ 559e107e82eSAnatoly Burakov return ret; 560e107e82eSAnatoly Burakov } 561e107e82eSAnatoly Burakov 562e107e82eSAnatoly Burakov static void 563e107e82eSAnatoly Burakov print_ethaddr(const char *name, struct ether_addr *eth_addr) 564e107e82eSAnatoly Burakov { 565ec3d82dbSCunming Liang char buf[ETHER_ADDR_FMT_SIZE]; 566ec3d82dbSCunming Liang ether_format_addr(buf, ETHER_ADDR_FMT_SIZE, eth_addr); 567ec3d82dbSCunming Liang printf("%s%s", name, buf); 568e107e82eSAnatoly Burakov } 569e107e82eSAnatoly Burakov 570e107e82eSAnatoly Burakov /* Check the link status of all ports in up to 9s, and print them finally */ 571e107e82eSAnatoly Burakov static void 5728728ccf3SThomas Monjalon check_all_ports_link_status(uint32_t port_mask) 573e107e82eSAnatoly Burakov { 574e107e82eSAnatoly Burakov #define CHECK_INTERVAL 100 /* 100ms */ 575e107e82eSAnatoly Burakov #define MAX_CHECK_TIME 90 /* 9s (90 * 100ms) in total */ 576f8244c63SZhiyong Yang uint16_t portid; 577f8244c63SZhiyong Yang uint8_t count, all_ports_up, print_flag = 0; 578e107e82eSAnatoly Burakov struct rte_eth_link link; 579e107e82eSAnatoly Burakov 580e107e82eSAnatoly Burakov printf("\nChecking link status"); 581e107e82eSAnatoly Burakov fflush(stdout); 582e107e82eSAnatoly Burakov for (count = 0; count <= MAX_CHECK_TIME; count++) { 583e107e82eSAnatoly Burakov all_ports_up = 1; 5848728ccf3SThomas Monjalon RTE_ETH_FOREACH_DEV(portid) { 585e107e82eSAnatoly Burakov if ((port_mask & (1 << portid)) == 0) 586e107e82eSAnatoly Burakov continue; 587e107e82eSAnatoly Burakov memset(&link, 0, sizeof(link)); 588e107e82eSAnatoly Burakov rte_eth_link_get_nowait(portid, &link); 589e107e82eSAnatoly Burakov /* print link status if flag set */ 590e107e82eSAnatoly Burakov if (print_flag == 1) { 591e107e82eSAnatoly Burakov if (link.link_status) 592f8244c63SZhiyong Yang printf( 593f8244c63SZhiyong Yang "Port%d Link Up .Speed %u Mbps - %s\n", 594f8244c63SZhiyong Yang portid, link.link_speed, 595e107e82eSAnatoly Burakov (link.link_duplex == ETH_LINK_FULL_DUPLEX) ? 596e107e82eSAnatoly Burakov ("full-duplex") : ("half-duplex\n")); 597e107e82eSAnatoly Burakov else 598f8244c63SZhiyong Yang printf("Port %d Link Down\n", portid); 599e107e82eSAnatoly Burakov continue; 600e107e82eSAnatoly Burakov } 601e107e82eSAnatoly Burakov /* clear all_ports_up flag if any link down */ 60209419f23SThomas Monjalon if (link.link_status == ETH_LINK_DOWN) { 603e107e82eSAnatoly Burakov all_ports_up = 0; 604e107e82eSAnatoly Burakov break; 605e107e82eSAnatoly Burakov } 606e107e82eSAnatoly Burakov } 607e107e82eSAnatoly Burakov /* after finally printing all link status, get out */ 608e107e82eSAnatoly Burakov if (print_flag == 1) 609e107e82eSAnatoly Burakov break; 610e107e82eSAnatoly Burakov 611e107e82eSAnatoly Burakov if (all_ports_up == 0) { 612e107e82eSAnatoly Burakov printf("."); 613e107e82eSAnatoly Burakov fflush(stdout); 614e107e82eSAnatoly Burakov rte_delay_ms(CHECK_INTERVAL); 615e107e82eSAnatoly Burakov } 616e107e82eSAnatoly Burakov 617e107e82eSAnatoly Burakov /* set the print_flag if all ports up or timeout */ 618e107e82eSAnatoly Burakov if (all_ports_up == 1 || count == (MAX_CHECK_TIME - 1)) { 619e107e82eSAnatoly Burakov print_flag = 1; 62074de12b7SAnatoly Burakov printf("\ndone\n"); 621e107e82eSAnatoly Burakov } 622e107e82eSAnatoly Burakov } 623e107e82eSAnatoly Burakov } 624e107e82eSAnatoly Burakov 625201d52bcSWei Dai /* Check L3 packet type detection capablity of the NIC port */ 626201d52bcSWei Dai static int 627201d52bcSWei Dai check_ptype(int portid) 628201d52bcSWei Dai { 629201d52bcSWei Dai int i, ret; 630201d52bcSWei Dai int ptype_l3_ipv4 = 0, ptype_l3_ipv6 = 0; 631201d52bcSWei Dai uint32_t ptype_mask = RTE_PTYPE_L3_MASK; 632201d52bcSWei Dai 633201d52bcSWei Dai ret = rte_eth_dev_get_supported_ptypes(portid, ptype_mask, NULL, 0); 634201d52bcSWei Dai if (ret <= 0) 635201d52bcSWei Dai return 0; 636201d52bcSWei Dai 637201d52bcSWei Dai uint32_t ptypes[ret]; 638201d52bcSWei Dai 639201d52bcSWei Dai ret = rte_eth_dev_get_supported_ptypes(portid, ptype_mask, ptypes, ret); 640201d52bcSWei Dai for (i = 0; i < ret; ++i) { 641201d52bcSWei Dai if (ptypes[i] & RTE_PTYPE_L3_IPV4) 642201d52bcSWei Dai ptype_l3_ipv4 = 1; 643201d52bcSWei Dai if (ptypes[i] & RTE_PTYPE_L3_IPV6) 644201d52bcSWei Dai ptype_l3_ipv6 = 1; 645201d52bcSWei Dai } 646201d52bcSWei Dai 647201d52bcSWei Dai if (ptype_l3_ipv4 == 0) 648201d52bcSWei Dai printf("port %d cannot parse RTE_PTYPE_L3_IPV4\n", portid); 649201d52bcSWei Dai 650201d52bcSWei Dai if (ptype_l3_ipv6 == 0) 651201d52bcSWei Dai printf("port %d cannot parse RTE_PTYPE_L3_IPV6\n", portid); 652201d52bcSWei Dai 653201d52bcSWei Dai if (ptype_l3_ipv4 && ptype_l3_ipv6) 654201d52bcSWei Dai return 1; 655201d52bcSWei Dai 656201d52bcSWei Dai return 0; 657201d52bcSWei Dai 658201d52bcSWei Dai } 659201d52bcSWei Dai 660201d52bcSWei Dai /* Parse packet type of a packet by SW */ 661201d52bcSWei Dai static inline void 662201d52bcSWei Dai parse_ptype(struct rte_mbuf *m) 663201d52bcSWei Dai { 664201d52bcSWei Dai struct ether_hdr *eth_hdr; 665201d52bcSWei Dai uint32_t packet_type = RTE_PTYPE_UNKNOWN; 666201d52bcSWei Dai uint16_t ether_type; 667201d52bcSWei Dai 668201d52bcSWei Dai eth_hdr = rte_pktmbuf_mtod(m, struct ether_hdr *); 669201d52bcSWei Dai ether_type = eth_hdr->ether_type; 670201d52bcSWei Dai if (ether_type == rte_cpu_to_be_16(ETHER_TYPE_IPv4)) 671201d52bcSWei Dai packet_type |= RTE_PTYPE_L3_IPV4_EXT_UNKNOWN; 672201d52bcSWei Dai else if (ether_type == rte_cpu_to_be_16(ETHER_TYPE_IPv6)) 673201d52bcSWei Dai packet_type |= RTE_PTYPE_L3_IPV6_EXT_UNKNOWN; 674201d52bcSWei Dai 675201d52bcSWei Dai m->packet_type = packet_type; 676201d52bcSWei Dai } 677201d52bcSWei Dai 678201d52bcSWei Dai /* callback function to detect packet type for a queue of a port */ 679201d52bcSWei Dai static uint16_t 680f8244c63SZhiyong Yang cb_parse_ptype(uint16_t port __rte_unused, uint16_t queue __rte_unused, 681201d52bcSWei Dai struct rte_mbuf *pkts[], uint16_t nb_pkts, 682201d52bcSWei Dai uint16_t max_pkts __rte_unused, 683201d52bcSWei Dai void *user_param __rte_unused) 684201d52bcSWei Dai { 685201d52bcSWei Dai uint16_t i; 686201d52bcSWei Dai 687201d52bcSWei Dai for (i = 0; i < nb_pkts; ++i) 688201d52bcSWei Dai parse_ptype(pkts[i]); 689201d52bcSWei Dai 690201d52bcSWei Dai return nb_pkts; 691201d52bcSWei Dai } 692201d52bcSWei Dai 69374de12b7SAnatoly Burakov static int 69474de12b7SAnatoly Burakov init_routing_table(void) 69574de12b7SAnatoly Burakov { 69674de12b7SAnatoly Burakov struct rte_lpm *lpm; 69774de12b7SAnatoly Burakov struct rte_lpm6 *lpm6; 69874de12b7SAnatoly Burakov int socket, ret; 69974de12b7SAnatoly Burakov unsigned i; 70074de12b7SAnatoly Burakov 70174de12b7SAnatoly Burakov for (socket = 0; socket < RTE_MAX_NUMA_NODES; socket++) { 70274de12b7SAnatoly Burakov if (socket_lpm[socket]) { 70374de12b7SAnatoly Burakov lpm = socket_lpm[socket]; 70474de12b7SAnatoly Burakov /* populate the LPM table */ 70574de12b7SAnatoly Burakov for (i = 0; i < RTE_DIM(l3fwd_ipv4_route_array); i++) { 70674de12b7SAnatoly Burakov ret = rte_lpm_add(lpm, 70774de12b7SAnatoly Burakov l3fwd_ipv4_route_array[i].ip, 70874de12b7SAnatoly Burakov l3fwd_ipv4_route_array[i].depth, 70974de12b7SAnatoly Burakov l3fwd_ipv4_route_array[i].if_out); 71074de12b7SAnatoly Burakov 71174de12b7SAnatoly Burakov if (ret < 0) { 71274de12b7SAnatoly Burakov RTE_LOG(ERR, IP_FRAG, "Unable to add entry %i to the l3fwd " 71374de12b7SAnatoly Burakov "LPM table\n", i); 71474de12b7SAnatoly Burakov return -1; 71574de12b7SAnatoly Burakov } 71674de12b7SAnatoly Burakov 71774de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "Socket %i: adding route " IPv4_BYTES_FMT 71874de12b7SAnatoly Burakov "/%d (port %d)\n", 71974de12b7SAnatoly Burakov socket, 72074de12b7SAnatoly Burakov IPv4_BYTES(l3fwd_ipv4_route_array[i].ip), 72174de12b7SAnatoly Burakov l3fwd_ipv4_route_array[i].depth, 72274de12b7SAnatoly Burakov l3fwd_ipv4_route_array[i].if_out); 72374de12b7SAnatoly Burakov } 72474de12b7SAnatoly Burakov } 72574de12b7SAnatoly Burakov 72674de12b7SAnatoly Burakov if (socket_lpm6[socket]) { 72774de12b7SAnatoly Burakov lpm6 = socket_lpm6[socket]; 72874de12b7SAnatoly Burakov /* populate the LPM6 table */ 72974de12b7SAnatoly Burakov for (i = 0; i < RTE_DIM(l3fwd_ipv6_route_array); i++) { 73074de12b7SAnatoly Burakov ret = rte_lpm6_add(lpm6, 73174de12b7SAnatoly Burakov l3fwd_ipv6_route_array[i].ip, 73274de12b7SAnatoly Burakov l3fwd_ipv6_route_array[i].depth, 73374de12b7SAnatoly Burakov l3fwd_ipv6_route_array[i].if_out); 73474de12b7SAnatoly Burakov 73574de12b7SAnatoly Burakov if (ret < 0) { 73674de12b7SAnatoly Burakov RTE_LOG(ERR, IP_FRAG, "Unable to add entry %i to the l3fwd " 73774de12b7SAnatoly Burakov "LPM6 table\n", i); 73874de12b7SAnatoly Burakov return -1; 73974de12b7SAnatoly Burakov } 74074de12b7SAnatoly Burakov 74174de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "Socket %i: adding route " IPv6_BYTES_FMT 74274de12b7SAnatoly Burakov "/%d (port %d)\n", 74374de12b7SAnatoly Burakov socket, 74474de12b7SAnatoly Burakov IPv6_BYTES(l3fwd_ipv6_route_array[i].ip), 74574de12b7SAnatoly Burakov l3fwd_ipv6_route_array[i].depth, 74674de12b7SAnatoly Burakov l3fwd_ipv6_route_array[i].if_out); 74774de12b7SAnatoly Burakov } 74874de12b7SAnatoly Burakov } 74974de12b7SAnatoly Burakov } 75074de12b7SAnatoly Burakov return 0; 75174de12b7SAnatoly Burakov } 75274de12b7SAnatoly Burakov 75374de12b7SAnatoly Burakov static int 75474de12b7SAnatoly Burakov init_mem(void) 75574de12b7SAnatoly Burakov { 75674de12b7SAnatoly Burakov char buf[PATH_MAX]; 75774de12b7SAnatoly Burakov struct rte_mempool *mp; 75874de12b7SAnatoly Burakov struct rte_lpm *lpm; 75974de12b7SAnatoly Burakov struct rte_lpm6 *lpm6; 760f1f72618SMichal Kobylinski struct rte_lpm_config lpm_config; 76174de12b7SAnatoly Burakov int socket; 76274de12b7SAnatoly Burakov unsigned lcore_id; 76374de12b7SAnatoly Burakov 76474de12b7SAnatoly Burakov /* traverse through lcores and initialize structures on each socket */ 76574de12b7SAnatoly Burakov 76674de12b7SAnatoly Burakov for (lcore_id = 0; lcore_id < RTE_MAX_LCORE; lcore_id++) { 76774de12b7SAnatoly Burakov 76874de12b7SAnatoly Burakov if (rte_lcore_is_enabled(lcore_id) == 0) 76974de12b7SAnatoly Burakov continue; 77074de12b7SAnatoly Burakov 77174de12b7SAnatoly Burakov socket = rte_lcore_to_socket_id(lcore_id); 77274de12b7SAnatoly Burakov 77374de12b7SAnatoly Burakov if (socket == SOCKET_ID_ANY) 77474de12b7SAnatoly Burakov socket = 0; 77574de12b7SAnatoly Burakov 77674de12b7SAnatoly Burakov if (socket_direct_pool[socket] == NULL) { 77774de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "Creating direct mempool on socket %i\n", 77874de12b7SAnatoly Burakov socket); 7796f41fe75SStephen Hemminger snprintf(buf, sizeof(buf), "pool_direct_%i", socket); 78074de12b7SAnatoly Burakov 781ea0c20eaSOlivier Matz mp = rte_pktmbuf_pool_create(buf, NB_MBUF, 32, 782824cb29cSKonstantin Ananyev 0, RTE_MBUF_DEFAULT_BUF_SIZE, socket); 78374de12b7SAnatoly Burakov if (mp == NULL) { 78474de12b7SAnatoly Burakov RTE_LOG(ERR, IP_FRAG, "Cannot create direct mempool\n"); 78574de12b7SAnatoly Burakov return -1; 78674de12b7SAnatoly Burakov } 78774de12b7SAnatoly Burakov socket_direct_pool[socket] = mp; 78874de12b7SAnatoly Burakov } 78974de12b7SAnatoly Burakov 79074de12b7SAnatoly Burakov if (socket_indirect_pool[socket] == NULL) { 79174de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "Creating indirect mempool on socket %i\n", 79274de12b7SAnatoly Burakov socket); 7936f41fe75SStephen Hemminger snprintf(buf, sizeof(buf), "pool_indirect_%i", socket); 79474de12b7SAnatoly Burakov 795ea0c20eaSOlivier Matz mp = rte_pktmbuf_pool_create(buf, NB_MBUF, 32, 0, 0, 796ea0c20eaSOlivier Matz socket); 79774de12b7SAnatoly Burakov if (mp == NULL) { 79874de12b7SAnatoly Burakov RTE_LOG(ERR, IP_FRAG, "Cannot create indirect mempool\n"); 79974de12b7SAnatoly Burakov return -1; 80074de12b7SAnatoly Burakov } 80174de12b7SAnatoly Burakov socket_indirect_pool[socket] = mp; 80274de12b7SAnatoly Burakov } 80374de12b7SAnatoly Burakov 80474de12b7SAnatoly Burakov if (socket_lpm[socket] == NULL) { 80574de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "Creating LPM table on socket %i\n", socket); 8066f41fe75SStephen Hemminger snprintf(buf, sizeof(buf), "IP_FRAG_LPM_%i", socket); 80774de12b7SAnatoly Burakov 808f1f72618SMichal Kobylinski lpm_config.max_rules = LPM_MAX_RULES; 809f1f72618SMichal Kobylinski lpm_config.number_tbl8s = 256; 810f1f72618SMichal Kobylinski lpm_config.flags = 0; 811f1f72618SMichal Kobylinski 812f1f72618SMichal Kobylinski lpm = rte_lpm_create(buf, socket, &lpm_config); 81374de12b7SAnatoly Burakov if (lpm == NULL) { 81474de12b7SAnatoly Burakov RTE_LOG(ERR, IP_FRAG, "Cannot create LPM table\n"); 81574de12b7SAnatoly Burakov return -1; 81674de12b7SAnatoly Burakov } 81774de12b7SAnatoly Burakov socket_lpm[socket] = lpm; 81874de12b7SAnatoly Burakov } 81974de12b7SAnatoly Burakov 82074de12b7SAnatoly Burakov if (socket_lpm6[socket] == NULL) { 82174de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "Creating LPM6 table on socket %i\n", socket); 8226f41fe75SStephen Hemminger snprintf(buf, sizeof(buf), "IP_FRAG_LPM_%i", socket); 82374de12b7SAnatoly Burakov 824d1082cdeSOlivier Matz lpm6 = rte_lpm6_create(buf, socket, &lpm6_config); 82574de12b7SAnatoly Burakov if (lpm6 == NULL) { 82674de12b7SAnatoly Burakov RTE_LOG(ERR, IP_FRAG, "Cannot create LPM table\n"); 82774de12b7SAnatoly Burakov return -1; 82874de12b7SAnatoly Burakov } 82974de12b7SAnatoly Burakov socket_lpm6[socket] = lpm6; 83074de12b7SAnatoly Burakov } 83174de12b7SAnatoly Burakov } 83274de12b7SAnatoly Burakov 83374de12b7SAnatoly Burakov return 0; 83474de12b7SAnatoly Burakov } 83574de12b7SAnatoly Burakov 836e107e82eSAnatoly Burakov int 83798a16481SDavid Marchand main(int argc, char **argv) 838e107e82eSAnatoly Burakov { 839e107e82eSAnatoly Burakov struct lcore_queue_conf *qconf; 84081f7ecd9SPablo de Lara struct rte_eth_dev_info dev_info; 84181f7ecd9SPablo de Lara struct rte_eth_txconf *txconf; 84274de12b7SAnatoly Burakov struct rx_queue *rxq; 84374de12b7SAnatoly Burakov int socket, ret; 844d9a42a69SThomas Monjalon uint16_t nb_ports; 845e107e82eSAnatoly Burakov uint16_t queueid = 0; 846e107e82eSAnatoly Burakov unsigned lcore_id = 0, rx_lcore_id = 0; 847e107e82eSAnatoly Burakov uint32_t n_tx_queue, nb_lcores; 848f8244c63SZhiyong Yang uint16_t portid; 849e107e82eSAnatoly Burakov 850e107e82eSAnatoly Burakov /* init EAL */ 851e107e82eSAnatoly Burakov ret = rte_eal_init(argc, argv); 852e107e82eSAnatoly Burakov if (ret < 0) 853e107e82eSAnatoly Burakov rte_exit(EXIT_FAILURE, "rte_eal_init failed"); 854e107e82eSAnatoly Burakov argc -= ret; 855e107e82eSAnatoly Burakov argv += ret; 856e107e82eSAnatoly Burakov 857e107e82eSAnatoly Burakov /* parse application arguments (after the EAL ones) */ 858e107e82eSAnatoly Burakov ret = parse_args(argc, argv); 859e107e82eSAnatoly Burakov if (ret < 0) 860e107e82eSAnatoly Burakov rte_exit(EXIT_FAILURE, "Invalid arguments"); 861e107e82eSAnatoly Burakov 862d9a42a69SThomas Monjalon nb_ports = rte_eth_dev_count_avail(); 863b4e0f64fSMauricio Vasquez B if (nb_ports == 0) 86474de12b7SAnatoly Burakov rte_exit(EXIT_FAILURE, "No ports found!\n"); 865e107e82eSAnatoly Burakov 866e107e82eSAnatoly Burakov nb_lcores = rte_lcore_count(); 867e107e82eSAnatoly Burakov 86874de12b7SAnatoly Burakov /* initialize structures (mempools, lpm etc.) */ 86974de12b7SAnatoly Burakov if (init_mem() < 0) 87074de12b7SAnatoly Burakov rte_panic("Cannot initialize memory structures!\n"); 87174de12b7SAnatoly Burakov 872eaa8d3bfSAnatoly Burakov /* check if portmask has non-existent ports */ 873eaa8d3bfSAnatoly Burakov if (enabled_port_mask & ~(RTE_LEN2MASK(nb_ports, unsigned))) 874eaa8d3bfSAnatoly Burakov rte_exit(EXIT_FAILURE, "Non-existent ports in portmask!\n"); 875eaa8d3bfSAnatoly Burakov 876e107e82eSAnatoly Burakov /* initialize all ports */ 8778728ccf3SThomas Monjalon RTE_ETH_FOREACH_DEV(portid) { 878fdb9eff6SShahaf Shuler struct rte_eth_conf local_port_conf = port_conf; 879fdb9eff6SShahaf Shuler struct rte_eth_rxconf rxq_conf; 880fdb9eff6SShahaf Shuler 881e107e82eSAnatoly Burakov /* skip ports that are not enabled */ 882e107e82eSAnatoly Burakov if ((enabled_port_mask & (1 << portid)) == 0) { 883e107e82eSAnatoly Burakov printf("Skipping disabled port %d\n", portid); 884e107e82eSAnatoly Burakov continue; 885e107e82eSAnatoly Burakov } 886e107e82eSAnatoly Burakov 887e107e82eSAnatoly Burakov qconf = &lcore_queue_conf[rx_lcore_id]; 888e107e82eSAnatoly Burakov 8895e470a66SAndriy Berestovskyy /* limit the frame size to the maximum supported by NIC */ 8905e470a66SAndriy Berestovskyy rte_eth_dev_info_get(portid, &dev_info); 891fdb9eff6SShahaf Shuler local_port_conf.rxmode.max_rx_pkt_len = RTE_MIN( 892fdb9eff6SShahaf Shuler dev_info.max_rx_pktlen, 893fdb9eff6SShahaf Shuler local_port_conf.rxmode.max_rx_pkt_len); 8945e470a66SAndriy Berestovskyy 895e107e82eSAnatoly Burakov /* get the lcore_id for this port */ 896e107e82eSAnatoly Burakov while (rte_lcore_is_enabled(rx_lcore_id) == 0 || 897e107e82eSAnatoly Burakov qconf->n_rx_queue == (unsigned)rx_queue_per_lcore) { 898e107e82eSAnatoly Burakov 899e107e82eSAnatoly Burakov rx_lcore_id ++; 900e107e82eSAnatoly Burakov if (rx_lcore_id >= RTE_MAX_LCORE) 901e107e82eSAnatoly Burakov rte_exit(EXIT_FAILURE, "Not enough cores\n"); 902e107e82eSAnatoly Burakov 903e107e82eSAnatoly Burakov qconf = &lcore_queue_conf[rx_lcore_id]; 904e107e82eSAnatoly Burakov } 90574de12b7SAnatoly Burakov 906324bcf45SAnatoly Burakov socket = (int) rte_lcore_to_socket_id(rx_lcore_id); 90774de12b7SAnatoly Burakov if (socket == SOCKET_ID_ANY) 90874de12b7SAnatoly Burakov socket = 0; 90974de12b7SAnatoly Burakov 91074de12b7SAnatoly Burakov rxq = &qconf->rx_queue_list[qconf->n_rx_queue]; 91174de12b7SAnatoly Burakov rxq->portid = portid; 91274de12b7SAnatoly Burakov rxq->direct_pool = socket_direct_pool[socket]; 91374de12b7SAnatoly Burakov rxq->indirect_pool = socket_indirect_pool[socket]; 91474de12b7SAnatoly Burakov rxq->lpm = socket_lpm[socket]; 91574de12b7SAnatoly Burakov rxq->lpm6 = socket_lpm6[socket]; 916e107e82eSAnatoly Burakov qconf->n_rx_queue++; 917e107e82eSAnatoly Burakov 918e107e82eSAnatoly Burakov /* init port */ 919e107e82eSAnatoly Burakov printf("Initializing port %d on lcore %u...", portid, 920e107e82eSAnatoly Burakov rx_lcore_id); 921e107e82eSAnatoly Burakov fflush(stdout); 922e107e82eSAnatoly Burakov 923e107e82eSAnatoly Burakov n_tx_queue = nb_lcores; 924e107e82eSAnatoly Burakov if (n_tx_queue > MAX_TX_QUEUE_PER_PORT) 925e107e82eSAnatoly Burakov n_tx_queue = MAX_TX_QUEUE_PER_PORT; 926fdb9eff6SShahaf Shuler if (dev_info.tx_offload_capa & DEV_TX_OFFLOAD_MBUF_FAST_FREE) 927fdb9eff6SShahaf Shuler local_port_conf.txmode.offloads |= 928fdb9eff6SShahaf Shuler DEV_TX_OFFLOAD_MBUF_FAST_FREE; 929e107e82eSAnatoly Burakov ret = rte_eth_dev_configure(portid, 1, (uint16_t)n_tx_queue, 930fdb9eff6SShahaf Shuler &local_port_conf); 93174de12b7SAnatoly Burakov if (ret < 0) { 93274de12b7SAnatoly Burakov printf("\n"); 933e107e82eSAnatoly Burakov rte_exit(EXIT_FAILURE, "Cannot configure device: " 934e107e82eSAnatoly Burakov "err=%d, port=%d\n", 935e107e82eSAnatoly Burakov ret, portid); 93674de12b7SAnatoly Burakov } 93774de12b7SAnatoly Burakov 93860efb44fSRoman Zhukov ret = rte_eth_dev_adjust_nb_rx_tx_desc(portid, &nb_rxd, 93960efb44fSRoman Zhukov &nb_txd); 94060efb44fSRoman Zhukov if (ret < 0) { 94160efb44fSRoman Zhukov printf("\n"); 94260efb44fSRoman Zhukov rte_exit(EXIT_FAILURE, "Cannot adjust number of " 94360efb44fSRoman Zhukov "descriptors: err=%d, port=%d\n", ret, portid); 94460efb44fSRoman Zhukov } 94560efb44fSRoman Zhukov 94674de12b7SAnatoly Burakov /* init one RX queue */ 947fdb9eff6SShahaf Shuler rxq_conf = dev_info.default_rxconf; 948fdb9eff6SShahaf Shuler rxq_conf.offloads = local_port_conf.rxmode.offloads; 94974de12b7SAnatoly Burakov ret = rte_eth_rx_queue_setup(portid, 0, nb_rxd, 950fdb9eff6SShahaf Shuler socket, &rxq_conf, 95174de12b7SAnatoly Burakov socket_direct_pool[socket]); 95274de12b7SAnatoly Burakov if (ret < 0) { 95374de12b7SAnatoly Burakov printf("\n"); 95474de12b7SAnatoly Burakov rte_exit(EXIT_FAILURE, "rte_eth_rx_queue_setup: " 95574de12b7SAnatoly Burakov "err=%d, port=%d\n", 95674de12b7SAnatoly Burakov ret, portid); 95774de12b7SAnatoly Burakov } 958e107e82eSAnatoly Burakov 959e107e82eSAnatoly Burakov rte_eth_macaddr_get(portid, &ports_eth_addr[portid]); 960e107e82eSAnatoly Burakov print_ethaddr(" Address:", &ports_eth_addr[portid]); 96174de12b7SAnatoly Burakov printf("\n"); 962e107e82eSAnatoly Burakov 963e107e82eSAnatoly Burakov /* init one TX queue per couple (lcore,port) */ 964e107e82eSAnatoly Burakov queueid = 0; 965e107e82eSAnatoly Burakov for (lcore_id = 0; lcore_id < RTE_MAX_LCORE; lcore_id++) { 966e107e82eSAnatoly Burakov if (rte_lcore_is_enabled(lcore_id) == 0) 967e107e82eSAnatoly Burakov continue; 96874de12b7SAnatoly Burakov 96974de12b7SAnatoly Burakov socket = (int) rte_lcore_to_socket_id(lcore_id); 970e107e82eSAnatoly Burakov printf("txq=%u,%d ", lcore_id, queueid); 971e107e82eSAnatoly Burakov fflush(stdout); 97281f7ecd9SPablo de Lara 97381f7ecd9SPablo de Lara txconf = &dev_info.default_txconf; 974fdb9eff6SShahaf Shuler txconf->offloads = local_port_conf.txmode.offloads; 975e107e82eSAnatoly Burakov ret = rte_eth_tx_queue_setup(portid, queueid, nb_txd, 97681f7ecd9SPablo de Lara socket, txconf); 97774de12b7SAnatoly Burakov if (ret < 0) { 97874de12b7SAnatoly Burakov printf("\n"); 979e107e82eSAnatoly Burakov rte_exit(EXIT_FAILURE, "rte_eth_tx_queue_setup: " 980e107e82eSAnatoly Burakov "err=%d, port=%d\n", ret, portid); 98174de12b7SAnatoly Burakov } 982e107e82eSAnatoly Burakov 983e107e82eSAnatoly Burakov qconf = &lcore_queue_conf[lcore_id]; 984e107e82eSAnatoly Burakov qconf->tx_queue_id[portid] = queueid; 985e107e82eSAnatoly Burakov queueid++; 986e107e82eSAnatoly Burakov } 987e107e82eSAnatoly Burakov 98874de12b7SAnatoly Burakov printf("\n"); 98974de12b7SAnatoly Burakov } 99074de12b7SAnatoly Burakov 99174de12b7SAnatoly Burakov printf("\n"); 99274de12b7SAnatoly Burakov 99374de12b7SAnatoly Burakov /* start ports */ 9948728ccf3SThomas Monjalon RTE_ETH_FOREACH_DEV(portid) { 99574de12b7SAnatoly Burakov if ((enabled_port_mask & (1 << portid)) == 0) { 99674de12b7SAnatoly Burakov continue; 99774de12b7SAnatoly Burakov } 998e107e82eSAnatoly Burakov /* Start device */ 999e107e82eSAnatoly Burakov ret = rte_eth_dev_start(portid); 1000e107e82eSAnatoly Burakov if (ret < 0) 100174de12b7SAnatoly Burakov rte_exit(EXIT_FAILURE, "rte_eth_dev_start: err=%d, port=%d\n", 1002e107e82eSAnatoly Burakov ret, portid); 1003e107e82eSAnatoly Burakov 1004e107e82eSAnatoly Burakov rte_eth_promiscuous_enable(portid); 1005201d52bcSWei Dai 1006201d52bcSWei Dai if (check_ptype(portid) == 0) { 1007201d52bcSWei Dai rte_eth_add_rx_callback(portid, 0, cb_parse_ptype, NULL); 100898a7ea33SJerin Jacob printf("Add Rx callback function to detect L3 packet type by SW :" 1009201d52bcSWei Dai " port = %d\n", portid); 1010201d52bcSWei Dai } 1011e107e82eSAnatoly Burakov } 1012e107e82eSAnatoly Burakov 101374de12b7SAnatoly Burakov if (init_routing_table() < 0) 101474de12b7SAnatoly Burakov rte_exit(EXIT_FAILURE, "Cannot init routing table\n"); 101574de12b7SAnatoly Burakov 10168728ccf3SThomas Monjalon check_all_ports_link_status(enabled_port_mask); 1017e107e82eSAnatoly Burakov 1018e107e82eSAnatoly Burakov /* launch per-lcore init on every lcore */ 1019e107e82eSAnatoly Burakov rte_eal_mp_remote_launch(main_loop, NULL, CALL_MASTER); 1020e107e82eSAnatoly Burakov RTE_LCORE_FOREACH_SLAVE(lcore_id) { 1021e107e82eSAnatoly Burakov if (rte_eal_wait_lcore(lcore_id) < 0) 1022e107e82eSAnatoly Burakov return -1; 1023e107e82eSAnatoly Burakov } 1024e107e82eSAnatoly Burakov 1025e107e82eSAnatoly Burakov return 0; 1026e107e82eSAnatoly Burakov } 1027