1e107e82eSAnatoly Burakov /*- 2e107e82eSAnatoly Burakov * BSD LICENSE 3e107e82eSAnatoly Burakov * 4e107e82eSAnatoly Burakov * Copyright(c) 2010-2014 Intel Corporation. All rights reserved. 5e107e82eSAnatoly Burakov * All rights reserved. 6e107e82eSAnatoly Burakov * 7e107e82eSAnatoly Burakov * Redistribution and use in source and binary forms, with or without 8e107e82eSAnatoly Burakov * modification, are permitted provided that the following conditions 9e107e82eSAnatoly Burakov * are met: 10e107e82eSAnatoly Burakov * 11e107e82eSAnatoly Burakov * * Redistributions of source code must retain the above copyright 12e107e82eSAnatoly Burakov * notice, this list of conditions and the following disclaimer. 13e107e82eSAnatoly Burakov * * Redistributions in binary form must reproduce the above copyright 14e107e82eSAnatoly Burakov * notice, this list of conditions and the following disclaimer in 15e107e82eSAnatoly Burakov * the documentation and/or other materials provided with the 16e107e82eSAnatoly Burakov * distribution. 17e107e82eSAnatoly Burakov * * Neither the name of Intel Corporation nor the names of its 18e107e82eSAnatoly Burakov * contributors may be used to endorse or promote products derived 19e107e82eSAnatoly Burakov * from this software without specific prior written permission. 20e107e82eSAnatoly Burakov * 21e107e82eSAnatoly Burakov * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 22e107e82eSAnatoly Burakov * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 23e107e82eSAnatoly Burakov * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 24e107e82eSAnatoly Burakov * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT 25e107e82eSAnatoly Burakov * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 26e107e82eSAnatoly Burakov * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT 27e107e82eSAnatoly Burakov * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 28e107e82eSAnatoly Burakov * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 29e107e82eSAnatoly Burakov * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 30e107e82eSAnatoly Burakov * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 31e107e82eSAnatoly Burakov * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 32e107e82eSAnatoly Burakov */ 33e107e82eSAnatoly Burakov 34e107e82eSAnatoly Burakov #include <stdio.h> 35e107e82eSAnatoly Burakov #include <stdlib.h> 36e107e82eSAnatoly Burakov #include <stdint.h> 37e107e82eSAnatoly Burakov #include <inttypes.h> 38e107e82eSAnatoly Burakov #include <sys/types.h> 39e107e82eSAnatoly Burakov #include <sys/param.h> 40e107e82eSAnatoly Burakov #include <string.h> 41e107e82eSAnatoly Burakov #include <sys/queue.h> 42e107e82eSAnatoly Burakov #include <stdarg.h> 43e107e82eSAnatoly Burakov #include <errno.h> 44e107e82eSAnatoly Burakov #include <getopt.h> 45e107e82eSAnatoly Burakov 46e107e82eSAnatoly Burakov #include <rte_common.h> 47e107e82eSAnatoly Burakov #include <rte_byteorder.h> 48e107e82eSAnatoly Burakov #include <rte_log.h> 49e107e82eSAnatoly Burakov #include <rte_memory.h> 50e107e82eSAnatoly Burakov #include <rte_memcpy.h> 51e107e82eSAnatoly Burakov #include <rte_memzone.h> 52e107e82eSAnatoly Burakov #include <rte_tailq.h> 53e107e82eSAnatoly Burakov #include <rte_eal.h> 54e107e82eSAnatoly Burakov #include <rte_per_lcore.h> 55e107e82eSAnatoly Burakov #include <rte_launch.h> 56e107e82eSAnatoly Burakov #include <rte_atomic.h> 57e107e82eSAnatoly Burakov #include <rte_cycles.h> 58e107e82eSAnatoly Burakov #include <rte_prefetch.h> 59e107e82eSAnatoly Burakov #include <rte_lcore.h> 60e107e82eSAnatoly Burakov #include <rte_per_lcore.h> 61e107e82eSAnatoly Burakov #include <rte_branch_prediction.h> 62e107e82eSAnatoly Burakov #include <rte_interrupts.h> 63e107e82eSAnatoly Burakov #include <rte_pci.h> 64e107e82eSAnatoly Burakov #include <rte_random.h> 65e107e82eSAnatoly Burakov #include <rte_debug.h> 66e107e82eSAnatoly Burakov #include <rte_ether.h> 67e107e82eSAnatoly Burakov #include <rte_ethdev.h> 68e107e82eSAnatoly Burakov #include <rte_ring.h> 69e107e82eSAnatoly Burakov #include <rte_mempool.h> 70e107e82eSAnatoly Burakov #include <rte_mbuf.h> 71e107e82eSAnatoly Burakov #include <rte_lpm.h> 7274de12b7SAnatoly Burakov #include <rte_lpm6.h> 73e107e82eSAnatoly Burakov #include <rte_ip.h> 7474de12b7SAnatoly Burakov #include <rte_string_fns.h> 75e107e82eSAnatoly Burakov 7674de12b7SAnatoly Burakov #include <rte_ip_frag.h> 7774de12b7SAnatoly Burakov 7874de12b7SAnatoly Burakov #define RTE_LOGTYPE_IP_FRAG RTE_LOGTYPE_USER1 79e107e82eSAnatoly Burakov 80e107e82eSAnatoly Burakov #define MBUF_SIZE (2048 + sizeof(struct rte_mbuf) + RTE_PKTMBUF_HEADROOM) 81e107e82eSAnatoly Burakov 82e107e82eSAnatoly Burakov /* allow max jumbo frame 9.5 KB */ 83e107e82eSAnatoly Burakov #define JUMBO_FRAME_MAX_SIZE 0x2600 84e107e82eSAnatoly Burakov 85e107e82eSAnatoly Burakov #define ROUNDUP_DIV(a, b) (((a) + (b) - 1) / (b)) 86e107e82eSAnatoly Burakov 87e107e82eSAnatoly Burakov /* 8874de12b7SAnatoly Burakov * Default byte size for the IPv6 Maximum Transfer Unit (MTU). 8974de12b7SAnatoly Burakov * This value includes the size of IPv6 header. 90e107e82eSAnatoly Burakov */ 9174de12b7SAnatoly Burakov #define IPV4_MTU_DEFAULT ETHER_MTU 9274de12b7SAnatoly Burakov #define IPV6_MTU_DEFAULT ETHER_MTU 9374de12b7SAnatoly Burakov 9474de12b7SAnatoly Burakov /* 9574de12b7SAnatoly Burakov * Default payload in bytes for the IPv6 packet. 9674de12b7SAnatoly Burakov */ 9774de12b7SAnatoly Burakov #define IPV4_DEFAULT_PAYLOAD (IPV4_MTU_DEFAULT - sizeof(struct ipv4_hdr)) 9874de12b7SAnatoly Burakov #define IPV6_DEFAULT_PAYLOAD (IPV6_MTU_DEFAULT - sizeof(struct ipv6_hdr)) 9974de12b7SAnatoly Burakov 10074de12b7SAnatoly Burakov /* 10174de12b7SAnatoly Burakov * Max number of fragments per packet expected - defined by config file. 10274de12b7SAnatoly Burakov */ 10374de12b7SAnatoly Burakov #define MAX_PACKET_FRAG RTE_LIBRTE_IP_FRAG_MAX_FRAG 104e107e82eSAnatoly Burakov 105e107e82eSAnatoly Burakov #define NB_MBUF 8192 106e107e82eSAnatoly Burakov 107e107e82eSAnatoly Burakov #define MAX_PKT_BURST 32 108e107e82eSAnatoly Burakov #define BURST_TX_DRAIN_US 100 /* TX drain every ~100us */ 109e107e82eSAnatoly Burakov 110e107e82eSAnatoly Burakov /* Configure how many packets ahead to prefetch, when reading packets */ 111e107e82eSAnatoly Burakov #define PREFETCH_OFFSET 3 112e107e82eSAnatoly Burakov 113e107e82eSAnatoly Burakov /* 114e107e82eSAnatoly Burakov * Configurable number of RX/TX ring descriptors 115e107e82eSAnatoly Burakov */ 116e107e82eSAnatoly Burakov #define RTE_TEST_RX_DESC_DEFAULT 128 117e107e82eSAnatoly Burakov #define RTE_TEST_TX_DESC_DEFAULT 512 118e107e82eSAnatoly Burakov static uint16_t nb_rxd = RTE_TEST_RX_DESC_DEFAULT; 119e107e82eSAnatoly Burakov static uint16_t nb_txd = RTE_TEST_TX_DESC_DEFAULT; 120e107e82eSAnatoly Burakov 121e107e82eSAnatoly Burakov /* ethernet addresses of ports */ 122e107e82eSAnatoly Burakov static struct ether_addr ports_eth_addr[RTE_MAX_ETHPORTS]; 12374de12b7SAnatoly Burakov 12474de12b7SAnatoly Burakov #ifndef IPv4_BYTES 12574de12b7SAnatoly Burakov #define IPv4_BYTES_FMT "%" PRIu8 ".%" PRIu8 ".%" PRIu8 ".%" PRIu8 12674de12b7SAnatoly Burakov #define IPv4_BYTES(addr) \ 12774de12b7SAnatoly Burakov (uint8_t) (((addr) >> 24) & 0xFF),\ 12874de12b7SAnatoly Burakov (uint8_t) (((addr) >> 16) & 0xFF),\ 12974de12b7SAnatoly Burakov (uint8_t) (((addr) >> 8) & 0xFF),\ 13074de12b7SAnatoly Burakov (uint8_t) ((addr) & 0xFF) 13174de12b7SAnatoly Burakov #endif 13274de12b7SAnatoly Burakov 13374de12b7SAnatoly Burakov #ifndef IPv6_BYTES 13474de12b7SAnatoly Burakov #define IPv6_BYTES_FMT "%02x%02x:%02x%02x:%02x%02x:%02x%02x:"\ 13574de12b7SAnatoly Burakov "%02x%02x:%02x%02x:%02x%02x:%02x%02x" 13674de12b7SAnatoly Burakov #define IPv6_BYTES(addr) \ 13774de12b7SAnatoly Burakov addr[0], addr[1], addr[2], addr[3], \ 13874de12b7SAnatoly Burakov addr[4], addr[5], addr[6], addr[7], \ 13974de12b7SAnatoly Burakov addr[8], addr[9], addr[10], addr[11],\ 14074de12b7SAnatoly Burakov addr[12], addr[13],addr[14], addr[15] 14174de12b7SAnatoly Burakov #endif 14274de12b7SAnatoly Burakov 14374de12b7SAnatoly Burakov #define IPV6_ADDR_LEN 16 144e107e82eSAnatoly Burakov 145e107e82eSAnatoly Burakov /* mask of enabled ports */ 146e107e82eSAnatoly Burakov static int enabled_port_mask = 0; 147e107e82eSAnatoly Burakov 148e107e82eSAnatoly Burakov static int rx_queue_per_lcore = 1; 149e107e82eSAnatoly Burakov 150e107e82eSAnatoly Burakov #define MBUF_TABLE_SIZE (2 * MAX(MAX_PKT_BURST, MAX_PACKET_FRAG)) 151e107e82eSAnatoly Burakov 152e107e82eSAnatoly Burakov struct mbuf_table { 153e107e82eSAnatoly Burakov uint16_t len; 154e107e82eSAnatoly Burakov struct rte_mbuf *m_table[MBUF_TABLE_SIZE]; 155e107e82eSAnatoly Burakov }; 156e107e82eSAnatoly Burakov 15774de12b7SAnatoly Burakov struct rx_queue { 15874de12b7SAnatoly Burakov struct rte_mempool *direct_pool; 15974de12b7SAnatoly Burakov struct rte_mempool *indirect_pool; 16074de12b7SAnatoly Burakov struct rte_lpm *lpm; 16174de12b7SAnatoly Burakov struct rte_lpm6 *lpm6; 16274de12b7SAnatoly Burakov uint8_t portid; 16374de12b7SAnatoly Burakov }; 16474de12b7SAnatoly Burakov 165e107e82eSAnatoly Burakov #define MAX_RX_QUEUE_PER_LCORE 16 166e107e82eSAnatoly Burakov #define MAX_TX_QUEUE_PER_PORT 16 167e107e82eSAnatoly Burakov struct lcore_queue_conf { 168e107e82eSAnatoly Burakov uint16_t n_rx_queue; 169e107e82eSAnatoly Burakov uint16_t tx_queue_id[RTE_MAX_ETHPORTS]; 17074de12b7SAnatoly Burakov struct rx_queue rx_queue_list[MAX_RX_QUEUE_PER_LCORE]; 171e107e82eSAnatoly Burakov struct mbuf_table tx_mbufs[RTE_MAX_ETHPORTS]; 172e107e82eSAnatoly Burakov } __rte_cache_aligned; 173e107e82eSAnatoly Burakov struct lcore_queue_conf lcore_queue_conf[RTE_MAX_LCORE]; 174e107e82eSAnatoly Burakov 175e107e82eSAnatoly Burakov static const struct rte_eth_conf port_conf = { 176e107e82eSAnatoly Burakov .rxmode = { 177e107e82eSAnatoly Burakov .max_rx_pkt_len = JUMBO_FRAME_MAX_SIZE, 178e107e82eSAnatoly Burakov .split_hdr_size = 0, 179e107e82eSAnatoly Burakov .header_split = 0, /**< Header Split disabled */ 18074de12b7SAnatoly Burakov .hw_ip_checksum = 1, /**< IP checksum offload enabled */ 181e107e82eSAnatoly Burakov .hw_vlan_filter = 0, /**< VLAN filtering disabled */ 182e107e82eSAnatoly Burakov .jumbo_frame = 1, /**< Jumbo Frame Support enabled */ 183e107e82eSAnatoly Burakov .hw_strip_crc = 0, /**< CRC stripped by hardware */ 184e107e82eSAnatoly Burakov }, 185e107e82eSAnatoly Burakov .txmode = { 186e107e82eSAnatoly Burakov .mq_mode = ETH_MQ_TX_NONE, 187e107e82eSAnatoly Burakov }, 188e107e82eSAnatoly Burakov }; 189e107e82eSAnatoly Burakov 19074de12b7SAnatoly Burakov /* 19174de12b7SAnatoly Burakov * IPv4 forwarding table 19274de12b7SAnatoly Burakov */ 19374de12b7SAnatoly Burakov struct l3fwd_ipv4_route { 194e107e82eSAnatoly Burakov uint32_t ip; 195e107e82eSAnatoly Burakov uint8_t depth; 196e107e82eSAnatoly Burakov uint8_t if_out; 197e107e82eSAnatoly Burakov }; 198e107e82eSAnatoly Burakov 19974de12b7SAnatoly Burakov struct l3fwd_ipv4_route l3fwd_ipv4_route_array[] = { 20074de12b7SAnatoly Burakov {IPv4(100,10,0,0), 16, 0}, 20174de12b7SAnatoly Burakov {IPv4(100,20,0,0), 16, 1}, 20274de12b7SAnatoly Burakov {IPv4(100,30,0,0), 16, 2}, 20374de12b7SAnatoly Burakov {IPv4(100,40,0,0), 16, 3}, 20474de12b7SAnatoly Burakov {IPv4(100,50,0,0), 16, 4}, 20574de12b7SAnatoly Burakov {IPv4(100,60,0,0), 16, 5}, 20674de12b7SAnatoly Burakov {IPv4(100,70,0,0), 16, 6}, 20774de12b7SAnatoly Burakov {IPv4(100,80,0,0), 16, 7}, 208e107e82eSAnatoly Burakov }; 209e107e82eSAnatoly Burakov 21074de12b7SAnatoly Burakov /* 21174de12b7SAnatoly Burakov * IPv6 forwarding table 21274de12b7SAnatoly Burakov */ 213e107e82eSAnatoly Burakov 21474de12b7SAnatoly Burakov struct l3fwd_ipv6_route { 21574de12b7SAnatoly Burakov uint8_t ip[IPV6_ADDR_LEN]; 21674de12b7SAnatoly Burakov uint8_t depth; 21774de12b7SAnatoly Burakov uint8_t if_out; 21874de12b7SAnatoly Burakov }; 219e107e82eSAnatoly Burakov 22074de12b7SAnatoly Burakov static struct l3fwd_ipv6_route l3fwd_ipv6_route_array[] = { 22174de12b7SAnatoly Burakov {{1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 0}, 22274de12b7SAnatoly Burakov {{2,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 1}, 22374de12b7SAnatoly Burakov {{3,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 2}, 22474de12b7SAnatoly Burakov {{4,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 3}, 22574de12b7SAnatoly Burakov {{5,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 4}, 22674de12b7SAnatoly Burakov {{6,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 5}, 22774de12b7SAnatoly Burakov {{7,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 6}, 22874de12b7SAnatoly Burakov {{8,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 7}, 22974de12b7SAnatoly Burakov }; 23074de12b7SAnatoly Burakov 23174de12b7SAnatoly Burakov #define LPM_MAX_RULES 1024 23274de12b7SAnatoly Burakov #define LPM6_MAX_RULES 1024 23374de12b7SAnatoly Burakov #define LPM6_NUMBER_TBL8S (1 << 16) 23474de12b7SAnatoly Burakov 23574de12b7SAnatoly Burakov struct rte_lpm6_config lpm6_config = { 23674de12b7SAnatoly Burakov .max_rules = LPM6_MAX_RULES, 23774de12b7SAnatoly Burakov .number_tbl8s = LPM6_NUMBER_TBL8S, 23874de12b7SAnatoly Burakov .flags = 0 23974de12b7SAnatoly Burakov }; 24074de12b7SAnatoly Burakov 24174de12b7SAnatoly Burakov static struct rte_mempool *socket_direct_pool[RTE_MAX_NUMA_NODES]; 24274de12b7SAnatoly Burakov static struct rte_mempool *socket_indirect_pool[RTE_MAX_NUMA_NODES]; 24374de12b7SAnatoly Burakov static struct rte_lpm *socket_lpm[RTE_MAX_NUMA_NODES]; 24474de12b7SAnatoly Burakov static struct rte_lpm6 *socket_lpm6[RTE_MAX_NUMA_NODES]; 245e107e82eSAnatoly Burakov 246e107e82eSAnatoly Burakov /* Send burst of packets on an output interface */ 247e107e82eSAnatoly Burakov static inline int 248e107e82eSAnatoly Burakov send_burst(struct lcore_queue_conf *qconf, uint16_t n, uint8_t port) 249e107e82eSAnatoly Burakov { 250e107e82eSAnatoly Burakov struct rte_mbuf **m_table; 251e107e82eSAnatoly Burakov int ret; 252e107e82eSAnatoly Burakov uint16_t queueid; 253e107e82eSAnatoly Burakov 254e107e82eSAnatoly Burakov queueid = qconf->tx_queue_id[port]; 255e107e82eSAnatoly Burakov m_table = (struct rte_mbuf **)qconf->tx_mbufs[port].m_table; 256e107e82eSAnatoly Burakov 257e107e82eSAnatoly Burakov ret = rte_eth_tx_burst(port, queueid, m_table, n); 258e107e82eSAnatoly Burakov if (unlikely(ret < n)) { 259e107e82eSAnatoly Burakov do { 260e107e82eSAnatoly Burakov rte_pktmbuf_free(m_table[ret]); 261e107e82eSAnatoly Burakov } while (++ret < n); 262e107e82eSAnatoly Burakov } 263e107e82eSAnatoly Burakov 264e107e82eSAnatoly Burakov return 0; 265e107e82eSAnatoly Burakov } 266e107e82eSAnatoly Burakov 267e107e82eSAnatoly Burakov static inline void 26874de12b7SAnatoly Burakov l3fwd_simple_forward(struct rte_mbuf *m, struct lcore_queue_conf *qconf, 26974de12b7SAnatoly Burakov uint8_t queueid, uint8_t port_in) 270e107e82eSAnatoly Burakov { 27174de12b7SAnatoly Burakov struct rx_queue *rxq; 27274de12b7SAnatoly Burakov uint32_t i, len; 27374de12b7SAnatoly Burakov uint8_t next_hop, port_out, ipv6; 274e107e82eSAnatoly Burakov int32_t len2; 275e107e82eSAnatoly Burakov 27674de12b7SAnatoly Burakov ipv6 = 0; 27774de12b7SAnatoly Burakov rxq = &qconf->rx_queue_list[queueid]; 27874de12b7SAnatoly Burakov 27974de12b7SAnatoly Burakov /* by default, send everything back to the source port */ 28074de12b7SAnatoly Burakov port_out = port_in; 281e107e82eSAnatoly Burakov 282e107e82eSAnatoly Burakov /* Remove the Ethernet header and trailer from the input packet */ 283e107e82eSAnatoly Burakov rte_pktmbuf_adj(m, (uint16_t)sizeof(struct ether_hdr)); 284e107e82eSAnatoly Burakov 28574de12b7SAnatoly Burakov /* Build transmission burst */ 28674de12b7SAnatoly Burakov len = qconf->tx_mbufs[port_out].len; 28774de12b7SAnatoly Burakov 28874de12b7SAnatoly Burakov /* if this is an IPv4 packet */ 28974de12b7SAnatoly Burakov if (m->ol_flags & PKT_RX_IPV4_HDR) { 29074de12b7SAnatoly Burakov struct ipv4_hdr *ip_hdr; 29174de12b7SAnatoly Burakov uint32_t ip_dst; 292e107e82eSAnatoly Burakov /* Read the lookup key (i.e. ip_dst) from the input packet */ 293e107e82eSAnatoly Burakov ip_hdr = rte_pktmbuf_mtod(m, struct ipv4_hdr *); 294e107e82eSAnatoly Burakov ip_dst = rte_be_to_cpu_32(ip_hdr->dst_addr); 295e107e82eSAnatoly Burakov 296e107e82eSAnatoly Burakov /* Find destination port */ 29774de12b7SAnatoly Burakov if (rte_lpm_lookup(rxq->lpm, ip_dst, &next_hop) == 0 && 29874de12b7SAnatoly Burakov (enabled_port_mask & 1 << next_hop) != 0) { 299e107e82eSAnatoly Burakov port_out = next_hop; 300e107e82eSAnatoly Burakov 30174de12b7SAnatoly Burakov /* Build transmission burst for new port */ 302e107e82eSAnatoly Burakov len = qconf->tx_mbufs[port_out].len; 30374de12b7SAnatoly Burakov } 304e107e82eSAnatoly Burakov 305e107e82eSAnatoly Burakov /* if we don't need to do any fragmentation */ 306ea672a8bSOlivier Matz if (likely (IPV4_MTU_DEFAULT >= m->pkt_len)) { 307e107e82eSAnatoly Burakov qconf->tx_mbufs[port_out].m_table[len] = m; 308e107e82eSAnatoly Burakov len2 = 1; 309e107e82eSAnatoly Burakov } else { 310e107e82eSAnatoly Burakov len2 = rte_ipv4_fragment_packet(m, 311e107e82eSAnatoly Burakov &qconf->tx_mbufs[port_out].m_table[len], 312e107e82eSAnatoly Burakov (uint16_t)(MBUF_TABLE_SIZE - len), 313e107e82eSAnatoly Burakov IPV4_MTU_DEFAULT, 31474de12b7SAnatoly Burakov rxq->direct_pool, rxq->indirect_pool); 315e107e82eSAnatoly Burakov 316e107e82eSAnatoly Burakov /* Free input packet */ 317e107e82eSAnatoly Burakov rte_pktmbuf_free(m); 318e107e82eSAnatoly Burakov 319e107e82eSAnatoly Burakov /* If we fail to fragment the packet */ 320e107e82eSAnatoly Burakov if (unlikely (len2 < 0)) 321e107e82eSAnatoly Burakov return; 322e107e82eSAnatoly Burakov } 32374de12b7SAnatoly Burakov } 32474de12b7SAnatoly Burakov /* if this is an IPv6 packet */ 32574de12b7SAnatoly Burakov else if (m->ol_flags & PKT_RX_IPV6_HDR) { 32674de12b7SAnatoly Burakov struct ipv6_hdr *ip_hdr; 32774de12b7SAnatoly Burakov 32874de12b7SAnatoly Burakov ipv6 = 1; 32974de12b7SAnatoly Burakov 33074de12b7SAnatoly Burakov /* Read the lookup key (i.e. ip_dst) from the input packet */ 33174de12b7SAnatoly Burakov ip_hdr = rte_pktmbuf_mtod(m, struct ipv6_hdr *); 33274de12b7SAnatoly Burakov 33374de12b7SAnatoly Burakov /* Find destination port */ 33474de12b7SAnatoly Burakov if (rte_lpm6_lookup(rxq->lpm6, ip_hdr->dst_addr, &next_hop) == 0 && 33574de12b7SAnatoly Burakov (enabled_port_mask & 1 << next_hop) != 0) { 33674de12b7SAnatoly Burakov port_out = next_hop; 33774de12b7SAnatoly Burakov 33874de12b7SAnatoly Burakov /* Build transmission burst for new port */ 33974de12b7SAnatoly Burakov len = qconf->tx_mbufs[port_out].len; 34074de12b7SAnatoly Burakov } 34174de12b7SAnatoly Burakov 34274de12b7SAnatoly Burakov /* if we don't need to do any fragmentation */ 343ea672a8bSOlivier Matz if (likely (IPV6_MTU_DEFAULT >= m->pkt_len)) { 34474de12b7SAnatoly Burakov qconf->tx_mbufs[port_out].m_table[len] = m; 34574de12b7SAnatoly Burakov len2 = 1; 34674de12b7SAnatoly Burakov } else { 34774de12b7SAnatoly Burakov len2 = rte_ipv6_fragment_packet(m, 34874de12b7SAnatoly Burakov &qconf->tx_mbufs[port_out].m_table[len], 34974de12b7SAnatoly Burakov (uint16_t)(MBUF_TABLE_SIZE - len), 35074de12b7SAnatoly Burakov IPV6_MTU_DEFAULT, 35174de12b7SAnatoly Burakov rxq->direct_pool, rxq->indirect_pool); 35274de12b7SAnatoly Burakov 35374de12b7SAnatoly Burakov /* Free input packet */ 35474de12b7SAnatoly Burakov rte_pktmbuf_free(m); 35574de12b7SAnatoly Burakov 35674de12b7SAnatoly Burakov /* If we fail to fragment the packet */ 35774de12b7SAnatoly Burakov if (unlikely (len2 < 0)) 35874de12b7SAnatoly Burakov return; 35974de12b7SAnatoly Burakov } 36074de12b7SAnatoly Burakov } 36174de12b7SAnatoly Burakov /* else, just forward the packet */ 36274de12b7SAnatoly Burakov else { 36374de12b7SAnatoly Burakov qconf->tx_mbufs[port_out].m_table[len] = m; 36474de12b7SAnatoly Burakov len2 = 1; 36574de12b7SAnatoly Burakov } 366e107e82eSAnatoly Burakov 367e107e82eSAnatoly Burakov for (i = len; i < len + len2; i ++) { 36874de12b7SAnatoly Burakov void *d_addr_bytes; 36974de12b7SAnatoly Burakov 370e107e82eSAnatoly Burakov m = qconf->tx_mbufs[port_out].m_table[i]; 371e107e82eSAnatoly Burakov struct ether_hdr *eth_hdr = (struct ether_hdr *) 372e107e82eSAnatoly Burakov rte_pktmbuf_prepend(m, (uint16_t)sizeof(struct ether_hdr)); 373e107e82eSAnatoly Burakov if (eth_hdr == NULL) { 374e107e82eSAnatoly Burakov rte_panic("No headroom in mbuf.\n"); 375e107e82eSAnatoly Burakov } 376e107e82eSAnatoly Burakov 3777869536fSBruce Richardson m->l2_len = sizeof(struct ether_hdr); 378e107e82eSAnatoly Burakov 37974de12b7SAnatoly Burakov /* 02:00:00:00:00:xx */ 38074de12b7SAnatoly Burakov d_addr_bytes = ð_hdr->d_addr.addr_bytes[0]; 38174de12b7SAnatoly Burakov *((uint64_t *)d_addr_bytes) = 0x000000000002 + ((uint64_t)port_out << 40); 38274de12b7SAnatoly Burakov 38374de12b7SAnatoly Burakov /* src addr */ 384e107e82eSAnatoly Burakov ether_addr_copy(&ports_eth_addr[port_out], ð_hdr->s_addr); 38574de12b7SAnatoly Burakov if (ipv6) 38674de12b7SAnatoly Burakov eth_hdr->ether_type = rte_be_to_cpu_16(ETHER_TYPE_IPv6); 38774de12b7SAnatoly Burakov else 388e107e82eSAnatoly Burakov eth_hdr->ether_type = rte_be_to_cpu_16(ETHER_TYPE_IPv4); 389e107e82eSAnatoly Burakov } 390e107e82eSAnatoly Burakov 391e107e82eSAnatoly Burakov len += len2; 392e107e82eSAnatoly Burakov 393e107e82eSAnatoly Burakov if (likely(len < MAX_PKT_BURST)) { 394e107e82eSAnatoly Burakov qconf->tx_mbufs[port_out].len = (uint16_t)len; 395e107e82eSAnatoly Burakov return; 396e107e82eSAnatoly Burakov } 397e107e82eSAnatoly Burakov 398e107e82eSAnatoly Burakov /* Transmit packets */ 399e107e82eSAnatoly Burakov send_burst(qconf, (uint16_t)len, port_out); 400e107e82eSAnatoly Burakov qconf->tx_mbufs[port_out].len = 0; 401e107e82eSAnatoly Burakov } 402e107e82eSAnatoly Burakov 403e107e82eSAnatoly Burakov /* main processing loop */ 404e107e82eSAnatoly Burakov static int 405e107e82eSAnatoly Burakov main_loop(__attribute__((unused)) void *dummy) 406e107e82eSAnatoly Burakov { 407e107e82eSAnatoly Burakov struct rte_mbuf *pkts_burst[MAX_PKT_BURST]; 408e107e82eSAnatoly Burakov unsigned lcore_id; 409e107e82eSAnatoly Burakov uint64_t prev_tsc, diff_tsc, cur_tsc; 410e107e82eSAnatoly Burakov int i, j, nb_rx; 411e107e82eSAnatoly Burakov uint8_t portid; 412e107e82eSAnatoly Burakov struct lcore_queue_conf *qconf; 413e107e82eSAnatoly Burakov const uint64_t drain_tsc = (rte_get_tsc_hz() + US_PER_S - 1) / US_PER_S * BURST_TX_DRAIN_US; 414e107e82eSAnatoly Burakov 415e107e82eSAnatoly Burakov prev_tsc = 0; 416e107e82eSAnatoly Burakov 417e107e82eSAnatoly Burakov lcore_id = rte_lcore_id(); 418e107e82eSAnatoly Burakov qconf = &lcore_queue_conf[lcore_id]; 419e107e82eSAnatoly Burakov 420e107e82eSAnatoly Burakov if (qconf->n_rx_queue == 0) { 42174de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "lcore %u has nothing to do\n", lcore_id); 422e107e82eSAnatoly Burakov return 0; 423e107e82eSAnatoly Burakov } 424e107e82eSAnatoly Burakov 42574de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "entering main loop on lcore %u\n", lcore_id); 426e107e82eSAnatoly Burakov 427e107e82eSAnatoly Burakov for (i = 0; i < qconf->n_rx_queue; i++) { 428e107e82eSAnatoly Burakov 42974de12b7SAnatoly Burakov portid = qconf->rx_queue_list[i].portid; 43074de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, " -- lcoreid=%u portid=%d\n", lcore_id, 431e107e82eSAnatoly Burakov (int) portid); 432e107e82eSAnatoly Burakov } 433e107e82eSAnatoly Burakov 434e107e82eSAnatoly Burakov while (1) { 435e107e82eSAnatoly Burakov 436e107e82eSAnatoly Burakov cur_tsc = rte_rdtsc(); 437e107e82eSAnatoly Burakov 438e107e82eSAnatoly Burakov /* 439e107e82eSAnatoly Burakov * TX burst queue drain 440e107e82eSAnatoly Burakov */ 441e107e82eSAnatoly Burakov diff_tsc = cur_tsc - prev_tsc; 442e107e82eSAnatoly Burakov if (unlikely(diff_tsc > drain_tsc)) { 443e107e82eSAnatoly Burakov 444e107e82eSAnatoly Burakov /* 445e107e82eSAnatoly Burakov * This could be optimized (use queueid instead of 446e107e82eSAnatoly Burakov * portid), but it is not called so often 447e107e82eSAnatoly Burakov */ 448e107e82eSAnatoly Burakov for (portid = 0; portid < RTE_MAX_ETHPORTS; portid++) { 449e107e82eSAnatoly Burakov if (qconf->tx_mbufs[portid].len == 0) 450e107e82eSAnatoly Burakov continue; 451e107e82eSAnatoly Burakov send_burst(&lcore_queue_conf[lcore_id], 452e107e82eSAnatoly Burakov qconf->tx_mbufs[portid].len, 453e107e82eSAnatoly Burakov portid); 454e107e82eSAnatoly Burakov qconf->tx_mbufs[portid].len = 0; 455e107e82eSAnatoly Burakov } 456e107e82eSAnatoly Burakov 457e107e82eSAnatoly Burakov prev_tsc = cur_tsc; 458e107e82eSAnatoly Burakov } 459e107e82eSAnatoly Burakov 460e107e82eSAnatoly Burakov /* 461e107e82eSAnatoly Burakov * Read packet from RX queues 462e107e82eSAnatoly Burakov */ 463e107e82eSAnatoly Burakov for (i = 0; i < qconf->n_rx_queue; i++) { 464e107e82eSAnatoly Burakov 46574de12b7SAnatoly Burakov portid = qconf->rx_queue_list[i].portid; 466e107e82eSAnatoly Burakov nb_rx = rte_eth_rx_burst(portid, 0, pkts_burst, 467e107e82eSAnatoly Burakov MAX_PKT_BURST); 468e107e82eSAnatoly Burakov 469e107e82eSAnatoly Burakov /* Prefetch first packets */ 470e107e82eSAnatoly Burakov for (j = 0; j < PREFETCH_OFFSET && j < nb_rx; j++) { 471e107e82eSAnatoly Burakov rte_prefetch0(rte_pktmbuf_mtod( 472e107e82eSAnatoly Burakov pkts_burst[j], void *)); 473e107e82eSAnatoly Burakov } 474e107e82eSAnatoly Burakov 475e107e82eSAnatoly Burakov /* Prefetch and forward already prefetched packets */ 476e107e82eSAnatoly Burakov for (j = 0; j < (nb_rx - PREFETCH_OFFSET); j++) { 477e107e82eSAnatoly Burakov rte_prefetch0(rte_pktmbuf_mtod(pkts_burst[ 478e107e82eSAnatoly Burakov j + PREFETCH_OFFSET], void *)); 47974de12b7SAnatoly Burakov l3fwd_simple_forward(pkts_burst[j], qconf, i, portid); 480e107e82eSAnatoly Burakov } 481e107e82eSAnatoly Burakov 482e107e82eSAnatoly Burakov /* Forward remaining prefetched packets */ 483e107e82eSAnatoly Burakov for (; j < nb_rx; j++) { 48474de12b7SAnatoly Burakov l3fwd_simple_forward(pkts_burst[j], qconf, i, portid); 485e107e82eSAnatoly Burakov } 486e107e82eSAnatoly Burakov } 487e107e82eSAnatoly Burakov } 488e107e82eSAnatoly Burakov } 489e107e82eSAnatoly Burakov 490e107e82eSAnatoly Burakov /* display usage */ 491e107e82eSAnatoly Burakov static void 492e107e82eSAnatoly Burakov print_usage(const char *prgname) 493e107e82eSAnatoly Burakov { 494e107e82eSAnatoly Burakov printf("%s [EAL options] -- -p PORTMASK [-q NQ]\n" 495e107e82eSAnatoly Burakov " -p PORTMASK: hexadecimal bitmask of ports to configure\n" 496e107e82eSAnatoly Burakov " -q NQ: number of queue (=ports) per lcore (default is 1)\n", 497e107e82eSAnatoly Burakov prgname); 498e107e82eSAnatoly Burakov } 499e107e82eSAnatoly Burakov 500e107e82eSAnatoly Burakov static int 501e107e82eSAnatoly Burakov parse_portmask(const char *portmask) 502e107e82eSAnatoly Burakov { 503e107e82eSAnatoly Burakov char *end = NULL; 504e107e82eSAnatoly Burakov unsigned long pm; 505e107e82eSAnatoly Burakov 506e107e82eSAnatoly Burakov /* parse hexadecimal string */ 507e107e82eSAnatoly Burakov pm = strtoul(portmask, &end, 16); 508e107e82eSAnatoly Burakov if ((portmask[0] == '\0') || (end == NULL) || (*end != '\0')) 509e107e82eSAnatoly Burakov return -1; 510e107e82eSAnatoly Burakov 511e107e82eSAnatoly Burakov if (pm == 0) 512e107e82eSAnatoly Burakov return -1; 513e107e82eSAnatoly Burakov 514e107e82eSAnatoly Burakov return pm; 515e107e82eSAnatoly Burakov } 516e107e82eSAnatoly Burakov 517e107e82eSAnatoly Burakov static int 518e107e82eSAnatoly Burakov parse_nqueue(const char *q_arg) 519e107e82eSAnatoly Burakov { 520e107e82eSAnatoly Burakov char *end = NULL; 521e107e82eSAnatoly Burakov unsigned long n; 522e107e82eSAnatoly Burakov 523e107e82eSAnatoly Burakov /* parse hexadecimal string */ 524e107e82eSAnatoly Burakov n = strtoul(q_arg, &end, 10); 525e107e82eSAnatoly Burakov if ((q_arg[0] == '\0') || (end == NULL) || (*end != '\0')) 526e107e82eSAnatoly Burakov return -1; 527e107e82eSAnatoly Burakov if (n == 0) 528e107e82eSAnatoly Burakov return -1; 529e107e82eSAnatoly Burakov if (n >= MAX_RX_QUEUE_PER_LCORE) 530e107e82eSAnatoly Burakov return -1; 531e107e82eSAnatoly Burakov 532e107e82eSAnatoly Burakov return n; 533e107e82eSAnatoly Burakov } 534e107e82eSAnatoly Burakov 535e107e82eSAnatoly Burakov /* Parse the argument given in the command line of the application */ 536e107e82eSAnatoly Burakov static int 537e107e82eSAnatoly Burakov parse_args(int argc, char **argv) 538e107e82eSAnatoly Burakov { 539e107e82eSAnatoly Burakov int opt, ret; 540e107e82eSAnatoly Burakov char **argvopt; 541e107e82eSAnatoly Burakov int option_index; 542e107e82eSAnatoly Burakov char *prgname = argv[0]; 543e107e82eSAnatoly Burakov static struct option lgopts[] = { 544e107e82eSAnatoly Burakov {NULL, 0, 0, 0} 545e107e82eSAnatoly Burakov }; 546e107e82eSAnatoly Burakov 547e107e82eSAnatoly Burakov argvopt = argv; 548e107e82eSAnatoly Burakov 549e107e82eSAnatoly Burakov while ((opt = getopt_long(argc, argvopt, "p:q:", 550e107e82eSAnatoly Burakov lgopts, &option_index)) != EOF) { 551e107e82eSAnatoly Burakov 552e107e82eSAnatoly Burakov switch (opt) { 553e107e82eSAnatoly Burakov /* portmask */ 554e107e82eSAnatoly Burakov case 'p': 555e107e82eSAnatoly Burakov enabled_port_mask = parse_portmask(optarg); 556e107e82eSAnatoly Burakov if (enabled_port_mask < 0) { 557e107e82eSAnatoly Burakov printf("invalid portmask\n"); 558e107e82eSAnatoly Burakov print_usage(prgname); 559e107e82eSAnatoly Burakov return -1; 560e107e82eSAnatoly Burakov } 561e107e82eSAnatoly Burakov break; 562e107e82eSAnatoly Burakov 563e107e82eSAnatoly Burakov /* nqueue */ 564e107e82eSAnatoly Burakov case 'q': 565e107e82eSAnatoly Burakov rx_queue_per_lcore = parse_nqueue(optarg); 566e107e82eSAnatoly Burakov if (rx_queue_per_lcore < 0) { 567e107e82eSAnatoly Burakov printf("invalid queue number\n"); 568e107e82eSAnatoly Burakov print_usage(prgname); 569e107e82eSAnatoly Burakov return -1; 570e107e82eSAnatoly Burakov } 571e107e82eSAnatoly Burakov break; 572e107e82eSAnatoly Burakov 573e107e82eSAnatoly Burakov /* long options */ 574e107e82eSAnatoly Burakov case 0: 575e107e82eSAnatoly Burakov print_usage(prgname); 576e107e82eSAnatoly Burakov return -1; 577e107e82eSAnatoly Burakov 578e107e82eSAnatoly Burakov default: 579e107e82eSAnatoly Burakov print_usage(prgname); 580e107e82eSAnatoly Burakov return -1; 581e107e82eSAnatoly Burakov } 582e107e82eSAnatoly Burakov } 583e107e82eSAnatoly Burakov 584e107e82eSAnatoly Burakov if (enabled_port_mask == 0) { 585e107e82eSAnatoly Burakov printf("portmask not specified\n"); 586e107e82eSAnatoly Burakov print_usage(prgname); 587e107e82eSAnatoly Burakov return -1; 588e107e82eSAnatoly Burakov } 589e107e82eSAnatoly Burakov 590e107e82eSAnatoly Burakov if (optind >= 0) 591e107e82eSAnatoly Burakov argv[optind-1] = prgname; 592e107e82eSAnatoly Burakov 593e107e82eSAnatoly Burakov ret = optind-1; 594e107e82eSAnatoly Burakov optind = 0; /* reset getopt lib */ 595e107e82eSAnatoly Burakov return ret; 596e107e82eSAnatoly Burakov } 597e107e82eSAnatoly Burakov 598e107e82eSAnatoly Burakov static void 599e107e82eSAnatoly Burakov print_ethaddr(const char *name, struct ether_addr *eth_addr) 600e107e82eSAnatoly Burakov { 601ec3d82dbSCunming Liang char buf[ETHER_ADDR_FMT_SIZE]; 602ec3d82dbSCunming Liang ether_format_addr(buf, ETHER_ADDR_FMT_SIZE, eth_addr); 603ec3d82dbSCunming Liang printf("%s%s", name, buf); 604e107e82eSAnatoly Burakov } 605e107e82eSAnatoly Burakov 606e107e82eSAnatoly Burakov /* Check the link status of all ports in up to 9s, and print them finally */ 607e107e82eSAnatoly Burakov static void 608e107e82eSAnatoly Burakov check_all_ports_link_status(uint8_t port_num, uint32_t port_mask) 609e107e82eSAnatoly Burakov { 610e107e82eSAnatoly Burakov #define CHECK_INTERVAL 100 /* 100ms */ 611e107e82eSAnatoly Burakov #define MAX_CHECK_TIME 90 /* 9s (90 * 100ms) in total */ 612e107e82eSAnatoly Burakov uint8_t portid, count, all_ports_up, print_flag = 0; 613e107e82eSAnatoly Burakov struct rte_eth_link link; 614e107e82eSAnatoly Burakov 615e107e82eSAnatoly Burakov printf("\nChecking link status"); 616e107e82eSAnatoly Burakov fflush(stdout); 617e107e82eSAnatoly Burakov for (count = 0; count <= MAX_CHECK_TIME; count++) { 618e107e82eSAnatoly Burakov all_ports_up = 1; 619e107e82eSAnatoly Burakov for (portid = 0; portid < port_num; portid++) { 620e107e82eSAnatoly Burakov if ((port_mask & (1 << portid)) == 0) 621e107e82eSAnatoly Burakov continue; 622e107e82eSAnatoly Burakov memset(&link, 0, sizeof(link)); 623e107e82eSAnatoly Burakov rte_eth_link_get_nowait(portid, &link); 624e107e82eSAnatoly Burakov /* print link status if flag set */ 625e107e82eSAnatoly Burakov if (print_flag == 1) { 626e107e82eSAnatoly Burakov if (link.link_status) 627e107e82eSAnatoly Burakov printf("Port %d Link Up - speed %u " 628e107e82eSAnatoly Burakov "Mbps - %s\n", (uint8_t)portid, 629e107e82eSAnatoly Burakov (unsigned)link.link_speed, 630e107e82eSAnatoly Burakov (link.link_duplex == ETH_LINK_FULL_DUPLEX) ? 631e107e82eSAnatoly Burakov ("full-duplex") : ("half-duplex\n")); 632e107e82eSAnatoly Burakov else 633e107e82eSAnatoly Burakov printf("Port %d Link Down\n", 634e107e82eSAnatoly Burakov (uint8_t)portid); 635e107e82eSAnatoly Burakov continue; 636e107e82eSAnatoly Burakov } 637e107e82eSAnatoly Burakov /* clear all_ports_up flag if any link down */ 638e107e82eSAnatoly Burakov if (link.link_status == 0) { 639e107e82eSAnatoly Burakov all_ports_up = 0; 640e107e82eSAnatoly Burakov break; 641e107e82eSAnatoly Burakov } 642e107e82eSAnatoly Burakov } 643e107e82eSAnatoly Burakov /* after finally printing all link status, get out */ 644e107e82eSAnatoly Burakov if (print_flag == 1) 645e107e82eSAnatoly Burakov break; 646e107e82eSAnatoly Burakov 647e107e82eSAnatoly Burakov if (all_ports_up == 0) { 648e107e82eSAnatoly Burakov printf("."); 649e107e82eSAnatoly Burakov fflush(stdout); 650e107e82eSAnatoly Burakov rte_delay_ms(CHECK_INTERVAL); 651e107e82eSAnatoly Burakov } 652e107e82eSAnatoly Burakov 653e107e82eSAnatoly Burakov /* set the print_flag if all ports up or timeout */ 654e107e82eSAnatoly Burakov if (all_ports_up == 1 || count == (MAX_CHECK_TIME - 1)) { 655e107e82eSAnatoly Burakov print_flag = 1; 65674de12b7SAnatoly Burakov printf("\ndone\n"); 657e107e82eSAnatoly Burakov } 658e107e82eSAnatoly Burakov } 659e107e82eSAnatoly Burakov } 660e107e82eSAnatoly Burakov 66174de12b7SAnatoly Burakov static int 66274de12b7SAnatoly Burakov init_routing_table(void) 66374de12b7SAnatoly Burakov { 66474de12b7SAnatoly Burakov struct rte_lpm *lpm; 66574de12b7SAnatoly Burakov struct rte_lpm6 *lpm6; 66674de12b7SAnatoly Burakov int socket, ret; 66774de12b7SAnatoly Burakov unsigned i; 66874de12b7SAnatoly Burakov 66974de12b7SAnatoly Burakov for (socket = 0; socket < RTE_MAX_NUMA_NODES; socket++) { 67074de12b7SAnatoly Burakov if (socket_lpm[socket]) { 67174de12b7SAnatoly Burakov lpm = socket_lpm[socket]; 67274de12b7SAnatoly Burakov /* populate the LPM table */ 67374de12b7SAnatoly Burakov for (i = 0; i < RTE_DIM(l3fwd_ipv4_route_array); i++) { 67474de12b7SAnatoly Burakov ret = rte_lpm_add(lpm, 67574de12b7SAnatoly Burakov l3fwd_ipv4_route_array[i].ip, 67674de12b7SAnatoly Burakov l3fwd_ipv4_route_array[i].depth, 67774de12b7SAnatoly Burakov l3fwd_ipv4_route_array[i].if_out); 67874de12b7SAnatoly Burakov 67974de12b7SAnatoly Burakov if (ret < 0) { 68074de12b7SAnatoly Burakov RTE_LOG(ERR, IP_FRAG, "Unable to add entry %i to the l3fwd " 68174de12b7SAnatoly Burakov "LPM table\n", i); 68274de12b7SAnatoly Burakov return -1; 68374de12b7SAnatoly Burakov } 68474de12b7SAnatoly Burakov 68574de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "Socket %i: adding route " IPv4_BYTES_FMT 68674de12b7SAnatoly Burakov "/%d (port %d)\n", 68774de12b7SAnatoly Burakov socket, 68874de12b7SAnatoly Burakov IPv4_BYTES(l3fwd_ipv4_route_array[i].ip), 68974de12b7SAnatoly Burakov l3fwd_ipv4_route_array[i].depth, 69074de12b7SAnatoly Burakov l3fwd_ipv4_route_array[i].if_out); 69174de12b7SAnatoly Burakov } 69274de12b7SAnatoly Burakov } 69374de12b7SAnatoly Burakov 69474de12b7SAnatoly Burakov if (socket_lpm6[socket]) { 69574de12b7SAnatoly Burakov lpm6 = socket_lpm6[socket]; 69674de12b7SAnatoly Burakov /* populate the LPM6 table */ 69774de12b7SAnatoly Burakov for (i = 0; i < RTE_DIM(l3fwd_ipv6_route_array); i++) { 69874de12b7SAnatoly Burakov ret = rte_lpm6_add(lpm6, 69974de12b7SAnatoly Burakov l3fwd_ipv6_route_array[i].ip, 70074de12b7SAnatoly Burakov l3fwd_ipv6_route_array[i].depth, 70174de12b7SAnatoly Burakov l3fwd_ipv6_route_array[i].if_out); 70274de12b7SAnatoly Burakov 70374de12b7SAnatoly Burakov if (ret < 0) { 70474de12b7SAnatoly Burakov RTE_LOG(ERR, IP_FRAG, "Unable to add entry %i to the l3fwd " 70574de12b7SAnatoly Burakov "LPM6 table\n", i); 70674de12b7SAnatoly Burakov return -1; 70774de12b7SAnatoly Burakov } 70874de12b7SAnatoly Burakov 70974de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "Socket %i: adding route " IPv6_BYTES_FMT 71074de12b7SAnatoly Burakov "/%d (port %d)\n", 71174de12b7SAnatoly Burakov socket, 71274de12b7SAnatoly Burakov IPv6_BYTES(l3fwd_ipv6_route_array[i].ip), 71374de12b7SAnatoly Burakov l3fwd_ipv6_route_array[i].depth, 71474de12b7SAnatoly Burakov l3fwd_ipv6_route_array[i].if_out); 71574de12b7SAnatoly Burakov } 71674de12b7SAnatoly Burakov } 71774de12b7SAnatoly Burakov } 71874de12b7SAnatoly Burakov return 0; 71974de12b7SAnatoly Burakov } 72074de12b7SAnatoly Burakov 72174de12b7SAnatoly Burakov static int 72274de12b7SAnatoly Burakov init_mem(void) 72374de12b7SAnatoly Burakov { 72474de12b7SAnatoly Burakov char buf[PATH_MAX]; 72574de12b7SAnatoly Burakov struct rte_mempool *mp; 72674de12b7SAnatoly Burakov struct rte_lpm *lpm; 72774de12b7SAnatoly Burakov struct rte_lpm6 *lpm6; 72874de12b7SAnatoly Burakov int socket; 72974de12b7SAnatoly Burakov unsigned lcore_id; 73074de12b7SAnatoly Burakov 73174de12b7SAnatoly Burakov /* traverse through lcores and initialize structures on each socket */ 73274de12b7SAnatoly Burakov 73374de12b7SAnatoly Burakov for (lcore_id = 0; lcore_id < RTE_MAX_LCORE; lcore_id++) { 73474de12b7SAnatoly Burakov 73574de12b7SAnatoly Burakov if (rte_lcore_is_enabled(lcore_id) == 0) 73674de12b7SAnatoly Burakov continue; 73774de12b7SAnatoly Burakov 73874de12b7SAnatoly Burakov socket = rte_lcore_to_socket_id(lcore_id); 73974de12b7SAnatoly Burakov 74074de12b7SAnatoly Burakov if (socket == SOCKET_ID_ANY) 74174de12b7SAnatoly Burakov socket = 0; 74274de12b7SAnatoly Burakov 74374de12b7SAnatoly Burakov if (socket_direct_pool[socket] == NULL) { 74474de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "Creating direct mempool on socket %i\n", 74574de12b7SAnatoly Burakov socket); 7466f41fe75SStephen Hemminger snprintf(buf, sizeof(buf), "pool_direct_%i", socket); 74774de12b7SAnatoly Burakov 74874de12b7SAnatoly Burakov mp = rte_mempool_create(buf, NB_MBUF, 74974de12b7SAnatoly Burakov MBUF_SIZE, 32, 75074de12b7SAnatoly Burakov sizeof(struct rte_pktmbuf_pool_private), 75174de12b7SAnatoly Burakov rte_pktmbuf_pool_init, NULL, 75274de12b7SAnatoly Burakov rte_pktmbuf_init, NULL, 75374de12b7SAnatoly Burakov socket, 0); 75474de12b7SAnatoly Burakov if (mp == NULL) { 75574de12b7SAnatoly Burakov RTE_LOG(ERR, IP_FRAG, "Cannot create direct mempool\n"); 75674de12b7SAnatoly Burakov return -1; 75774de12b7SAnatoly Burakov } 75874de12b7SAnatoly Burakov socket_direct_pool[socket] = mp; 75974de12b7SAnatoly Burakov } 76074de12b7SAnatoly Burakov 76174de12b7SAnatoly Burakov if (socket_indirect_pool[socket] == NULL) { 76274de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "Creating indirect mempool on socket %i\n", 76374de12b7SAnatoly Burakov socket); 7646f41fe75SStephen Hemminger snprintf(buf, sizeof(buf), "pool_indirect_%i", socket); 76574de12b7SAnatoly Burakov 76674de12b7SAnatoly Burakov mp = rte_mempool_create(buf, NB_MBUF, 76774de12b7SAnatoly Burakov sizeof(struct rte_mbuf), 32, 76874de12b7SAnatoly Burakov 0, 76974de12b7SAnatoly Burakov NULL, NULL, 77074de12b7SAnatoly Burakov rte_pktmbuf_init, NULL, 77174de12b7SAnatoly Burakov socket, 0); 77274de12b7SAnatoly Burakov if (mp == NULL) { 77374de12b7SAnatoly Burakov RTE_LOG(ERR, IP_FRAG, "Cannot create indirect mempool\n"); 77474de12b7SAnatoly Burakov return -1; 77574de12b7SAnatoly Burakov } 77674de12b7SAnatoly Burakov socket_indirect_pool[socket] = mp; 77774de12b7SAnatoly Burakov } 77874de12b7SAnatoly Burakov 77974de12b7SAnatoly Burakov if (socket_lpm[socket] == NULL) { 78074de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "Creating LPM table on socket %i\n", socket); 7816f41fe75SStephen Hemminger snprintf(buf, sizeof(buf), "IP_FRAG_LPM_%i", socket); 78274de12b7SAnatoly Burakov 78374de12b7SAnatoly Burakov lpm = rte_lpm_create(buf, socket, LPM_MAX_RULES, 0); 78474de12b7SAnatoly Burakov if (lpm == NULL) { 78574de12b7SAnatoly Burakov RTE_LOG(ERR, IP_FRAG, "Cannot create LPM table\n"); 78674de12b7SAnatoly Burakov return -1; 78774de12b7SAnatoly Burakov } 78874de12b7SAnatoly Burakov socket_lpm[socket] = lpm; 78974de12b7SAnatoly Burakov } 79074de12b7SAnatoly Burakov 79174de12b7SAnatoly Burakov if (socket_lpm6[socket] == NULL) { 79274de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "Creating LPM6 table on socket %i\n", socket); 7936f41fe75SStephen Hemminger snprintf(buf, sizeof(buf), "IP_FRAG_LPM_%i", socket); 79474de12b7SAnatoly Burakov 79574de12b7SAnatoly Burakov lpm6 = rte_lpm6_create("IP_FRAG_LPM6", socket, &lpm6_config); 79674de12b7SAnatoly Burakov if (lpm6 == NULL) { 79774de12b7SAnatoly Burakov RTE_LOG(ERR, IP_FRAG, "Cannot create LPM table\n"); 79874de12b7SAnatoly Burakov return -1; 79974de12b7SAnatoly Burakov } 80074de12b7SAnatoly Burakov socket_lpm6[socket] = lpm6; 80174de12b7SAnatoly Burakov } 80274de12b7SAnatoly Burakov } 80374de12b7SAnatoly Burakov 80474de12b7SAnatoly Burakov return 0; 80574de12b7SAnatoly Burakov } 80674de12b7SAnatoly Burakov 807e107e82eSAnatoly Burakov int 808*98a16481SDavid Marchand main(int argc, char **argv) 809e107e82eSAnatoly Burakov { 810e107e82eSAnatoly Burakov struct lcore_queue_conf *qconf; 81181f7ecd9SPablo de Lara struct rte_eth_dev_info dev_info; 81281f7ecd9SPablo de Lara struct rte_eth_txconf *txconf; 81374de12b7SAnatoly Burakov struct rx_queue *rxq; 81474de12b7SAnatoly Burakov int socket, ret; 81574de12b7SAnatoly Burakov unsigned nb_ports; 816e107e82eSAnatoly Burakov uint16_t queueid = 0; 817e107e82eSAnatoly Burakov unsigned lcore_id = 0, rx_lcore_id = 0; 818e107e82eSAnatoly Burakov uint32_t n_tx_queue, nb_lcores; 819e107e82eSAnatoly Burakov uint8_t portid; 820e107e82eSAnatoly Burakov 821e107e82eSAnatoly Burakov /* init EAL */ 822e107e82eSAnatoly Burakov ret = rte_eal_init(argc, argv); 823e107e82eSAnatoly Burakov if (ret < 0) 824e107e82eSAnatoly Burakov rte_exit(EXIT_FAILURE, "rte_eal_init failed"); 825e107e82eSAnatoly Burakov argc -= ret; 826e107e82eSAnatoly Burakov argv += ret; 827e107e82eSAnatoly Burakov 828e107e82eSAnatoly Burakov /* parse application arguments (after the EAL ones) */ 829e107e82eSAnatoly Burakov ret = parse_args(argc, argv); 830e107e82eSAnatoly Burakov if (ret < 0) 831e107e82eSAnatoly Burakov rte_exit(EXIT_FAILURE, "Invalid arguments"); 832e107e82eSAnatoly Burakov 833e107e82eSAnatoly Burakov nb_ports = rte_eth_dev_count(); 834e107e82eSAnatoly Burakov if (nb_ports > RTE_MAX_ETHPORTS) 835e107e82eSAnatoly Burakov nb_ports = RTE_MAX_ETHPORTS; 83674de12b7SAnatoly Burakov else if (nb_ports == 0) 83774de12b7SAnatoly Burakov rte_exit(EXIT_FAILURE, "No ports found!\n"); 838e107e82eSAnatoly Burakov 839e107e82eSAnatoly Burakov nb_lcores = rte_lcore_count(); 840e107e82eSAnatoly Burakov 84174de12b7SAnatoly Burakov /* initialize structures (mempools, lpm etc.) */ 84274de12b7SAnatoly Burakov if (init_mem() < 0) 84374de12b7SAnatoly Burakov rte_panic("Cannot initialize memory structures!\n"); 84474de12b7SAnatoly Burakov 845eaa8d3bfSAnatoly Burakov /* check if portmask has non-existent ports */ 846eaa8d3bfSAnatoly Burakov if (enabled_port_mask & ~(RTE_LEN2MASK(nb_ports, unsigned))) 847eaa8d3bfSAnatoly Burakov rte_exit(EXIT_FAILURE, "Non-existent ports in portmask!\n"); 848eaa8d3bfSAnatoly Burakov 849e107e82eSAnatoly Burakov /* initialize all ports */ 850e107e82eSAnatoly Burakov for (portid = 0; portid < nb_ports; portid++) { 851e107e82eSAnatoly Burakov /* skip ports that are not enabled */ 852e107e82eSAnatoly Burakov if ((enabled_port_mask & (1 << portid)) == 0) { 853e107e82eSAnatoly Burakov printf("Skipping disabled port %d\n", portid); 854e107e82eSAnatoly Burakov continue; 855e107e82eSAnatoly Burakov } 856e107e82eSAnatoly Burakov 857e107e82eSAnatoly Burakov qconf = &lcore_queue_conf[rx_lcore_id]; 858e107e82eSAnatoly Burakov 859e107e82eSAnatoly Burakov /* get the lcore_id for this port */ 860e107e82eSAnatoly Burakov while (rte_lcore_is_enabled(rx_lcore_id) == 0 || 861e107e82eSAnatoly Burakov qconf->n_rx_queue == (unsigned)rx_queue_per_lcore) { 862e107e82eSAnatoly Burakov 863e107e82eSAnatoly Burakov rx_lcore_id ++; 864e107e82eSAnatoly Burakov if (rx_lcore_id >= RTE_MAX_LCORE) 865e107e82eSAnatoly Burakov rte_exit(EXIT_FAILURE, "Not enough cores\n"); 866e107e82eSAnatoly Burakov 867e107e82eSAnatoly Burakov qconf = &lcore_queue_conf[rx_lcore_id]; 868e107e82eSAnatoly Burakov } 86974de12b7SAnatoly Burakov 870324bcf45SAnatoly Burakov socket = (int) rte_lcore_to_socket_id(rx_lcore_id); 87174de12b7SAnatoly Burakov if (socket == SOCKET_ID_ANY) 87274de12b7SAnatoly Burakov socket = 0; 87374de12b7SAnatoly Burakov 87474de12b7SAnatoly Burakov rxq = &qconf->rx_queue_list[qconf->n_rx_queue]; 87574de12b7SAnatoly Burakov rxq->portid = portid; 87674de12b7SAnatoly Burakov rxq->direct_pool = socket_direct_pool[socket]; 87774de12b7SAnatoly Burakov rxq->indirect_pool = socket_indirect_pool[socket]; 87874de12b7SAnatoly Burakov rxq->lpm = socket_lpm[socket]; 87974de12b7SAnatoly Burakov rxq->lpm6 = socket_lpm6[socket]; 880e107e82eSAnatoly Burakov qconf->n_rx_queue++; 881e107e82eSAnatoly Burakov 882e107e82eSAnatoly Burakov /* init port */ 883e107e82eSAnatoly Burakov printf("Initializing port %d on lcore %u...", portid, 884e107e82eSAnatoly Burakov rx_lcore_id); 885e107e82eSAnatoly Burakov fflush(stdout); 886e107e82eSAnatoly Burakov 887e107e82eSAnatoly Burakov n_tx_queue = nb_lcores; 888e107e82eSAnatoly Burakov if (n_tx_queue > MAX_TX_QUEUE_PER_PORT) 889e107e82eSAnatoly Burakov n_tx_queue = MAX_TX_QUEUE_PER_PORT; 890e107e82eSAnatoly Burakov ret = rte_eth_dev_configure(portid, 1, (uint16_t)n_tx_queue, 891e107e82eSAnatoly Burakov &port_conf); 89274de12b7SAnatoly Burakov if (ret < 0) { 89374de12b7SAnatoly Burakov printf("\n"); 894e107e82eSAnatoly Burakov rte_exit(EXIT_FAILURE, "Cannot configure device: " 895e107e82eSAnatoly Burakov "err=%d, port=%d\n", 896e107e82eSAnatoly Burakov ret, portid); 89774de12b7SAnatoly Burakov } 89874de12b7SAnatoly Burakov 89974de12b7SAnatoly Burakov /* init one RX queue */ 90074de12b7SAnatoly Burakov ret = rte_eth_rx_queue_setup(portid, 0, nb_rxd, 90181f7ecd9SPablo de Lara socket, NULL, 90274de12b7SAnatoly Burakov socket_direct_pool[socket]); 90374de12b7SAnatoly Burakov if (ret < 0) { 90474de12b7SAnatoly Burakov printf("\n"); 90574de12b7SAnatoly Burakov rte_exit(EXIT_FAILURE, "rte_eth_rx_queue_setup: " 90674de12b7SAnatoly Burakov "err=%d, port=%d\n", 90774de12b7SAnatoly Burakov ret, portid); 90874de12b7SAnatoly Burakov } 909e107e82eSAnatoly Burakov 910e107e82eSAnatoly Burakov rte_eth_macaddr_get(portid, &ports_eth_addr[portid]); 911e107e82eSAnatoly Burakov print_ethaddr(" Address:", &ports_eth_addr[portid]); 91274de12b7SAnatoly Burakov printf("\n"); 913e107e82eSAnatoly Burakov 914e107e82eSAnatoly Burakov /* init one TX queue per couple (lcore,port) */ 915e107e82eSAnatoly Burakov queueid = 0; 916e107e82eSAnatoly Burakov for (lcore_id = 0; lcore_id < RTE_MAX_LCORE; lcore_id++) { 917e107e82eSAnatoly Burakov if (rte_lcore_is_enabled(lcore_id) == 0) 918e107e82eSAnatoly Burakov continue; 91974de12b7SAnatoly Burakov 92074de12b7SAnatoly Burakov socket = (int) rte_lcore_to_socket_id(lcore_id); 921e107e82eSAnatoly Burakov printf("txq=%u,%d ", lcore_id, queueid); 922e107e82eSAnatoly Burakov fflush(stdout); 92381f7ecd9SPablo de Lara 92481f7ecd9SPablo de Lara rte_eth_dev_info_get(portid, &dev_info); 92581f7ecd9SPablo de Lara txconf = &dev_info.default_txconf; 92681f7ecd9SPablo de Lara txconf->txq_flags = 0; 927e107e82eSAnatoly Burakov ret = rte_eth_tx_queue_setup(portid, queueid, nb_txd, 92881f7ecd9SPablo de Lara socket, txconf); 92974de12b7SAnatoly Burakov if (ret < 0) { 93074de12b7SAnatoly Burakov printf("\n"); 931e107e82eSAnatoly Burakov rte_exit(EXIT_FAILURE, "rte_eth_tx_queue_setup: " 932e107e82eSAnatoly Burakov "err=%d, port=%d\n", ret, portid); 93374de12b7SAnatoly Burakov } 934e107e82eSAnatoly Burakov 935e107e82eSAnatoly Burakov qconf = &lcore_queue_conf[lcore_id]; 936e107e82eSAnatoly Burakov qconf->tx_queue_id[portid] = queueid; 937e107e82eSAnatoly Burakov queueid++; 938e107e82eSAnatoly Burakov } 939e107e82eSAnatoly Burakov 94074de12b7SAnatoly Burakov printf("\n"); 94174de12b7SAnatoly Burakov } 94274de12b7SAnatoly Burakov 94374de12b7SAnatoly Burakov printf("\n"); 94474de12b7SAnatoly Burakov 94574de12b7SAnatoly Burakov /* start ports */ 94674de12b7SAnatoly Burakov for (portid = 0; portid < nb_ports; portid++) { 94774de12b7SAnatoly Burakov if ((enabled_port_mask & (1 << portid)) == 0) { 94874de12b7SAnatoly Burakov continue; 94974de12b7SAnatoly Burakov } 950e107e82eSAnatoly Burakov /* Start device */ 951e107e82eSAnatoly Burakov ret = rte_eth_dev_start(portid); 952e107e82eSAnatoly Burakov if (ret < 0) 95374de12b7SAnatoly Burakov rte_exit(EXIT_FAILURE, "rte_eth_dev_start: err=%d, port=%d\n", 954e107e82eSAnatoly Burakov ret, portid); 955e107e82eSAnatoly Burakov 956e107e82eSAnatoly Burakov rte_eth_promiscuous_enable(portid); 957e107e82eSAnatoly Burakov } 958e107e82eSAnatoly Burakov 95974de12b7SAnatoly Burakov if (init_routing_table() < 0) 96074de12b7SAnatoly Burakov rte_exit(EXIT_FAILURE, "Cannot init routing table\n"); 96174de12b7SAnatoly Burakov 962e107e82eSAnatoly Burakov check_all_ports_link_status((uint8_t)nb_ports, enabled_port_mask); 963e107e82eSAnatoly Burakov 964e107e82eSAnatoly Burakov /* launch per-lcore init on every lcore */ 965e107e82eSAnatoly Burakov rte_eal_mp_remote_launch(main_loop, NULL, CALL_MASTER); 966e107e82eSAnatoly Burakov RTE_LCORE_FOREACH_SLAVE(lcore_id) { 967e107e82eSAnatoly Burakov if (rte_eal_wait_lcore(lcore_id) < 0) 968e107e82eSAnatoly Burakov return -1; 969e107e82eSAnatoly Burakov } 970e107e82eSAnatoly Burakov 971e107e82eSAnatoly Burakov return 0; 972e107e82eSAnatoly Burakov } 973