1e107e82eSAnatoly Burakov /*- 2e107e82eSAnatoly Burakov * BSD LICENSE 3e107e82eSAnatoly Burakov * 4e107e82eSAnatoly Burakov * Copyright(c) 2010-2014 Intel Corporation. All rights reserved. 5e107e82eSAnatoly Burakov * All rights reserved. 6e107e82eSAnatoly Burakov * 7e107e82eSAnatoly Burakov * Redistribution and use in source and binary forms, with or without 8e107e82eSAnatoly Burakov * modification, are permitted provided that the following conditions 9e107e82eSAnatoly Burakov * are met: 10e107e82eSAnatoly Burakov * 11e107e82eSAnatoly Burakov * * Redistributions of source code must retain the above copyright 12e107e82eSAnatoly Burakov * notice, this list of conditions and the following disclaimer. 13e107e82eSAnatoly Burakov * * Redistributions in binary form must reproduce the above copyright 14e107e82eSAnatoly Burakov * notice, this list of conditions and the following disclaimer in 15e107e82eSAnatoly Burakov * the documentation and/or other materials provided with the 16e107e82eSAnatoly Burakov * distribution. 17e107e82eSAnatoly Burakov * * Neither the name of Intel Corporation nor the names of its 18e107e82eSAnatoly Burakov * contributors may be used to endorse or promote products derived 19e107e82eSAnatoly Burakov * from this software without specific prior written permission. 20e107e82eSAnatoly Burakov * 21e107e82eSAnatoly Burakov * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 22e107e82eSAnatoly Burakov * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 23e107e82eSAnatoly Burakov * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 24e107e82eSAnatoly Burakov * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT 25e107e82eSAnatoly Burakov * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 26e107e82eSAnatoly Burakov * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT 27e107e82eSAnatoly Burakov * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 28e107e82eSAnatoly Burakov * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 29e107e82eSAnatoly Burakov * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 30e107e82eSAnatoly Burakov * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 31e107e82eSAnatoly Burakov * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 32e107e82eSAnatoly Burakov */ 33e107e82eSAnatoly Burakov 34e107e82eSAnatoly Burakov #include <stdio.h> 35e107e82eSAnatoly Burakov #include <stdlib.h> 36e107e82eSAnatoly Burakov #include <stdint.h> 37e107e82eSAnatoly Burakov #include <inttypes.h> 38e107e82eSAnatoly Burakov #include <sys/types.h> 39e107e82eSAnatoly Burakov #include <sys/param.h> 40e107e82eSAnatoly Burakov #include <string.h> 41e107e82eSAnatoly Burakov #include <sys/queue.h> 42e107e82eSAnatoly Burakov #include <stdarg.h> 43e107e82eSAnatoly Burakov #include <errno.h> 44e107e82eSAnatoly Burakov #include <getopt.h> 45e107e82eSAnatoly Burakov 46e107e82eSAnatoly Burakov #include <rte_common.h> 47e107e82eSAnatoly Burakov #include <rte_byteorder.h> 48e107e82eSAnatoly Burakov #include <rte_log.h> 49e107e82eSAnatoly Burakov #include <rte_memory.h> 50e107e82eSAnatoly Burakov #include <rte_memcpy.h> 51e107e82eSAnatoly Burakov #include <rte_memzone.h> 52e107e82eSAnatoly Burakov #include <rte_tailq.h> 53e107e82eSAnatoly Burakov #include <rte_eal.h> 54e107e82eSAnatoly Burakov #include <rte_per_lcore.h> 55e107e82eSAnatoly Burakov #include <rte_launch.h> 56e107e82eSAnatoly Burakov #include <rte_atomic.h> 57e107e82eSAnatoly Burakov #include <rte_cycles.h> 58e107e82eSAnatoly Burakov #include <rte_prefetch.h> 59e107e82eSAnatoly Burakov #include <rte_lcore.h> 60e107e82eSAnatoly Burakov #include <rte_per_lcore.h> 61e107e82eSAnatoly Burakov #include <rte_branch_prediction.h> 62e107e82eSAnatoly Burakov #include <rte_interrupts.h> 63e107e82eSAnatoly Burakov #include <rte_pci.h> 64e107e82eSAnatoly Burakov #include <rte_random.h> 65e107e82eSAnatoly Burakov #include <rte_debug.h> 66e107e82eSAnatoly Burakov #include <rte_ether.h> 67e107e82eSAnatoly Burakov #include <rte_ethdev.h> 68e107e82eSAnatoly Burakov #include <rte_ring.h> 69e107e82eSAnatoly Burakov #include <rte_mempool.h> 70e107e82eSAnatoly Burakov #include <rte_mbuf.h> 71e107e82eSAnatoly Burakov #include <rte_lpm.h> 7274de12b7SAnatoly Burakov #include <rte_lpm6.h> 73e107e82eSAnatoly Burakov #include <rte_ip.h> 7474de12b7SAnatoly Burakov #include <rte_string_fns.h> 75e107e82eSAnatoly Burakov 7674de12b7SAnatoly Burakov #include <rte_ip_frag.h> 7774de12b7SAnatoly Burakov 78e107e82eSAnatoly Burakov #include "main.h" 79e107e82eSAnatoly Burakov 8074de12b7SAnatoly Burakov #define RTE_LOGTYPE_IP_FRAG RTE_LOGTYPE_USER1 81e107e82eSAnatoly Burakov 82e107e82eSAnatoly Burakov #define MBUF_SIZE (2048 + sizeof(struct rte_mbuf) + RTE_PKTMBUF_HEADROOM) 83e107e82eSAnatoly Burakov 84e107e82eSAnatoly Burakov /* allow max jumbo frame 9.5 KB */ 85e107e82eSAnatoly Burakov #define JUMBO_FRAME_MAX_SIZE 0x2600 86e107e82eSAnatoly Burakov 87e107e82eSAnatoly Burakov #define ROUNDUP_DIV(a, b) (((a) + (b) - 1) / (b)) 88e107e82eSAnatoly Burakov 89e107e82eSAnatoly Burakov /* 9074de12b7SAnatoly Burakov * Default byte size for the IPv6 Maximum Transfer Unit (MTU). 9174de12b7SAnatoly Burakov * This value includes the size of IPv6 header. 92e107e82eSAnatoly Burakov */ 9374de12b7SAnatoly Burakov #define IPV4_MTU_DEFAULT ETHER_MTU 9474de12b7SAnatoly Burakov #define IPV6_MTU_DEFAULT ETHER_MTU 9574de12b7SAnatoly Burakov 9674de12b7SAnatoly Burakov /* 9774de12b7SAnatoly Burakov * Default payload in bytes for the IPv6 packet. 9874de12b7SAnatoly Burakov */ 9974de12b7SAnatoly Burakov #define IPV4_DEFAULT_PAYLOAD (IPV4_MTU_DEFAULT - sizeof(struct ipv4_hdr)) 10074de12b7SAnatoly Burakov #define IPV6_DEFAULT_PAYLOAD (IPV6_MTU_DEFAULT - sizeof(struct ipv6_hdr)) 10174de12b7SAnatoly Burakov 10274de12b7SAnatoly Burakov /* 10374de12b7SAnatoly Burakov * Max number of fragments per packet expected - defined by config file. 10474de12b7SAnatoly Burakov */ 10574de12b7SAnatoly Burakov #define MAX_PACKET_FRAG RTE_LIBRTE_IP_FRAG_MAX_FRAG 106e107e82eSAnatoly Burakov 107e107e82eSAnatoly Burakov #define NB_MBUF 8192 108e107e82eSAnatoly Burakov 109e107e82eSAnatoly Burakov #define MAX_PKT_BURST 32 110e107e82eSAnatoly Burakov #define BURST_TX_DRAIN_US 100 /* TX drain every ~100us */ 111e107e82eSAnatoly Burakov 112e107e82eSAnatoly Burakov /* Configure how many packets ahead to prefetch, when reading packets */ 113e107e82eSAnatoly Burakov #define PREFETCH_OFFSET 3 114e107e82eSAnatoly Burakov 115e107e82eSAnatoly Burakov /* 116e107e82eSAnatoly Burakov * Configurable number of RX/TX ring descriptors 117e107e82eSAnatoly Burakov */ 118e107e82eSAnatoly Burakov #define RTE_TEST_RX_DESC_DEFAULT 128 119e107e82eSAnatoly Burakov #define RTE_TEST_TX_DESC_DEFAULT 512 120e107e82eSAnatoly Burakov static uint16_t nb_rxd = RTE_TEST_RX_DESC_DEFAULT; 121e107e82eSAnatoly Burakov static uint16_t nb_txd = RTE_TEST_TX_DESC_DEFAULT; 122e107e82eSAnatoly Burakov 123e107e82eSAnatoly Burakov /* ethernet addresses of ports */ 124e107e82eSAnatoly Burakov static struct ether_addr ports_eth_addr[RTE_MAX_ETHPORTS]; 12574de12b7SAnatoly Burakov 12674de12b7SAnatoly Burakov #ifndef IPv4_BYTES 12774de12b7SAnatoly Burakov #define IPv4_BYTES_FMT "%" PRIu8 ".%" PRIu8 ".%" PRIu8 ".%" PRIu8 12874de12b7SAnatoly Burakov #define IPv4_BYTES(addr) \ 12974de12b7SAnatoly Burakov (uint8_t) (((addr) >> 24) & 0xFF),\ 13074de12b7SAnatoly Burakov (uint8_t) (((addr) >> 16) & 0xFF),\ 13174de12b7SAnatoly Burakov (uint8_t) (((addr) >> 8) & 0xFF),\ 13274de12b7SAnatoly Burakov (uint8_t) ((addr) & 0xFF) 13374de12b7SAnatoly Burakov #endif 13474de12b7SAnatoly Burakov 13574de12b7SAnatoly Burakov #ifndef IPv6_BYTES 13674de12b7SAnatoly Burakov #define IPv6_BYTES_FMT "%02x%02x:%02x%02x:%02x%02x:%02x%02x:"\ 13774de12b7SAnatoly Burakov "%02x%02x:%02x%02x:%02x%02x:%02x%02x" 13874de12b7SAnatoly Burakov #define IPv6_BYTES(addr) \ 13974de12b7SAnatoly Burakov addr[0], addr[1], addr[2], addr[3], \ 14074de12b7SAnatoly Burakov addr[4], addr[5], addr[6], addr[7], \ 14174de12b7SAnatoly Burakov addr[8], addr[9], addr[10], addr[11],\ 14274de12b7SAnatoly Burakov addr[12], addr[13],addr[14], addr[15] 14374de12b7SAnatoly Burakov #endif 14474de12b7SAnatoly Burakov 14574de12b7SAnatoly Burakov #define IPV6_ADDR_LEN 16 146e107e82eSAnatoly Burakov 147e107e82eSAnatoly Burakov /* mask of enabled ports */ 148e107e82eSAnatoly Burakov static int enabled_port_mask = 0; 149e107e82eSAnatoly Burakov 150e107e82eSAnatoly Burakov static int rx_queue_per_lcore = 1; 151e107e82eSAnatoly Burakov 152e107e82eSAnatoly Burakov #define MBUF_TABLE_SIZE (2 * MAX(MAX_PKT_BURST, MAX_PACKET_FRAG)) 153e107e82eSAnatoly Burakov 154e107e82eSAnatoly Burakov struct mbuf_table { 155e107e82eSAnatoly Burakov uint16_t len; 156e107e82eSAnatoly Burakov struct rte_mbuf *m_table[MBUF_TABLE_SIZE]; 157e107e82eSAnatoly Burakov }; 158e107e82eSAnatoly Burakov 15974de12b7SAnatoly Burakov struct rx_queue { 16074de12b7SAnatoly Burakov struct rte_mempool *direct_pool; 16174de12b7SAnatoly Burakov struct rte_mempool *indirect_pool; 16274de12b7SAnatoly Burakov struct rte_lpm *lpm; 16374de12b7SAnatoly Burakov struct rte_lpm6 *lpm6; 16474de12b7SAnatoly Burakov uint8_t portid; 16574de12b7SAnatoly Burakov }; 16674de12b7SAnatoly Burakov 167e107e82eSAnatoly Burakov #define MAX_RX_QUEUE_PER_LCORE 16 168e107e82eSAnatoly Burakov #define MAX_TX_QUEUE_PER_PORT 16 169e107e82eSAnatoly Burakov struct lcore_queue_conf { 170e107e82eSAnatoly Burakov uint16_t n_rx_queue; 171e107e82eSAnatoly Burakov uint16_t tx_queue_id[RTE_MAX_ETHPORTS]; 17274de12b7SAnatoly Burakov struct rx_queue rx_queue_list[MAX_RX_QUEUE_PER_LCORE]; 173e107e82eSAnatoly Burakov struct mbuf_table tx_mbufs[RTE_MAX_ETHPORTS]; 174e107e82eSAnatoly Burakov } __rte_cache_aligned; 175e107e82eSAnatoly Burakov struct lcore_queue_conf lcore_queue_conf[RTE_MAX_LCORE]; 176e107e82eSAnatoly Burakov 177e107e82eSAnatoly Burakov static const struct rte_eth_conf port_conf = { 178e107e82eSAnatoly Burakov .rxmode = { 179e107e82eSAnatoly Burakov .max_rx_pkt_len = JUMBO_FRAME_MAX_SIZE, 180e107e82eSAnatoly Burakov .split_hdr_size = 0, 181e107e82eSAnatoly Burakov .header_split = 0, /**< Header Split disabled */ 18274de12b7SAnatoly Burakov .hw_ip_checksum = 1, /**< IP checksum offload enabled */ 183e107e82eSAnatoly Burakov .hw_vlan_filter = 0, /**< VLAN filtering disabled */ 184e107e82eSAnatoly Burakov .jumbo_frame = 1, /**< Jumbo Frame Support enabled */ 185e107e82eSAnatoly Burakov .hw_strip_crc = 0, /**< CRC stripped by hardware */ 186e107e82eSAnatoly Burakov }, 187e107e82eSAnatoly Burakov .txmode = { 188e107e82eSAnatoly Burakov .mq_mode = ETH_MQ_TX_NONE, 189e107e82eSAnatoly Burakov }, 190e107e82eSAnatoly Burakov }; 191e107e82eSAnatoly Burakov 19274de12b7SAnatoly Burakov /* 19374de12b7SAnatoly Burakov * IPv4 forwarding table 19474de12b7SAnatoly Burakov */ 19574de12b7SAnatoly Burakov struct l3fwd_ipv4_route { 196e107e82eSAnatoly Burakov uint32_t ip; 197e107e82eSAnatoly Burakov uint8_t depth; 198e107e82eSAnatoly Burakov uint8_t if_out; 199e107e82eSAnatoly Burakov }; 200e107e82eSAnatoly Burakov 20174de12b7SAnatoly Burakov struct l3fwd_ipv4_route l3fwd_ipv4_route_array[] = { 20274de12b7SAnatoly Burakov {IPv4(100,10,0,0), 16, 0}, 20374de12b7SAnatoly Burakov {IPv4(100,20,0,0), 16, 1}, 20474de12b7SAnatoly Burakov {IPv4(100,30,0,0), 16, 2}, 20574de12b7SAnatoly Burakov {IPv4(100,40,0,0), 16, 3}, 20674de12b7SAnatoly Burakov {IPv4(100,50,0,0), 16, 4}, 20774de12b7SAnatoly Burakov {IPv4(100,60,0,0), 16, 5}, 20874de12b7SAnatoly Burakov {IPv4(100,70,0,0), 16, 6}, 20974de12b7SAnatoly Burakov {IPv4(100,80,0,0), 16, 7}, 210e107e82eSAnatoly Burakov }; 211e107e82eSAnatoly Burakov 21274de12b7SAnatoly Burakov /* 21374de12b7SAnatoly Burakov * IPv6 forwarding table 21474de12b7SAnatoly Burakov */ 215e107e82eSAnatoly Burakov 21674de12b7SAnatoly Burakov struct l3fwd_ipv6_route { 21774de12b7SAnatoly Burakov uint8_t ip[IPV6_ADDR_LEN]; 21874de12b7SAnatoly Burakov uint8_t depth; 21974de12b7SAnatoly Burakov uint8_t if_out; 22074de12b7SAnatoly Burakov }; 221e107e82eSAnatoly Burakov 22274de12b7SAnatoly Burakov static struct l3fwd_ipv6_route l3fwd_ipv6_route_array[] = { 22374de12b7SAnatoly Burakov {{1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 0}, 22474de12b7SAnatoly Burakov {{2,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 1}, 22574de12b7SAnatoly Burakov {{3,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 2}, 22674de12b7SAnatoly Burakov {{4,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 3}, 22774de12b7SAnatoly Burakov {{5,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 4}, 22874de12b7SAnatoly Burakov {{6,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 5}, 22974de12b7SAnatoly Burakov {{7,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 6}, 23074de12b7SAnatoly Burakov {{8,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 7}, 23174de12b7SAnatoly Burakov }; 23274de12b7SAnatoly Burakov 23374de12b7SAnatoly Burakov #define LPM_MAX_RULES 1024 23474de12b7SAnatoly Burakov #define LPM6_MAX_RULES 1024 23574de12b7SAnatoly Burakov #define LPM6_NUMBER_TBL8S (1 << 16) 23674de12b7SAnatoly Burakov 23774de12b7SAnatoly Burakov struct rte_lpm6_config lpm6_config = { 23874de12b7SAnatoly Burakov .max_rules = LPM6_MAX_RULES, 23974de12b7SAnatoly Burakov .number_tbl8s = LPM6_NUMBER_TBL8S, 24074de12b7SAnatoly Burakov .flags = 0 24174de12b7SAnatoly Burakov }; 24274de12b7SAnatoly Burakov 24374de12b7SAnatoly Burakov static struct rte_mempool *socket_direct_pool[RTE_MAX_NUMA_NODES]; 24474de12b7SAnatoly Burakov static struct rte_mempool *socket_indirect_pool[RTE_MAX_NUMA_NODES]; 24574de12b7SAnatoly Burakov static struct rte_lpm *socket_lpm[RTE_MAX_NUMA_NODES]; 24674de12b7SAnatoly Burakov static struct rte_lpm6 *socket_lpm6[RTE_MAX_NUMA_NODES]; 247e107e82eSAnatoly Burakov 248e107e82eSAnatoly Burakov /* Send burst of packets on an output interface */ 249e107e82eSAnatoly Burakov static inline int 250e107e82eSAnatoly Burakov send_burst(struct lcore_queue_conf *qconf, uint16_t n, uint8_t port) 251e107e82eSAnatoly Burakov { 252e107e82eSAnatoly Burakov struct rte_mbuf **m_table; 253e107e82eSAnatoly Burakov int ret; 254e107e82eSAnatoly Burakov uint16_t queueid; 255e107e82eSAnatoly Burakov 256e107e82eSAnatoly Burakov queueid = qconf->tx_queue_id[port]; 257e107e82eSAnatoly Burakov m_table = (struct rte_mbuf **)qconf->tx_mbufs[port].m_table; 258e107e82eSAnatoly Burakov 259e107e82eSAnatoly Burakov ret = rte_eth_tx_burst(port, queueid, m_table, n); 260e107e82eSAnatoly Burakov if (unlikely(ret < n)) { 261e107e82eSAnatoly Burakov do { 262e107e82eSAnatoly Burakov rte_pktmbuf_free(m_table[ret]); 263e107e82eSAnatoly Burakov } while (++ret < n); 264e107e82eSAnatoly Burakov } 265e107e82eSAnatoly Burakov 266e107e82eSAnatoly Burakov return 0; 267e107e82eSAnatoly Burakov } 268e107e82eSAnatoly Burakov 269e107e82eSAnatoly Burakov static inline void 27074de12b7SAnatoly Burakov l3fwd_simple_forward(struct rte_mbuf *m, struct lcore_queue_conf *qconf, 27174de12b7SAnatoly Burakov uint8_t queueid, uint8_t port_in) 272e107e82eSAnatoly Burakov { 27374de12b7SAnatoly Burakov struct rx_queue *rxq; 27474de12b7SAnatoly Burakov uint32_t i, len; 27574de12b7SAnatoly Burakov uint8_t next_hop, port_out, ipv6; 276e107e82eSAnatoly Burakov int32_t len2; 277e107e82eSAnatoly Burakov 27874de12b7SAnatoly Burakov ipv6 = 0; 27974de12b7SAnatoly Burakov rxq = &qconf->rx_queue_list[queueid]; 28074de12b7SAnatoly Burakov 28174de12b7SAnatoly Burakov /* by default, send everything back to the source port */ 28274de12b7SAnatoly Burakov port_out = port_in; 283e107e82eSAnatoly Burakov 284e107e82eSAnatoly Burakov /* Remove the Ethernet header and trailer from the input packet */ 285e107e82eSAnatoly Burakov rte_pktmbuf_adj(m, (uint16_t)sizeof(struct ether_hdr)); 286e107e82eSAnatoly Burakov 28774de12b7SAnatoly Burakov /* Build transmission burst */ 28874de12b7SAnatoly Burakov len = qconf->tx_mbufs[port_out].len; 28974de12b7SAnatoly Burakov 29074de12b7SAnatoly Burakov /* if this is an IPv4 packet */ 29174de12b7SAnatoly Burakov if (m->ol_flags & PKT_RX_IPV4_HDR) { 29274de12b7SAnatoly Burakov struct ipv4_hdr *ip_hdr; 29374de12b7SAnatoly Burakov uint32_t ip_dst; 294e107e82eSAnatoly Burakov /* Read the lookup key (i.e. ip_dst) from the input packet */ 295e107e82eSAnatoly Burakov ip_hdr = rte_pktmbuf_mtod(m, struct ipv4_hdr *); 296e107e82eSAnatoly Burakov ip_dst = rte_be_to_cpu_32(ip_hdr->dst_addr); 297e107e82eSAnatoly Burakov 298e107e82eSAnatoly Burakov /* Find destination port */ 29974de12b7SAnatoly Burakov if (rte_lpm_lookup(rxq->lpm, ip_dst, &next_hop) == 0 && 30074de12b7SAnatoly Burakov (enabled_port_mask & 1 << next_hop) != 0) { 301e107e82eSAnatoly Burakov port_out = next_hop; 302e107e82eSAnatoly Burakov 30374de12b7SAnatoly Burakov /* Build transmission burst for new port */ 304e107e82eSAnatoly Burakov len = qconf->tx_mbufs[port_out].len; 30574de12b7SAnatoly Burakov } 306e107e82eSAnatoly Burakov 307e107e82eSAnatoly Burakov /* if we don't need to do any fragmentation */ 308ea672a8bSOlivier Matz if (likely (IPV4_MTU_DEFAULT >= m->pkt_len)) { 309e107e82eSAnatoly Burakov qconf->tx_mbufs[port_out].m_table[len] = m; 310e107e82eSAnatoly Burakov len2 = 1; 311e107e82eSAnatoly Burakov } else { 312e107e82eSAnatoly Burakov len2 = rte_ipv4_fragment_packet(m, 313e107e82eSAnatoly Burakov &qconf->tx_mbufs[port_out].m_table[len], 314e107e82eSAnatoly Burakov (uint16_t)(MBUF_TABLE_SIZE - len), 315e107e82eSAnatoly Burakov IPV4_MTU_DEFAULT, 31674de12b7SAnatoly Burakov rxq->direct_pool, rxq->indirect_pool); 317e107e82eSAnatoly Burakov 318e107e82eSAnatoly Burakov /* Free input packet */ 319e107e82eSAnatoly Burakov rte_pktmbuf_free(m); 320e107e82eSAnatoly Burakov 321e107e82eSAnatoly Burakov /* If we fail to fragment the packet */ 322e107e82eSAnatoly Burakov if (unlikely (len2 < 0)) 323e107e82eSAnatoly Burakov return; 324e107e82eSAnatoly Burakov } 32574de12b7SAnatoly Burakov } 32674de12b7SAnatoly Burakov /* if this is an IPv6 packet */ 32774de12b7SAnatoly Burakov else if (m->ol_flags & PKT_RX_IPV6_HDR) { 32874de12b7SAnatoly Burakov struct ipv6_hdr *ip_hdr; 32974de12b7SAnatoly Burakov 33074de12b7SAnatoly Burakov ipv6 = 1; 33174de12b7SAnatoly Burakov 33274de12b7SAnatoly Burakov /* Read the lookup key (i.e. ip_dst) from the input packet */ 33374de12b7SAnatoly Burakov ip_hdr = rte_pktmbuf_mtod(m, struct ipv6_hdr *); 33474de12b7SAnatoly Burakov 33574de12b7SAnatoly Burakov /* Find destination port */ 33674de12b7SAnatoly Burakov if (rte_lpm6_lookup(rxq->lpm6, ip_hdr->dst_addr, &next_hop) == 0 && 33774de12b7SAnatoly Burakov (enabled_port_mask & 1 << next_hop) != 0) { 33874de12b7SAnatoly Burakov port_out = next_hop; 33974de12b7SAnatoly Burakov 34074de12b7SAnatoly Burakov /* Build transmission burst for new port */ 34174de12b7SAnatoly Burakov len = qconf->tx_mbufs[port_out].len; 34274de12b7SAnatoly Burakov } 34374de12b7SAnatoly Burakov 34474de12b7SAnatoly Burakov /* if we don't need to do any fragmentation */ 345ea672a8bSOlivier Matz if (likely (IPV6_MTU_DEFAULT >= m->pkt_len)) { 34674de12b7SAnatoly Burakov qconf->tx_mbufs[port_out].m_table[len] = m; 34774de12b7SAnatoly Burakov len2 = 1; 34874de12b7SAnatoly Burakov } else { 34974de12b7SAnatoly Burakov len2 = rte_ipv6_fragment_packet(m, 35074de12b7SAnatoly Burakov &qconf->tx_mbufs[port_out].m_table[len], 35174de12b7SAnatoly Burakov (uint16_t)(MBUF_TABLE_SIZE - len), 35274de12b7SAnatoly Burakov IPV6_MTU_DEFAULT, 35374de12b7SAnatoly Burakov rxq->direct_pool, rxq->indirect_pool); 35474de12b7SAnatoly Burakov 35574de12b7SAnatoly Burakov /* Free input packet */ 35674de12b7SAnatoly Burakov rte_pktmbuf_free(m); 35774de12b7SAnatoly Burakov 35874de12b7SAnatoly Burakov /* If we fail to fragment the packet */ 35974de12b7SAnatoly Burakov if (unlikely (len2 < 0)) 36074de12b7SAnatoly Burakov return; 36174de12b7SAnatoly Burakov } 36274de12b7SAnatoly Burakov } 36374de12b7SAnatoly Burakov /* else, just forward the packet */ 36474de12b7SAnatoly Burakov else { 36574de12b7SAnatoly Burakov qconf->tx_mbufs[port_out].m_table[len] = m; 36674de12b7SAnatoly Burakov len2 = 1; 36774de12b7SAnatoly Burakov } 368e107e82eSAnatoly Burakov 369e107e82eSAnatoly Burakov for (i = len; i < len + len2; i ++) { 37074de12b7SAnatoly Burakov void *d_addr_bytes; 37174de12b7SAnatoly Burakov 372e107e82eSAnatoly Burakov m = qconf->tx_mbufs[port_out].m_table[i]; 373e107e82eSAnatoly Burakov struct ether_hdr *eth_hdr = (struct ether_hdr *) 374e107e82eSAnatoly Burakov rte_pktmbuf_prepend(m, (uint16_t)sizeof(struct ether_hdr)); 375e107e82eSAnatoly Burakov if (eth_hdr == NULL) { 376e107e82eSAnatoly Burakov rte_panic("No headroom in mbuf.\n"); 377e107e82eSAnatoly Burakov } 378e107e82eSAnatoly Burakov 3797869536fSBruce Richardson m->l2_len = sizeof(struct ether_hdr); 380e107e82eSAnatoly Burakov 38174de12b7SAnatoly Burakov /* 02:00:00:00:00:xx */ 38274de12b7SAnatoly Burakov d_addr_bytes = ð_hdr->d_addr.addr_bytes[0]; 38374de12b7SAnatoly Burakov *((uint64_t *)d_addr_bytes) = 0x000000000002 + ((uint64_t)port_out << 40); 38474de12b7SAnatoly Burakov 38574de12b7SAnatoly Burakov /* src addr */ 386e107e82eSAnatoly Burakov ether_addr_copy(&ports_eth_addr[port_out], ð_hdr->s_addr); 38774de12b7SAnatoly Burakov if (ipv6) 38874de12b7SAnatoly Burakov eth_hdr->ether_type = rte_be_to_cpu_16(ETHER_TYPE_IPv6); 38974de12b7SAnatoly Burakov else 390e107e82eSAnatoly Burakov eth_hdr->ether_type = rte_be_to_cpu_16(ETHER_TYPE_IPv4); 391e107e82eSAnatoly Burakov } 392e107e82eSAnatoly Burakov 393e107e82eSAnatoly Burakov len += len2; 394e107e82eSAnatoly Burakov 395e107e82eSAnatoly Burakov if (likely(len < MAX_PKT_BURST)) { 396e107e82eSAnatoly Burakov qconf->tx_mbufs[port_out].len = (uint16_t)len; 397e107e82eSAnatoly Burakov return; 398e107e82eSAnatoly Burakov } 399e107e82eSAnatoly Burakov 400e107e82eSAnatoly Burakov /* Transmit packets */ 401e107e82eSAnatoly Burakov send_burst(qconf, (uint16_t)len, port_out); 402e107e82eSAnatoly Burakov qconf->tx_mbufs[port_out].len = 0; 403e107e82eSAnatoly Burakov } 404e107e82eSAnatoly Burakov 405e107e82eSAnatoly Burakov /* main processing loop */ 406e107e82eSAnatoly Burakov static int 407e107e82eSAnatoly Burakov main_loop(__attribute__((unused)) void *dummy) 408e107e82eSAnatoly Burakov { 409e107e82eSAnatoly Burakov struct rte_mbuf *pkts_burst[MAX_PKT_BURST]; 410e107e82eSAnatoly Burakov unsigned lcore_id; 411e107e82eSAnatoly Burakov uint64_t prev_tsc, diff_tsc, cur_tsc; 412e107e82eSAnatoly Burakov int i, j, nb_rx; 413e107e82eSAnatoly Burakov uint8_t portid; 414e107e82eSAnatoly Burakov struct lcore_queue_conf *qconf; 415e107e82eSAnatoly Burakov const uint64_t drain_tsc = (rte_get_tsc_hz() + US_PER_S - 1) / US_PER_S * BURST_TX_DRAIN_US; 416e107e82eSAnatoly Burakov 417e107e82eSAnatoly Burakov prev_tsc = 0; 418e107e82eSAnatoly Burakov 419e107e82eSAnatoly Burakov lcore_id = rte_lcore_id(); 420e107e82eSAnatoly Burakov qconf = &lcore_queue_conf[lcore_id]; 421e107e82eSAnatoly Burakov 422e107e82eSAnatoly Burakov if (qconf->n_rx_queue == 0) { 42374de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "lcore %u has nothing to do\n", lcore_id); 424e107e82eSAnatoly Burakov return 0; 425e107e82eSAnatoly Burakov } 426e107e82eSAnatoly Burakov 42774de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "entering main loop on lcore %u\n", lcore_id); 428e107e82eSAnatoly Burakov 429e107e82eSAnatoly Burakov for (i = 0; i < qconf->n_rx_queue; i++) { 430e107e82eSAnatoly Burakov 43174de12b7SAnatoly Burakov portid = qconf->rx_queue_list[i].portid; 43274de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, " -- lcoreid=%u portid=%d\n", lcore_id, 433e107e82eSAnatoly Burakov (int) portid); 434e107e82eSAnatoly Burakov } 435e107e82eSAnatoly Burakov 436e107e82eSAnatoly Burakov while (1) { 437e107e82eSAnatoly Burakov 438e107e82eSAnatoly Burakov cur_tsc = rte_rdtsc(); 439e107e82eSAnatoly Burakov 440e107e82eSAnatoly Burakov /* 441e107e82eSAnatoly Burakov * TX burst queue drain 442e107e82eSAnatoly Burakov */ 443e107e82eSAnatoly Burakov diff_tsc = cur_tsc - prev_tsc; 444e107e82eSAnatoly Burakov if (unlikely(diff_tsc > drain_tsc)) { 445e107e82eSAnatoly Burakov 446e107e82eSAnatoly Burakov /* 447e107e82eSAnatoly Burakov * This could be optimized (use queueid instead of 448e107e82eSAnatoly Burakov * portid), but it is not called so often 449e107e82eSAnatoly Burakov */ 450e107e82eSAnatoly Burakov for (portid = 0; portid < RTE_MAX_ETHPORTS; portid++) { 451e107e82eSAnatoly Burakov if (qconf->tx_mbufs[portid].len == 0) 452e107e82eSAnatoly Burakov continue; 453e107e82eSAnatoly Burakov send_burst(&lcore_queue_conf[lcore_id], 454e107e82eSAnatoly Burakov qconf->tx_mbufs[portid].len, 455e107e82eSAnatoly Burakov portid); 456e107e82eSAnatoly Burakov qconf->tx_mbufs[portid].len = 0; 457e107e82eSAnatoly Burakov } 458e107e82eSAnatoly Burakov 459e107e82eSAnatoly Burakov prev_tsc = cur_tsc; 460e107e82eSAnatoly Burakov } 461e107e82eSAnatoly Burakov 462e107e82eSAnatoly Burakov /* 463e107e82eSAnatoly Burakov * Read packet from RX queues 464e107e82eSAnatoly Burakov */ 465e107e82eSAnatoly Burakov for (i = 0; i < qconf->n_rx_queue; i++) { 466e107e82eSAnatoly Burakov 46774de12b7SAnatoly Burakov portid = qconf->rx_queue_list[i].portid; 468e107e82eSAnatoly Burakov nb_rx = rte_eth_rx_burst(portid, 0, pkts_burst, 469e107e82eSAnatoly Burakov MAX_PKT_BURST); 470e107e82eSAnatoly Burakov 471e107e82eSAnatoly Burakov /* Prefetch first packets */ 472e107e82eSAnatoly Burakov for (j = 0; j < PREFETCH_OFFSET && j < nb_rx; j++) { 473e107e82eSAnatoly Burakov rte_prefetch0(rte_pktmbuf_mtod( 474e107e82eSAnatoly Burakov pkts_burst[j], void *)); 475e107e82eSAnatoly Burakov } 476e107e82eSAnatoly Burakov 477e107e82eSAnatoly Burakov /* Prefetch and forward already prefetched packets */ 478e107e82eSAnatoly Burakov for (j = 0; j < (nb_rx - PREFETCH_OFFSET); j++) { 479e107e82eSAnatoly Burakov rte_prefetch0(rte_pktmbuf_mtod(pkts_burst[ 480e107e82eSAnatoly Burakov j + PREFETCH_OFFSET], void *)); 48174de12b7SAnatoly Burakov l3fwd_simple_forward(pkts_burst[j], qconf, i, portid); 482e107e82eSAnatoly Burakov } 483e107e82eSAnatoly Burakov 484e107e82eSAnatoly Burakov /* Forward remaining prefetched packets */ 485e107e82eSAnatoly Burakov for (; j < nb_rx; j++) { 48674de12b7SAnatoly Burakov l3fwd_simple_forward(pkts_burst[j], qconf, i, portid); 487e107e82eSAnatoly Burakov } 488e107e82eSAnatoly Burakov } 489e107e82eSAnatoly Burakov } 490e107e82eSAnatoly Burakov } 491e107e82eSAnatoly Burakov 492e107e82eSAnatoly Burakov /* display usage */ 493e107e82eSAnatoly Burakov static void 494e107e82eSAnatoly Burakov print_usage(const char *prgname) 495e107e82eSAnatoly Burakov { 496e107e82eSAnatoly Burakov printf("%s [EAL options] -- -p PORTMASK [-q NQ]\n" 497e107e82eSAnatoly Burakov " -p PORTMASK: hexadecimal bitmask of ports to configure\n" 498e107e82eSAnatoly Burakov " -q NQ: number of queue (=ports) per lcore (default is 1)\n", 499e107e82eSAnatoly Burakov prgname); 500e107e82eSAnatoly Burakov } 501e107e82eSAnatoly Burakov 502e107e82eSAnatoly Burakov static int 503e107e82eSAnatoly Burakov parse_portmask(const char *portmask) 504e107e82eSAnatoly Burakov { 505e107e82eSAnatoly Burakov char *end = NULL; 506e107e82eSAnatoly Burakov unsigned long pm; 507e107e82eSAnatoly Burakov 508e107e82eSAnatoly Burakov /* parse hexadecimal string */ 509e107e82eSAnatoly Burakov pm = strtoul(portmask, &end, 16); 510e107e82eSAnatoly Burakov if ((portmask[0] == '\0') || (end == NULL) || (*end != '\0')) 511e107e82eSAnatoly Burakov return -1; 512e107e82eSAnatoly Burakov 513e107e82eSAnatoly Burakov if (pm == 0) 514e107e82eSAnatoly Burakov return -1; 515e107e82eSAnatoly Burakov 516e107e82eSAnatoly Burakov return pm; 517e107e82eSAnatoly Burakov } 518e107e82eSAnatoly Burakov 519e107e82eSAnatoly Burakov static int 520e107e82eSAnatoly Burakov parse_nqueue(const char *q_arg) 521e107e82eSAnatoly Burakov { 522e107e82eSAnatoly Burakov char *end = NULL; 523e107e82eSAnatoly Burakov unsigned long n; 524e107e82eSAnatoly Burakov 525e107e82eSAnatoly Burakov /* parse hexadecimal string */ 526e107e82eSAnatoly Burakov n = strtoul(q_arg, &end, 10); 527e107e82eSAnatoly Burakov if ((q_arg[0] == '\0') || (end == NULL) || (*end != '\0')) 528e107e82eSAnatoly Burakov return -1; 529e107e82eSAnatoly Burakov if (n == 0) 530e107e82eSAnatoly Burakov return -1; 531e107e82eSAnatoly Burakov if (n >= MAX_RX_QUEUE_PER_LCORE) 532e107e82eSAnatoly Burakov return -1; 533e107e82eSAnatoly Burakov 534e107e82eSAnatoly Burakov return n; 535e107e82eSAnatoly Burakov } 536e107e82eSAnatoly Burakov 537e107e82eSAnatoly Burakov /* Parse the argument given in the command line of the application */ 538e107e82eSAnatoly Burakov static int 539e107e82eSAnatoly Burakov parse_args(int argc, char **argv) 540e107e82eSAnatoly Burakov { 541e107e82eSAnatoly Burakov int opt, ret; 542e107e82eSAnatoly Burakov char **argvopt; 543e107e82eSAnatoly Burakov int option_index; 544e107e82eSAnatoly Burakov char *prgname = argv[0]; 545e107e82eSAnatoly Burakov static struct option lgopts[] = { 546e107e82eSAnatoly Burakov {NULL, 0, 0, 0} 547e107e82eSAnatoly Burakov }; 548e107e82eSAnatoly Burakov 549e107e82eSAnatoly Burakov argvopt = argv; 550e107e82eSAnatoly Burakov 551e107e82eSAnatoly Burakov while ((opt = getopt_long(argc, argvopt, "p:q:", 552e107e82eSAnatoly Burakov lgopts, &option_index)) != EOF) { 553e107e82eSAnatoly Burakov 554e107e82eSAnatoly Burakov switch (opt) { 555e107e82eSAnatoly Burakov /* portmask */ 556e107e82eSAnatoly Burakov case 'p': 557e107e82eSAnatoly Burakov enabled_port_mask = parse_portmask(optarg); 558e107e82eSAnatoly Burakov if (enabled_port_mask < 0) { 559e107e82eSAnatoly Burakov printf("invalid portmask\n"); 560e107e82eSAnatoly Burakov print_usage(prgname); 561e107e82eSAnatoly Burakov return -1; 562e107e82eSAnatoly Burakov } 563e107e82eSAnatoly Burakov break; 564e107e82eSAnatoly Burakov 565e107e82eSAnatoly Burakov /* nqueue */ 566e107e82eSAnatoly Burakov case 'q': 567e107e82eSAnatoly Burakov rx_queue_per_lcore = parse_nqueue(optarg); 568e107e82eSAnatoly Burakov if (rx_queue_per_lcore < 0) { 569e107e82eSAnatoly Burakov printf("invalid queue number\n"); 570e107e82eSAnatoly Burakov print_usage(prgname); 571e107e82eSAnatoly Burakov return -1; 572e107e82eSAnatoly Burakov } 573e107e82eSAnatoly Burakov break; 574e107e82eSAnatoly Burakov 575e107e82eSAnatoly Burakov /* long options */ 576e107e82eSAnatoly Burakov case 0: 577e107e82eSAnatoly Burakov print_usage(prgname); 578e107e82eSAnatoly Burakov return -1; 579e107e82eSAnatoly Burakov 580e107e82eSAnatoly Burakov default: 581e107e82eSAnatoly Burakov print_usage(prgname); 582e107e82eSAnatoly Burakov return -1; 583e107e82eSAnatoly Burakov } 584e107e82eSAnatoly Burakov } 585e107e82eSAnatoly Burakov 586e107e82eSAnatoly Burakov if (enabled_port_mask == 0) { 587e107e82eSAnatoly Burakov printf("portmask not specified\n"); 588e107e82eSAnatoly Burakov print_usage(prgname); 589e107e82eSAnatoly Burakov return -1; 590e107e82eSAnatoly Burakov } 591e107e82eSAnatoly Burakov 592e107e82eSAnatoly Burakov if (optind >= 0) 593e107e82eSAnatoly Burakov argv[optind-1] = prgname; 594e107e82eSAnatoly Burakov 595e107e82eSAnatoly Burakov ret = optind-1; 596e107e82eSAnatoly Burakov optind = 0; /* reset getopt lib */ 597e107e82eSAnatoly Burakov return ret; 598e107e82eSAnatoly Burakov } 599e107e82eSAnatoly Burakov 600e107e82eSAnatoly Burakov static void 601e107e82eSAnatoly Burakov print_ethaddr(const char *name, struct ether_addr *eth_addr) 602e107e82eSAnatoly Burakov { 603*ec3d82dbSCunming Liang char buf[ETHER_ADDR_FMT_SIZE]; 604*ec3d82dbSCunming Liang ether_format_addr(buf, ETHER_ADDR_FMT_SIZE, eth_addr); 605*ec3d82dbSCunming Liang printf("%s%s", name, buf); 606e107e82eSAnatoly Burakov } 607e107e82eSAnatoly Burakov 608e107e82eSAnatoly Burakov /* Check the link status of all ports in up to 9s, and print them finally */ 609e107e82eSAnatoly Burakov static void 610e107e82eSAnatoly Burakov check_all_ports_link_status(uint8_t port_num, uint32_t port_mask) 611e107e82eSAnatoly Burakov { 612e107e82eSAnatoly Burakov #define CHECK_INTERVAL 100 /* 100ms */ 613e107e82eSAnatoly Burakov #define MAX_CHECK_TIME 90 /* 9s (90 * 100ms) in total */ 614e107e82eSAnatoly Burakov uint8_t portid, count, all_ports_up, print_flag = 0; 615e107e82eSAnatoly Burakov struct rte_eth_link link; 616e107e82eSAnatoly Burakov 617e107e82eSAnatoly Burakov printf("\nChecking link status"); 618e107e82eSAnatoly Burakov fflush(stdout); 619e107e82eSAnatoly Burakov for (count = 0; count <= MAX_CHECK_TIME; count++) { 620e107e82eSAnatoly Burakov all_ports_up = 1; 621e107e82eSAnatoly Burakov for (portid = 0; portid < port_num; portid++) { 622e107e82eSAnatoly Burakov if ((port_mask & (1 << portid)) == 0) 623e107e82eSAnatoly Burakov continue; 624e107e82eSAnatoly Burakov memset(&link, 0, sizeof(link)); 625e107e82eSAnatoly Burakov rte_eth_link_get_nowait(portid, &link); 626e107e82eSAnatoly Burakov /* print link status if flag set */ 627e107e82eSAnatoly Burakov if (print_flag == 1) { 628e107e82eSAnatoly Burakov if (link.link_status) 629e107e82eSAnatoly Burakov printf("Port %d Link Up - speed %u " 630e107e82eSAnatoly Burakov "Mbps - %s\n", (uint8_t)portid, 631e107e82eSAnatoly Burakov (unsigned)link.link_speed, 632e107e82eSAnatoly Burakov (link.link_duplex == ETH_LINK_FULL_DUPLEX) ? 633e107e82eSAnatoly Burakov ("full-duplex") : ("half-duplex\n")); 634e107e82eSAnatoly Burakov else 635e107e82eSAnatoly Burakov printf("Port %d Link Down\n", 636e107e82eSAnatoly Burakov (uint8_t)portid); 637e107e82eSAnatoly Burakov continue; 638e107e82eSAnatoly Burakov } 639e107e82eSAnatoly Burakov /* clear all_ports_up flag if any link down */ 640e107e82eSAnatoly Burakov if (link.link_status == 0) { 641e107e82eSAnatoly Burakov all_ports_up = 0; 642e107e82eSAnatoly Burakov break; 643e107e82eSAnatoly Burakov } 644e107e82eSAnatoly Burakov } 645e107e82eSAnatoly Burakov /* after finally printing all link status, get out */ 646e107e82eSAnatoly Burakov if (print_flag == 1) 647e107e82eSAnatoly Burakov break; 648e107e82eSAnatoly Burakov 649e107e82eSAnatoly Burakov if (all_ports_up == 0) { 650e107e82eSAnatoly Burakov printf("."); 651e107e82eSAnatoly Burakov fflush(stdout); 652e107e82eSAnatoly Burakov rte_delay_ms(CHECK_INTERVAL); 653e107e82eSAnatoly Burakov } 654e107e82eSAnatoly Burakov 655e107e82eSAnatoly Burakov /* set the print_flag if all ports up or timeout */ 656e107e82eSAnatoly Burakov if (all_ports_up == 1 || count == (MAX_CHECK_TIME - 1)) { 657e107e82eSAnatoly Burakov print_flag = 1; 65874de12b7SAnatoly Burakov printf("\ndone\n"); 659e107e82eSAnatoly Burakov } 660e107e82eSAnatoly Burakov } 661e107e82eSAnatoly Burakov } 662e107e82eSAnatoly Burakov 66374de12b7SAnatoly Burakov static int 66474de12b7SAnatoly Burakov init_routing_table(void) 66574de12b7SAnatoly Burakov { 66674de12b7SAnatoly Burakov struct rte_lpm *lpm; 66774de12b7SAnatoly Burakov struct rte_lpm6 *lpm6; 66874de12b7SAnatoly Burakov int socket, ret; 66974de12b7SAnatoly Burakov unsigned i; 67074de12b7SAnatoly Burakov 67174de12b7SAnatoly Burakov for (socket = 0; socket < RTE_MAX_NUMA_NODES; socket++) { 67274de12b7SAnatoly Burakov if (socket_lpm[socket]) { 67374de12b7SAnatoly Burakov lpm = socket_lpm[socket]; 67474de12b7SAnatoly Burakov /* populate the LPM table */ 67574de12b7SAnatoly Burakov for (i = 0; i < RTE_DIM(l3fwd_ipv4_route_array); i++) { 67674de12b7SAnatoly Burakov ret = rte_lpm_add(lpm, 67774de12b7SAnatoly Burakov l3fwd_ipv4_route_array[i].ip, 67874de12b7SAnatoly Burakov l3fwd_ipv4_route_array[i].depth, 67974de12b7SAnatoly Burakov l3fwd_ipv4_route_array[i].if_out); 68074de12b7SAnatoly Burakov 68174de12b7SAnatoly Burakov if (ret < 0) { 68274de12b7SAnatoly Burakov RTE_LOG(ERR, IP_FRAG, "Unable to add entry %i to the l3fwd " 68374de12b7SAnatoly Burakov "LPM table\n", i); 68474de12b7SAnatoly Burakov return -1; 68574de12b7SAnatoly Burakov } 68674de12b7SAnatoly Burakov 68774de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "Socket %i: adding route " IPv4_BYTES_FMT 68874de12b7SAnatoly Burakov "/%d (port %d)\n", 68974de12b7SAnatoly Burakov socket, 69074de12b7SAnatoly Burakov IPv4_BYTES(l3fwd_ipv4_route_array[i].ip), 69174de12b7SAnatoly Burakov l3fwd_ipv4_route_array[i].depth, 69274de12b7SAnatoly Burakov l3fwd_ipv4_route_array[i].if_out); 69374de12b7SAnatoly Burakov } 69474de12b7SAnatoly Burakov } 69574de12b7SAnatoly Burakov 69674de12b7SAnatoly Burakov if (socket_lpm6[socket]) { 69774de12b7SAnatoly Burakov lpm6 = socket_lpm6[socket]; 69874de12b7SAnatoly Burakov /* populate the LPM6 table */ 69974de12b7SAnatoly Burakov for (i = 0; i < RTE_DIM(l3fwd_ipv6_route_array); i++) { 70074de12b7SAnatoly Burakov ret = rte_lpm6_add(lpm6, 70174de12b7SAnatoly Burakov l3fwd_ipv6_route_array[i].ip, 70274de12b7SAnatoly Burakov l3fwd_ipv6_route_array[i].depth, 70374de12b7SAnatoly Burakov l3fwd_ipv6_route_array[i].if_out); 70474de12b7SAnatoly Burakov 70574de12b7SAnatoly Burakov if (ret < 0) { 70674de12b7SAnatoly Burakov RTE_LOG(ERR, IP_FRAG, "Unable to add entry %i to the l3fwd " 70774de12b7SAnatoly Burakov "LPM6 table\n", i); 70874de12b7SAnatoly Burakov return -1; 70974de12b7SAnatoly Burakov } 71074de12b7SAnatoly Burakov 71174de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "Socket %i: adding route " IPv6_BYTES_FMT 71274de12b7SAnatoly Burakov "/%d (port %d)\n", 71374de12b7SAnatoly Burakov socket, 71474de12b7SAnatoly Burakov IPv6_BYTES(l3fwd_ipv6_route_array[i].ip), 71574de12b7SAnatoly Burakov l3fwd_ipv6_route_array[i].depth, 71674de12b7SAnatoly Burakov l3fwd_ipv6_route_array[i].if_out); 71774de12b7SAnatoly Burakov } 71874de12b7SAnatoly Burakov } 71974de12b7SAnatoly Burakov } 72074de12b7SAnatoly Burakov return 0; 72174de12b7SAnatoly Burakov } 72274de12b7SAnatoly Burakov 72374de12b7SAnatoly Burakov static int 72474de12b7SAnatoly Burakov init_mem(void) 72574de12b7SAnatoly Burakov { 72674de12b7SAnatoly Burakov char buf[PATH_MAX]; 72774de12b7SAnatoly Burakov struct rte_mempool *mp; 72874de12b7SAnatoly Burakov struct rte_lpm *lpm; 72974de12b7SAnatoly Burakov struct rte_lpm6 *lpm6; 73074de12b7SAnatoly Burakov int socket; 73174de12b7SAnatoly Burakov unsigned lcore_id; 73274de12b7SAnatoly Burakov 73374de12b7SAnatoly Burakov /* traverse through lcores and initialize structures on each socket */ 73474de12b7SAnatoly Burakov 73574de12b7SAnatoly Burakov for (lcore_id = 0; lcore_id < RTE_MAX_LCORE; lcore_id++) { 73674de12b7SAnatoly Burakov 73774de12b7SAnatoly Burakov if (rte_lcore_is_enabled(lcore_id) == 0) 73874de12b7SAnatoly Burakov continue; 73974de12b7SAnatoly Burakov 74074de12b7SAnatoly Burakov socket = rte_lcore_to_socket_id(lcore_id); 74174de12b7SAnatoly Burakov 74274de12b7SAnatoly Burakov if (socket == SOCKET_ID_ANY) 74374de12b7SAnatoly Burakov socket = 0; 74474de12b7SAnatoly Burakov 74574de12b7SAnatoly Burakov if (socket_direct_pool[socket] == NULL) { 74674de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "Creating direct mempool on socket %i\n", 74774de12b7SAnatoly Burakov socket); 7486f41fe75SStephen Hemminger snprintf(buf, sizeof(buf), "pool_direct_%i", socket); 74974de12b7SAnatoly Burakov 75074de12b7SAnatoly Burakov mp = rte_mempool_create(buf, NB_MBUF, 75174de12b7SAnatoly Burakov MBUF_SIZE, 32, 75274de12b7SAnatoly Burakov sizeof(struct rte_pktmbuf_pool_private), 75374de12b7SAnatoly Burakov rte_pktmbuf_pool_init, NULL, 75474de12b7SAnatoly Burakov rte_pktmbuf_init, NULL, 75574de12b7SAnatoly Burakov socket, 0); 75674de12b7SAnatoly Burakov if (mp == NULL) { 75774de12b7SAnatoly Burakov RTE_LOG(ERR, IP_FRAG, "Cannot create direct mempool\n"); 75874de12b7SAnatoly Burakov return -1; 75974de12b7SAnatoly Burakov } 76074de12b7SAnatoly Burakov socket_direct_pool[socket] = mp; 76174de12b7SAnatoly Burakov } 76274de12b7SAnatoly Burakov 76374de12b7SAnatoly Burakov if (socket_indirect_pool[socket] == NULL) { 76474de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "Creating indirect mempool on socket %i\n", 76574de12b7SAnatoly Burakov socket); 7666f41fe75SStephen Hemminger snprintf(buf, sizeof(buf), "pool_indirect_%i", socket); 76774de12b7SAnatoly Burakov 76874de12b7SAnatoly Burakov mp = rte_mempool_create(buf, NB_MBUF, 76974de12b7SAnatoly Burakov sizeof(struct rte_mbuf), 32, 77074de12b7SAnatoly Burakov 0, 77174de12b7SAnatoly Burakov NULL, NULL, 77274de12b7SAnatoly Burakov rte_pktmbuf_init, NULL, 77374de12b7SAnatoly Burakov socket, 0); 77474de12b7SAnatoly Burakov if (mp == NULL) { 77574de12b7SAnatoly Burakov RTE_LOG(ERR, IP_FRAG, "Cannot create indirect mempool\n"); 77674de12b7SAnatoly Burakov return -1; 77774de12b7SAnatoly Burakov } 77874de12b7SAnatoly Burakov socket_indirect_pool[socket] = mp; 77974de12b7SAnatoly Burakov } 78074de12b7SAnatoly Burakov 78174de12b7SAnatoly Burakov if (socket_lpm[socket] == NULL) { 78274de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "Creating LPM table on socket %i\n", socket); 7836f41fe75SStephen Hemminger snprintf(buf, sizeof(buf), "IP_FRAG_LPM_%i", socket); 78474de12b7SAnatoly Burakov 78574de12b7SAnatoly Burakov lpm = rte_lpm_create(buf, socket, LPM_MAX_RULES, 0); 78674de12b7SAnatoly Burakov if (lpm == NULL) { 78774de12b7SAnatoly Burakov RTE_LOG(ERR, IP_FRAG, "Cannot create LPM table\n"); 78874de12b7SAnatoly Burakov return -1; 78974de12b7SAnatoly Burakov } 79074de12b7SAnatoly Burakov socket_lpm[socket] = lpm; 79174de12b7SAnatoly Burakov } 79274de12b7SAnatoly Burakov 79374de12b7SAnatoly Burakov if (socket_lpm6[socket] == NULL) { 79474de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "Creating LPM6 table on socket %i\n", socket); 7956f41fe75SStephen Hemminger snprintf(buf, sizeof(buf), "IP_FRAG_LPM_%i", socket); 79674de12b7SAnatoly Burakov 79774de12b7SAnatoly Burakov lpm6 = rte_lpm6_create("IP_FRAG_LPM6", socket, &lpm6_config); 79874de12b7SAnatoly Burakov if (lpm6 == NULL) { 79974de12b7SAnatoly Burakov RTE_LOG(ERR, IP_FRAG, "Cannot create LPM table\n"); 80074de12b7SAnatoly Burakov return -1; 80174de12b7SAnatoly Burakov } 80274de12b7SAnatoly Burakov socket_lpm6[socket] = lpm6; 80374de12b7SAnatoly Burakov } 80474de12b7SAnatoly Burakov } 80574de12b7SAnatoly Burakov 80674de12b7SAnatoly Burakov return 0; 80774de12b7SAnatoly Burakov } 80874de12b7SAnatoly Burakov 809e107e82eSAnatoly Burakov int 810e107e82eSAnatoly Burakov MAIN(int argc, char **argv) 811e107e82eSAnatoly Burakov { 812e107e82eSAnatoly Burakov struct lcore_queue_conf *qconf; 81381f7ecd9SPablo de Lara struct rte_eth_dev_info dev_info; 81481f7ecd9SPablo de Lara struct rte_eth_txconf *txconf; 81574de12b7SAnatoly Burakov struct rx_queue *rxq; 81674de12b7SAnatoly Burakov int socket, ret; 81774de12b7SAnatoly Burakov unsigned nb_ports; 818e107e82eSAnatoly Burakov uint16_t queueid = 0; 819e107e82eSAnatoly Burakov unsigned lcore_id = 0, rx_lcore_id = 0; 820e107e82eSAnatoly Burakov uint32_t n_tx_queue, nb_lcores; 821e107e82eSAnatoly Burakov uint8_t portid; 822e107e82eSAnatoly Burakov 823e107e82eSAnatoly Burakov /* init EAL */ 824e107e82eSAnatoly Burakov ret = rte_eal_init(argc, argv); 825e107e82eSAnatoly Burakov if (ret < 0) 826e107e82eSAnatoly Burakov rte_exit(EXIT_FAILURE, "rte_eal_init failed"); 827e107e82eSAnatoly Burakov argc -= ret; 828e107e82eSAnatoly Burakov argv += ret; 829e107e82eSAnatoly Burakov 830e107e82eSAnatoly Burakov /* parse application arguments (after the EAL ones) */ 831e107e82eSAnatoly Burakov ret = parse_args(argc, argv); 832e107e82eSAnatoly Burakov if (ret < 0) 833e107e82eSAnatoly Burakov rte_exit(EXIT_FAILURE, "Invalid arguments"); 834e107e82eSAnatoly Burakov 835e107e82eSAnatoly Burakov nb_ports = rte_eth_dev_count(); 836e107e82eSAnatoly Burakov if (nb_ports > RTE_MAX_ETHPORTS) 837e107e82eSAnatoly Burakov nb_ports = RTE_MAX_ETHPORTS; 83874de12b7SAnatoly Burakov else if (nb_ports == 0) 83974de12b7SAnatoly Burakov rte_exit(EXIT_FAILURE, "No ports found!\n"); 840e107e82eSAnatoly Burakov 841e107e82eSAnatoly Burakov nb_lcores = rte_lcore_count(); 842e107e82eSAnatoly Burakov 84374de12b7SAnatoly Burakov /* initialize structures (mempools, lpm etc.) */ 84474de12b7SAnatoly Burakov if (init_mem() < 0) 84574de12b7SAnatoly Burakov rte_panic("Cannot initialize memory structures!\n"); 84674de12b7SAnatoly Burakov 847eaa8d3bfSAnatoly Burakov /* check if portmask has non-existent ports */ 848eaa8d3bfSAnatoly Burakov if (enabled_port_mask & ~(RTE_LEN2MASK(nb_ports, unsigned))) 849eaa8d3bfSAnatoly Burakov rte_exit(EXIT_FAILURE, "Non-existent ports in portmask!\n"); 850eaa8d3bfSAnatoly Burakov 851e107e82eSAnatoly Burakov /* initialize all ports */ 852e107e82eSAnatoly Burakov for (portid = 0; portid < nb_ports; portid++) { 853e107e82eSAnatoly Burakov /* skip ports that are not enabled */ 854e107e82eSAnatoly Burakov if ((enabled_port_mask & (1 << portid)) == 0) { 855e107e82eSAnatoly Burakov printf("Skipping disabled port %d\n", portid); 856e107e82eSAnatoly Burakov continue; 857e107e82eSAnatoly Burakov } 858e107e82eSAnatoly Burakov 859e107e82eSAnatoly Burakov qconf = &lcore_queue_conf[rx_lcore_id]; 860e107e82eSAnatoly Burakov 861e107e82eSAnatoly Burakov /* get the lcore_id for this port */ 862e107e82eSAnatoly Burakov while (rte_lcore_is_enabled(rx_lcore_id) == 0 || 863e107e82eSAnatoly Burakov qconf->n_rx_queue == (unsigned)rx_queue_per_lcore) { 864e107e82eSAnatoly Burakov 865e107e82eSAnatoly Burakov rx_lcore_id ++; 866e107e82eSAnatoly Burakov if (rx_lcore_id >= RTE_MAX_LCORE) 867e107e82eSAnatoly Burakov rte_exit(EXIT_FAILURE, "Not enough cores\n"); 868e107e82eSAnatoly Burakov 869e107e82eSAnatoly Burakov qconf = &lcore_queue_conf[rx_lcore_id]; 870e107e82eSAnatoly Burakov } 87174de12b7SAnatoly Burakov 872324bcf45SAnatoly Burakov socket = (int) rte_lcore_to_socket_id(rx_lcore_id); 87374de12b7SAnatoly Burakov if (socket == SOCKET_ID_ANY) 87474de12b7SAnatoly Burakov socket = 0; 87574de12b7SAnatoly Burakov 87674de12b7SAnatoly Burakov rxq = &qconf->rx_queue_list[qconf->n_rx_queue]; 87774de12b7SAnatoly Burakov rxq->portid = portid; 87874de12b7SAnatoly Burakov rxq->direct_pool = socket_direct_pool[socket]; 87974de12b7SAnatoly Burakov rxq->indirect_pool = socket_indirect_pool[socket]; 88074de12b7SAnatoly Burakov rxq->lpm = socket_lpm[socket]; 88174de12b7SAnatoly Burakov rxq->lpm6 = socket_lpm6[socket]; 882e107e82eSAnatoly Burakov qconf->n_rx_queue++; 883e107e82eSAnatoly Burakov 884e107e82eSAnatoly Burakov /* init port */ 885e107e82eSAnatoly Burakov printf("Initializing port %d on lcore %u...", portid, 886e107e82eSAnatoly Burakov rx_lcore_id); 887e107e82eSAnatoly Burakov fflush(stdout); 888e107e82eSAnatoly Burakov 889e107e82eSAnatoly Burakov n_tx_queue = nb_lcores; 890e107e82eSAnatoly Burakov if (n_tx_queue > MAX_TX_QUEUE_PER_PORT) 891e107e82eSAnatoly Burakov n_tx_queue = MAX_TX_QUEUE_PER_PORT; 892e107e82eSAnatoly Burakov ret = rte_eth_dev_configure(portid, 1, (uint16_t)n_tx_queue, 893e107e82eSAnatoly Burakov &port_conf); 89474de12b7SAnatoly Burakov if (ret < 0) { 89574de12b7SAnatoly Burakov printf("\n"); 896e107e82eSAnatoly Burakov rte_exit(EXIT_FAILURE, "Cannot configure device: " 897e107e82eSAnatoly Burakov "err=%d, port=%d\n", 898e107e82eSAnatoly Burakov ret, portid); 89974de12b7SAnatoly Burakov } 90074de12b7SAnatoly Burakov 90174de12b7SAnatoly Burakov /* init one RX queue */ 90274de12b7SAnatoly Burakov ret = rte_eth_rx_queue_setup(portid, 0, nb_rxd, 90381f7ecd9SPablo de Lara socket, NULL, 90474de12b7SAnatoly Burakov socket_direct_pool[socket]); 90574de12b7SAnatoly Burakov if (ret < 0) { 90674de12b7SAnatoly Burakov printf("\n"); 90774de12b7SAnatoly Burakov rte_exit(EXIT_FAILURE, "rte_eth_rx_queue_setup: " 90874de12b7SAnatoly Burakov "err=%d, port=%d\n", 90974de12b7SAnatoly Burakov ret, portid); 91074de12b7SAnatoly Burakov } 911e107e82eSAnatoly Burakov 912e107e82eSAnatoly Burakov rte_eth_macaddr_get(portid, &ports_eth_addr[portid]); 913e107e82eSAnatoly Burakov print_ethaddr(" Address:", &ports_eth_addr[portid]); 91474de12b7SAnatoly Burakov printf("\n"); 915e107e82eSAnatoly Burakov 916e107e82eSAnatoly Burakov /* init one TX queue per couple (lcore,port) */ 917e107e82eSAnatoly Burakov queueid = 0; 918e107e82eSAnatoly Burakov for (lcore_id = 0; lcore_id < RTE_MAX_LCORE; lcore_id++) { 919e107e82eSAnatoly Burakov if (rte_lcore_is_enabled(lcore_id) == 0) 920e107e82eSAnatoly Burakov continue; 92174de12b7SAnatoly Burakov 92274de12b7SAnatoly Burakov socket = (int) rte_lcore_to_socket_id(lcore_id); 923e107e82eSAnatoly Burakov printf("txq=%u,%d ", lcore_id, queueid); 924e107e82eSAnatoly Burakov fflush(stdout); 92581f7ecd9SPablo de Lara 92681f7ecd9SPablo de Lara rte_eth_dev_info_get(portid, &dev_info); 92781f7ecd9SPablo de Lara txconf = &dev_info.default_txconf; 92881f7ecd9SPablo de Lara txconf->txq_flags = 0; 929e107e82eSAnatoly Burakov ret = rte_eth_tx_queue_setup(portid, queueid, nb_txd, 93081f7ecd9SPablo de Lara socket, txconf); 93174de12b7SAnatoly Burakov if (ret < 0) { 93274de12b7SAnatoly Burakov printf("\n"); 933e107e82eSAnatoly Burakov rte_exit(EXIT_FAILURE, "rte_eth_tx_queue_setup: " 934e107e82eSAnatoly Burakov "err=%d, port=%d\n", ret, portid); 93574de12b7SAnatoly Burakov } 936e107e82eSAnatoly Burakov 937e107e82eSAnatoly Burakov qconf = &lcore_queue_conf[lcore_id]; 938e107e82eSAnatoly Burakov qconf->tx_queue_id[portid] = queueid; 939e107e82eSAnatoly Burakov queueid++; 940e107e82eSAnatoly Burakov } 941e107e82eSAnatoly Burakov 94274de12b7SAnatoly Burakov printf("\n"); 94374de12b7SAnatoly Burakov } 94474de12b7SAnatoly Burakov 94574de12b7SAnatoly Burakov printf("\n"); 94674de12b7SAnatoly Burakov 94774de12b7SAnatoly Burakov /* start ports */ 94874de12b7SAnatoly Burakov for (portid = 0; portid < nb_ports; portid++) { 94974de12b7SAnatoly Burakov if ((enabled_port_mask & (1 << portid)) == 0) { 95074de12b7SAnatoly Burakov continue; 95174de12b7SAnatoly Burakov } 952e107e82eSAnatoly Burakov /* Start device */ 953e107e82eSAnatoly Burakov ret = rte_eth_dev_start(portid); 954e107e82eSAnatoly Burakov if (ret < 0) 95574de12b7SAnatoly Burakov rte_exit(EXIT_FAILURE, "rte_eth_dev_start: err=%d, port=%d\n", 956e107e82eSAnatoly Burakov ret, portid); 957e107e82eSAnatoly Burakov 958e107e82eSAnatoly Burakov rte_eth_promiscuous_enable(portid); 959e107e82eSAnatoly Burakov } 960e107e82eSAnatoly Burakov 96174de12b7SAnatoly Burakov if (init_routing_table() < 0) 96274de12b7SAnatoly Burakov rte_exit(EXIT_FAILURE, "Cannot init routing table\n"); 96374de12b7SAnatoly Burakov 964e107e82eSAnatoly Burakov check_all_ports_link_status((uint8_t)nb_ports, enabled_port_mask); 965e107e82eSAnatoly Burakov 966e107e82eSAnatoly Burakov /* launch per-lcore init on every lcore */ 967e107e82eSAnatoly Burakov rte_eal_mp_remote_launch(main_loop, NULL, CALL_MASTER); 968e107e82eSAnatoly Burakov RTE_LCORE_FOREACH_SLAVE(lcore_id) { 969e107e82eSAnatoly Burakov if (rte_eal_wait_lcore(lcore_id) < 0) 970e107e82eSAnatoly Burakov return -1; 971e107e82eSAnatoly Burakov } 972e107e82eSAnatoly Burakov 973e107e82eSAnatoly Burakov return 0; 974e107e82eSAnatoly Burakov } 975