1e107e82eSAnatoly Burakov /*- 2e107e82eSAnatoly Burakov * BSD LICENSE 3e107e82eSAnatoly Burakov * 4e107e82eSAnatoly Burakov * Copyright(c) 2010-2014 Intel Corporation. All rights reserved. 5e107e82eSAnatoly Burakov * All rights reserved. 6e107e82eSAnatoly Burakov * 7e107e82eSAnatoly Burakov * Redistribution and use in source and binary forms, with or without 8e107e82eSAnatoly Burakov * modification, are permitted provided that the following conditions 9e107e82eSAnatoly Burakov * are met: 10e107e82eSAnatoly Burakov * 11e107e82eSAnatoly Burakov * * Redistributions of source code must retain the above copyright 12e107e82eSAnatoly Burakov * notice, this list of conditions and the following disclaimer. 13e107e82eSAnatoly Burakov * * Redistributions in binary form must reproduce the above copyright 14e107e82eSAnatoly Burakov * notice, this list of conditions and the following disclaimer in 15e107e82eSAnatoly Burakov * the documentation and/or other materials provided with the 16e107e82eSAnatoly Burakov * distribution. 17e107e82eSAnatoly Burakov * * Neither the name of Intel Corporation nor the names of its 18e107e82eSAnatoly Burakov * contributors may be used to endorse or promote products derived 19e107e82eSAnatoly Burakov * from this software without specific prior written permission. 20e107e82eSAnatoly Burakov * 21e107e82eSAnatoly Burakov * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 22e107e82eSAnatoly Burakov * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 23e107e82eSAnatoly Burakov * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 24e107e82eSAnatoly Burakov * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT 25e107e82eSAnatoly Burakov * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 26e107e82eSAnatoly Burakov * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT 27e107e82eSAnatoly Burakov * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 28e107e82eSAnatoly Burakov * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 29e107e82eSAnatoly Burakov * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 30e107e82eSAnatoly Burakov * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 31e107e82eSAnatoly Burakov * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 32e107e82eSAnatoly Burakov */ 33e107e82eSAnatoly Burakov 34e107e82eSAnatoly Burakov #include <stdio.h> 35e107e82eSAnatoly Burakov #include <stdlib.h> 36e107e82eSAnatoly Burakov #include <stdint.h> 37e107e82eSAnatoly Burakov #include <inttypes.h> 38e107e82eSAnatoly Burakov #include <sys/types.h> 39e107e82eSAnatoly Burakov #include <sys/param.h> 40e107e82eSAnatoly Burakov #include <string.h> 41e107e82eSAnatoly Burakov #include <sys/queue.h> 42e107e82eSAnatoly Burakov #include <stdarg.h> 43e107e82eSAnatoly Burakov #include <errno.h> 44e107e82eSAnatoly Burakov #include <getopt.h> 45e107e82eSAnatoly Burakov 46e107e82eSAnatoly Burakov #include <rte_common.h> 47e107e82eSAnatoly Burakov #include <rte_byteorder.h> 48e107e82eSAnatoly Burakov #include <rte_log.h> 49e107e82eSAnatoly Burakov #include <rte_memory.h> 50e107e82eSAnatoly Burakov #include <rte_memcpy.h> 51e107e82eSAnatoly Burakov #include <rte_memzone.h> 52e107e82eSAnatoly Burakov #include <rte_tailq.h> 53e107e82eSAnatoly Burakov #include <rte_eal.h> 54e107e82eSAnatoly Burakov #include <rte_per_lcore.h> 55e107e82eSAnatoly Burakov #include <rte_launch.h> 56e107e82eSAnatoly Burakov #include <rte_atomic.h> 57e107e82eSAnatoly Burakov #include <rte_cycles.h> 58e107e82eSAnatoly Burakov #include <rte_prefetch.h> 59e107e82eSAnatoly Burakov #include <rte_lcore.h> 60e107e82eSAnatoly Burakov #include <rte_per_lcore.h> 61e107e82eSAnatoly Burakov #include <rte_branch_prediction.h> 62e107e82eSAnatoly Burakov #include <rte_interrupts.h> 63e107e82eSAnatoly Burakov #include <rte_pci.h> 64e107e82eSAnatoly Burakov #include <rte_random.h> 65e107e82eSAnatoly Burakov #include <rte_debug.h> 66e107e82eSAnatoly Burakov #include <rte_ether.h> 67e107e82eSAnatoly Burakov #include <rte_ethdev.h> 68e107e82eSAnatoly Burakov #include <rte_ring.h> 69e107e82eSAnatoly Burakov #include <rte_mempool.h> 70e107e82eSAnatoly Burakov #include <rte_mbuf.h> 71e107e82eSAnatoly Burakov #include <rte_lpm.h> 7274de12b7SAnatoly Burakov #include <rte_lpm6.h> 73e107e82eSAnatoly Burakov #include <rte_ip.h> 7474de12b7SAnatoly Burakov #include <rte_string_fns.h> 75e107e82eSAnatoly Burakov 7674de12b7SAnatoly Burakov #include <rte_ip_frag.h> 7774de12b7SAnatoly Burakov 78e107e82eSAnatoly Burakov #include "main.h" 79e107e82eSAnatoly Burakov 8074de12b7SAnatoly Burakov #define RTE_LOGTYPE_IP_FRAG RTE_LOGTYPE_USER1 81e107e82eSAnatoly Burakov 82e107e82eSAnatoly Burakov #define MBUF_SIZE (2048 + sizeof(struct rte_mbuf) + RTE_PKTMBUF_HEADROOM) 83e107e82eSAnatoly Burakov 84e107e82eSAnatoly Burakov /* allow max jumbo frame 9.5 KB */ 85e107e82eSAnatoly Burakov #define JUMBO_FRAME_MAX_SIZE 0x2600 86e107e82eSAnatoly Burakov 87e107e82eSAnatoly Burakov #define ROUNDUP_DIV(a, b) (((a) + (b) - 1) / (b)) 88e107e82eSAnatoly Burakov 89e107e82eSAnatoly Burakov /* 9074de12b7SAnatoly Burakov * Default byte size for the IPv6 Maximum Transfer Unit (MTU). 9174de12b7SAnatoly Burakov * This value includes the size of IPv6 header. 92e107e82eSAnatoly Burakov */ 9374de12b7SAnatoly Burakov #define IPV4_MTU_DEFAULT ETHER_MTU 9474de12b7SAnatoly Burakov #define IPV6_MTU_DEFAULT ETHER_MTU 9574de12b7SAnatoly Burakov 9674de12b7SAnatoly Burakov /* 9774de12b7SAnatoly Burakov * Default payload in bytes for the IPv6 packet. 9874de12b7SAnatoly Burakov */ 9974de12b7SAnatoly Burakov #define IPV4_DEFAULT_PAYLOAD (IPV4_MTU_DEFAULT - sizeof(struct ipv4_hdr)) 10074de12b7SAnatoly Burakov #define IPV6_DEFAULT_PAYLOAD (IPV6_MTU_DEFAULT - sizeof(struct ipv6_hdr)) 10174de12b7SAnatoly Burakov 10274de12b7SAnatoly Burakov /* 10374de12b7SAnatoly Burakov * Max number of fragments per packet expected - defined by config file. 10474de12b7SAnatoly Burakov */ 10574de12b7SAnatoly Burakov #define MAX_PACKET_FRAG RTE_LIBRTE_IP_FRAG_MAX_FRAG 106e107e82eSAnatoly Burakov 107e107e82eSAnatoly Burakov #define NB_MBUF 8192 108e107e82eSAnatoly Burakov 109e107e82eSAnatoly Burakov /* 110e107e82eSAnatoly Burakov * RX and TX Prefetch, Host, and Write-back threshold values should be 111e107e82eSAnatoly Burakov * carefully set for optimal performance. Consult the network 112e107e82eSAnatoly Burakov * controller's datasheet and supporting DPDK documentation for guidance 113e107e82eSAnatoly Burakov * on how these parameters should be set. 114e107e82eSAnatoly Burakov */ 115e107e82eSAnatoly Burakov #define RX_PTHRESH 8 /**< Default values of RX prefetch threshold reg. */ 116e107e82eSAnatoly Burakov #define RX_HTHRESH 8 /**< Default values of RX host threshold reg. */ 117e107e82eSAnatoly Burakov #define RX_WTHRESH 4 /**< Default values of RX write-back threshold reg. */ 118e107e82eSAnatoly Burakov 119e107e82eSAnatoly Burakov /* 120e107e82eSAnatoly Burakov * These default values are optimized for use with the Intel(R) 82599 10 GbE 121e107e82eSAnatoly Burakov * Controller and the DPDK ixgbe PMD. Consider using other values for other 122e107e82eSAnatoly Burakov * network controllers and/or network drivers. 123e107e82eSAnatoly Burakov */ 124e107e82eSAnatoly Burakov #define TX_PTHRESH 36 /**< Default values of TX prefetch threshold reg. */ 125e107e82eSAnatoly Burakov #define TX_HTHRESH 0 /**< Default values of TX host threshold reg. */ 126e107e82eSAnatoly Burakov #define TX_WTHRESH 0 /**< Default values of TX write-back threshold reg. */ 127e107e82eSAnatoly Burakov 128e107e82eSAnatoly Burakov #define MAX_PKT_BURST 32 129e107e82eSAnatoly Burakov #define BURST_TX_DRAIN_US 100 /* TX drain every ~100us */ 130e107e82eSAnatoly Burakov 131e107e82eSAnatoly Burakov /* Configure how many packets ahead to prefetch, when reading packets */ 132e107e82eSAnatoly Burakov #define PREFETCH_OFFSET 3 133e107e82eSAnatoly Burakov 134e107e82eSAnatoly Burakov /* 135e107e82eSAnatoly Burakov * Configurable number of RX/TX ring descriptors 136e107e82eSAnatoly Burakov */ 137e107e82eSAnatoly Burakov #define RTE_TEST_RX_DESC_DEFAULT 128 138e107e82eSAnatoly Burakov #define RTE_TEST_TX_DESC_DEFAULT 512 139e107e82eSAnatoly Burakov static uint16_t nb_rxd = RTE_TEST_RX_DESC_DEFAULT; 140e107e82eSAnatoly Burakov static uint16_t nb_txd = RTE_TEST_TX_DESC_DEFAULT; 141e107e82eSAnatoly Burakov 142e107e82eSAnatoly Burakov /* ethernet addresses of ports */ 143e107e82eSAnatoly Burakov static struct ether_addr ports_eth_addr[RTE_MAX_ETHPORTS]; 14474de12b7SAnatoly Burakov 14574de12b7SAnatoly Burakov #ifndef IPv4_BYTES 14674de12b7SAnatoly Burakov #define IPv4_BYTES_FMT "%" PRIu8 ".%" PRIu8 ".%" PRIu8 ".%" PRIu8 14774de12b7SAnatoly Burakov #define IPv4_BYTES(addr) \ 14874de12b7SAnatoly Burakov (uint8_t) (((addr) >> 24) & 0xFF),\ 14974de12b7SAnatoly Burakov (uint8_t) (((addr) >> 16) & 0xFF),\ 15074de12b7SAnatoly Burakov (uint8_t) (((addr) >> 8) & 0xFF),\ 15174de12b7SAnatoly Burakov (uint8_t) ((addr) & 0xFF) 15274de12b7SAnatoly Burakov #endif 15374de12b7SAnatoly Burakov 15474de12b7SAnatoly Burakov #ifndef IPv6_BYTES 15574de12b7SAnatoly Burakov #define IPv6_BYTES_FMT "%02x%02x:%02x%02x:%02x%02x:%02x%02x:"\ 15674de12b7SAnatoly Burakov "%02x%02x:%02x%02x:%02x%02x:%02x%02x" 15774de12b7SAnatoly Burakov #define IPv6_BYTES(addr) \ 15874de12b7SAnatoly Burakov addr[0], addr[1], addr[2], addr[3], \ 15974de12b7SAnatoly Burakov addr[4], addr[5], addr[6], addr[7], \ 16074de12b7SAnatoly Burakov addr[8], addr[9], addr[10], addr[11],\ 16174de12b7SAnatoly Burakov addr[12], addr[13],addr[14], addr[15] 16274de12b7SAnatoly Burakov #endif 16374de12b7SAnatoly Burakov 16474de12b7SAnatoly Burakov #define IPV6_ADDR_LEN 16 165e107e82eSAnatoly Burakov 166e107e82eSAnatoly Burakov /* mask of enabled ports */ 167e107e82eSAnatoly Burakov static int enabled_port_mask = 0; 168e107e82eSAnatoly Burakov 169e107e82eSAnatoly Burakov static int rx_queue_per_lcore = 1; 170e107e82eSAnatoly Burakov 171e107e82eSAnatoly Burakov #define MBUF_TABLE_SIZE (2 * MAX(MAX_PKT_BURST, MAX_PACKET_FRAG)) 172e107e82eSAnatoly Burakov 173e107e82eSAnatoly Burakov struct mbuf_table { 174e107e82eSAnatoly Burakov uint16_t len; 175e107e82eSAnatoly Burakov struct rte_mbuf *m_table[MBUF_TABLE_SIZE]; 176e107e82eSAnatoly Burakov }; 177e107e82eSAnatoly Burakov 17874de12b7SAnatoly Burakov struct rx_queue { 17974de12b7SAnatoly Burakov struct rte_mempool *direct_pool; 18074de12b7SAnatoly Burakov struct rte_mempool *indirect_pool; 18174de12b7SAnatoly Burakov struct rte_lpm *lpm; 18274de12b7SAnatoly Burakov struct rte_lpm6 *lpm6; 18374de12b7SAnatoly Burakov uint8_t portid; 18474de12b7SAnatoly Burakov }; 18574de12b7SAnatoly Burakov 186e107e82eSAnatoly Burakov #define MAX_RX_QUEUE_PER_LCORE 16 187e107e82eSAnatoly Burakov #define MAX_TX_QUEUE_PER_PORT 16 188e107e82eSAnatoly Burakov struct lcore_queue_conf { 189e107e82eSAnatoly Burakov uint16_t n_rx_queue; 190e107e82eSAnatoly Burakov uint16_t tx_queue_id[RTE_MAX_ETHPORTS]; 19174de12b7SAnatoly Burakov struct rx_queue rx_queue_list[MAX_RX_QUEUE_PER_LCORE]; 192e107e82eSAnatoly Burakov struct mbuf_table tx_mbufs[RTE_MAX_ETHPORTS]; 193e107e82eSAnatoly Burakov } __rte_cache_aligned; 194e107e82eSAnatoly Burakov struct lcore_queue_conf lcore_queue_conf[RTE_MAX_LCORE]; 195e107e82eSAnatoly Burakov 196e107e82eSAnatoly Burakov static const struct rte_eth_conf port_conf = { 197e107e82eSAnatoly Burakov .rxmode = { 198e107e82eSAnatoly Burakov .max_rx_pkt_len = JUMBO_FRAME_MAX_SIZE, 199e107e82eSAnatoly Burakov .split_hdr_size = 0, 200e107e82eSAnatoly Burakov .header_split = 0, /**< Header Split disabled */ 20174de12b7SAnatoly Burakov .hw_ip_checksum = 1, /**< IP checksum offload enabled */ 202e107e82eSAnatoly Burakov .hw_vlan_filter = 0, /**< VLAN filtering disabled */ 203e107e82eSAnatoly Burakov .jumbo_frame = 1, /**< Jumbo Frame Support enabled */ 204e107e82eSAnatoly Burakov .hw_strip_crc = 0, /**< CRC stripped by hardware */ 205e107e82eSAnatoly Burakov }, 206e107e82eSAnatoly Burakov .txmode = { 207e107e82eSAnatoly Burakov .mq_mode = ETH_MQ_TX_NONE, 208e107e82eSAnatoly Burakov }, 209e107e82eSAnatoly Burakov }; 210e107e82eSAnatoly Burakov 211e107e82eSAnatoly Burakov static const struct rte_eth_rxconf rx_conf = { 212e107e82eSAnatoly Burakov .rx_thresh = { 213e107e82eSAnatoly Burakov .pthresh = RX_PTHRESH, 214e107e82eSAnatoly Burakov .hthresh = RX_HTHRESH, 215e107e82eSAnatoly Burakov .wthresh = RX_WTHRESH, 216e107e82eSAnatoly Burakov }, 217e107e82eSAnatoly Burakov }; 218e107e82eSAnatoly Burakov 219e107e82eSAnatoly Burakov static const struct rte_eth_txconf tx_conf = { 220e107e82eSAnatoly Burakov .tx_thresh = { 221e107e82eSAnatoly Burakov .pthresh = TX_PTHRESH, 222e107e82eSAnatoly Burakov .hthresh = TX_HTHRESH, 223e107e82eSAnatoly Burakov .wthresh = TX_WTHRESH, 224e107e82eSAnatoly Burakov }, 225e107e82eSAnatoly Burakov .tx_free_thresh = 0, /* Use PMD default values */ 226e107e82eSAnatoly Burakov .tx_rs_thresh = 0, /* Use PMD default values */ 227e107e82eSAnatoly Burakov }; 228e107e82eSAnatoly Burakov 22974de12b7SAnatoly Burakov /* 23074de12b7SAnatoly Burakov * IPv4 forwarding table 23174de12b7SAnatoly Burakov */ 23274de12b7SAnatoly Burakov struct l3fwd_ipv4_route { 233e107e82eSAnatoly Burakov uint32_t ip; 234e107e82eSAnatoly Burakov uint8_t depth; 235e107e82eSAnatoly Burakov uint8_t if_out; 236e107e82eSAnatoly Burakov }; 237e107e82eSAnatoly Burakov 23874de12b7SAnatoly Burakov struct l3fwd_ipv4_route l3fwd_ipv4_route_array[] = { 23974de12b7SAnatoly Burakov {IPv4(100,10,0,0), 16, 0}, 24074de12b7SAnatoly Burakov {IPv4(100,20,0,0), 16, 1}, 24174de12b7SAnatoly Burakov {IPv4(100,30,0,0), 16, 2}, 24274de12b7SAnatoly Burakov {IPv4(100,40,0,0), 16, 3}, 24374de12b7SAnatoly Burakov {IPv4(100,50,0,0), 16, 4}, 24474de12b7SAnatoly Burakov {IPv4(100,60,0,0), 16, 5}, 24574de12b7SAnatoly Burakov {IPv4(100,70,0,0), 16, 6}, 24674de12b7SAnatoly Burakov {IPv4(100,80,0,0), 16, 7}, 247e107e82eSAnatoly Burakov }; 248e107e82eSAnatoly Burakov 24974de12b7SAnatoly Burakov /* 25074de12b7SAnatoly Burakov * IPv6 forwarding table 25174de12b7SAnatoly Burakov */ 252e107e82eSAnatoly Burakov 25374de12b7SAnatoly Burakov struct l3fwd_ipv6_route { 25474de12b7SAnatoly Burakov uint8_t ip[IPV6_ADDR_LEN]; 25574de12b7SAnatoly Burakov uint8_t depth; 25674de12b7SAnatoly Burakov uint8_t if_out; 25774de12b7SAnatoly Burakov }; 258e107e82eSAnatoly Burakov 25974de12b7SAnatoly Burakov static struct l3fwd_ipv6_route l3fwd_ipv6_route_array[] = { 26074de12b7SAnatoly Burakov {{1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 0}, 26174de12b7SAnatoly Burakov {{2,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 1}, 26274de12b7SAnatoly Burakov {{3,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 2}, 26374de12b7SAnatoly Burakov {{4,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 3}, 26474de12b7SAnatoly Burakov {{5,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 4}, 26574de12b7SAnatoly Burakov {{6,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 5}, 26674de12b7SAnatoly Burakov {{7,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 6}, 26774de12b7SAnatoly Burakov {{8,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 7}, 26874de12b7SAnatoly Burakov }; 26974de12b7SAnatoly Burakov 27074de12b7SAnatoly Burakov #define LPM_MAX_RULES 1024 27174de12b7SAnatoly Burakov #define LPM6_MAX_RULES 1024 27274de12b7SAnatoly Burakov #define LPM6_NUMBER_TBL8S (1 << 16) 27374de12b7SAnatoly Burakov 27474de12b7SAnatoly Burakov struct rte_lpm6_config lpm6_config = { 27574de12b7SAnatoly Burakov .max_rules = LPM6_MAX_RULES, 27674de12b7SAnatoly Burakov .number_tbl8s = LPM6_NUMBER_TBL8S, 27774de12b7SAnatoly Burakov .flags = 0 27874de12b7SAnatoly Burakov }; 27974de12b7SAnatoly Burakov 28074de12b7SAnatoly Burakov static struct rte_mempool *socket_direct_pool[RTE_MAX_NUMA_NODES]; 28174de12b7SAnatoly Burakov static struct rte_mempool *socket_indirect_pool[RTE_MAX_NUMA_NODES]; 28274de12b7SAnatoly Burakov static struct rte_lpm *socket_lpm[RTE_MAX_NUMA_NODES]; 28374de12b7SAnatoly Burakov static struct rte_lpm6 *socket_lpm6[RTE_MAX_NUMA_NODES]; 284e107e82eSAnatoly Burakov 285e107e82eSAnatoly Burakov /* Send burst of packets on an output interface */ 286e107e82eSAnatoly Burakov static inline int 287e107e82eSAnatoly Burakov send_burst(struct lcore_queue_conf *qconf, uint16_t n, uint8_t port) 288e107e82eSAnatoly Burakov { 289e107e82eSAnatoly Burakov struct rte_mbuf **m_table; 290e107e82eSAnatoly Burakov int ret; 291e107e82eSAnatoly Burakov uint16_t queueid; 292e107e82eSAnatoly Burakov 293e107e82eSAnatoly Burakov queueid = qconf->tx_queue_id[port]; 294e107e82eSAnatoly Burakov m_table = (struct rte_mbuf **)qconf->tx_mbufs[port].m_table; 295e107e82eSAnatoly Burakov 296e107e82eSAnatoly Burakov ret = rte_eth_tx_burst(port, queueid, m_table, n); 297e107e82eSAnatoly Burakov if (unlikely(ret < n)) { 298e107e82eSAnatoly Burakov do { 299e107e82eSAnatoly Burakov rte_pktmbuf_free(m_table[ret]); 300e107e82eSAnatoly Burakov } while (++ret < n); 301e107e82eSAnatoly Burakov } 302e107e82eSAnatoly Burakov 303e107e82eSAnatoly Burakov return 0; 304e107e82eSAnatoly Burakov } 305e107e82eSAnatoly Burakov 306e107e82eSAnatoly Burakov static inline void 30774de12b7SAnatoly Burakov l3fwd_simple_forward(struct rte_mbuf *m, struct lcore_queue_conf *qconf, 30874de12b7SAnatoly Burakov uint8_t queueid, uint8_t port_in) 309e107e82eSAnatoly Burakov { 31074de12b7SAnatoly Burakov struct rx_queue *rxq; 31174de12b7SAnatoly Burakov uint32_t i, len; 31274de12b7SAnatoly Burakov uint8_t next_hop, port_out, ipv6; 313e107e82eSAnatoly Burakov int32_t len2; 314e107e82eSAnatoly Burakov 31574de12b7SAnatoly Burakov ipv6 = 0; 31674de12b7SAnatoly Burakov rxq = &qconf->rx_queue_list[queueid]; 31774de12b7SAnatoly Burakov 31874de12b7SAnatoly Burakov /* by default, send everything back to the source port */ 31974de12b7SAnatoly Burakov port_out = port_in; 320e107e82eSAnatoly Burakov 321e107e82eSAnatoly Burakov /* Remove the Ethernet header and trailer from the input packet */ 322e107e82eSAnatoly Burakov rte_pktmbuf_adj(m, (uint16_t)sizeof(struct ether_hdr)); 323e107e82eSAnatoly Burakov 32474de12b7SAnatoly Burakov /* Build transmission burst */ 32574de12b7SAnatoly Burakov len = qconf->tx_mbufs[port_out].len; 32674de12b7SAnatoly Burakov 32774de12b7SAnatoly Burakov /* if this is an IPv4 packet */ 32874de12b7SAnatoly Burakov if (m->ol_flags & PKT_RX_IPV4_HDR) { 32974de12b7SAnatoly Burakov struct ipv4_hdr *ip_hdr; 33074de12b7SAnatoly Burakov uint32_t ip_dst; 331e107e82eSAnatoly Burakov /* Read the lookup key (i.e. ip_dst) from the input packet */ 332e107e82eSAnatoly Burakov ip_hdr = rte_pktmbuf_mtod(m, struct ipv4_hdr *); 333e107e82eSAnatoly Burakov ip_dst = rte_be_to_cpu_32(ip_hdr->dst_addr); 334e107e82eSAnatoly Burakov 335e107e82eSAnatoly Burakov /* Find destination port */ 33674de12b7SAnatoly Burakov if (rte_lpm_lookup(rxq->lpm, ip_dst, &next_hop) == 0 && 33774de12b7SAnatoly Burakov (enabled_port_mask & 1 << next_hop) != 0) { 338e107e82eSAnatoly Burakov port_out = next_hop; 339e107e82eSAnatoly Burakov 34074de12b7SAnatoly Burakov /* Build transmission burst for new port */ 341e107e82eSAnatoly Burakov len = qconf->tx_mbufs[port_out].len; 34274de12b7SAnatoly Burakov } 343e107e82eSAnatoly Burakov 344e107e82eSAnatoly Burakov /* if we don't need to do any fragmentation */ 345e107e82eSAnatoly Burakov if (likely (IPV4_MTU_DEFAULT >= m->pkt.pkt_len)) { 346e107e82eSAnatoly Burakov qconf->tx_mbufs[port_out].m_table[len] = m; 347e107e82eSAnatoly Burakov len2 = 1; 348e107e82eSAnatoly Burakov } else { 349e107e82eSAnatoly Burakov len2 = rte_ipv4_fragment_packet(m, 350e107e82eSAnatoly Burakov &qconf->tx_mbufs[port_out].m_table[len], 351e107e82eSAnatoly Burakov (uint16_t)(MBUF_TABLE_SIZE - len), 352e107e82eSAnatoly Burakov IPV4_MTU_DEFAULT, 35374de12b7SAnatoly Burakov rxq->direct_pool, rxq->indirect_pool); 354e107e82eSAnatoly Burakov 355e107e82eSAnatoly Burakov /* Free input packet */ 356e107e82eSAnatoly Burakov rte_pktmbuf_free(m); 357e107e82eSAnatoly Burakov 358e107e82eSAnatoly Burakov /* If we fail to fragment the packet */ 359e107e82eSAnatoly Burakov if (unlikely (len2 < 0)) 360e107e82eSAnatoly Burakov return; 361e107e82eSAnatoly Burakov } 36274de12b7SAnatoly Burakov } 36374de12b7SAnatoly Burakov /* if this is an IPv6 packet */ 36474de12b7SAnatoly Burakov else if (m->ol_flags & PKT_RX_IPV6_HDR) { 36574de12b7SAnatoly Burakov struct ipv6_hdr *ip_hdr; 36674de12b7SAnatoly Burakov 36774de12b7SAnatoly Burakov ipv6 = 1; 36874de12b7SAnatoly Burakov 36974de12b7SAnatoly Burakov /* Read the lookup key (i.e. ip_dst) from the input packet */ 37074de12b7SAnatoly Burakov ip_hdr = rte_pktmbuf_mtod(m, struct ipv6_hdr *); 37174de12b7SAnatoly Burakov 37274de12b7SAnatoly Burakov /* Find destination port */ 37374de12b7SAnatoly Burakov if (rte_lpm6_lookup(rxq->lpm6, ip_hdr->dst_addr, &next_hop) == 0 && 37474de12b7SAnatoly Burakov (enabled_port_mask & 1 << next_hop) != 0) { 37574de12b7SAnatoly Burakov port_out = next_hop; 37674de12b7SAnatoly Burakov 37774de12b7SAnatoly Burakov /* Build transmission burst for new port */ 37874de12b7SAnatoly Burakov len = qconf->tx_mbufs[port_out].len; 37974de12b7SAnatoly Burakov } 38074de12b7SAnatoly Burakov 38174de12b7SAnatoly Burakov /* if we don't need to do any fragmentation */ 38274de12b7SAnatoly Burakov if (likely (IPV6_MTU_DEFAULT >= m->pkt.pkt_len)) { 38374de12b7SAnatoly Burakov qconf->tx_mbufs[port_out].m_table[len] = m; 38474de12b7SAnatoly Burakov len2 = 1; 38574de12b7SAnatoly Burakov } else { 38674de12b7SAnatoly Burakov len2 = rte_ipv6_fragment_packet(m, 38774de12b7SAnatoly Burakov &qconf->tx_mbufs[port_out].m_table[len], 38874de12b7SAnatoly Burakov (uint16_t)(MBUF_TABLE_SIZE - len), 38974de12b7SAnatoly Burakov IPV6_MTU_DEFAULT, 39074de12b7SAnatoly Burakov rxq->direct_pool, rxq->indirect_pool); 39174de12b7SAnatoly Burakov 39274de12b7SAnatoly Burakov /* Free input packet */ 39374de12b7SAnatoly Burakov rte_pktmbuf_free(m); 39474de12b7SAnatoly Burakov 39574de12b7SAnatoly Burakov /* If we fail to fragment the packet */ 39674de12b7SAnatoly Burakov if (unlikely (len2 < 0)) 39774de12b7SAnatoly Burakov return; 39874de12b7SAnatoly Burakov } 39974de12b7SAnatoly Burakov } 40074de12b7SAnatoly Burakov /* else, just forward the packet */ 40174de12b7SAnatoly Burakov else { 40274de12b7SAnatoly Burakov qconf->tx_mbufs[port_out].m_table[len] = m; 40374de12b7SAnatoly Burakov len2 = 1; 40474de12b7SAnatoly Burakov } 405e107e82eSAnatoly Burakov 406e107e82eSAnatoly Burakov for (i = len; i < len + len2; i ++) { 40774de12b7SAnatoly Burakov void *d_addr_bytes; 40874de12b7SAnatoly Burakov 409e107e82eSAnatoly Burakov m = qconf->tx_mbufs[port_out].m_table[i]; 410e107e82eSAnatoly Burakov struct ether_hdr *eth_hdr = (struct ether_hdr *) 411e107e82eSAnatoly Burakov rte_pktmbuf_prepend(m, (uint16_t)sizeof(struct ether_hdr)); 412e107e82eSAnatoly Burakov if (eth_hdr == NULL) { 413e107e82eSAnatoly Burakov rte_panic("No headroom in mbuf.\n"); 414e107e82eSAnatoly Burakov } 415e107e82eSAnatoly Burakov 416e107e82eSAnatoly Burakov m->pkt.vlan_macip.f.l2_len = sizeof(struct ether_hdr); 417e107e82eSAnatoly Burakov 41874de12b7SAnatoly Burakov /* 02:00:00:00:00:xx */ 41974de12b7SAnatoly Burakov d_addr_bytes = ð_hdr->d_addr.addr_bytes[0]; 42074de12b7SAnatoly Burakov *((uint64_t *)d_addr_bytes) = 0x000000000002 + ((uint64_t)port_out << 40); 42174de12b7SAnatoly Burakov 42274de12b7SAnatoly Burakov /* src addr */ 423e107e82eSAnatoly Burakov ether_addr_copy(&ports_eth_addr[port_out], ð_hdr->s_addr); 42474de12b7SAnatoly Burakov if (ipv6) 42574de12b7SAnatoly Burakov eth_hdr->ether_type = rte_be_to_cpu_16(ETHER_TYPE_IPv6); 42674de12b7SAnatoly Burakov else 427e107e82eSAnatoly Burakov eth_hdr->ether_type = rte_be_to_cpu_16(ETHER_TYPE_IPv4); 428e107e82eSAnatoly Burakov } 429e107e82eSAnatoly Burakov 430e107e82eSAnatoly Burakov len += len2; 431e107e82eSAnatoly Burakov 432e107e82eSAnatoly Burakov if (likely(len < MAX_PKT_BURST)) { 433e107e82eSAnatoly Burakov qconf->tx_mbufs[port_out].len = (uint16_t)len; 434e107e82eSAnatoly Burakov return; 435e107e82eSAnatoly Burakov } 436e107e82eSAnatoly Burakov 437e107e82eSAnatoly Burakov /* Transmit packets */ 438e107e82eSAnatoly Burakov send_burst(qconf, (uint16_t)len, port_out); 439e107e82eSAnatoly Burakov qconf->tx_mbufs[port_out].len = 0; 440e107e82eSAnatoly Burakov } 441e107e82eSAnatoly Burakov 442e107e82eSAnatoly Burakov /* main processing loop */ 443e107e82eSAnatoly Burakov static int 444e107e82eSAnatoly Burakov main_loop(__attribute__((unused)) void *dummy) 445e107e82eSAnatoly Burakov { 446e107e82eSAnatoly Burakov struct rte_mbuf *pkts_burst[MAX_PKT_BURST]; 447e107e82eSAnatoly Burakov unsigned lcore_id; 448e107e82eSAnatoly Burakov uint64_t prev_tsc, diff_tsc, cur_tsc; 449e107e82eSAnatoly Burakov int i, j, nb_rx; 450e107e82eSAnatoly Burakov uint8_t portid; 451e107e82eSAnatoly Burakov struct lcore_queue_conf *qconf; 452e107e82eSAnatoly Burakov const uint64_t drain_tsc = (rte_get_tsc_hz() + US_PER_S - 1) / US_PER_S * BURST_TX_DRAIN_US; 453e107e82eSAnatoly Burakov 454e107e82eSAnatoly Burakov prev_tsc = 0; 455e107e82eSAnatoly Burakov 456e107e82eSAnatoly Burakov lcore_id = rte_lcore_id(); 457e107e82eSAnatoly Burakov qconf = &lcore_queue_conf[lcore_id]; 458e107e82eSAnatoly Burakov 459e107e82eSAnatoly Burakov if (qconf->n_rx_queue == 0) { 46074de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "lcore %u has nothing to do\n", lcore_id); 461e107e82eSAnatoly Burakov return 0; 462e107e82eSAnatoly Burakov } 463e107e82eSAnatoly Burakov 46474de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "entering main loop on lcore %u\n", lcore_id); 465e107e82eSAnatoly Burakov 466e107e82eSAnatoly Burakov for (i = 0; i < qconf->n_rx_queue; i++) { 467e107e82eSAnatoly Burakov 46874de12b7SAnatoly Burakov portid = qconf->rx_queue_list[i].portid; 46974de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, " -- lcoreid=%u portid=%d\n", lcore_id, 470e107e82eSAnatoly Burakov (int) portid); 471e107e82eSAnatoly Burakov } 472e107e82eSAnatoly Burakov 473e107e82eSAnatoly Burakov while (1) { 474e107e82eSAnatoly Burakov 475e107e82eSAnatoly Burakov cur_tsc = rte_rdtsc(); 476e107e82eSAnatoly Burakov 477e107e82eSAnatoly Burakov /* 478e107e82eSAnatoly Burakov * TX burst queue drain 479e107e82eSAnatoly Burakov */ 480e107e82eSAnatoly Burakov diff_tsc = cur_tsc - prev_tsc; 481e107e82eSAnatoly Burakov if (unlikely(diff_tsc > drain_tsc)) { 482e107e82eSAnatoly Burakov 483e107e82eSAnatoly Burakov /* 484e107e82eSAnatoly Burakov * This could be optimized (use queueid instead of 485e107e82eSAnatoly Burakov * portid), but it is not called so often 486e107e82eSAnatoly Burakov */ 487e107e82eSAnatoly Burakov for (portid = 0; portid < RTE_MAX_ETHPORTS; portid++) { 488e107e82eSAnatoly Burakov if (qconf->tx_mbufs[portid].len == 0) 489e107e82eSAnatoly Burakov continue; 490e107e82eSAnatoly Burakov send_burst(&lcore_queue_conf[lcore_id], 491e107e82eSAnatoly Burakov qconf->tx_mbufs[portid].len, 492e107e82eSAnatoly Burakov portid); 493e107e82eSAnatoly Burakov qconf->tx_mbufs[portid].len = 0; 494e107e82eSAnatoly Burakov } 495e107e82eSAnatoly Burakov 496e107e82eSAnatoly Burakov prev_tsc = cur_tsc; 497e107e82eSAnatoly Burakov } 498e107e82eSAnatoly Burakov 499e107e82eSAnatoly Burakov /* 500e107e82eSAnatoly Burakov * Read packet from RX queues 501e107e82eSAnatoly Burakov */ 502e107e82eSAnatoly Burakov for (i = 0; i < qconf->n_rx_queue; i++) { 503e107e82eSAnatoly Burakov 50474de12b7SAnatoly Burakov portid = qconf->rx_queue_list[i].portid; 505e107e82eSAnatoly Burakov nb_rx = rte_eth_rx_burst(portid, 0, pkts_burst, 506e107e82eSAnatoly Burakov MAX_PKT_BURST); 507e107e82eSAnatoly Burakov 508e107e82eSAnatoly Burakov /* Prefetch first packets */ 509e107e82eSAnatoly Burakov for (j = 0; j < PREFETCH_OFFSET && j < nb_rx; j++) { 510e107e82eSAnatoly Burakov rte_prefetch0(rte_pktmbuf_mtod( 511e107e82eSAnatoly Burakov pkts_burst[j], void *)); 512e107e82eSAnatoly Burakov } 513e107e82eSAnatoly Burakov 514e107e82eSAnatoly Burakov /* Prefetch and forward already prefetched packets */ 515e107e82eSAnatoly Burakov for (j = 0; j < (nb_rx - PREFETCH_OFFSET); j++) { 516e107e82eSAnatoly Burakov rte_prefetch0(rte_pktmbuf_mtod(pkts_burst[ 517e107e82eSAnatoly Burakov j + PREFETCH_OFFSET], void *)); 51874de12b7SAnatoly Burakov l3fwd_simple_forward(pkts_burst[j], qconf, i, portid); 519e107e82eSAnatoly Burakov } 520e107e82eSAnatoly Burakov 521e107e82eSAnatoly Burakov /* Forward remaining prefetched packets */ 522e107e82eSAnatoly Burakov for (; j < nb_rx; j++) { 52374de12b7SAnatoly Burakov l3fwd_simple_forward(pkts_burst[j], qconf, i, portid); 524e107e82eSAnatoly Burakov } 525e107e82eSAnatoly Burakov } 526e107e82eSAnatoly Burakov } 527e107e82eSAnatoly Burakov } 528e107e82eSAnatoly Burakov 529e107e82eSAnatoly Burakov /* display usage */ 530e107e82eSAnatoly Burakov static void 531e107e82eSAnatoly Burakov print_usage(const char *prgname) 532e107e82eSAnatoly Burakov { 533e107e82eSAnatoly Burakov printf("%s [EAL options] -- -p PORTMASK [-q NQ]\n" 534e107e82eSAnatoly Burakov " -p PORTMASK: hexadecimal bitmask of ports to configure\n" 535e107e82eSAnatoly Burakov " -q NQ: number of queue (=ports) per lcore (default is 1)\n", 536e107e82eSAnatoly Burakov prgname); 537e107e82eSAnatoly Burakov } 538e107e82eSAnatoly Burakov 539e107e82eSAnatoly Burakov static int 540e107e82eSAnatoly Burakov parse_portmask(const char *portmask) 541e107e82eSAnatoly Burakov { 542e107e82eSAnatoly Burakov char *end = NULL; 543e107e82eSAnatoly Burakov unsigned long pm; 544e107e82eSAnatoly Burakov 545e107e82eSAnatoly Burakov /* parse hexadecimal string */ 546e107e82eSAnatoly Burakov pm = strtoul(portmask, &end, 16); 547e107e82eSAnatoly Burakov if ((portmask[0] == '\0') || (end == NULL) || (*end != '\0')) 548e107e82eSAnatoly Burakov return -1; 549e107e82eSAnatoly Burakov 550e107e82eSAnatoly Burakov if (pm == 0) 551e107e82eSAnatoly Burakov return -1; 552e107e82eSAnatoly Burakov 553e107e82eSAnatoly Burakov return pm; 554e107e82eSAnatoly Burakov } 555e107e82eSAnatoly Burakov 556e107e82eSAnatoly Burakov static int 557e107e82eSAnatoly Burakov parse_nqueue(const char *q_arg) 558e107e82eSAnatoly Burakov { 559e107e82eSAnatoly Burakov char *end = NULL; 560e107e82eSAnatoly Burakov unsigned long n; 561e107e82eSAnatoly Burakov 562e107e82eSAnatoly Burakov /* parse hexadecimal string */ 563e107e82eSAnatoly Burakov n = strtoul(q_arg, &end, 10); 564e107e82eSAnatoly Burakov if ((q_arg[0] == '\0') || (end == NULL) || (*end != '\0')) 565e107e82eSAnatoly Burakov return -1; 566e107e82eSAnatoly Burakov if (n == 0) 567e107e82eSAnatoly Burakov return -1; 568e107e82eSAnatoly Burakov if (n >= MAX_RX_QUEUE_PER_LCORE) 569e107e82eSAnatoly Burakov return -1; 570e107e82eSAnatoly Burakov 571e107e82eSAnatoly Burakov return n; 572e107e82eSAnatoly Burakov } 573e107e82eSAnatoly Burakov 574e107e82eSAnatoly Burakov /* Parse the argument given in the command line of the application */ 575e107e82eSAnatoly Burakov static int 576e107e82eSAnatoly Burakov parse_args(int argc, char **argv) 577e107e82eSAnatoly Burakov { 578e107e82eSAnatoly Burakov int opt, ret; 579e107e82eSAnatoly Burakov char **argvopt; 580e107e82eSAnatoly Burakov int option_index; 581e107e82eSAnatoly Burakov char *prgname = argv[0]; 582e107e82eSAnatoly Burakov static struct option lgopts[] = { 583e107e82eSAnatoly Burakov {NULL, 0, 0, 0} 584e107e82eSAnatoly Burakov }; 585e107e82eSAnatoly Burakov 586e107e82eSAnatoly Burakov argvopt = argv; 587e107e82eSAnatoly Burakov 588e107e82eSAnatoly Burakov while ((opt = getopt_long(argc, argvopt, "p:q:", 589e107e82eSAnatoly Burakov lgopts, &option_index)) != EOF) { 590e107e82eSAnatoly Burakov 591e107e82eSAnatoly Burakov switch (opt) { 592e107e82eSAnatoly Burakov /* portmask */ 593e107e82eSAnatoly Burakov case 'p': 594e107e82eSAnatoly Burakov enabled_port_mask = parse_portmask(optarg); 595e107e82eSAnatoly Burakov if (enabled_port_mask < 0) { 596e107e82eSAnatoly Burakov printf("invalid portmask\n"); 597e107e82eSAnatoly Burakov print_usage(prgname); 598e107e82eSAnatoly Burakov return -1; 599e107e82eSAnatoly Burakov } 600e107e82eSAnatoly Burakov break; 601e107e82eSAnatoly Burakov 602e107e82eSAnatoly Burakov /* nqueue */ 603e107e82eSAnatoly Burakov case 'q': 604e107e82eSAnatoly Burakov rx_queue_per_lcore = parse_nqueue(optarg); 605e107e82eSAnatoly Burakov if (rx_queue_per_lcore < 0) { 606e107e82eSAnatoly Burakov printf("invalid queue number\n"); 607e107e82eSAnatoly Burakov print_usage(prgname); 608e107e82eSAnatoly Burakov return -1; 609e107e82eSAnatoly Burakov } 610e107e82eSAnatoly Burakov break; 611e107e82eSAnatoly Burakov 612e107e82eSAnatoly Burakov /* long options */ 613e107e82eSAnatoly Burakov case 0: 614e107e82eSAnatoly Burakov print_usage(prgname); 615e107e82eSAnatoly Burakov return -1; 616e107e82eSAnatoly Burakov 617e107e82eSAnatoly Burakov default: 618e107e82eSAnatoly Burakov print_usage(prgname); 619e107e82eSAnatoly Burakov return -1; 620e107e82eSAnatoly Burakov } 621e107e82eSAnatoly Burakov } 622e107e82eSAnatoly Burakov 623e107e82eSAnatoly Burakov if (enabled_port_mask == 0) { 624e107e82eSAnatoly Burakov printf("portmask not specified\n"); 625e107e82eSAnatoly Burakov print_usage(prgname); 626e107e82eSAnatoly Burakov return -1; 627e107e82eSAnatoly Burakov } 628e107e82eSAnatoly Burakov 629e107e82eSAnatoly Burakov if (optind >= 0) 630e107e82eSAnatoly Burakov argv[optind-1] = prgname; 631e107e82eSAnatoly Burakov 632e107e82eSAnatoly Burakov ret = optind-1; 633e107e82eSAnatoly Burakov optind = 0; /* reset getopt lib */ 634e107e82eSAnatoly Burakov return ret; 635e107e82eSAnatoly Burakov } 636e107e82eSAnatoly Burakov 637e107e82eSAnatoly Burakov static void 638e107e82eSAnatoly Burakov print_ethaddr(const char *name, struct ether_addr *eth_addr) 639e107e82eSAnatoly Burakov { 640e107e82eSAnatoly Burakov printf("%s%02X:%02X:%02X:%02X:%02X:%02X", name, 641e107e82eSAnatoly Burakov eth_addr->addr_bytes[0], 642e107e82eSAnatoly Burakov eth_addr->addr_bytes[1], 643e107e82eSAnatoly Burakov eth_addr->addr_bytes[2], 644e107e82eSAnatoly Burakov eth_addr->addr_bytes[3], 645e107e82eSAnatoly Burakov eth_addr->addr_bytes[4], 646e107e82eSAnatoly Burakov eth_addr->addr_bytes[5]); 647e107e82eSAnatoly Burakov } 648e107e82eSAnatoly Burakov 649e107e82eSAnatoly Burakov /* Check the link status of all ports in up to 9s, and print them finally */ 650e107e82eSAnatoly Burakov static void 651e107e82eSAnatoly Burakov check_all_ports_link_status(uint8_t port_num, uint32_t port_mask) 652e107e82eSAnatoly Burakov { 653e107e82eSAnatoly Burakov #define CHECK_INTERVAL 100 /* 100ms */ 654e107e82eSAnatoly Burakov #define MAX_CHECK_TIME 90 /* 9s (90 * 100ms) in total */ 655e107e82eSAnatoly Burakov uint8_t portid, count, all_ports_up, print_flag = 0; 656e107e82eSAnatoly Burakov struct rte_eth_link link; 657e107e82eSAnatoly Burakov 658e107e82eSAnatoly Burakov printf("\nChecking link status"); 659e107e82eSAnatoly Burakov fflush(stdout); 660e107e82eSAnatoly Burakov for (count = 0; count <= MAX_CHECK_TIME; count++) { 661e107e82eSAnatoly Burakov all_ports_up = 1; 662e107e82eSAnatoly Burakov for (portid = 0; portid < port_num; portid++) { 663e107e82eSAnatoly Burakov if ((port_mask & (1 << portid)) == 0) 664e107e82eSAnatoly Burakov continue; 665e107e82eSAnatoly Burakov memset(&link, 0, sizeof(link)); 666e107e82eSAnatoly Burakov rte_eth_link_get_nowait(portid, &link); 667e107e82eSAnatoly Burakov /* print link status if flag set */ 668e107e82eSAnatoly Burakov if (print_flag == 1) { 669e107e82eSAnatoly Burakov if (link.link_status) 670e107e82eSAnatoly Burakov printf("Port %d Link Up - speed %u " 671e107e82eSAnatoly Burakov "Mbps - %s\n", (uint8_t)portid, 672e107e82eSAnatoly Burakov (unsigned)link.link_speed, 673e107e82eSAnatoly Burakov (link.link_duplex == ETH_LINK_FULL_DUPLEX) ? 674e107e82eSAnatoly Burakov ("full-duplex") : ("half-duplex\n")); 675e107e82eSAnatoly Burakov else 676e107e82eSAnatoly Burakov printf("Port %d Link Down\n", 677e107e82eSAnatoly Burakov (uint8_t)portid); 678e107e82eSAnatoly Burakov continue; 679e107e82eSAnatoly Burakov } 680e107e82eSAnatoly Burakov /* clear all_ports_up flag if any link down */ 681e107e82eSAnatoly Burakov if (link.link_status == 0) { 682e107e82eSAnatoly Burakov all_ports_up = 0; 683e107e82eSAnatoly Burakov break; 684e107e82eSAnatoly Burakov } 685e107e82eSAnatoly Burakov } 686e107e82eSAnatoly Burakov /* after finally printing all link status, get out */ 687e107e82eSAnatoly Burakov if (print_flag == 1) 688e107e82eSAnatoly Burakov break; 689e107e82eSAnatoly Burakov 690e107e82eSAnatoly Burakov if (all_ports_up == 0) { 691e107e82eSAnatoly Burakov printf("."); 692e107e82eSAnatoly Burakov fflush(stdout); 693e107e82eSAnatoly Burakov rte_delay_ms(CHECK_INTERVAL); 694e107e82eSAnatoly Burakov } 695e107e82eSAnatoly Burakov 696e107e82eSAnatoly Burakov /* set the print_flag if all ports up or timeout */ 697e107e82eSAnatoly Burakov if (all_ports_up == 1 || count == (MAX_CHECK_TIME - 1)) { 698e107e82eSAnatoly Burakov print_flag = 1; 69974de12b7SAnatoly Burakov printf("\ndone\n"); 700e107e82eSAnatoly Burakov } 701e107e82eSAnatoly Burakov } 702e107e82eSAnatoly Burakov } 703e107e82eSAnatoly Burakov 70474de12b7SAnatoly Burakov static int 70574de12b7SAnatoly Burakov init_routing_table(void) 70674de12b7SAnatoly Burakov { 70774de12b7SAnatoly Burakov struct rte_lpm *lpm; 70874de12b7SAnatoly Burakov struct rte_lpm6 *lpm6; 70974de12b7SAnatoly Burakov int socket, ret; 71074de12b7SAnatoly Burakov unsigned i; 71174de12b7SAnatoly Burakov 71274de12b7SAnatoly Burakov for (socket = 0; socket < RTE_MAX_NUMA_NODES; socket++) { 71374de12b7SAnatoly Burakov if (socket_lpm[socket]) { 71474de12b7SAnatoly Burakov lpm = socket_lpm[socket]; 71574de12b7SAnatoly Burakov /* populate the LPM table */ 71674de12b7SAnatoly Burakov for (i = 0; i < RTE_DIM(l3fwd_ipv4_route_array); i++) { 71774de12b7SAnatoly Burakov ret = rte_lpm_add(lpm, 71874de12b7SAnatoly Burakov l3fwd_ipv4_route_array[i].ip, 71974de12b7SAnatoly Burakov l3fwd_ipv4_route_array[i].depth, 72074de12b7SAnatoly Burakov l3fwd_ipv4_route_array[i].if_out); 72174de12b7SAnatoly Burakov 72274de12b7SAnatoly Burakov if (ret < 0) { 72374de12b7SAnatoly Burakov RTE_LOG(ERR, IP_FRAG, "Unable to add entry %i to the l3fwd " 72474de12b7SAnatoly Burakov "LPM table\n", i); 72574de12b7SAnatoly Burakov return -1; 72674de12b7SAnatoly Burakov } 72774de12b7SAnatoly Burakov 72874de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "Socket %i: adding route " IPv4_BYTES_FMT 72974de12b7SAnatoly Burakov "/%d (port %d)\n", 73074de12b7SAnatoly Burakov socket, 73174de12b7SAnatoly Burakov IPv4_BYTES(l3fwd_ipv4_route_array[i].ip), 73274de12b7SAnatoly Burakov l3fwd_ipv4_route_array[i].depth, 73374de12b7SAnatoly Burakov l3fwd_ipv4_route_array[i].if_out); 73474de12b7SAnatoly Burakov } 73574de12b7SAnatoly Burakov } 73674de12b7SAnatoly Burakov 73774de12b7SAnatoly Burakov if (socket_lpm6[socket]) { 73874de12b7SAnatoly Burakov lpm6 = socket_lpm6[socket]; 73974de12b7SAnatoly Burakov /* populate the LPM6 table */ 74074de12b7SAnatoly Burakov for (i = 0; i < RTE_DIM(l3fwd_ipv6_route_array); i++) { 74174de12b7SAnatoly Burakov ret = rte_lpm6_add(lpm6, 74274de12b7SAnatoly Burakov l3fwd_ipv6_route_array[i].ip, 74374de12b7SAnatoly Burakov l3fwd_ipv6_route_array[i].depth, 74474de12b7SAnatoly Burakov l3fwd_ipv6_route_array[i].if_out); 74574de12b7SAnatoly Burakov 74674de12b7SAnatoly Burakov if (ret < 0) { 74774de12b7SAnatoly Burakov RTE_LOG(ERR, IP_FRAG, "Unable to add entry %i to the l3fwd " 74874de12b7SAnatoly Burakov "LPM6 table\n", i); 74974de12b7SAnatoly Burakov return -1; 75074de12b7SAnatoly Burakov } 75174de12b7SAnatoly Burakov 75274de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "Socket %i: adding route " IPv6_BYTES_FMT 75374de12b7SAnatoly Burakov "/%d (port %d)\n", 75474de12b7SAnatoly Burakov socket, 75574de12b7SAnatoly Burakov IPv6_BYTES(l3fwd_ipv6_route_array[i].ip), 75674de12b7SAnatoly Burakov l3fwd_ipv6_route_array[i].depth, 75774de12b7SAnatoly Burakov l3fwd_ipv6_route_array[i].if_out); 75874de12b7SAnatoly Burakov } 75974de12b7SAnatoly Burakov } 76074de12b7SAnatoly Burakov } 76174de12b7SAnatoly Burakov return 0; 76274de12b7SAnatoly Burakov } 76374de12b7SAnatoly Burakov 76474de12b7SAnatoly Burakov static int 76574de12b7SAnatoly Burakov init_mem(void) 76674de12b7SAnatoly Burakov { 76774de12b7SAnatoly Burakov char buf[PATH_MAX]; 76874de12b7SAnatoly Burakov struct rte_mempool *mp; 76974de12b7SAnatoly Burakov struct rte_lpm *lpm; 77074de12b7SAnatoly Burakov struct rte_lpm6 *lpm6; 77174de12b7SAnatoly Burakov int socket; 77274de12b7SAnatoly Burakov unsigned lcore_id; 77374de12b7SAnatoly Burakov 77474de12b7SAnatoly Burakov /* traverse through lcores and initialize structures on each socket */ 77574de12b7SAnatoly Burakov 77674de12b7SAnatoly Burakov for (lcore_id = 0; lcore_id < RTE_MAX_LCORE; lcore_id++) { 77774de12b7SAnatoly Burakov 77874de12b7SAnatoly Burakov if (rte_lcore_is_enabled(lcore_id) == 0) 77974de12b7SAnatoly Burakov continue; 78074de12b7SAnatoly Burakov 78174de12b7SAnatoly Burakov socket = rte_lcore_to_socket_id(lcore_id); 78274de12b7SAnatoly Burakov 78374de12b7SAnatoly Burakov if (socket == SOCKET_ID_ANY) 78474de12b7SAnatoly Burakov socket = 0; 78574de12b7SAnatoly Burakov 78674de12b7SAnatoly Burakov if (socket_direct_pool[socket] == NULL) { 78774de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "Creating direct mempool on socket %i\n", 78874de12b7SAnatoly Burakov socket); 78974de12b7SAnatoly Burakov rte_snprintf(buf, sizeof(buf), "pool_direct_%i", socket); 79074de12b7SAnatoly Burakov 79174de12b7SAnatoly Burakov mp = rte_mempool_create(buf, NB_MBUF, 79274de12b7SAnatoly Burakov MBUF_SIZE, 32, 79374de12b7SAnatoly Burakov sizeof(struct rte_pktmbuf_pool_private), 79474de12b7SAnatoly Burakov rte_pktmbuf_pool_init, NULL, 79574de12b7SAnatoly Burakov rte_pktmbuf_init, NULL, 79674de12b7SAnatoly Burakov socket, 0); 79774de12b7SAnatoly Burakov if (mp == NULL) { 79874de12b7SAnatoly Burakov RTE_LOG(ERR, IP_FRAG, "Cannot create direct mempool\n"); 79974de12b7SAnatoly Burakov return -1; 80074de12b7SAnatoly Burakov } 80174de12b7SAnatoly Burakov socket_direct_pool[socket] = mp; 80274de12b7SAnatoly Burakov } 80374de12b7SAnatoly Burakov 80474de12b7SAnatoly Burakov if (socket_indirect_pool[socket] == NULL) { 80574de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "Creating indirect mempool on socket %i\n", 80674de12b7SAnatoly Burakov socket); 80774de12b7SAnatoly Burakov rte_snprintf(buf, sizeof(buf), "pool_indirect_%i", socket); 80874de12b7SAnatoly Burakov 80974de12b7SAnatoly Burakov mp = rte_mempool_create(buf, NB_MBUF, 81074de12b7SAnatoly Burakov sizeof(struct rte_mbuf), 32, 81174de12b7SAnatoly Burakov 0, 81274de12b7SAnatoly Burakov NULL, NULL, 81374de12b7SAnatoly Burakov rte_pktmbuf_init, NULL, 81474de12b7SAnatoly Burakov socket, 0); 81574de12b7SAnatoly Burakov if (mp == NULL) { 81674de12b7SAnatoly Burakov RTE_LOG(ERR, IP_FRAG, "Cannot create indirect mempool\n"); 81774de12b7SAnatoly Burakov return -1; 81874de12b7SAnatoly Burakov } 81974de12b7SAnatoly Burakov socket_indirect_pool[socket] = mp; 82074de12b7SAnatoly Burakov } 82174de12b7SAnatoly Burakov 82274de12b7SAnatoly Burakov if (socket_lpm[socket] == NULL) { 82374de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "Creating LPM table on socket %i\n", socket); 82474de12b7SAnatoly Burakov rte_snprintf(buf, sizeof(buf), "IP_FRAG_LPM_%i", socket); 82574de12b7SAnatoly Burakov 82674de12b7SAnatoly Burakov lpm = rte_lpm_create(buf, socket, LPM_MAX_RULES, 0); 82774de12b7SAnatoly Burakov if (lpm == NULL) { 82874de12b7SAnatoly Burakov RTE_LOG(ERR, IP_FRAG, "Cannot create LPM table\n"); 82974de12b7SAnatoly Burakov return -1; 83074de12b7SAnatoly Burakov } 83174de12b7SAnatoly Burakov socket_lpm[socket] = lpm; 83274de12b7SAnatoly Burakov } 83374de12b7SAnatoly Burakov 83474de12b7SAnatoly Burakov if (socket_lpm6[socket] == NULL) { 83574de12b7SAnatoly Burakov RTE_LOG(INFO, IP_FRAG, "Creating LPM6 table on socket %i\n", socket); 83674de12b7SAnatoly Burakov rte_snprintf(buf, sizeof(buf), "IP_FRAG_LPM_%i", socket); 83774de12b7SAnatoly Burakov 83874de12b7SAnatoly Burakov lpm6 = rte_lpm6_create("IP_FRAG_LPM6", socket, &lpm6_config); 83974de12b7SAnatoly Burakov if (lpm6 == NULL) { 84074de12b7SAnatoly Burakov RTE_LOG(ERR, IP_FRAG, "Cannot create LPM table\n"); 84174de12b7SAnatoly Burakov return -1; 84274de12b7SAnatoly Burakov } 84374de12b7SAnatoly Burakov socket_lpm6[socket] = lpm6; 84474de12b7SAnatoly Burakov } 84574de12b7SAnatoly Burakov } 84674de12b7SAnatoly Burakov 84774de12b7SAnatoly Burakov return 0; 84874de12b7SAnatoly Burakov } 84974de12b7SAnatoly Burakov 850e107e82eSAnatoly Burakov int 851e107e82eSAnatoly Burakov MAIN(int argc, char **argv) 852e107e82eSAnatoly Burakov { 853e107e82eSAnatoly Burakov struct lcore_queue_conf *qconf; 85474de12b7SAnatoly Burakov struct rx_queue *rxq; 85574de12b7SAnatoly Burakov int socket, ret; 85674de12b7SAnatoly Burakov unsigned nb_ports; 857e107e82eSAnatoly Burakov uint16_t queueid = 0; 858e107e82eSAnatoly Burakov unsigned lcore_id = 0, rx_lcore_id = 0; 859e107e82eSAnatoly Burakov uint32_t n_tx_queue, nb_lcores; 860e107e82eSAnatoly Burakov uint8_t portid; 861e107e82eSAnatoly Burakov 862e107e82eSAnatoly Burakov /* init EAL */ 863e107e82eSAnatoly Burakov ret = rte_eal_init(argc, argv); 864e107e82eSAnatoly Burakov if (ret < 0) 865e107e82eSAnatoly Burakov rte_exit(EXIT_FAILURE, "rte_eal_init failed"); 866e107e82eSAnatoly Burakov argc -= ret; 867e107e82eSAnatoly Burakov argv += ret; 868e107e82eSAnatoly Burakov 869e107e82eSAnatoly Burakov /* parse application arguments (after the EAL ones) */ 870e107e82eSAnatoly Burakov ret = parse_args(argc, argv); 871e107e82eSAnatoly Burakov if (ret < 0) 872e107e82eSAnatoly Burakov rte_exit(EXIT_FAILURE, "Invalid arguments"); 873e107e82eSAnatoly Burakov 874e107e82eSAnatoly Burakov if (rte_eal_pci_probe() < 0) 875e107e82eSAnatoly Burakov rte_panic("Cannot probe PCI\n"); 876e107e82eSAnatoly Burakov 877e107e82eSAnatoly Burakov nb_ports = rte_eth_dev_count(); 878e107e82eSAnatoly Burakov if (nb_ports > RTE_MAX_ETHPORTS) 879e107e82eSAnatoly Burakov nb_ports = RTE_MAX_ETHPORTS; 88074de12b7SAnatoly Burakov else if (nb_ports == 0) 88174de12b7SAnatoly Burakov rte_exit(EXIT_FAILURE, "No ports found!\n"); 882e107e82eSAnatoly Burakov 883e107e82eSAnatoly Burakov nb_lcores = rte_lcore_count(); 884e107e82eSAnatoly Burakov 88574de12b7SAnatoly Burakov /* initialize structures (mempools, lpm etc.) */ 88674de12b7SAnatoly Burakov if (init_mem() < 0) 88774de12b7SAnatoly Burakov rte_panic("Cannot initialize memory structures!\n"); 88874de12b7SAnatoly Burakov 889eaa8d3bfSAnatoly Burakov /* check if portmask has non-existent ports */ 890eaa8d3bfSAnatoly Burakov if (enabled_port_mask & ~(RTE_LEN2MASK(nb_ports, unsigned))) 891eaa8d3bfSAnatoly Burakov rte_exit(EXIT_FAILURE, "Non-existent ports in portmask!\n"); 892eaa8d3bfSAnatoly Burakov 893e107e82eSAnatoly Burakov /* initialize all ports */ 894e107e82eSAnatoly Burakov for (portid = 0; portid < nb_ports; portid++) { 895e107e82eSAnatoly Burakov /* skip ports that are not enabled */ 896e107e82eSAnatoly Burakov if ((enabled_port_mask & (1 << portid)) == 0) { 897e107e82eSAnatoly Burakov printf("Skipping disabled port %d\n", portid); 898e107e82eSAnatoly Burakov continue; 899e107e82eSAnatoly Burakov } 900e107e82eSAnatoly Burakov 901e107e82eSAnatoly Burakov qconf = &lcore_queue_conf[rx_lcore_id]; 902e107e82eSAnatoly Burakov 903e107e82eSAnatoly Burakov /* get the lcore_id for this port */ 904e107e82eSAnatoly Burakov while (rte_lcore_is_enabled(rx_lcore_id) == 0 || 905e107e82eSAnatoly Burakov qconf->n_rx_queue == (unsigned)rx_queue_per_lcore) { 906e107e82eSAnatoly Burakov 907e107e82eSAnatoly Burakov rx_lcore_id ++; 908e107e82eSAnatoly Burakov if (rx_lcore_id >= RTE_MAX_LCORE) 909e107e82eSAnatoly Burakov rte_exit(EXIT_FAILURE, "Not enough cores\n"); 910e107e82eSAnatoly Burakov 911e107e82eSAnatoly Burakov qconf = &lcore_queue_conf[rx_lcore_id]; 912e107e82eSAnatoly Burakov } 91374de12b7SAnatoly Burakov 914*324bcf45SAnatoly Burakov socket = (int) rte_lcore_to_socket_id(rx_lcore_id); 91574de12b7SAnatoly Burakov if (socket == SOCKET_ID_ANY) 91674de12b7SAnatoly Burakov socket = 0; 91774de12b7SAnatoly Burakov 91874de12b7SAnatoly Burakov rxq = &qconf->rx_queue_list[qconf->n_rx_queue]; 91974de12b7SAnatoly Burakov rxq->portid = portid; 92074de12b7SAnatoly Burakov rxq->direct_pool = socket_direct_pool[socket]; 92174de12b7SAnatoly Burakov rxq->indirect_pool = socket_indirect_pool[socket]; 92274de12b7SAnatoly Burakov rxq->lpm = socket_lpm[socket]; 92374de12b7SAnatoly Burakov rxq->lpm6 = socket_lpm6[socket]; 924e107e82eSAnatoly Burakov qconf->n_rx_queue++; 925e107e82eSAnatoly Burakov 926e107e82eSAnatoly Burakov /* init port */ 927e107e82eSAnatoly Burakov printf("Initializing port %d on lcore %u...", portid, 928e107e82eSAnatoly Burakov rx_lcore_id); 929e107e82eSAnatoly Burakov fflush(stdout); 930e107e82eSAnatoly Burakov 931e107e82eSAnatoly Burakov n_tx_queue = nb_lcores; 932e107e82eSAnatoly Burakov if (n_tx_queue > MAX_TX_QUEUE_PER_PORT) 933e107e82eSAnatoly Burakov n_tx_queue = MAX_TX_QUEUE_PER_PORT; 934e107e82eSAnatoly Burakov ret = rte_eth_dev_configure(portid, 1, (uint16_t)n_tx_queue, 935e107e82eSAnatoly Burakov &port_conf); 93674de12b7SAnatoly Burakov if (ret < 0) { 93774de12b7SAnatoly Burakov printf("\n"); 938e107e82eSAnatoly Burakov rte_exit(EXIT_FAILURE, "Cannot configure device: " 939e107e82eSAnatoly Burakov "err=%d, port=%d\n", 940e107e82eSAnatoly Burakov ret, portid); 94174de12b7SAnatoly Burakov } 94274de12b7SAnatoly Burakov 94374de12b7SAnatoly Burakov /* init one RX queue */ 94474de12b7SAnatoly Burakov ret = rte_eth_rx_queue_setup(portid, 0, nb_rxd, 94574de12b7SAnatoly Burakov socket, &rx_conf, 94674de12b7SAnatoly Burakov socket_direct_pool[socket]); 94774de12b7SAnatoly Burakov if (ret < 0) { 94874de12b7SAnatoly Burakov printf("\n"); 94974de12b7SAnatoly Burakov rte_exit(EXIT_FAILURE, "rte_eth_rx_queue_setup: " 95074de12b7SAnatoly Burakov "err=%d, port=%d\n", 95174de12b7SAnatoly Burakov ret, portid); 95274de12b7SAnatoly Burakov } 953e107e82eSAnatoly Burakov 954e107e82eSAnatoly Burakov rte_eth_macaddr_get(portid, &ports_eth_addr[portid]); 955e107e82eSAnatoly Burakov print_ethaddr(" Address:", &ports_eth_addr[portid]); 95674de12b7SAnatoly Burakov printf("\n"); 957e107e82eSAnatoly Burakov 958e107e82eSAnatoly Burakov /* init one TX queue per couple (lcore,port) */ 959e107e82eSAnatoly Burakov queueid = 0; 960e107e82eSAnatoly Burakov for (lcore_id = 0; lcore_id < RTE_MAX_LCORE; lcore_id++) { 961e107e82eSAnatoly Burakov if (rte_lcore_is_enabled(lcore_id) == 0) 962e107e82eSAnatoly Burakov continue; 96374de12b7SAnatoly Burakov 96474de12b7SAnatoly Burakov socket = (int) rte_lcore_to_socket_id(lcore_id); 965e107e82eSAnatoly Burakov printf("txq=%u,%d ", lcore_id, queueid); 966e107e82eSAnatoly Burakov fflush(stdout); 967e107e82eSAnatoly Burakov ret = rte_eth_tx_queue_setup(portid, queueid, nb_txd, 96874de12b7SAnatoly Burakov socket, &tx_conf); 96974de12b7SAnatoly Burakov if (ret < 0) { 97074de12b7SAnatoly Burakov printf("\n"); 971e107e82eSAnatoly Burakov rte_exit(EXIT_FAILURE, "rte_eth_tx_queue_setup: " 972e107e82eSAnatoly Burakov "err=%d, port=%d\n", ret, portid); 97374de12b7SAnatoly Burakov } 974e107e82eSAnatoly Burakov 975e107e82eSAnatoly Burakov qconf = &lcore_queue_conf[lcore_id]; 976e107e82eSAnatoly Burakov qconf->tx_queue_id[portid] = queueid; 977e107e82eSAnatoly Burakov queueid++; 978e107e82eSAnatoly Burakov } 979e107e82eSAnatoly Burakov 98074de12b7SAnatoly Burakov printf("\n"); 98174de12b7SAnatoly Burakov } 98274de12b7SAnatoly Burakov 98374de12b7SAnatoly Burakov printf("\n"); 98474de12b7SAnatoly Burakov 98574de12b7SAnatoly Burakov /* start ports */ 98674de12b7SAnatoly Burakov for (portid = 0; portid < nb_ports; portid++) { 98774de12b7SAnatoly Burakov if ((enabled_port_mask & (1 << portid)) == 0) { 98874de12b7SAnatoly Burakov continue; 98974de12b7SAnatoly Burakov } 990e107e82eSAnatoly Burakov /* Start device */ 991e107e82eSAnatoly Burakov ret = rte_eth_dev_start(portid); 992e107e82eSAnatoly Burakov if (ret < 0) 99374de12b7SAnatoly Burakov rte_exit(EXIT_FAILURE, "rte_eth_dev_start: err=%d, port=%d\n", 994e107e82eSAnatoly Burakov ret, portid); 995e107e82eSAnatoly Burakov 996e107e82eSAnatoly Burakov rte_eth_promiscuous_enable(portid); 997e107e82eSAnatoly Burakov } 998e107e82eSAnatoly Burakov 99974de12b7SAnatoly Burakov if (init_routing_table() < 0) 100074de12b7SAnatoly Burakov rte_exit(EXIT_FAILURE, "Cannot init routing table\n"); 100174de12b7SAnatoly Burakov 1002e107e82eSAnatoly Burakov check_all_ports_link_status((uint8_t)nb_ports, enabled_port_mask); 1003e107e82eSAnatoly Burakov 1004e107e82eSAnatoly Burakov /* launch per-lcore init on every lcore */ 1005e107e82eSAnatoly Burakov rte_eal_mp_remote_launch(main_loop, NULL, CALL_MASTER); 1006e107e82eSAnatoly Burakov RTE_LCORE_FOREACH_SLAVE(lcore_id) { 1007e107e82eSAnatoly Burakov if (rte_eal_wait_lcore(lcore_id) < 0) 1008e107e82eSAnatoly Burakov return -1; 1009e107e82eSAnatoly Burakov } 1010e107e82eSAnatoly Burakov 1011e107e82eSAnatoly Burakov return 0; 1012e107e82eSAnatoly Burakov } 1013