xref: /dpdk/examples/ip_fragmentation/main.c (revision ea0c20ea95fd5d71a10757e6598ac66233ea1495)
1e107e82eSAnatoly Burakov /*-
2e107e82eSAnatoly Burakov  *   BSD LICENSE
3e107e82eSAnatoly Burakov  *
4e107e82eSAnatoly Burakov  *   Copyright(c) 2010-2014 Intel Corporation. All rights reserved.
5e107e82eSAnatoly Burakov  *   All rights reserved.
6e107e82eSAnatoly Burakov  *
7e107e82eSAnatoly Burakov  *   Redistribution and use in source and binary forms, with or without
8e107e82eSAnatoly Burakov  *   modification, are permitted provided that the following conditions
9e107e82eSAnatoly Burakov  *   are met:
10e107e82eSAnatoly Burakov  *
11e107e82eSAnatoly Burakov  *     * Redistributions of source code must retain the above copyright
12e107e82eSAnatoly Burakov  *       notice, this list of conditions and the following disclaimer.
13e107e82eSAnatoly Burakov  *     * Redistributions in binary form must reproduce the above copyright
14e107e82eSAnatoly Burakov  *       notice, this list of conditions and the following disclaimer in
15e107e82eSAnatoly Burakov  *       the documentation and/or other materials provided with the
16e107e82eSAnatoly Burakov  *       distribution.
17e107e82eSAnatoly Burakov  *     * Neither the name of Intel Corporation nor the names of its
18e107e82eSAnatoly Burakov  *       contributors may be used to endorse or promote products derived
19e107e82eSAnatoly Burakov  *       from this software without specific prior written permission.
20e107e82eSAnatoly Burakov  *
21e107e82eSAnatoly Burakov  *   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
22e107e82eSAnatoly Burakov  *   "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
23e107e82eSAnatoly Burakov  *   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
24e107e82eSAnatoly Burakov  *   A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
25e107e82eSAnatoly Burakov  *   OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
26e107e82eSAnatoly Burakov  *   SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
27e107e82eSAnatoly Burakov  *   LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
28e107e82eSAnatoly Burakov  *   DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
29e107e82eSAnatoly Burakov  *   THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
30e107e82eSAnatoly Burakov  *   (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
31e107e82eSAnatoly Burakov  *   OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
32e107e82eSAnatoly Burakov  */
33e107e82eSAnatoly Burakov 
34e107e82eSAnatoly Burakov #include <stdio.h>
35e107e82eSAnatoly Burakov #include <stdlib.h>
36e107e82eSAnatoly Burakov #include <stdint.h>
37e107e82eSAnatoly Burakov #include <inttypes.h>
38e107e82eSAnatoly Burakov #include <sys/types.h>
39e107e82eSAnatoly Burakov #include <sys/param.h>
40e107e82eSAnatoly Burakov #include <string.h>
41e107e82eSAnatoly Burakov #include <sys/queue.h>
42e107e82eSAnatoly Burakov #include <stdarg.h>
43e107e82eSAnatoly Burakov #include <errno.h>
44e107e82eSAnatoly Burakov #include <getopt.h>
45e107e82eSAnatoly Burakov 
46e107e82eSAnatoly Burakov #include <rte_common.h>
47e107e82eSAnatoly Burakov #include <rte_byteorder.h>
48e107e82eSAnatoly Burakov #include <rte_log.h>
49e107e82eSAnatoly Burakov #include <rte_memory.h>
50e107e82eSAnatoly Burakov #include <rte_memcpy.h>
51e107e82eSAnatoly Burakov #include <rte_memzone.h>
52e107e82eSAnatoly Burakov #include <rte_eal.h>
53e107e82eSAnatoly Burakov #include <rte_per_lcore.h>
54e107e82eSAnatoly Burakov #include <rte_launch.h>
55e107e82eSAnatoly Burakov #include <rte_atomic.h>
56e107e82eSAnatoly Burakov #include <rte_cycles.h>
57e107e82eSAnatoly Burakov #include <rte_prefetch.h>
58e107e82eSAnatoly Burakov #include <rte_lcore.h>
59e107e82eSAnatoly Burakov #include <rte_per_lcore.h>
60e107e82eSAnatoly Burakov #include <rte_branch_prediction.h>
61e107e82eSAnatoly Burakov #include <rte_interrupts.h>
62e107e82eSAnatoly Burakov #include <rte_pci.h>
63e107e82eSAnatoly Burakov #include <rte_random.h>
64e107e82eSAnatoly Burakov #include <rte_debug.h>
65e107e82eSAnatoly Burakov #include <rte_ether.h>
66e107e82eSAnatoly Burakov #include <rte_ethdev.h>
67e107e82eSAnatoly Burakov #include <rte_ring.h>
68e107e82eSAnatoly Burakov #include <rte_mempool.h>
69e107e82eSAnatoly Burakov #include <rte_mbuf.h>
70e107e82eSAnatoly Burakov #include <rte_lpm.h>
7174de12b7SAnatoly Burakov #include <rte_lpm6.h>
72e107e82eSAnatoly Burakov #include <rte_ip.h>
7374de12b7SAnatoly Burakov #include <rte_string_fns.h>
74e107e82eSAnatoly Burakov 
7574de12b7SAnatoly Burakov #include <rte_ip_frag.h>
7674de12b7SAnatoly Burakov 
/* Log type used by the RTE_LOG(..., IP_FRAG, ...) calls in this file. */
#define RTE_LOGTYPE_IP_FRAG RTE_LOGTYPE_USER1

/* Size of one mbuf: 2048 bytes plus the packet headroom. */
#define MBUF_SIZE (2048 + RTE_PKTMBUF_HEADROOM)

/* allow max jumbo frame 9.5 KB */
#define JUMBO_FRAME_MAX_SIZE	0x2600

/* Integer division of a by b, rounded up. */
#define	ROUNDUP_DIV(a, b)	(((a) + (b) - 1) / (b))

/*
 * Default byte size for the IPv4 and IPv6 Maximum Transfer Unit (MTU).
 * These values include the size of the IP header.
 */
#define	IPV4_MTU_DEFAULT	ETHER_MTU
#define	IPV6_MTU_DEFAULT	ETHER_MTU

/*
 * Default payload in bytes for an IPv4 / IPv6 packet: the default MTU
 * minus the fixed IP header.
 */
#define	IPV4_DEFAULT_PAYLOAD	(IPV4_MTU_DEFAULT - sizeof(struct ipv4_hdr))
#define	IPV6_DEFAULT_PAYLOAD	(IPV6_MTU_DEFAULT - sizeof(struct ipv6_hdr))

/*
 * Max number of fragments per packet expected - defined by config file.
 */
#define	MAX_PACKET_FRAG RTE_LIBRTE_IP_FRAG_MAX_FRAG

#define NB_MBUF   8192

/* Largest RX burst, and the queue depth that triggers a TX flush. */
#define MAX_PKT_BURST	32
#define BURST_TX_DRAIN_US 100 /* TX drain every ~100us */

/* Configure how many packets ahead to prefetch, when reading packets */
#define PREFETCH_OFFSET	3

/*
 * Configurable number of RX/TX ring descriptors
 */
#define RTE_TEST_RX_DESC_DEFAULT 128
#define RTE_TEST_TX_DESC_DEFAULT 512
static uint16_t nb_rxd = RTE_TEST_RX_DESC_DEFAULT;
static uint16_t nb_txd = RTE_TEST_TX_DESC_DEFAULT;
119e107e82eSAnatoly Burakov 
120e107e82eSAnatoly Burakov /* ethernet addresses of ports */
121e107e82eSAnatoly Burakov static struct ether_addr ports_eth_addr[RTE_MAX_ETHPORTS];
12274de12b7SAnatoly Burakov 
/*
 * printf helpers for an IPv4 address held as a host-order 32-bit value:
 * IPv4_BYTES_FMT is the format, IPv4_BYTES(addr) expands to the four
 * matching arguments, most significant byte first.
 */
#ifndef IPv4_BYTES
#define IPv4_BYTES_FMT "%" PRIu8 ".%" PRIu8 ".%" PRIu8 ".%" PRIu8
#define IPv4_BYTES(addr) \
		(uint8_t) (((addr) >> 24) & 0xFF),\
		(uint8_t) (((addr) >> 16) & 0xFF),\
		(uint8_t) (((addr) >> 8) & 0xFF),\
		(uint8_t) ((addr) & 0xFF)
#endif

/*
 * printf helpers for an IPv6 address held as 16 bytes:
 * IPv6_BYTES_FMT is the format, IPv6_BYTES(addr) expands to the sixteen
 * matching arguments. The argument is parenthesized so that any pointer
 * expression (e.g. "buf + off") can be passed, not just a plain identifier.
 */
#ifndef IPv6_BYTES
#define IPv6_BYTES_FMT "%02x%02x:%02x%02x:%02x%02x:%02x%02x:"\
                       "%02x%02x:%02x%02x:%02x%02x:%02x%02x"
#define IPv6_BYTES(addr) \
	(addr)[0],  (addr)[1],  (addr)[2],  (addr)[3], \
	(addr)[4],  (addr)[5],  (addr)[6],  (addr)[7], \
	(addr)[8],  (addr)[9],  (addr)[10], (addr)[11],\
	(addr)[12], (addr)[13], (addr)[14], (addr)[15]
#endif

/* Length of an IPv6 address in bytes. */
#define IPV6_ADDR_LEN 16
143e107e82eSAnatoly Burakov 
/* Bitmask of enabled ports (set from -p); bit N set means port N is enabled. */
static int enabled_port_mask;

/* Number of RX queues (= ports) handled by each lcore (set from -q). */
static int rx_queue_per_lcore = 1;

/*
 * Capacity of one per-port TX staging table: twice the larger of a full
 * burst and the maximum fragment count.
 */
#define MBUF_TABLE_SIZE  (2 * MAX(MAX_PKT_BURST, MAX_PACKET_FRAG))
150e107e82eSAnatoly Burakov 
151e107e82eSAnatoly Burakov struct mbuf_table {
152e107e82eSAnatoly Burakov 	uint16_t len;
153e107e82eSAnatoly Burakov 	struct rte_mbuf *m_table[MBUF_TABLE_SIZE];
154e107e82eSAnatoly Burakov };
155e107e82eSAnatoly Burakov 
/* Everything an lcore needs to process packets from one RX queue. */
struct rx_queue {
	struct rte_mempool *direct_pool;   /* passed to the fragmenter as its direct pool */
	struct rte_mempool *indirect_pool; /* passed to the fragmenter as its indirect pool */
	struct rte_lpm *lpm;               /* IPv4 route lookup table */
	struct rte_lpm6 *lpm6;             /* IPv6 route lookup table */
	uint8_t portid;                    /* port this queue receives from */
};
16374de12b7SAnatoly Burakov 
164e107e82eSAnatoly Burakov #define MAX_RX_QUEUE_PER_LCORE 16
165e107e82eSAnatoly Burakov #define MAX_TX_QUEUE_PER_PORT 16
166e107e82eSAnatoly Burakov struct lcore_queue_conf {
167e107e82eSAnatoly Burakov 	uint16_t n_rx_queue;
168e107e82eSAnatoly Burakov 	uint16_t tx_queue_id[RTE_MAX_ETHPORTS];
16974de12b7SAnatoly Burakov 	struct rx_queue rx_queue_list[MAX_RX_QUEUE_PER_LCORE];
170e107e82eSAnatoly Burakov 	struct mbuf_table tx_mbufs[RTE_MAX_ETHPORTS];
171e107e82eSAnatoly Burakov } __rte_cache_aligned;
172e107e82eSAnatoly Burakov struct lcore_queue_conf lcore_queue_conf[RTE_MAX_LCORE];
173e107e82eSAnatoly Burakov 
174e107e82eSAnatoly Burakov static const struct rte_eth_conf port_conf = {
175e107e82eSAnatoly Burakov 	.rxmode = {
176e107e82eSAnatoly Burakov 		.max_rx_pkt_len = JUMBO_FRAME_MAX_SIZE,
177e107e82eSAnatoly Burakov 		.split_hdr_size = 0,
178e107e82eSAnatoly Burakov 		.header_split   = 0, /**< Header Split disabled */
17974de12b7SAnatoly Burakov 		.hw_ip_checksum = 1, /**< IP checksum offload enabled */
180e107e82eSAnatoly Burakov 		.hw_vlan_filter = 0, /**< VLAN filtering disabled */
181e107e82eSAnatoly Burakov 		.jumbo_frame    = 1, /**< Jumbo Frame Support enabled */
182e107e82eSAnatoly Burakov 		.hw_strip_crc   = 0, /**< CRC stripped by hardware */
183e107e82eSAnatoly Burakov 	},
184e107e82eSAnatoly Burakov 	.txmode = {
185e107e82eSAnatoly Burakov 		.mq_mode = ETH_MQ_TX_NONE,
186e107e82eSAnatoly Burakov 	},
187e107e82eSAnatoly Burakov };
188e107e82eSAnatoly Burakov 
18974de12b7SAnatoly Burakov /*
19074de12b7SAnatoly Burakov  * IPv4 forwarding table
19174de12b7SAnatoly Burakov  */
19274de12b7SAnatoly Burakov struct l3fwd_ipv4_route {
193e107e82eSAnatoly Burakov 	uint32_t ip;
194e107e82eSAnatoly Burakov 	uint8_t  depth;
195e107e82eSAnatoly Burakov 	uint8_t  if_out;
196e107e82eSAnatoly Burakov };
197e107e82eSAnatoly Burakov 
19874de12b7SAnatoly Burakov struct l3fwd_ipv4_route l3fwd_ipv4_route_array[] = {
19974de12b7SAnatoly Burakov 		{IPv4(100,10,0,0), 16, 0},
20074de12b7SAnatoly Burakov 		{IPv4(100,20,0,0), 16, 1},
20174de12b7SAnatoly Burakov 		{IPv4(100,30,0,0), 16, 2},
20274de12b7SAnatoly Burakov 		{IPv4(100,40,0,0), 16, 3},
20374de12b7SAnatoly Burakov 		{IPv4(100,50,0,0), 16, 4},
20474de12b7SAnatoly Burakov 		{IPv4(100,60,0,0), 16, 5},
20574de12b7SAnatoly Burakov 		{IPv4(100,70,0,0), 16, 6},
20674de12b7SAnatoly Burakov 		{IPv4(100,80,0,0), 16, 7},
207e107e82eSAnatoly Burakov };
208e107e82eSAnatoly Burakov 
20974de12b7SAnatoly Burakov /*
21074de12b7SAnatoly Burakov  * IPv6 forwarding table
21174de12b7SAnatoly Burakov  */
212e107e82eSAnatoly Burakov 
21374de12b7SAnatoly Burakov struct l3fwd_ipv6_route {
21474de12b7SAnatoly Burakov 	uint8_t ip[IPV6_ADDR_LEN];
21574de12b7SAnatoly Burakov 	uint8_t depth;
21674de12b7SAnatoly Burakov 	uint8_t if_out;
21774de12b7SAnatoly Burakov };
218e107e82eSAnatoly Burakov 
21974de12b7SAnatoly Burakov static struct l3fwd_ipv6_route l3fwd_ipv6_route_array[] = {
22074de12b7SAnatoly Burakov 	{{1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 0},
22174de12b7SAnatoly Burakov 	{{2,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 1},
22274de12b7SAnatoly Burakov 	{{3,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 2},
22374de12b7SAnatoly Burakov 	{{4,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 3},
22474de12b7SAnatoly Burakov 	{{5,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 4},
22574de12b7SAnatoly Burakov 	{{6,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 5},
22674de12b7SAnatoly Burakov 	{{7,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 6},
22774de12b7SAnatoly Burakov 	{{8,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1}, 48, 7},
22874de12b7SAnatoly Burakov };
22974de12b7SAnatoly Burakov 
23074de12b7SAnatoly Burakov #define LPM_MAX_RULES         1024
23174de12b7SAnatoly Burakov #define LPM6_MAX_RULES         1024
23274de12b7SAnatoly Burakov #define LPM6_NUMBER_TBL8S (1 << 16)
23374de12b7SAnatoly Burakov 
23474de12b7SAnatoly Burakov struct rte_lpm6_config lpm6_config = {
23574de12b7SAnatoly Burakov 		.max_rules = LPM6_MAX_RULES,
23674de12b7SAnatoly Burakov 		.number_tbl8s = LPM6_NUMBER_TBL8S,
23774de12b7SAnatoly Burakov 		.flags = 0
23874de12b7SAnatoly Burakov };
23974de12b7SAnatoly Burakov 
24074de12b7SAnatoly Burakov static struct rte_mempool *socket_direct_pool[RTE_MAX_NUMA_NODES];
24174de12b7SAnatoly Burakov static struct rte_mempool *socket_indirect_pool[RTE_MAX_NUMA_NODES];
24274de12b7SAnatoly Burakov static struct rte_lpm *socket_lpm[RTE_MAX_NUMA_NODES];
24374de12b7SAnatoly Burakov static struct rte_lpm6 *socket_lpm6[RTE_MAX_NUMA_NODES];
244e107e82eSAnatoly Burakov 
245e107e82eSAnatoly Burakov /* Send burst of packets on an output interface */
246e107e82eSAnatoly Burakov static inline int
247e107e82eSAnatoly Burakov send_burst(struct lcore_queue_conf *qconf, uint16_t n, uint8_t port)
248e107e82eSAnatoly Burakov {
249e107e82eSAnatoly Burakov 	struct rte_mbuf **m_table;
250e107e82eSAnatoly Burakov 	int ret;
251e107e82eSAnatoly Burakov 	uint16_t queueid;
252e107e82eSAnatoly Burakov 
253e107e82eSAnatoly Burakov 	queueid = qconf->tx_queue_id[port];
254e107e82eSAnatoly Burakov 	m_table = (struct rte_mbuf **)qconf->tx_mbufs[port].m_table;
255e107e82eSAnatoly Burakov 
256e107e82eSAnatoly Burakov 	ret = rte_eth_tx_burst(port, queueid, m_table, n);
257e107e82eSAnatoly Burakov 	if (unlikely(ret < n)) {
258e107e82eSAnatoly Burakov 		do {
259e107e82eSAnatoly Burakov 			rte_pktmbuf_free(m_table[ret]);
260e107e82eSAnatoly Burakov 		} while (++ret < n);
261e107e82eSAnatoly Burakov 	}
262e107e82eSAnatoly Burakov 
263e107e82eSAnatoly Burakov 	return 0;
264e107e82eSAnatoly Burakov }
265e107e82eSAnatoly Burakov 
266e107e82eSAnatoly Burakov static inline void
26774de12b7SAnatoly Burakov l3fwd_simple_forward(struct rte_mbuf *m, struct lcore_queue_conf *qconf,
26874de12b7SAnatoly Burakov 		uint8_t queueid, uint8_t port_in)
269e107e82eSAnatoly Burakov {
27074de12b7SAnatoly Burakov 	struct rx_queue *rxq;
27174de12b7SAnatoly Burakov 	uint32_t i, len;
27274de12b7SAnatoly Burakov 	uint8_t next_hop, port_out, ipv6;
273e107e82eSAnatoly Burakov 	int32_t len2;
274e107e82eSAnatoly Burakov 
27574de12b7SAnatoly Burakov 	ipv6 = 0;
27674de12b7SAnatoly Burakov 	rxq = &qconf->rx_queue_list[queueid];
27774de12b7SAnatoly Burakov 
27874de12b7SAnatoly Burakov 	/* by default, send everything back to the source port */
27974de12b7SAnatoly Burakov 	port_out = port_in;
280e107e82eSAnatoly Burakov 
281e107e82eSAnatoly Burakov 	/* Remove the Ethernet header and trailer from the input packet */
282e107e82eSAnatoly Burakov 	rte_pktmbuf_adj(m, (uint16_t)sizeof(struct ether_hdr));
283e107e82eSAnatoly Burakov 
28474de12b7SAnatoly Burakov 	/* Build transmission burst */
28574de12b7SAnatoly Burakov 	len = qconf->tx_mbufs[port_out].len;
28674de12b7SAnatoly Burakov 
28774de12b7SAnatoly Burakov 	/* if this is an IPv4 packet */
28874de12b7SAnatoly Burakov 	if (m->ol_flags & PKT_RX_IPV4_HDR) {
28974de12b7SAnatoly Burakov 		struct ipv4_hdr *ip_hdr;
29074de12b7SAnatoly Burakov 		uint32_t ip_dst;
291e107e82eSAnatoly Burakov 		/* Read the lookup key (i.e. ip_dst) from the input packet */
292e107e82eSAnatoly Burakov 		ip_hdr = rte_pktmbuf_mtod(m, struct ipv4_hdr *);
293e107e82eSAnatoly Burakov 		ip_dst = rte_be_to_cpu_32(ip_hdr->dst_addr);
294e107e82eSAnatoly Burakov 
295e107e82eSAnatoly Burakov 		/* Find destination port */
29674de12b7SAnatoly Burakov 		if (rte_lpm_lookup(rxq->lpm, ip_dst, &next_hop) == 0 &&
29774de12b7SAnatoly Burakov 				(enabled_port_mask & 1 << next_hop) != 0) {
298e107e82eSAnatoly Burakov 			port_out = next_hop;
299e107e82eSAnatoly Burakov 
30074de12b7SAnatoly Burakov 			/* Build transmission burst for new port */
301e107e82eSAnatoly Burakov 			len = qconf->tx_mbufs[port_out].len;
30274de12b7SAnatoly Burakov 		}
303e107e82eSAnatoly Burakov 
304e107e82eSAnatoly Burakov 		/* if we don't need to do any fragmentation */
305ea672a8bSOlivier Matz 		if (likely (IPV4_MTU_DEFAULT >= m->pkt_len)) {
306e107e82eSAnatoly Burakov 			qconf->tx_mbufs[port_out].m_table[len] = m;
307e107e82eSAnatoly Burakov 			len2 = 1;
308e107e82eSAnatoly Burakov 		} else {
309e107e82eSAnatoly Burakov 			len2 = rte_ipv4_fragment_packet(m,
310e107e82eSAnatoly Burakov 				&qconf->tx_mbufs[port_out].m_table[len],
311e107e82eSAnatoly Burakov 				(uint16_t)(MBUF_TABLE_SIZE - len),
312e107e82eSAnatoly Burakov 				IPV4_MTU_DEFAULT,
31374de12b7SAnatoly Burakov 				rxq->direct_pool, rxq->indirect_pool);
314e107e82eSAnatoly Burakov 
315e107e82eSAnatoly Burakov 			/* Free input packet */
316e107e82eSAnatoly Burakov 			rte_pktmbuf_free(m);
317e107e82eSAnatoly Burakov 
318e107e82eSAnatoly Burakov 			/* If we fail to fragment the packet */
319e107e82eSAnatoly Burakov 			if (unlikely (len2 < 0))
320e107e82eSAnatoly Burakov 				return;
321e107e82eSAnatoly Burakov 		}
32274de12b7SAnatoly Burakov 	}
32374de12b7SAnatoly Burakov 	/* if this is an IPv6 packet */
32474de12b7SAnatoly Burakov 	else if (m->ol_flags & PKT_RX_IPV6_HDR) {
32574de12b7SAnatoly Burakov 		struct ipv6_hdr *ip_hdr;
32674de12b7SAnatoly Burakov 
32774de12b7SAnatoly Burakov 		ipv6 = 1;
32874de12b7SAnatoly Burakov 
32974de12b7SAnatoly Burakov 		/* Read the lookup key (i.e. ip_dst) from the input packet */
33074de12b7SAnatoly Burakov 		ip_hdr = rte_pktmbuf_mtod(m, struct ipv6_hdr *);
33174de12b7SAnatoly Burakov 
33274de12b7SAnatoly Burakov 		/* Find destination port */
33374de12b7SAnatoly Burakov 		if (rte_lpm6_lookup(rxq->lpm6, ip_hdr->dst_addr, &next_hop) == 0 &&
33474de12b7SAnatoly Burakov 				(enabled_port_mask & 1 << next_hop) != 0) {
33574de12b7SAnatoly Burakov 			port_out = next_hop;
33674de12b7SAnatoly Burakov 
33774de12b7SAnatoly Burakov 			/* Build transmission burst for new port */
33874de12b7SAnatoly Burakov 			len = qconf->tx_mbufs[port_out].len;
33974de12b7SAnatoly Burakov 		}
34074de12b7SAnatoly Burakov 
34174de12b7SAnatoly Burakov 		/* if we don't need to do any fragmentation */
342ea672a8bSOlivier Matz 		if (likely (IPV6_MTU_DEFAULT >= m->pkt_len)) {
34374de12b7SAnatoly Burakov 			qconf->tx_mbufs[port_out].m_table[len] = m;
34474de12b7SAnatoly Burakov 			len2 = 1;
34574de12b7SAnatoly Burakov 		} else {
34674de12b7SAnatoly Burakov 			len2 = rte_ipv6_fragment_packet(m,
34774de12b7SAnatoly Burakov 				&qconf->tx_mbufs[port_out].m_table[len],
34874de12b7SAnatoly Burakov 				(uint16_t)(MBUF_TABLE_SIZE - len),
34974de12b7SAnatoly Burakov 				IPV6_MTU_DEFAULT,
35074de12b7SAnatoly Burakov 				rxq->direct_pool, rxq->indirect_pool);
35174de12b7SAnatoly Burakov 
35274de12b7SAnatoly Burakov 			/* Free input packet */
35374de12b7SAnatoly Burakov 			rte_pktmbuf_free(m);
35474de12b7SAnatoly Burakov 
35574de12b7SAnatoly Burakov 			/* If we fail to fragment the packet */
35674de12b7SAnatoly Burakov 			if (unlikely (len2 < 0))
35774de12b7SAnatoly Burakov 				return;
35874de12b7SAnatoly Burakov 		}
35974de12b7SAnatoly Burakov 	}
36074de12b7SAnatoly Burakov 	/* else, just forward the packet */
36174de12b7SAnatoly Burakov 	else {
36274de12b7SAnatoly Burakov 		qconf->tx_mbufs[port_out].m_table[len] = m;
36374de12b7SAnatoly Burakov 		len2 = 1;
36474de12b7SAnatoly Burakov 	}
365e107e82eSAnatoly Burakov 
366e107e82eSAnatoly Burakov 	for (i = len; i < len + len2; i ++) {
36774de12b7SAnatoly Burakov 		void *d_addr_bytes;
36874de12b7SAnatoly Burakov 
369e107e82eSAnatoly Burakov 		m = qconf->tx_mbufs[port_out].m_table[i];
370e107e82eSAnatoly Burakov 		struct ether_hdr *eth_hdr = (struct ether_hdr *)
371e107e82eSAnatoly Burakov 			rte_pktmbuf_prepend(m, (uint16_t)sizeof(struct ether_hdr));
372e107e82eSAnatoly Burakov 		if (eth_hdr == NULL) {
373e107e82eSAnatoly Burakov 			rte_panic("No headroom in mbuf.\n");
374e107e82eSAnatoly Burakov 		}
375e107e82eSAnatoly Burakov 
3767869536fSBruce Richardson 		m->l2_len = sizeof(struct ether_hdr);
377e107e82eSAnatoly Burakov 
37874de12b7SAnatoly Burakov 		/* 02:00:00:00:00:xx */
37974de12b7SAnatoly Burakov 		d_addr_bytes = &eth_hdr->d_addr.addr_bytes[0];
38074de12b7SAnatoly Burakov 		*((uint64_t *)d_addr_bytes) = 0x000000000002 + ((uint64_t)port_out << 40);
38174de12b7SAnatoly Burakov 
38274de12b7SAnatoly Burakov 		/* src addr */
383e107e82eSAnatoly Burakov 		ether_addr_copy(&ports_eth_addr[port_out], &eth_hdr->s_addr);
38474de12b7SAnatoly Burakov 		if (ipv6)
38574de12b7SAnatoly Burakov 			eth_hdr->ether_type = rte_be_to_cpu_16(ETHER_TYPE_IPv6);
38674de12b7SAnatoly Burakov 		else
387e107e82eSAnatoly Burakov 			eth_hdr->ether_type = rte_be_to_cpu_16(ETHER_TYPE_IPv4);
388e107e82eSAnatoly Burakov 	}
389e107e82eSAnatoly Burakov 
390e107e82eSAnatoly Burakov 	len += len2;
391e107e82eSAnatoly Burakov 
392e107e82eSAnatoly Burakov 	if (likely(len < MAX_PKT_BURST)) {
393e107e82eSAnatoly Burakov 		qconf->tx_mbufs[port_out].len = (uint16_t)len;
394e107e82eSAnatoly Burakov 		return;
395e107e82eSAnatoly Burakov 	}
396e107e82eSAnatoly Burakov 
397e107e82eSAnatoly Burakov 	/* Transmit packets */
398e107e82eSAnatoly Burakov 	send_burst(qconf, (uint16_t)len, port_out);
399e107e82eSAnatoly Burakov 	qconf->tx_mbufs[port_out].len = 0;
400e107e82eSAnatoly Burakov }
401e107e82eSAnatoly Burakov 
402e107e82eSAnatoly Burakov /* main processing loop */
403e107e82eSAnatoly Burakov static int
404e107e82eSAnatoly Burakov main_loop(__attribute__((unused)) void *dummy)
405e107e82eSAnatoly Burakov {
406e107e82eSAnatoly Burakov 	struct rte_mbuf *pkts_burst[MAX_PKT_BURST];
407e107e82eSAnatoly Burakov 	unsigned lcore_id;
408e107e82eSAnatoly Burakov 	uint64_t prev_tsc, diff_tsc, cur_tsc;
409e107e82eSAnatoly Burakov 	int i, j, nb_rx;
410e107e82eSAnatoly Burakov 	uint8_t portid;
411e107e82eSAnatoly Burakov 	struct lcore_queue_conf *qconf;
412e107e82eSAnatoly Burakov 	const uint64_t drain_tsc = (rte_get_tsc_hz() + US_PER_S - 1) / US_PER_S * BURST_TX_DRAIN_US;
413e107e82eSAnatoly Burakov 
414e107e82eSAnatoly Burakov 	prev_tsc = 0;
415e107e82eSAnatoly Burakov 
416e107e82eSAnatoly Burakov 	lcore_id = rte_lcore_id();
417e107e82eSAnatoly Burakov 	qconf = &lcore_queue_conf[lcore_id];
418e107e82eSAnatoly Burakov 
419e107e82eSAnatoly Burakov 	if (qconf->n_rx_queue == 0) {
42074de12b7SAnatoly Burakov 		RTE_LOG(INFO, IP_FRAG, "lcore %u has nothing to do\n", lcore_id);
421e107e82eSAnatoly Burakov 		return 0;
422e107e82eSAnatoly Burakov 	}
423e107e82eSAnatoly Burakov 
42474de12b7SAnatoly Burakov 	RTE_LOG(INFO, IP_FRAG, "entering main loop on lcore %u\n", lcore_id);
425e107e82eSAnatoly Burakov 
426e107e82eSAnatoly Burakov 	for (i = 0; i < qconf->n_rx_queue; i++) {
427e107e82eSAnatoly Burakov 
42874de12b7SAnatoly Burakov 		portid = qconf->rx_queue_list[i].portid;
42974de12b7SAnatoly Burakov 		RTE_LOG(INFO, IP_FRAG, " -- lcoreid=%u portid=%d\n", lcore_id,
430e107e82eSAnatoly Burakov 				(int) portid);
431e107e82eSAnatoly Burakov 	}
432e107e82eSAnatoly Burakov 
433e107e82eSAnatoly Burakov 	while (1) {
434e107e82eSAnatoly Burakov 
435e107e82eSAnatoly Burakov 		cur_tsc = rte_rdtsc();
436e107e82eSAnatoly Burakov 
437e107e82eSAnatoly Burakov 		/*
438e107e82eSAnatoly Burakov 		 * TX burst queue drain
439e107e82eSAnatoly Burakov 		 */
440e107e82eSAnatoly Burakov 		diff_tsc = cur_tsc - prev_tsc;
441e107e82eSAnatoly Burakov 		if (unlikely(diff_tsc > drain_tsc)) {
442e107e82eSAnatoly Burakov 
443e107e82eSAnatoly Burakov 			/*
444e107e82eSAnatoly Burakov 			 * This could be optimized (use queueid instead of
445e107e82eSAnatoly Burakov 			 * portid), but it is not called so often
446e107e82eSAnatoly Burakov 			 */
447e107e82eSAnatoly Burakov 			for (portid = 0; portid < RTE_MAX_ETHPORTS; portid++) {
448e107e82eSAnatoly Burakov 				if (qconf->tx_mbufs[portid].len == 0)
449e107e82eSAnatoly Burakov 					continue;
450e107e82eSAnatoly Burakov 				send_burst(&lcore_queue_conf[lcore_id],
451e107e82eSAnatoly Burakov 					   qconf->tx_mbufs[portid].len,
452e107e82eSAnatoly Burakov 					   portid);
453e107e82eSAnatoly Burakov 				qconf->tx_mbufs[portid].len = 0;
454e107e82eSAnatoly Burakov 			}
455e107e82eSAnatoly Burakov 
456e107e82eSAnatoly Burakov 			prev_tsc = cur_tsc;
457e107e82eSAnatoly Burakov 		}
458e107e82eSAnatoly Burakov 
459e107e82eSAnatoly Burakov 		/*
460e107e82eSAnatoly Burakov 		 * Read packet from RX queues
461e107e82eSAnatoly Burakov 		 */
462e107e82eSAnatoly Burakov 		for (i = 0; i < qconf->n_rx_queue; i++) {
463e107e82eSAnatoly Burakov 
46474de12b7SAnatoly Burakov 			portid = qconf->rx_queue_list[i].portid;
465e107e82eSAnatoly Burakov 			nb_rx = rte_eth_rx_burst(portid, 0, pkts_burst,
466e107e82eSAnatoly Burakov 						 MAX_PKT_BURST);
467e107e82eSAnatoly Burakov 
468e107e82eSAnatoly Burakov 			/* Prefetch first packets */
469e107e82eSAnatoly Burakov 			for (j = 0; j < PREFETCH_OFFSET && j < nb_rx; j++) {
470e107e82eSAnatoly Burakov 				rte_prefetch0(rte_pktmbuf_mtod(
471e107e82eSAnatoly Burakov 						pkts_burst[j], void *));
472e107e82eSAnatoly Burakov 			}
473e107e82eSAnatoly Burakov 
474e107e82eSAnatoly Burakov 			/* Prefetch and forward already prefetched packets */
475e107e82eSAnatoly Burakov 			for (j = 0; j < (nb_rx - PREFETCH_OFFSET); j++) {
476e107e82eSAnatoly Burakov 				rte_prefetch0(rte_pktmbuf_mtod(pkts_burst[
477e107e82eSAnatoly Burakov 						j + PREFETCH_OFFSET], void *));
47874de12b7SAnatoly Burakov 				l3fwd_simple_forward(pkts_burst[j], qconf, i, portid);
479e107e82eSAnatoly Burakov 			}
480e107e82eSAnatoly Burakov 
481e107e82eSAnatoly Burakov 			/* Forward remaining prefetched packets */
482e107e82eSAnatoly Burakov 			for (; j < nb_rx; j++) {
48374de12b7SAnatoly Burakov 				l3fwd_simple_forward(pkts_burst[j], qconf, i, portid);
484e107e82eSAnatoly Burakov 			}
485e107e82eSAnatoly Burakov 		}
486e107e82eSAnatoly Burakov 	}
487e107e82eSAnatoly Burakov }
488e107e82eSAnatoly Burakov 
/* Print the command-line synopsis of the application to stdout. */
static void
print_usage(const char *prgname)
{
	/* synopsis line, then one line per application option */
	printf("%s [EAL options] -- -p PORTMASK [-q NQ]\n", prgname);
	printf("  -p PORTMASK: hexadecimal bitmask of ports to configure\n");
	printf("  -q NQ: number of queue (=ports) per lcore (default is 1)\n");
}
498e107e82eSAnatoly Burakov 
/*
 * Parse a hexadecimal port mask.
 *
 * Returns the mask as a positive int, or -1 when the string is empty, is
 * not entirely a hexadecimal number, is zero, or does not fit in a
 * positive 32-bit int. The last check stops an oversized mask from being
 * silently truncated to a different, valid-looking mask on return.
 */
static int
parse_portmask(const char *portmask)
{
	char *end = NULL;
	unsigned long pm;

	/* parse hexadecimal string */
	pm = strtoul(portmask, &end, 16);
	if ((portmask[0] == '\0') || (end == NULL) || (*end != '\0'))
		return -1;

	/* zero selects nothing; anything above INT32_MAX cannot be returned */
	if (pm == 0 || pm > INT32_MAX)
		return -1;

	return (int)pm;
}
515e107e82eSAnatoly Burakov 
516e107e82eSAnatoly Burakov static int
517e107e82eSAnatoly Burakov parse_nqueue(const char *q_arg)
518e107e82eSAnatoly Burakov {
519e107e82eSAnatoly Burakov 	char *end = NULL;
520e107e82eSAnatoly Burakov 	unsigned long n;
521e107e82eSAnatoly Burakov 
522e107e82eSAnatoly Burakov 	/* parse hexadecimal string */
523e107e82eSAnatoly Burakov 	n = strtoul(q_arg, &end, 10);
524e107e82eSAnatoly Burakov 	if ((q_arg[0] == '\0') || (end == NULL) || (*end != '\0'))
525e107e82eSAnatoly Burakov 		return -1;
526e107e82eSAnatoly Burakov 	if (n == 0)
527e107e82eSAnatoly Burakov 		return -1;
528e107e82eSAnatoly Burakov 	if (n >= MAX_RX_QUEUE_PER_LCORE)
529e107e82eSAnatoly Burakov 		return -1;
530e107e82eSAnatoly Burakov 
531e107e82eSAnatoly Burakov 	return n;
532e107e82eSAnatoly Burakov }
533e107e82eSAnatoly Burakov 
534e107e82eSAnatoly Burakov /* Parse the argument given in the command line of the application */
535e107e82eSAnatoly Burakov static int
536e107e82eSAnatoly Burakov parse_args(int argc, char **argv)
537e107e82eSAnatoly Burakov {
538e107e82eSAnatoly Burakov 	int opt, ret;
539e107e82eSAnatoly Burakov 	char **argvopt;
540e107e82eSAnatoly Burakov 	int option_index;
541e107e82eSAnatoly Burakov 	char *prgname = argv[0];
542e107e82eSAnatoly Burakov 	static struct option lgopts[] = {
543e107e82eSAnatoly Burakov 		{NULL, 0, 0, 0}
544e107e82eSAnatoly Burakov 	};
545e107e82eSAnatoly Burakov 
546e107e82eSAnatoly Burakov 	argvopt = argv;
547e107e82eSAnatoly Burakov 
548e107e82eSAnatoly Burakov 	while ((opt = getopt_long(argc, argvopt, "p:q:",
549e107e82eSAnatoly Burakov 				  lgopts, &option_index)) != EOF) {
550e107e82eSAnatoly Burakov 
551e107e82eSAnatoly Burakov 		switch (opt) {
552e107e82eSAnatoly Burakov 		/* portmask */
553e107e82eSAnatoly Burakov 		case 'p':
554e107e82eSAnatoly Burakov 			enabled_port_mask = parse_portmask(optarg);
555e107e82eSAnatoly Burakov 			if (enabled_port_mask < 0) {
556e107e82eSAnatoly Burakov 				printf("invalid portmask\n");
557e107e82eSAnatoly Burakov 				print_usage(prgname);
558e107e82eSAnatoly Burakov 				return -1;
559e107e82eSAnatoly Burakov 			}
560e107e82eSAnatoly Burakov 			break;
561e107e82eSAnatoly Burakov 
562e107e82eSAnatoly Burakov 		/* nqueue */
563e107e82eSAnatoly Burakov 		case 'q':
564e107e82eSAnatoly Burakov 			rx_queue_per_lcore = parse_nqueue(optarg);
565e107e82eSAnatoly Burakov 			if (rx_queue_per_lcore < 0) {
566e107e82eSAnatoly Burakov 				printf("invalid queue number\n");
567e107e82eSAnatoly Burakov 				print_usage(prgname);
568e107e82eSAnatoly Burakov 				return -1;
569e107e82eSAnatoly Burakov 			}
570e107e82eSAnatoly Burakov 			break;
571e107e82eSAnatoly Burakov 
572e107e82eSAnatoly Burakov 		/* long options */
573e107e82eSAnatoly Burakov 		case 0:
574e107e82eSAnatoly Burakov 			print_usage(prgname);
575e107e82eSAnatoly Burakov 			return -1;
576e107e82eSAnatoly Burakov 
577e107e82eSAnatoly Burakov 		default:
578e107e82eSAnatoly Burakov 			print_usage(prgname);
579e107e82eSAnatoly Burakov 			return -1;
580e107e82eSAnatoly Burakov 		}
581e107e82eSAnatoly Burakov 	}
582e107e82eSAnatoly Burakov 
583e107e82eSAnatoly Burakov 	if (enabled_port_mask == 0) {
584e107e82eSAnatoly Burakov 		printf("portmask not specified\n");
585e107e82eSAnatoly Burakov 		print_usage(prgname);
586e107e82eSAnatoly Burakov 		return -1;
587e107e82eSAnatoly Burakov 	}
588e107e82eSAnatoly Burakov 
589e107e82eSAnatoly Burakov 	if (optind >= 0)
590e107e82eSAnatoly Burakov 		argv[optind-1] = prgname;
591e107e82eSAnatoly Burakov 
592e107e82eSAnatoly Burakov 	ret = optind-1;
593e107e82eSAnatoly Burakov 	optind = 0; /* reset getopt lib */
594e107e82eSAnatoly Burakov 	return ret;
595e107e82eSAnatoly Burakov }
596e107e82eSAnatoly Burakov 
597e107e82eSAnatoly Burakov static void
598e107e82eSAnatoly Burakov print_ethaddr(const char *name, struct ether_addr *eth_addr)
599e107e82eSAnatoly Burakov {
600ec3d82dbSCunming Liang 	char buf[ETHER_ADDR_FMT_SIZE];
601ec3d82dbSCunming Liang 	ether_format_addr(buf, ETHER_ADDR_FMT_SIZE, eth_addr);
602ec3d82dbSCunming Liang 	printf("%s%s", name, buf);
603e107e82eSAnatoly Burakov }
604e107e82eSAnatoly Burakov 
605e107e82eSAnatoly Burakov /* Check the link status of all ports in up to 9s, and print them finally */
606e107e82eSAnatoly Burakov static void
607e107e82eSAnatoly Burakov check_all_ports_link_status(uint8_t port_num, uint32_t port_mask)
608e107e82eSAnatoly Burakov {
609e107e82eSAnatoly Burakov #define CHECK_INTERVAL 100 /* 100ms */
610e107e82eSAnatoly Burakov #define MAX_CHECK_TIME 90 /* 9s (90 * 100ms) in total */
611e107e82eSAnatoly Burakov 	uint8_t portid, count, all_ports_up, print_flag = 0;
612e107e82eSAnatoly Burakov 	struct rte_eth_link link;
613e107e82eSAnatoly Burakov 
614e107e82eSAnatoly Burakov 	printf("\nChecking link status");
615e107e82eSAnatoly Burakov 	fflush(stdout);
616e107e82eSAnatoly Burakov 	for (count = 0; count <= MAX_CHECK_TIME; count++) {
617e107e82eSAnatoly Burakov 		all_ports_up = 1;
618e107e82eSAnatoly Burakov 		for (portid = 0; portid < port_num; portid++) {
619e107e82eSAnatoly Burakov 			if ((port_mask & (1 << portid)) == 0)
620e107e82eSAnatoly Burakov 				continue;
621e107e82eSAnatoly Burakov 			memset(&link, 0, sizeof(link));
622e107e82eSAnatoly Burakov 			rte_eth_link_get_nowait(portid, &link);
623e107e82eSAnatoly Burakov 			/* print link status if flag set */
624e107e82eSAnatoly Burakov 			if (print_flag == 1) {
625e107e82eSAnatoly Burakov 				if (link.link_status)
626e107e82eSAnatoly Burakov 					printf("Port %d Link Up - speed %u "
627e107e82eSAnatoly Burakov 						"Mbps - %s\n", (uint8_t)portid,
628e107e82eSAnatoly Burakov 						(unsigned)link.link_speed,
629e107e82eSAnatoly Burakov 				(link.link_duplex == ETH_LINK_FULL_DUPLEX) ?
630e107e82eSAnatoly Burakov 					("full-duplex") : ("half-duplex\n"));
631e107e82eSAnatoly Burakov 				else
632e107e82eSAnatoly Burakov 					printf("Port %d Link Down\n",
633e107e82eSAnatoly Burakov 							(uint8_t)portid);
634e107e82eSAnatoly Burakov 				continue;
635e107e82eSAnatoly Burakov 			}
636e107e82eSAnatoly Burakov 			/* clear all_ports_up flag if any link down */
637e107e82eSAnatoly Burakov 			if (link.link_status == 0) {
638e107e82eSAnatoly Burakov 				all_ports_up = 0;
639e107e82eSAnatoly Burakov 				break;
640e107e82eSAnatoly Burakov 			}
641e107e82eSAnatoly Burakov 		}
642e107e82eSAnatoly Burakov 		/* after finally printing all link status, get out */
643e107e82eSAnatoly Burakov 		if (print_flag == 1)
644e107e82eSAnatoly Burakov 			break;
645e107e82eSAnatoly Burakov 
646e107e82eSAnatoly Burakov 		if (all_ports_up == 0) {
647e107e82eSAnatoly Burakov 			printf(".");
648e107e82eSAnatoly Burakov 			fflush(stdout);
649e107e82eSAnatoly Burakov 			rte_delay_ms(CHECK_INTERVAL);
650e107e82eSAnatoly Burakov 		}
651e107e82eSAnatoly Burakov 
652e107e82eSAnatoly Burakov 		/* set the print_flag if all ports up or timeout */
653e107e82eSAnatoly Burakov 		if (all_ports_up == 1 || count == (MAX_CHECK_TIME - 1)) {
654e107e82eSAnatoly Burakov 			print_flag = 1;
65574de12b7SAnatoly Burakov 			printf("\ndone\n");
656e107e82eSAnatoly Burakov 		}
657e107e82eSAnatoly Burakov 	}
658e107e82eSAnatoly Burakov }
659e107e82eSAnatoly Burakov 
66074de12b7SAnatoly Burakov static int
66174de12b7SAnatoly Burakov init_routing_table(void)
66274de12b7SAnatoly Burakov {
66374de12b7SAnatoly Burakov 	struct rte_lpm *lpm;
66474de12b7SAnatoly Burakov 	struct rte_lpm6 *lpm6;
66574de12b7SAnatoly Burakov 	int socket, ret;
66674de12b7SAnatoly Burakov 	unsigned i;
66774de12b7SAnatoly Burakov 
66874de12b7SAnatoly Burakov 	for (socket = 0; socket < RTE_MAX_NUMA_NODES; socket++) {
66974de12b7SAnatoly Burakov 		if (socket_lpm[socket]) {
67074de12b7SAnatoly Burakov 			lpm = socket_lpm[socket];
67174de12b7SAnatoly Burakov 			/* populate the LPM table */
67274de12b7SAnatoly Burakov 			for (i = 0; i < RTE_DIM(l3fwd_ipv4_route_array); i++) {
67374de12b7SAnatoly Burakov 				ret = rte_lpm_add(lpm,
67474de12b7SAnatoly Burakov 					l3fwd_ipv4_route_array[i].ip,
67574de12b7SAnatoly Burakov 					l3fwd_ipv4_route_array[i].depth,
67674de12b7SAnatoly Burakov 					l3fwd_ipv4_route_array[i].if_out);
67774de12b7SAnatoly Burakov 
67874de12b7SAnatoly Burakov 				if (ret < 0) {
67974de12b7SAnatoly Burakov 					RTE_LOG(ERR, IP_FRAG, "Unable to add entry %i to the l3fwd "
68074de12b7SAnatoly Burakov 						"LPM table\n", i);
68174de12b7SAnatoly Burakov 					return -1;
68274de12b7SAnatoly Burakov 				}
68374de12b7SAnatoly Burakov 
68474de12b7SAnatoly Burakov 				RTE_LOG(INFO, IP_FRAG, "Socket %i: adding route " IPv4_BYTES_FMT
68574de12b7SAnatoly Burakov 						"/%d (port %d)\n",
68674de12b7SAnatoly Burakov 					socket,
68774de12b7SAnatoly Burakov 					IPv4_BYTES(l3fwd_ipv4_route_array[i].ip),
68874de12b7SAnatoly Burakov 					l3fwd_ipv4_route_array[i].depth,
68974de12b7SAnatoly Burakov 					l3fwd_ipv4_route_array[i].if_out);
69074de12b7SAnatoly Burakov 			}
69174de12b7SAnatoly Burakov 		}
69274de12b7SAnatoly Burakov 
69374de12b7SAnatoly Burakov 		if (socket_lpm6[socket]) {
69474de12b7SAnatoly Burakov 			lpm6 = socket_lpm6[socket];
69574de12b7SAnatoly Burakov 			/* populate the LPM6 table */
69674de12b7SAnatoly Burakov 			for (i = 0; i < RTE_DIM(l3fwd_ipv6_route_array); i++) {
69774de12b7SAnatoly Burakov 				ret = rte_lpm6_add(lpm6,
69874de12b7SAnatoly Burakov 					l3fwd_ipv6_route_array[i].ip,
69974de12b7SAnatoly Burakov 					l3fwd_ipv6_route_array[i].depth,
70074de12b7SAnatoly Burakov 					l3fwd_ipv6_route_array[i].if_out);
70174de12b7SAnatoly Burakov 
70274de12b7SAnatoly Burakov 				if (ret < 0) {
70374de12b7SAnatoly Burakov 					RTE_LOG(ERR, IP_FRAG, "Unable to add entry %i to the l3fwd "
70474de12b7SAnatoly Burakov 						"LPM6 table\n", i);
70574de12b7SAnatoly Burakov 					return -1;
70674de12b7SAnatoly Burakov 				}
70774de12b7SAnatoly Burakov 
70874de12b7SAnatoly Burakov 				RTE_LOG(INFO, IP_FRAG, "Socket %i: adding route " IPv6_BYTES_FMT
70974de12b7SAnatoly Burakov 						"/%d (port %d)\n",
71074de12b7SAnatoly Burakov 					socket,
71174de12b7SAnatoly Burakov 					IPv6_BYTES(l3fwd_ipv6_route_array[i].ip),
71274de12b7SAnatoly Burakov 					l3fwd_ipv6_route_array[i].depth,
71374de12b7SAnatoly Burakov 					l3fwd_ipv6_route_array[i].if_out);
71474de12b7SAnatoly Burakov 			}
71574de12b7SAnatoly Burakov 		}
71674de12b7SAnatoly Burakov 	}
71774de12b7SAnatoly Burakov 	return 0;
71874de12b7SAnatoly Burakov }
71974de12b7SAnatoly Burakov 
72074de12b7SAnatoly Burakov static int
72174de12b7SAnatoly Burakov init_mem(void)
72274de12b7SAnatoly Burakov {
72374de12b7SAnatoly Burakov 	char buf[PATH_MAX];
72474de12b7SAnatoly Burakov 	struct rte_mempool *mp;
72574de12b7SAnatoly Burakov 	struct rte_lpm *lpm;
72674de12b7SAnatoly Burakov 	struct rte_lpm6 *lpm6;
72774de12b7SAnatoly Burakov 	int socket;
72874de12b7SAnatoly Burakov 	unsigned lcore_id;
72974de12b7SAnatoly Burakov 
73074de12b7SAnatoly Burakov 	/* traverse through lcores and initialize structures on each socket */
73174de12b7SAnatoly Burakov 
73274de12b7SAnatoly Burakov 	for (lcore_id = 0; lcore_id < RTE_MAX_LCORE; lcore_id++) {
73374de12b7SAnatoly Burakov 
73474de12b7SAnatoly Burakov 		if (rte_lcore_is_enabled(lcore_id) == 0)
73574de12b7SAnatoly Burakov 			continue;
73674de12b7SAnatoly Burakov 
73774de12b7SAnatoly Burakov 		socket = rte_lcore_to_socket_id(lcore_id);
73874de12b7SAnatoly Burakov 
73974de12b7SAnatoly Burakov 		if (socket == SOCKET_ID_ANY)
74074de12b7SAnatoly Burakov 			socket = 0;
74174de12b7SAnatoly Burakov 
74274de12b7SAnatoly Burakov 		if (socket_direct_pool[socket] == NULL) {
74374de12b7SAnatoly Burakov 			RTE_LOG(INFO, IP_FRAG, "Creating direct mempool on socket %i\n",
74474de12b7SAnatoly Burakov 					socket);
7456f41fe75SStephen Hemminger 			snprintf(buf, sizeof(buf), "pool_direct_%i", socket);
74674de12b7SAnatoly Burakov 
747*ea0c20eaSOlivier Matz 			mp = rte_pktmbuf_pool_create(buf, NB_MBUF, 32,
748*ea0c20eaSOlivier Matz 				0, MBUF_DATA_SIZE, socket);
74974de12b7SAnatoly Burakov 			if (mp == NULL) {
75074de12b7SAnatoly Burakov 				RTE_LOG(ERR, IP_FRAG, "Cannot create direct mempool\n");
75174de12b7SAnatoly Burakov 				return -1;
75274de12b7SAnatoly Burakov 			}
75374de12b7SAnatoly Burakov 			socket_direct_pool[socket] = mp;
75474de12b7SAnatoly Burakov 		}
75574de12b7SAnatoly Burakov 
75674de12b7SAnatoly Burakov 		if (socket_indirect_pool[socket] == NULL) {
75774de12b7SAnatoly Burakov 			RTE_LOG(INFO, IP_FRAG, "Creating indirect mempool on socket %i\n",
75874de12b7SAnatoly Burakov 					socket);
7596f41fe75SStephen Hemminger 			snprintf(buf, sizeof(buf), "pool_indirect_%i", socket);
76074de12b7SAnatoly Burakov 
761*ea0c20eaSOlivier Matz 			mp = rte_pktmbuf_pool_create(buf, NB_MBUF, 32, 0, 0,
762*ea0c20eaSOlivier Matz 				socket);
76374de12b7SAnatoly Burakov 			if (mp == NULL) {
76474de12b7SAnatoly Burakov 				RTE_LOG(ERR, IP_FRAG, "Cannot create indirect mempool\n");
76574de12b7SAnatoly Burakov 				return -1;
76674de12b7SAnatoly Burakov 			}
76774de12b7SAnatoly Burakov 			socket_indirect_pool[socket] = mp;
76874de12b7SAnatoly Burakov 		}
76974de12b7SAnatoly Burakov 
77074de12b7SAnatoly Burakov 		if (socket_lpm[socket] == NULL) {
77174de12b7SAnatoly Burakov 			RTE_LOG(INFO, IP_FRAG, "Creating LPM table on socket %i\n", socket);
7726f41fe75SStephen Hemminger 			snprintf(buf, sizeof(buf), "IP_FRAG_LPM_%i", socket);
77374de12b7SAnatoly Burakov 
77474de12b7SAnatoly Burakov 			lpm = rte_lpm_create(buf, socket, LPM_MAX_RULES, 0);
77574de12b7SAnatoly Burakov 			if (lpm == NULL) {
77674de12b7SAnatoly Burakov 				RTE_LOG(ERR, IP_FRAG, "Cannot create LPM table\n");
77774de12b7SAnatoly Burakov 				return -1;
77874de12b7SAnatoly Burakov 			}
77974de12b7SAnatoly Burakov 			socket_lpm[socket] = lpm;
78074de12b7SAnatoly Burakov 		}
78174de12b7SAnatoly Burakov 
78274de12b7SAnatoly Burakov 		if (socket_lpm6[socket] == NULL) {
78374de12b7SAnatoly Burakov 			RTE_LOG(INFO, IP_FRAG, "Creating LPM6 table on socket %i\n", socket);
7846f41fe75SStephen Hemminger 			snprintf(buf, sizeof(buf), "IP_FRAG_LPM_%i", socket);
78574de12b7SAnatoly Burakov 
78674de12b7SAnatoly Burakov 			lpm6 = rte_lpm6_create("IP_FRAG_LPM6", socket, &lpm6_config);
78774de12b7SAnatoly Burakov 			if (lpm6 == NULL) {
78874de12b7SAnatoly Burakov 				RTE_LOG(ERR, IP_FRAG, "Cannot create LPM table\n");
78974de12b7SAnatoly Burakov 				return -1;
79074de12b7SAnatoly Burakov 			}
79174de12b7SAnatoly Burakov 			socket_lpm6[socket] = lpm6;
79274de12b7SAnatoly Burakov 		}
79374de12b7SAnatoly Burakov 	}
79474de12b7SAnatoly Burakov 
79574de12b7SAnatoly Burakov 	return 0;
79674de12b7SAnatoly Burakov }
79774de12b7SAnatoly Burakov 
798e107e82eSAnatoly Burakov int
79998a16481SDavid Marchand main(int argc, char **argv)
800e107e82eSAnatoly Burakov {
801e107e82eSAnatoly Burakov 	struct lcore_queue_conf *qconf;
80281f7ecd9SPablo de Lara 	struct rte_eth_dev_info dev_info;
80381f7ecd9SPablo de Lara 	struct rte_eth_txconf *txconf;
80474de12b7SAnatoly Burakov 	struct rx_queue *rxq;
80574de12b7SAnatoly Burakov 	int socket, ret;
80674de12b7SAnatoly Burakov 	unsigned nb_ports;
807e107e82eSAnatoly Burakov 	uint16_t queueid = 0;
808e107e82eSAnatoly Burakov 	unsigned lcore_id = 0, rx_lcore_id = 0;
809e107e82eSAnatoly Burakov 	uint32_t n_tx_queue, nb_lcores;
810e107e82eSAnatoly Burakov 	uint8_t portid;
811e107e82eSAnatoly Burakov 
812e107e82eSAnatoly Burakov 	/* init EAL */
813e107e82eSAnatoly Burakov 	ret = rte_eal_init(argc, argv);
814e107e82eSAnatoly Burakov 	if (ret < 0)
815e107e82eSAnatoly Burakov 		rte_exit(EXIT_FAILURE, "rte_eal_init failed");
816e107e82eSAnatoly Burakov 	argc -= ret;
817e107e82eSAnatoly Burakov 	argv += ret;
818e107e82eSAnatoly Burakov 
819e107e82eSAnatoly Burakov 	/* parse application arguments (after the EAL ones) */
820e107e82eSAnatoly Burakov 	ret = parse_args(argc, argv);
821e107e82eSAnatoly Burakov 	if (ret < 0)
822e107e82eSAnatoly Burakov 		rte_exit(EXIT_FAILURE, "Invalid arguments");
823e107e82eSAnatoly Burakov 
824e107e82eSAnatoly Burakov 	nb_ports = rte_eth_dev_count();
825e107e82eSAnatoly Burakov 	if (nb_ports > RTE_MAX_ETHPORTS)
826e107e82eSAnatoly Burakov 		nb_ports = RTE_MAX_ETHPORTS;
82774de12b7SAnatoly Burakov 	else if (nb_ports == 0)
82874de12b7SAnatoly Burakov 		rte_exit(EXIT_FAILURE, "No ports found!\n");
829e107e82eSAnatoly Burakov 
830e107e82eSAnatoly Burakov 	nb_lcores = rte_lcore_count();
831e107e82eSAnatoly Burakov 
83274de12b7SAnatoly Burakov 	/* initialize structures (mempools, lpm etc.) */
83374de12b7SAnatoly Burakov 	if (init_mem() < 0)
83474de12b7SAnatoly Burakov 		rte_panic("Cannot initialize memory structures!\n");
83574de12b7SAnatoly Burakov 
836eaa8d3bfSAnatoly Burakov 	/* check if portmask has non-existent ports */
837eaa8d3bfSAnatoly Burakov 	if (enabled_port_mask & ~(RTE_LEN2MASK(nb_ports, unsigned)))
838eaa8d3bfSAnatoly Burakov 		rte_exit(EXIT_FAILURE, "Non-existent ports in portmask!\n");
839eaa8d3bfSAnatoly Burakov 
840e107e82eSAnatoly Burakov 	/* initialize all ports */
841e107e82eSAnatoly Burakov 	for (portid = 0; portid < nb_ports; portid++) {
842e107e82eSAnatoly Burakov 		/* skip ports that are not enabled */
843e107e82eSAnatoly Burakov 		if ((enabled_port_mask & (1 << portid)) == 0) {
844e107e82eSAnatoly Burakov 			printf("Skipping disabled port %d\n", portid);
845e107e82eSAnatoly Burakov 			continue;
846e107e82eSAnatoly Burakov 		}
847e107e82eSAnatoly Burakov 
848e107e82eSAnatoly Burakov 		qconf = &lcore_queue_conf[rx_lcore_id];
849e107e82eSAnatoly Burakov 
850e107e82eSAnatoly Burakov 		/* get the lcore_id for this port */
851e107e82eSAnatoly Burakov 		while (rte_lcore_is_enabled(rx_lcore_id) == 0 ||
852e107e82eSAnatoly Burakov 		       qconf->n_rx_queue == (unsigned)rx_queue_per_lcore) {
853e107e82eSAnatoly Burakov 
854e107e82eSAnatoly Burakov 			rx_lcore_id ++;
855e107e82eSAnatoly Burakov 			if (rx_lcore_id >= RTE_MAX_LCORE)
856e107e82eSAnatoly Burakov 				rte_exit(EXIT_FAILURE, "Not enough cores\n");
857e107e82eSAnatoly Burakov 
858e107e82eSAnatoly Burakov 			qconf = &lcore_queue_conf[rx_lcore_id];
859e107e82eSAnatoly Burakov 		}
86074de12b7SAnatoly Burakov 
861324bcf45SAnatoly Burakov 		socket = (int) rte_lcore_to_socket_id(rx_lcore_id);
86274de12b7SAnatoly Burakov 		if (socket == SOCKET_ID_ANY)
86374de12b7SAnatoly Burakov 			socket = 0;
86474de12b7SAnatoly Burakov 
86574de12b7SAnatoly Burakov 		rxq = &qconf->rx_queue_list[qconf->n_rx_queue];
86674de12b7SAnatoly Burakov 		rxq->portid = portid;
86774de12b7SAnatoly Burakov 		rxq->direct_pool = socket_direct_pool[socket];
86874de12b7SAnatoly Burakov 		rxq->indirect_pool = socket_indirect_pool[socket];
86974de12b7SAnatoly Burakov 		rxq->lpm = socket_lpm[socket];
87074de12b7SAnatoly Burakov 		rxq->lpm6 = socket_lpm6[socket];
871e107e82eSAnatoly Burakov 		qconf->n_rx_queue++;
872e107e82eSAnatoly Burakov 
873e107e82eSAnatoly Burakov 		/* init port */
874e107e82eSAnatoly Burakov 		printf("Initializing port %d on lcore %u...", portid,
875e107e82eSAnatoly Burakov 		       rx_lcore_id);
876e107e82eSAnatoly Burakov 		fflush(stdout);
877e107e82eSAnatoly Burakov 
878e107e82eSAnatoly Burakov 		n_tx_queue = nb_lcores;
879e107e82eSAnatoly Burakov 		if (n_tx_queue > MAX_TX_QUEUE_PER_PORT)
880e107e82eSAnatoly Burakov 			n_tx_queue = MAX_TX_QUEUE_PER_PORT;
881e107e82eSAnatoly Burakov 		ret = rte_eth_dev_configure(portid, 1, (uint16_t)n_tx_queue,
882e107e82eSAnatoly Burakov 					    &port_conf);
88374de12b7SAnatoly Burakov 		if (ret < 0) {
88474de12b7SAnatoly Burakov 			printf("\n");
885e107e82eSAnatoly Burakov 			rte_exit(EXIT_FAILURE, "Cannot configure device: "
886e107e82eSAnatoly Burakov 				"err=%d, port=%d\n",
887e107e82eSAnatoly Burakov 				ret, portid);
88874de12b7SAnatoly Burakov 		}
88974de12b7SAnatoly Burakov 
89074de12b7SAnatoly Burakov 		/* init one RX queue */
89174de12b7SAnatoly Burakov 		ret = rte_eth_rx_queue_setup(portid, 0, nb_rxd,
89281f7ecd9SPablo de Lara 					     socket, NULL,
89374de12b7SAnatoly Burakov 					     socket_direct_pool[socket]);
89474de12b7SAnatoly Burakov 		if (ret < 0) {
89574de12b7SAnatoly Burakov 			printf("\n");
89674de12b7SAnatoly Burakov 			rte_exit(EXIT_FAILURE, "rte_eth_rx_queue_setup: "
89774de12b7SAnatoly Burakov 				"err=%d, port=%d\n",
89874de12b7SAnatoly Burakov 				ret, portid);
89974de12b7SAnatoly Burakov 		}
900e107e82eSAnatoly Burakov 
901e107e82eSAnatoly Burakov 		rte_eth_macaddr_get(portid, &ports_eth_addr[portid]);
902e107e82eSAnatoly Burakov 		print_ethaddr(" Address:", &ports_eth_addr[portid]);
90374de12b7SAnatoly Burakov 		printf("\n");
904e107e82eSAnatoly Burakov 
905e107e82eSAnatoly Burakov 		/* init one TX queue per couple (lcore,port) */
906e107e82eSAnatoly Burakov 		queueid = 0;
907e107e82eSAnatoly Burakov 		for (lcore_id = 0; lcore_id < RTE_MAX_LCORE; lcore_id++) {
908e107e82eSAnatoly Burakov 			if (rte_lcore_is_enabled(lcore_id) == 0)
909e107e82eSAnatoly Burakov 				continue;
91074de12b7SAnatoly Burakov 
91174de12b7SAnatoly Burakov 			socket = (int) rte_lcore_to_socket_id(lcore_id);
912e107e82eSAnatoly Burakov 			printf("txq=%u,%d ", lcore_id, queueid);
913e107e82eSAnatoly Burakov 			fflush(stdout);
91481f7ecd9SPablo de Lara 
91581f7ecd9SPablo de Lara 			rte_eth_dev_info_get(portid, &dev_info);
91681f7ecd9SPablo de Lara 			txconf = &dev_info.default_txconf;
91781f7ecd9SPablo de Lara 			txconf->txq_flags = 0;
918e107e82eSAnatoly Burakov 			ret = rte_eth_tx_queue_setup(portid, queueid, nb_txd,
91981f7ecd9SPablo de Lara 						     socket, txconf);
92074de12b7SAnatoly Burakov 			if (ret < 0) {
92174de12b7SAnatoly Burakov 				printf("\n");
922e107e82eSAnatoly Burakov 				rte_exit(EXIT_FAILURE, "rte_eth_tx_queue_setup: "
923e107e82eSAnatoly Burakov 					"err=%d, port=%d\n", ret, portid);
92474de12b7SAnatoly Burakov 			}
925e107e82eSAnatoly Burakov 
926e107e82eSAnatoly Burakov 			qconf = &lcore_queue_conf[lcore_id];
927e107e82eSAnatoly Burakov 			qconf->tx_queue_id[portid] = queueid;
928e107e82eSAnatoly Burakov 			queueid++;
929e107e82eSAnatoly Burakov 		}
930e107e82eSAnatoly Burakov 
93174de12b7SAnatoly Burakov 		printf("\n");
93274de12b7SAnatoly Burakov 	}
93374de12b7SAnatoly Burakov 
93474de12b7SAnatoly Burakov 	printf("\n");
93574de12b7SAnatoly Burakov 
93674de12b7SAnatoly Burakov 	/* start ports */
93774de12b7SAnatoly Burakov 	for (portid = 0; portid < nb_ports; portid++) {
93874de12b7SAnatoly Burakov 		if ((enabled_port_mask & (1 << portid)) == 0) {
93974de12b7SAnatoly Burakov 			continue;
94074de12b7SAnatoly Burakov 		}
941e107e82eSAnatoly Burakov 		/* Start device */
942e107e82eSAnatoly Burakov 		ret = rte_eth_dev_start(portid);
943e107e82eSAnatoly Burakov 		if (ret < 0)
94474de12b7SAnatoly Burakov 			rte_exit(EXIT_FAILURE, "rte_eth_dev_start: err=%d, port=%d\n",
945e107e82eSAnatoly Burakov 				ret, portid);
946e107e82eSAnatoly Burakov 
947e107e82eSAnatoly Burakov 		rte_eth_promiscuous_enable(portid);
948e107e82eSAnatoly Burakov 	}
949e107e82eSAnatoly Burakov 
95074de12b7SAnatoly Burakov 	if (init_routing_table() < 0)
95174de12b7SAnatoly Burakov 		rte_exit(EXIT_FAILURE, "Cannot init routing table\n");
95274de12b7SAnatoly Burakov 
953e107e82eSAnatoly Burakov 	check_all_ports_link_status((uint8_t)nb_ports, enabled_port_mask);
954e107e82eSAnatoly Burakov 
955e107e82eSAnatoly Burakov 	/* launch per-lcore init on every lcore */
956e107e82eSAnatoly Burakov 	rte_eal_mp_remote_launch(main_loop, NULL, CALL_MASTER);
957e107e82eSAnatoly Burakov 	RTE_LCORE_FOREACH_SLAVE(lcore_id) {
958e107e82eSAnatoly Burakov 		if (rte_eal_wait_lcore(lcore_id) < 0)
959e107e82eSAnatoly Burakov 			return -1;
960e107e82eSAnatoly Burakov 	}
961e107e82eSAnatoly Burakov 
962e107e82eSAnatoly Burakov 	return 0;
963e107e82eSAnatoly Burakov }
964