1 /* SPDX-License-Identifier: BSD-3-Clause 2 * Copyright(C) 2020 Marvell International Ltd. 3 */ 4 5 #include <arpa/inet.h> 6 #include <errno.h> 7 #include <getopt.h> 8 #include <inttypes.h> 9 #include <signal.h> 10 #include <stdarg.h> 11 #include <stdbool.h> 12 #include <stdint.h> 13 #include <stdio.h> 14 #include <stdlib.h> 15 #include <string.h> 16 #include <sys/socket.h> 17 #include <sys/types.h> 18 #include <sys/queue.h> 19 #include <unistd.h> 20 21 #include <rte_branch_prediction.h> 22 #include <rte_common.h> 23 #include <rte_cycles.h> 24 #include <rte_eal.h> 25 #include <rte_ethdev.h> 26 #include <rte_graph_worker.h> 27 #include <rte_launch.h> 28 #include <rte_lcore.h> 29 #include <rte_log.h> 30 #include <rte_mempool.h> 31 #include <rte_node_eth_api.h> 32 #include <rte_node_ip4_api.h> 33 #include <rte_per_lcore.h> 34 #include <rte_string_fns.h> 35 #include <rte_vect.h> 36 37 #include <cmdline_parse.h> 38 #include <cmdline_parse_etheraddr.h> 39 40 /* Log type */ 41 #define RTE_LOGTYPE_L3FWD_GRAPH RTE_LOGTYPE_USER1 42 43 /* 44 * Configurable number of RX/TX ring descriptors 45 */ 46 #define RTE_TEST_RX_DESC_DEFAULT 1024 47 #define RTE_TEST_TX_DESC_DEFAULT 1024 48 49 #define MAX_TX_QUEUE_PER_PORT RTE_MAX_ETHPORTS 50 #define MAX_RX_QUEUE_PER_PORT 128 51 52 #define MAX_RX_QUEUE_PER_LCORE 16 53 54 #define MAX_LCORE_PARAMS 1024 55 56 #define NB_SOCKETS 8 57 58 /* Static global variables used within this file. */ 59 static uint16_t nb_rxd = RTE_TEST_RX_DESC_DEFAULT; 60 static uint16_t nb_txd = RTE_TEST_TX_DESC_DEFAULT; 61 62 /**< Ports set in promiscuous mode off by default. */ 63 static int promiscuous_on; 64 65 static int numa_on = 1; /**< NUMA is enabled by default. */ 66 static int per_port_pool; /**< Use separate buffer pools per port; disabled */ 67 /**< by default */ 68 69 static volatile bool force_quit; 70 71 /* Ethernet addresses of ports */ 72 static uint64_t dest_eth_addr[RTE_MAX_ETHPORTS]; 73 static struct rte_ether_addr ports_eth_addr[RTE_MAX_ETHPORTS]; 74 xmm_t val_eth[RTE_MAX_ETHPORTS]; 75 76 /* Mask of enabled ports */ 77 static uint32_t enabled_port_mask; 78 79 struct lcore_rx_queue { 80 uint16_t port_id; 81 uint8_t queue_id; 82 char node_name[RTE_NODE_NAMESIZE]; 83 }; 84 85 /* Lcore conf */ 86 struct lcore_conf { 87 uint16_t n_rx_queue; 88 struct lcore_rx_queue rx_queue_list[MAX_RX_QUEUE_PER_LCORE]; 89 90 struct rte_graph *graph; 91 char name[RTE_GRAPH_NAMESIZE]; 92 rte_graph_t graph_id; 93 } __rte_cache_aligned; 94 95 static struct lcore_conf lcore_conf[RTE_MAX_LCORE]; 96 97 struct lcore_params { 98 uint16_t port_id; 99 uint8_t queue_id; 100 uint8_t lcore_id; 101 } __rte_cache_aligned; 102 103 static struct lcore_params lcore_params_array[MAX_LCORE_PARAMS]; 104 static struct lcore_params lcore_params_array_default[] = { 105 {0, 0, 2}, {0, 1, 2}, {0, 2, 2}, {1, 0, 2}, {1, 1, 2}, 106 {1, 2, 2}, {2, 0, 2}, {3, 0, 3}, {3, 1, 3}, 107 }; 108 109 static struct lcore_params *lcore_params = lcore_params_array_default; 110 static uint16_t nb_lcore_params = RTE_DIM(lcore_params_array_default); 111 112 static struct rte_eth_conf port_conf = { 113 .rxmode = { 114 .mq_mode = ETH_MQ_RX_RSS, 115 .max_rx_pkt_len = RTE_ETHER_MAX_LEN, 116 .split_hdr_size = 0, 117 }, 118 .rx_adv_conf = { 119 .rss_conf = { 120 .rss_key = NULL, 121 .rss_hf = ETH_RSS_IP, 122 }, 123 }, 124 .txmode = { 125 .mq_mode = ETH_MQ_TX_NONE, 126 }, 127 }; 128 129 static struct rte_mempool *pktmbuf_pool[RTE_MAX_ETHPORTS][NB_SOCKETS]; 130 131 static struct rte_node_ethdev_config ethdev_conf[RTE_MAX_ETHPORTS]; 132 133 struct ipv4_l3fwd_lpm_route { 134 uint32_t ip; 135 uint8_t depth; 136 uint8_t if_out; 137 }; 138 139 #define IPV4_L3FWD_LPM_NUM_ROUTES \ 140 (sizeof(ipv4_l3fwd_lpm_route_array) / \ 141 sizeof(ipv4_l3fwd_lpm_route_array[0])) 142 /* 198.18.0.0/16 are set aside for RFC2544 benchmarking. */ 143 static struct ipv4_l3fwd_lpm_route ipv4_l3fwd_lpm_route_array[] = { 144 {RTE_IPV4(198, 18, 0, 0), 24, 0}, {RTE_IPV4(198, 18, 1, 0), 24, 1}, 145 {RTE_IPV4(198, 18, 2, 0), 24, 2}, {RTE_IPV4(198, 18, 3, 0), 24, 3}, 146 {RTE_IPV4(198, 18, 4, 0), 24, 4}, {RTE_IPV4(198, 18, 5, 0), 24, 5}, 147 {RTE_IPV4(198, 18, 6, 0), 24, 6}, {RTE_IPV4(198, 18, 7, 0), 24, 7}, 148 }; 149 150 static int 151 check_lcore_params(void) 152 { 153 uint8_t queue, lcore; 154 int socketid; 155 uint16_t i; 156 157 for (i = 0; i < nb_lcore_params; ++i) { 158 queue = lcore_params[i].queue_id; 159 if (queue >= MAX_RX_QUEUE_PER_PORT) { 160 printf("Invalid queue number: %hhu\n", queue); 161 return -1; 162 } 163 lcore = lcore_params[i].lcore_id; 164 if (!rte_lcore_is_enabled(lcore)) { 165 printf("Error: lcore %hhu is not enabled in lcore mask\n", 166 lcore); 167 return -1; 168 } 169 170 if (lcore == rte_get_master_lcore()) { 171 printf("Error: lcore %u is master lcore\n", lcore); 172 return -1; 173 } 174 socketid = rte_lcore_to_socket_id(lcore); 175 if ((socketid != 0) && (numa_on == 0)) { 176 printf("Warning: lcore %hhu is on socket %d with numa off\n", 177 lcore, socketid); 178 } 179 } 180 181 return 0; 182 } 183 184 static int 185 check_port_config(void) 186 { 187 uint16_t portid; 188 uint16_t i; 189 190 for (i = 0; i < nb_lcore_params; ++i) { 191 portid = lcore_params[i].port_id; 192 if ((enabled_port_mask & (1 << portid)) == 0) { 193 printf("Port %u is not enabled in port mask\n", portid); 194 return -1; 195 } 196 if (!rte_eth_dev_is_valid_port(portid)) { 197 printf("Port %u is not present on the board\n", portid); 198 return -1; 199 } 200 } 201 202 return 0; 203 } 204 205 static uint8_t 206 get_port_n_rx_queues(const uint16_t port) 207 { 208 int queue = -1; 209 uint16_t i; 210 211 for (i = 0; i < nb_lcore_params; ++i) { 212 if (lcore_params[i].port_id == port) { 213 if (lcore_params[i].queue_id == queue + 1) 214 queue = lcore_params[i].queue_id; 215 else 216 rte_exit(EXIT_FAILURE, 217 "Queue ids of the port %d must be" 218 " in sequence and must start with 0\n", 219 lcore_params[i].port_id); 220 } 221 } 222 223 return (uint8_t)(++queue); 224 } 225 226 static int 227 init_lcore_rx_queues(void) 228 { 229 uint16_t i, nb_rx_queue; 230 uint8_t lcore; 231 232 for (i = 0; i < nb_lcore_params; ++i) { 233 lcore = lcore_params[i].lcore_id; 234 nb_rx_queue = lcore_conf[lcore].n_rx_queue; 235 if (nb_rx_queue >= MAX_RX_QUEUE_PER_LCORE) { 236 printf("Error: too many queues (%u) for lcore: %u\n", 237 (unsigned int)nb_rx_queue + 1, 238 (unsigned int)lcore); 239 return -1; 240 } 241 242 lcore_conf[lcore].rx_queue_list[nb_rx_queue].port_id = 243 lcore_params[i].port_id; 244 lcore_conf[lcore].rx_queue_list[nb_rx_queue].queue_id = 245 lcore_params[i].queue_id; 246 lcore_conf[lcore].n_rx_queue++; 247 } 248 249 return 0; 250 } 251 252 /* Display usage */ 253 static void 254 print_usage(const char *prgname) 255 { 256 fprintf(stderr, 257 "%s [EAL options] --" 258 " -p PORTMASK" 259 " [-P]" 260 " --config (port,queue,lcore)[,(port,queue,lcore)]" 261 " [--eth-dest=X,MM:MM:MM:MM:MM:MM]" 262 " [--enable-jumbo [--max-pkt-len PKTLEN]]" 263 " [--no-numa]" 264 " [--per-port-pool]\n\n" 265 266 " -p PORTMASK: Hexadecimal bitmask of ports to configure\n" 267 " -P : Enable promiscuous mode\n" 268 " --config (port,queue,lcore): Rx queue configuration\n" 269 " --eth-dest=X,MM:MM:MM:MM:MM:MM: Ethernet destination for " 270 "port X\n" 271 " --enable-jumbo: Enable jumbo frames\n" 272 " --max-pkt-len: Under the premise of enabling jumbo,\n" 273 " maximum packet length in decimal (64-9600)\n" 274 " --no-numa: Disable numa awareness\n" 275 " --per-port-pool: Use separate buffer pool per port\n\n", 276 prgname); 277 } 278 279 static int 280 parse_max_pkt_len(const char *pktlen) 281 { 282 unsigned long len; 283 char *end = NULL; 284 285 /* Parse decimal string */ 286 len = strtoul(pktlen, &end, 10); 287 if ((pktlen[0] == '\0') || (end == NULL) || (*end != '\0')) 288 return -1; 289 290 if (len == 0) 291 return -1; 292 293 return len; 294 } 295 296 static int 297 parse_portmask(const char *portmask) 298 { 299 char *end = NULL; 300 unsigned long pm; 301 302 /* Parse hexadecimal string */ 303 pm = strtoul(portmask, &end, 16); 304 if ((portmask[0] == '\0') || (end == NULL) || (*end != '\0')) 305 return -1; 306 307 if (pm == 0) 308 return -1; 309 310 return pm; 311 } 312 313 static int 314 parse_config(const char *q_arg) 315 { 316 enum fieldnames { FLD_PORT = 0, FLD_QUEUE, FLD_LCORE, _NUM_FLD }; 317 unsigned long int_fld[_NUM_FLD]; 318 const char *p, *p0 = q_arg; 319 char *str_fld[_NUM_FLD]; 320 uint32_t size; 321 char s[256]; 322 char *end; 323 int i; 324 325 nb_lcore_params = 0; 326 327 while ((p = strchr(p0, '(')) != NULL) { 328 ++p; 329 p0 = strchr(p, ')'); 330 if (p0 == NULL) 331 return -1; 332 333 size = p0 - p; 334 if (size >= sizeof(s)) 335 return -1; 336 337 memcpy(s, p, size); 338 s[size] = '\0'; 339 if (rte_strsplit(s, sizeof(s), str_fld, _NUM_FLD, ',') != 340 _NUM_FLD) 341 return -1; 342 for (i = 0; i < _NUM_FLD; i++) { 343 errno = 0; 344 int_fld[i] = strtoul(str_fld[i], &end, 0); 345 if (errno != 0 || end == str_fld[i]) 346 return -1; 347 } 348 349 if (nb_lcore_params >= MAX_LCORE_PARAMS) { 350 printf("Exceeded max number of lcore params: %hu\n", 351 nb_lcore_params); 352 return -1; 353 } 354 355 if (int_fld[FLD_PORT] >= RTE_MAX_ETHPORTS || 356 int_fld[FLD_LCORE] >= RTE_MAX_LCORE) { 357 printf("Invalid port/lcore id\n"); 358 return -1; 359 } 360 361 lcore_params_array[nb_lcore_params].port_id = 362 (uint8_t)int_fld[FLD_PORT]; 363 lcore_params_array[nb_lcore_params].queue_id = 364 (uint8_t)int_fld[FLD_QUEUE]; 365 lcore_params_array[nb_lcore_params].lcore_id = 366 (uint8_t)int_fld[FLD_LCORE]; 367 ++nb_lcore_params; 368 } 369 lcore_params = lcore_params_array; 370 371 return 0; 372 } 373 374 static void 375 parse_eth_dest(const char *optarg) 376 { 377 uint8_t c, *dest, peer_addr[6]; 378 uint16_t portid; 379 char *port_end; 380 381 errno = 0; 382 portid = strtoul(optarg, &port_end, 10); 383 if (errno != 0 || port_end == optarg || *port_end++ != ',') 384 rte_exit(EXIT_FAILURE, "Invalid eth-dest: %s", optarg); 385 if (portid >= RTE_MAX_ETHPORTS) 386 rte_exit(EXIT_FAILURE, 387 "eth-dest: port %d >= RTE_MAX_ETHPORTS(%d)\n", portid, 388 RTE_MAX_ETHPORTS); 389 390 if (cmdline_parse_etheraddr(NULL, port_end, &peer_addr, 391 sizeof(peer_addr)) < 0) 392 rte_exit(EXIT_FAILURE, "Invalid ethernet address: %s\n", 393 port_end); 394 dest = (uint8_t *)&dest_eth_addr[portid]; 395 for (c = 0; c < 6; c++) 396 dest[c] = peer_addr[c]; 397 *(uint64_t *)(val_eth + portid) = dest_eth_addr[portid]; 398 } 399 400 #define MAX_JUMBO_PKT_LEN 9600 401 #define MEMPOOL_CACHE_SIZE 256 402 403 static const char short_options[] = "p:" /* portmask */ 404 "P" /* promiscuous */ 405 ; 406 407 #define CMD_LINE_OPT_CONFIG "config" 408 #define CMD_LINE_OPT_ETH_DEST "eth-dest" 409 #define CMD_LINE_OPT_NO_NUMA "no-numa" 410 #define CMD_LINE_OPT_ENABLE_JUMBO "enable-jumbo" 411 #define CMD_LINE_OPT_PER_PORT_POOL "per-port-pool" 412 enum { 413 /* Long options mapped to a short option */ 414 415 /* First long only option value must be >= 256, so that we won't 416 * conflict with short options 417 */ 418 CMD_LINE_OPT_MIN_NUM = 256, 419 CMD_LINE_OPT_CONFIG_NUM, 420 CMD_LINE_OPT_ETH_DEST_NUM, 421 CMD_LINE_OPT_NO_NUMA_NUM, 422 CMD_LINE_OPT_ENABLE_JUMBO_NUM, 423 CMD_LINE_OPT_PARSE_PER_PORT_POOL, 424 }; 425 426 static const struct option lgopts[] = { 427 {CMD_LINE_OPT_CONFIG, 1, 0, CMD_LINE_OPT_CONFIG_NUM}, 428 {CMD_LINE_OPT_ETH_DEST, 1, 0, CMD_LINE_OPT_ETH_DEST_NUM}, 429 {CMD_LINE_OPT_NO_NUMA, 0, 0, CMD_LINE_OPT_NO_NUMA_NUM}, 430 {CMD_LINE_OPT_ENABLE_JUMBO, 0, 0, CMD_LINE_OPT_ENABLE_JUMBO_NUM}, 431 {CMD_LINE_OPT_PER_PORT_POOL, 0, 0, CMD_LINE_OPT_PARSE_PER_PORT_POOL}, 432 {NULL, 0, 0, 0}, 433 }; 434 435 /* 436 * This expression is used to calculate the number of mbufs needed 437 * depending on user input, taking into account memory for rx and 438 * tx hardware rings, cache per lcore and mtable per port per lcore. 439 * RTE_MAX is used to ensure that NB_MBUF never goes below a minimum 440 * value of 8192 441 */ 442 #define NB_MBUF(nports) \ 443 RTE_MAX((nports * nb_rx_queue * nb_rxd + \ 444 nports * nb_lcores * RTE_GRAPH_BURST_SIZE + \ 445 nports * n_tx_queue * nb_txd + \ 446 nb_lcores * MEMPOOL_CACHE_SIZE), 8192u) 447 448 /* Parse the argument given in the command line of the application */ 449 static int 450 parse_args(int argc, char **argv) 451 { 452 char *prgname = argv[0]; 453 int option_index; 454 char **argvopt; 455 int opt, ret; 456 457 argvopt = argv; 458 459 /* Error or normal output strings. */ 460 while ((opt = getopt_long(argc, argvopt, short_options, lgopts, 461 &option_index)) != EOF) { 462 463 switch (opt) { 464 /* Portmask */ 465 case 'p': 466 enabled_port_mask = parse_portmask(optarg); 467 if (enabled_port_mask == 0) { 468 fprintf(stderr, "Invalid portmask\n"); 469 print_usage(prgname); 470 return -1; 471 } 472 break; 473 474 case 'P': 475 promiscuous_on = 1; 476 break; 477 478 /* Long options */ 479 case CMD_LINE_OPT_CONFIG_NUM: 480 ret = parse_config(optarg); 481 if (ret) { 482 fprintf(stderr, "Invalid config\n"); 483 print_usage(prgname); 484 return -1; 485 } 486 break; 487 488 case CMD_LINE_OPT_ETH_DEST_NUM: 489 parse_eth_dest(optarg); 490 break; 491 492 case CMD_LINE_OPT_NO_NUMA_NUM: 493 numa_on = 0; 494 break; 495 496 case CMD_LINE_OPT_ENABLE_JUMBO_NUM: { 497 const struct option lenopts = {"max-pkt-len", 498 required_argument, 0, 0}; 499 500 port_conf.rxmode.offloads |= DEV_RX_OFFLOAD_JUMBO_FRAME; 501 port_conf.txmode.offloads |= DEV_TX_OFFLOAD_MULTI_SEGS; 502 503 /* 504 * if no max-pkt-len set, use the default 505 * value RTE_ETHER_MAX_LEN. 506 */ 507 if (getopt_long(argc, argvopt, "", &lenopts, 508 &option_index) == 0) { 509 ret = parse_max_pkt_len(optarg); 510 if (ret < 64 || ret > MAX_JUMBO_PKT_LEN) { 511 fprintf(stderr, "Invalid maximum " 512 "packet length\n"); 513 print_usage(prgname); 514 return -1; 515 } 516 port_conf.rxmode.max_rx_pkt_len = ret; 517 } 518 break; 519 } 520 521 case CMD_LINE_OPT_PARSE_PER_PORT_POOL: 522 printf("Per port buffer pool is enabled\n"); 523 per_port_pool = 1; 524 break; 525 526 default: 527 print_usage(prgname); 528 return -1; 529 } 530 } 531 532 if (optind >= 0) 533 argv[optind - 1] = prgname; 534 ret = optind - 1; 535 optind = 1; /* Reset getopt lib */ 536 537 return ret; 538 } 539 540 static void 541 print_ethaddr(const char *name, const struct rte_ether_addr *eth_addr) 542 { 543 char buf[RTE_ETHER_ADDR_FMT_SIZE]; 544 rte_ether_format_addr(buf, RTE_ETHER_ADDR_FMT_SIZE, eth_addr); 545 printf("%s%s", name, buf); 546 } 547 548 static int 549 init_mem(uint16_t portid, uint32_t nb_mbuf) 550 { 551 uint32_t lcore_id; 552 int socketid; 553 char s[64]; 554 555 for (lcore_id = 0; lcore_id < RTE_MAX_LCORE; lcore_id++) { 556 if (rte_lcore_is_enabled(lcore_id) == 0) 557 continue; 558 559 if (numa_on) 560 socketid = rte_lcore_to_socket_id(lcore_id); 561 else 562 socketid = 0; 563 564 if (socketid >= NB_SOCKETS) { 565 rte_exit(EXIT_FAILURE, 566 "Socket %d of lcore %u is out of range %d\n", 567 socketid, lcore_id, NB_SOCKETS); 568 } 569 570 if (pktmbuf_pool[portid][socketid] == NULL) { 571 snprintf(s, sizeof(s), "mbuf_pool_%d:%d", portid, 572 socketid); 573 /* Create a pool with priv size of a cacheline */ 574 pktmbuf_pool[portid][socketid] = 575 rte_pktmbuf_pool_create( 576 s, nb_mbuf, MEMPOOL_CACHE_SIZE, 577 RTE_CACHE_LINE_SIZE, 578 RTE_MBUF_DEFAULT_BUF_SIZE, socketid); 579 if (pktmbuf_pool[portid][socketid] == NULL) 580 rte_exit(EXIT_FAILURE, 581 "Cannot init mbuf pool on socket %d\n", 582 socketid); 583 else 584 printf("Allocated mbuf pool on socket %d\n", 585 socketid); 586 } 587 } 588 589 return 0; 590 } 591 592 /* Check the link status of all ports in up to 9s, and print them finally */ 593 static void 594 check_all_ports_link_status(uint32_t port_mask) 595 { 596 #define CHECK_INTERVAL 100 /* 100ms */ 597 #define MAX_CHECK_TIME 90 /* 9s (90 * 100ms) in total */ 598 uint8_t count, all_ports_up, print_flag = 0; 599 struct rte_eth_link link; 600 uint16_t portid; 601 602 printf("\nChecking link status"); 603 fflush(stdout); 604 for (count = 0; count <= MAX_CHECK_TIME; count++) { 605 if (force_quit) 606 return; 607 all_ports_up = 1; 608 RTE_ETH_FOREACH_DEV(portid) 609 { 610 if (force_quit) 611 return; 612 if ((port_mask & (1 << portid)) == 0) 613 continue; 614 memset(&link, 0, sizeof(link)); 615 rte_eth_link_get_nowait(portid, &link); 616 /* Print link status if flag set */ 617 if (print_flag == 1) { 618 if (link.link_status) 619 printf("Port%d Link Up. Speed %u Mbps " 620 "-%s\n", 621 portid, link.link_speed, 622 (link.link_duplex == 623 ETH_LINK_FULL_DUPLEX) 624 ? ("full-duplex") 625 : ("half-duplex\n")); 626 else 627 printf("Port %d Link Down\n", portid); 628 continue; 629 } 630 /* Clear all_ports_up flag if any link down */ 631 if (link.link_status == ETH_LINK_DOWN) { 632 all_ports_up = 0; 633 break; 634 } 635 } 636 /* After finally printing all link status, get out */ 637 if (print_flag == 1) 638 break; 639 640 if (all_ports_up == 0) { 641 printf("."); 642 fflush(stdout); 643 rte_delay_ms(CHECK_INTERVAL); 644 } 645 646 /* Set the print_flag if all ports up or timeout */ 647 if (all_ports_up == 1 || count == (MAX_CHECK_TIME - 1)) { 648 print_flag = 1; 649 printf("Done\n"); 650 } 651 } 652 } 653 654 static void 655 signal_handler(int signum) 656 { 657 if (signum == SIGINT || signum == SIGTERM) { 658 printf("\n\nSignal %d received, preparing to exit...\n", 659 signum); 660 force_quit = true; 661 } 662 } 663 664 static void 665 print_stats(void) 666 { 667 const char topLeft[] = {27, '[', '1', ';', '1', 'H', '\0'}; 668 const char clr[] = {27, '[', '2', 'J', '\0'}; 669 struct rte_graph_cluster_stats_param s_param; 670 struct rte_graph_cluster_stats *stats; 671 const char *pattern = "worker_*"; 672 673 /* Prepare stats object */ 674 memset(&s_param, 0, sizeof(s_param)); 675 s_param.f = stdout; 676 s_param.socket_id = SOCKET_ID_ANY; 677 s_param.graph_patterns = &pattern; 678 s_param.nb_graph_patterns = 1; 679 680 stats = rte_graph_cluster_stats_create(&s_param); 681 if (stats == NULL) 682 rte_exit(EXIT_FAILURE, "Unable to create stats object\n"); 683 684 while (!force_quit) { 685 /* Clear screen and move to top left */ 686 printf("%s%s", clr, topLeft); 687 rte_graph_cluster_stats_get(stats, 0); 688 rte_delay_ms(1E3); 689 } 690 691 rte_graph_cluster_stats_destroy(stats); 692 } 693 694 /* Main processing loop */ 695 static int 696 graph_main_loop(void *conf) 697 { 698 struct lcore_conf *qconf; 699 struct rte_graph *graph; 700 uint32_t lcore_id; 701 702 RTE_SET_USED(conf); 703 704 lcore_id = rte_lcore_id(); 705 qconf = &lcore_conf[lcore_id]; 706 graph = qconf->graph; 707 708 if (!graph) { 709 RTE_LOG(INFO, L3FWD_GRAPH, "Lcore %u has nothing to do\n", 710 lcore_id); 711 return 0; 712 } 713 714 RTE_LOG(INFO, L3FWD_GRAPH, 715 "Entering main loop on lcore %u, graph %s(%p)\n", lcore_id, 716 qconf->name, graph); 717 718 while (likely(!force_quit)) 719 rte_graph_walk(graph); 720 721 return 0; 722 } 723 724 int 725 main(int argc, char **argv) 726 { 727 /* Rewrite data of src and dst ether addr */ 728 uint8_t rewrite_data[2 * sizeof(struct rte_ether_addr)]; 729 static const char * const default_patterns[] = { 730 "ip4*", 731 "ethdev_tx-*", 732 "pkt_drop", 733 }; 734 uint8_t nb_rx_queue, queue, socketid; 735 struct rte_graph_param graph_conf; 736 struct rte_eth_dev_info dev_info; 737 uint32_t nb_ports, nb_conf = 0; 738 uint32_t n_tx_queue, nb_lcores; 739 struct rte_eth_txconf *txconf; 740 uint16_t queueid, portid, i; 741 const char **node_patterns; 742 struct lcore_conf *qconf; 743 uint16_t nb_graphs = 0; 744 uint16_t nb_patterns; 745 uint8_t rewrite_len; 746 uint32_t lcore_id; 747 int ret; 748 749 /* Init EAL */ 750 ret = rte_eal_init(argc, argv); 751 if (ret < 0) 752 rte_exit(EXIT_FAILURE, "Invalid EAL parameters\n"); 753 argc -= ret; 754 argv += ret; 755 756 force_quit = false; 757 signal(SIGINT, signal_handler); 758 signal(SIGTERM, signal_handler); 759 760 /* Pre-init dst MACs for all ports to 02:00:00:00:00:xx */ 761 for (portid = 0; portid < RTE_MAX_ETHPORTS; portid++) { 762 dest_eth_addr[portid] = 763 RTE_ETHER_LOCAL_ADMIN_ADDR + ((uint64_t)portid << 40); 764 *(uint64_t *)(val_eth + portid) = dest_eth_addr[portid]; 765 } 766 767 /* Parse application arguments (after the EAL ones) */ 768 ret = parse_args(argc, argv); 769 if (ret < 0) 770 rte_exit(EXIT_FAILURE, "Invalid L3FWD_GRAPH parameters\n"); 771 772 if (check_lcore_params() < 0) 773 rte_exit(EXIT_FAILURE, "check_lcore_params() failed\n"); 774 775 ret = init_lcore_rx_queues(); 776 if (ret < 0) 777 rte_exit(EXIT_FAILURE, "init_lcore_rx_queues() failed\n"); 778 779 if (check_port_config() < 0) 780 rte_exit(EXIT_FAILURE, "check_port_config() failed\n"); 781 782 nb_ports = rte_eth_dev_count_avail(); 783 nb_lcores = rte_lcore_count(); 784 785 /* Initialize all ports */ 786 RTE_ETH_FOREACH_DEV(portid) 787 { 788 struct rte_eth_conf local_port_conf = port_conf; 789 790 /* Skip ports that are not enabled */ 791 if ((enabled_port_mask & (1 << portid)) == 0) { 792 printf("\nSkipping disabled port %d\n", portid); 793 continue; 794 } 795 796 /* Init port */ 797 printf("Initializing port %d ... ", portid); 798 fflush(stdout); 799 800 nb_rx_queue = get_port_n_rx_queues(portid); 801 n_tx_queue = nb_lcores; 802 if (n_tx_queue > MAX_TX_QUEUE_PER_PORT) 803 n_tx_queue = MAX_TX_QUEUE_PER_PORT; 804 printf("Creating queues: nb_rxq=%d nb_txq=%u... ", 805 nb_rx_queue, n_tx_queue); 806 807 rte_eth_dev_info_get(portid, &dev_info); 808 if (dev_info.tx_offload_capa & DEV_TX_OFFLOAD_MBUF_FAST_FREE) 809 local_port_conf.txmode.offloads |= 810 DEV_TX_OFFLOAD_MBUF_FAST_FREE; 811 812 local_port_conf.rx_adv_conf.rss_conf.rss_hf &= 813 dev_info.flow_type_rss_offloads; 814 if (local_port_conf.rx_adv_conf.rss_conf.rss_hf != 815 port_conf.rx_adv_conf.rss_conf.rss_hf) { 816 printf("Port %u modified RSS hash function based on " 817 "hardware support," 818 "requested:%#" PRIx64 " configured:%#" PRIx64 819 "\n", 820 portid, port_conf.rx_adv_conf.rss_conf.rss_hf, 821 local_port_conf.rx_adv_conf.rss_conf.rss_hf); 822 } 823 824 ret = rte_eth_dev_configure(portid, nb_rx_queue, 825 n_tx_queue, &local_port_conf); 826 if (ret < 0) 827 rte_exit(EXIT_FAILURE, 828 "Cannot configure device: err=%d, port=%d\n", 829 ret, portid); 830 831 ret = rte_eth_dev_adjust_nb_rx_tx_desc(portid, &nb_rxd, 832 &nb_txd); 833 if (ret < 0) 834 rte_exit(EXIT_FAILURE, 835 "Cannot adjust number of descriptors: err=%d, " 836 "port=%d\n", 837 ret, portid); 838 839 rte_eth_macaddr_get(portid, &ports_eth_addr[portid]); 840 print_ethaddr(" Address:", &ports_eth_addr[portid]); 841 printf(", "); 842 print_ethaddr( 843 "Destination:", 844 (const struct rte_ether_addr *)&dest_eth_addr[portid]); 845 printf(", "); 846 847 /* 848 * prepare src MACs for each port. 849 */ 850 rte_ether_addr_copy( 851 &ports_eth_addr[portid], 852 (struct rte_ether_addr *)(val_eth + portid) + 1); 853 854 /* Init memory */ 855 if (!per_port_pool) { 856 /* portid = 0; this is *not* signifying the first port, 857 * rather, it signifies that portid is ignored. 858 */ 859 ret = init_mem(0, NB_MBUF(nb_ports)); 860 } else { 861 ret = init_mem(portid, NB_MBUF(1)); 862 } 863 if (ret < 0) 864 rte_exit(EXIT_FAILURE, "init_mem() failed\n"); 865 866 /* Init one TX queue per couple (lcore,port) */ 867 queueid = 0; 868 for (lcore_id = 0; lcore_id < RTE_MAX_LCORE; lcore_id++) { 869 if (rte_lcore_is_enabled(lcore_id) == 0) 870 continue; 871 872 qconf = &lcore_conf[lcore_id]; 873 874 if (numa_on) 875 socketid = (uint8_t)rte_lcore_to_socket_id( 876 lcore_id); 877 else 878 socketid = 0; 879 880 printf("txq=%u,%d,%d ", lcore_id, queueid, socketid); 881 fflush(stdout); 882 883 txconf = &dev_info.default_txconf; 884 txconf->offloads = local_port_conf.txmode.offloads; 885 ret = rte_eth_tx_queue_setup(portid, queueid, nb_txd, 886 socketid, txconf); 887 if (ret < 0) 888 rte_exit(EXIT_FAILURE, 889 "rte_eth_tx_queue_setup: err=%d, " 890 "port=%d\n", 891 ret, portid); 892 queueid++; 893 } 894 895 /* Setup ethdev node config */ 896 ethdev_conf[nb_conf].port_id = portid; 897 ethdev_conf[nb_conf].num_rx_queues = nb_rx_queue; 898 ethdev_conf[nb_conf].num_tx_queues = n_tx_queue; 899 if (!per_port_pool) 900 ethdev_conf[nb_conf].mp = pktmbuf_pool[0]; 901 902 else 903 ethdev_conf[nb_conf].mp = pktmbuf_pool[portid]; 904 ethdev_conf[nb_conf].mp_count = NB_SOCKETS; 905 906 nb_conf++; 907 printf("\n"); 908 } 909 910 for (lcore_id = 0; lcore_id < RTE_MAX_LCORE; lcore_id++) { 911 if (rte_lcore_is_enabled(lcore_id) == 0) 912 continue; 913 qconf = &lcore_conf[lcore_id]; 914 printf("\nInitializing rx queues on lcore %u ... ", lcore_id); 915 fflush(stdout); 916 /* Init RX queues */ 917 for (queue = 0; queue < qconf->n_rx_queue; ++queue) { 918 struct rte_eth_rxconf rxq_conf; 919 920 portid = qconf->rx_queue_list[queue].port_id; 921 queueid = qconf->rx_queue_list[queue].queue_id; 922 923 if (numa_on) 924 socketid = (uint8_t)rte_lcore_to_socket_id( 925 lcore_id); 926 else 927 socketid = 0; 928 929 printf("rxq=%d,%d,%d ", portid, queueid, socketid); 930 fflush(stdout); 931 932 rte_eth_dev_info_get(portid, &dev_info); 933 rxq_conf = dev_info.default_rxconf; 934 rxq_conf.offloads = port_conf.rxmode.offloads; 935 if (!per_port_pool) 936 ret = rte_eth_rx_queue_setup( 937 portid, queueid, nb_rxd, socketid, 938 &rxq_conf, pktmbuf_pool[0][socketid]); 939 else 940 ret = rte_eth_rx_queue_setup( 941 portid, queueid, nb_rxd, socketid, 942 &rxq_conf, 943 pktmbuf_pool[portid][socketid]); 944 if (ret < 0) 945 rte_exit(EXIT_FAILURE, 946 "rte_eth_rx_queue_setup: err=%d, " 947 "port=%d\n", 948 ret, portid); 949 950 /* Add this queue node to its graph */ 951 snprintf(qconf->rx_queue_list[queue].node_name, 952 RTE_NODE_NAMESIZE, "ethdev_rx-%u-%u", portid, 953 queueid); 954 } 955 956 /* Alloc a graph to this lcore only if source exists */ 957 if (qconf->n_rx_queue) 958 nb_graphs++; 959 } 960 961 printf("\n"); 962 963 /* Ethdev node config, skip rx queue mapping */ 964 ret = rte_node_eth_config(ethdev_conf, nb_conf, nb_graphs); 965 if (ret) 966 rte_exit(EXIT_FAILURE, "rte_node_eth_config: err=%d\n", ret); 967 968 /* Start ports */ 969 RTE_ETH_FOREACH_DEV(portid) 970 { 971 if ((enabled_port_mask & (1 << portid)) == 0) 972 continue; 973 974 /* Start device */ 975 ret = rte_eth_dev_start(portid); 976 if (ret < 0) 977 rte_exit(EXIT_FAILURE, 978 "rte_eth_dev_start: err=%d, port=%d\n", ret, 979 portid); 980 981 /* 982 * If enabled, put device in promiscuous mode. 983 * This allows IO forwarding mode to forward packets 984 * to itself through 2 cross-connected ports of the 985 * target machine. 986 */ 987 if (promiscuous_on) 988 rte_eth_promiscuous_enable(portid); 989 } 990 991 printf("\n"); 992 993 check_all_ports_link_status(enabled_port_mask); 994 995 /* Graph Initialization */ 996 nb_patterns = RTE_DIM(default_patterns); 997 node_patterns = malloc((MAX_RX_QUEUE_PER_LCORE + nb_patterns) * 998 sizeof(*node_patterns)); 999 if (!node_patterns) 1000 return -ENOMEM; 1001 memcpy(node_patterns, default_patterns, 1002 nb_patterns * sizeof(*node_patterns)); 1003 1004 memset(&graph_conf, 0, sizeof(graph_conf)); 1005 graph_conf.node_patterns = node_patterns; 1006 1007 for (lcore_id = 0; lcore_id < RTE_MAX_LCORE; lcore_id++) { 1008 rte_graph_t graph_id; 1009 rte_edge_t i; 1010 1011 if (rte_lcore_is_enabled(lcore_id) == 0) 1012 continue; 1013 1014 qconf = &lcore_conf[lcore_id]; 1015 1016 /* Skip graph creation if no source exists */ 1017 if (!qconf->n_rx_queue) 1018 continue; 1019 1020 /* Add rx node patterns of this lcore */ 1021 for (i = 0; i < qconf->n_rx_queue; i++) { 1022 graph_conf.node_patterns[nb_patterns + i] = 1023 qconf->rx_queue_list[i].node_name; 1024 } 1025 1026 graph_conf.nb_node_patterns = nb_patterns + i; 1027 graph_conf.socket_id = rte_lcore_to_socket_id(lcore_id); 1028 1029 snprintf(qconf->name, sizeof(qconf->name), "worker_%u", 1030 lcore_id); 1031 1032 graph_id = rte_graph_create(qconf->name, &graph_conf); 1033 if (graph_id == RTE_GRAPH_ID_INVALID) 1034 rte_exit(EXIT_FAILURE, 1035 "rte_graph_create(): graph_id invalid" 1036 " for lcore %u\n", lcore_id); 1037 1038 qconf->graph_id = graph_id; 1039 qconf->graph = rte_graph_lookup(qconf->name); 1040 if (!qconf->graph) 1041 rte_exit(EXIT_FAILURE, 1042 "rte_graph_lookup(): graph %s not found\n", 1043 qconf->name); 1044 } 1045 1046 memset(&rewrite_data, 0, sizeof(rewrite_data)); 1047 rewrite_len = sizeof(rewrite_data); 1048 1049 /* Add route to ip4 graph infra */ 1050 for (i = 0; i < IPV4_L3FWD_LPM_NUM_ROUTES; i++) { 1051 char route_str[INET6_ADDRSTRLEN * 4]; 1052 char abuf[INET6_ADDRSTRLEN]; 1053 struct in_addr in; 1054 uint32_t dst_port; 1055 1056 /* Skip unused ports */ 1057 if ((1 << ipv4_l3fwd_lpm_route_array[i].if_out & 1058 enabled_port_mask) == 0) 1059 continue; 1060 1061 dst_port = ipv4_l3fwd_lpm_route_array[i].if_out; 1062 1063 in.s_addr = htonl(ipv4_l3fwd_lpm_route_array[i].ip); 1064 snprintf(route_str, sizeof(route_str), "%s / %d (%d)", 1065 inet_ntop(AF_INET, &in, abuf, sizeof(abuf)), 1066 ipv4_l3fwd_lpm_route_array[i].depth, 1067 ipv4_l3fwd_lpm_route_array[i].if_out); 1068 1069 /* Use route index 'i' as next hop id */ 1070 ret = rte_node_ip4_route_add( 1071 ipv4_l3fwd_lpm_route_array[i].ip, 1072 ipv4_l3fwd_lpm_route_array[i].depth, i, 1073 RTE_NODE_IP4_LOOKUP_NEXT_REWRITE); 1074 1075 if (ret < 0) 1076 rte_exit(EXIT_FAILURE, 1077 "Unable to add ip4 route %s to graph\n", 1078 route_str); 1079 1080 memcpy(rewrite_data, val_eth + dst_port, rewrite_len); 1081 1082 /* Add next hop rewrite data for id 'i' */ 1083 ret = rte_node_ip4_rewrite_add(i, rewrite_data, 1084 rewrite_len, dst_port); 1085 if (ret < 0) 1086 rte_exit(EXIT_FAILURE, 1087 "Unable to add next hop %u for " 1088 "route %s\n", i, route_str); 1089 1090 RTE_LOG(INFO, L3FWD_GRAPH, "Added route %s, next_hop %u\n", 1091 route_str, i); 1092 } 1093 1094 /* Launch per-lcore init on every slave lcore */ 1095 rte_eal_mp_remote_launch(graph_main_loop, NULL, SKIP_MASTER); 1096 1097 /* Accumulate and print stats on master until exit */ 1098 if (rte_graph_has_stats_feature()) 1099 print_stats(); 1100 1101 /* Wait for slave cores to exit */ 1102 ret = 0; 1103 RTE_LCORE_FOREACH_SLAVE(lcore_id) { 1104 ret = rte_eal_wait_lcore(lcore_id); 1105 /* Destroy graph */ 1106 if (ret < 0 || rte_graph_destroy( 1107 rte_graph_from_name(lcore_conf[lcore_id].name))) { 1108 ret = -1; 1109 break; 1110 } 1111 } 1112 free(node_patterns); 1113 1114 /* Stop ports */ 1115 RTE_ETH_FOREACH_DEV(portid) { 1116 if ((enabled_port_mask & (1 << portid)) == 0) 1117 continue; 1118 printf("Closing port %d...", portid); 1119 rte_eth_dev_stop(portid); 1120 rte_eth_dev_close(portid); 1121 printf(" Done\n"); 1122 } 1123 printf("Bye...\n"); 1124 1125 return ret; 1126 } 1127