1 /* SPDX-License-Identifier: BSD-3-Clause 2 * Copyright(c) 2010-2017 Intel Corporation 3 */ 4 5 #include <stdarg.h> 6 #include <stdio.h> 7 #include <stdlib.h> 8 #include <signal.h> 9 #include <string.h> 10 #include <time.h> 11 #include <fcntl.h> 12 #ifndef RTE_EXEC_ENV_WINDOWS 13 #include <sys/mman.h> 14 #endif 15 #include <sys/types.h> 16 #include <errno.h> 17 #include <stdbool.h> 18 19 #include <sys/queue.h> 20 #include <sys/stat.h> 21 22 #include <stdint.h> 23 #include <unistd.h> 24 #include <inttypes.h> 25 26 #include <rte_common.h> 27 #include <rte_errno.h> 28 #include <rte_byteorder.h> 29 #include <rte_log.h> 30 #include <rte_debug.h> 31 #include <rte_cycles.h> 32 #include <rte_memory.h> 33 #include <rte_memcpy.h> 34 #include <rte_launch.h> 35 #include <rte_eal.h> 36 #include <rte_alarm.h> 37 #include <rte_per_lcore.h> 38 #include <rte_lcore.h> 39 #include <rte_branch_prediction.h> 40 #include <rte_mempool.h> 41 #include <rte_malloc.h> 42 #include <rte_mbuf.h> 43 #include <rte_mbuf_pool_ops.h> 44 #include <rte_interrupts.h> 45 #include <rte_pci.h> 46 #include <rte_ether.h> 47 #include <rte_ethdev.h> 48 #include <rte_dev.h> 49 #include <rte_string_fns.h> 50 #ifdef RTE_NET_IXGBE 51 #include <rte_pmd_ixgbe.h> 52 #endif 53 #ifdef RTE_LIB_PDUMP 54 #include <rte_pdump.h> 55 #endif 56 #include <rte_flow.h> 57 #ifdef RTE_LIB_METRICS 58 #include <rte_metrics.h> 59 #endif 60 #ifdef RTE_LIB_BITRATESTATS 61 #include <rte_bitrate.h> 62 #endif 63 #ifdef RTE_LIB_LATENCYSTATS 64 #include <rte_latencystats.h> 65 #endif 66 #ifdef RTE_EXEC_ENV_WINDOWS 67 #include <process.h> 68 #endif 69 #ifdef RTE_NET_BOND 70 #include <rte_eth_bond.h> 71 #endif 72 73 #include "testpmd.h" 74 75 #ifndef MAP_HUGETLB 76 /* FreeBSD may not have MAP_HUGETLB (in fact, it probably doesn't) */ 77 #define HUGE_FLAG (0x40000) 78 #else 79 #define HUGE_FLAG MAP_HUGETLB 80 #endif 81 82 #ifndef MAP_HUGE_SHIFT 83 /* older kernels (or FreeBSD) will not have this define */ 84 #define HUGE_SHIFT (26) 85 #else 86 #define HUGE_SHIFT MAP_HUGE_SHIFT 87 #endif 88 89 #define EXTMEM_HEAP_NAME "extmem" 90 /* 91 * Zone size with the malloc overhead (max of debug and release variants) 92 * must fit into the smallest supported hugepage size (2M), 93 * so that an IOVA-contiguous zone of this size can always be allocated 94 * if there are free 2M hugepages. 95 */ 96 #define EXTBUF_ZONE_SIZE (RTE_PGSIZE_2M - 4 * RTE_CACHE_LINE_SIZE) 97 98 uint16_t verbose_level = 0; /**< Silent by default. */ 99 int testpmd_logtype; /**< Log type for testpmd logs */ 100 101 /* use main core for command line ? */ 102 uint8_t interactive = 0; 103 uint8_t auto_start = 0; 104 uint8_t tx_first; 105 char cmdline_filename[PATH_MAX] = {0}; 106 107 /* 108 * NUMA support configuration. 109 * When set, the NUMA support attempts to dispatch the allocation of the 110 * RX and TX memory rings, and of the DMA memory buffers (mbufs) for the 111 * probed ports among the CPU sockets 0 and 1. 112 * Otherwise, all memory is allocated from CPU socket 0. 113 */ 114 uint8_t numa_support = 1; /**< numa enabled by default */ 115 116 /* 117 * In UMA mode,all memory is allocated from socket 0 if --socket-num is 118 * not configured. 119 */ 120 uint8_t socket_num = UMA_NO_CONFIG; 121 122 /* 123 * Select mempool allocation type: 124 * - native: use regular DPDK memory 125 * - anon: use regular DPDK memory to create mempool, but populate using 126 * anonymous memory (may not be IOVA-contiguous) 127 * - xmem: use externally allocated hugepage memory 128 */ 129 uint8_t mp_alloc_type = MP_ALLOC_NATIVE; 130 131 /* 132 * Store specified sockets on which memory pool to be used by ports 133 * is allocated. 134 */ 135 uint8_t port_numa[RTE_MAX_ETHPORTS]; 136 137 /* 138 * Store specified sockets on which RX ring to be used by ports 139 * is allocated. 140 */ 141 uint8_t rxring_numa[RTE_MAX_ETHPORTS]; 142 143 /* 144 * Store specified sockets on which TX ring to be used by ports 145 * is allocated. 146 */ 147 uint8_t txring_numa[RTE_MAX_ETHPORTS]; 148 149 /* 150 * Record the Ethernet address of peer target ports to which packets are 151 * forwarded. 152 * Must be instantiated with the ethernet addresses of peer traffic generator 153 * ports. 154 */ 155 struct rte_ether_addr peer_eth_addrs[RTE_MAX_ETHPORTS]; 156 portid_t nb_peer_eth_addrs = 0; 157 158 /* 159 * Probed Target Environment. 160 */ 161 struct rte_port *ports; /**< For all probed ethernet ports. */ 162 portid_t nb_ports; /**< Number of probed ethernet ports. */ 163 struct fwd_lcore **fwd_lcores; /**< For all probed logical cores. */ 164 lcoreid_t nb_lcores; /**< Number of probed logical cores. */ 165 166 portid_t ports_ids[RTE_MAX_ETHPORTS]; /**< Store all port ids. */ 167 168 /* 169 * Test Forwarding Configuration. 170 * nb_fwd_lcores <= nb_cfg_lcores <= nb_lcores 171 * nb_fwd_ports <= nb_cfg_ports <= nb_ports 172 */ 173 lcoreid_t nb_cfg_lcores; /**< Number of configured logical cores. */ 174 lcoreid_t nb_fwd_lcores; /**< Number of forwarding logical cores. */ 175 portid_t nb_cfg_ports; /**< Number of configured ports. */ 176 portid_t nb_fwd_ports; /**< Number of forwarding ports. */ 177 178 unsigned int fwd_lcores_cpuids[RTE_MAX_LCORE]; /**< CPU ids configuration. */ 179 portid_t fwd_ports_ids[RTE_MAX_ETHPORTS]; /**< Port ids configuration. */ 180 181 struct fwd_stream **fwd_streams; /**< For each RX queue of each port. */ 182 streamid_t nb_fwd_streams; /**< Is equal to (nb_ports * nb_rxq). */ 183 184 /* 185 * Forwarding engines. 186 */ 187 struct fwd_engine * fwd_engines[] = { 188 &io_fwd_engine, 189 &mac_fwd_engine, 190 &mac_swap_engine, 191 &flow_gen_engine, 192 &rx_only_engine, 193 &tx_only_engine, 194 &csum_fwd_engine, 195 &icmp_echo_engine, 196 &noisy_vnf_engine, 197 &five_tuple_swap_fwd_engine, 198 #ifdef RTE_LIBRTE_IEEE1588 199 &ieee1588_fwd_engine, 200 #endif 201 &shared_rxq_engine, 202 NULL, 203 }; 204 205 struct rte_mempool *mempools[RTE_MAX_NUMA_NODES * MAX_SEGS_BUFFER_SPLIT]; 206 uint16_t mempool_flags; 207 208 struct fwd_config cur_fwd_config; 209 struct fwd_engine *cur_fwd_eng = &io_fwd_engine; /**< IO mode by default. */ 210 uint32_t retry_enabled; 211 uint32_t burst_tx_delay_time = BURST_TX_WAIT_US; 212 uint32_t burst_tx_retry_num = BURST_TX_RETRIES; 213 214 uint32_t mbuf_data_size_n = 1; /* Number of specified mbuf sizes. */ 215 uint16_t mbuf_data_size[MAX_SEGS_BUFFER_SPLIT] = { 216 DEFAULT_MBUF_DATA_SIZE 217 }; /**< Mbuf data space size. */ 218 uint32_t param_total_num_mbufs = 0; /**< number of mbufs in all pools - if 219 * specified on command-line. */ 220 uint16_t stats_period; /**< Period to show statistics (disabled by default) */ 221 222 /** Extended statistics to show. */ 223 struct rte_eth_xstat_name *xstats_display; 224 225 unsigned int xstats_display_num; /**< Size of extended statistics to show */ 226 227 /* 228 * In container, it cannot terminate the process which running with 'stats-period' 229 * option. Set flag to exit stats period loop after received SIGINT/SIGTERM. 230 */ 231 uint8_t f_quit; 232 233 /* 234 * Max Rx frame size, set by '--max-pkt-len' parameter. 235 */ 236 uint32_t max_rx_pkt_len; 237 238 /* 239 * Configuration of packet segments used to scatter received packets 240 * if some of split features is configured. 241 */ 242 uint16_t rx_pkt_seg_lengths[MAX_SEGS_BUFFER_SPLIT]; 243 uint8_t rx_pkt_nb_segs; /**< Number of segments to split */ 244 uint16_t rx_pkt_seg_offsets[MAX_SEGS_BUFFER_SPLIT]; 245 uint8_t rx_pkt_nb_offs; /**< Number of specified offsets */ 246 247 /* 248 * Configuration of packet segments used by the "txonly" processing engine. 249 */ 250 uint16_t tx_pkt_length = TXONLY_DEF_PACKET_LEN; /**< TXONLY packet length. */ 251 uint16_t tx_pkt_seg_lengths[RTE_MAX_SEGS_PER_PKT] = { 252 TXONLY_DEF_PACKET_LEN, 253 }; 254 uint8_t tx_pkt_nb_segs = 1; /**< Number of segments in TXONLY packets */ 255 256 enum tx_pkt_split tx_pkt_split = TX_PKT_SPLIT_OFF; 257 /**< Split policy for packets to TX. */ 258 259 uint8_t txonly_multi_flow; 260 /**< Whether multiple flows are generated in TXONLY mode. */ 261 262 uint32_t tx_pkt_times_inter; 263 /**< Timings for send scheduling in TXONLY mode, time between bursts. */ 264 265 uint32_t tx_pkt_times_intra; 266 /**< Timings for send scheduling in TXONLY mode, time between packets. */ 267 268 uint16_t nb_pkt_per_burst = DEF_PKT_BURST; /**< Number of packets per burst. */ 269 uint16_t nb_pkt_flowgen_clones; /**< Number of Tx packet clones to send in flowgen mode. */ 270 int nb_flows_flowgen = 1024; /**< Number of flows in flowgen mode. */ 271 uint16_t mb_mempool_cache = DEF_MBUF_CACHE; /**< Size of mbuf mempool cache. */ 272 273 /* current configuration is in DCB or not,0 means it is not in DCB mode */ 274 uint8_t dcb_config = 0; 275 276 /* 277 * Configurable number of RX/TX queues. 278 */ 279 queueid_t nb_hairpinq; /**< Number of hairpin queues per port. */ 280 queueid_t nb_rxq = 1; /**< Number of RX queues per port. */ 281 queueid_t nb_txq = 1; /**< Number of TX queues per port. */ 282 283 /* 284 * Configurable number of RX/TX ring descriptors. 285 * Defaults are supplied by drivers via ethdev. 286 */ 287 #define RTE_TEST_RX_DESC_DEFAULT 0 288 #define RTE_TEST_TX_DESC_DEFAULT 0 289 uint16_t nb_rxd = RTE_TEST_RX_DESC_DEFAULT; /**< Number of RX descriptors. */ 290 uint16_t nb_txd = RTE_TEST_TX_DESC_DEFAULT; /**< Number of TX descriptors. */ 291 292 #define RTE_PMD_PARAM_UNSET -1 293 /* 294 * Configurable values of RX and TX ring threshold registers. 295 */ 296 297 int8_t rx_pthresh = RTE_PMD_PARAM_UNSET; 298 int8_t rx_hthresh = RTE_PMD_PARAM_UNSET; 299 int8_t rx_wthresh = RTE_PMD_PARAM_UNSET; 300 301 int8_t tx_pthresh = RTE_PMD_PARAM_UNSET; 302 int8_t tx_hthresh = RTE_PMD_PARAM_UNSET; 303 int8_t tx_wthresh = RTE_PMD_PARAM_UNSET; 304 305 /* 306 * Configurable value of RX free threshold. 307 */ 308 int16_t rx_free_thresh = RTE_PMD_PARAM_UNSET; 309 310 /* 311 * Configurable value of RX drop enable. 312 */ 313 int8_t rx_drop_en = RTE_PMD_PARAM_UNSET; 314 315 /* 316 * Configurable value of TX free threshold. 317 */ 318 int16_t tx_free_thresh = RTE_PMD_PARAM_UNSET; 319 320 /* 321 * Configurable value of TX RS bit threshold. 322 */ 323 int16_t tx_rs_thresh = RTE_PMD_PARAM_UNSET; 324 325 /* 326 * Configurable value of buffered packets before sending. 327 */ 328 uint16_t noisy_tx_sw_bufsz; 329 330 /* 331 * Configurable value of packet buffer timeout. 332 */ 333 uint16_t noisy_tx_sw_buf_flush_time; 334 335 /* 336 * Configurable value for size of VNF internal memory area 337 * used for simulating noisy neighbour behaviour 338 */ 339 uint64_t noisy_lkup_mem_sz; 340 341 /* 342 * Configurable value of number of random writes done in 343 * VNF simulation memory area. 344 */ 345 uint64_t noisy_lkup_num_writes; 346 347 /* 348 * Configurable value of number of random reads done in 349 * VNF simulation memory area. 350 */ 351 uint64_t noisy_lkup_num_reads; 352 353 /* 354 * Configurable value of number of random reads/writes done in 355 * VNF simulation memory area. 356 */ 357 uint64_t noisy_lkup_num_reads_writes; 358 359 /* 360 * Receive Side Scaling (RSS) configuration. 361 */ 362 uint64_t rss_hf = RTE_ETH_RSS_IP; /* RSS IP by default. */ 363 364 /* 365 * Port topology configuration 366 */ 367 uint16_t port_topology = PORT_TOPOLOGY_PAIRED; /* Ports are paired by default */ 368 369 /* 370 * Avoids to flush all the RX streams before starts forwarding. 371 */ 372 uint8_t no_flush_rx = 0; /* flush by default */ 373 374 /* 375 * Flow API isolated mode. 376 */ 377 uint8_t flow_isolate_all; 378 379 /* 380 * Avoids to check link status when starting/stopping a port. 381 */ 382 uint8_t no_link_check = 0; /* check by default */ 383 384 /* 385 * Don't automatically start all ports in interactive mode. 386 */ 387 uint8_t no_device_start = 0; 388 389 /* 390 * Enable link status change notification 391 */ 392 uint8_t lsc_interrupt = 1; /* enabled by default */ 393 394 /* 395 * Enable device removal notification. 396 */ 397 uint8_t rmv_interrupt = 1; /* enabled by default */ 398 399 uint8_t hot_plug = 0; /**< hotplug disabled by default. */ 400 401 /* After attach, port setup is called on event or by iterator */ 402 bool setup_on_probe_event = true; 403 404 /* Clear ptypes on port initialization. */ 405 uint8_t clear_ptypes = true; 406 407 /* Hairpin ports configuration mode. */ 408 uint16_t hairpin_mode; 409 410 /* Pretty printing of ethdev events */ 411 static const char * const eth_event_desc[] = { 412 [RTE_ETH_EVENT_UNKNOWN] = "unknown", 413 [RTE_ETH_EVENT_INTR_LSC] = "link state change", 414 [RTE_ETH_EVENT_QUEUE_STATE] = "queue state", 415 [RTE_ETH_EVENT_INTR_RESET] = "reset", 416 [RTE_ETH_EVENT_VF_MBOX] = "VF mbox", 417 [RTE_ETH_EVENT_IPSEC] = "IPsec", 418 [RTE_ETH_EVENT_MACSEC] = "MACsec", 419 [RTE_ETH_EVENT_INTR_RMV] = "device removal", 420 [RTE_ETH_EVENT_NEW] = "device probed", 421 [RTE_ETH_EVENT_DESTROY] = "device released", 422 [RTE_ETH_EVENT_FLOW_AGED] = "flow aged", 423 [RTE_ETH_EVENT_MAX] = NULL, 424 }; 425 426 /* 427 * Display or mask ether events 428 * Default to all events except VF_MBOX 429 */ 430 uint32_t event_print_mask = (UINT32_C(1) << RTE_ETH_EVENT_UNKNOWN) | 431 (UINT32_C(1) << RTE_ETH_EVENT_INTR_LSC) | 432 (UINT32_C(1) << RTE_ETH_EVENT_QUEUE_STATE) | 433 (UINT32_C(1) << RTE_ETH_EVENT_INTR_RESET) | 434 (UINT32_C(1) << RTE_ETH_EVENT_IPSEC) | 435 (UINT32_C(1) << RTE_ETH_EVENT_MACSEC) | 436 (UINT32_C(1) << RTE_ETH_EVENT_INTR_RMV) | 437 (UINT32_C(1) << RTE_ETH_EVENT_FLOW_AGED); 438 /* 439 * Decide if all memory are locked for performance. 440 */ 441 int do_mlockall = 0; 442 443 /* 444 * NIC bypass mode configuration options. 445 */ 446 447 #if defined RTE_NET_IXGBE && defined RTE_LIBRTE_IXGBE_BYPASS 448 /* The NIC bypass watchdog timeout. */ 449 uint32_t bypass_timeout = RTE_PMD_IXGBE_BYPASS_TMT_OFF; 450 #endif 451 452 453 #ifdef RTE_LIB_LATENCYSTATS 454 455 /* 456 * Set when latency stats is enabled in the commandline 457 */ 458 uint8_t latencystats_enabled; 459 460 /* 461 * Lcore ID to service latency statistics. 462 */ 463 lcoreid_t latencystats_lcore_id = -1; 464 465 #endif 466 467 /* 468 * Ethernet device configuration. 469 */ 470 struct rte_eth_rxmode rx_mode; 471 472 struct rte_eth_txmode tx_mode = { 473 .offloads = RTE_ETH_TX_OFFLOAD_MBUF_FAST_FREE, 474 }; 475 476 struct rte_eth_fdir_conf fdir_conf = { 477 .mode = RTE_FDIR_MODE_NONE, 478 .pballoc = RTE_ETH_FDIR_PBALLOC_64K, 479 .status = RTE_FDIR_REPORT_STATUS, 480 .mask = { 481 .vlan_tci_mask = 0xFFEF, 482 .ipv4_mask = { 483 .src_ip = 0xFFFFFFFF, 484 .dst_ip = 0xFFFFFFFF, 485 }, 486 .ipv6_mask = { 487 .src_ip = {0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF}, 488 .dst_ip = {0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF}, 489 }, 490 .src_port_mask = 0xFFFF, 491 .dst_port_mask = 0xFFFF, 492 .mac_addr_byte_mask = 0xFF, 493 .tunnel_type_mask = 1, 494 .tunnel_id_mask = 0xFFFFFFFF, 495 }, 496 .drop_queue = 127, 497 }; 498 499 volatile int test_done = 1; /* stop packet forwarding when set to 1. */ 500 501 /* 502 * Display zero values by default for xstats 503 */ 504 uint8_t xstats_hide_zero; 505 506 /* 507 * Measure of CPU cycles disabled by default 508 */ 509 uint8_t record_core_cycles; 510 511 /* 512 * Display of RX and TX bursts disabled by default 513 */ 514 uint8_t record_burst_stats; 515 516 /* 517 * Number of ports per shared Rx queue group, 0 disable. 518 */ 519 uint32_t rxq_share; 520 521 unsigned int num_sockets = 0; 522 unsigned int socket_ids[RTE_MAX_NUMA_NODES]; 523 524 #ifdef RTE_LIB_BITRATESTATS 525 /* Bitrate statistics */ 526 struct rte_stats_bitrates *bitrate_data; 527 lcoreid_t bitrate_lcore_id; 528 uint8_t bitrate_enabled; 529 #endif 530 531 #ifdef RTE_LIB_GRO 532 struct gro_status gro_ports[RTE_MAX_ETHPORTS]; 533 uint8_t gro_flush_cycles = GRO_DEFAULT_FLUSH_CYCLES; 534 #endif 535 536 /* 537 * hexadecimal bitmask of RX mq mode can be enabled. 538 */ 539 enum rte_eth_rx_mq_mode rx_mq_mode = RTE_ETH_MQ_RX_VMDQ_DCB_RSS; 540 541 /* 542 * Used to set forced link speed 543 */ 544 uint32_t eth_link_speed; 545 546 /* 547 * ID of the current process in multi-process, used to 548 * configure the queues to be polled. 549 */ 550 int proc_id; 551 552 /* 553 * Number of processes in multi-process, used to 554 * configure the queues to be polled. 555 */ 556 unsigned int num_procs = 1; 557 558 static void 559 eth_rx_metadata_negotiate_mp(uint16_t port_id) 560 { 561 uint64_t rx_meta_features = 0; 562 int ret; 563 564 if (!is_proc_primary()) 565 return; 566 567 rx_meta_features |= RTE_ETH_RX_METADATA_USER_FLAG; 568 rx_meta_features |= RTE_ETH_RX_METADATA_USER_MARK; 569 rx_meta_features |= RTE_ETH_RX_METADATA_TUNNEL_ID; 570 571 ret = rte_eth_rx_metadata_negotiate(port_id, &rx_meta_features); 572 if (ret == 0) { 573 if (!(rx_meta_features & RTE_ETH_RX_METADATA_USER_FLAG)) { 574 TESTPMD_LOG(DEBUG, "Flow action FLAG will not affect Rx mbufs on port %u\n", 575 port_id); 576 } 577 578 if (!(rx_meta_features & RTE_ETH_RX_METADATA_USER_MARK)) { 579 TESTPMD_LOG(DEBUG, "Flow action MARK will not affect Rx mbufs on port %u\n", 580 port_id); 581 } 582 583 if (!(rx_meta_features & RTE_ETH_RX_METADATA_TUNNEL_ID)) { 584 TESTPMD_LOG(DEBUG, "Flow tunnel offload support might be limited or unavailable on port %u\n", 585 port_id); 586 } 587 } else if (ret != -ENOTSUP) { 588 rte_exit(EXIT_FAILURE, "Error when negotiating Rx meta features on port %u: %s\n", 589 port_id, rte_strerror(-ret)); 590 } 591 } 592 593 static int 594 eth_dev_configure_mp(uint16_t port_id, uint16_t nb_rx_q, uint16_t nb_tx_q, 595 const struct rte_eth_conf *dev_conf) 596 { 597 if (is_proc_primary()) 598 return rte_eth_dev_configure(port_id, nb_rx_q, nb_tx_q, 599 dev_conf); 600 return 0; 601 } 602 603 static int 604 change_bonding_slave_port_status(portid_t bond_pid, bool is_stop) 605 { 606 #ifdef RTE_NET_BOND 607 608 portid_t slave_pids[RTE_MAX_ETHPORTS]; 609 struct rte_port *port; 610 int num_slaves; 611 portid_t slave_pid; 612 int i; 613 614 num_slaves = rte_eth_bond_slaves_get(bond_pid, slave_pids, 615 RTE_MAX_ETHPORTS); 616 if (num_slaves < 0) { 617 fprintf(stderr, "Failed to get slave list for port = %u\n", 618 bond_pid); 619 return num_slaves; 620 } 621 622 for (i = 0; i < num_slaves; i++) { 623 slave_pid = slave_pids[i]; 624 port = &ports[slave_pid]; 625 port->port_status = 626 is_stop ? RTE_PORT_STOPPED : RTE_PORT_STARTED; 627 } 628 #else 629 RTE_SET_USED(bond_pid); 630 RTE_SET_USED(is_stop); 631 #endif 632 return 0; 633 } 634 635 static int 636 eth_dev_start_mp(uint16_t port_id) 637 { 638 int ret; 639 640 if (is_proc_primary()) { 641 ret = rte_eth_dev_start(port_id); 642 if (ret != 0) 643 return ret; 644 645 struct rte_port *port = &ports[port_id]; 646 647 /* 648 * Starting a bonded port also starts all slaves under the bonded 649 * device. So if this port is bond device, we need to modify the 650 * port status of these slaves. 651 */ 652 if (port->bond_flag == 1) 653 return change_bonding_slave_port_status(port_id, false); 654 } 655 656 return 0; 657 } 658 659 static int 660 eth_dev_stop_mp(uint16_t port_id) 661 { 662 int ret; 663 664 if (is_proc_primary()) { 665 ret = rte_eth_dev_stop(port_id); 666 if (ret != 0) 667 return ret; 668 669 struct rte_port *port = &ports[port_id]; 670 671 /* 672 * Stopping a bonded port also stops all slaves under the bonded 673 * device. So if this port is bond device, we need to modify the 674 * port status of these slaves. 675 */ 676 if (port->bond_flag == 1) 677 return change_bonding_slave_port_status(port_id, true); 678 } 679 680 return 0; 681 } 682 683 static void 684 mempool_free_mp(struct rte_mempool *mp) 685 { 686 if (is_proc_primary()) 687 rte_mempool_free(mp); 688 } 689 690 static int 691 eth_dev_set_mtu_mp(uint16_t port_id, uint16_t mtu) 692 { 693 if (is_proc_primary()) 694 return rte_eth_dev_set_mtu(port_id, mtu); 695 696 return 0; 697 } 698 699 /* Forward function declarations */ 700 static void setup_attached_port(portid_t pi); 701 static void check_all_ports_link_status(uint32_t port_mask); 702 static int eth_event_callback(portid_t port_id, 703 enum rte_eth_event_type type, 704 void *param, void *ret_param); 705 static void dev_event_callback(const char *device_name, 706 enum rte_dev_event_type type, 707 void *param); 708 static void fill_xstats_display_info(void); 709 710 /* 711 * Check if all the ports are started. 712 * If yes, return positive value. If not, return zero. 713 */ 714 static int all_ports_started(void); 715 716 #ifdef RTE_LIB_GSO 717 struct gso_status gso_ports[RTE_MAX_ETHPORTS]; 718 uint16_t gso_max_segment_size = RTE_ETHER_MAX_LEN - RTE_ETHER_CRC_LEN; 719 #endif 720 721 /* Holds the registered mbuf dynamic flags names. */ 722 char dynf_names[64][RTE_MBUF_DYN_NAMESIZE]; 723 724 725 /* 726 * Helper function to check if socket is already discovered. 727 * If yes, return positive value. If not, return zero. 728 */ 729 int 730 new_socket_id(unsigned int socket_id) 731 { 732 unsigned int i; 733 734 for (i = 0; i < num_sockets; i++) { 735 if (socket_ids[i] == socket_id) 736 return 0; 737 } 738 return 1; 739 } 740 741 /* 742 * Setup default configuration. 743 */ 744 static void 745 set_default_fwd_lcores_config(void) 746 { 747 unsigned int i; 748 unsigned int nb_lc; 749 unsigned int sock_num; 750 751 nb_lc = 0; 752 for (i = 0; i < RTE_MAX_LCORE; i++) { 753 if (!rte_lcore_is_enabled(i)) 754 continue; 755 sock_num = rte_lcore_to_socket_id(i); 756 if (new_socket_id(sock_num)) { 757 if (num_sockets >= RTE_MAX_NUMA_NODES) { 758 rte_exit(EXIT_FAILURE, 759 "Total sockets greater than %u\n", 760 RTE_MAX_NUMA_NODES); 761 } 762 socket_ids[num_sockets++] = sock_num; 763 } 764 if (i == rte_get_main_lcore()) 765 continue; 766 fwd_lcores_cpuids[nb_lc++] = i; 767 } 768 nb_lcores = (lcoreid_t) nb_lc; 769 nb_cfg_lcores = nb_lcores; 770 nb_fwd_lcores = 1; 771 } 772 773 static void 774 set_def_peer_eth_addrs(void) 775 { 776 portid_t i; 777 778 for (i = 0; i < RTE_MAX_ETHPORTS; i++) { 779 peer_eth_addrs[i].addr_bytes[0] = RTE_ETHER_LOCAL_ADMIN_ADDR; 780 peer_eth_addrs[i].addr_bytes[5] = i; 781 } 782 } 783 784 static void 785 set_default_fwd_ports_config(void) 786 { 787 portid_t pt_id; 788 int i = 0; 789 790 RTE_ETH_FOREACH_DEV(pt_id) { 791 fwd_ports_ids[i++] = pt_id; 792 793 /* Update sockets info according to the attached device */ 794 int socket_id = rte_eth_dev_socket_id(pt_id); 795 if (socket_id >= 0 && new_socket_id(socket_id)) { 796 if (num_sockets >= RTE_MAX_NUMA_NODES) { 797 rte_exit(EXIT_FAILURE, 798 "Total sockets greater than %u\n", 799 RTE_MAX_NUMA_NODES); 800 } 801 socket_ids[num_sockets++] = socket_id; 802 } 803 } 804 805 nb_cfg_ports = nb_ports; 806 nb_fwd_ports = nb_ports; 807 } 808 809 void 810 set_def_fwd_config(void) 811 { 812 set_default_fwd_lcores_config(); 813 set_def_peer_eth_addrs(); 814 set_default_fwd_ports_config(); 815 } 816 817 #ifndef RTE_EXEC_ENV_WINDOWS 818 /* extremely pessimistic estimation of memory required to create a mempool */ 819 static int 820 calc_mem_size(uint32_t nb_mbufs, uint32_t mbuf_sz, size_t pgsz, size_t *out) 821 { 822 unsigned int n_pages, mbuf_per_pg, leftover; 823 uint64_t total_mem, mbuf_mem, obj_sz; 824 825 /* there is no good way to predict how much space the mempool will 826 * occupy because it will allocate chunks on the fly, and some of those 827 * will come from default DPDK memory while some will come from our 828 * external memory, so just assume 128MB will be enough for everyone. 829 */ 830 uint64_t hdr_mem = 128 << 20; 831 832 /* account for possible non-contiguousness */ 833 obj_sz = rte_mempool_calc_obj_size(mbuf_sz, 0, NULL); 834 if (obj_sz > pgsz) { 835 TESTPMD_LOG(ERR, "Object size is bigger than page size\n"); 836 return -1; 837 } 838 839 mbuf_per_pg = pgsz / obj_sz; 840 leftover = (nb_mbufs % mbuf_per_pg) > 0; 841 n_pages = (nb_mbufs / mbuf_per_pg) + leftover; 842 843 mbuf_mem = n_pages * pgsz; 844 845 total_mem = RTE_ALIGN(hdr_mem + mbuf_mem, pgsz); 846 847 if (total_mem > SIZE_MAX) { 848 TESTPMD_LOG(ERR, "Memory size too big\n"); 849 return -1; 850 } 851 *out = (size_t)total_mem; 852 853 return 0; 854 } 855 856 static int 857 pagesz_flags(uint64_t page_sz) 858 { 859 /* as per mmap() manpage, all page sizes are log2 of page size 860 * shifted by MAP_HUGE_SHIFT 861 */ 862 int log2 = rte_log2_u64(page_sz); 863 864 return (log2 << HUGE_SHIFT); 865 } 866 867 static void * 868 alloc_mem(size_t memsz, size_t pgsz, bool huge) 869 { 870 void *addr; 871 int flags; 872 873 /* allocate anonymous hugepages */ 874 flags = MAP_ANONYMOUS | MAP_PRIVATE; 875 if (huge) 876 flags |= HUGE_FLAG | pagesz_flags(pgsz); 877 878 addr = mmap(NULL, memsz, PROT_READ | PROT_WRITE, flags, -1, 0); 879 if (addr == MAP_FAILED) 880 return NULL; 881 882 return addr; 883 } 884 885 struct extmem_param { 886 void *addr; 887 size_t len; 888 size_t pgsz; 889 rte_iova_t *iova_table; 890 unsigned int iova_table_len; 891 }; 892 893 static int 894 create_extmem(uint32_t nb_mbufs, uint32_t mbuf_sz, struct extmem_param *param, 895 bool huge) 896 { 897 uint64_t pgsizes[] = {RTE_PGSIZE_2M, RTE_PGSIZE_1G, /* x86_64, ARM */ 898 RTE_PGSIZE_16M, RTE_PGSIZE_16G}; /* POWER */ 899 unsigned int cur_page, n_pages, pgsz_idx; 900 size_t mem_sz, cur_pgsz; 901 rte_iova_t *iovas = NULL; 902 void *addr; 903 int ret; 904 905 for (pgsz_idx = 0; pgsz_idx < RTE_DIM(pgsizes); pgsz_idx++) { 906 /* skip anything that is too big */ 907 if (pgsizes[pgsz_idx] > SIZE_MAX) 908 continue; 909 910 cur_pgsz = pgsizes[pgsz_idx]; 911 912 /* if we were told not to allocate hugepages, override */ 913 if (!huge) 914 cur_pgsz = sysconf(_SC_PAGESIZE); 915 916 ret = calc_mem_size(nb_mbufs, mbuf_sz, cur_pgsz, &mem_sz); 917 if (ret < 0) { 918 TESTPMD_LOG(ERR, "Cannot calculate memory size\n"); 919 return -1; 920 } 921 922 /* allocate our memory */ 923 addr = alloc_mem(mem_sz, cur_pgsz, huge); 924 925 /* if we couldn't allocate memory with a specified page size, 926 * that doesn't mean we can't do it with other page sizes, so 927 * try another one. 928 */ 929 if (addr == NULL) 930 continue; 931 932 /* store IOVA addresses for every page in this memory area */ 933 n_pages = mem_sz / cur_pgsz; 934 935 iovas = malloc(sizeof(*iovas) * n_pages); 936 937 if (iovas == NULL) { 938 TESTPMD_LOG(ERR, "Cannot allocate memory for iova addresses\n"); 939 goto fail; 940 } 941 /* lock memory if it's not huge pages */ 942 if (!huge) 943 mlock(addr, mem_sz); 944 945 /* populate IOVA addresses */ 946 for (cur_page = 0; cur_page < n_pages; cur_page++) { 947 rte_iova_t iova; 948 size_t offset; 949 void *cur; 950 951 offset = cur_pgsz * cur_page; 952 cur = RTE_PTR_ADD(addr, offset); 953 954 /* touch the page before getting its IOVA */ 955 *(volatile char *)cur = 0; 956 957 iova = rte_mem_virt2iova(cur); 958 959 iovas[cur_page] = iova; 960 } 961 962 break; 963 } 964 /* if we couldn't allocate anything */ 965 if (iovas == NULL) 966 return -1; 967 968 param->addr = addr; 969 param->len = mem_sz; 970 param->pgsz = cur_pgsz; 971 param->iova_table = iovas; 972 param->iova_table_len = n_pages; 973 974 return 0; 975 fail: 976 free(iovas); 977 if (addr) 978 munmap(addr, mem_sz); 979 980 return -1; 981 } 982 983 static int 984 setup_extmem(uint32_t nb_mbufs, uint32_t mbuf_sz, bool huge) 985 { 986 struct extmem_param param; 987 int socket_id, ret; 988 989 memset(¶m, 0, sizeof(param)); 990 991 /* check if our heap exists */ 992 socket_id = rte_malloc_heap_get_socket(EXTMEM_HEAP_NAME); 993 if (socket_id < 0) { 994 /* create our heap */ 995 ret = rte_malloc_heap_create(EXTMEM_HEAP_NAME); 996 if (ret < 0) { 997 TESTPMD_LOG(ERR, "Cannot create heap\n"); 998 return -1; 999 } 1000 } 1001 1002 ret = create_extmem(nb_mbufs, mbuf_sz, ¶m, huge); 1003 if (ret < 0) { 1004 TESTPMD_LOG(ERR, "Cannot create memory area\n"); 1005 return -1; 1006 } 1007 1008 /* we now have a valid memory area, so add it to heap */ 1009 ret = rte_malloc_heap_memory_add(EXTMEM_HEAP_NAME, 1010 param.addr, param.len, param.iova_table, 1011 param.iova_table_len, param.pgsz); 1012 1013 /* when using VFIO, memory is automatically mapped for DMA by EAL */ 1014 1015 /* not needed any more */ 1016 free(param.iova_table); 1017 1018 if (ret < 0) { 1019 TESTPMD_LOG(ERR, "Cannot add memory to heap\n"); 1020 munmap(param.addr, param.len); 1021 return -1; 1022 } 1023 1024 /* success */ 1025 1026 TESTPMD_LOG(DEBUG, "Allocated %zuMB of external memory\n", 1027 param.len >> 20); 1028 1029 return 0; 1030 } 1031 static void 1032 dma_unmap_cb(struct rte_mempool *mp __rte_unused, void *opaque __rte_unused, 1033 struct rte_mempool_memhdr *memhdr, unsigned mem_idx __rte_unused) 1034 { 1035 uint16_t pid = 0; 1036 int ret; 1037 1038 RTE_ETH_FOREACH_DEV(pid) { 1039 struct rte_eth_dev_info dev_info; 1040 1041 ret = eth_dev_info_get_print_err(pid, &dev_info); 1042 if (ret != 0) { 1043 TESTPMD_LOG(DEBUG, 1044 "unable to get device info for port %d on addr 0x%p," 1045 "mempool unmapping will not be performed\n", 1046 pid, memhdr->addr); 1047 continue; 1048 } 1049 1050 ret = rte_dev_dma_unmap(dev_info.device, memhdr->addr, 0, memhdr->len); 1051 if (ret) { 1052 TESTPMD_LOG(DEBUG, 1053 "unable to DMA unmap addr 0x%p " 1054 "for device %s\n", 1055 memhdr->addr, dev_info.device->name); 1056 } 1057 } 1058 ret = rte_extmem_unregister(memhdr->addr, memhdr->len); 1059 if (ret) { 1060 TESTPMD_LOG(DEBUG, 1061 "unable to un-register addr 0x%p\n", memhdr->addr); 1062 } 1063 } 1064 1065 static void 1066 dma_map_cb(struct rte_mempool *mp __rte_unused, void *opaque __rte_unused, 1067 struct rte_mempool_memhdr *memhdr, unsigned mem_idx __rte_unused) 1068 { 1069 uint16_t pid = 0; 1070 size_t page_size = sysconf(_SC_PAGESIZE); 1071 int ret; 1072 1073 ret = rte_extmem_register(memhdr->addr, memhdr->len, NULL, 0, 1074 page_size); 1075 if (ret) { 1076 TESTPMD_LOG(DEBUG, 1077 "unable to register addr 0x%p\n", memhdr->addr); 1078 return; 1079 } 1080 RTE_ETH_FOREACH_DEV(pid) { 1081 struct rte_eth_dev_info dev_info; 1082 1083 ret = eth_dev_info_get_print_err(pid, &dev_info); 1084 if (ret != 0) { 1085 TESTPMD_LOG(DEBUG, 1086 "unable to get device info for port %d on addr 0x%p," 1087 "mempool mapping will not be performed\n", 1088 pid, memhdr->addr); 1089 continue; 1090 } 1091 ret = rte_dev_dma_map(dev_info.device, memhdr->addr, 0, memhdr->len); 1092 if (ret) { 1093 TESTPMD_LOG(DEBUG, 1094 "unable to DMA map addr 0x%p " 1095 "for device %s\n", 1096 memhdr->addr, dev_info.device->name); 1097 } 1098 } 1099 } 1100 #endif 1101 1102 static unsigned int 1103 setup_extbuf(uint32_t nb_mbufs, uint16_t mbuf_sz, unsigned int socket_id, 1104 char *pool_name, struct rte_pktmbuf_extmem **ext_mem) 1105 { 1106 struct rte_pktmbuf_extmem *xmem; 1107 unsigned int ext_num, zone_num, elt_num; 1108 uint16_t elt_size; 1109 1110 elt_size = RTE_ALIGN_CEIL(mbuf_sz, RTE_CACHE_LINE_SIZE); 1111 elt_num = EXTBUF_ZONE_SIZE / elt_size; 1112 zone_num = (nb_mbufs + elt_num - 1) / elt_num; 1113 1114 xmem = malloc(sizeof(struct rte_pktmbuf_extmem) * zone_num); 1115 if (xmem == NULL) { 1116 TESTPMD_LOG(ERR, "Cannot allocate memory for " 1117 "external buffer descriptors\n"); 1118 *ext_mem = NULL; 1119 return 0; 1120 } 1121 for (ext_num = 0; ext_num < zone_num; ext_num++) { 1122 struct rte_pktmbuf_extmem *xseg = xmem + ext_num; 1123 const struct rte_memzone *mz; 1124 char mz_name[RTE_MEMZONE_NAMESIZE]; 1125 int ret; 1126 1127 ret = snprintf(mz_name, sizeof(mz_name), 1128 RTE_MEMPOOL_MZ_FORMAT "_xb_%u", pool_name, ext_num); 1129 if (ret < 0 || ret >= (int)sizeof(mz_name)) { 1130 errno = ENAMETOOLONG; 1131 ext_num = 0; 1132 break; 1133 } 1134 mz = rte_memzone_reserve(mz_name, EXTBUF_ZONE_SIZE, 1135 socket_id, 1136 RTE_MEMZONE_IOVA_CONTIG | 1137 RTE_MEMZONE_1GB | 1138 RTE_MEMZONE_SIZE_HINT_ONLY); 1139 if (mz == NULL) { 1140 /* 1141 * The caller exits on external buffer creation 1142 * error, so there is no need to free memzones. 1143 */ 1144 errno = ENOMEM; 1145 ext_num = 0; 1146 break; 1147 } 1148 xseg->buf_ptr = mz->addr; 1149 xseg->buf_iova = mz->iova; 1150 xseg->buf_len = EXTBUF_ZONE_SIZE; 1151 xseg->elt_size = elt_size; 1152 } 1153 if (ext_num == 0 && xmem != NULL) { 1154 free(xmem); 1155 xmem = NULL; 1156 } 1157 *ext_mem = xmem; 1158 return ext_num; 1159 } 1160 1161 /* 1162 * Configuration initialisation done once at init time. 1163 */ 1164 static struct rte_mempool * 1165 mbuf_pool_create(uint16_t mbuf_seg_size, unsigned nb_mbuf, 1166 unsigned int socket_id, uint16_t size_idx) 1167 { 1168 char pool_name[RTE_MEMPOOL_NAMESIZE]; 1169 struct rte_mempool *rte_mp = NULL; 1170 #ifndef RTE_EXEC_ENV_WINDOWS 1171 uint32_t mb_size; 1172 1173 mb_size = sizeof(struct rte_mbuf) + mbuf_seg_size; 1174 #endif 1175 mbuf_poolname_build(socket_id, pool_name, sizeof(pool_name), size_idx); 1176 if (!is_proc_primary()) { 1177 rte_mp = rte_mempool_lookup(pool_name); 1178 if (rte_mp == NULL) 1179 rte_exit(EXIT_FAILURE, 1180 "Get mbuf pool for socket %u failed: %s\n", 1181 socket_id, rte_strerror(rte_errno)); 1182 return rte_mp; 1183 } 1184 1185 TESTPMD_LOG(INFO, 1186 "create a new mbuf pool <%s>: n=%u, size=%u, socket=%u\n", 1187 pool_name, nb_mbuf, mbuf_seg_size, socket_id); 1188 1189 switch (mp_alloc_type) { 1190 case MP_ALLOC_NATIVE: 1191 { 1192 /* wrapper to rte_mempool_create() */ 1193 TESTPMD_LOG(INFO, "preferred mempool ops selected: %s\n", 1194 rte_mbuf_best_mempool_ops()); 1195 rte_mp = rte_pktmbuf_pool_create(pool_name, nb_mbuf, 1196 mb_mempool_cache, 0, mbuf_seg_size, socket_id); 1197 break; 1198 } 1199 #ifndef RTE_EXEC_ENV_WINDOWS 1200 case MP_ALLOC_ANON: 1201 { 1202 rte_mp = rte_mempool_create_empty(pool_name, nb_mbuf, 1203 mb_size, (unsigned int) mb_mempool_cache, 1204 sizeof(struct rte_pktmbuf_pool_private), 1205 socket_id, mempool_flags); 1206 if (rte_mp == NULL) 1207 goto err; 1208 1209 if (rte_mempool_populate_anon(rte_mp) == 0) { 1210 rte_mempool_free(rte_mp); 1211 rte_mp = NULL; 1212 goto err; 1213 } 1214 rte_pktmbuf_pool_init(rte_mp, NULL); 1215 rte_mempool_obj_iter(rte_mp, rte_pktmbuf_init, NULL); 1216 rte_mempool_mem_iter(rte_mp, dma_map_cb, NULL); 1217 break; 1218 } 1219 case MP_ALLOC_XMEM: 1220 case MP_ALLOC_XMEM_HUGE: 1221 { 1222 int heap_socket; 1223 bool huge = mp_alloc_type == MP_ALLOC_XMEM_HUGE; 1224 1225 if (setup_extmem(nb_mbuf, mbuf_seg_size, huge) < 0) 1226 rte_exit(EXIT_FAILURE, "Could not create external memory\n"); 1227 1228 heap_socket = 1229 rte_malloc_heap_get_socket(EXTMEM_HEAP_NAME); 1230 if (heap_socket < 0) 1231 rte_exit(EXIT_FAILURE, "Could not get external memory socket ID\n"); 1232 1233 TESTPMD_LOG(INFO, "preferred mempool ops selected: %s\n", 1234 rte_mbuf_best_mempool_ops()); 1235 rte_mp = rte_pktmbuf_pool_create(pool_name, nb_mbuf, 1236 mb_mempool_cache, 0, mbuf_seg_size, 1237 heap_socket); 1238 break; 1239 } 1240 #endif 1241 case MP_ALLOC_XBUF: 1242 { 1243 struct rte_pktmbuf_extmem *ext_mem; 1244 unsigned int ext_num; 1245 1246 ext_num = setup_extbuf(nb_mbuf, mbuf_seg_size, 1247 socket_id, pool_name, &ext_mem); 1248 if (ext_num == 0) 1249 rte_exit(EXIT_FAILURE, 1250 "Can't create pinned data buffers\n"); 1251 1252 TESTPMD_LOG(INFO, "preferred mempool ops selected: %s\n", 1253 rte_mbuf_best_mempool_ops()); 1254 rte_mp = rte_pktmbuf_pool_create_extbuf 1255 (pool_name, nb_mbuf, mb_mempool_cache, 1256 0, mbuf_seg_size, socket_id, 1257 ext_mem, ext_num); 1258 free(ext_mem); 1259 break; 1260 } 1261 default: 1262 { 1263 rte_exit(EXIT_FAILURE, "Invalid mempool creation mode\n"); 1264 } 1265 } 1266 1267 #ifndef RTE_EXEC_ENV_WINDOWS 1268 err: 1269 #endif 1270 if (rte_mp == NULL) { 1271 rte_exit(EXIT_FAILURE, 1272 "Creation of mbuf pool for socket %u failed: %s\n", 1273 socket_id, rte_strerror(rte_errno)); 1274 } else if (verbose_level > 0) { 1275 rte_mempool_dump(stdout, rte_mp); 1276 } 1277 return rte_mp; 1278 } 1279 1280 /* 1281 * Check given socket id is valid or not with NUMA mode, 1282 * if valid, return 0, else return -1 1283 */ 1284 static int 1285 check_socket_id(const unsigned int socket_id) 1286 { 1287 static int warning_once = 0; 1288 1289 if (new_socket_id(socket_id)) { 1290 if (!warning_once && numa_support) 1291 fprintf(stderr, 1292 "Warning: NUMA should be configured manually by using --port-numa-config and --ring-numa-config parameters along with --numa.\n"); 1293 warning_once = 1; 1294 return -1; 1295 } 1296 return 0; 1297 } 1298 1299 /* 1300 * Get the allowed maximum number of RX queues. 1301 * *pid return the port id which has minimal value of 1302 * max_rx_queues in all ports. 1303 */ 1304 queueid_t 1305 get_allowed_max_nb_rxq(portid_t *pid) 1306 { 1307 queueid_t allowed_max_rxq = RTE_MAX_QUEUES_PER_PORT; 1308 bool max_rxq_valid = false; 1309 portid_t pi; 1310 struct rte_eth_dev_info dev_info; 1311 1312 RTE_ETH_FOREACH_DEV(pi) { 1313 if (eth_dev_info_get_print_err(pi, &dev_info) != 0) 1314 continue; 1315 1316 max_rxq_valid = true; 1317 if (dev_info.max_rx_queues < allowed_max_rxq) { 1318 allowed_max_rxq = dev_info.max_rx_queues; 1319 *pid = pi; 1320 } 1321 } 1322 return max_rxq_valid ? allowed_max_rxq : 0; 1323 } 1324 1325 /* 1326 * Check input rxq is valid or not. 1327 * If input rxq is not greater than any of maximum number 1328 * of RX queues of all ports, it is valid. 1329 * if valid, return 0, else return -1 1330 */ 1331 int 1332 check_nb_rxq(queueid_t rxq) 1333 { 1334 queueid_t allowed_max_rxq; 1335 portid_t pid = 0; 1336 1337 allowed_max_rxq = get_allowed_max_nb_rxq(&pid); 1338 if (rxq > allowed_max_rxq) { 1339 fprintf(stderr, 1340 "Fail: input rxq (%u) can't be greater than max_rx_queues (%u) of port %u\n", 1341 rxq, allowed_max_rxq, pid); 1342 return -1; 1343 } 1344 return 0; 1345 } 1346 1347 /* 1348 * Get the allowed maximum number of TX queues. 1349 * *pid return the port id which has minimal value of 1350 * max_tx_queues in all ports. 1351 */ 1352 queueid_t 1353 get_allowed_max_nb_txq(portid_t *pid) 1354 { 1355 queueid_t allowed_max_txq = RTE_MAX_QUEUES_PER_PORT; 1356 bool max_txq_valid = false; 1357 portid_t pi; 1358 struct rte_eth_dev_info dev_info; 1359 1360 RTE_ETH_FOREACH_DEV(pi) { 1361 if (eth_dev_info_get_print_err(pi, &dev_info) != 0) 1362 continue; 1363 1364 max_txq_valid = true; 1365 if (dev_info.max_tx_queues < allowed_max_txq) { 1366 allowed_max_txq = dev_info.max_tx_queues; 1367 *pid = pi; 1368 } 1369 } 1370 return max_txq_valid ? allowed_max_txq : 0; 1371 } 1372 1373 /* 1374 * Check input txq is valid or not. 1375 * If input txq is not greater than any of maximum number 1376 * of TX queues of all ports, it is valid. 1377 * if valid, return 0, else return -1 1378 */ 1379 int 1380 check_nb_txq(queueid_t txq) 1381 { 1382 queueid_t allowed_max_txq; 1383 portid_t pid = 0; 1384 1385 allowed_max_txq = get_allowed_max_nb_txq(&pid); 1386 if (txq > allowed_max_txq) { 1387 fprintf(stderr, 1388 "Fail: input txq (%u) can't be greater than max_tx_queues (%u) of port %u\n", 1389 txq, allowed_max_txq, pid); 1390 return -1; 1391 } 1392 return 0; 1393 } 1394 1395 /* 1396 * Get the allowed maximum number of RXDs of every rx queue. 1397 * *pid return the port id which has minimal value of 1398 * max_rxd in all queues of all ports. 1399 */ 1400 static uint16_t 1401 get_allowed_max_nb_rxd(portid_t *pid) 1402 { 1403 uint16_t allowed_max_rxd = UINT16_MAX; 1404 portid_t pi; 1405 struct rte_eth_dev_info dev_info; 1406 1407 RTE_ETH_FOREACH_DEV(pi) { 1408 if (eth_dev_info_get_print_err(pi, &dev_info) != 0) 1409 continue; 1410 1411 if (dev_info.rx_desc_lim.nb_max < allowed_max_rxd) { 1412 allowed_max_rxd = dev_info.rx_desc_lim.nb_max; 1413 *pid = pi; 1414 } 1415 } 1416 return allowed_max_rxd; 1417 } 1418 1419 /* 1420 * Get the allowed minimal number of RXDs of every rx queue. 1421 * *pid return the port id which has minimal value of 1422 * min_rxd in all queues of all ports. 1423 */ 1424 static uint16_t 1425 get_allowed_min_nb_rxd(portid_t *pid) 1426 { 1427 uint16_t allowed_min_rxd = 0; 1428 portid_t pi; 1429 struct rte_eth_dev_info dev_info; 1430 1431 RTE_ETH_FOREACH_DEV(pi) { 1432 if (eth_dev_info_get_print_err(pi, &dev_info) != 0) 1433 continue; 1434 1435 if (dev_info.rx_desc_lim.nb_min > allowed_min_rxd) { 1436 allowed_min_rxd = dev_info.rx_desc_lim.nb_min; 1437 *pid = pi; 1438 } 1439 } 1440 1441 return allowed_min_rxd; 1442 } 1443 1444 /* 1445 * Check input rxd is valid or not. 1446 * If input rxd is not greater than any of maximum number 1447 * of RXDs of every Rx queues and is not less than any of 1448 * minimal number of RXDs of every Rx queues, it is valid. 1449 * if valid, return 0, else return -1 1450 */ 1451 int 1452 check_nb_rxd(queueid_t rxd) 1453 { 1454 uint16_t allowed_max_rxd; 1455 uint16_t allowed_min_rxd; 1456 portid_t pid = 0; 1457 1458 allowed_max_rxd = get_allowed_max_nb_rxd(&pid); 1459 if (rxd > allowed_max_rxd) { 1460 fprintf(stderr, 1461 "Fail: input rxd (%u) can't be greater than max_rxds (%u) of port %u\n", 1462 rxd, allowed_max_rxd, pid); 1463 return -1; 1464 } 1465 1466 allowed_min_rxd = get_allowed_min_nb_rxd(&pid); 1467 if (rxd < allowed_min_rxd) { 1468 fprintf(stderr, 1469 "Fail: input rxd (%u) can't be less than min_rxds (%u) of port %u\n", 1470 rxd, allowed_min_rxd, pid); 1471 return -1; 1472 } 1473 1474 return 0; 1475 } 1476 1477 /* 1478 * Get the allowed maximum number of TXDs of every rx queues. 1479 * *pid return the port id which has minimal value of 1480 * max_txd in every tx queue. 1481 */ 1482 static uint16_t 1483 get_allowed_max_nb_txd(portid_t *pid) 1484 { 1485 uint16_t allowed_max_txd = UINT16_MAX; 1486 portid_t pi; 1487 struct rte_eth_dev_info dev_info; 1488 1489 RTE_ETH_FOREACH_DEV(pi) { 1490 if (eth_dev_info_get_print_err(pi, &dev_info) != 0) 1491 continue; 1492 1493 if (dev_info.tx_desc_lim.nb_max < allowed_max_txd) { 1494 allowed_max_txd = dev_info.tx_desc_lim.nb_max; 1495 *pid = pi; 1496 } 1497 } 1498 return allowed_max_txd; 1499 } 1500 1501 /* 1502 * Get the allowed maximum number of TXDs of every tx queues. 1503 * *pid return the port id which has minimal value of 1504 * min_txd in every tx queue. 1505 */ 1506 static uint16_t 1507 get_allowed_min_nb_txd(portid_t *pid) 1508 { 1509 uint16_t allowed_min_txd = 0; 1510 portid_t pi; 1511 struct rte_eth_dev_info dev_info; 1512 1513 RTE_ETH_FOREACH_DEV(pi) { 1514 if (eth_dev_info_get_print_err(pi, &dev_info) != 0) 1515 continue; 1516 1517 if (dev_info.tx_desc_lim.nb_min > allowed_min_txd) { 1518 allowed_min_txd = dev_info.tx_desc_lim.nb_min; 1519 *pid = pi; 1520 } 1521 } 1522 1523 return allowed_min_txd; 1524 } 1525 1526 /* 1527 * Check input txd is valid or not. 1528 * If input txd is not greater than any of maximum number 1529 * of TXDs of every Rx queues, it is valid. 1530 * if valid, return 0, else return -1 1531 */ 1532 int 1533 check_nb_txd(queueid_t txd) 1534 { 1535 uint16_t allowed_max_txd; 1536 uint16_t allowed_min_txd; 1537 portid_t pid = 0; 1538 1539 allowed_max_txd = get_allowed_max_nb_txd(&pid); 1540 if (txd > allowed_max_txd) { 1541 fprintf(stderr, 1542 "Fail: input txd (%u) can't be greater than max_txds (%u) of port %u\n", 1543 txd, allowed_max_txd, pid); 1544 return -1; 1545 } 1546 1547 allowed_min_txd = get_allowed_min_nb_txd(&pid); 1548 if (txd < allowed_min_txd) { 1549 fprintf(stderr, 1550 "Fail: input txd (%u) can't be less than min_txds (%u) of port %u\n", 1551 txd, allowed_min_txd, pid); 1552 return -1; 1553 } 1554 return 0; 1555 } 1556 1557 1558 /* 1559 * Get the allowed maximum number of hairpin queues. 1560 * *pid return the port id which has minimal value of 1561 * max_hairpin_queues in all ports. 1562 */ 1563 queueid_t 1564 get_allowed_max_nb_hairpinq(portid_t *pid) 1565 { 1566 queueid_t allowed_max_hairpinq = RTE_MAX_QUEUES_PER_PORT; 1567 portid_t pi; 1568 struct rte_eth_hairpin_cap cap; 1569 1570 RTE_ETH_FOREACH_DEV(pi) { 1571 if (rte_eth_dev_hairpin_capability_get(pi, &cap) != 0) { 1572 *pid = pi; 1573 return 0; 1574 } 1575 if (cap.max_nb_queues < allowed_max_hairpinq) { 1576 allowed_max_hairpinq = cap.max_nb_queues; 1577 *pid = pi; 1578 } 1579 } 1580 return allowed_max_hairpinq; 1581 } 1582 1583 /* 1584 * Check input hairpin is valid or not. 1585 * If input hairpin is not greater than any of maximum number 1586 * of hairpin queues of all ports, it is valid. 1587 * if valid, return 0, else return -1 1588 */ 1589 int 1590 check_nb_hairpinq(queueid_t hairpinq) 1591 { 1592 queueid_t allowed_max_hairpinq; 1593 portid_t pid = 0; 1594 1595 allowed_max_hairpinq = get_allowed_max_nb_hairpinq(&pid); 1596 if (hairpinq > allowed_max_hairpinq) { 1597 fprintf(stderr, 1598 "Fail: input hairpin (%u) can't be greater than max_hairpin_queues (%u) of port %u\n", 1599 hairpinq, allowed_max_hairpinq, pid); 1600 return -1; 1601 } 1602 return 0; 1603 } 1604 1605 static int 1606 get_eth_overhead(struct rte_eth_dev_info *dev_info) 1607 { 1608 uint32_t eth_overhead; 1609 1610 if (dev_info->max_mtu != UINT16_MAX && 1611 dev_info->max_rx_pktlen > dev_info->max_mtu) 1612 eth_overhead = dev_info->max_rx_pktlen - dev_info->max_mtu; 1613 else 1614 eth_overhead = RTE_ETHER_HDR_LEN + RTE_ETHER_CRC_LEN; 1615 1616 return eth_overhead; 1617 } 1618 1619 static void 1620 init_config_port_offloads(portid_t pid, uint32_t socket_id) 1621 { 1622 struct rte_port *port = &ports[pid]; 1623 int ret; 1624 int i; 1625 1626 eth_rx_metadata_negotiate_mp(pid); 1627 1628 port->dev_conf.txmode = tx_mode; 1629 port->dev_conf.rxmode = rx_mode; 1630 1631 ret = eth_dev_info_get_print_err(pid, &port->dev_info); 1632 if (ret != 0) 1633 rte_exit(EXIT_FAILURE, "rte_eth_dev_info_get() failed\n"); 1634 1635 if (!(port->dev_info.tx_offload_capa & RTE_ETH_TX_OFFLOAD_MBUF_FAST_FREE)) 1636 port->dev_conf.txmode.offloads &= 1637 ~RTE_ETH_TX_OFFLOAD_MBUF_FAST_FREE; 1638 1639 /* Apply Rx offloads configuration */ 1640 for (i = 0; i < port->dev_info.max_rx_queues; i++) 1641 port->rxq[i].conf.offloads = port->dev_conf.rxmode.offloads; 1642 /* Apply Tx offloads configuration */ 1643 for (i = 0; i < port->dev_info.max_tx_queues; i++) 1644 port->txq[i].conf.offloads = port->dev_conf.txmode.offloads; 1645 1646 if (eth_link_speed) 1647 port->dev_conf.link_speeds = eth_link_speed; 1648 1649 if (max_rx_pkt_len) 1650 port->dev_conf.rxmode.mtu = max_rx_pkt_len - 1651 get_eth_overhead(&port->dev_info); 1652 1653 /* set flag to initialize port/queue */ 1654 port->need_reconfig = 1; 1655 port->need_reconfig_queues = 1; 1656 port->socket_id = socket_id; 1657 port->tx_metadata = 0; 1658 1659 /* 1660 * Check for maximum number of segments per MTU. 1661 * Accordingly update the mbuf data size. 1662 */ 1663 if (port->dev_info.rx_desc_lim.nb_mtu_seg_max != UINT16_MAX && 1664 port->dev_info.rx_desc_lim.nb_mtu_seg_max != 0) { 1665 uint32_t eth_overhead = get_eth_overhead(&port->dev_info); 1666 uint16_t mtu; 1667 1668 if (rte_eth_dev_get_mtu(pid, &mtu) == 0) { 1669 uint16_t data_size = (mtu + eth_overhead) / 1670 port->dev_info.rx_desc_lim.nb_mtu_seg_max; 1671 uint16_t buffer_size = data_size + RTE_PKTMBUF_HEADROOM; 1672 1673 if (buffer_size > mbuf_data_size[0]) { 1674 mbuf_data_size[0] = buffer_size; 1675 TESTPMD_LOG(WARNING, 1676 "Configured mbuf size of the first segment %hu\n", 1677 mbuf_data_size[0]); 1678 } 1679 } 1680 } 1681 } 1682 1683 static void 1684 init_config(void) 1685 { 1686 portid_t pid; 1687 struct rte_mempool *mbp; 1688 unsigned int nb_mbuf_per_pool; 1689 lcoreid_t lc_id; 1690 #ifdef RTE_LIB_GRO 1691 struct rte_gro_param gro_param; 1692 #endif 1693 #ifdef RTE_LIB_GSO 1694 uint32_t gso_types; 1695 #endif 1696 1697 /* Configuration of logical cores. */ 1698 fwd_lcores = rte_zmalloc("testpmd: fwd_lcores", 1699 sizeof(struct fwd_lcore *) * nb_lcores, 1700 RTE_CACHE_LINE_SIZE); 1701 if (fwd_lcores == NULL) { 1702 rte_exit(EXIT_FAILURE, "rte_zmalloc(%d (struct fwd_lcore *)) " 1703 "failed\n", nb_lcores); 1704 } 1705 for (lc_id = 0; lc_id < nb_lcores; lc_id++) { 1706 fwd_lcores[lc_id] = rte_zmalloc("testpmd: struct fwd_lcore", 1707 sizeof(struct fwd_lcore), 1708 RTE_CACHE_LINE_SIZE); 1709 if (fwd_lcores[lc_id] == NULL) { 1710 rte_exit(EXIT_FAILURE, "rte_zmalloc(struct fwd_lcore) " 1711 "failed\n"); 1712 } 1713 fwd_lcores[lc_id]->cpuid_idx = lc_id; 1714 } 1715 1716 RTE_ETH_FOREACH_DEV(pid) { 1717 uint32_t socket_id; 1718 1719 if (numa_support) { 1720 socket_id = port_numa[pid]; 1721 if (port_numa[pid] == NUMA_NO_CONFIG) { 1722 socket_id = rte_eth_dev_socket_id(pid); 1723 1724 /* 1725 * if socket_id is invalid, 1726 * set to the first available socket. 1727 */ 1728 if (check_socket_id(socket_id) < 0) 1729 socket_id = socket_ids[0]; 1730 } 1731 } else { 1732 socket_id = (socket_num == UMA_NO_CONFIG) ? 1733 0 : socket_num; 1734 } 1735 /* Apply default TxRx configuration for all ports */ 1736 init_config_port_offloads(pid, socket_id); 1737 } 1738 /* 1739 * Create pools of mbuf. 1740 * If NUMA support is disabled, create a single pool of mbuf in 1741 * socket 0 memory by default. 1742 * Otherwise, create a pool of mbuf in the memory of sockets 0 and 1. 1743 * 1744 * Use the maximum value of nb_rxd and nb_txd here, then nb_rxd and 1745 * nb_txd can be configured at run time. 1746 */ 1747 if (param_total_num_mbufs) 1748 nb_mbuf_per_pool = param_total_num_mbufs; 1749 else { 1750 nb_mbuf_per_pool = RTE_TEST_RX_DESC_MAX + 1751 (nb_lcores * mb_mempool_cache) + 1752 RTE_TEST_TX_DESC_MAX + MAX_PKT_BURST; 1753 nb_mbuf_per_pool *= RTE_MAX_ETHPORTS; 1754 } 1755 1756 if (numa_support) { 1757 uint8_t i, j; 1758 1759 for (i = 0; i < num_sockets; i++) 1760 for (j = 0; j < mbuf_data_size_n; j++) 1761 mempools[i * MAX_SEGS_BUFFER_SPLIT + j] = 1762 mbuf_pool_create(mbuf_data_size[j], 1763 nb_mbuf_per_pool, 1764 socket_ids[i], j); 1765 } else { 1766 uint8_t i; 1767 1768 for (i = 0; i < mbuf_data_size_n; i++) 1769 mempools[i] = mbuf_pool_create 1770 (mbuf_data_size[i], 1771 nb_mbuf_per_pool, 1772 socket_num == UMA_NO_CONFIG ? 1773 0 : socket_num, i); 1774 } 1775 1776 init_port_config(); 1777 1778 #ifdef RTE_LIB_GSO 1779 gso_types = RTE_ETH_TX_OFFLOAD_TCP_TSO | RTE_ETH_TX_OFFLOAD_VXLAN_TNL_TSO | 1780 RTE_ETH_TX_OFFLOAD_GRE_TNL_TSO | RTE_ETH_TX_OFFLOAD_UDP_TSO; 1781 #endif 1782 /* 1783 * Records which Mbuf pool to use by each logical core, if needed. 1784 */ 1785 for (lc_id = 0; lc_id < nb_lcores; lc_id++) { 1786 mbp = mbuf_pool_find( 1787 rte_lcore_to_socket_id(fwd_lcores_cpuids[lc_id]), 0); 1788 1789 if (mbp == NULL) 1790 mbp = mbuf_pool_find(0, 0); 1791 fwd_lcores[lc_id]->mbp = mbp; 1792 #ifdef RTE_LIB_GSO 1793 /* initialize GSO context */ 1794 fwd_lcores[lc_id]->gso_ctx.direct_pool = mbp; 1795 fwd_lcores[lc_id]->gso_ctx.indirect_pool = mbp; 1796 fwd_lcores[lc_id]->gso_ctx.gso_types = gso_types; 1797 fwd_lcores[lc_id]->gso_ctx.gso_size = RTE_ETHER_MAX_LEN - 1798 RTE_ETHER_CRC_LEN; 1799 fwd_lcores[lc_id]->gso_ctx.flag = 0; 1800 #endif 1801 } 1802 1803 fwd_config_setup(); 1804 1805 #ifdef RTE_LIB_GRO 1806 /* create a gro context for each lcore */ 1807 gro_param.gro_types = RTE_GRO_TCP_IPV4; 1808 gro_param.max_flow_num = GRO_MAX_FLUSH_CYCLES; 1809 gro_param.max_item_per_flow = MAX_PKT_BURST; 1810 for (lc_id = 0; lc_id < nb_lcores; lc_id++) { 1811 gro_param.socket_id = rte_lcore_to_socket_id( 1812 fwd_lcores_cpuids[lc_id]); 1813 fwd_lcores[lc_id]->gro_ctx = rte_gro_ctx_create(&gro_param); 1814 if (fwd_lcores[lc_id]->gro_ctx == NULL) { 1815 rte_exit(EXIT_FAILURE, 1816 "rte_gro_ctx_create() failed\n"); 1817 } 1818 } 1819 #endif 1820 } 1821 1822 1823 void 1824 reconfig(portid_t new_port_id, unsigned socket_id) 1825 { 1826 /* Reconfiguration of Ethernet ports. */ 1827 init_config_port_offloads(new_port_id, socket_id); 1828 init_port_config(); 1829 } 1830 1831 int 1832 init_fwd_streams(void) 1833 { 1834 portid_t pid; 1835 struct rte_port *port; 1836 streamid_t sm_id, nb_fwd_streams_new; 1837 queueid_t q; 1838 1839 /* set socket id according to numa or not */ 1840 RTE_ETH_FOREACH_DEV(pid) { 1841 port = &ports[pid]; 1842 if (nb_rxq > port->dev_info.max_rx_queues) { 1843 fprintf(stderr, 1844 "Fail: nb_rxq(%d) is greater than max_rx_queues(%d)\n", 1845 nb_rxq, port->dev_info.max_rx_queues); 1846 return -1; 1847 } 1848 if (nb_txq > port->dev_info.max_tx_queues) { 1849 fprintf(stderr, 1850 "Fail: nb_txq(%d) is greater than max_tx_queues(%d)\n", 1851 nb_txq, port->dev_info.max_tx_queues); 1852 return -1; 1853 } 1854 if (numa_support) { 1855 if (port_numa[pid] != NUMA_NO_CONFIG) 1856 port->socket_id = port_numa[pid]; 1857 else { 1858 port->socket_id = rte_eth_dev_socket_id(pid); 1859 1860 /* 1861 * if socket_id is invalid, 1862 * set to the first available socket. 1863 */ 1864 if (check_socket_id(port->socket_id) < 0) 1865 port->socket_id = socket_ids[0]; 1866 } 1867 } 1868 else { 1869 if (socket_num == UMA_NO_CONFIG) 1870 port->socket_id = 0; 1871 else 1872 port->socket_id = socket_num; 1873 } 1874 } 1875 1876 q = RTE_MAX(nb_rxq, nb_txq); 1877 if (q == 0) { 1878 fprintf(stderr, 1879 "Fail: Cannot allocate fwd streams as number of queues is 0\n"); 1880 return -1; 1881 } 1882 nb_fwd_streams_new = (streamid_t)(nb_ports * q); 1883 if (nb_fwd_streams_new == nb_fwd_streams) 1884 return 0; 1885 /* clear the old */ 1886 if (fwd_streams != NULL) { 1887 for (sm_id = 0; sm_id < nb_fwd_streams; sm_id++) { 1888 if (fwd_streams[sm_id] == NULL) 1889 continue; 1890 rte_free(fwd_streams[sm_id]); 1891 fwd_streams[sm_id] = NULL; 1892 } 1893 rte_free(fwd_streams); 1894 fwd_streams = NULL; 1895 } 1896 1897 /* init new */ 1898 nb_fwd_streams = nb_fwd_streams_new; 1899 if (nb_fwd_streams) { 1900 fwd_streams = rte_zmalloc("testpmd: fwd_streams", 1901 sizeof(struct fwd_stream *) * nb_fwd_streams, 1902 RTE_CACHE_LINE_SIZE); 1903 if (fwd_streams == NULL) 1904 rte_exit(EXIT_FAILURE, "rte_zmalloc(%d" 1905 " (struct fwd_stream *)) failed\n", 1906 nb_fwd_streams); 1907 1908 for (sm_id = 0; sm_id < nb_fwd_streams; sm_id++) { 1909 fwd_streams[sm_id] = rte_zmalloc("testpmd:" 1910 " struct fwd_stream", sizeof(struct fwd_stream), 1911 RTE_CACHE_LINE_SIZE); 1912 if (fwd_streams[sm_id] == NULL) 1913 rte_exit(EXIT_FAILURE, "rte_zmalloc" 1914 "(struct fwd_stream) failed\n"); 1915 } 1916 } 1917 1918 return 0; 1919 } 1920 1921 static void 1922 pkt_burst_stats_display(const char *rx_tx, struct pkt_burst_stats *pbs) 1923 { 1924 uint64_t total_burst, sburst; 1925 uint64_t nb_burst; 1926 uint64_t burst_stats[4]; 1927 uint16_t pktnb_stats[4]; 1928 uint16_t nb_pkt; 1929 int burst_percent[4], sburstp; 1930 int i; 1931 1932 /* 1933 * First compute the total number of packet bursts and the 1934 * two highest numbers of bursts of the same number of packets. 1935 */ 1936 memset(&burst_stats, 0x0, sizeof(burst_stats)); 1937 memset(&pktnb_stats, 0x0, sizeof(pktnb_stats)); 1938 1939 /* Show stats for 0 burst size always */ 1940 total_burst = pbs->pkt_burst_spread[0]; 1941 burst_stats[0] = pbs->pkt_burst_spread[0]; 1942 pktnb_stats[0] = 0; 1943 1944 /* Find the next 2 burst sizes with highest occurrences. */ 1945 for (nb_pkt = 1; nb_pkt < MAX_PKT_BURST + 1; nb_pkt++) { 1946 nb_burst = pbs->pkt_burst_spread[nb_pkt]; 1947 1948 if (nb_burst == 0) 1949 continue; 1950 1951 total_burst += nb_burst; 1952 1953 if (nb_burst > burst_stats[1]) { 1954 burst_stats[2] = burst_stats[1]; 1955 pktnb_stats[2] = pktnb_stats[1]; 1956 burst_stats[1] = nb_burst; 1957 pktnb_stats[1] = nb_pkt; 1958 } else if (nb_burst > burst_stats[2]) { 1959 burst_stats[2] = nb_burst; 1960 pktnb_stats[2] = nb_pkt; 1961 } 1962 } 1963 if (total_burst == 0) 1964 return; 1965 1966 printf(" %s-bursts : %"PRIu64" [", rx_tx, total_burst); 1967 for (i = 0, sburst = 0, sburstp = 0; i < 4; i++) { 1968 if (i == 3) { 1969 printf("%d%% of other]\n", 100 - sburstp); 1970 return; 1971 } 1972 1973 sburst += burst_stats[i]; 1974 if (sburst == total_burst) { 1975 printf("%d%% of %d pkts]\n", 1976 100 - sburstp, (int) pktnb_stats[i]); 1977 return; 1978 } 1979 1980 burst_percent[i] = 1981 (double)burst_stats[i] / total_burst * 100; 1982 printf("%d%% of %d pkts + ", 1983 burst_percent[i], (int) pktnb_stats[i]); 1984 sburstp += burst_percent[i]; 1985 } 1986 } 1987 1988 static void 1989 fwd_stream_stats_display(streamid_t stream_id) 1990 { 1991 struct fwd_stream *fs; 1992 static const char *fwd_top_stats_border = "-------"; 1993 1994 fs = fwd_streams[stream_id]; 1995 if ((fs->rx_packets == 0) && (fs->tx_packets == 0) && 1996 (fs->fwd_dropped == 0)) 1997 return; 1998 printf("\n %s Forward Stats for RX Port=%2d/Queue=%2d -> " 1999 "TX Port=%2d/Queue=%2d %s\n", 2000 fwd_top_stats_border, fs->rx_port, fs->rx_queue, 2001 fs->tx_port, fs->tx_queue, fwd_top_stats_border); 2002 printf(" RX-packets: %-14"PRIu64" TX-packets: %-14"PRIu64 2003 " TX-dropped: %-14"PRIu64, 2004 fs->rx_packets, fs->tx_packets, fs->fwd_dropped); 2005 2006 /* if checksum mode */ 2007 if (cur_fwd_eng == &csum_fwd_engine) { 2008 printf(" RX- bad IP checksum: %-14"PRIu64 2009 " Rx- bad L4 checksum: %-14"PRIu64 2010 " Rx- bad outer L4 checksum: %-14"PRIu64"\n", 2011 fs->rx_bad_ip_csum, fs->rx_bad_l4_csum, 2012 fs->rx_bad_outer_l4_csum); 2013 printf(" RX- bad outer IP checksum: %-14"PRIu64"\n", 2014 fs->rx_bad_outer_ip_csum); 2015 } else { 2016 printf("\n"); 2017 } 2018 2019 if (record_burst_stats) { 2020 pkt_burst_stats_display("RX", &fs->rx_burst_stats); 2021 pkt_burst_stats_display("TX", &fs->tx_burst_stats); 2022 } 2023 } 2024 2025 void 2026 fwd_stats_display(void) 2027 { 2028 static const char *fwd_stats_border = "----------------------"; 2029 static const char *acc_stats_border = "+++++++++++++++"; 2030 struct { 2031 struct fwd_stream *rx_stream; 2032 struct fwd_stream *tx_stream; 2033 uint64_t tx_dropped; 2034 uint64_t rx_bad_ip_csum; 2035 uint64_t rx_bad_l4_csum; 2036 uint64_t rx_bad_outer_l4_csum; 2037 uint64_t rx_bad_outer_ip_csum; 2038 } ports_stats[RTE_MAX_ETHPORTS]; 2039 uint64_t total_rx_dropped = 0; 2040 uint64_t total_tx_dropped = 0; 2041 uint64_t total_rx_nombuf = 0; 2042 struct rte_eth_stats stats; 2043 uint64_t fwd_cycles = 0; 2044 uint64_t total_recv = 0; 2045 uint64_t total_xmit = 0; 2046 struct rte_port *port; 2047 streamid_t sm_id; 2048 portid_t pt_id; 2049 int ret; 2050 int i; 2051 2052 memset(ports_stats, 0, sizeof(ports_stats)); 2053 2054 for (sm_id = 0; sm_id < cur_fwd_config.nb_fwd_streams; sm_id++) { 2055 struct fwd_stream *fs = fwd_streams[sm_id]; 2056 2057 if (cur_fwd_config.nb_fwd_streams > 2058 cur_fwd_config.nb_fwd_ports) { 2059 fwd_stream_stats_display(sm_id); 2060 } else { 2061 ports_stats[fs->tx_port].tx_stream = fs; 2062 ports_stats[fs->rx_port].rx_stream = fs; 2063 } 2064 2065 ports_stats[fs->tx_port].tx_dropped += fs->fwd_dropped; 2066 2067 ports_stats[fs->rx_port].rx_bad_ip_csum += fs->rx_bad_ip_csum; 2068 ports_stats[fs->rx_port].rx_bad_l4_csum += fs->rx_bad_l4_csum; 2069 ports_stats[fs->rx_port].rx_bad_outer_l4_csum += 2070 fs->rx_bad_outer_l4_csum; 2071 ports_stats[fs->rx_port].rx_bad_outer_ip_csum += 2072 fs->rx_bad_outer_ip_csum; 2073 2074 if (record_core_cycles) 2075 fwd_cycles += fs->core_cycles; 2076 } 2077 for (i = 0; i < cur_fwd_config.nb_fwd_ports; i++) { 2078 pt_id = fwd_ports_ids[i]; 2079 port = &ports[pt_id]; 2080 2081 ret = rte_eth_stats_get(pt_id, &stats); 2082 if (ret != 0) { 2083 fprintf(stderr, 2084 "%s: Error: failed to get stats (port %u): %d", 2085 __func__, pt_id, ret); 2086 continue; 2087 } 2088 stats.ipackets -= port->stats.ipackets; 2089 stats.opackets -= port->stats.opackets; 2090 stats.ibytes -= port->stats.ibytes; 2091 stats.obytes -= port->stats.obytes; 2092 stats.imissed -= port->stats.imissed; 2093 stats.oerrors -= port->stats.oerrors; 2094 stats.rx_nombuf -= port->stats.rx_nombuf; 2095 2096 total_recv += stats.ipackets; 2097 total_xmit += stats.opackets; 2098 total_rx_dropped += stats.imissed; 2099 total_tx_dropped += ports_stats[pt_id].tx_dropped; 2100 total_tx_dropped += stats.oerrors; 2101 total_rx_nombuf += stats.rx_nombuf; 2102 2103 printf("\n %s Forward statistics for port %-2d %s\n", 2104 fwd_stats_border, pt_id, fwd_stats_border); 2105 2106 printf(" RX-packets: %-14"PRIu64" RX-dropped: %-14"PRIu64 2107 "RX-total: %-"PRIu64"\n", stats.ipackets, stats.imissed, 2108 stats.ipackets + stats.imissed); 2109 2110 if (cur_fwd_eng == &csum_fwd_engine) { 2111 printf(" Bad-ipcsum: %-14"PRIu64 2112 " Bad-l4csum: %-14"PRIu64 2113 "Bad-outer-l4csum: %-14"PRIu64"\n", 2114 ports_stats[pt_id].rx_bad_ip_csum, 2115 ports_stats[pt_id].rx_bad_l4_csum, 2116 ports_stats[pt_id].rx_bad_outer_l4_csum); 2117 printf(" Bad-outer-ipcsum: %-14"PRIu64"\n", 2118 ports_stats[pt_id].rx_bad_outer_ip_csum); 2119 } 2120 if (stats.ierrors + stats.rx_nombuf > 0) { 2121 printf(" RX-error: %-"PRIu64"\n", stats.ierrors); 2122 printf(" RX-nombufs: %-14"PRIu64"\n", stats.rx_nombuf); 2123 } 2124 2125 printf(" TX-packets: %-14"PRIu64" TX-dropped: %-14"PRIu64 2126 "TX-total: %-"PRIu64"\n", 2127 stats.opackets, ports_stats[pt_id].tx_dropped, 2128 stats.opackets + ports_stats[pt_id].tx_dropped); 2129 2130 if (record_burst_stats) { 2131 if (ports_stats[pt_id].rx_stream) 2132 pkt_burst_stats_display("RX", 2133 &ports_stats[pt_id].rx_stream->rx_burst_stats); 2134 if (ports_stats[pt_id].tx_stream) 2135 pkt_burst_stats_display("TX", 2136 &ports_stats[pt_id].tx_stream->tx_burst_stats); 2137 } 2138 2139 printf(" %s--------------------------------%s\n", 2140 fwd_stats_border, fwd_stats_border); 2141 } 2142 2143 printf("\n %s Accumulated forward statistics for all ports" 2144 "%s\n", 2145 acc_stats_border, acc_stats_border); 2146 printf(" RX-packets: %-14"PRIu64" RX-dropped: %-14"PRIu64"RX-total: " 2147 "%-"PRIu64"\n" 2148 " TX-packets: %-14"PRIu64" TX-dropped: %-14"PRIu64"TX-total: " 2149 "%-"PRIu64"\n", 2150 total_recv, total_rx_dropped, total_recv + total_rx_dropped, 2151 total_xmit, total_tx_dropped, total_xmit + total_tx_dropped); 2152 if (total_rx_nombuf > 0) 2153 printf(" RX-nombufs: %-14"PRIu64"\n", total_rx_nombuf); 2154 printf(" %s++++++++++++++++++++++++++++++++++++++++++++++" 2155 "%s\n", 2156 acc_stats_border, acc_stats_border); 2157 if (record_core_cycles) { 2158 #define CYC_PER_MHZ 1E6 2159 if (total_recv > 0 || total_xmit > 0) { 2160 uint64_t total_pkts = 0; 2161 if (strcmp(cur_fwd_eng->fwd_mode_name, "txonly") == 0 || 2162 strcmp(cur_fwd_eng->fwd_mode_name, "flowgen") == 0) 2163 total_pkts = total_xmit; 2164 else 2165 total_pkts = total_recv; 2166 2167 printf("\n CPU cycles/packet=%.2F (total cycles=" 2168 "%"PRIu64" / total %s packets=%"PRIu64") at %"PRIu64 2169 " MHz Clock\n", 2170 (double) fwd_cycles / total_pkts, 2171 fwd_cycles, cur_fwd_eng->fwd_mode_name, total_pkts, 2172 (uint64_t)(rte_get_tsc_hz() / CYC_PER_MHZ)); 2173 } 2174 } 2175 } 2176 2177 void 2178 fwd_stats_reset(void) 2179 { 2180 streamid_t sm_id; 2181 portid_t pt_id; 2182 int ret; 2183 int i; 2184 2185 for (i = 0; i < cur_fwd_config.nb_fwd_ports; i++) { 2186 pt_id = fwd_ports_ids[i]; 2187 ret = rte_eth_stats_get(pt_id, &ports[pt_id].stats); 2188 if (ret != 0) 2189 fprintf(stderr, 2190 "%s: Error: failed to clear stats (port %u):%d", 2191 __func__, pt_id, ret); 2192 } 2193 for (sm_id = 0; sm_id < cur_fwd_config.nb_fwd_streams; sm_id++) { 2194 struct fwd_stream *fs = fwd_streams[sm_id]; 2195 2196 fs->rx_packets = 0; 2197 fs->tx_packets = 0; 2198 fs->fwd_dropped = 0; 2199 fs->rx_bad_ip_csum = 0; 2200 fs->rx_bad_l4_csum = 0; 2201 fs->rx_bad_outer_l4_csum = 0; 2202 fs->rx_bad_outer_ip_csum = 0; 2203 2204 memset(&fs->rx_burst_stats, 0, sizeof(fs->rx_burst_stats)); 2205 memset(&fs->tx_burst_stats, 0, sizeof(fs->tx_burst_stats)); 2206 fs->core_cycles = 0; 2207 } 2208 } 2209 2210 static void 2211 flush_fwd_rx_queues(void) 2212 { 2213 struct rte_mbuf *pkts_burst[MAX_PKT_BURST]; 2214 portid_t rxp; 2215 portid_t port_id; 2216 queueid_t rxq; 2217 uint16_t nb_rx; 2218 uint16_t i; 2219 uint8_t j; 2220 uint64_t prev_tsc = 0, diff_tsc, cur_tsc, timer_tsc = 0; 2221 uint64_t timer_period; 2222 2223 if (num_procs > 1) { 2224 printf("multi-process not support for flushing fwd Rx queues, skip the below lines and return.\n"); 2225 return; 2226 } 2227 2228 /* convert to number of cycles */ 2229 timer_period = rte_get_timer_hz(); /* 1 second timeout */ 2230 2231 for (j = 0; j < 2; j++) { 2232 for (rxp = 0; rxp < cur_fwd_config.nb_fwd_ports; rxp++) { 2233 for (rxq = 0; rxq < nb_rxq; rxq++) { 2234 port_id = fwd_ports_ids[rxp]; 2235 2236 /* Polling stopped queues is prohibited. */ 2237 if (ports[port_id].rxq[rxq].state == 2238 RTE_ETH_QUEUE_STATE_STOPPED) 2239 continue; 2240 2241 /** 2242 * testpmd can stuck in the below do while loop 2243 * if rte_eth_rx_burst() always returns nonzero 2244 * packets. So timer is added to exit this loop 2245 * after 1sec timer expiry. 2246 */ 2247 prev_tsc = rte_rdtsc(); 2248 do { 2249 nb_rx = rte_eth_rx_burst(port_id, rxq, 2250 pkts_burst, MAX_PKT_BURST); 2251 for (i = 0; i < nb_rx; i++) 2252 rte_pktmbuf_free(pkts_burst[i]); 2253 2254 cur_tsc = rte_rdtsc(); 2255 diff_tsc = cur_tsc - prev_tsc; 2256 timer_tsc += diff_tsc; 2257 } while ((nb_rx > 0) && 2258 (timer_tsc < timer_period)); 2259 timer_tsc = 0; 2260 } 2261 } 2262 rte_delay_ms(10); /* wait 10 milli-seconds before retrying */ 2263 } 2264 } 2265 2266 static void 2267 run_pkt_fwd_on_lcore(struct fwd_lcore *fc, packet_fwd_t pkt_fwd) 2268 { 2269 struct fwd_stream **fsm; 2270 streamid_t nb_fs; 2271 streamid_t sm_id; 2272 #ifdef RTE_LIB_BITRATESTATS 2273 uint64_t tics_per_1sec; 2274 uint64_t tics_datum; 2275 uint64_t tics_current; 2276 uint16_t i, cnt_ports; 2277 2278 cnt_ports = nb_ports; 2279 tics_datum = rte_rdtsc(); 2280 tics_per_1sec = rte_get_timer_hz(); 2281 #endif 2282 fsm = &fwd_streams[fc->stream_idx]; 2283 nb_fs = fc->stream_nb; 2284 do { 2285 for (sm_id = 0; sm_id < nb_fs; sm_id++) 2286 if (!fsm[sm_id]->disabled) 2287 (*pkt_fwd)(fsm[sm_id]); 2288 #ifdef RTE_LIB_BITRATESTATS 2289 if (bitrate_enabled != 0 && 2290 bitrate_lcore_id == rte_lcore_id()) { 2291 tics_current = rte_rdtsc(); 2292 if (tics_current - tics_datum >= tics_per_1sec) { 2293 /* Periodic bitrate calculation */ 2294 for (i = 0; i < cnt_ports; i++) 2295 rte_stats_bitrate_calc(bitrate_data, 2296 ports_ids[i]); 2297 tics_datum = tics_current; 2298 } 2299 } 2300 #endif 2301 #ifdef RTE_LIB_LATENCYSTATS 2302 if (latencystats_enabled != 0 && 2303 latencystats_lcore_id == rte_lcore_id()) 2304 rte_latencystats_update(); 2305 #endif 2306 2307 } while (! fc->stopped); 2308 } 2309 2310 static int 2311 start_pkt_forward_on_core(void *fwd_arg) 2312 { 2313 run_pkt_fwd_on_lcore((struct fwd_lcore *) fwd_arg, 2314 cur_fwd_config.fwd_eng->packet_fwd); 2315 return 0; 2316 } 2317 2318 /* 2319 * Run the TXONLY packet forwarding engine to send a single burst of packets. 2320 * Used to start communication flows in network loopback test configurations. 2321 */ 2322 static int 2323 run_one_txonly_burst_on_core(void *fwd_arg) 2324 { 2325 struct fwd_lcore *fwd_lc; 2326 struct fwd_lcore tmp_lcore; 2327 2328 fwd_lc = (struct fwd_lcore *) fwd_arg; 2329 tmp_lcore = *fwd_lc; 2330 tmp_lcore.stopped = 1; 2331 run_pkt_fwd_on_lcore(&tmp_lcore, tx_only_engine.packet_fwd); 2332 return 0; 2333 } 2334 2335 /* 2336 * Launch packet forwarding: 2337 * - Setup per-port forwarding context. 2338 * - launch logical cores with their forwarding configuration. 2339 */ 2340 static void 2341 launch_packet_forwarding(lcore_function_t *pkt_fwd_on_lcore) 2342 { 2343 unsigned int i; 2344 unsigned int lc_id; 2345 int diag; 2346 2347 for (i = 0; i < cur_fwd_config.nb_fwd_lcores; i++) { 2348 lc_id = fwd_lcores_cpuids[i]; 2349 if ((interactive == 0) || (lc_id != rte_lcore_id())) { 2350 fwd_lcores[i]->stopped = 0; 2351 diag = rte_eal_remote_launch(pkt_fwd_on_lcore, 2352 fwd_lcores[i], lc_id); 2353 if (diag != 0) 2354 fprintf(stderr, 2355 "launch lcore %u failed - diag=%d\n", 2356 lc_id, diag); 2357 } 2358 } 2359 } 2360 2361 /* 2362 * Launch packet forwarding configuration. 2363 */ 2364 void 2365 start_packet_forwarding(int with_tx_first) 2366 { 2367 port_fwd_begin_t port_fwd_begin; 2368 port_fwd_end_t port_fwd_end; 2369 stream_init_t stream_init = cur_fwd_eng->stream_init; 2370 unsigned int i; 2371 2372 if (strcmp(cur_fwd_eng->fwd_mode_name, "rxonly") == 0 && !nb_rxq) 2373 rte_exit(EXIT_FAILURE, "rxq are 0, cannot use rxonly fwd mode\n"); 2374 2375 if (strcmp(cur_fwd_eng->fwd_mode_name, "txonly") == 0 && !nb_txq) 2376 rte_exit(EXIT_FAILURE, "txq are 0, cannot use txonly fwd mode\n"); 2377 2378 if ((strcmp(cur_fwd_eng->fwd_mode_name, "rxonly") != 0 && 2379 strcmp(cur_fwd_eng->fwd_mode_name, "txonly") != 0) && 2380 (!nb_rxq || !nb_txq)) 2381 rte_exit(EXIT_FAILURE, 2382 "Either rxq or txq are 0, cannot use %s fwd mode\n", 2383 cur_fwd_eng->fwd_mode_name); 2384 2385 if (all_ports_started() == 0) { 2386 fprintf(stderr, "Not all ports were started\n"); 2387 return; 2388 } 2389 if (test_done == 0) { 2390 fprintf(stderr, "Packet forwarding already started\n"); 2391 return; 2392 } 2393 2394 fwd_config_setup(); 2395 2396 pkt_fwd_config_display(&cur_fwd_config); 2397 if (!pkt_fwd_shared_rxq_check()) 2398 return; 2399 2400 if (stream_init != NULL) 2401 for (i = 0; i < cur_fwd_config.nb_fwd_streams; i++) 2402 stream_init(fwd_streams[i]); 2403 2404 port_fwd_begin = cur_fwd_config.fwd_eng->port_fwd_begin; 2405 if (port_fwd_begin != NULL) { 2406 for (i = 0; i < cur_fwd_config.nb_fwd_ports; i++) { 2407 if (port_fwd_begin(fwd_ports_ids[i])) { 2408 fprintf(stderr, 2409 "Packet forwarding is not ready\n"); 2410 return; 2411 } 2412 } 2413 } 2414 2415 if (with_tx_first) { 2416 port_fwd_begin = tx_only_engine.port_fwd_begin; 2417 if (port_fwd_begin != NULL) { 2418 for (i = 0; i < cur_fwd_config.nb_fwd_ports; i++) { 2419 if (port_fwd_begin(fwd_ports_ids[i])) { 2420 fprintf(stderr, 2421 "Packet forwarding is not ready\n"); 2422 return; 2423 } 2424 } 2425 } 2426 } 2427 2428 test_done = 0; 2429 2430 if(!no_flush_rx) 2431 flush_fwd_rx_queues(); 2432 2433 rxtx_config_display(); 2434 2435 fwd_stats_reset(); 2436 if (with_tx_first) { 2437 while (with_tx_first--) { 2438 launch_packet_forwarding( 2439 run_one_txonly_burst_on_core); 2440 rte_eal_mp_wait_lcore(); 2441 } 2442 port_fwd_end = tx_only_engine.port_fwd_end; 2443 if (port_fwd_end != NULL) { 2444 for (i = 0; i < cur_fwd_config.nb_fwd_ports; i++) 2445 (*port_fwd_end)(fwd_ports_ids[i]); 2446 } 2447 } 2448 launch_packet_forwarding(start_pkt_forward_on_core); 2449 } 2450 2451 void 2452 stop_packet_forwarding(void) 2453 { 2454 port_fwd_end_t port_fwd_end; 2455 lcoreid_t lc_id; 2456 portid_t pt_id; 2457 int i; 2458 2459 if (test_done) { 2460 fprintf(stderr, "Packet forwarding not started\n"); 2461 return; 2462 } 2463 printf("Telling cores to stop..."); 2464 for (lc_id = 0; lc_id < cur_fwd_config.nb_fwd_lcores; lc_id++) 2465 fwd_lcores[lc_id]->stopped = 1; 2466 printf("\nWaiting for lcores to finish...\n"); 2467 rte_eal_mp_wait_lcore(); 2468 port_fwd_end = cur_fwd_config.fwd_eng->port_fwd_end; 2469 if (port_fwd_end != NULL) { 2470 for (i = 0; i < cur_fwd_config.nb_fwd_ports; i++) { 2471 pt_id = fwd_ports_ids[i]; 2472 (*port_fwd_end)(pt_id); 2473 } 2474 } 2475 2476 fwd_stats_display(); 2477 2478 printf("\nDone.\n"); 2479 test_done = 1; 2480 } 2481 2482 void 2483 dev_set_link_up(portid_t pid) 2484 { 2485 if (rte_eth_dev_set_link_up(pid) < 0) 2486 fprintf(stderr, "\nSet link up fail.\n"); 2487 } 2488 2489 void 2490 dev_set_link_down(portid_t pid) 2491 { 2492 if (rte_eth_dev_set_link_down(pid) < 0) 2493 fprintf(stderr, "\nSet link down fail.\n"); 2494 } 2495 2496 static int 2497 all_ports_started(void) 2498 { 2499 portid_t pi; 2500 struct rte_port *port; 2501 2502 RTE_ETH_FOREACH_DEV(pi) { 2503 port = &ports[pi]; 2504 /* Check if there is a port which is not started */ 2505 if ((port->port_status != RTE_PORT_STARTED) && 2506 (port->slave_flag == 0)) 2507 return 0; 2508 } 2509 2510 /* No port is not started */ 2511 return 1; 2512 } 2513 2514 int 2515 port_is_stopped(portid_t port_id) 2516 { 2517 struct rte_port *port = &ports[port_id]; 2518 2519 if ((port->port_status != RTE_PORT_STOPPED) && 2520 (port->slave_flag == 0)) 2521 return 0; 2522 return 1; 2523 } 2524 2525 int 2526 all_ports_stopped(void) 2527 { 2528 portid_t pi; 2529 2530 RTE_ETH_FOREACH_DEV(pi) { 2531 if (!port_is_stopped(pi)) 2532 return 0; 2533 } 2534 2535 return 1; 2536 } 2537 2538 int 2539 port_is_started(portid_t port_id) 2540 { 2541 if (port_id_is_invalid(port_id, ENABLED_WARN)) 2542 return 0; 2543 2544 if (ports[port_id].port_status != RTE_PORT_STARTED) 2545 return 0; 2546 2547 return 1; 2548 } 2549 2550 /* Configure the Rx and Tx hairpin queues for the selected port. */ 2551 static int 2552 setup_hairpin_queues(portid_t pi, portid_t p_pi, uint16_t cnt_pi) 2553 { 2554 queueid_t qi; 2555 struct rte_eth_hairpin_conf hairpin_conf = { 2556 .peer_count = 1, 2557 }; 2558 int i; 2559 int diag; 2560 struct rte_port *port = &ports[pi]; 2561 uint16_t peer_rx_port = pi; 2562 uint16_t peer_tx_port = pi; 2563 uint32_t manual = 1; 2564 uint32_t tx_exp = hairpin_mode & 0x10; 2565 2566 if (!(hairpin_mode & 0xf)) { 2567 peer_rx_port = pi; 2568 peer_tx_port = pi; 2569 manual = 0; 2570 } else if (hairpin_mode & 0x1) { 2571 peer_tx_port = rte_eth_find_next_owned_by(pi + 1, 2572 RTE_ETH_DEV_NO_OWNER); 2573 if (peer_tx_port >= RTE_MAX_ETHPORTS) 2574 peer_tx_port = rte_eth_find_next_owned_by(0, 2575 RTE_ETH_DEV_NO_OWNER); 2576 if (p_pi != RTE_MAX_ETHPORTS) { 2577 peer_rx_port = p_pi; 2578 } else { 2579 uint16_t next_pi; 2580 2581 /* Last port will be the peer RX port of the first. */ 2582 RTE_ETH_FOREACH_DEV(next_pi) 2583 peer_rx_port = next_pi; 2584 } 2585 manual = 1; 2586 } else if (hairpin_mode & 0x2) { 2587 if (cnt_pi & 0x1) { 2588 peer_rx_port = p_pi; 2589 } else { 2590 peer_rx_port = rte_eth_find_next_owned_by(pi + 1, 2591 RTE_ETH_DEV_NO_OWNER); 2592 if (peer_rx_port >= RTE_MAX_ETHPORTS) 2593 peer_rx_port = pi; 2594 } 2595 peer_tx_port = peer_rx_port; 2596 manual = 1; 2597 } 2598 2599 for (qi = nb_txq, i = 0; qi < nb_hairpinq + nb_txq; qi++) { 2600 hairpin_conf.peers[0].port = peer_rx_port; 2601 hairpin_conf.peers[0].queue = i + nb_rxq; 2602 hairpin_conf.manual_bind = !!manual; 2603 hairpin_conf.tx_explicit = !!tx_exp; 2604 diag = rte_eth_tx_hairpin_queue_setup 2605 (pi, qi, nb_txd, &hairpin_conf); 2606 i++; 2607 if (diag == 0) 2608 continue; 2609 2610 /* Fail to setup rx queue, return */ 2611 if (port->port_status == RTE_PORT_HANDLING) 2612 port->port_status = RTE_PORT_STOPPED; 2613 else 2614 fprintf(stderr, 2615 "Port %d can not be set back to stopped\n", pi); 2616 fprintf(stderr, "Fail to configure port %d hairpin queues\n", 2617 pi); 2618 /* try to reconfigure queues next time */ 2619 port->need_reconfig_queues = 1; 2620 return -1; 2621 } 2622 for (qi = nb_rxq, i = 0; qi < nb_hairpinq + nb_rxq; qi++) { 2623 hairpin_conf.peers[0].port = peer_tx_port; 2624 hairpin_conf.peers[0].queue = i + nb_txq; 2625 hairpin_conf.manual_bind = !!manual; 2626 hairpin_conf.tx_explicit = !!tx_exp; 2627 diag = rte_eth_rx_hairpin_queue_setup 2628 (pi, qi, nb_rxd, &hairpin_conf); 2629 i++; 2630 if (diag == 0) 2631 continue; 2632 2633 /* Fail to setup rx queue, return */ 2634 if (port->port_status == RTE_PORT_HANDLING) 2635 port->port_status = RTE_PORT_STOPPED; 2636 else 2637 fprintf(stderr, 2638 "Port %d can not be set back to stopped\n", pi); 2639 fprintf(stderr, "Fail to configure port %d hairpin queues\n", 2640 pi); 2641 /* try to reconfigure queues next time */ 2642 port->need_reconfig_queues = 1; 2643 return -1; 2644 } 2645 return 0; 2646 } 2647 2648 /* Configure the Rx with optional split. */ 2649 int 2650 rx_queue_setup(uint16_t port_id, uint16_t rx_queue_id, 2651 uint16_t nb_rx_desc, unsigned int socket_id, 2652 struct rte_eth_rxconf *rx_conf, struct rte_mempool *mp) 2653 { 2654 union rte_eth_rxseg rx_useg[MAX_SEGS_BUFFER_SPLIT] = {}; 2655 unsigned int i, mp_n; 2656 int ret; 2657 2658 if (rx_pkt_nb_segs <= 1 || 2659 (rx_conf->offloads & RTE_ETH_RX_OFFLOAD_BUFFER_SPLIT) == 0) { 2660 rx_conf->rx_seg = NULL; 2661 rx_conf->rx_nseg = 0; 2662 ret = rte_eth_rx_queue_setup(port_id, rx_queue_id, 2663 nb_rx_desc, socket_id, 2664 rx_conf, mp); 2665 goto exit; 2666 } 2667 for (i = 0; i < rx_pkt_nb_segs; i++) { 2668 struct rte_eth_rxseg_split *rx_seg = &rx_useg[i].split; 2669 struct rte_mempool *mpx; 2670 /* 2671 * Use last valid pool for the segments with number 2672 * exceeding the pool index. 2673 */ 2674 mp_n = (i > mbuf_data_size_n) ? mbuf_data_size_n - 1 : i; 2675 mpx = mbuf_pool_find(socket_id, mp_n); 2676 /* Handle zero as mbuf data buffer size. */ 2677 rx_seg->length = rx_pkt_seg_lengths[i] ? 2678 rx_pkt_seg_lengths[i] : 2679 mbuf_data_size[mp_n]; 2680 rx_seg->offset = i < rx_pkt_nb_offs ? 2681 rx_pkt_seg_offsets[i] : 0; 2682 rx_seg->mp = mpx ? mpx : mp; 2683 } 2684 rx_conf->rx_nseg = rx_pkt_nb_segs; 2685 rx_conf->rx_seg = rx_useg; 2686 ret = rte_eth_rx_queue_setup(port_id, rx_queue_id, nb_rx_desc, 2687 socket_id, rx_conf, NULL); 2688 rx_conf->rx_seg = NULL; 2689 rx_conf->rx_nseg = 0; 2690 exit: 2691 ports[port_id].rxq[rx_queue_id].state = rx_conf->rx_deferred_start ? 2692 RTE_ETH_QUEUE_STATE_STOPPED : 2693 RTE_ETH_QUEUE_STATE_STARTED; 2694 return ret; 2695 } 2696 2697 static int 2698 alloc_xstats_display_info(portid_t pi) 2699 { 2700 uint64_t **ids_supp = &ports[pi].xstats_info.ids_supp; 2701 uint64_t **prev_values = &ports[pi].xstats_info.prev_values; 2702 uint64_t **curr_values = &ports[pi].xstats_info.curr_values; 2703 2704 if (xstats_display_num == 0) 2705 return 0; 2706 2707 *ids_supp = calloc(xstats_display_num, sizeof(**ids_supp)); 2708 if (*ids_supp == NULL) 2709 goto fail_ids_supp; 2710 2711 *prev_values = calloc(xstats_display_num, 2712 sizeof(**prev_values)); 2713 if (*prev_values == NULL) 2714 goto fail_prev_values; 2715 2716 *curr_values = calloc(xstats_display_num, 2717 sizeof(**curr_values)); 2718 if (*curr_values == NULL) 2719 goto fail_curr_values; 2720 2721 ports[pi].xstats_info.allocated = true; 2722 2723 return 0; 2724 2725 fail_curr_values: 2726 free(*prev_values); 2727 fail_prev_values: 2728 free(*ids_supp); 2729 fail_ids_supp: 2730 return -ENOMEM; 2731 } 2732 2733 static void 2734 free_xstats_display_info(portid_t pi) 2735 { 2736 if (!ports[pi].xstats_info.allocated) 2737 return; 2738 free(ports[pi].xstats_info.ids_supp); 2739 free(ports[pi].xstats_info.prev_values); 2740 free(ports[pi].xstats_info.curr_values); 2741 ports[pi].xstats_info.allocated = false; 2742 } 2743 2744 /** Fill helper structures for specified port to show extended statistics. */ 2745 static void 2746 fill_xstats_display_info_for_port(portid_t pi) 2747 { 2748 unsigned int stat, stat_supp; 2749 const char *xstat_name; 2750 struct rte_port *port; 2751 uint64_t *ids_supp; 2752 int rc; 2753 2754 if (xstats_display_num == 0) 2755 return; 2756 2757 if (pi == (portid_t)RTE_PORT_ALL) { 2758 fill_xstats_display_info(); 2759 return; 2760 } 2761 2762 port = &ports[pi]; 2763 if (port->port_status != RTE_PORT_STARTED) 2764 return; 2765 2766 if (!port->xstats_info.allocated && alloc_xstats_display_info(pi) != 0) 2767 rte_exit(EXIT_FAILURE, 2768 "Failed to allocate xstats display memory\n"); 2769 2770 ids_supp = port->xstats_info.ids_supp; 2771 for (stat = stat_supp = 0; stat < xstats_display_num; stat++) { 2772 xstat_name = xstats_display[stat].name; 2773 rc = rte_eth_xstats_get_id_by_name(pi, xstat_name, 2774 ids_supp + stat_supp); 2775 if (rc != 0) { 2776 fprintf(stderr, "No xstat '%s' on port %u - skip it %u\n", 2777 xstat_name, pi, stat); 2778 continue; 2779 } 2780 stat_supp++; 2781 } 2782 2783 port->xstats_info.ids_supp_sz = stat_supp; 2784 } 2785 2786 /** Fill helper structures for all ports to show extended statistics. */ 2787 static void 2788 fill_xstats_display_info(void) 2789 { 2790 portid_t pi; 2791 2792 if (xstats_display_num == 0) 2793 return; 2794 2795 RTE_ETH_FOREACH_DEV(pi) 2796 fill_xstats_display_info_for_port(pi); 2797 } 2798 2799 int 2800 start_port(portid_t pid) 2801 { 2802 int diag, need_check_link_status = -1; 2803 portid_t pi; 2804 portid_t p_pi = RTE_MAX_ETHPORTS; 2805 portid_t pl[RTE_MAX_ETHPORTS]; 2806 portid_t peer_pl[RTE_MAX_ETHPORTS]; 2807 uint16_t cnt_pi = 0; 2808 uint16_t cfg_pi = 0; 2809 int peer_pi; 2810 queueid_t qi; 2811 struct rte_port *port; 2812 struct rte_eth_hairpin_cap cap; 2813 2814 if (port_id_is_invalid(pid, ENABLED_WARN)) 2815 return 0; 2816 2817 RTE_ETH_FOREACH_DEV(pi) { 2818 if (pid != pi && pid != (portid_t)RTE_PORT_ALL) 2819 continue; 2820 2821 if (port_is_bonding_slave(pi)) { 2822 fprintf(stderr, 2823 "Please remove port %d from bonded device.\n", 2824 pi); 2825 continue; 2826 } 2827 2828 need_check_link_status = 0; 2829 port = &ports[pi]; 2830 if (port->port_status == RTE_PORT_STOPPED) 2831 port->port_status = RTE_PORT_HANDLING; 2832 else { 2833 fprintf(stderr, "Port %d is now not stopped\n", pi); 2834 continue; 2835 } 2836 2837 if (port->need_reconfig > 0) { 2838 struct rte_eth_conf dev_conf; 2839 int k; 2840 2841 port->need_reconfig = 0; 2842 2843 if (flow_isolate_all) { 2844 int ret = port_flow_isolate(pi, 1); 2845 if (ret) { 2846 fprintf(stderr, 2847 "Failed to apply isolated mode on port %d\n", 2848 pi); 2849 return -1; 2850 } 2851 } 2852 configure_rxtx_dump_callbacks(0); 2853 printf("Configuring Port %d (socket %u)\n", pi, 2854 port->socket_id); 2855 if (nb_hairpinq > 0 && 2856 rte_eth_dev_hairpin_capability_get(pi, &cap)) { 2857 fprintf(stderr, 2858 "Port %d doesn't support hairpin queues\n", 2859 pi); 2860 return -1; 2861 } 2862 2863 /* configure port */ 2864 diag = eth_dev_configure_mp(pi, nb_rxq + nb_hairpinq, 2865 nb_txq + nb_hairpinq, 2866 &(port->dev_conf)); 2867 if (diag != 0) { 2868 if (port->port_status == RTE_PORT_HANDLING) 2869 port->port_status = RTE_PORT_STOPPED; 2870 else 2871 fprintf(stderr, 2872 "Port %d can not be set back to stopped\n", 2873 pi); 2874 fprintf(stderr, "Fail to configure port %d\n", 2875 pi); 2876 /* try to reconfigure port next time */ 2877 port->need_reconfig = 1; 2878 return -1; 2879 } 2880 /* get device configuration*/ 2881 if (0 != 2882 eth_dev_conf_get_print_err(pi, &dev_conf)) { 2883 fprintf(stderr, 2884 "port %d can not get device configuration\n", 2885 pi); 2886 return -1; 2887 } 2888 /* Apply Rx offloads configuration */ 2889 if (dev_conf.rxmode.offloads != 2890 port->dev_conf.rxmode.offloads) { 2891 port->dev_conf.rxmode.offloads |= 2892 dev_conf.rxmode.offloads; 2893 for (k = 0; 2894 k < port->dev_info.max_rx_queues; 2895 k++) 2896 port->rxq[k].conf.offloads |= 2897 dev_conf.rxmode.offloads; 2898 } 2899 /* Apply Tx offloads configuration */ 2900 if (dev_conf.txmode.offloads != 2901 port->dev_conf.txmode.offloads) { 2902 port->dev_conf.txmode.offloads |= 2903 dev_conf.txmode.offloads; 2904 for (k = 0; 2905 k < port->dev_info.max_tx_queues; 2906 k++) 2907 port->txq[k].conf.offloads |= 2908 dev_conf.txmode.offloads; 2909 } 2910 } 2911 if (port->need_reconfig_queues > 0 && is_proc_primary()) { 2912 port->need_reconfig_queues = 0; 2913 /* setup tx queues */ 2914 for (qi = 0; qi < nb_txq; qi++) { 2915 struct rte_eth_txconf *conf = 2916 &port->txq[qi].conf; 2917 2918 if ((numa_support) && 2919 (txring_numa[pi] != NUMA_NO_CONFIG)) 2920 diag = rte_eth_tx_queue_setup(pi, qi, 2921 port->nb_tx_desc[qi], 2922 txring_numa[pi], 2923 &(port->txq[qi].conf)); 2924 else 2925 diag = rte_eth_tx_queue_setup(pi, qi, 2926 port->nb_tx_desc[qi], 2927 port->socket_id, 2928 &(port->txq[qi].conf)); 2929 2930 if (diag == 0) { 2931 port->txq[qi].state = 2932 conf->tx_deferred_start ? 2933 RTE_ETH_QUEUE_STATE_STOPPED : 2934 RTE_ETH_QUEUE_STATE_STARTED; 2935 continue; 2936 } 2937 2938 /* Fail to setup tx queue, return */ 2939 if (port->port_status == RTE_PORT_HANDLING) 2940 port->port_status = RTE_PORT_STOPPED; 2941 else 2942 fprintf(stderr, 2943 "Port %d can not be set back to stopped\n", 2944 pi); 2945 fprintf(stderr, 2946 "Fail to configure port %d tx queues\n", 2947 pi); 2948 /* try to reconfigure queues next time */ 2949 port->need_reconfig_queues = 1; 2950 return -1; 2951 } 2952 for (qi = 0; qi < nb_rxq; qi++) { 2953 /* setup rx queues */ 2954 if ((numa_support) && 2955 (rxring_numa[pi] != NUMA_NO_CONFIG)) { 2956 struct rte_mempool * mp = 2957 mbuf_pool_find 2958 (rxring_numa[pi], 0); 2959 if (mp == NULL) { 2960 fprintf(stderr, 2961 "Failed to setup RX queue: No mempool allocation on the socket %d\n", 2962 rxring_numa[pi]); 2963 return -1; 2964 } 2965 2966 diag = rx_queue_setup(pi, qi, 2967 port->nb_rx_desc[qi], 2968 rxring_numa[pi], 2969 &(port->rxq[qi].conf), 2970 mp); 2971 } else { 2972 struct rte_mempool *mp = 2973 mbuf_pool_find 2974 (port->socket_id, 0); 2975 if (mp == NULL) { 2976 fprintf(stderr, 2977 "Failed to setup RX queue: No mempool allocation on the socket %d\n", 2978 port->socket_id); 2979 return -1; 2980 } 2981 diag = rx_queue_setup(pi, qi, 2982 port->nb_rx_desc[qi], 2983 port->socket_id, 2984 &(port->rxq[qi].conf), 2985 mp); 2986 } 2987 if (diag == 0) 2988 continue; 2989 2990 /* Fail to setup rx queue, return */ 2991 if (port->port_status == RTE_PORT_HANDLING) 2992 port->port_status = RTE_PORT_STOPPED; 2993 else 2994 fprintf(stderr, 2995 "Port %d can not be set back to stopped\n", 2996 pi); 2997 fprintf(stderr, 2998 "Fail to configure port %d rx queues\n", 2999 pi); 3000 /* try to reconfigure queues next time */ 3001 port->need_reconfig_queues = 1; 3002 return -1; 3003 } 3004 /* setup hairpin queues */ 3005 if (setup_hairpin_queues(pi, p_pi, cnt_pi) != 0) 3006 return -1; 3007 } 3008 configure_rxtx_dump_callbacks(verbose_level); 3009 if (clear_ptypes) { 3010 diag = rte_eth_dev_set_ptypes(pi, RTE_PTYPE_UNKNOWN, 3011 NULL, 0); 3012 if (diag < 0) 3013 fprintf(stderr, 3014 "Port %d: Failed to disable Ptype parsing\n", 3015 pi); 3016 } 3017 3018 p_pi = pi; 3019 cnt_pi++; 3020 3021 /* start port */ 3022 diag = eth_dev_start_mp(pi); 3023 if (diag < 0) { 3024 fprintf(stderr, "Fail to start port %d: %s\n", 3025 pi, rte_strerror(-diag)); 3026 3027 /* Fail to setup rx queue, return */ 3028 if (port->port_status == RTE_PORT_HANDLING) 3029 port->port_status = RTE_PORT_STOPPED; 3030 else 3031 fprintf(stderr, 3032 "Port %d can not be set back to stopped\n", 3033 pi); 3034 continue; 3035 } 3036 3037 if (port->port_status == RTE_PORT_HANDLING) 3038 port->port_status = RTE_PORT_STARTED; 3039 else 3040 fprintf(stderr, "Port %d can not be set into started\n", 3041 pi); 3042 3043 if (eth_macaddr_get_print_err(pi, &port->eth_addr) == 0) 3044 printf("Port %d: " RTE_ETHER_ADDR_PRT_FMT "\n", pi, 3045 RTE_ETHER_ADDR_BYTES(&port->eth_addr)); 3046 3047 /* at least one port started, need checking link status */ 3048 need_check_link_status = 1; 3049 3050 pl[cfg_pi++] = pi; 3051 } 3052 3053 if (need_check_link_status == 1 && !no_link_check) 3054 check_all_ports_link_status(RTE_PORT_ALL); 3055 else if (need_check_link_status == 0) 3056 fprintf(stderr, "Please stop the ports first\n"); 3057 3058 if (hairpin_mode & 0xf) { 3059 uint16_t i; 3060 int j; 3061 3062 /* bind all started hairpin ports */ 3063 for (i = 0; i < cfg_pi; i++) { 3064 pi = pl[i]; 3065 /* bind current Tx to all peer Rx */ 3066 peer_pi = rte_eth_hairpin_get_peer_ports(pi, peer_pl, 3067 RTE_MAX_ETHPORTS, 1); 3068 if (peer_pi < 0) 3069 return peer_pi; 3070 for (j = 0; j < peer_pi; j++) { 3071 if (!port_is_started(peer_pl[j])) 3072 continue; 3073 diag = rte_eth_hairpin_bind(pi, peer_pl[j]); 3074 if (diag < 0) { 3075 fprintf(stderr, 3076 "Error during binding hairpin Tx port %u to %u: %s\n", 3077 pi, peer_pl[j], 3078 rte_strerror(-diag)); 3079 return -1; 3080 } 3081 } 3082 /* bind all peer Tx to current Rx */ 3083 peer_pi = rte_eth_hairpin_get_peer_ports(pi, peer_pl, 3084 RTE_MAX_ETHPORTS, 0); 3085 if (peer_pi < 0) 3086 return peer_pi; 3087 for (j = 0; j < peer_pi; j++) { 3088 if (!port_is_started(peer_pl[j])) 3089 continue; 3090 diag = rte_eth_hairpin_bind(peer_pl[j], pi); 3091 if (diag < 0) { 3092 fprintf(stderr, 3093 "Error during binding hairpin Tx port %u to %u: %s\n", 3094 peer_pl[j], pi, 3095 rte_strerror(-diag)); 3096 return -1; 3097 } 3098 } 3099 } 3100 } 3101 3102 fill_xstats_display_info_for_port(pid); 3103 3104 printf("Done\n"); 3105 return 0; 3106 } 3107 3108 void 3109 stop_port(portid_t pid) 3110 { 3111 portid_t pi; 3112 struct rte_port *port; 3113 int need_check_link_status = 0; 3114 portid_t peer_pl[RTE_MAX_ETHPORTS]; 3115 int peer_pi; 3116 3117 if (port_id_is_invalid(pid, ENABLED_WARN)) 3118 return; 3119 3120 printf("Stopping ports...\n"); 3121 3122 RTE_ETH_FOREACH_DEV(pi) { 3123 if (pid != pi && pid != (portid_t)RTE_PORT_ALL) 3124 continue; 3125 3126 if (port_is_forwarding(pi) != 0 && test_done == 0) { 3127 fprintf(stderr, 3128 "Please remove port %d from forwarding configuration.\n", 3129 pi); 3130 continue; 3131 } 3132 3133 if (port_is_bonding_slave(pi)) { 3134 fprintf(stderr, 3135 "Please remove port %d from bonded device.\n", 3136 pi); 3137 continue; 3138 } 3139 3140 port = &ports[pi]; 3141 if (port->port_status == RTE_PORT_STARTED) 3142 port->port_status = RTE_PORT_HANDLING; 3143 else 3144 continue; 3145 3146 if (hairpin_mode & 0xf) { 3147 int j; 3148 3149 rte_eth_hairpin_unbind(pi, RTE_MAX_ETHPORTS); 3150 /* unbind all peer Tx from current Rx */ 3151 peer_pi = rte_eth_hairpin_get_peer_ports(pi, peer_pl, 3152 RTE_MAX_ETHPORTS, 0); 3153 if (peer_pi < 0) 3154 continue; 3155 for (j = 0; j < peer_pi; j++) { 3156 if (!port_is_started(peer_pl[j])) 3157 continue; 3158 rte_eth_hairpin_unbind(peer_pl[j], pi); 3159 } 3160 } 3161 3162 if (port->flow_list) 3163 port_flow_flush(pi); 3164 3165 if (eth_dev_stop_mp(pi) != 0) 3166 RTE_LOG(ERR, EAL, "rte_eth_dev_stop failed for port %u\n", 3167 pi); 3168 3169 if (port->port_status == RTE_PORT_HANDLING) 3170 port->port_status = RTE_PORT_STOPPED; 3171 else 3172 fprintf(stderr, "Port %d can not be set into stopped\n", 3173 pi); 3174 need_check_link_status = 1; 3175 } 3176 if (need_check_link_status && !no_link_check) 3177 check_all_ports_link_status(RTE_PORT_ALL); 3178 3179 printf("Done\n"); 3180 } 3181 3182 static void 3183 remove_invalid_ports_in(portid_t *array, portid_t *total) 3184 { 3185 portid_t i; 3186 portid_t new_total = 0; 3187 3188 for (i = 0; i < *total; i++) 3189 if (!port_id_is_invalid(array[i], DISABLED_WARN)) { 3190 array[new_total] = array[i]; 3191 new_total++; 3192 } 3193 *total = new_total; 3194 } 3195 3196 static void 3197 remove_invalid_ports(void) 3198 { 3199 remove_invalid_ports_in(ports_ids, &nb_ports); 3200 remove_invalid_ports_in(fwd_ports_ids, &nb_fwd_ports); 3201 nb_cfg_ports = nb_fwd_ports; 3202 } 3203 3204 void 3205 close_port(portid_t pid) 3206 { 3207 portid_t pi; 3208 struct rte_port *port; 3209 3210 if (port_id_is_invalid(pid, ENABLED_WARN)) 3211 return; 3212 3213 printf("Closing ports...\n"); 3214 3215 RTE_ETH_FOREACH_DEV(pi) { 3216 if (pid != pi && pid != (portid_t)RTE_PORT_ALL) 3217 continue; 3218 3219 if (port_is_forwarding(pi) != 0 && test_done == 0) { 3220 fprintf(stderr, 3221 "Please remove port %d from forwarding configuration.\n", 3222 pi); 3223 continue; 3224 } 3225 3226 if (port_is_bonding_slave(pi)) { 3227 fprintf(stderr, 3228 "Please remove port %d from bonded device.\n", 3229 pi); 3230 continue; 3231 } 3232 3233 port = &ports[pi]; 3234 if (port->port_status == RTE_PORT_CLOSED) { 3235 fprintf(stderr, "Port %d is already closed\n", pi); 3236 continue; 3237 } 3238 3239 if (is_proc_primary()) { 3240 port_flow_flush(pi); 3241 port_flex_item_flush(pi); 3242 port_action_handle_flush(pi); 3243 rte_eth_dev_close(pi); 3244 } 3245 3246 free_xstats_display_info(pi); 3247 } 3248 3249 remove_invalid_ports(); 3250 printf("Done\n"); 3251 } 3252 3253 void 3254 reset_port(portid_t pid) 3255 { 3256 int diag; 3257 portid_t pi; 3258 struct rte_port *port; 3259 3260 if (port_id_is_invalid(pid, ENABLED_WARN)) 3261 return; 3262 3263 if ((pid == (portid_t)RTE_PORT_ALL && !all_ports_stopped()) || 3264 (pid != (portid_t)RTE_PORT_ALL && !port_is_stopped(pid))) { 3265 fprintf(stderr, 3266 "Can not reset port(s), please stop port(s) first.\n"); 3267 return; 3268 } 3269 3270 printf("Resetting ports...\n"); 3271 3272 RTE_ETH_FOREACH_DEV(pi) { 3273 if (pid != pi && pid != (portid_t)RTE_PORT_ALL) 3274 continue; 3275 3276 if (port_is_forwarding(pi) != 0 && test_done == 0) { 3277 fprintf(stderr, 3278 "Please remove port %d from forwarding configuration.\n", 3279 pi); 3280 continue; 3281 } 3282 3283 if (port_is_bonding_slave(pi)) { 3284 fprintf(stderr, 3285 "Please remove port %d from bonded device.\n", 3286 pi); 3287 continue; 3288 } 3289 3290 diag = rte_eth_dev_reset(pi); 3291 if (diag == 0) { 3292 port = &ports[pi]; 3293 port->need_reconfig = 1; 3294 port->need_reconfig_queues = 1; 3295 } else { 3296 fprintf(stderr, "Failed to reset port %d. diag=%d\n", 3297 pi, diag); 3298 } 3299 } 3300 3301 printf("Done\n"); 3302 } 3303 3304 void 3305 attach_port(char *identifier) 3306 { 3307 portid_t pi; 3308 struct rte_dev_iterator iterator; 3309 3310 printf("Attaching a new port...\n"); 3311 3312 if (identifier == NULL) { 3313 fprintf(stderr, "Invalid parameters are specified\n"); 3314 return; 3315 } 3316 3317 if (rte_dev_probe(identifier) < 0) { 3318 TESTPMD_LOG(ERR, "Failed to attach port %s\n", identifier); 3319 return; 3320 } 3321 3322 /* first attach mode: event */ 3323 if (setup_on_probe_event) { 3324 /* new ports are detected on RTE_ETH_EVENT_NEW event */ 3325 for (pi = 0; pi < RTE_MAX_ETHPORTS; pi++) 3326 if (ports[pi].port_status == RTE_PORT_HANDLING && 3327 ports[pi].need_setup != 0) 3328 setup_attached_port(pi); 3329 return; 3330 } 3331 3332 /* second attach mode: iterator */ 3333 RTE_ETH_FOREACH_MATCHING_DEV(pi, identifier, &iterator) { 3334 /* setup ports matching the devargs used for probing */ 3335 if (port_is_forwarding(pi)) 3336 continue; /* port was already attached before */ 3337 setup_attached_port(pi); 3338 } 3339 } 3340 3341 static void 3342 setup_attached_port(portid_t pi) 3343 { 3344 unsigned int socket_id; 3345 int ret; 3346 3347 socket_id = (unsigned)rte_eth_dev_socket_id(pi); 3348 /* if socket_id is invalid, set to the first available socket. */ 3349 if (check_socket_id(socket_id) < 0) 3350 socket_id = socket_ids[0]; 3351 reconfig(pi, socket_id); 3352 ret = rte_eth_promiscuous_enable(pi); 3353 if (ret != 0) 3354 fprintf(stderr, 3355 "Error during enabling promiscuous mode for port %u: %s - ignore\n", 3356 pi, rte_strerror(-ret)); 3357 3358 ports_ids[nb_ports++] = pi; 3359 fwd_ports_ids[nb_fwd_ports++] = pi; 3360 nb_cfg_ports = nb_fwd_ports; 3361 ports[pi].need_setup = 0; 3362 ports[pi].port_status = RTE_PORT_STOPPED; 3363 3364 printf("Port %d is attached. Now total ports is %d\n", pi, nb_ports); 3365 printf("Done\n"); 3366 } 3367 3368 static void 3369 detach_device(struct rte_device *dev) 3370 { 3371 portid_t sibling; 3372 3373 if (dev == NULL) { 3374 fprintf(stderr, "Device already removed\n"); 3375 return; 3376 } 3377 3378 printf("Removing a device...\n"); 3379 3380 RTE_ETH_FOREACH_DEV_OF(sibling, dev) { 3381 if (ports[sibling].port_status != RTE_PORT_CLOSED) { 3382 if (ports[sibling].port_status != RTE_PORT_STOPPED) { 3383 fprintf(stderr, "Port %u not stopped\n", 3384 sibling); 3385 return; 3386 } 3387 port_flow_flush(sibling); 3388 } 3389 } 3390 3391 if (rte_dev_remove(dev) < 0) { 3392 TESTPMD_LOG(ERR, "Failed to detach device %s\n", dev->name); 3393 return; 3394 } 3395 remove_invalid_ports(); 3396 3397 printf("Device is detached\n"); 3398 printf("Now total ports is %d\n", nb_ports); 3399 printf("Done\n"); 3400 return; 3401 } 3402 3403 void 3404 detach_port_device(portid_t port_id) 3405 { 3406 int ret; 3407 struct rte_eth_dev_info dev_info; 3408 3409 if (port_id_is_invalid(port_id, ENABLED_WARN)) 3410 return; 3411 3412 if (ports[port_id].port_status != RTE_PORT_CLOSED) { 3413 if (ports[port_id].port_status != RTE_PORT_STOPPED) { 3414 fprintf(stderr, "Port not stopped\n"); 3415 return; 3416 } 3417 fprintf(stderr, "Port was not closed\n"); 3418 } 3419 3420 ret = eth_dev_info_get_print_err(port_id, &dev_info); 3421 if (ret != 0) { 3422 TESTPMD_LOG(ERR, 3423 "Failed to get device info for port %d, not detaching\n", 3424 port_id); 3425 return; 3426 } 3427 detach_device(dev_info.device); 3428 } 3429 3430 void 3431 detach_devargs(char *identifier) 3432 { 3433 struct rte_dev_iterator iterator; 3434 struct rte_devargs da; 3435 portid_t port_id; 3436 3437 printf("Removing a device...\n"); 3438 3439 memset(&da, 0, sizeof(da)); 3440 if (rte_devargs_parsef(&da, "%s", identifier)) { 3441 fprintf(stderr, "cannot parse identifier\n"); 3442 return; 3443 } 3444 3445 RTE_ETH_FOREACH_MATCHING_DEV(port_id, identifier, &iterator) { 3446 if (ports[port_id].port_status != RTE_PORT_CLOSED) { 3447 if (ports[port_id].port_status != RTE_PORT_STOPPED) { 3448 fprintf(stderr, "Port %u not stopped\n", 3449 port_id); 3450 rte_eth_iterator_cleanup(&iterator); 3451 rte_devargs_reset(&da); 3452 return; 3453 } 3454 port_flow_flush(port_id); 3455 } 3456 } 3457 3458 if (rte_eal_hotplug_remove(da.bus->name, da.name) != 0) { 3459 TESTPMD_LOG(ERR, "Failed to detach device %s(%s)\n", 3460 da.name, da.bus->name); 3461 rte_devargs_reset(&da); 3462 return; 3463 } 3464 3465 remove_invalid_ports(); 3466 3467 printf("Device %s is detached\n", identifier); 3468 printf("Now total ports is %d\n", nb_ports); 3469 printf("Done\n"); 3470 rte_devargs_reset(&da); 3471 } 3472 3473 void 3474 pmd_test_exit(void) 3475 { 3476 portid_t pt_id; 3477 unsigned int i; 3478 int ret; 3479 3480 if (test_done == 0) 3481 stop_packet_forwarding(); 3482 3483 #ifndef RTE_EXEC_ENV_WINDOWS 3484 for (i = 0 ; i < RTE_DIM(mempools) ; i++) { 3485 if (mempools[i]) { 3486 if (mp_alloc_type == MP_ALLOC_ANON) 3487 rte_mempool_mem_iter(mempools[i], dma_unmap_cb, 3488 NULL); 3489 } 3490 } 3491 #endif 3492 if (ports != NULL) { 3493 no_link_check = 1; 3494 RTE_ETH_FOREACH_DEV(pt_id) { 3495 printf("\nStopping port %d...\n", pt_id); 3496 fflush(stdout); 3497 stop_port(pt_id); 3498 } 3499 RTE_ETH_FOREACH_DEV(pt_id) { 3500 printf("\nShutting down port %d...\n", pt_id); 3501 fflush(stdout); 3502 close_port(pt_id); 3503 } 3504 } 3505 3506 if (hot_plug) { 3507 ret = rte_dev_event_monitor_stop(); 3508 if (ret) { 3509 RTE_LOG(ERR, EAL, 3510 "fail to stop device event monitor."); 3511 return; 3512 } 3513 3514 ret = rte_dev_event_callback_unregister(NULL, 3515 dev_event_callback, NULL); 3516 if (ret < 0) { 3517 RTE_LOG(ERR, EAL, 3518 "fail to unregister device event callback.\n"); 3519 return; 3520 } 3521 3522 ret = rte_dev_hotplug_handle_disable(); 3523 if (ret) { 3524 RTE_LOG(ERR, EAL, 3525 "fail to disable hotplug handling.\n"); 3526 return; 3527 } 3528 } 3529 for (i = 0 ; i < RTE_DIM(mempools) ; i++) { 3530 if (mempools[i]) 3531 mempool_free_mp(mempools[i]); 3532 } 3533 free(xstats_display); 3534 3535 printf("\nBye...\n"); 3536 } 3537 3538 typedef void (*cmd_func_t)(void); 3539 struct pmd_test_command { 3540 const char *cmd_name; 3541 cmd_func_t cmd_func; 3542 }; 3543 3544 /* Check the link status of all ports in up to 9s, and print them finally */ 3545 static void 3546 check_all_ports_link_status(uint32_t port_mask) 3547 { 3548 #define CHECK_INTERVAL 100 /* 100ms */ 3549 #define MAX_CHECK_TIME 90 /* 9s (90 * 100ms) in total */ 3550 portid_t portid; 3551 uint8_t count, all_ports_up, print_flag = 0; 3552 struct rte_eth_link link; 3553 int ret; 3554 char link_status[RTE_ETH_LINK_MAX_STR_LEN]; 3555 3556 printf("Checking link statuses...\n"); 3557 fflush(stdout); 3558 for (count = 0; count <= MAX_CHECK_TIME; count++) { 3559 all_ports_up = 1; 3560 RTE_ETH_FOREACH_DEV(portid) { 3561 if ((port_mask & (1 << portid)) == 0) 3562 continue; 3563 memset(&link, 0, sizeof(link)); 3564 ret = rte_eth_link_get_nowait(portid, &link); 3565 if (ret < 0) { 3566 all_ports_up = 0; 3567 if (print_flag == 1) 3568 fprintf(stderr, 3569 "Port %u link get failed: %s\n", 3570 portid, rte_strerror(-ret)); 3571 continue; 3572 } 3573 /* print link status if flag set */ 3574 if (print_flag == 1) { 3575 rte_eth_link_to_str(link_status, 3576 sizeof(link_status), &link); 3577 printf("Port %d %s\n", portid, link_status); 3578 continue; 3579 } 3580 /* clear all_ports_up flag if any link down */ 3581 if (link.link_status == RTE_ETH_LINK_DOWN) { 3582 all_ports_up = 0; 3583 break; 3584 } 3585 } 3586 /* after finally printing all link status, get out */ 3587 if (print_flag == 1) 3588 break; 3589 3590 if (all_ports_up == 0) { 3591 fflush(stdout); 3592 rte_delay_ms(CHECK_INTERVAL); 3593 } 3594 3595 /* set the print_flag if all ports up or timeout */ 3596 if (all_ports_up == 1 || count == (MAX_CHECK_TIME - 1)) { 3597 print_flag = 1; 3598 } 3599 3600 if (lsc_interrupt) 3601 break; 3602 } 3603 } 3604 3605 static void 3606 rmv_port_callback(void *arg) 3607 { 3608 int need_to_start = 0; 3609 int org_no_link_check = no_link_check; 3610 portid_t port_id = (intptr_t)arg; 3611 struct rte_eth_dev_info dev_info; 3612 int ret; 3613 3614 RTE_ETH_VALID_PORTID_OR_RET(port_id); 3615 3616 if (!test_done && port_is_forwarding(port_id)) { 3617 need_to_start = 1; 3618 stop_packet_forwarding(); 3619 } 3620 no_link_check = 1; 3621 stop_port(port_id); 3622 no_link_check = org_no_link_check; 3623 3624 ret = eth_dev_info_get_print_err(port_id, &dev_info); 3625 if (ret != 0) 3626 TESTPMD_LOG(ERR, 3627 "Failed to get device info for port %d, not detaching\n", 3628 port_id); 3629 else { 3630 struct rte_device *device = dev_info.device; 3631 close_port(port_id); 3632 detach_device(device); /* might be already removed or have more ports */ 3633 } 3634 if (need_to_start) 3635 start_packet_forwarding(0); 3636 } 3637 3638 /* This function is used by the interrupt thread */ 3639 static int 3640 eth_event_callback(portid_t port_id, enum rte_eth_event_type type, void *param, 3641 void *ret_param) 3642 { 3643 RTE_SET_USED(param); 3644 RTE_SET_USED(ret_param); 3645 3646 if (type >= RTE_ETH_EVENT_MAX) { 3647 fprintf(stderr, 3648 "\nPort %" PRIu16 ": %s called upon invalid event %d\n", 3649 port_id, __func__, type); 3650 fflush(stderr); 3651 } else if (event_print_mask & (UINT32_C(1) << type)) { 3652 printf("\nPort %" PRIu16 ": %s event\n", port_id, 3653 eth_event_desc[type]); 3654 fflush(stdout); 3655 } 3656 3657 switch (type) { 3658 case RTE_ETH_EVENT_NEW: 3659 ports[port_id].need_setup = 1; 3660 ports[port_id].port_status = RTE_PORT_HANDLING; 3661 break; 3662 case RTE_ETH_EVENT_INTR_RMV: 3663 if (port_id_is_invalid(port_id, DISABLED_WARN)) 3664 break; 3665 if (rte_eal_alarm_set(100000, 3666 rmv_port_callback, (void *)(intptr_t)port_id)) 3667 fprintf(stderr, 3668 "Could not set up deferred device removal\n"); 3669 break; 3670 case RTE_ETH_EVENT_DESTROY: 3671 ports[port_id].port_status = RTE_PORT_CLOSED; 3672 printf("Port %u is closed\n", port_id); 3673 break; 3674 default: 3675 break; 3676 } 3677 return 0; 3678 } 3679 3680 static int 3681 register_eth_event_callback(void) 3682 { 3683 int ret; 3684 enum rte_eth_event_type event; 3685 3686 for (event = RTE_ETH_EVENT_UNKNOWN; 3687 event < RTE_ETH_EVENT_MAX; event++) { 3688 ret = rte_eth_dev_callback_register(RTE_ETH_ALL, 3689 event, 3690 eth_event_callback, 3691 NULL); 3692 if (ret != 0) { 3693 TESTPMD_LOG(ERR, "Failed to register callback for " 3694 "%s event\n", eth_event_desc[event]); 3695 return -1; 3696 } 3697 } 3698 3699 return 0; 3700 } 3701 3702 /* This function is used by the interrupt thread */ 3703 static void 3704 dev_event_callback(const char *device_name, enum rte_dev_event_type type, 3705 __rte_unused void *arg) 3706 { 3707 uint16_t port_id; 3708 int ret; 3709 3710 if (type >= RTE_DEV_EVENT_MAX) { 3711 fprintf(stderr, "%s called upon invalid event %d\n", 3712 __func__, type); 3713 fflush(stderr); 3714 } 3715 3716 switch (type) { 3717 case RTE_DEV_EVENT_REMOVE: 3718 RTE_LOG(DEBUG, EAL, "The device: %s has been removed!\n", 3719 device_name); 3720 ret = rte_eth_dev_get_port_by_name(device_name, &port_id); 3721 if (ret) { 3722 RTE_LOG(ERR, EAL, "can not get port by device %s!\n", 3723 device_name); 3724 return; 3725 } 3726 /* 3727 * Because the user's callback is invoked in eal interrupt 3728 * callback, the interrupt callback need to be finished before 3729 * it can be unregistered when detaching device. So finish 3730 * callback soon and use a deferred removal to detach device 3731 * is need. It is a workaround, once the device detaching be 3732 * moved into the eal in the future, the deferred removal could 3733 * be deleted. 3734 */ 3735 if (rte_eal_alarm_set(100000, 3736 rmv_port_callback, (void *)(intptr_t)port_id)) 3737 RTE_LOG(ERR, EAL, 3738 "Could not set up deferred device removal\n"); 3739 break; 3740 case RTE_DEV_EVENT_ADD: 3741 RTE_LOG(ERR, EAL, "The device: %s has been added!\n", 3742 device_name); 3743 /* TODO: After finish kernel driver binding, 3744 * begin to attach port. 3745 */ 3746 break; 3747 default: 3748 break; 3749 } 3750 } 3751 3752 static void 3753 rxtx_port_config(portid_t pid) 3754 { 3755 uint16_t qid; 3756 uint64_t offloads; 3757 struct rte_port *port = &ports[pid]; 3758 3759 for (qid = 0; qid < nb_rxq; qid++) { 3760 offloads = port->rxq[qid].conf.offloads; 3761 port->rxq[qid].conf = port->dev_info.default_rxconf; 3762 3763 if (rxq_share > 0 && 3764 (port->dev_info.dev_capa & RTE_ETH_DEV_CAPA_RXQ_SHARE)) { 3765 /* Non-zero share group to enable RxQ share. */ 3766 port->rxq[qid].conf.share_group = pid / rxq_share + 1; 3767 port->rxq[qid].conf.share_qid = qid; /* Equal mapping. */ 3768 } 3769 3770 if (offloads != 0) 3771 port->rxq[qid].conf.offloads = offloads; 3772 3773 /* Check if any Rx parameters have been passed */ 3774 if (rx_pthresh != RTE_PMD_PARAM_UNSET) 3775 port->rxq[qid].conf.rx_thresh.pthresh = rx_pthresh; 3776 3777 if (rx_hthresh != RTE_PMD_PARAM_UNSET) 3778 port->rxq[qid].conf.rx_thresh.hthresh = rx_hthresh; 3779 3780 if (rx_wthresh != RTE_PMD_PARAM_UNSET) 3781 port->rxq[qid].conf.rx_thresh.wthresh = rx_wthresh; 3782 3783 if (rx_free_thresh != RTE_PMD_PARAM_UNSET) 3784 port->rxq[qid].conf.rx_free_thresh = rx_free_thresh; 3785 3786 if (rx_drop_en != RTE_PMD_PARAM_UNSET) 3787 port->rxq[qid].conf.rx_drop_en = rx_drop_en; 3788 3789 port->nb_rx_desc[qid] = nb_rxd; 3790 } 3791 3792 for (qid = 0; qid < nb_txq; qid++) { 3793 offloads = port->txq[qid].conf.offloads; 3794 port->txq[qid].conf = port->dev_info.default_txconf; 3795 if (offloads != 0) 3796 port->txq[qid].conf.offloads = offloads; 3797 3798 /* Check if any Tx parameters have been passed */ 3799 if (tx_pthresh != RTE_PMD_PARAM_UNSET) 3800 port->txq[qid].conf.tx_thresh.pthresh = tx_pthresh; 3801 3802 if (tx_hthresh != RTE_PMD_PARAM_UNSET) 3803 port->txq[qid].conf.tx_thresh.hthresh = tx_hthresh; 3804 3805 if (tx_wthresh != RTE_PMD_PARAM_UNSET) 3806 port->txq[qid].conf.tx_thresh.wthresh = tx_wthresh; 3807 3808 if (tx_rs_thresh != RTE_PMD_PARAM_UNSET) 3809 port->txq[qid].conf.tx_rs_thresh = tx_rs_thresh; 3810 3811 if (tx_free_thresh != RTE_PMD_PARAM_UNSET) 3812 port->txq[qid].conf.tx_free_thresh = tx_free_thresh; 3813 3814 port->nb_tx_desc[qid] = nb_txd; 3815 } 3816 } 3817 3818 /* 3819 * Helper function to set MTU from frame size 3820 * 3821 * port->dev_info should be set before calling this function. 3822 * 3823 * return 0 on success, negative on error 3824 */ 3825 int 3826 update_mtu_from_frame_size(portid_t portid, uint32_t max_rx_pktlen) 3827 { 3828 struct rte_port *port = &ports[portid]; 3829 uint32_t eth_overhead; 3830 uint16_t mtu, new_mtu; 3831 3832 eth_overhead = get_eth_overhead(&port->dev_info); 3833 3834 if (rte_eth_dev_get_mtu(portid, &mtu) != 0) { 3835 printf("Failed to get MTU for port %u\n", portid); 3836 return -1; 3837 } 3838 3839 new_mtu = max_rx_pktlen - eth_overhead; 3840 3841 if (mtu == new_mtu) 3842 return 0; 3843 3844 if (eth_dev_set_mtu_mp(portid, new_mtu) != 0) { 3845 fprintf(stderr, 3846 "Failed to set MTU to %u for port %u\n", 3847 new_mtu, portid); 3848 return -1; 3849 } 3850 3851 port->dev_conf.rxmode.mtu = new_mtu; 3852 3853 return 0; 3854 } 3855 3856 void 3857 init_port_config(void) 3858 { 3859 portid_t pid; 3860 struct rte_port *port; 3861 int ret, i; 3862 3863 RTE_ETH_FOREACH_DEV(pid) { 3864 port = &ports[pid]; 3865 port->dev_conf.fdir_conf = fdir_conf; 3866 3867 ret = eth_dev_info_get_print_err(pid, &port->dev_info); 3868 if (ret != 0) 3869 return; 3870 3871 if (nb_rxq > 1) { 3872 port->dev_conf.rx_adv_conf.rss_conf.rss_key = NULL; 3873 port->dev_conf.rx_adv_conf.rss_conf.rss_hf = 3874 rss_hf & port->dev_info.flow_type_rss_offloads; 3875 } else { 3876 port->dev_conf.rx_adv_conf.rss_conf.rss_key = NULL; 3877 port->dev_conf.rx_adv_conf.rss_conf.rss_hf = 0; 3878 } 3879 3880 if (port->dcb_flag == 0) { 3881 if (port->dev_conf.rx_adv_conf.rss_conf.rss_hf != 0) { 3882 port->dev_conf.rxmode.mq_mode = 3883 (enum rte_eth_rx_mq_mode) 3884 (rx_mq_mode & RTE_ETH_MQ_RX_RSS); 3885 } else { 3886 port->dev_conf.rxmode.mq_mode = RTE_ETH_MQ_RX_NONE; 3887 port->dev_conf.rxmode.offloads &= 3888 ~RTE_ETH_RX_OFFLOAD_RSS_HASH; 3889 3890 for (i = 0; 3891 i < port->dev_info.nb_rx_queues; 3892 i++) 3893 port->rxq[i].conf.offloads &= 3894 ~RTE_ETH_RX_OFFLOAD_RSS_HASH; 3895 } 3896 } 3897 3898 rxtx_port_config(pid); 3899 3900 ret = eth_macaddr_get_print_err(pid, &port->eth_addr); 3901 if (ret != 0) 3902 return; 3903 3904 #if defined RTE_NET_IXGBE && defined RTE_LIBRTE_IXGBE_BYPASS 3905 rte_pmd_ixgbe_bypass_init(pid); 3906 #endif 3907 3908 if (lsc_interrupt && (*port->dev_info.dev_flags & RTE_ETH_DEV_INTR_LSC)) 3909 port->dev_conf.intr_conf.lsc = 1; 3910 if (rmv_interrupt && (*port->dev_info.dev_flags & RTE_ETH_DEV_INTR_RMV)) 3911 port->dev_conf.intr_conf.rmv = 1; 3912 } 3913 } 3914 3915 void set_port_slave_flag(portid_t slave_pid) 3916 { 3917 struct rte_port *port; 3918 3919 port = &ports[slave_pid]; 3920 port->slave_flag = 1; 3921 } 3922 3923 void clear_port_slave_flag(portid_t slave_pid) 3924 { 3925 struct rte_port *port; 3926 3927 port = &ports[slave_pid]; 3928 port->slave_flag = 0; 3929 } 3930 3931 uint8_t port_is_bonding_slave(portid_t slave_pid) 3932 { 3933 struct rte_port *port; 3934 struct rte_eth_dev_info dev_info; 3935 int ret; 3936 3937 port = &ports[slave_pid]; 3938 ret = eth_dev_info_get_print_err(slave_pid, &dev_info); 3939 if (ret != 0) { 3940 TESTPMD_LOG(ERR, 3941 "Failed to get device info for port id %d," 3942 "cannot determine if the port is a bonded slave", 3943 slave_pid); 3944 return 0; 3945 } 3946 if ((*dev_info.dev_flags & RTE_ETH_DEV_BONDED_SLAVE) || (port->slave_flag == 1)) 3947 return 1; 3948 return 0; 3949 } 3950 3951 const uint16_t vlan_tags[] = { 3952 0, 1, 2, 3, 4, 5, 6, 7, 3953 8, 9, 10, 11, 12, 13, 14, 15, 3954 16, 17, 18, 19, 20, 21, 22, 23, 3955 24, 25, 26, 27, 28, 29, 30, 31 3956 }; 3957 3958 static int 3959 get_eth_dcb_conf(portid_t pid, struct rte_eth_conf *eth_conf, 3960 enum dcb_mode_enable dcb_mode, 3961 enum rte_eth_nb_tcs num_tcs, 3962 uint8_t pfc_en) 3963 { 3964 uint8_t i; 3965 int32_t rc; 3966 struct rte_eth_rss_conf rss_conf; 3967 3968 /* 3969 * Builds up the correct configuration for dcb+vt based on the vlan tags array 3970 * given above, and the number of traffic classes available for use. 3971 */ 3972 if (dcb_mode == DCB_VT_ENABLED) { 3973 struct rte_eth_vmdq_dcb_conf *vmdq_rx_conf = 3974 ð_conf->rx_adv_conf.vmdq_dcb_conf; 3975 struct rte_eth_vmdq_dcb_tx_conf *vmdq_tx_conf = 3976 ð_conf->tx_adv_conf.vmdq_dcb_tx_conf; 3977 3978 /* VMDQ+DCB RX and TX configurations */ 3979 vmdq_rx_conf->enable_default_pool = 0; 3980 vmdq_rx_conf->default_pool = 0; 3981 vmdq_rx_conf->nb_queue_pools = 3982 (num_tcs == RTE_ETH_4_TCS ? RTE_ETH_32_POOLS : RTE_ETH_16_POOLS); 3983 vmdq_tx_conf->nb_queue_pools = 3984 (num_tcs == RTE_ETH_4_TCS ? RTE_ETH_32_POOLS : RTE_ETH_16_POOLS); 3985 3986 vmdq_rx_conf->nb_pool_maps = vmdq_rx_conf->nb_queue_pools; 3987 for (i = 0; i < vmdq_rx_conf->nb_pool_maps; i++) { 3988 vmdq_rx_conf->pool_map[i].vlan_id = vlan_tags[i]; 3989 vmdq_rx_conf->pool_map[i].pools = 3990 1 << (i % vmdq_rx_conf->nb_queue_pools); 3991 } 3992 for (i = 0; i < RTE_ETH_DCB_NUM_USER_PRIORITIES; i++) { 3993 vmdq_rx_conf->dcb_tc[i] = i % num_tcs; 3994 vmdq_tx_conf->dcb_tc[i] = i % num_tcs; 3995 } 3996 3997 /* set DCB mode of RX and TX of multiple queues */ 3998 eth_conf->rxmode.mq_mode = 3999 (enum rte_eth_rx_mq_mode) 4000 (rx_mq_mode & RTE_ETH_MQ_RX_VMDQ_DCB); 4001 eth_conf->txmode.mq_mode = RTE_ETH_MQ_TX_VMDQ_DCB; 4002 } else { 4003 struct rte_eth_dcb_rx_conf *rx_conf = 4004 ð_conf->rx_adv_conf.dcb_rx_conf; 4005 struct rte_eth_dcb_tx_conf *tx_conf = 4006 ð_conf->tx_adv_conf.dcb_tx_conf; 4007 4008 memset(&rss_conf, 0, sizeof(struct rte_eth_rss_conf)); 4009 4010 rc = rte_eth_dev_rss_hash_conf_get(pid, &rss_conf); 4011 if (rc != 0) 4012 return rc; 4013 4014 rx_conf->nb_tcs = num_tcs; 4015 tx_conf->nb_tcs = num_tcs; 4016 4017 for (i = 0; i < RTE_ETH_DCB_NUM_USER_PRIORITIES; i++) { 4018 rx_conf->dcb_tc[i] = i % num_tcs; 4019 tx_conf->dcb_tc[i] = i % num_tcs; 4020 } 4021 4022 eth_conf->rxmode.mq_mode = 4023 (enum rte_eth_rx_mq_mode) 4024 (rx_mq_mode & RTE_ETH_MQ_RX_DCB_RSS); 4025 eth_conf->rx_adv_conf.rss_conf = rss_conf; 4026 eth_conf->txmode.mq_mode = RTE_ETH_MQ_TX_DCB; 4027 } 4028 4029 if (pfc_en) 4030 eth_conf->dcb_capability_en = 4031 RTE_ETH_DCB_PG_SUPPORT | RTE_ETH_DCB_PFC_SUPPORT; 4032 else 4033 eth_conf->dcb_capability_en = RTE_ETH_DCB_PG_SUPPORT; 4034 4035 return 0; 4036 } 4037 4038 int 4039 init_port_dcb_config(portid_t pid, 4040 enum dcb_mode_enable dcb_mode, 4041 enum rte_eth_nb_tcs num_tcs, 4042 uint8_t pfc_en) 4043 { 4044 struct rte_eth_conf port_conf; 4045 struct rte_port *rte_port; 4046 int retval; 4047 uint16_t i; 4048 4049 if (num_procs > 1) { 4050 printf("The multi-process feature doesn't support dcb.\n"); 4051 return -ENOTSUP; 4052 } 4053 rte_port = &ports[pid]; 4054 4055 /* retain the original device configuration. */ 4056 memcpy(&port_conf, &rte_port->dev_conf, sizeof(struct rte_eth_conf)); 4057 4058 /*set configuration of DCB in vt mode and DCB in non-vt mode*/ 4059 retval = get_eth_dcb_conf(pid, &port_conf, dcb_mode, num_tcs, pfc_en); 4060 if (retval < 0) 4061 return retval; 4062 port_conf.rxmode.offloads |= RTE_ETH_RX_OFFLOAD_VLAN_FILTER; 4063 /* remove RSS HASH offload for DCB in vt mode */ 4064 if (port_conf.rxmode.mq_mode == RTE_ETH_MQ_RX_VMDQ_DCB) { 4065 port_conf.rxmode.offloads &= ~RTE_ETH_RX_OFFLOAD_RSS_HASH; 4066 for (i = 0; i < nb_rxq; i++) 4067 rte_port->rxq[i].conf.offloads &= 4068 ~RTE_ETH_RX_OFFLOAD_RSS_HASH; 4069 } 4070 4071 /* re-configure the device . */ 4072 retval = rte_eth_dev_configure(pid, nb_rxq, nb_rxq, &port_conf); 4073 if (retval < 0) 4074 return retval; 4075 4076 retval = eth_dev_info_get_print_err(pid, &rte_port->dev_info); 4077 if (retval != 0) 4078 return retval; 4079 4080 /* If dev_info.vmdq_pool_base is greater than 0, 4081 * the queue id of vmdq pools is started after pf queues. 4082 */ 4083 if (dcb_mode == DCB_VT_ENABLED && 4084 rte_port->dev_info.vmdq_pool_base > 0) { 4085 fprintf(stderr, 4086 "VMDQ_DCB multi-queue mode is nonsensical for port %d.\n", 4087 pid); 4088 return -1; 4089 } 4090 4091 /* Assume the ports in testpmd have the same dcb capability 4092 * and has the same number of rxq and txq in dcb mode 4093 */ 4094 if (dcb_mode == DCB_VT_ENABLED) { 4095 if (rte_port->dev_info.max_vfs > 0) { 4096 nb_rxq = rte_port->dev_info.nb_rx_queues; 4097 nb_txq = rte_port->dev_info.nb_tx_queues; 4098 } else { 4099 nb_rxq = rte_port->dev_info.max_rx_queues; 4100 nb_txq = rte_port->dev_info.max_tx_queues; 4101 } 4102 } else { 4103 /*if vt is disabled, use all pf queues */ 4104 if (rte_port->dev_info.vmdq_pool_base == 0) { 4105 nb_rxq = rte_port->dev_info.max_rx_queues; 4106 nb_txq = rte_port->dev_info.max_tx_queues; 4107 } else { 4108 nb_rxq = (queueid_t)num_tcs; 4109 nb_txq = (queueid_t)num_tcs; 4110 4111 } 4112 } 4113 rx_free_thresh = 64; 4114 4115 memcpy(&rte_port->dev_conf, &port_conf, sizeof(struct rte_eth_conf)); 4116 4117 rxtx_port_config(pid); 4118 /* VLAN filter */ 4119 rte_port->dev_conf.rxmode.offloads |= RTE_ETH_RX_OFFLOAD_VLAN_FILTER; 4120 for (i = 0; i < RTE_DIM(vlan_tags); i++) 4121 rx_vft_set(pid, vlan_tags[i], 1); 4122 4123 retval = eth_macaddr_get_print_err(pid, &rte_port->eth_addr); 4124 if (retval != 0) 4125 return retval; 4126 4127 rte_port->dcb_flag = 1; 4128 4129 /* Enter DCB configuration status */ 4130 dcb_config = 1; 4131 4132 return 0; 4133 } 4134 4135 static void 4136 init_port(void) 4137 { 4138 int i; 4139 4140 /* Configuration of Ethernet ports. */ 4141 ports = rte_zmalloc("testpmd: ports", 4142 sizeof(struct rte_port) * RTE_MAX_ETHPORTS, 4143 RTE_CACHE_LINE_SIZE); 4144 if (ports == NULL) { 4145 rte_exit(EXIT_FAILURE, 4146 "rte_zmalloc(%d struct rte_port) failed\n", 4147 RTE_MAX_ETHPORTS); 4148 } 4149 for (i = 0; i < RTE_MAX_ETHPORTS; i++) 4150 ports[i].xstats_info.allocated = false; 4151 for (i = 0; i < RTE_MAX_ETHPORTS; i++) 4152 LIST_INIT(&ports[i].flow_tunnel_list); 4153 /* Initialize ports NUMA structures */ 4154 memset(port_numa, NUMA_NO_CONFIG, RTE_MAX_ETHPORTS); 4155 memset(rxring_numa, NUMA_NO_CONFIG, RTE_MAX_ETHPORTS); 4156 memset(txring_numa, NUMA_NO_CONFIG, RTE_MAX_ETHPORTS); 4157 } 4158 4159 static void 4160 force_quit(void) 4161 { 4162 pmd_test_exit(); 4163 prompt_exit(); 4164 } 4165 4166 static void 4167 print_stats(void) 4168 { 4169 uint8_t i; 4170 const char clr[] = { 27, '[', '2', 'J', '\0' }; 4171 const char top_left[] = { 27, '[', '1', ';', '1', 'H', '\0' }; 4172 4173 /* Clear screen and move to top left */ 4174 printf("%s%s", clr, top_left); 4175 4176 printf("\nPort statistics ===================================="); 4177 for (i = 0; i < cur_fwd_config.nb_fwd_ports; i++) 4178 nic_stats_display(fwd_ports_ids[i]); 4179 4180 fflush(stdout); 4181 } 4182 4183 static void 4184 signal_handler(int signum) 4185 { 4186 if (signum == SIGINT || signum == SIGTERM) { 4187 fprintf(stderr, "\nSignal %d received, preparing to exit...\n", 4188 signum); 4189 #ifdef RTE_LIB_PDUMP 4190 /* uninitialize packet capture framework */ 4191 rte_pdump_uninit(); 4192 #endif 4193 #ifdef RTE_LIB_LATENCYSTATS 4194 if (latencystats_enabled != 0) 4195 rte_latencystats_uninit(); 4196 #endif 4197 force_quit(); 4198 /* Set flag to indicate the force termination. */ 4199 f_quit = 1; 4200 /* exit with the expected status */ 4201 #ifndef RTE_EXEC_ENV_WINDOWS 4202 signal(signum, SIG_DFL); 4203 kill(getpid(), signum); 4204 #endif 4205 } 4206 } 4207 4208 int 4209 main(int argc, char** argv) 4210 { 4211 int diag; 4212 portid_t port_id; 4213 uint16_t count; 4214 int ret; 4215 4216 signal(SIGINT, signal_handler); 4217 signal(SIGTERM, signal_handler); 4218 4219 testpmd_logtype = rte_log_register("testpmd"); 4220 if (testpmd_logtype < 0) 4221 rte_exit(EXIT_FAILURE, "Cannot register log type"); 4222 rte_log_set_level(testpmd_logtype, RTE_LOG_DEBUG); 4223 4224 diag = rte_eal_init(argc, argv); 4225 if (diag < 0) 4226 rte_exit(EXIT_FAILURE, "Cannot init EAL: %s\n", 4227 rte_strerror(rte_errno)); 4228 4229 ret = register_eth_event_callback(); 4230 if (ret != 0) 4231 rte_exit(EXIT_FAILURE, "Cannot register for ethdev events"); 4232 4233 #ifdef RTE_LIB_PDUMP 4234 /* initialize packet capture framework */ 4235 rte_pdump_init(); 4236 #endif 4237 4238 count = 0; 4239 RTE_ETH_FOREACH_DEV(port_id) { 4240 ports_ids[count] = port_id; 4241 count++; 4242 } 4243 nb_ports = (portid_t) count; 4244 if (nb_ports == 0) 4245 TESTPMD_LOG(WARNING, "No probed ethernet devices\n"); 4246 4247 /* allocate port structures, and init them */ 4248 init_port(); 4249 4250 set_def_fwd_config(); 4251 if (nb_lcores == 0) 4252 rte_exit(EXIT_FAILURE, "No cores defined for forwarding\n" 4253 "Check the core mask argument\n"); 4254 4255 /* Bitrate/latency stats disabled by default */ 4256 #ifdef RTE_LIB_BITRATESTATS 4257 bitrate_enabled = 0; 4258 #endif 4259 #ifdef RTE_LIB_LATENCYSTATS 4260 latencystats_enabled = 0; 4261 #endif 4262 4263 /* on FreeBSD, mlockall() is disabled by default */ 4264 #ifdef RTE_EXEC_ENV_FREEBSD 4265 do_mlockall = 0; 4266 #else 4267 do_mlockall = 1; 4268 #endif 4269 4270 argc -= diag; 4271 argv += diag; 4272 if (argc > 1) 4273 launch_args_parse(argc, argv); 4274 4275 #ifndef RTE_EXEC_ENV_WINDOWS 4276 if (do_mlockall && mlockall(MCL_CURRENT | MCL_FUTURE)) { 4277 TESTPMD_LOG(NOTICE, "mlockall() failed with error \"%s\"\n", 4278 strerror(errno)); 4279 } 4280 #endif 4281 4282 if (tx_first && interactive) 4283 rte_exit(EXIT_FAILURE, "--tx-first cannot be used on " 4284 "interactive mode.\n"); 4285 4286 if (tx_first && lsc_interrupt) { 4287 fprintf(stderr, 4288 "Warning: lsc_interrupt needs to be off when using tx_first. Disabling.\n"); 4289 lsc_interrupt = 0; 4290 } 4291 4292 if (!nb_rxq && !nb_txq) 4293 fprintf(stderr, 4294 "Warning: Either rx or tx queues should be non-zero\n"); 4295 4296 if (nb_rxq > 1 && nb_rxq > nb_txq) 4297 fprintf(stderr, 4298 "Warning: nb_rxq=%d enables RSS configuration, but nb_txq=%d will prevent to fully test it.\n", 4299 nb_rxq, nb_txq); 4300 4301 init_config(); 4302 4303 if (hot_plug) { 4304 ret = rte_dev_hotplug_handle_enable(); 4305 if (ret) { 4306 RTE_LOG(ERR, EAL, 4307 "fail to enable hotplug handling."); 4308 return -1; 4309 } 4310 4311 ret = rte_dev_event_monitor_start(); 4312 if (ret) { 4313 RTE_LOG(ERR, EAL, 4314 "fail to start device event monitoring."); 4315 return -1; 4316 } 4317 4318 ret = rte_dev_event_callback_register(NULL, 4319 dev_event_callback, NULL); 4320 if (ret) { 4321 RTE_LOG(ERR, EAL, 4322 "fail to register device event callback\n"); 4323 return -1; 4324 } 4325 } 4326 4327 if (!no_device_start && start_port(RTE_PORT_ALL) != 0) 4328 rte_exit(EXIT_FAILURE, "Start ports failed\n"); 4329 4330 /* set all ports to promiscuous mode by default */ 4331 RTE_ETH_FOREACH_DEV(port_id) { 4332 ret = rte_eth_promiscuous_enable(port_id); 4333 if (ret != 0) 4334 fprintf(stderr, 4335 "Error during enabling promiscuous mode for port %u: %s - ignore\n", 4336 port_id, rte_strerror(-ret)); 4337 } 4338 4339 #ifdef RTE_LIB_METRICS 4340 /* Init metrics library */ 4341 rte_metrics_init(rte_socket_id()); 4342 #endif 4343 4344 #ifdef RTE_LIB_LATENCYSTATS 4345 if (latencystats_enabled != 0) { 4346 int ret = rte_latencystats_init(1, NULL); 4347 if (ret) 4348 fprintf(stderr, 4349 "Warning: latencystats init() returned error %d\n", 4350 ret); 4351 fprintf(stderr, "Latencystats running on lcore %d\n", 4352 latencystats_lcore_id); 4353 } 4354 #endif 4355 4356 /* Setup bitrate stats */ 4357 #ifdef RTE_LIB_BITRATESTATS 4358 if (bitrate_enabled != 0) { 4359 bitrate_data = rte_stats_bitrate_create(); 4360 if (bitrate_data == NULL) 4361 rte_exit(EXIT_FAILURE, 4362 "Could not allocate bitrate data.\n"); 4363 rte_stats_bitrate_reg(bitrate_data); 4364 } 4365 #endif 4366 #ifdef RTE_LIB_CMDLINE 4367 if (init_cmdline() != 0) 4368 rte_exit(EXIT_FAILURE, 4369 "Could not initialise cmdline context.\n"); 4370 4371 if (strlen(cmdline_filename) != 0) 4372 cmdline_read_from_file(cmdline_filename); 4373 4374 if (interactive == 1) { 4375 if (auto_start) { 4376 printf("Start automatic packet forwarding\n"); 4377 start_packet_forwarding(0); 4378 } 4379 prompt(); 4380 pmd_test_exit(); 4381 } else 4382 #endif 4383 { 4384 char c; 4385 int rc; 4386 4387 f_quit = 0; 4388 4389 printf("No commandline core given, start packet forwarding\n"); 4390 start_packet_forwarding(tx_first); 4391 if (stats_period != 0) { 4392 uint64_t prev_time = 0, cur_time, diff_time = 0; 4393 uint64_t timer_period; 4394 4395 /* Convert to number of cycles */ 4396 timer_period = stats_period * rte_get_timer_hz(); 4397 4398 while (f_quit == 0) { 4399 cur_time = rte_get_timer_cycles(); 4400 diff_time += cur_time - prev_time; 4401 4402 if (diff_time >= timer_period) { 4403 print_stats(); 4404 /* Reset the timer */ 4405 diff_time = 0; 4406 } 4407 /* Sleep to avoid unnecessary checks */ 4408 prev_time = cur_time; 4409 rte_delay_us_sleep(US_PER_S); 4410 } 4411 } 4412 4413 printf("Press enter to exit\n"); 4414 rc = read(0, &c, 1); 4415 pmd_test_exit(); 4416 if (rc < 0) 4417 return 1; 4418 } 4419 4420 ret = rte_eal_cleanup(); 4421 if (ret != 0) 4422 rte_exit(EXIT_FAILURE, 4423 "EAL cleanup failed: %s\n", strerror(-ret)); 4424 4425 return EXIT_SUCCESS; 4426 } 4427