xref: /dpdk/lib/ethdev/rte_ethdev.h (revision 877cb3e374261ad57116c7d8c05fae1eb53f0e13)
1 /* SPDX-License-Identifier: BSD-3-Clause
2  * Copyright(c) 2010-2017 Intel Corporation
3  */
4 
5 #ifndef _RTE_ETHDEV_H_
6 #define _RTE_ETHDEV_H_
7 
8 /**
9  * @file
10  *
11  * RTE Ethernet Device API
12  *
13  * The Ethernet Device API is composed of two parts:
14  *
15  * - The application-oriented Ethernet API that includes functions to setup
16  *   an Ethernet device (configure it, setup its Rx and Tx queues and start it),
17  *   to get its MAC address, the speed and the status of its physical link,
18  *   to receive and to transmit packets, and so on.
19  *
20  * - The driver-oriented Ethernet API that exports functions allowing
21  *   an Ethernet Poll Mode Driver (PMD) to allocate an Ethernet device instance,
22  *   create memzone for HW rings and process registered callbacks, and so on.
23  *   PMDs should include ethdev_driver.h instead of this header.
24  *
25  * By default, all the functions of the Ethernet Device API exported by a PMD
26  * are lock-free functions which assume to not be invoked in parallel on
27  * different logical cores to work on the same target object.  For instance,
28  * the receive function of a PMD cannot be invoked in parallel on two logical
29  * cores to poll the same Rx queue [of the same port]. Of course, this function
30  * can be invoked in parallel by different logical cores on different Rx queues.
31  * It is the responsibility of the upper level application to enforce this rule.
32  *
33  * If needed, parallel accesses by multiple logical cores to shared queues
34  * shall be explicitly protected by dedicated inline lock-aware functions
35  * built on top of their corresponding lock-free functions of the PMD API.
36  *
37  * In all functions of the Ethernet API, the Ethernet device is
38  * designated by an integer >= 0 named the device port identifier.
39  *
40  * At the Ethernet driver level, Ethernet devices are represented by a generic
41  * data structure of type *rte_eth_dev*.
42  *
43  * Ethernet devices are dynamically registered during the PCI probing phase
44  * performed at EAL initialization time.
45  * When an Ethernet device is being probed, an *rte_eth_dev* structure and
46  * a new port identifier are allocated for that device. Then, the eth_dev_init()
47  * function supplied by the Ethernet driver matching the probed PCI
48  * device is invoked to properly initialize the device.
49  *
50  * The role of the device init function consists of resetting the hardware,
51  * checking access to Non-volatile Memory (NVM), reading the MAC address
52  * from NVM etc.
53  *
54  * If the device init operation is successful, the correspondence between
55  * the port identifier assigned to the new device and its associated
56  * *rte_eth_dev* structure is effectively registered.
57  * Otherwise, both the *rte_eth_dev* structure and the port identifier are
58  * freed.
59  *
60  * The functions exported by the application Ethernet API to setup a device
61  * designated by its port identifier must be invoked in the following order:
62  *     - rte_eth_dev_configure()
63  *     - rte_eth_tx_queue_setup()
64  *     - rte_eth_rx_queue_setup()
65  *     - rte_eth_dev_start()
66  *
67  * Then, the network application can invoke, in any order, the functions
68  * exported by the Ethernet API to get the MAC address of a given device, to
69  * get the speed and the status of a device physical link, to receive/transmit
70  * [burst of] packets, and so on.
71  *
72  * If the application wants to change the configuration (i.e. call
73  * rte_eth_dev_configure(), rte_eth_tx_queue_setup(), or
74  * rte_eth_rx_queue_setup()), it must call rte_eth_dev_stop() first to stop the
75  * device and then do the reconfiguration before calling rte_eth_dev_start()
76  * again. The transmit and receive functions should not be invoked when the
77  * device or the queue is stopped.
78  *
79  * Please note that some configuration is not stored between calls to
80  * rte_eth_dev_stop()/rte_eth_dev_start(). The following configuration will
81  * be retained:
82  *
83  *     - MTU
84  *     - flow control settings
85  *     - receive mode configuration (promiscuous mode, all-multicast mode,
86  *       hardware checksum mode, RSS/VMDq settings etc.)
87  *     - VLAN filtering configuration
88  *     - default MAC address
89  *     - MAC addresses supplied to MAC address array
90  *     - flow director filtering mode (but not filtering rules)
91  *     - NIC queue statistics mappings
92  *
93  * The following configuration may be retained or not
94  * depending on the device capabilities:
95  *
96  *     - flow rules
97  *     - flow-related shared objects, e.g. indirect actions
98  *
99  * Any other configuration will not be stored and will need to be re-entered
100  * before a call to rte_eth_dev_start().
101  *
102  * Finally, a network application can close an Ethernet device by invoking the
103  * rte_eth_dev_close() function.
104  *
105  * Each function of the application Ethernet API invokes a specific function
106  * of the PMD that controls the target device designated by its port
107  * identifier.
108  * For this purpose, all device-specific functions of an Ethernet driver are
109  * supplied through a set of pointers contained in a generic structure of type
110  * *eth_dev_ops*.
111  * The address of the *eth_dev_ops* structure is stored in the *rte_eth_dev*
112  * structure by the device init function of the Ethernet driver, which is
113  * invoked during the PCI probing phase, as explained earlier.
114  *
115  * In other words, each function of the Ethernet API simply retrieves the
116  * *rte_eth_dev* structure associated with the device port identifier and
117  * performs an indirect invocation of the corresponding driver function
118  * supplied in the *eth_dev_ops* structure of the *rte_eth_dev* structure.
119  *
120  * For performance reasons, the address of the burst-oriented Rx and Tx
121  * functions of the Ethernet driver are not contained in the *eth_dev_ops*
122  * structure. Instead, they are directly stored at the beginning of the
123  * *rte_eth_dev* structure to avoid an extra indirect memory access during
124  * their invocation.
125  *
126  * RTE Ethernet device drivers do not use interrupts for transmitting or
127  * receiving. Instead, Ethernet drivers export Poll-Mode receive and transmit
128  * functions to applications.
129  * Both receive and transmit functions are packet-burst oriented to minimize
130  * their cost per packet through the following optimizations:
131  *
132  * - Sharing among multiple packets the incompressible cost of the
133  *   invocation of receive/transmit functions.
134  *
135  * - Enabling receive/transmit functions to take advantage of burst-oriented
136  *   hardware features (L1 cache, prefetch instructions, NIC head/tail
137  *   registers) to minimize the number of CPU cycles per packet, for instance,
138  *   by avoiding useless read memory accesses to ring descriptors, or by
139  *   systematically using arrays of pointers that exactly fit L1 cache line
140  *   boundaries and sizes.
141  *
142  * The burst-oriented receive function does not provide any error notification,
143  * to avoid the corresponding overhead. As a hint, the upper-level application
144  * might check the status of the device link once being systematically returned
145  * a 0 value by the receive function of the driver for a given number of tries.
146  */
147 
148 #ifdef __cplusplus
149 extern "C" {
150 #endif
151 
152 #include <stdint.h>
153 
154 /* Use this macro to check if LRO API is supported */
155 #define RTE_ETHDEV_HAS_LRO_SUPPORT
156 
157 /* Alias RTE_LIBRTE_ETHDEV_DEBUG for backward compatibility. */
158 #ifdef RTE_LIBRTE_ETHDEV_DEBUG
159 #define RTE_ETHDEV_DEBUG_RX
160 #define RTE_ETHDEV_DEBUG_TX
161 #endif
162 
163 #include <rte_cman.h>
164 #include <rte_compat.h>
165 #include <rte_log.h>
166 #include <rte_interrupts.h>
167 #include <rte_dev.h>
168 #include <rte_devargs.h>
169 #include <rte_bitops.h>
170 #include <rte_errno.h>
171 #include <rte_common.h>
172 #include <rte_config.h>
173 #include <rte_power_intrinsics.h>
174 
175 #include "rte_ethdev_trace_fp.h"
176 #include "rte_dev_info.h"
177 
178 extern int rte_eth_dev_logtype;
179 
180 #define RTE_ETHDEV_LOG(level, ...) \
181 	rte_log(RTE_LOG_ ## level, rte_eth_dev_logtype, "" __VA_ARGS__)
182 
183 struct rte_mbuf;
184 
185 /**
186  * Initializes a device iterator.
187  *
188  * This iterator allows accessing a list of devices matching some devargs.
189  *
190  * @param iter
191  *   Device iterator handle initialized by the function.
192  *   The fields bus_str and cls_str might be dynamically allocated,
193  *   and could be freed by calling rte_eth_iterator_cleanup().
194  *
195  * @param devargs
196  *   Device description string.
197  *
198  * @return
199  *   0 on successful initialization, negative otherwise.
200  */
201 int rte_eth_iterator_init(struct rte_dev_iterator *iter, const char *devargs);
202 
203 /**
204  * Iterates on devices with devargs filter.
205  * The ownership is not checked.
206  *
207  * The next port ID is returned, and the iterator is updated.
208  *
209  * @param iter
210  *   Device iterator handle initialized by rte_eth_iterator_init().
211  *   Some fields bus_str and cls_str might be freed when no more port is found,
212  *   by calling rte_eth_iterator_cleanup().
213  *
214  * @return
215  *   A port ID if found, RTE_MAX_ETHPORTS otherwise.
216  */
217 uint16_t rte_eth_iterator_next(struct rte_dev_iterator *iter);
218 
219 /**
220  * Free some allocated fields of the iterator.
221  *
222  * This function is automatically called by rte_eth_iterator_next()
223  * on the last iteration (i.e. when no more matching port is found).
224  *
225  * It is safe to call this function twice; it will do nothing more.
226  *
227  * @param iter
228  *   Device iterator handle initialized by rte_eth_iterator_init().
229  *   The fields bus_str and cls_str are freed if needed.
230  */
231 void rte_eth_iterator_cleanup(struct rte_dev_iterator *iter);
232 
233 /**
234  * Macro to iterate over all ethdev ports matching some devargs.
235  *
236  * If a break is done before the end of the loop,
237  * the function rte_eth_iterator_cleanup() must be called.
238  *
239  * @param id
240  *   Iterated port ID of type uint16_t.
241  * @param devargs
242  *   Device parameters input as string of type char*.
243  * @param iter
244  *   Iterator handle of type struct rte_dev_iterator, used internally.
245  */
246 #define RTE_ETH_FOREACH_MATCHING_DEV(id, devargs, iter) \
247 	for (rte_eth_iterator_init(iter, devargs), \
248 	     id = rte_eth_iterator_next(iter); \
249 	     id != RTE_MAX_ETHPORTS; \
250 	     id = rte_eth_iterator_next(iter))
251 
252 /**
253  * A structure used to retrieve statistics for an Ethernet port.
254  * Not all statistics fields in struct rte_eth_stats are supported
255  * by any type of network interface card (NIC). If any statistics
256  * field is not supported, its value is 0.
257  * All byte-related statistics do not include Ethernet FCS regardless
258  * of whether these bytes have been delivered to the application
259  * (see RTE_ETH_RX_OFFLOAD_KEEP_CRC).
260  */
261 struct rte_eth_stats {
262 	uint64_t ipackets;  /**< Total number of successfully received packets. */
263 	uint64_t opackets;  /**< Total number of successfully transmitted packets.*/
264 	uint64_t ibytes;    /**< Total number of successfully received bytes. */
265 	uint64_t obytes;    /**< Total number of successfully transmitted bytes. */
266 	/**
267 	 * Total of Rx packets dropped by the HW,
268 	 * because there are no available buffer (i.e. Rx queues are full).
269 	 */
270 	uint64_t imissed;
271 	uint64_t ierrors;   /**< Total number of erroneous received packets. */
272 	uint64_t oerrors;   /**< Total number of failed transmitted packets. */
273 	uint64_t rx_nombuf; /**< Total number of Rx mbuf allocation failures. */
274 	/* Queue stats are limited to max 256 queues */
275 	/** Total number of queue Rx packets. */
276 	uint64_t q_ipackets[RTE_ETHDEV_QUEUE_STAT_CNTRS];
277 	/** Total number of queue Tx packets. */
278 	uint64_t q_opackets[RTE_ETHDEV_QUEUE_STAT_CNTRS];
279 	/** Total number of successfully received queue bytes. */
280 	uint64_t q_ibytes[RTE_ETHDEV_QUEUE_STAT_CNTRS];
281 	/** Total number of successfully transmitted queue bytes. */
282 	uint64_t q_obytes[RTE_ETHDEV_QUEUE_STAT_CNTRS];
283 	/** Total number of queue packets received that are dropped. */
284 	uint64_t q_errors[RTE_ETHDEV_QUEUE_STAT_CNTRS];
285 };
286 
287 /**@{@name Link speed capabilities
288  * Device supported speeds bitmap flags
289  */
290 #define RTE_ETH_LINK_SPEED_AUTONEG 0             /**< Autonegotiate (all speeds) */
291 #define RTE_ETH_LINK_SPEED_FIXED   RTE_BIT32(0)  /**< Disable autoneg (fixed speed) */
292 #define RTE_ETH_LINK_SPEED_10M_HD  RTE_BIT32(1)  /**<  10 Mbps half-duplex */
293 #define RTE_ETH_LINK_SPEED_10M     RTE_BIT32(2)  /**<  10 Mbps full-duplex */
294 #define RTE_ETH_LINK_SPEED_100M_HD RTE_BIT32(3)  /**< 100 Mbps half-duplex */
295 #define RTE_ETH_LINK_SPEED_100M    RTE_BIT32(4)  /**< 100 Mbps full-duplex */
296 #define RTE_ETH_LINK_SPEED_1G      RTE_BIT32(5)  /**<   1 Gbps */
297 #define RTE_ETH_LINK_SPEED_2_5G    RTE_BIT32(6)  /**< 2.5 Gbps */
298 #define RTE_ETH_LINK_SPEED_5G      RTE_BIT32(7)  /**<   5 Gbps */
299 #define RTE_ETH_LINK_SPEED_10G     RTE_BIT32(8)  /**<  10 Gbps */
300 #define RTE_ETH_LINK_SPEED_20G     RTE_BIT32(9)  /**<  20 Gbps */
301 #define RTE_ETH_LINK_SPEED_25G     RTE_BIT32(10) /**<  25 Gbps */
302 #define RTE_ETH_LINK_SPEED_40G     RTE_BIT32(11) /**<  40 Gbps */
303 #define RTE_ETH_LINK_SPEED_50G     RTE_BIT32(12) /**<  50 Gbps */
304 #define RTE_ETH_LINK_SPEED_56G     RTE_BIT32(13) /**<  56 Gbps */
305 #define RTE_ETH_LINK_SPEED_100G    RTE_BIT32(14) /**< 100 Gbps */
306 #define RTE_ETH_LINK_SPEED_200G    RTE_BIT32(15) /**< 200 Gbps */
307 #define RTE_ETH_LINK_SPEED_400G    RTE_BIT32(16) /**< 400 Gbps */
308 /**@}*/
309 
310 /**@{@name Link speed
311  * Ethernet numeric link speeds in Mbps
312  */
313 #define RTE_ETH_SPEED_NUM_NONE         0 /**< Not defined */
314 #define RTE_ETH_SPEED_NUM_10M         10 /**<  10 Mbps */
315 #define RTE_ETH_SPEED_NUM_100M       100 /**< 100 Mbps */
316 #define RTE_ETH_SPEED_NUM_1G        1000 /**<   1 Gbps */
317 #define RTE_ETH_SPEED_NUM_2_5G      2500 /**< 2.5 Gbps */
318 #define RTE_ETH_SPEED_NUM_5G        5000 /**<   5 Gbps */
319 #define RTE_ETH_SPEED_NUM_10G      10000 /**<  10 Gbps */
320 #define RTE_ETH_SPEED_NUM_20G      20000 /**<  20 Gbps */
321 #define RTE_ETH_SPEED_NUM_25G      25000 /**<  25 Gbps */
322 #define RTE_ETH_SPEED_NUM_40G      40000 /**<  40 Gbps */
323 #define RTE_ETH_SPEED_NUM_50G      50000 /**<  50 Gbps */
324 #define RTE_ETH_SPEED_NUM_56G      56000 /**<  56 Gbps */
325 #define RTE_ETH_SPEED_NUM_100G    100000 /**< 100 Gbps */
326 #define RTE_ETH_SPEED_NUM_200G    200000 /**< 200 Gbps */
327 #define RTE_ETH_SPEED_NUM_400G    400000 /**< 400 Gbps */
328 #define RTE_ETH_SPEED_NUM_UNKNOWN UINT32_MAX /**< Unknown */
329 /**@}*/
330 
331 /**
332  * A structure used to retrieve link-level information of an Ethernet port.
333  */
334 __extension__
335 struct rte_eth_link {
336 	uint32_t link_speed;        /**< RTE_ETH_SPEED_NUM_ */
337 	uint16_t link_duplex  : 1;  /**< RTE_ETH_LINK_[HALF/FULL]_DUPLEX */
338 	uint16_t link_autoneg : 1;  /**< RTE_ETH_LINK_[AUTONEG/FIXED] */
339 	uint16_t link_status  : 1;  /**< RTE_ETH_LINK_[DOWN/UP] */
340 } __rte_aligned(8);      /**< aligned for atomic64 read/write */
341 
342 /**@{@name Link negotiation
343  * Constants used in link management.
344  */
345 #define RTE_ETH_LINK_HALF_DUPLEX 0 /**< Half-duplex connection (see link_duplex). */
346 #define RTE_ETH_LINK_FULL_DUPLEX 1 /**< Full-duplex connection (see link_duplex). */
347 #define RTE_ETH_LINK_DOWN        0 /**< Link is down (see link_status). */
348 #define RTE_ETH_LINK_UP          1 /**< Link is up (see link_status). */
349 #define RTE_ETH_LINK_FIXED       0 /**< No autonegotiation (see link_autoneg). */
350 #define RTE_ETH_LINK_AUTONEG     1 /**< Autonegotiated (see link_autoneg). */
351 #define RTE_ETH_LINK_MAX_STR_LEN 40 /**< Max length of default link string. */
352 /**@}*/
353 
354 /**
355  * A structure used to configure the ring threshold registers of an Rx/Tx
356  * queue for an Ethernet port.
357  */
358 struct rte_eth_thresh {
359 	uint8_t pthresh; /**< Ring prefetch threshold. */
360 	uint8_t hthresh; /**< Ring host threshold. */
361 	uint8_t wthresh; /**< Ring writeback threshold. */
362 };
363 
364 /**@{@name Multi-queue mode
365  * @see rte_eth_conf.rxmode.mq_mode.
366  */
367 #define RTE_ETH_MQ_RX_RSS_FLAG  RTE_BIT32(0) /**< Enable RSS. @see rte_eth_rss_conf */
368 #define RTE_ETH_MQ_RX_DCB_FLAG  RTE_BIT32(1) /**< Enable DCB. */
369 #define RTE_ETH_MQ_RX_VMDQ_FLAG RTE_BIT32(2) /**< Enable VMDq. */
370 /**@}*/
371 
372 /**
373  *  A set of values to identify what method is to be used to route
374  *  packets to multiple queues.
375  */
376 enum rte_eth_rx_mq_mode {
377 	/** None of DCB, RSS or VMDq mode */
378 	RTE_ETH_MQ_RX_NONE = 0,
379 
380 	/** For Rx side, only RSS is on */
381 	RTE_ETH_MQ_RX_RSS = RTE_ETH_MQ_RX_RSS_FLAG,
382 	/** For Rx side,only DCB is on. */
383 	RTE_ETH_MQ_RX_DCB = RTE_ETH_MQ_RX_DCB_FLAG,
384 	/** Both DCB and RSS enable */
385 	RTE_ETH_MQ_RX_DCB_RSS = RTE_ETH_MQ_RX_RSS_FLAG | RTE_ETH_MQ_RX_DCB_FLAG,
386 
387 	/** Only VMDq, no RSS nor DCB */
388 	RTE_ETH_MQ_RX_VMDQ_ONLY = RTE_ETH_MQ_RX_VMDQ_FLAG,
389 	/** RSS mode with VMDq */
390 	RTE_ETH_MQ_RX_VMDQ_RSS = RTE_ETH_MQ_RX_RSS_FLAG | RTE_ETH_MQ_RX_VMDQ_FLAG,
391 	/** Use VMDq+DCB to route traffic to queues */
392 	RTE_ETH_MQ_RX_VMDQ_DCB = RTE_ETH_MQ_RX_VMDQ_FLAG | RTE_ETH_MQ_RX_DCB_FLAG,
393 	/** Enable both VMDq and DCB in VMDq */
394 	RTE_ETH_MQ_RX_VMDQ_DCB_RSS = RTE_ETH_MQ_RX_RSS_FLAG | RTE_ETH_MQ_RX_DCB_FLAG |
395 				 RTE_ETH_MQ_RX_VMDQ_FLAG,
396 };
397 
398 /**
399  * A set of values to identify what method is to be used to transmit
400  * packets using multi-TCs.
401  */
402 enum rte_eth_tx_mq_mode {
403 	RTE_ETH_MQ_TX_NONE    = 0,  /**< It is in neither DCB nor VT mode. */
404 	RTE_ETH_MQ_TX_DCB,          /**< For Tx side,only DCB is on. */
405 	RTE_ETH_MQ_TX_VMDQ_DCB,     /**< For Tx side,both DCB and VT is on. */
406 	RTE_ETH_MQ_TX_VMDQ_ONLY,    /**< Only VT on, no DCB */
407 };
408 
409 /**
410  * A structure used to configure the Rx features of an Ethernet port.
411  */
412 struct rte_eth_rxmode {
413 	/** The multi-queue packet distribution mode to be used, e.g. RSS. */
414 	enum rte_eth_rx_mq_mode mq_mode;
415 	uint32_t mtu;  /**< Requested MTU. */
416 	/** Maximum allowed size of LRO aggregated packet. */
417 	uint32_t max_lro_pkt_size;
418 	/**
419 	 * Per-port Rx offloads to be set using RTE_ETH_RX_OFFLOAD_* flags.
420 	 * Only offloads set on rx_offload_capa field on rte_eth_dev_info
421 	 * structure are allowed to be set.
422 	 */
423 	uint64_t offloads;
424 
425 	uint64_t reserved_64s[2]; /**< Reserved for future fields */
426 	void *reserved_ptrs[2];   /**< Reserved for future fields */
427 };
428 
429 /**
430  * VLAN types to indicate if it is for single VLAN, inner VLAN or outer VLAN.
431  * Note that single VLAN is treated the same as inner VLAN.
432  */
433 enum rte_vlan_type {
434 	RTE_ETH_VLAN_TYPE_UNKNOWN = 0,
435 	RTE_ETH_VLAN_TYPE_INNER, /**< Inner VLAN. */
436 	RTE_ETH_VLAN_TYPE_OUTER, /**< Single VLAN, or outer VLAN. */
437 	RTE_ETH_VLAN_TYPE_MAX,
438 };
439 
440 /**
441  * A structure used to describe a VLAN filter.
442  * If the bit corresponding to a VID is set, such VID is on.
443  */
444 struct rte_vlan_filter_conf {
445 	uint64_t ids[64];
446 };
447 
448 /**
449  * A structure used to configure the Receive Side Scaling (RSS) feature
450  * of an Ethernet port.
451  * If not NULL, the *rss_key* pointer of the *rss_conf* structure points
452  * to an array holding the RSS key to use for hashing specific header
453  * fields of received packets. The length of this array should be indicated
454  * by *rss_key_len* below. Otherwise, a default random hash key is used by
455  * the device driver.
456  *
457  * The *rss_key_len* field of the *rss_conf* structure indicates the length
458  * in bytes of the array pointed by *rss_key*. To be compatible, this length
459  * will be checked in i40e only. Others assume 40 bytes to be used as before.
460  *
461  * The *rss_hf* field of the *rss_conf* structure indicates the different
462  * types of IPv4/IPv6 packets to which the RSS hashing must be applied.
463  * Supplying an *rss_hf* equal to zero disables the RSS feature.
464  */
465 struct rte_eth_rss_conf {
466 	uint8_t *rss_key;    /**< If not NULL, 40-byte hash key. */
467 	uint8_t rss_key_len; /**< hash key length in bytes. */
468 	uint64_t rss_hf;     /**< Hash functions to apply - see below. */
469 };
470 
471 /*
472  * A packet can be identified by hardware as different flow types. Different
473  * NIC hardware may support different flow types.
474  * Basically, the NIC hardware identifies the flow type as deep protocol as
475  * possible, and exclusively. For example, if a packet is identified as
476  * 'RTE_ETH_FLOW_NONFRAG_IPV4_TCP', it will not be any of other flow types,
477  * though it is an actual IPV4 packet.
478  */
479 #define RTE_ETH_FLOW_UNKNOWN             0
480 #define RTE_ETH_FLOW_RAW                 1
481 #define RTE_ETH_FLOW_IPV4                2
482 #define RTE_ETH_FLOW_FRAG_IPV4           3
483 #define RTE_ETH_FLOW_NONFRAG_IPV4_TCP    4
484 #define RTE_ETH_FLOW_NONFRAG_IPV4_UDP    5
485 #define RTE_ETH_FLOW_NONFRAG_IPV4_SCTP   6
486 #define RTE_ETH_FLOW_NONFRAG_IPV4_OTHER  7
487 #define RTE_ETH_FLOW_IPV6                8
488 #define RTE_ETH_FLOW_FRAG_IPV6           9
489 #define RTE_ETH_FLOW_NONFRAG_IPV6_TCP   10
490 #define RTE_ETH_FLOW_NONFRAG_IPV6_UDP   11
491 #define RTE_ETH_FLOW_NONFRAG_IPV6_SCTP  12
492 #define RTE_ETH_FLOW_NONFRAG_IPV6_OTHER 13
493 #define RTE_ETH_FLOW_L2_PAYLOAD         14
494 #define RTE_ETH_FLOW_IPV6_EX            15
495 #define RTE_ETH_FLOW_IPV6_TCP_EX        16
496 #define RTE_ETH_FLOW_IPV6_UDP_EX        17
497 /** Consider device port number as a flow differentiator */
498 #define RTE_ETH_FLOW_PORT               18
499 #define RTE_ETH_FLOW_VXLAN              19 /**< VXLAN protocol based flow */
500 #define RTE_ETH_FLOW_GENEVE             20 /**< GENEVE protocol based flow */
501 #define RTE_ETH_FLOW_NVGRE              21 /**< NVGRE protocol based flow */
502 #define RTE_ETH_FLOW_VXLAN_GPE          22 /**< VXLAN-GPE protocol based flow */
503 #define RTE_ETH_FLOW_GTPU               23 /**< GTPU protocol based flow */
504 #define RTE_ETH_FLOW_MAX                24
505 
506 /*
507  * Below macros are defined for RSS offload types, they can be used to
508  * fill rte_eth_rss_conf.rss_hf or rte_flow_action_rss.types.
509  */
510 #define RTE_ETH_RSS_IPV4               RTE_BIT64(2)
511 #define RTE_ETH_RSS_FRAG_IPV4          RTE_BIT64(3)
512 #define RTE_ETH_RSS_NONFRAG_IPV4_TCP   RTE_BIT64(4)
513 #define RTE_ETH_RSS_NONFRAG_IPV4_UDP   RTE_BIT64(5)
514 #define RTE_ETH_RSS_NONFRAG_IPV4_SCTP  RTE_BIT64(6)
515 #define RTE_ETH_RSS_NONFRAG_IPV4_OTHER RTE_BIT64(7)
516 #define RTE_ETH_RSS_IPV6               RTE_BIT64(8)
517 #define RTE_ETH_RSS_FRAG_IPV6          RTE_BIT64(9)
518 #define RTE_ETH_RSS_NONFRAG_IPV6_TCP   RTE_BIT64(10)
519 #define RTE_ETH_RSS_NONFRAG_IPV6_UDP   RTE_BIT64(11)
520 #define RTE_ETH_RSS_NONFRAG_IPV6_SCTP  RTE_BIT64(12)
521 #define RTE_ETH_RSS_NONFRAG_IPV6_OTHER RTE_BIT64(13)
522 #define RTE_ETH_RSS_L2_PAYLOAD         RTE_BIT64(14)
523 #define RTE_ETH_RSS_IPV6_EX            RTE_BIT64(15)
524 #define RTE_ETH_RSS_IPV6_TCP_EX        RTE_BIT64(16)
525 #define RTE_ETH_RSS_IPV6_UDP_EX        RTE_BIT64(17)
526 #define RTE_ETH_RSS_PORT               RTE_BIT64(18)
527 #define RTE_ETH_RSS_VXLAN              RTE_BIT64(19)
528 #define RTE_ETH_RSS_GENEVE             RTE_BIT64(20)
529 #define RTE_ETH_RSS_NVGRE              RTE_BIT64(21)
530 #define RTE_ETH_RSS_GTPU               RTE_BIT64(23)
531 #define RTE_ETH_RSS_ETH                RTE_BIT64(24)
532 #define RTE_ETH_RSS_S_VLAN             RTE_BIT64(25)
533 #define RTE_ETH_RSS_C_VLAN             RTE_BIT64(26)
534 #define RTE_ETH_RSS_ESP                RTE_BIT64(27)
535 #define RTE_ETH_RSS_AH                 RTE_BIT64(28)
536 #define RTE_ETH_RSS_L2TPV3             RTE_BIT64(29)
537 #define RTE_ETH_RSS_PFCP               RTE_BIT64(30)
538 #define RTE_ETH_RSS_PPPOE              RTE_BIT64(31)
539 #define RTE_ETH_RSS_ECPRI              RTE_BIT64(32)
540 #define RTE_ETH_RSS_MPLS               RTE_BIT64(33)
541 #define RTE_ETH_RSS_IPV4_CHKSUM        RTE_BIT64(34)
542 
543 /**
544  * The RTE_ETH_RSS_L4_CHKSUM works on checksum field of any L4 header.
545  * It is similar to RTE_ETH_RSS_PORT that they don't specify the specific type of
546  * L4 header. This macro is defined to replace some specific L4 (TCP/UDP/SCTP)
547  * checksum type for constructing the use of RSS offload bits.
548  *
549  * Due to above reason, some old APIs (and configuration) don't support
550  * RTE_ETH_RSS_L4_CHKSUM. The rte_flow RSS API supports it.
551  *
552  * For the case that checksum is not used in an UDP header,
553  * it takes the reserved value 0 as input for the hash function.
554  */
555 #define RTE_ETH_RSS_L4_CHKSUM          RTE_BIT64(35)
556 
557 #define RTE_ETH_RSS_L2TPV2             RTE_BIT64(36)
558 
559 /*
560  * We use the following macros to combine with above RTE_ETH_RSS_* for
561  * more specific input set selection. These bits are defined starting
562  * from the high end of the 64 bits.
563  * Note: If we use above RTE_ETH_RSS_* without SRC/DST_ONLY, it represents
564  * both SRC and DST are taken into account. If SRC_ONLY and DST_ONLY of
565  * the same level are used simultaneously, it is the same case as none of
566  * them are added.
567  */
568 #define RTE_ETH_RSS_L3_SRC_ONLY        RTE_BIT64(63)
569 #define RTE_ETH_RSS_L3_DST_ONLY        RTE_BIT64(62)
570 #define RTE_ETH_RSS_L4_SRC_ONLY        RTE_BIT64(61)
571 #define RTE_ETH_RSS_L4_DST_ONLY        RTE_BIT64(60)
572 #define RTE_ETH_RSS_L2_SRC_ONLY        RTE_BIT64(59)
573 #define RTE_ETH_RSS_L2_DST_ONLY        RTE_BIT64(58)
574 
575 /*
576  * Only select IPV6 address prefix as RSS input set according to
577  * https://tools.ietf.org/html/rfc6052
578  * Must be combined with RTE_ETH_RSS_IPV6, RTE_ETH_RSS_NONFRAG_IPV6_UDP,
579  * RTE_ETH_RSS_NONFRAG_IPV6_TCP, RTE_ETH_RSS_NONFRAG_IPV6_SCTP.
580  */
581 #define RTE_ETH_RSS_L3_PRE32           RTE_BIT64(57)
582 #define RTE_ETH_RSS_L3_PRE40           RTE_BIT64(56)
583 #define RTE_ETH_RSS_L3_PRE48           RTE_BIT64(55)
584 #define RTE_ETH_RSS_L3_PRE56           RTE_BIT64(54)
585 #define RTE_ETH_RSS_L3_PRE64           RTE_BIT64(53)
586 #define RTE_ETH_RSS_L3_PRE96           RTE_BIT64(52)
587 
588 /*
589  * Use the following macros to combine with the above layers
590  * to choose inner and outer layers or both for RSS computation.
591  * Bits 50 and 51 are reserved for this.
592  */
593 
594 /**
595  * level 0, requests the default behavior.
596  * Depending on the packet type, it can mean outermost, innermost,
597  * anything in between or even no RSS.
598  * It basically stands for the innermost encapsulation level RSS
599  * can be performed on according to PMD and device capabilities.
600  */
601 #define RTE_ETH_RSS_LEVEL_PMD_DEFAULT  (UINT64_C(0) << 50)
602 
603 /**
604  * level 1, requests RSS to be performed on the outermost packet
605  * encapsulation level.
606  */
607 #define RTE_ETH_RSS_LEVEL_OUTERMOST    (UINT64_C(1) << 50)
608 
609 /**
610  * level 2, requests RSS to be performed on the specified inner packet
611  * encapsulation level, from outermost to innermost (lower to higher values).
612  */
613 #define RTE_ETH_RSS_LEVEL_INNERMOST    (UINT64_C(2) << 50)
614 #define RTE_ETH_RSS_LEVEL_MASK         (UINT64_C(3) << 50)
615 
616 #define RTE_ETH_RSS_LEVEL(rss_hf) ((rss_hf & RTE_ETH_RSS_LEVEL_MASK) >> 50)
617 
618 /**
619  * For input set change of hash filter, if SRC_ONLY and DST_ONLY of
620  * the same level are used simultaneously, it is the same case as
621  * none of them are added.
622  *
623  * @param rss_hf
624  *   RSS types with SRC/DST_ONLY.
625  * @return
626  *   RSS types.
627  */
628 static inline uint64_t
629 rte_eth_rss_hf_refine(uint64_t rss_hf)
630 {
631 	if ((rss_hf & RTE_ETH_RSS_L3_SRC_ONLY) && (rss_hf & RTE_ETH_RSS_L3_DST_ONLY))
632 		rss_hf &= ~(RTE_ETH_RSS_L3_SRC_ONLY | RTE_ETH_RSS_L3_DST_ONLY);
633 
634 	if ((rss_hf & RTE_ETH_RSS_L4_SRC_ONLY) && (rss_hf & RTE_ETH_RSS_L4_DST_ONLY))
635 		rss_hf &= ~(RTE_ETH_RSS_L4_SRC_ONLY | RTE_ETH_RSS_L4_DST_ONLY);
636 
637 	return rss_hf;
638 }
639 
640 #define RTE_ETH_RSS_IPV6_PRE32 ( \
641 		RTE_ETH_RSS_IPV6 | \
642 		RTE_ETH_RSS_L3_PRE32)
643 
644 #define RTE_ETH_RSS_IPV6_PRE40 ( \
645 		RTE_ETH_RSS_IPV6 | \
646 		RTE_ETH_RSS_L3_PRE40)
647 
648 #define RTE_ETH_RSS_IPV6_PRE48 ( \
649 		RTE_ETH_RSS_IPV6 | \
650 		RTE_ETH_RSS_L3_PRE48)
651 
652 #define RTE_ETH_RSS_IPV6_PRE56 ( \
653 		RTE_ETH_RSS_IPV6 | \
654 		RTE_ETH_RSS_L3_PRE56)
655 
656 #define RTE_ETH_RSS_IPV6_PRE64 ( \
657 		RTE_ETH_RSS_IPV6 | \
658 		RTE_ETH_RSS_L3_PRE64)
659 
660 #define RTE_ETH_RSS_IPV6_PRE96 ( \
661 		RTE_ETH_RSS_IPV6 | \
662 		RTE_ETH_RSS_L3_PRE96)
663 
664 #define RTE_ETH_RSS_IPV6_PRE32_UDP ( \
665 		RTE_ETH_RSS_NONFRAG_IPV6_UDP | \
666 		RTE_ETH_RSS_L3_PRE32)
667 
668 #define RTE_ETH_RSS_IPV6_PRE40_UDP ( \
669 		RTE_ETH_RSS_NONFRAG_IPV6_UDP | \
670 		RTE_ETH_RSS_L3_PRE40)
671 
672 #define RTE_ETH_RSS_IPV6_PRE48_UDP ( \
673 		RTE_ETH_RSS_NONFRAG_IPV6_UDP | \
674 		RTE_ETH_RSS_L3_PRE48)
675 
676 #define RTE_ETH_RSS_IPV6_PRE56_UDP ( \
677 		RTE_ETH_RSS_NONFRAG_IPV6_UDP | \
678 		RTE_ETH_RSS_L3_PRE56)
679 
680 #define RTE_ETH_RSS_IPV6_PRE64_UDP ( \
681 		RTE_ETH_RSS_NONFRAG_IPV6_UDP | \
682 		RTE_ETH_RSS_L3_PRE64)
683 
684 #define RTE_ETH_RSS_IPV6_PRE96_UDP ( \
685 		RTE_ETH_RSS_NONFRAG_IPV6_UDP | \
686 		RTE_ETH_RSS_L3_PRE96)
687 
688 #define RTE_ETH_RSS_IPV6_PRE32_TCP ( \
689 		RTE_ETH_RSS_NONFRAG_IPV6_TCP | \
690 		RTE_ETH_RSS_L3_PRE32)
691 
692 #define RTE_ETH_RSS_IPV6_PRE40_TCP ( \
693 		RTE_ETH_RSS_NONFRAG_IPV6_TCP | \
694 		RTE_ETH_RSS_L3_PRE40)
695 
696 #define RTE_ETH_RSS_IPV6_PRE48_TCP ( \
697 		RTE_ETH_RSS_NONFRAG_IPV6_TCP | \
698 		RTE_ETH_RSS_L3_PRE48)
699 
700 #define RTE_ETH_RSS_IPV6_PRE56_TCP ( \
701 		RTE_ETH_RSS_NONFRAG_IPV6_TCP | \
702 		RTE_ETH_RSS_L3_PRE56)
703 
704 #define RTE_ETH_RSS_IPV6_PRE64_TCP ( \
705 		RTE_ETH_RSS_NONFRAG_IPV6_TCP | \
706 		RTE_ETH_RSS_L3_PRE64)
707 
708 #define RTE_ETH_RSS_IPV6_PRE96_TCP ( \
709 		RTE_ETH_RSS_NONFRAG_IPV6_TCP | \
710 		RTE_ETH_RSS_L3_PRE96)
711 
712 #define RTE_ETH_RSS_IPV6_PRE32_SCTP ( \
713 		RTE_ETH_RSS_NONFRAG_IPV6_SCTP | \
714 		RTE_ETH_RSS_L3_PRE32)
715 
716 #define RTE_ETH_RSS_IPV6_PRE40_SCTP ( \
717 		RTE_ETH_RSS_NONFRAG_IPV6_SCTP | \
718 		RTE_ETH_RSS_L3_PRE40)
719 
720 #define RTE_ETH_RSS_IPV6_PRE48_SCTP ( \
721 		RTE_ETH_RSS_NONFRAG_IPV6_SCTP | \
722 		RTE_ETH_RSS_L3_PRE48)
723 
724 #define RTE_ETH_RSS_IPV6_PRE56_SCTP ( \
725 		RTE_ETH_RSS_NONFRAG_IPV6_SCTP | \
726 		RTE_ETH_RSS_L3_PRE56)
727 
728 #define RTE_ETH_RSS_IPV6_PRE64_SCTP ( \
729 		RTE_ETH_RSS_NONFRAG_IPV6_SCTP | \
730 		RTE_ETH_RSS_L3_PRE64)
731 
732 #define RTE_ETH_RSS_IPV6_PRE96_SCTP ( \
733 		RTE_ETH_RSS_NONFRAG_IPV6_SCTP | \
734 		RTE_ETH_RSS_L3_PRE96)
735 
736 #define RTE_ETH_RSS_IP ( \
737 	RTE_ETH_RSS_IPV4 | \
738 	RTE_ETH_RSS_FRAG_IPV4 | \
739 	RTE_ETH_RSS_NONFRAG_IPV4_OTHER | \
740 	RTE_ETH_RSS_IPV6 | \
741 	RTE_ETH_RSS_FRAG_IPV6 | \
742 	RTE_ETH_RSS_NONFRAG_IPV6_OTHER | \
743 	RTE_ETH_RSS_IPV6_EX)
744 
745 #define RTE_ETH_RSS_UDP ( \
746 	RTE_ETH_RSS_NONFRAG_IPV4_UDP | \
747 	RTE_ETH_RSS_NONFRAG_IPV6_UDP | \
748 	RTE_ETH_RSS_IPV6_UDP_EX)
749 
750 #define RTE_ETH_RSS_TCP ( \
751 	RTE_ETH_RSS_NONFRAG_IPV4_TCP | \
752 	RTE_ETH_RSS_NONFRAG_IPV6_TCP | \
753 	RTE_ETH_RSS_IPV6_TCP_EX)
754 
755 #define RTE_ETH_RSS_SCTP ( \
756 	RTE_ETH_RSS_NONFRAG_IPV4_SCTP | \
757 	RTE_ETH_RSS_NONFRAG_IPV6_SCTP)
758 
759 #define RTE_ETH_RSS_TUNNEL ( \
760 	RTE_ETH_RSS_VXLAN  | \
761 	RTE_ETH_RSS_GENEVE | \
762 	RTE_ETH_RSS_NVGRE)
763 
764 #define RTE_ETH_RSS_VLAN ( \
765 	RTE_ETH_RSS_S_VLAN  | \
766 	RTE_ETH_RSS_C_VLAN)
767 
768 /** Mask of valid RSS hash protocols */
769 #define RTE_ETH_RSS_PROTO_MASK ( \
770 	RTE_ETH_RSS_IPV4 | \
771 	RTE_ETH_RSS_FRAG_IPV4 | \
772 	RTE_ETH_RSS_NONFRAG_IPV4_TCP | \
773 	RTE_ETH_RSS_NONFRAG_IPV4_UDP | \
774 	RTE_ETH_RSS_NONFRAG_IPV4_SCTP | \
775 	RTE_ETH_RSS_NONFRAG_IPV4_OTHER | \
776 	RTE_ETH_RSS_IPV6 | \
777 	RTE_ETH_RSS_FRAG_IPV6 | \
778 	RTE_ETH_RSS_NONFRAG_IPV6_TCP | \
779 	RTE_ETH_RSS_NONFRAG_IPV6_UDP | \
780 	RTE_ETH_RSS_NONFRAG_IPV6_SCTP | \
781 	RTE_ETH_RSS_NONFRAG_IPV6_OTHER | \
782 	RTE_ETH_RSS_L2_PAYLOAD | \
783 	RTE_ETH_RSS_IPV6_EX | \
784 	RTE_ETH_RSS_IPV6_TCP_EX | \
785 	RTE_ETH_RSS_IPV6_UDP_EX | \
786 	RTE_ETH_RSS_PORT  | \
787 	RTE_ETH_RSS_VXLAN | \
788 	RTE_ETH_RSS_GENEVE | \
789 	RTE_ETH_RSS_NVGRE | \
790 	RTE_ETH_RSS_MPLS)
791 
792 /*
793  * Definitions used for redirection table entry size.
794  * Some RSS RETA sizes may not be supported by some drivers, check the
795  * documentation or the description of relevant functions for more details.
796  */
797 #define RTE_ETH_RSS_RETA_SIZE_64  64
798 #define RTE_ETH_RSS_RETA_SIZE_128 128
799 #define RTE_ETH_RSS_RETA_SIZE_256 256
800 #define RTE_ETH_RSS_RETA_SIZE_512 512
801 #define RTE_ETH_RETA_GROUP_SIZE   64
802 
803 /**@{@name VMDq and DCB maximums */
804 #define RTE_ETH_VMDQ_MAX_VLAN_FILTERS   64 /**< Maximum nb. of VMDq VLAN filters. */
805 #define RTE_ETH_DCB_NUM_USER_PRIORITIES 8  /**< Maximum nb. of DCB priorities. */
806 #define RTE_ETH_VMDQ_DCB_NUM_QUEUES     128 /**< Maximum nb. of VMDq DCB queues. */
807 #define RTE_ETH_DCB_NUM_QUEUES          128 /**< Maximum nb. of DCB queues. */
808 /**@}*/
809 
810 /**@{@name DCB capabilities */
811 #define RTE_ETH_DCB_PG_SUPPORT      RTE_BIT32(0) /**< Priority Group(ETS) support. */
812 #define RTE_ETH_DCB_PFC_SUPPORT     RTE_BIT32(1) /**< Priority Flow Control support. */
813 /**@}*/
814 
815 /**@{@name VLAN offload bits */
816 #define RTE_ETH_VLAN_STRIP_OFFLOAD   0x0001 /**< VLAN Strip  On/Off */
817 #define RTE_ETH_VLAN_FILTER_OFFLOAD  0x0002 /**< VLAN Filter On/Off */
818 #define RTE_ETH_VLAN_EXTEND_OFFLOAD  0x0004 /**< VLAN Extend On/Off */
819 #define RTE_ETH_QINQ_STRIP_OFFLOAD   0x0008 /**< QINQ Strip On/Off */
820 
821 #define RTE_ETH_VLAN_STRIP_MASK      0x0001 /**< VLAN Strip  setting mask */
822 #define RTE_ETH_VLAN_FILTER_MASK     0x0002 /**< VLAN Filter  setting mask*/
823 #define RTE_ETH_VLAN_EXTEND_MASK     0x0004 /**< VLAN Extend  setting mask*/
824 #define RTE_ETH_QINQ_STRIP_MASK      0x0008 /**< QINQ Strip  setting mask */
825 #define RTE_ETH_VLAN_ID_MAX          0x0FFF /**< VLAN ID is in lower 12 bits*/
826 /**@}*/
827 
828 /* Definitions used for receive MAC address */
829 #define RTE_ETH_NUM_RECEIVE_MAC_ADDR   128 /**< Maximum nb. of receive mac addr. */
830 
831 /* Definitions used for unicast hash */
832 #define RTE_ETH_VMDQ_NUM_UC_HASH_ARRAY 128 /**< Maximum nb. of UC hash array. */
833 
834 /**@{@name VMDq Rx mode
835  * @see rte_eth_vmdq_rx_conf.rx_mode
836  */
837 /** Accept untagged packets. */
838 #define RTE_ETH_VMDQ_ACCEPT_UNTAG      RTE_BIT32(0)
839 /** Accept packets in multicast table. */
840 #define RTE_ETH_VMDQ_ACCEPT_HASH_MC    RTE_BIT32(1)
841 /** Accept packets in unicast table. */
842 #define RTE_ETH_VMDQ_ACCEPT_HASH_UC    RTE_BIT32(2)
843 /** Accept broadcast packets. */
844 #define RTE_ETH_VMDQ_ACCEPT_BROADCAST  RTE_BIT32(3)
845 /** Multicast promiscuous. */
846 #define RTE_ETH_VMDQ_ACCEPT_MULTICAST  RTE_BIT32(4)
847 /**@}*/
848 
849 /**
850  * A structure used to configure 64 entries of Redirection Table of the
851  * Receive Side Scaling (RSS) feature of an Ethernet port. To configure
852  * more than 64 entries supported by hardware, an array of this structure
853  * is needed.
854  */
855 struct rte_eth_rss_reta_entry64 {
856 	/** Mask bits indicate which entries need to be updated/queried. */
857 	uint64_t mask;
858 	/** Group of 64 redirection table entries. */
859 	uint16_t reta[RTE_ETH_RETA_GROUP_SIZE];
860 };
861 
862 /**
863  * This enum indicates the possible number of traffic classes
864  * in DCB configurations
865  */
866 enum rte_eth_nb_tcs {
867 	RTE_ETH_4_TCS = 4, /**< 4 TCs with DCB. */
868 	RTE_ETH_8_TCS = 8  /**< 8 TCs with DCB. */
869 };
870 
871 /**
872  * This enum indicates the possible number of queue pools
873  * in VMDq configurations.
874  */
875 enum rte_eth_nb_pools {
876 	RTE_ETH_8_POOLS = 8,    /**< 8 VMDq pools. */
877 	RTE_ETH_16_POOLS = 16,  /**< 16 VMDq pools. */
878 	RTE_ETH_32_POOLS = 32,  /**< 32 VMDq pools. */
879 	RTE_ETH_64_POOLS = 64   /**< 64 VMDq pools. */
880 };
881 
882 /* This structure may be extended in future. */
883 struct rte_eth_dcb_rx_conf {
884 	enum rte_eth_nb_tcs nb_tcs; /**< Possible DCB TCs, 4 or 8 TCs */
885 	/** Traffic class each UP mapped to. */
886 	uint8_t dcb_tc[RTE_ETH_DCB_NUM_USER_PRIORITIES];
887 };
888 
889 struct rte_eth_vmdq_dcb_tx_conf {
890 	enum rte_eth_nb_pools nb_queue_pools; /**< With DCB, 16 or 32 pools. */
891 	/** Traffic class each UP mapped to. */
892 	uint8_t dcb_tc[RTE_ETH_DCB_NUM_USER_PRIORITIES];
893 };
894 
895 struct rte_eth_dcb_tx_conf {
896 	enum rte_eth_nb_tcs nb_tcs; /**< Possible DCB TCs, 4 or 8 TCs. */
897 	/** Traffic class each UP mapped to. */
898 	uint8_t dcb_tc[RTE_ETH_DCB_NUM_USER_PRIORITIES];
899 };
900 
901 struct rte_eth_vmdq_tx_conf {
902 	enum rte_eth_nb_pools nb_queue_pools; /**< VMDq mode, 64 pools. */
903 };
904 
905 /**
906  * A structure used to configure the VMDq+DCB feature
907  * of an Ethernet port.
908  *
909  * Using this feature, packets are routed to a pool of queues, based
910  * on the VLAN ID in the VLAN tag, and then to a specific queue within
911  * that pool, using the user priority VLAN tag field.
912  *
913  * A default pool may be used, if desired, to route all traffic which
914  * does not match the VLAN filter rules.
915  */
916 struct rte_eth_vmdq_dcb_conf {
917 	enum rte_eth_nb_pools nb_queue_pools; /**< With DCB, 16 or 32 pools */
918 	uint8_t enable_default_pool; /**< If non-zero, use a default pool */
919 	uint8_t default_pool; /**< The default pool, if applicable */
920 	uint8_t nb_pool_maps; /**< We can have up to 64 filters/mappings */
921 	struct {
922 		uint16_t vlan_id; /**< The VLAN ID of the received frame */
923 		uint64_t pools;   /**< Bitmask of pools for packet Rx */
924 	} pool_map[RTE_ETH_VMDQ_MAX_VLAN_FILTERS]; /**< VMDq VLAN pool maps. */
925 	/** Selects a queue in a pool */
926 	uint8_t dcb_tc[RTE_ETH_DCB_NUM_USER_PRIORITIES];
927 };
928 
929 /**
930  * A structure used to configure the VMDq feature of an Ethernet port when
931  * not combined with the DCB feature.
932  *
933  * Using this feature, packets are routed to a pool of queues. By default,
934  * the pool selection is based on the MAC address, the VLAN ID in the
935  * VLAN tag as specified in the pool_map array.
936  * Passing the RTE_ETH_VMDQ_ACCEPT_UNTAG in the rx_mode field allows pool
937  * selection using only the MAC address. MAC address to pool mapping is done
938  * using the rte_eth_dev_mac_addr_add function, with the pool parameter
939  * corresponding to the pool ID.
940  *
941  * Queue selection within the selected pool will be done using RSS when
942  * it is enabled or revert to the first queue of the pool if not.
943  *
944  * A default pool may be used, if desired, to route all traffic which
945  * does not match the VLAN filter rules or any pool MAC address.
946  */
947 struct rte_eth_vmdq_rx_conf {
948 	enum rte_eth_nb_pools nb_queue_pools; /**< VMDq only mode, 8 or 64 pools */
949 	uint8_t enable_default_pool; /**< If non-zero, use a default pool */
950 	uint8_t default_pool; /**< The default pool, if applicable */
951 	uint8_t enable_loop_back; /**< Enable VT loop back */
952 	uint8_t nb_pool_maps; /**< We can have up to 64 filters/mappings */
953 	uint32_t rx_mode; /**< Flags from RTE_ETH_VMDQ_ACCEPT_* */
954 	struct {
955 		uint16_t vlan_id; /**< The VLAN ID of the received frame */
956 		uint64_t pools;   /**< Bitmask of pools for packet Rx */
957 	} pool_map[RTE_ETH_VMDQ_MAX_VLAN_FILTERS]; /**< VMDq VLAN pool maps. */
958 };
959 
960 /**
961  * A structure used to configure the Tx features of an Ethernet port.
962  */
963 struct rte_eth_txmode {
964 	enum rte_eth_tx_mq_mode mq_mode; /**< Tx multi-queues mode. */
965 	/**
966 	 * Per-port Tx offloads to be set using RTE_ETH_TX_OFFLOAD_* flags.
967 	 * Only offloads set on tx_offload_capa field on rte_eth_dev_info
968 	 * structure are allowed to be set.
969 	 */
970 	uint64_t offloads;
971 
972 	uint16_t pvid;
973 	__extension__
974 	uint8_t /** If set, reject sending out tagged pkts */
975 		hw_vlan_reject_tagged : 1,
976 		/** If set, reject sending out untagged pkts */
977 		hw_vlan_reject_untagged : 1,
978 		/** If set, enable port based VLAN insertion */
979 		hw_vlan_insert_pvid : 1;
980 
981 	uint64_t reserved_64s[2]; /**< Reserved for future fields */
982 	void *reserved_ptrs[2];   /**< Reserved for future fields */
983 };
984 
985 /**
986  * @warning
987  * @b EXPERIMENTAL: this structure may change without prior notice.
988  *
989  * A structure used to configure an Rx packet segment to split.
990  *
991  * If RTE_ETH_RX_OFFLOAD_BUFFER_SPLIT flag is set in offloads field,
992  * the PMD will split the received packets into multiple segments
993  * according to the specification in the description array:
994  *
995  * - The first network buffer will be allocated from the memory pool,
996  *   specified in the first array element, the second buffer, from the
997  *   pool in the second element, and so on.
998  *
999  * - The proto_hdrs in the elements define the split position of
1000  *   received packets.
1001  *
1002  * - The offsets from the segment description elements specify
1003  *   the data offset from the buffer beginning except the first mbuf.
1004  *   The first segment offset is added with RTE_PKTMBUF_HEADROOM.
1005  *
1006  * - The lengths in the elements define the maximal data amount
1007  *   being received to each segment. The receiving starts with filling
1008  *   up the first mbuf data buffer up to specified length. If the
1009  *   there are data remaining (packet is longer than buffer in the first
1010  *   mbuf) the following data will be pushed to the next segment
1011  *   up to its own length, and so on.
1012  *
1013  * - If the length in the segment description element is zero
1014  *   the actual buffer size will be deduced from the appropriate
1015  *   memory pool properties.
1016  *
1017  * - If there is not enough elements to describe the buffer for entire
1018  *   packet of maximal length the following parameters will be used
1019  *   for the all remaining segments:
1020  *     - pool from the last valid element
1021  *     - the buffer size from this pool
1022  *     - zero offset
1023  *
1024  * - Length based buffer split:
1025  *     - mp, length, offset should be configured.
1026  *     - The proto_hdr field must be 0.
1027  *
1028  * - Protocol header based buffer split:
1029  *     - mp, offset, proto_hdr should be configured.
1030  *     - The length field must be 0.
1031  *     - The proto_hdr field in the last segment should be 0.
1032  *
1033  * - When protocol header split is enabled, NIC may receive packets
1034  *   which do not match all the protocol headers within the Rx segments.
1035  *   At this point, NIC will have two possible split behaviors according to
1036  *   matching results, one is exact match, another is longest match.
1037  *   The split result of NIC must belong to one of them.
1038  *   The exact match means NIC only do split when the packets exactly match all
1039  *   the protocol headers in the segments.
1040  *   Otherwise, the whole packet will be put into the last valid mempool.
1041  *   The longest match means NIC will do split until packets mismatch
1042  *   the protocol header in the segments.
1043  *   The rest will be put into the last valid pool.
1044  */
1045 struct rte_eth_rxseg_split {
1046 	struct rte_mempool *mp; /**< Memory pool to allocate segment from. */
1047 	uint16_t length; /**< Segment data length, configures split point. */
1048 	uint16_t offset; /**< Data offset from beginning of mbuf data buffer. */
1049 	/**
1050 	 * proto_hdr defines a bit mask of the protocol sequence as RTE_PTYPE_*.
1051 	 * The last RTE_PTYPE* in the mask indicates the split position.
1052 	 *
1053 	 * If one protocol header is defined to split packets into two segments,
1054 	 * for non-tunneling packets, the complete protocol sequence should be defined.
1055 	 * For tunneling packets, for simplicity, only the tunnel and inner part of
1056 	 * complete protocol sequence is required.
1057 	 * If several protocol headers are defined to split packets into multi-segments,
1058 	 * the repeated parts of adjacent segments should be omitted.
1059 	 */
1060 	uint32_t proto_hdr;
1061 };
1062 
1063 /**
1064  * @warning
1065  * @b EXPERIMENTAL: this structure may change without prior notice.
1066  *
1067  * A common structure used to describe Rx packet segment properties.
1068  */
1069 union rte_eth_rxseg {
1070 	/* The settings for buffer split offload. */
1071 	struct rte_eth_rxseg_split split;
1072 	/* The other features settings should be added here. */
1073 };
1074 
1075 /**
1076  * A structure used to configure an Rx ring of an Ethernet port.
1077  */
1078 struct rte_eth_rxconf {
1079 	struct rte_eth_thresh rx_thresh; /**< Rx ring threshold registers. */
1080 	uint16_t rx_free_thresh; /**< Drives the freeing of Rx descriptors. */
1081 	uint8_t rx_drop_en; /**< Drop packets if no descriptors are available. */
1082 	uint8_t rx_deferred_start; /**< Do not start queue with rte_eth_dev_start(). */
1083 	uint16_t rx_nseg; /**< Number of descriptions in rx_seg array. */
1084 	/**
1085 	 * Share group index in Rx domain and switch domain.
1086 	 * Non-zero value to enable Rx queue share, zero value disable share.
1087 	 * PMD is responsible for Rx queue consistency checks to avoid member
1088 	 * port's configuration contradict to each other.
1089 	 */
1090 	uint16_t share_group;
1091 	uint16_t share_qid; /**< Shared Rx queue ID in group */
1092 	/**
1093 	 * Per-queue Rx offloads to be set using RTE_ETH_RX_OFFLOAD_* flags.
1094 	 * Only offloads set on rx_queue_offload_capa or rx_offload_capa
1095 	 * fields on rte_eth_dev_info structure are allowed to be set.
1096 	 */
1097 	uint64_t offloads;
1098 	/**
1099 	 * Points to the array of segment descriptions for an entire packet.
1100 	 * Array elements are properties for consecutive Rx segments.
1101 	 *
1102 	 * The supported capabilities of receiving segmentation is reported
1103 	 * in rte_eth_dev_info.rx_seg_capa field.
1104 	 */
1105 	union rte_eth_rxseg *rx_seg;
1106 
1107 	/**
1108 	 * Array of mempools to allocate Rx buffers from.
1109 	 *
1110 	 * This provides support for multiple mbuf pools per Rx queue.
1111 	 * The capability is reported in device info via positive
1112 	 * max_rx_mempools.
1113 	 *
1114 	 * It could be useful for more efficient usage of memory when an
1115 	 * application creates different mempools to steer the specific
1116 	 * size of the packet.
1117 	 *
1118 	 * If many mempools are specified, packets received using Rx
1119 	 * burst may belong to any provided mempool. From ethdev user point
1120 	 * of view it is undefined how PMD/NIC chooses mempool for a packet.
1121 	 *
1122 	 * If Rx scatter is enabled, a packet may be delivered using a chain
1123 	 * of mbufs obtained from single mempool or multiple mempools based
1124 	 * on the NIC implementation.
1125 	 */
1126 	struct rte_mempool **rx_mempools;
1127 	uint16_t rx_nmempool; /** < Number of Rx mempools */
1128 
1129 	uint64_t reserved_64s[2]; /**< Reserved for future fields */
1130 	void *reserved_ptrs[2];   /**< Reserved for future fields */
1131 };
1132 
1133 /**
1134  * A structure used to configure a Tx ring of an Ethernet port.
1135  */
1136 struct rte_eth_txconf {
1137 	struct rte_eth_thresh tx_thresh; /**< Tx ring threshold registers. */
1138 	uint16_t tx_rs_thresh; /**< Drives the setting of RS bit on TXDs. */
1139 	uint16_t tx_free_thresh; /**< Start freeing Tx buffers if there are
1140 				      less free descriptors than this value. */
1141 
1142 	uint8_t tx_deferred_start; /**< Do not start queue with rte_eth_dev_start(). */
1143 	/**
1144 	 * Per-queue Tx offloads to be set  using RTE_ETH_TX_OFFLOAD_* flags.
1145 	 * Only offloads set on tx_queue_offload_capa or tx_offload_capa
1146 	 * fields on rte_eth_dev_info structure are allowed to be set.
1147 	 */
1148 	uint64_t offloads;
1149 
1150 	uint64_t reserved_64s[2]; /**< Reserved for future fields */
1151 	void *reserved_ptrs[2];   /**< Reserved for future fields */
1152 };
1153 
1154 /**
1155  * @warning
1156  * @b EXPERIMENTAL: this API may change, or be removed, without prior notice
1157  *
1158  * A structure used to return the Tx or Rx hairpin queue capabilities.
1159  */
1160 struct rte_eth_hairpin_queue_cap {
1161 	/**
1162 	 * When set, PMD supports placing descriptors and/or data buffers
1163 	 * in dedicated device memory.
1164 	 */
1165 	uint32_t locked_device_memory:1;
1166 
1167 	/**
1168 	 * When set, PMD supports placing descriptors and/or data buffers
1169 	 * in host memory managed by DPDK.
1170 	 */
1171 	uint32_t rte_memory:1;
1172 
1173 	uint32_t reserved:30; /**< Reserved for future fields */
1174 };
1175 
1176 /**
1177  * @warning
1178  * @b EXPERIMENTAL: this API may change, or be removed, without prior notice
1179  *
1180  * A structure used to return the hairpin capabilities that are supported.
1181  */
1182 struct rte_eth_hairpin_cap {
1183 	/** The max number of hairpin queues (different bindings). */
1184 	uint16_t max_nb_queues;
1185 	/** Max number of Rx queues to be connected to one Tx queue. */
1186 	uint16_t max_rx_2_tx;
1187 	/** Max number of Tx queues to be connected to one Rx queue. */
1188 	uint16_t max_tx_2_rx;
1189 	uint16_t max_nb_desc; /**< The max num of descriptors. */
1190 	struct rte_eth_hairpin_queue_cap rx_cap; /**< Rx hairpin queue capabilities. */
1191 	struct rte_eth_hairpin_queue_cap tx_cap; /**< Tx hairpin queue capabilities. */
1192 };
1193 
1194 #define RTE_ETH_MAX_HAIRPIN_PEERS 32
1195 
1196 /**
1197  * @warning
1198  * @b EXPERIMENTAL: this API may change, or be removed, without prior notice
1199  *
1200  * A structure used to hold hairpin peer data.
1201  */
1202 struct rte_eth_hairpin_peer {
1203 	uint16_t port; /**< Peer port. */
1204 	uint16_t queue; /**< Peer queue. */
1205 };
1206 
1207 /**
1208  * @warning
1209  * @b EXPERIMENTAL: this API may change, or be removed, without prior notice
1210  *
1211  * A structure used to configure hairpin binding.
1212  */
1213 struct rte_eth_hairpin_conf {
1214 	uint32_t peer_count:16; /**< The number of peers. */
1215 
1216 	/**
1217 	 * Explicit Tx flow rule mode.
1218 	 * One hairpin pair of queues should have the same attribute.
1219 	 *
1220 	 * - When set, the user should be responsible for inserting the hairpin
1221 	 *   Tx part flows and removing them.
1222 	 * - When clear, the PMD will try to handle the Tx part of the flows,
1223 	 *   e.g., by splitting one flow into two parts.
1224 	 */
1225 	uint32_t tx_explicit:1;
1226 
1227 	/**
1228 	 * Manually bind hairpin queues.
1229 	 * One hairpin pair of queues should have the same attribute.
1230 	 *
1231 	 * - When set, to enable hairpin, the user should call the hairpin bind
1232 	 *   function after all the queues are set up properly and the ports are
1233 	 *   started. Also, the hairpin unbind function should be called
1234 	 *   accordingly before stopping a port that with hairpin configured.
1235 	 * - When cleared, the PMD will try to enable the hairpin with the queues
1236 	 *   configured automatically during port start.
1237 	 */
1238 	uint32_t manual_bind:1;
1239 
1240 	/**
1241 	 * Use locked device memory as a backing storage.
1242 	 *
1243 	 * - When set, PMD will attempt place descriptors and/or data buffers
1244 	 *   in dedicated device memory.
1245 	 * - When cleared, PMD will use default memory type as a backing storage.
1246 	 *   Please refer to PMD documentation for details.
1247 	 *
1248 	 * API user should check if PMD supports this configuration flag using
1249 	 * @see rte_eth_dev_hairpin_capability_get.
1250 	 */
1251 	uint32_t use_locked_device_memory:1;
1252 
1253 	/**
1254 	 * Use DPDK memory as backing storage.
1255 	 *
1256 	 * - When set, PMD will attempt place descriptors and/or data buffers
1257 	 *   in host memory managed by DPDK.
1258 	 * - When cleared, PMD will use default memory type as a backing storage.
1259 	 *   Please refer to PMD documentation for details.
1260 	 *
1261 	 * API user should check if PMD supports this configuration flag using
1262 	 * @see rte_eth_dev_hairpin_capability_get.
1263 	 */
1264 	uint32_t use_rte_memory:1;
1265 
1266 	/**
1267 	 * Force usage of hairpin memory configuration.
1268 	 *
1269 	 * - When set, PMD will attempt to use specified memory settings.
1270 	 *   If resource allocation fails, then hairpin queue allocation
1271 	 *   will result in an error.
1272 	 * - When clear, PMD will attempt to use specified memory settings.
1273 	 *   If resource allocation fails, then PMD will retry
1274 	 *   allocation with default configuration.
1275 	 */
1276 	uint32_t force_memory:1;
1277 
1278 	uint32_t reserved:11; /**< Reserved bits. */
1279 
1280 	struct rte_eth_hairpin_peer peers[RTE_ETH_MAX_HAIRPIN_PEERS];
1281 };
1282 
1283 /**
1284  * A structure contains information about HW descriptor ring limitations.
1285  */
1286 struct rte_eth_desc_lim {
1287 	uint16_t nb_max;   /**< Max allowed number of descriptors. */
1288 	uint16_t nb_min;   /**< Min allowed number of descriptors. */
1289 	uint16_t nb_align; /**< Number of descriptors should be aligned to. */
1290 
1291 	/**
1292 	 * Max allowed number of segments per whole packet.
1293 	 *
1294 	 * - For TSO packet this is the total number of data descriptors allowed
1295 	 *   by device.
1296 	 *
1297 	 * @see nb_mtu_seg_max
1298 	 */
1299 	uint16_t nb_seg_max;
1300 
1301 	/**
1302 	 * Max number of segments per one MTU.
1303 	 *
1304 	 * - For non-TSO packet, this is the maximum allowed number of segments
1305 	 *   in a single transmit packet.
1306 	 *
1307 	 * - For TSO packet each segment within the TSO may span up to this
1308 	 *   value.
1309 	 *
1310 	 * @see nb_seg_max
1311 	 */
1312 	uint16_t nb_mtu_seg_max;
1313 };
1314 
1315 /**
1316  * This enum indicates the flow control mode
1317  */
1318 enum rte_eth_fc_mode {
1319 	RTE_ETH_FC_NONE = 0, /**< Disable flow control. */
1320 	RTE_ETH_FC_RX_PAUSE, /**< Rx pause frame, enable flowctrl on Tx side. */
1321 	RTE_ETH_FC_TX_PAUSE, /**< Tx pause frame, enable flowctrl on Rx side. */
1322 	RTE_ETH_FC_FULL      /**< Enable flow control on both side. */
1323 };
1324 
1325 /**
1326  * A structure used to configure Ethernet flow control parameter.
1327  * These parameters will be configured into the register of the NIC.
1328  * Please refer to the corresponding data sheet for proper value.
1329  */
1330 struct rte_eth_fc_conf {
1331 	uint32_t high_water;  /**< High threshold value to trigger XOFF */
1332 	uint32_t low_water;   /**< Low threshold value to trigger XON */
1333 	uint16_t pause_time;  /**< Pause quota in the Pause frame */
1334 	uint16_t send_xon;    /**< Is XON frame need be sent */
1335 	enum rte_eth_fc_mode mode;  /**< Link flow control mode */
1336 	uint8_t mac_ctrl_frame_fwd; /**< Forward MAC control frames */
1337 	uint8_t autoneg;      /**< Use Pause autoneg */
1338 };
1339 
1340 /**
1341  * A structure used to configure Ethernet priority flow control parameter.
1342  * These parameters will be configured into the register of the NIC.
1343  * Please refer to the corresponding data sheet for proper value.
1344  */
1345 struct rte_eth_pfc_conf {
1346 	struct rte_eth_fc_conf fc; /**< General flow control parameter. */
1347 	uint8_t priority;          /**< VLAN User Priority. */
1348 };
1349 
1350 /**
1351  * @warning
1352  * @b EXPERIMENTAL: this API may change, or be removed, without prior notice
1353  *
1354  * A structure used to retrieve information of queue based PFC.
1355  */
1356 struct rte_eth_pfc_queue_info {
1357 	/**
1358 	 * Maximum supported traffic class as per PFC (802.1Qbb) specification.
1359 	 */
1360 	uint8_t tc_max;
1361 	/** PFC queue mode capabilities. */
1362 	enum rte_eth_fc_mode mode_capa;
1363 };
1364 
1365 /**
1366  * @warning
1367  * @b EXPERIMENTAL: this API may change, or be removed, without prior notice
1368  *
1369  * A structure used to configure Ethernet priority flow control parameters for
1370  * ethdev queues.
1371  *
1372  * rte_eth_pfc_queue_conf::rx_pause structure shall be used to configure given
1373  * tx_qid with corresponding tc. When ethdev device receives PFC frame with
1374  * rte_eth_pfc_queue_conf::rx_pause::tc, traffic will be paused on
1375  * rte_eth_pfc_queue_conf::rx_pause::tx_qid for that tc.
1376  *
1377  * rte_eth_pfc_queue_conf::tx_pause structure shall be used to configure given
1378  * rx_qid. When rx_qid is congested, PFC frames are generated with
1379  * rte_eth_pfc_queue_conf::rx_pause::tc and
1380  * rte_eth_pfc_queue_conf::rx_pause::pause_time to the peer.
1381  */
1382 struct rte_eth_pfc_queue_conf {
1383 	enum rte_eth_fc_mode mode; /**< Link flow control mode */
1384 
1385 	struct {
1386 		uint16_t tx_qid; /**< Tx queue ID */
1387 		/** Traffic class as per PFC (802.1Qbb) spec. The value must be
1388 		 * in the range [0, rte_eth_pfc_queue_info::tx_max - 1]
1389 		 */
1390 		uint8_t tc;
1391 	} rx_pause; /* Valid when (mode == FC_RX_PAUSE || mode == FC_FULL) */
1392 
1393 	struct {
1394 		uint16_t pause_time; /**< Pause quota in the Pause frame */
1395 		uint16_t rx_qid;     /**< Rx queue ID */
1396 		/** Traffic class as per PFC (802.1Qbb) spec. The value must be
1397 		 * in the range [0, rte_eth_pfc_queue_info::tx_max - 1]
1398 		 */
1399 		uint8_t tc;
1400 	} tx_pause; /* Valid when (mode == FC_TX_PAUSE || mode == FC_FULL) */
1401 };
1402 
1403 /**
1404  * Tunnel type for device-specific classifier configuration.
1405  * @see rte_eth_udp_tunnel
1406  */
1407 enum rte_eth_tunnel_type {
1408 	RTE_ETH_TUNNEL_TYPE_NONE = 0,
1409 	RTE_ETH_TUNNEL_TYPE_VXLAN,
1410 	RTE_ETH_TUNNEL_TYPE_GENEVE,
1411 	RTE_ETH_TUNNEL_TYPE_TEREDO,
1412 	RTE_ETH_TUNNEL_TYPE_NVGRE,
1413 	RTE_ETH_TUNNEL_TYPE_IP_IN_GRE,
1414 	RTE_ETH_L2_TUNNEL_TYPE_E_TAG,
1415 	RTE_ETH_TUNNEL_TYPE_VXLAN_GPE,
1416 	RTE_ETH_TUNNEL_TYPE_ECPRI,
1417 	RTE_ETH_TUNNEL_TYPE_MAX,
1418 };
1419 
1420 /* Deprecated API file for rte_eth_dev_filter_* functions */
1421 #include "rte_eth_ctrl.h"
1422 
1423 /**
1424  * UDP tunneling configuration.
1425  *
1426  * Used to configure the classifier of a device,
1427  * associating an UDP port with a type of tunnel.
1428  *
1429  * Some NICs may need such configuration to properly parse a tunnel
1430  * with any standard or custom UDP port.
1431  */
1432 struct rte_eth_udp_tunnel {
1433 	uint16_t udp_port; /**< UDP port used for the tunnel. */
1434 	uint8_t prot_type; /**< Tunnel type. @see rte_eth_tunnel_type */
1435 };
1436 
1437 /**
1438  * A structure used to enable/disable specific device interrupts.
1439  */
1440 struct rte_eth_intr_conf {
1441 	/** enable/disable lsc interrupt. 0 (default) - disable, 1 enable */
1442 	uint32_t lsc:1;
1443 	/** enable/disable rxq interrupt. 0 (default) - disable, 1 enable */
1444 	uint32_t rxq:1;
1445 	/** enable/disable rmv interrupt. 0 (default) - disable, 1 enable */
1446 	uint32_t rmv:1;
1447 };
1448 
1449 #define rte_intr_conf rte_eth_intr_conf
1450 
1451 /**
1452  * A structure used to configure an Ethernet port.
1453  * Depending upon the Rx multi-queue mode, extra advanced
1454  * configuration settings may be needed.
1455  */
1456 struct rte_eth_conf {
1457 	uint32_t link_speeds; /**< bitmap of RTE_ETH_LINK_SPEED_XXX of speeds to be
1458 				used. RTE_ETH_LINK_SPEED_FIXED disables link
1459 				autonegotiation, and a unique speed shall be
1460 				set. Otherwise, the bitmap defines the set of
1461 				speeds to be advertised. If the special value
1462 				RTE_ETH_LINK_SPEED_AUTONEG (0) is used, all speeds
1463 				supported are advertised. */
1464 	struct rte_eth_rxmode rxmode; /**< Port Rx configuration. */
1465 	struct rte_eth_txmode txmode; /**< Port Tx configuration. */
1466 	uint32_t lpbk_mode; /**< Loopback operation mode. By default the value
1467 			         is 0, meaning the loopback mode is disabled.
1468 				 Read the datasheet of given Ethernet controller
1469 				 for details. The possible values of this field
1470 				 are defined in implementation of each driver. */
1471 	struct {
1472 		struct rte_eth_rss_conf rss_conf; /**< Port RSS configuration */
1473 		/** Port VMDq+DCB configuration. */
1474 		struct rte_eth_vmdq_dcb_conf vmdq_dcb_conf;
1475 		/** Port DCB Rx configuration. */
1476 		struct rte_eth_dcb_rx_conf dcb_rx_conf;
1477 		/** Port VMDq Rx configuration. */
1478 		struct rte_eth_vmdq_rx_conf vmdq_rx_conf;
1479 	} rx_adv_conf; /**< Port Rx filtering configuration. */
1480 	union {
1481 		/** Port VMDq+DCB Tx configuration. */
1482 		struct rte_eth_vmdq_dcb_tx_conf vmdq_dcb_tx_conf;
1483 		/** Port DCB Tx configuration. */
1484 		struct rte_eth_dcb_tx_conf dcb_tx_conf;
1485 		/** Port VMDq Tx configuration. */
1486 		struct rte_eth_vmdq_tx_conf vmdq_tx_conf;
1487 	} tx_adv_conf; /**< Port Tx DCB configuration (union). */
1488 	/** Currently,Priority Flow Control(PFC) are supported,if DCB with PFC
1489 	    is needed,and the variable must be set RTE_ETH_DCB_PFC_SUPPORT. */
1490 	uint32_t dcb_capability_en;
1491 	struct rte_eth_intr_conf intr_conf; /**< Interrupt mode configuration. */
1492 };
1493 
1494 /**
1495  * Rx offload capabilities of a device.
1496  */
1497 #define RTE_ETH_RX_OFFLOAD_VLAN_STRIP       RTE_BIT64(0)
1498 #define RTE_ETH_RX_OFFLOAD_IPV4_CKSUM       RTE_BIT64(1)
1499 #define RTE_ETH_RX_OFFLOAD_UDP_CKSUM        RTE_BIT64(2)
1500 #define RTE_ETH_RX_OFFLOAD_TCP_CKSUM        RTE_BIT64(3)
1501 #define RTE_ETH_RX_OFFLOAD_TCP_LRO          RTE_BIT64(4)
1502 #define RTE_ETH_RX_OFFLOAD_QINQ_STRIP       RTE_BIT64(5)
1503 #define RTE_ETH_RX_OFFLOAD_OUTER_IPV4_CKSUM RTE_BIT64(6)
1504 #define RTE_ETH_RX_OFFLOAD_MACSEC_STRIP     RTE_BIT64(7)
1505 #define RTE_ETH_RX_OFFLOAD_VLAN_FILTER      RTE_BIT64(9)
1506 #define RTE_ETH_RX_OFFLOAD_VLAN_EXTEND      RTE_BIT64(10)
1507 #define RTE_ETH_RX_OFFLOAD_SCATTER          RTE_BIT64(13)
1508 /**
1509  * Timestamp is set by the driver in RTE_MBUF_DYNFIELD_TIMESTAMP_NAME
1510  * and RTE_MBUF_DYNFLAG_RX_TIMESTAMP_NAME is set in ol_flags.
1511  * The mbuf field and flag are registered when the offload is configured.
1512  */
1513 #define RTE_ETH_RX_OFFLOAD_TIMESTAMP        RTE_BIT64(14)
1514 #define RTE_ETH_RX_OFFLOAD_SECURITY         RTE_BIT64(15)
1515 #define RTE_ETH_RX_OFFLOAD_KEEP_CRC         RTE_BIT64(16)
1516 #define RTE_ETH_RX_OFFLOAD_SCTP_CKSUM       RTE_BIT64(17)
1517 #define RTE_ETH_RX_OFFLOAD_OUTER_UDP_CKSUM  RTE_BIT64(18)
1518 #define RTE_ETH_RX_OFFLOAD_RSS_HASH         RTE_BIT64(19)
1519 #define RTE_ETH_RX_OFFLOAD_BUFFER_SPLIT     RTE_BIT64(20)
1520 
1521 #define RTE_ETH_RX_OFFLOAD_CHECKSUM (RTE_ETH_RX_OFFLOAD_IPV4_CKSUM | \
1522 				 RTE_ETH_RX_OFFLOAD_UDP_CKSUM | \
1523 				 RTE_ETH_RX_OFFLOAD_TCP_CKSUM)
1524 #define RTE_ETH_RX_OFFLOAD_VLAN (RTE_ETH_RX_OFFLOAD_VLAN_STRIP | \
1525 			     RTE_ETH_RX_OFFLOAD_VLAN_FILTER | \
1526 			     RTE_ETH_RX_OFFLOAD_VLAN_EXTEND | \
1527 			     RTE_ETH_RX_OFFLOAD_QINQ_STRIP)
1528 
1529 /*
1530  * If new Rx offload capabilities are defined, they also must be
1531  * mentioned in rte_rx_offload_names in rte_ethdev.c file.
1532  */
1533 
1534 /**
1535  * Tx offload capabilities of a device.
1536  */
1537 #define RTE_ETH_TX_OFFLOAD_VLAN_INSERT      RTE_BIT64(0)
1538 #define RTE_ETH_TX_OFFLOAD_IPV4_CKSUM       RTE_BIT64(1)
1539 #define RTE_ETH_TX_OFFLOAD_UDP_CKSUM        RTE_BIT64(2)
1540 #define RTE_ETH_TX_OFFLOAD_TCP_CKSUM        RTE_BIT64(3)
1541 #define RTE_ETH_TX_OFFLOAD_SCTP_CKSUM       RTE_BIT64(4)
1542 #define RTE_ETH_TX_OFFLOAD_TCP_TSO          RTE_BIT64(5)
1543 #define RTE_ETH_TX_OFFLOAD_UDP_TSO          RTE_BIT64(6)
1544 #define RTE_ETH_TX_OFFLOAD_OUTER_IPV4_CKSUM RTE_BIT64(7)  /**< Used for tunneling packet. */
1545 #define RTE_ETH_TX_OFFLOAD_QINQ_INSERT      RTE_BIT64(8)
1546 #define RTE_ETH_TX_OFFLOAD_VXLAN_TNL_TSO    RTE_BIT64(9)  /**< Used for tunneling packet. */
1547 #define RTE_ETH_TX_OFFLOAD_GRE_TNL_TSO      RTE_BIT64(10) /**< Used for tunneling packet. */
1548 #define RTE_ETH_TX_OFFLOAD_IPIP_TNL_TSO     RTE_BIT64(11) /**< Used for tunneling packet. */
1549 #define RTE_ETH_TX_OFFLOAD_GENEVE_TNL_TSO   RTE_BIT64(12) /**< Used for tunneling packet. */
1550 #define RTE_ETH_TX_OFFLOAD_MACSEC_INSERT    RTE_BIT64(13)
1551 /**
1552  * Multiple threads can invoke rte_eth_tx_burst() concurrently on the same
1553  * Tx queue without SW lock.
1554  */
1555 #define RTE_ETH_TX_OFFLOAD_MT_LOCKFREE      RTE_BIT64(14)
1556 /** Device supports multi segment send. */
1557 #define RTE_ETH_TX_OFFLOAD_MULTI_SEGS       RTE_BIT64(15)
1558 /**
1559  * Device supports optimization for fast release of mbufs.
1560  * When set application must guarantee that per-queue all mbufs comes from
1561  * the same mempool and has refcnt = 1.
1562  */
1563 #define RTE_ETH_TX_OFFLOAD_MBUF_FAST_FREE   RTE_BIT64(16)
1564 #define RTE_ETH_TX_OFFLOAD_SECURITY         RTE_BIT64(17)
1565 /**
1566  * Device supports generic UDP tunneled packet TSO.
1567  * Application must set RTE_MBUF_F_TX_TUNNEL_UDP and other mbuf fields required
1568  * for tunnel TSO.
1569  */
1570 #define RTE_ETH_TX_OFFLOAD_UDP_TNL_TSO      RTE_BIT64(18)
1571 /**
1572  * Device supports generic IP tunneled packet TSO.
1573  * Application must set RTE_MBUF_F_TX_TUNNEL_IP and other mbuf fields required
1574  * for tunnel TSO.
1575  */
1576 #define RTE_ETH_TX_OFFLOAD_IP_TNL_TSO       RTE_BIT64(19)
1577 /** Device supports outer UDP checksum */
1578 #define RTE_ETH_TX_OFFLOAD_OUTER_UDP_CKSUM  RTE_BIT64(20)
1579 /**
1580  * Device sends on time read from RTE_MBUF_DYNFIELD_TIMESTAMP_NAME
1581  * if RTE_MBUF_DYNFLAG_TX_TIMESTAMP_NAME is set in ol_flags.
1582  * The mbuf field and flag are registered when the offload is configured.
1583  */
1584 #define RTE_ETH_TX_OFFLOAD_SEND_ON_TIMESTAMP RTE_BIT64(21)
1585 /*
1586  * If new Tx offload capabilities are defined, they also must be
1587  * mentioned in rte_tx_offload_names in rte_ethdev.c file.
1588  */
1589 
1590 /**@{@name Device capabilities
1591  * Non-offload capabilities reported in rte_eth_dev_info.dev_capa.
1592  */
1593 /** Device supports Rx queue setup after device started. */
1594 #define RTE_ETH_DEV_CAPA_RUNTIME_RX_QUEUE_SETUP RTE_BIT64(0)
1595 /** Device supports Tx queue setup after device started. */
1596 #define RTE_ETH_DEV_CAPA_RUNTIME_TX_QUEUE_SETUP RTE_BIT64(1)
1597 /**
1598  * Device supports shared Rx queue among ports within Rx domain and
1599  * switch domain. Mbufs are consumed by shared Rx queue instead of
1600  * each queue. Multiple groups are supported by share_group of Rx
1601  * queue configuration. Shared Rx queue is identified by PMD using
1602  * share_qid of Rx queue configuration. Polling any port in the group
1603  * receive packets of all member ports, source port identified by
1604  * mbuf->port field.
1605  */
1606 #define RTE_ETH_DEV_CAPA_RXQ_SHARE              RTE_BIT64(2)
1607 /** Device supports keeping flow rules across restart. */
1608 #define RTE_ETH_DEV_CAPA_FLOW_RULE_KEEP         RTE_BIT64(3)
1609 /** Device supports keeping shared flow objects across restart. */
1610 #define RTE_ETH_DEV_CAPA_FLOW_SHARED_OBJECT_KEEP RTE_BIT64(4)
1611 /**@}*/
1612 
1613 /*
1614  * Fallback default preferred Rx/Tx port parameters.
1615  * These are used if an application requests default parameters
1616  * but the PMD does not provide preferred values.
1617  */
1618 #define RTE_ETH_DEV_FALLBACK_RX_RINGSIZE 512
1619 #define RTE_ETH_DEV_FALLBACK_TX_RINGSIZE 512
1620 #define RTE_ETH_DEV_FALLBACK_RX_NBQUEUES 1
1621 #define RTE_ETH_DEV_FALLBACK_TX_NBQUEUES 1
1622 
1623 /**
1624  * Preferred Rx/Tx port parameters.
1625  * There are separate instances of this structure for transmission
1626  * and reception respectively.
1627  */
1628 struct rte_eth_dev_portconf {
1629 	uint16_t burst_size; /**< Device-preferred burst size */
1630 	uint16_t ring_size; /**< Device-preferred size of queue rings */
1631 	uint16_t nb_queues; /**< Device-preferred number of queues */
1632 };
1633 
1634 /**
1635  * Default values for switch domain ID when ethdev does not support switch
1636  * domain definitions.
1637  */
1638 #define RTE_ETH_DEV_SWITCH_DOMAIN_ID_INVALID	(UINT16_MAX)
1639 
1640 /**
1641  * Ethernet device associated switch information
1642  */
1643 struct rte_eth_switch_info {
1644 	const char *name;	/**< switch name */
1645 	uint16_t domain_id;	/**< switch domain ID */
1646 	/**
1647 	 * Mapping to the devices physical switch port as enumerated from the
1648 	 * perspective of the embedded interconnect/switch. For SR-IOV enabled
1649 	 * device this may correspond to the VF_ID of each virtual function,
1650 	 * but each driver should explicitly define the mapping of switch
1651 	 * port identifier to that physical interconnect/switch
1652 	 */
1653 	uint16_t port_id;
1654 	/**
1655 	 * Shared Rx queue sub-domain boundary. Only ports in same Rx domain
1656 	 * and switch domain can share Rx queue. Valid only if device advertised
1657 	 * RTE_ETH_DEV_CAPA_RXQ_SHARE capability.
1658 	 */
1659 	uint16_t rx_domain;
1660 };
1661 
1662 /**
1663  * @warning
1664  * @b EXPERIMENTAL: this structure may change without prior notice.
1665  *
1666  * Ethernet device Rx buffer segmentation capabilities.
1667  */
1668 struct rte_eth_rxseg_capa {
1669 	__extension__
1670 	uint32_t multi_pools:1; /**< Supports receiving to multiple pools.*/
1671 	uint32_t offset_allowed:1; /**< Supports buffer offsets. */
1672 	uint32_t offset_align_log2:4; /**< Required offset alignment. */
1673 	uint16_t max_nseg; /**< Maximum amount of segments to split. */
1674 	uint16_t reserved; /**< Reserved field. */
1675 };
1676 
1677 /**
1678  * Ethernet device information
1679  */
1680 
1681 /**
1682  * Ethernet device representor port type.
1683  */
1684 enum rte_eth_representor_type {
1685 	RTE_ETH_REPRESENTOR_NONE, /**< not a representor. */
1686 	RTE_ETH_REPRESENTOR_VF,   /**< representor of Virtual Function. */
1687 	RTE_ETH_REPRESENTOR_SF,   /**< representor of Sub Function. */
1688 	RTE_ETH_REPRESENTOR_PF,   /**< representor of Physical Function. */
1689 };
1690 
1691 /**
1692  * @warning
1693  * @b EXPERIMENTAL: this enumeration may change without prior notice.
1694  *
1695  * Ethernet device error handling mode.
1696  */
1697 enum rte_eth_err_handle_mode {
1698 	/** No error handling modes are supported. */
1699 	RTE_ETH_ERROR_HANDLE_MODE_NONE,
1700 	/** Passive error handling, after the PMD detects that a reset is required,
1701 	 * the PMD reports @see RTE_ETH_EVENT_INTR_RESET event,
1702 	 * and the application invokes @see rte_eth_dev_reset to recover the port.
1703 	 */
1704 	RTE_ETH_ERROR_HANDLE_MODE_PASSIVE,
1705 	/** Proactive error handling, after the PMD detects that a reset is required,
1706 	 * the PMD reports @see RTE_ETH_EVENT_ERR_RECOVERING event,
1707 	 * do recovery internally, and finally reports the recovery result event
1708 	 * (@see RTE_ETH_EVENT_RECOVERY_*).
1709 	 */
1710 	RTE_ETH_ERROR_HANDLE_MODE_PROACTIVE,
1711 };
1712 
1713 /**
1714  * A structure used to retrieve the contextual information of
1715  * an Ethernet device, such as the controlling driver of the
1716  * device, etc...
1717  */
1718 struct rte_eth_dev_info {
1719 	struct rte_device *device; /**< Generic device information */
1720 	const char *driver_name; /**< Device Driver name. */
1721 	unsigned int if_index; /**< Index to bound host interface, or 0 if none.
1722 		Use if_indextoname() to translate into an interface name. */
1723 	uint16_t min_mtu;	/**< Minimum MTU allowed */
1724 	uint16_t max_mtu;	/**< Maximum MTU allowed */
1725 	const uint32_t *dev_flags; /**< Device flags */
1726 	uint32_t min_rx_bufsize; /**< Minimum size of Rx buffer. */
1727 	uint32_t max_rx_pktlen; /**< Maximum configurable length of Rx pkt. */
1728 	/** Maximum configurable size of LRO aggregated packet. */
1729 	uint32_t max_lro_pkt_size;
1730 	uint16_t max_rx_queues; /**< Maximum number of Rx queues. */
1731 	uint16_t max_tx_queues; /**< Maximum number of Tx queues. */
1732 	uint32_t max_mac_addrs; /**< Maximum number of MAC addresses. */
1733 	/** Maximum number of hash MAC addresses for MTA and UTA. */
1734 	uint32_t max_hash_mac_addrs;
1735 	uint16_t max_vfs; /**< Maximum number of VFs. */
1736 	uint16_t max_vmdq_pools; /**< Maximum number of VMDq pools. */
1737 	struct rte_eth_rxseg_capa rx_seg_capa; /**< Segmentation capability.*/
1738 	/** All Rx offload capabilities including all per-queue ones */
1739 	uint64_t rx_offload_capa;
1740 	/** All Tx offload capabilities including all per-queue ones */
1741 	uint64_t tx_offload_capa;
1742 	/** Device per-queue Rx offload capabilities. */
1743 	uint64_t rx_queue_offload_capa;
1744 	/** Device per-queue Tx offload capabilities. */
1745 	uint64_t tx_queue_offload_capa;
1746 	/** Device redirection table size, the total number of entries. */
1747 	uint16_t reta_size;
1748 	uint8_t hash_key_size; /**< Hash key size in bytes */
1749 	/** Bit mask of RSS offloads, the bit offset also means flow type */
1750 	uint64_t flow_type_rss_offloads;
1751 	struct rte_eth_rxconf default_rxconf; /**< Default Rx configuration */
1752 	struct rte_eth_txconf default_txconf; /**< Default Tx configuration */
1753 	uint16_t vmdq_queue_base; /**< First queue ID for VMDq pools. */
1754 	uint16_t vmdq_queue_num;  /**< Queue number for VMDq pools. */
1755 	uint16_t vmdq_pool_base;  /**< First ID of VMDq pools. */
1756 	struct rte_eth_desc_lim rx_desc_lim;  /**< Rx descriptors limits */
1757 	struct rte_eth_desc_lim tx_desc_lim;  /**< Tx descriptors limits */
1758 	uint32_t speed_capa;  /**< Supported speeds bitmap (RTE_ETH_LINK_SPEED_). */
1759 	/** Configured number of Rx/Tx queues */
1760 	uint16_t nb_rx_queues; /**< Number of Rx queues. */
1761 	uint16_t nb_tx_queues; /**< Number of Tx queues. */
1762 	/**
1763 	 * Maximum number of Rx mempools supported per Rx queue.
1764 	 *
1765 	 * Value greater than 0 means that the driver supports Rx queue
1766 	 * mempools specification via rx_conf->rx_mempools.
1767 	 */
1768 	uint16_t max_rx_mempools;
1769 	/** Rx parameter recommendations */
1770 	struct rte_eth_dev_portconf default_rxportconf;
1771 	/** Tx parameter recommendations */
1772 	struct rte_eth_dev_portconf default_txportconf;
1773 	/** Generic device capabilities (RTE_ETH_DEV_CAPA_). */
1774 	uint64_t dev_capa;
1775 	/**
1776 	 * Switching information for ports on a device with a
1777 	 * embedded managed interconnect/switch.
1778 	 */
1779 	struct rte_eth_switch_info switch_info;
1780 	/** Supported error handling mode. */
1781 	enum rte_eth_err_handle_mode err_handle_mode;
1782 
1783 	uint64_t reserved_64s[2]; /**< Reserved for future fields */
1784 	void *reserved_ptrs[2];   /**< Reserved for future fields */
1785 };
1786 
1787 /**@{@name Rx/Tx queue states */
1788 #define RTE_ETH_QUEUE_STATE_STOPPED 0 /**< Queue stopped. */
1789 #define RTE_ETH_QUEUE_STATE_STARTED 1 /**< Queue started. */
1790 #define RTE_ETH_QUEUE_STATE_HAIRPIN 2 /**< Queue used for hairpin. */
1791 /**@}*/
1792 
1793 /**
1794  * Ethernet device Rx queue information structure.
1795  * Used to retrieve information about configured queue.
1796  */
1797 struct rte_eth_rxq_info {
1798 	struct rte_mempool *mp;     /**< mempool used by that queue. */
1799 	struct rte_eth_rxconf conf; /**< queue config parameters. */
1800 	uint8_t scattered_rx;       /**< scattered packets Rx supported. */
1801 	uint8_t queue_state;        /**< one of RTE_ETH_QUEUE_STATE_*. */
1802 	uint16_t nb_desc;           /**< configured number of RXDs. */
1803 	uint16_t rx_buf_size;       /**< hardware receive buffer size. */
1804 	/**
1805 	 * Available Rx descriptors threshold defined as percentage
1806 	 * of Rx queue size. If number of available descriptors is lower,
1807 	 * the event RTE_ETH_EVENT_RX_AVAIL_THESH is generated.
1808 	 * Value 0 means that the threshold monitoring is disabled.
1809 	 */
1810 	uint8_t avail_thresh;
1811 } __rte_cache_min_aligned;
1812 
1813 /**
1814  * Ethernet device Tx queue information structure.
1815  * Used to retrieve information about configured queue.
1816  */
1817 struct rte_eth_txq_info {
1818 	struct rte_eth_txconf conf; /**< queue config parameters. */
1819 	uint16_t nb_desc;           /**< configured number of TXDs. */
1820 	uint8_t queue_state;        /**< one of RTE_ETH_QUEUE_STATE_*. */
1821 } __rte_cache_min_aligned;
1822 
1823 /**
1824  * @warning
1825  * @b EXPERIMENTAL: this structure may change without prior notice.
1826  *
1827  * Ethernet device Rx queue information structure for recycling mbufs.
1828  * Used to retrieve Rx queue information when Tx queue reusing mbufs and moving
1829  * them into Rx mbuf ring.
1830  */
1831 struct rte_eth_recycle_rxq_info {
1832 	struct rte_mbuf **mbuf_ring; /**< mbuf ring of Rx queue. */
1833 	struct rte_mempool *mp;     /**< mempool of Rx queue. */
1834 	uint16_t *refill_head;      /**< head of Rx queue refilling mbufs. */
1835 	uint16_t *receive_tail;     /**< tail of Rx queue receiving pkts. */
1836 	uint16_t mbuf_ring_size;     /**< configured number of mbuf ring size. */
1837 	/**
1838 	 * Requirement on mbuf refilling batch size of Rx mbuf ring.
1839 	 * For some PMD drivers, the number of Rx mbuf ring refilling mbufs
1840 	 * should be aligned with mbuf ring size, in order to simplify
1841 	 * ring wrapping around.
1842 	 * Value 0 means that PMD drivers have no requirement for this.
1843 	 */
1844 	uint16_t refill_requirement;
1845 } __rte_cache_min_aligned;
1846 
1847 /* Generic Burst mode flag definition, values can be ORed. */
1848 
1849 /**
1850  * If the queues have different burst mode description, this bit will be set
1851  * by PMD, then the application can iterate to retrieve burst description for
1852  * all other queues.
1853  */
1854 #define RTE_ETH_BURST_FLAG_PER_QUEUE RTE_BIT64(0)
1855 
1856 /**
1857  * Ethernet device Rx/Tx queue packet burst mode information structure.
1858  * Used to retrieve information about packet burst mode setting.
1859  */
1860 struct rte_eth_burst_mode {
1861 	uint64_t flags; /**< The ORed values of RTE_ETH_BURST_FLAG_xxx */
1862 
1863 #define RTE_ETH_BURST_MODE_INFO_SIZE 1024 /**< Maximum size for information */
1864 	char info[RTE_ETH_BURST_MODE_INFO_SIZE]; /**< burst mode information */
1865 };
1866 
1867 /** Maximum name length for extended statistics counters */
1868 #define RTE_ETH_XSTATS_NAME_SIZE 64
1869 
1870 /**
1871  * An Ethernet device extended statistic structure
1872  *
1873  * This structure is used by rte_eth_xstats_get() to provide
1874  * statistics that are not provided in the generic *rte_eth_stats*
1875  * structure.
1876  * It maps a name ID, corresponding to an index in the array returned
1877  * by rte_eth_xstats_get_names(), to a statistic value.
1878  */
1879 struct rte_eth_xstat {
1880 	uint64_t id;        /**< The index in xstats name array. */
1881 	uint64_t value;     /**< The statistic counter value. */
1882 };
1883 
1884 /**
1885  * A name element for extended statistics.
1886  *
1887  * An array of this structure is returned by rte_eth_xstats_get_names().
1888  * It lists the names of extended statistics for a PMD. The *rte_eth_xstat*
1889  * structure references these names by their array index.
1890  *
1891  * The xstats should follow a common naming scheme.
1892  * Some names are standardized in rte_stats_strings.
1893  * Examples:
1894  *     - rx_missed_errors
1895  *     - tx_q3_bytes
1896  *     - tx_size_128_to_255_packets
1897  */
1898 struct rte_eth_xstat_name {
1899 	char name[RTE_ETH_XSTATS_NAME_SIZE]; /**< The statistic name. */
1900 };
1901 
1902 #define RTE_ETH_DCB_NUM_TCS    8
1903 #define RTE_ETH_MAX_VMDQ_POOL  64
1904 
1905 /**
1906  * A structure used to get the information of queue and
1907  * TC mapping on both Tx and Rx paths.
1908  */
1909 struct rte_eth_dcb_tc_queue_mapping {
1910 	/** Rx queues assigned to tc per Pool */
1911 	struct {
1912 		uint16_t base;
1913 		uint16_t nb_queue;
1914 	} tc_rxq[RTE_ETH_MAX_VMDQ_POOL][RTE_ETH_DCB_NUM_TCS];
1915 	/** Rx queues assigned to tc per Pool */
1916 	struct {
1917 		uint16_t base;
1918 		uint16_t nb_queue;
1919 	} tc_txq[RTE_ETH_MAX_VMDQ_POOL][RTE_ETH_DCB_NUM_TCS];
1920 };
1921 
1922 /**
1923  * A structure used to get the information of DCB.
1924  * It includes TC UP mapping and queue TC mapping.
1925  */
1926 struct rte_eth_dcb_info {
1927 	uint8_t nb_tcs;        /**< number of TCs */
1928 	uint8_t prio_tc[RTE_ETH_DCB_NUM_USER_PRIORITIES]; /**< Priority to tc */
1929 	uint8_t tc_bws[RTE_ETH_DCB_NUM_TCS]; /**< Tx BW percentage for each TC */
1930 	/** Rx queues assigned to tc */
1931 	struct rte_eth_dcb_tc_queue_mapping tc_queue;
1932 };
1933 
1934 /**
1935  * This enum indicates the possible Forward Error Correction (FEC) modes
1936  * of an ethdev port.
1937  */
1938 enum rte_eth_fec_mode {
1939 	RTE_ETH_FEC_NOFEC = 0,      /**< FEC is off */
1940 	RTE_ETH_FEC_AUTO,	    /**< FEC autonegotiation modes */
1941 	RTE_ETH_FEC_BASER,          /**< FEC using common algorithm */
1942 	RTE_ETH_FEC_RS,             /**< FEC using RS algorithm */
1943 	RTE_ETH_FEC_LLRS,           /**< FEC using LLRS algorithm */
1944 };
1945 
1946 /* Translate from FEC mode to FEC capa */
1947 #define RTE_ETH_FEC_MODE_TO_CAPA(x) RTE_BIT32(x)
1948 
1949 /* This macro indicates FEC capa mask */
1950 #define RTE_ETH_FEC_MODE_CAPA_MASK(x) RTE_BIT32(RTE_ETH_FEC_ ## x)
1951 
1952 /* A structure used to get capabilities per link speed */
1953 struct rte_eth_fec_capa {
1954 	uint32_t speed; /**< Link speed (see RTE_ETH_SPEED_NUM_*) */
1955 	uint32_t capa;  /**< FEC capabilities bitmask */
1956 };
1957 
1958 #define RTE_ETH_ALL RTE_MAX_ETHPORTS
1959 
1960 /* Macros to check for valid port */
1961 #define RTE_ETH_VALID_PORTID_OR_ERR_RET(port_id, retval) do { \
1962 	if (!rte_eth_dev_is_valid_port(port_id)) { \
1963 		RTE_ETHDEV_LOG(ERR, "Invalid port_id=%u\n", port_id); \
1964 		return retval; \
1965 	} \
1966 } while (0)
1967 
1968 #define RTE_ETH_VALID_PORTID_OR_RET(port_id) do { \
1969 	if (!rte_eth_dev_is_valid_port(port_id)) { \
1970 		RTE_ETHDEV_LOG(ERR, "Invalid port_id=%u\n", port_id); \
1971 		return; \
1972 	} \
1973 } while (0)
1974 
1975 /**
1976  * Function type used for Rx packet processing packet callbacks.
1977  *
1978  * The callback function is called on Rx with a burst of packets that have
1979  * been received on the given port and queue.
1980  *
1981  * @param port_id
1982  *   The Ethernet port on which Rx is being performed.
1983  * @param queue
1984  *   The queue on the Ethernet port which is being used to receive the packets.
1985  * @param pkts
1986  *   The burst of packets that have just been received.
1987  * @param nb_pkts
1988  *   The number of packets in the burst pointed to by "pkts".
1989  * @param max_pkts
1990  *   The max number of packets that can be stored in the "pkts" array.
1991  * @param user_param
1992  *   The arbitrary user parameter passed in by the application when the callback
1993  *   was originally configured.
1994  * @return
1995  *   The number of packets returned to the user.
1996  */
1997 typedef uint16_t (*rte_rx_callback_fn)(uint16_t port_id, uint16_t queue,
1998 	struct rte_mbuf *pkts[], uint16_t nb_pkts, uint16_t max_pkts,
1999 	void *user_param);
2000 
2001 /**
2002  * Function type used for Tx packet processing packet callbacks.
2003  *
2004  * The callback function is called on Tx with a burst of packets immediately
2005  * before the packets are put onto the hardware queue for transmission.
2006  *
2007  * @param port_id
2008  *   The Ethernet port on which Tx is being performed.
2009  * @param queue
2010  *   The queue on the Ethernet port which is being used to transmit the packets.
2011  * @param pkts
2012  *   The burst of packets that are about to be transmitted.
2013  * @param nb_pkts
2014  *   The number of packets in the burst pointed to by "pkts".
2015  * @param user_param
2016  *   The arbitrary user parameter passed in by the application when the callback
2017  *   was originally configured.
2018  * @return
2019  *   The number of packets to be written to the NIC.
2020  */
2021 typedef uint16_t (*rte_tx_callback_fn)(uint16_t port_id, uint16_t queue,
2022 	struct rte_mbuf *pkts[], uint16_t nb_pkts, void *user_param);
2023 
2024 /**
2025  * Possible states of an ethdev port.
2026  */
2027 enum rte_eth_dev_state {
2028 	/** Device is unused before being probed. */
2029 	RTE_ETH_DEV_UNUSED = 0,
2030 	/** Device is attached when allocated in probing. */
2031 	RTE_ETH_DEV_ATTACHED,
2032 	/** Device is in removed state when plug-out is detected. */
2033 	RTE_ETH_DEV_REMOVED,
2034 };
2035 
2036 struct rte_eth_dev_sriov {
2037 	uint8_t active;               /**< SRIOV is active with 16, 32 or 64 pools */
2038 	uint8_t nb_q_per_pool;        /**< Rx queue number per pool */
2039 	uint16_t def_vmdq_idx;        /**< Default pool num used for PF */
2040 	uint16_t def_pool_q_idx;      /**< Default pool queue start reg index */
2041 };
2042 #define RTE_ETH_DEV_SRIOV(dev)         ((dev)->data->sriov)
2043 
2044 #define RTE_ETH_NAME_MAX_LEN RTE_DEV_NAME_MAX_LEN
2045 
2046 #define RTE_ETH_DEV_NO_OWNER 0
2047 
2048 #define RTE_ETH_MAX_OWNER_NAME_LEN 64
2049 
2050 struct rte_eth_dev_owner {
2051 	uint64_t id; /**< The owner unique identifier. */
2052 	char name[RTE_ETH_MAX_OWNER_NAME_LEN]; /**< The owner name. */
2053 };
2054 
2055 /**@{@name Device flags
2056  * Flags internally saved in rte_eth_dev_data.dev_flags
2057  * and reported in rte_eth_dev_info.dev_flags.
2058  */
2059 /** PMD supports thread-safe flow operations */
2060 #define RTE_ETH_DEV_FLOW_OPS_THREAD_SAFE  RTE_BIT32(0)
2061 /** Device supports link state interrupt */
2062 #define RTE_ETH_DEV_INTR_LSC              RTE_BIT32(1)
2063 /** Device is a bonding member */
2064 #define RTE_ETH_DEV_BONDING_MEMBER        RTE_BIT32(2)
2065 /** Device supports device removal interrupt */
2066 #define RTE_ETH_DEV_INTR_RMV              RTE_BIT32(3)
2067 /** Device is port representor */
2068 #define RTE_ETH_DEV_REPRESENTOR           RTE_BIT32(4)
2069 /** Device does not support MAC change after started */
2070 #define RTE_ETH_DEV_NOLIVE_MAC_ADDR       RTE_BIT32(5)
2071 /**
2072  * Queue xstats filled automatically by ethdev layer.
2073  * PMDs filling the queue xstats themselves should not set this flag
2074  */
2075 #define RTE_ETH_DEV_AUTOFILL_QUEUE_XSTATS RTE_BIT32(6)
2076 /**@}*/
2077 
2078 /**
2079  * Iterates over valid ethdev ports owned by a specific owner.
2080  *
2081  * @param port_id
2082  *   The ID of the next possible valid owned port.
2083  * @param	owner_id
2084  *  The owner identifier.
2085  *  RTE_ETH_DEV_NO_OWNER means iterate over all valid ownerless ports.
2086  * @return
2087  *   Next valid port ID owned by owner_id, RTE_MAX_ETHPORTS if there is none.
2088  */
2089 uint64_t rte_eth_find_next_owned_by(uint16_t port_id,
2090 		const uint64_t owner_id);
2091 
2092 /**
2093  * Macro to iterate over all enabled ethdev ports owned by a specific owner.
2094  */
2095 #define RTE_ETH_FOREACH_DEV_OWNED_BY(p, o) \
2096 	for (p = rte_eth_find_next_owned_by(0, o); \
2097 	     (unsigned int)p < (unsigned int)RTE_MAX_ETHPORTS; \
2098 	     p = rte_eth_find_next_owned_by(p + 1, o))
2099 
2100 /**
2101  * Iterates over valid ethdev ports.
2102  *
2103  * @param port_id
2104  *   The ID of the next possible valid port.
2105  * @return
2106  *   Next valid port ID, RTE_MAX_ETHPORTS if there is none.
2107  */
2108 uint16_t rte_eth_find_next(uint16_t port_id);
2109 
2110 /**
2111  * Macro to iterate over all enabled and ownerless ethdev ports.
2112  */
2113 #define RTE_ETH_FOREACH_DEV(p) \
2114 	RTE_ETH_FOREACH_DEV_OWNED_BY(p, RTE_ETH_DEV_NO_OWNER)
2115 
2116 /**
2117  * Iterates over ethdev ports of a specified device.
2118  *
2119  * @param port_id_start
2120  *   The ID of the next possible valid port.
2121  * @param parent
2122  *   The generic device behind the ports to iterate.
2123  * @return
2124  *   Next port ID of the device, possibly port_id_start,
2125  *   RTE_MAX_ETHPORTS if there is none.
2126  */
2127 uint16_t
2128 rte_eth_find_next_of(uint16_t port_id_start,
2129 		const struct rte_device *parent);
2130 
2131 /**
2132  * Macro to iterate over all ethdev ports of a specified device.
2133  *
2134  * @param port_id
2135  *   The ID of the matching port being iterated.
2136  * @param parent
2137  *   The rte_device pointer matching the iterated ports.
2138  */
2139 #define RTE_ETH_FOREACH_DEV_OF(port_id, parent) \
2140 	for (port_id = rte_eth_find_next_of(0, parent); \
2141 		port_id < RTE_MAX_ETHPORTS; \
2142 		port_id = rte_eth_find_next_of(port_id + 1, parent))
2143 
2144 /**
2145  * Iterates over sibling ethdev ports (i.e. sharing the same rte_device).
2146  *
2147  * @param port_id_start
2148  *   The ID of the next possible valid sibling port.
2149  * @param ref_port_id
2150  *   The ID of a reference port to compare rte_device with.
2151  * @return
2152  *   Next sibling port ID, possibly port_id_start or ref_port_id itself,
2153  *   RTE_MAX_ETHPORTS if there is none.
2154  */
2155 uint16_t
2156 rte_eth_find_next_sibling(uint16_t port_id_start, uint16_t ref_port_id);
2157 
2158 /**
2159  * Macro to iterate over all ethdev ports sharing the same rte_device
2160  * as the specified port.
2161  * Note: the specified reference port is part of the loop iterations.
2162  *
2163  * @param port_id
2164  *   The ID of the matching port being iterated.
2165  * @param ref_port_id
2166  *   The ID of the port being compared.
2167  */
2168 #define RTE_ETH_FOREACH_DEV_SIBLING(port_id, ref_port_id) \
2169 	for (port_id = rte_eth_find_next_sibling(0, ref_port_id); \
2170 		port_id < RTE_MAX_ETHPORTS; \
2171 		port_id = rte_eth_find_next_sibling(port_id + 1, ref_port_id))
2172 
2173 /**
2174  * Get a new unique owner identifier.
2175  * An owner identifier is used to owns Ethernet devices by only one DPDK entity
2176  * to avoid multiple management of device by different entities.
2177  *
2178  * @param	owner_id
2179  *   Owner identifier pointer.
2180  * @return
2181  *   Negative errno value on error, 0 on success.
2182  */
2183 int rte_eth_dev_owner_new(uint64_t *owner_id);
2184 
2185 /**
2186  * Set an Ethernet device owner.
2187  *
2188  * @param	port_id
2189  *  The identifier of the port to own.
2190  * @param	owner
2191  *  The owner pointer.
2192  * @return
2193  *  Negative errno value on error, 0 on success.
2194  */
2195 int rte_eth_dev_owner_set(const uint16_t port_id,
2196 		const struct rte_eth_dev_owner *owner);
2197 
2198 /**
2199  * Unset Ethernet device owner to make the device ownerless.
2200  *
2201  * @param	port_id
2202  *  The identifier of port to make ownerless.
2203  * @param	owner_id
2204  *  The owner identifier.
2205  * @return
2206  *  0 on success, negative errno value on error.
2207  */
2208 int rte_eth_dev_owner_unset(const uint16_t port_id,
2209 		const uint64_t owner_id);
2210 
2211 /**
2212  * Remove owner from all Ethernet devices owned by a specific owner.
2213  *
2214  * @param	owner_id
2215  *  The owner identifier.
2216  * @return
2217  *  0 on success, negative errno value on error.
2218  */
2219 int rte_eth_dev_owner_delete(const uint64_t owner_id);
2220 
2221 /**
2222  * Get the owner of an Ethernet device.
2223  *
2224  * @param	port_id
2225  *  The port identifier.
2226  * @param	owner
2227  *  The owner structure pointer to fill.
2228  * @return
2229  *  0 on success, negative errno value on error..
2230  */
2231 int rte_eth_dev_owner_get(const uint16_t port_id,
2232 		struct rte_eth_dev_owner *owner);
2233 
2234 /**
2235  * Get the number of ports which are usable for the application.
2236  *
2237  * These devices must be iterated by using the macro
2238  * ``RTE_ETH_FOREACH_DEV`` or ``RTE_ETH_FOREACH_DEV_OWNED_BY``
2239  * to deal with non-contiguous ranges of devices.
2240  *
2241  * @return
2242  *   The count of available Ethernet devices.
2243  */
2244 uint16_t rte_eth_dev_count_avail(void);
2245 
2246 /**
2247  * Get the total number of ports which are allocated.
2248  *
2249  * Some devices may not be available for the application.
2250  *
2251  * @return
2252  *   The total count of Ethernet devices.
2253  */
2254 uint16_t rte_eth_dev_count_total(void);
2255 
2256 /**
2257  * Convert a numerical speed in Mbps to a bitmap flag that can be used in
2258  * the bitmap link_speeds of the struct rte_eth_conf
2259  *
2260  * @param speed
2261  *   Numerical speed value in Mbps
2262  * @param duplex
2263  *   RTE_ETH_LINK_[HALF/FULL]_DUPLEX (only for 10/100M speeds)
2264  * @return
2265  *   0 if the speed cannot be mapped
2266  */
2267 uint32_t rte_eth_speed_bitflag(uint32_t speed, int duplex);
2268 
2269 /**
2270  * Get RTE_ETH_RX_OFFLOAD_* flag name.
2271  *
2272  * @param offload
2273  *   Offload flag.
2274  * @return
2275  *   Offload name or 'UNKNOWN' if the flag cannot be recognised.
2276  */
2277 const char *rte_eth_dev_rx_offload_name(uint64_t offload);
2278 
2279 /**
2280  * Get RTE_ETH_TX_OFFLOAD_* flag name.
2281  *
2282  * @param offload
2283  *   Offload flag.
2284  * @return
2285  *   Offload name or 'UNKNOWN' if the flag cannot be recognised.
2286  */
2287 const char *rte_eth_dev_tx_offload_name(uint64_t offload);
2288 
2289 /**
2290  * @warning
2291  * @b EXPERIMENTAL: this API may change without prior notice.
2292  *
2293  * Get RTE_ETH_DEV_CAPA_* flag name.
2294  *
2295  * @param capability
2296  *   Capability flag.
2297  * @return
2298  *   Capability name or 'UNKNOWN' if the flag cannot be recognized.
2299  */
2300 __rte_experimental
2301 const char *rte_eth_dev_capability_name(uint64_t capability);
2302 
2303 /**
2304  * Configure an Ethernet device.
2305  * This function must be invoked first before any other function in the
2306  * Ethernet API. This function can also be re-invoked when a device is in the
2307  * stopped state.
2308  *
2309  * @param port_id
2310  *   The port identifier of the Ethernet device to configure.
2311  * @param nb_rx_queue
2312  *   The number of receive queues to set up for the Ethernet device.
2313  * @param nb_tx_queue
2314  *   The number of transmit queues to set up for the Ethernet device.
2315  * @param eth_conf
2316  *   The pointer to the configuration data to be used for the Ethernet device.
2317  *   The *rte_eth_conf* structure includes:
2318  *     -  the hardware offload features to activate, with dedicated fields for
2319  *        each statically configurable offload hardware feature provided by
2320  *        Ethernet devices, such as IP checksum or VLAN tag stripping for
2321  *        example.
2322  *        The Rx offload bitfield API is obsolete and will be deprecated.
2323  *        Applications should set the ignore_bitfield_offloads bit on *rxmode*
2324  *        structure and use offloads field to set per-port offloads instead.
2325  *     -  Any offloading set in eth_conf->[rt]xmode.offloads must be within
2326  *        the [rt]x_offload_capa returned from rte_eth_dev_info_get().
2327  *        Any type of device supported offloading set in the input argument
2328  *        eth_conf->[rt]xmode.offloads to rte_eth_dev_configure() is enabled
2329  *        on all queues and it can't be disabled in rte_eth_[rt]x_queue_setup()
2330  *     -  the Receive Side Scaling (RSS) configuration when using multiple Rx
2331  *        queues per port. Any RSS hash function set in eth_conf->rss_conf.rss_hf
2332  *        must be within the flow_type_rss_offloads provided by drivers via
2333  *        rte_eth_dev_info_get() API.
2334  *
2335  *   Embedding all configuration information in a single data structure
2336  *   is the more flexible method that allows the addition of new features
2337  *   without changing the syntax of the API.
2338  * @return
2339  *   - 0: Success, device configured.
2340  *   - <0: Error code returned by the driver configuration function.
2341  */
2342 int rte_eth_dev_configure(uint16_t port_id, uint16_t nb_rx_queue,
2343 		uint16_t nb_tx_queue, const struct rte_eth_conf *eth_conf);
2344 
2345 /**
2346  * Check if an Ethernet device was physically removed.
2347  *
2348  * @param port_id
2349  *   The port identifier of the Ethernet device.
2350  * @return
2351  *   1 when the Ethernet device is removed, otherwise 0.
2352  */
2353 int
2354 rte_eth_dev_is_removed(uint16_t port_id);
2355 
2356 /**
2357  * Allocate and set up a receive queue for an Ethernet device.
2358  *
2359  * The function allocates a contiguous block of memory for *nb_rx_desc*
2360  * receive descriptors from a memory zone associated with *socket_id*
2361  * and initializes each receive descriptor with a network buffer allocated
2362  * from the memory pool *mb_pool*.
2363  *
2364  * @param port_id
2365  *   The port identifier of the Ethernet device.
2366  * @param rx_queue_id
2367  *   The index of the receive queue to set up.
2368  *   The value must be in the range [0, nb_rx_queue - 1] previously supplied
2369  *   to rte_eth_dev_configure().
2370  * @param nb_rx_desc
2371  *   The number of receive descriptors to allocate for the receive ring.
2372  * @param socket_id
2373  *   The *socket_id* argument is the socket identifier in case of NUMA.
2374  *   The value can be *SOCKET_ID_ANY* if there is no NUMA constraint for
2375  *   the DMA memory allocated for the receive descriptors of the ring.
2376  * @param rx_conf
2377  *   The pointer to the configuration data to be used for the receive queue.
2378  *   NULL value is allowed, in which case default Rx configuration
2379  *   will be used.
2380  *   The *rx_conf* structure contains an *rx_thresh* structure with the values
2381  *   of the Prefetch, Host, and Write-Back threshold registers of the receive
2382  *   ring.
2383  *   In addition it contains the hardware offloads features to activate using
2384  *   the RTE_ETH_RX_OFFLOAD_* flags.
2385  *   If an offloading set in rx_conf->offloads
2386  *   hasn't been set in the input argument eth_conf->rxmode.offloads
2387  *   to rte_eth_dev_configure(), it is a new added offloading, it must be
2388  *   per-queue type and it is enabled for the queue.
2389  *   No need to repeat any bit in rx_conf->offloads which has already been
2390  *   enabled in rte_eth_dev_configure() at port level. An offloading enabled
2391  *   at port level can't be disabled at queue level.
2392  *   The configuration structure also contains the pointer to the array
2393  *   of the receiving buffer segment descriptions, see rx_seg and rx_nseg
2394  *   fields, this extended configuration might be used by split offloads like
2395  *   RTE_ETH_RX_OFFLOAD_BUFFER_SPLIT. If mb_pool is not NULL,
2396  *   the extended configuration fields must be set to NULL and zero.
2397  * @param mb_pool
2398  *   The pointer to the memory pool from which to allocate *rte_mbuf* network
2399  *   memory buffers to populate each descriptor of the receive ring. There are
2400  *   two options to provide Rx buffer configuration:
2401  *   - single pool:
2402  *     mb_pool is not NULL, rx_conf.rx_nseg is 0.
2403  *   - multiple segments description:
2404  *     mb_pool is NULL, rx_conf.rx_seg is not NULL, rx_conf.rx_nseg is not 0.
2405  *     Taken only if flag RTE_ETH_RX_OFFLOAD_BUFFER_SPLIT is set in offloads.
2406  *
2407  * @return
2408  *   - 0: Success, receive queue correctly set up.
2409  *   - -EIO: if device is removed.
2410  *   - -ENODEV: if *port_id* is invalid.
2411  *   - -EINVAL: The memory pool pointer is null or the size of network buffers
2412  *      which can be allocated from this memory pool does not fit the various
2413  *      buffer sizes allowed by the device controller.
2414  *   - -ENOMEM: Unable to allocate the receive ring descriptors or to
2415  *      allocate network memory buffers from the memory pool when
2416  *      initializing receive descriptors.
2417  */
2418 int rte_eth_rx_queue_setup(uint16_t port_id, uint16_t rx_queue_id,
2419 		uint16_t nb_rx_desc, unsigned int socket_id,
2420 		const struct rte_eth_rxconf *rx_conf,
2421 		struct rte_mempool *mb_pool);
2422 
2423 /**
2424  * @warning
2425  * @b EXPERIMENTAL: this API may change, or be removed, without prior notice
2426  *
2427  * Allocate and set up a hairpin receive queue for an Ethernet device.
2428  *
2429  * The function set up the selected queue to be used in hairpin.
2430  *
2431  * @param port_id
2432  *   The port identifier of the Ethernet device.
2433  * @param rx_queue_id
2434  *   The index of the receive queue to set up.
2435  *   The value must be in the range [0, nb_rx_queue - 1] previously supplied
2436  *   to rte_eth_dev_configure().
2437  * @param nb_rx_desc
2438  *   The number of receive descriptors to allocate for the receive ring.
2439  *   0 means the PMD will use default value.
2440  * @param conf
2441  *   The pointer to the hairpin configuration.
2442  *
2443  * @return
2444  *   - (0) if successful.
2445  *   - (-ENODEV) if *port_id* is invalid.
2446  *   - (-ENOTSUP) if hardware doesn't support.
2447  *   - (-EINVAL) if bad parameter.
2448  *   - (-ENOMEM) if unable to allocate the resources.
2449  */
2450 __rte_experimental
2451 int rte_eth_rx_hairpin_queue_setup
2452 	(uint16_t port_id, uint16_t rx_queue_id, uint16_t nb_rx_desc,
2453 	 const struct rte_eth_hairpin_conf *conf);
2454 
2455 /**
2456  * Allocate and set up a transmit queue for an Ethernet device.
2457  *
2458  * @param port_id
2459  *   The port identifier of the Ethernet device.
2460  * @param tx_queue_id
2461  *   The index of the transmit queue to set up.
2462  *   The value must be in the range [0, nb_tx_queue - 1] previously supplied
2463  *   to rte_eth_dev_configure().
2464  * @param nb_tx_desc
2465  *   The number of transmit descriptors to allocate for the transmit ring.
2466  * @param socket_id
2467  *   The *socket_id* argument is the socket identifier in case of NUMA.
2468  *   Its value can be *SOCKET_ID_ANY* if there is no NUMA constraint for
2469  *   the DMA memory allocated for the transmit descriptors of the ring.
2470  * @param tx_conf
2471  *   The pointer to the configuration data to be used for the transmit queue.
2472  *   NULL value is allowed, in which case default Tx configuration
2473  *   will be used.
2474  *   The *tx_conf* structure contains the following data:
2475  *   - The *tx_thresh* structure with the values of the Prefetch, Host, and
2476  *     Write-Back threshold registers of the transmit ring.
2477  *     When setting Write-Back threshold to the value greater then zero,
2478  *     *tx_rs_thresh* value should be explicitly set to one.
2479  *   - The *tx_free_thresh* value indicates the [minimum] number of network
2480  *     buffers that must be pending in the transmit ring to trigger their
2481  *     [implicit] freeing by the driver transmit function.
2482  *   - The *tx_rs_thresh* value indicates the [minimum] number of transmit
2483  *     descriptors that must be pending in the transmit ring before setting the
2484  *     RS bit on a descriptor by the driver transmit function.
2485  *     The *tx_rs_thresh* value should be less or equal then
2486  *     *tx_free_thresh* value, and both of them should be less then
2487  *     *nb_tx_desc* - 3.
2488  *   - The *offloads* member contains Tx offloads to be enabled.
2489  *     If an offloading set in tx_conf->offloads
2490  *     hasn't been set in the input argument eth_conf->txmode.offloads
2491  *     to rte_eth_dev_configure(), it is a new added offloading, it must be
2492  *     per-queue type and it is enabled for the queue.
2493  *     No need to repeat any bit in tx_conf->offloads which has already been
2494  *     enabled in rte_eth_dev_configure() at port level. An offloading enabled
2495  *     at port level can't be disabled at queue level.
2496  *
2497  *     Note that setting *tx_free_thresh* or *tx_rs_thresh* value to 0 forces
2498  *     the transmit function to use default values.
2499  * @return
2500  *   - 0: Success, the transmit queue is correctly set up.
2501  *   - -ENOMEM: Unable to allocate the transmit ring descriptors.
2502  */
2503 int rte_eth_tx_queue_setup(uint16_t port_id, uint16_t tx_queue_id,
2504 		uint16_t nb_tx_desc, unsigned int socket_id,
2505 		const struct rte_eth_txconf *tx_conf);
2506 
2507 /**
2508  * @warning
2509  * @b EXPERIMENTAL: this API may change, or be removed, without prior notice
2510  *
2511  * Allocate and set up a transmit hairpin queue for an Ethernet device.
2512  *
2513  * @param port_id
2514  *   The port identifier of the Ethernet device.
2515  * @param tx_queue_id
2516  *   The index of the transmit queue to set up.
2517  *   The value must be in the range [0, nb_tx_queue - 1] previously supplied
2518  *   to rte_eth_dev_configure().
2519  * @param nb_tx_desc
2520  *   The number of transmit descriptors to allocate for the transmit ring.
2521  *   0 to set default PMD value.
2522  * @param conf
2523  *   The hairpin configuration.
2524  *
2525  * @return
2526  *   - (0) if successful.
2527  *   - (-ENODEV) if *port_id* is invalid.
2528  *   - (-ENOTSUP) if hardware doesn't support.
2529  *   - (-EINVAL) if bad parameter.
2530  *   - (-ENOMEM) if unable to allocate the resources.
2531  */
2532 __rte_experimental
2533 int rte_eth_tx_hairpin_queue_setup
2534 	(uint16_t port_id, uint16_t tx_queue_id, uint16_t nb_tx_desc,
2535 	 const struct rte_eth_hairpin_conf *conf);
2536 
2537 /**
2538  * @warning
2539  * @b EXPERIMENTAL: this API may change, or be removed, without prior notice
2540  *
2541  * Get all the hairpin peer Rx / Tx ports of the current port.
2542  * The caller should ensure that the array is large enough to save the ports
2543  * list.
2544  *
2545  * @param port_id
2546  *   The port identifier of the Ethernet device.
2547  * @param peer_ports
2548  *   Pointer to the array to store the peer ports list.
2549  * @param len
2550  *   Length of the array to store the port identifiers.
2551  * @param direction
2552  *   Current port to peer port direction
2553  *   positive - current used as Tx to get all peer Rx ports.
2554  *   zero - current used as Rx to get all peer Tx ports.
2555  *
2556  * @return
2557  *   - (0 or positive) actual peer ports number.
2558  *   - (-EINVAL) if bad parameter.
2559  *   - (-ENODEV) if *port_id* invalid
2560  *   - (-ENOTSUP) if hardware doesn't support.
2561  *   - Others detailed errors from PMDs.
2562  */
2563 __rte_experimental
2564 int rte_eth_hairpin_get_peer_ports(uint16_t port_id, uint16_t *peer_ports,
2565 				   size_t len, uint32_t direction);
2566 
2567 /**
2568  * @warning
2569  * @b EXPERIMENTAL: this API may change, or be removed, without prior notice
2570  *
2571  * Bind all hairpin Tx queues of one port to the Rx queues of the peer port.
2572  * It is only allowed to call this function after all hairpin queues are
2573  * configured properly and the devices are in started state.
2574  *
2575  * @param tx_port
2576  *   The identifier of the Tx port.
2577  * @param rx_port
2578  *   The identifier of peer Rx port.
2579  *   RTE_MAX_ETHPORTS is allowed for the traversal of all devices.
2580  *   Rx port ID could have the same value as Tx port ID.
2581  *
2582  * @return
2583  *   - (0) if successful.
2584  *   - (-ENODEV) if Tx port ID is invalid.
2585  *   - (-EBUSY) if device is not in started state.
2586  *   - (-ENOTSUP) if hardware doesn't support.
2587  *   - Others detailed errors from PMDs.
2588  */
2589 __rte_experimental
2590 int rte_eth_hairpin_bind(uint16_t tx_port, uint16_t rx_port);
2591 
2592 /**
2593  * @warning
2594  * @b EXPERIMENTAL: this API may change, or be removed, without prior notice
2595  *
2596  * Unbind all hairpin Tx queues of one port from the Rx queues of the peer port.
2597  * This should be called before closing the Tx or Rx devices, if the bind
2598  * function is called before.
2599  * After unbinding the hairpin ports pair, it is allowed to bind them again.
2600  * Changing queues configuration should be after stopping the device(s).
2601  *
2602  * @param tx_port
2603  *   The identifier of the Tx port.
2604  * @param rx_port
2605  *   The identifier of peer Rx port.
2606  *   RTE_MAX_ETHPORTS is allowed for traversal of all devices.
2607  *   Rx port ID could have the same value as Tx port ID.
2608  *
2609  * @return
2610  *   - (0) if successful.
2611  *   - (-ENODEV) if Tx port ID is invalid.
2612  *   - (-EBUSY) if device is in stopped state.
2613  *   - (-ENOTSUP) if hardware doesn't support.
2614  *   - Others detailed errors from PMDs.
2615  */
2616 __rte_experimental
2617 int rte_eth_hairpin_unbind(uint16_t tx_port, uint16_t rx_port);
2618 
2619 /**
2620  * @warning
2621  * @b EXPERIMENTAL: this API may change without prior notice.
2622  *
2623  *  Get the number of aggregated ports of the DPDK port (specified with port_id).
2624  *  It is used when multiple ports are aggregated into a single one.
2625  *
2626  *  For the regular physical port doesn't have aggregated ports,
2627  *  the number of aggregated ports is reported as 0.
2628  *
2629  * @param port_id
2630  *   The port identifier of the Ethernet device.
2631  * @return
2632  *   - (>=0) the number of aggregated port if success.
2633  */
2634 __rte_experimental
2635 int rte_eth_dev_count_aggr_ports(uint16_t port_id);
2636 
2637 /**
2638  * @warning
2639  * @b EXPERIMENTAL: this API may change without prior notice.
2640  *
2641  *  Map a Tx queue with an aggregated port of the DPDK port (specified with port_id).
2642  *  When multiple ports are aggregated into a single one,
2643  *  it allows to choose which port to use for Tx via a queue.
2644  *
2645  *  The application should use rte_eth_dev_map_aggr_tx_affinity()
2646  *  after rte_eth_dev_configure(), rte_eth_tx_queue_setup(), and
2647  *  before rte_eth_dev_start().
2648  *
2649  * @param port_id
2650  *   The identifier of the port used in rte_eth_tx_burst().
2651  * @param tx_queue_id
2652  *   The index of the transmit queue used in rte_eth_tx_burst().
2653  *   The value must be in the range [0, nb_tx_queue - 1] previously supplied
2654  *   to rte_eth_dev_configure().
2655  * @param affinity
2656  *   The number of the aggregated port.
2657  *   Value 0 means no affinity and traffic could be routed to any aggregated port.
2658  *   The first aggregated port is number 1 and so on.
2659  *   The maximum number is given by rte_eth_dev_count_aggr_ports().
2660  *
2661  * @return
2662  *   Zero if successful. Non-zero otherwise.
2663  */
2664 __rte_experimental
2665 int rte_eth_dev_map_aggr_tx_affinity(uint16_t port_id, uint16_t tx_queue_id,
2666 				     uint8_t affinity);
2667 
2668 /**
2669  * Return the NUMA socket to which an Ethernet device is connected
2670  *
2671  * @param port_id
2672  *   The port identifier of the Ethernet device
2673  * @return
2674  *   - The NUMA socket ID which the Ethernet device is connected to.
2675  *   - -1 (which translates to SOCKET_ID_ANY) if the socket could not be
2676  *     determined. rte_errno is then set to:
2677  *     - EINVAL is the port_id is invalid,
2678  *     - 0 is the socket could not be determined,
2679  */
2680 int rte_eth_dev_socket_id(uint16_t port_id);
2681 
2682 /**
2683  * Check if port_id of device is attached
2684  *
2685  * @param port_id
2686  *   The port identifier of the Ethernet device
2687  * @return
2688  *   - 0 if port is out of range or not attached
2689  *   - 1 if device is attached
2690  */
2691 int rte_eth_dev_is_valid_port(uint16_t port_id);
2692 
2693 /**
2694  * @warning
2695  * @b EXPERIMENTAL: this API may change, or be removed, without prior notice.
2696  *
2697  * Check if Rx queue is valid.
2698  * If the queue has been setup, it is considered valid.
2699  *
2700  * @param port_id
2701  *   The port identifier of the Ethernet device.
2702  * @param queue_id
2703  *   The index of the receive queue.
2704  * @return
2705  *   - -ENODEV: if port_id is invalid.
2706  *   - -EINVAL: if queue_id is out of range or queue has not been setup.
2707  *   - 0 if Rx queue is valid.
2708  */
2709 __rte_experimental
2710 int rte_eth_rx_queue_is_valid(uint16_t port_id, uint16_t queue_id);
2711 
2712 /**
2713  * @warning
2714  * @b EXPERIMENTAL: this API may change, or be removed, without prior notice.
2715  *
2716  * Check if Tx queue is valid.
2717  * If the queue has been setup, it is considered valid.
2718  *
2719  * @param port_id
2720  *   The port identifier of the Ethernet device.
2721  * @param queue_id
2722  *   The index of the transmit queue.
2723  * @return
2724  *   - -ENODEV: if port_id is invalid.
2725  *   - -EINVAL: if queue_id is out of range or queue has not been setup.
2726  *   - 0 if Tx queue is valid.
2727  */
2728 __rte_experimental
2729 int rte_eth_tx_queue_is_valid(uint16_t port_id, uint16_t queue_id);
2730 
2731 /**
2732  * Start specified Rx queue of a port. It is used when rx_deferred_start
2733  * flag of the specified queue is true.
2734  *
2735  * @param port_id
2736  *   The port identifier of the Ethernet device
2737  * @param rx_queue_id
2738  *   The index of the Rx queue to update the ring.
2739  *   The value must be in the range [0, nb_rx_queue - 1] previously supplied
2740  *   to rte_eth_dev_configure().
2741  * @return
2742  *   - 0: Success, the receive queue is started.
2743  *   - -ENODEV: if *port_id* is invalid.
2744  *   - -EINVAL: The queue_id out of range or belong to hairpin.
2745  *   - -EIO: if device is removed.
2746  *   - -ENOTSUP: The function not supported in PMD.
2747  */
2748 int rte_eth_dev_rx_queue_start(uint16_t port_id, uint16_t rx_queue_id);
2749 
2750 /**
2751  * Stop specified Rx queue of a port
2752  *
2753  * @param port_id
2754  *   The port identifier of the Ethernet device
2755  * @param rx_queue_id
2756  *   The index of the Rx queue to update the ring.
2757  *   The value must be in the range [0, nb_rx_queue - 1] previously supplied
2758  *   to rte_eth_dev_configure().
2759  * @return
2760  *   - 0: Success, the receive queue is stopped.
2761  *   - -ENODEV: if *port_id* is invalid.
2762  *   - -EINVAL: The queue_id out of range or belong to hairpin.
2763  *   - -EIO: if device is removed.
2764  *   - -ENOTSUP: The function not supported in PMD.
2765  */
2766 int rte_eth_dev_rx_queue_stop(uint16_t port_id, uint16_t rx_queue_id);
2767 
2768 /**
2769  * Start Tx for specified queue of a port. It is used when tx_deferred_start
2770  * flag of the specified queue is true.
2771  *
2772  * @param port_id
2773  *   The port identifier of the Ethernet device
2774  * @param tx_queue_id
2775  *   The index of the Tx queue to update the ring.
2776  *   The value must be in the range [0, nb_tx_queue - 1] previously supplied
2777  *   to rte_eth_dev_configure().
2778  * @return
2779  *   - 0: Success, the transmit queue is started.
2780  *   - -ENODEV: if *port_id* is invalid.
2781  *   - -EINVAL: The queue_id out of range or belong to hairpin.
2782  *   - -EIO: if device is removed.
2783  *   - -ENOTSUP: The function not supported in PMD.
2784  */
2785 int rte_eth_dev_tx_queue_start(uint16_t port_id, uint16_t tx_queue_id);
2786 
2787 /**
2788  * Stop specified Tx queue of a port
2789  *
2790  * @param port_id
2791  *   The port identifier of the Ethernet device
2792  * @param tx_queue_id
2793  *   The index of the Tx queue to update the ring.
2794  *   The value must be in the range [0, nb_tx_queue - 1] previously supplied
2795  *   to rte_eth_dev_configure().
2796  * @return
2797  *   - 0: Success, the transmit queue is stopped.
2798  *   - -ENODEV: if *port_id* is invalid.
2799  *   - -EINVAL: The queue_id out of range or belong to hairpin.
2800  *   - -EIO: if device is removed.
2801  *   - -ENOTSUP: The function not supported in PMD.
2802  */
2803 int rte_eth_dev_tx_queue_stop(uint16_t port_id, uint16_t tx_queue_id);
2804 
2805 /**
2806  * Start an Ethernet device.
2807  *
2808  * The device start step is the last one and consists of setting the configured
2809  * offload features and in starting the transmit and the receive units of the
2810  * device.
2811  *
2812  * Device RTE_ETH_DEV_NOLIVE_MAC_ADDR flag causes MAC address to be set before
2813  * PMD port start callback function is invoked.
2814  *
2815  * On success, all basic functions exported by the Ethernet API (link status,
2816  * receive/transmit, and so on) can be invoked.
2817  *
2818  * @param port_id
2819  *   The port identifier of the Ethernet device.
2820  * @return
2821  *   - 0: Success, Ethernet device started.
2822  *   - -EAGAIN: If start operation must be retried.
2823  *   - <0: Error code of the driver device start function.
2824  */
2825 int rte_eth_dev_start(uint16_t port_id);
2826 
2827 /**
2828  * Stop an Ethernet device. The device can be restarted with a call to
2829  * rte_eth_dev_start()
2830  *
2831  * @param port_id
2832  *   The port identifier of the Ethernet device.
2833  * @return
2834  *   - 0: Success, Ethernet device stopped.
2835  *   - -EBUSY: If stopping the port is not allowed in current state.
2836  *   - <0: Error code of the driver device stop function.
2837  */
2838 int rte_eth_dev_stop(uint16_t port_id);
2839 
2840 /**
2841  * Link up an Ethernet device.
2842  *
2843  * Set device link up will re-enable the device Rx/Tx
2844  * functionality after it is previously set device linked down.
2845  *
2846  * @param port_id
2847  *   The port identifier of the Ethernet device.
2848  * @return
2849  *   - 0: Success, Ethernet device linked up.
2850  *   - <0: Error code of the driver device link up function.
2851  */
2852 int rte_eth_dev_set_link_up(uint16_t port_id);
2853 
2854 /**
2855  * Link down an Ethernet device.
2856  * The device Rx/Tx functionality will be disabled if success,
2857  * and it can be re-enabled with a call to
2858  * rte_eth_dev_set_link_up()
2859  *
2860  * @param port_id
2861  *   The port identifier of the Ethernet device.
2862  */
2863 int rte_eth_dev_set_link_down(uint16_t port_id);
2864 
2865 /**
2866  * Close a stopped Ethernet device. The device cannot be restarted!
2867  * The function frees all port resources.
2868  *
2869  * @param port_id
2870  *   The port identifier of the Ethernet device.
2871  * @return
2872  *   - Zero if the port is closed successfully.
2873  *   - Negative if something went wrong.
2874  */
2875 int rte_eth_dev_close(uint16_t port_id);
2876 
2877 /**
2878  * Reset a Ethernet device and keep its port ID.
2879  *
2880  * When a port has to be reset passively, the DPDK application can invoke
2881  * this function. For example when a PF is reset, all its VFs should also
2882  * be reset. Normally a DPDK application can invoke this function when
2883  * RTE_ETH_EVENT_INTR_RESET event is detected, but can also use it to start
2884  * a port reset in other circumstances.
2885  *
2886  * When this function is called, it first stops the port and then calls the
2887  * PMD specific dev_uninit( ) and dev_init( ) to return the port to initial
2888  * state, in which no Tx and Rx queues are setup, as if the port has been
2889  * reset and not started. The port keeps the port ID it had before the
2890  * function call.
2891  *
2892  * After calling rte_eth_dev_reset( ), the application should use
2893  * rte_eth_dev_configure( ), rte_eth_rx_queue_setup( ),
2894  * rte_eth_tx_queue_setup( ), and rte_eth_dev_start( )
2895  * to reconfigure the device as appropriate.
2896  *
2897  * Note: To avoid unexpected behavior, the application should stop calling
2898  * Tx and Rx functions before calling rte_eth_dev_reset( ). For thread
2899  * safety, all these controlling functions should be called from the same
2900  * thread.
2901  *
2902  * @param port_id
2903  *   The port identifier of the Ethernet device.
2904  *
2905  * @return
2906  *   - (0) if successful.
2907  *   - (-ENODEV) if *port_id* is invalid.
2908  *   - (-ENOTSUP) if hardware doesn't support this function.
2909  *   - (-EPERM) if not ran from the primary process.
2910  *   - (-EIO) if re-initialisation failed or device is removed.
2911  *   - (-ENOMEM) if the reset failed due to OOM.
2912  *   - (-EAGAIN) if the reset temporarily failed and should be retried later.
2913  */
2914 int rte_eth_dev_reset(uint16_t port_id);
2915 
2916 /**
2917  * Enable receipt in promiscuous mode for an Ethernet device.
2918  *
2919  * @param port_id
2920  *   The port identifier of the Ethernet device.
2921  * @return
2922  *   - (0) if successful.
2923  *   - (-ENOTSUP) if support for promiscuous_enable() does not exist
2924  *     for the device.
2925  *   - (-ENODEV) if *port_id* invalid.
2926  */
2927 int rte_eth_promiscuous_enable(uint16_t port_id);
2928 
2929 /**
2930  * Disable receipt in promiscuous mode for an Ethernet device.
2931  *
2932  * @param port_id
2933  *   The port identifier of the Ethernet device.
2934  * @return
2935  *   - (0) if successful.
2936  *   - (-ENOTSUP) if support for promiscuous_disable() does not exist
2937  *     for the device.
2938  *   - (-ENODEV) if *port_id* invalid.
2939  */
2940 int rte_eth_promiscuous_disable(uint16_t port_id);
2941 
2942 /**
2943  * Return the value of promiscuous mode for an Ethernet device.
2944  *
2945  * @param port_id
2946  *   The port identifier of the Ethernet device.
2947  * @return
2948  *   - (1) if promiscuous is enabled
2949  *   - (0) if promiscuous is disabled.
2950  *   - (-1) on error
2951  */
2952 int rte_eth_promiscuous_get(uint16_t port_id);
2953 
2954 /**
2955  * Enable the receipt of any multicast frame by an Ethernet device.
2956  *
2957  * @param port_id
2958  *   The port identifier of the Ethernet device.
2959  * @return
2960  *   - (0) if successful.
2961  *   - (-ENOTSUP) if support for allmulticast_enable() does not exist
2962  *     for the device.
2963  *   - (-ENODEV) if *port_id* invalid.
2964  */
2965 int rte_eth_allmulticast_enable(uint16_t port_id);
2966 
2967 /**
2968  * Disable the receipt of all multicast frames by an Ethernet device.
2969  *
2970  * @param port_id
2971  *   The port identifier of the Ethernet device.
2972  * @return
2973  *   - (0) if successful.
2974  *   - (-ENOTSUP) if support for allmulticast_disable() does not exist
2975  *     for the device.
2976  *   - (-ENODEV) if *port_id* invalid.
2977  */
2978 int rte_eth_allmulticast_disable(uint16_t port_id);
2979 
2980 /**
2981  * Return the value of allmulticast mode for an Ethernet device.
2982  *
2983  * @param port_id
2984  *   The port identifier of the Ethernet device.
2985  * @return
2986  *   - (1) if allmulticast is enabled
2987  *   - (0) if allmulticast is disabled.
2988  *   - (-1) on error
2989  */
2990 int rte_eth_allmulticast_get(uint16_t port_id);
2991 
2992 /**
2993  * Retrieve the link status (up/down), the duplex mode (half/full),
2994  * the negotiation (auto/fixed), and if available, the speed (Mbps).
2995  *
2996  * It might need to wait up to 9 seconds.
2997  * @see rte_eth_link_get_nowait.
2998  *
2999  * @param port_id
3000  *   The port identifier of the Ethernet device.
3001  * @param link
3002  *   Link information written back.
3003  * @return
3004  *   - (0) if successful.
3005  *   - (-ENOTSUP) if the function is not supported in PMD.
3006  *   - (-ENODEV) if *port_id* invalid.
3007  *   - (-EINVAL) if bad parameter.
3008  */
3009 int rte_eth_link_get(uint16_t port_id, struct rte_eth_link *link);
3010 
3011 /**
3012  * Retrieve the link status (up/down), the duplex mode (half/full),
3013  * the negotiation (auto/fixed), and if available, the speed (Mbps).
3014  *
3015  * @param port_id
3016  *   The port identifier of the Ethernet device.
3017  * @param link
3018  *   Link information written back.
3019  * @return
3020  *   - (0) if successful.
3021  *   - (-ENOTSUP) if the function is not supported in PMD.
3022  *   - (-ENODEV) if *port_id* invalid.
3023  *   - (-EINVAL) if bad parameter.
3024  */
3025 int rte_eth_link_get_nowait(uint16_t port_id, struct rte_eth_link *link);
3026 
3027 /**
3028  * @warning
3029  * @b EXPERIMENTAL: this API may change without prior notice.
3030  *
3031  * The function converts a link_speed to a string. It handles all special
3032  * values like unknown or none speed.
3033  *
3034  * @param link_speed
3035  *   link_speed of rte_eth_link struct
3036  * @return
3037  *   Link speed in textual format. It's pointer to immutable memory.
3038  *   No free is required.
3039  */
3040 __rte_experimental
3041 const char *rte_eth_link_speed_to_str(uint32_t link_speed);
3042 
3043 /**
3044  * @warning
3045  * @b EXPERIMENTAL: this API may change without prior notice.
3046  *
3047  * The function converts a rte_eth_link struct representing a link status to
3048  * a string.
3049  *
3050  * @param str
3051  *   A pointer to a string to be filled with textual representation of
3052  *   device status. At least RTE_ETH_LINK_MAX_STR_LEN bytes should be allocated to
3053  *   store default link status text.
3054  * @param len
3055  *   Length of available memory at 'str' string.
3056  * @param eth_link
3057  *   Link status returned by rte_eth_link_get function
3058  * @return
3059  *   Number of bytes written to str array or -EINVAL if bad parameter.
3060  */
3061 __rte_experimental
3062 int rte_eth_link_to_str(char *str, size_t len,
3063 			const struct rte_eth_link *eth_link);
3064 
3065 /**
3066  * Retrieve the general I/O statistics of an Ethernet device.
3067  *
3068  * @param port_id
3069  *   The port identifier of the Ethernet device.
3070  * @param stats
3071  *   A pointer to a structure of type *rte_eth_stats* to be filled with
3072  *   the values of device counters for the following set of statistics:
3073  *   - *ipackets* with the total of successfully received packets.
3074  *   - *opackets* with the total of successfully transmitted packets.
3075  *   - *ibytes*   with the total of successfully received bytes.
3076  *   - *obytes*   with the total of successfully transmitted bytes.
3077  *   - *ierrors*  with the total of erroneous received packets.
3078  *   - *oerrors*  with the total of failed transmitted packets.
3079  * @return
3080  *   Zero if successful. Non-zero otherwise.
3081  */
3082 int rte_eth_stats_get(uint16_t port_id, struct rte_eth_stats *stats);
3083 
3084 /**
3085  * Reset the general I/O statistics of an Ethernet device.
3086  *
3087  * @param port_id
3088  *   The port identifier of the Ethernet device.
3089  * @return
3090  *   - (0) if device notified to reset stats.
3091  *   - (-ENOTSUP) if hardware doesn't support.
3092  *   - (-ENODEV) if *port_id* invalid.
3093  *   - (<0): Error code of the driver stats reset function.
3094  */
3095 int rte_eth_stats_reset(uint16_t port_id);
3096 
3097 /**
3098  * Retrieve names of extended statistics of an Ethernet device.
3099  *
3100  * There is an assumption that 'xstat_names' and 'xstats' arrays are matched
3101  * by array index:
3102  *  xstats_names[i].name => xstats[i].value
3103  *
3104  * And the array index is same with id field of 'struct rte_eth_xstat':
3105  *  xstats[i].id == i
3106  *
3107  * This assumption makes key-value pair matching less flexible but simpler.
3108  *
3109  * @param port_id
3110  *   The port identifier of the Ethernet device.
3111  * @param xstats_names
3112  *   An rte_eth_xstat_name array of at least *size* elements to
3113  *   be filled. If set to NULL, the function returns the required number
3114  *   of elements.
3115  * @param size
3116  *   The size of the xstats_names array (number of elements).
3117  * @return
3118  *   - A positive value lower or equal to size: success. The return value
3119  *     is the number of entries filled in the stats table.
3120  *   - A positive value higher than size: error, the given statistics table
3121  *     is too small. The return value corresponds to the size that should
3122  *     be given to succeed. The entries in the table are not valid and
3123  *     shall not be used by the caller.
3124  *   - A negative value on error (invalid port ID).
3125  */
3126 int rte_eth_xstats_get_names(uint16_t port_id,
3127 		struct rte_eth_xstat_name *xstats_names,
3128 		unsigned int size);
3129 
3130 /**
3131  * Retrieve extended statistics of an Ethernet device.
3132  *
3133  * There is an assumption that 'xstat_names' and 'xstats' arrays are matched
3134  * by array index:
3135  *  xstats_names[i].name => xstats[i].value
3136  *
3137  * And the array index is same with id field of 'struct rte_eth_xstat':
3138  *  xstats[i].id == i
3139  *
3140  * This assumption makes key-value pair matching less flexible but simpler.
3141  *
3142  * @param port_id
3143  *   The port identifier of the Ethernet device.
3144  * @param xstats
3145  *   A pointer to a table of structure of type *rte_eth_xstat*
3146  *   to be filled with device statistics ids and values.
3147  *   This parameter can be set to NULL if and only if n is 0.
3148  * @param n
3149  *   The size of the xstats array (number of elements).
3150  *   If lower than the required number of elements, the function returns
3151  *   the required number of elements.
3152  *   If equal to zero, the xstats must be NULL, the function returns the
3153  *   required number of elements.
3154  * @return
3155  *   - A positive value lower or equal to n: success. The return value
3156  *     is the number of entries filled in the stats table.
3157  *   - A positive value higher than n: error, the given statistics table
3158  *     is too small. The return value corresponds to the size that should
3159  *     be given to succeed. The entries in the table are not valid and
3160  *     shall not be used by the caller.
3161  *   - A negative value on error (invalid port ID).
3162  */
3163 int rte_eth_xstats_get(uint16_t port_id, struct rte_eth_xstat *xstats,
3164 		unsigned int n);
3165 
3166 /**
3167  * Retrieve names of extended statistics of an Ethernet device.
3168  *
3169  * @param port_id
3170  *   The port identifier of the Ethernet device.
3171  * @param xstats_names
3172  *   Array to be filled in with names of requested device statistics.
3173  *   Must not be NULL if @p ids are specified (not NULL).
3174  * @param size
3175  *   Number of elements in @p xstats_names array (if not NULL) and in
3176  *   @p ids array (if not NULL). Must be 0 if both array pointers are NULL.
3177  * @param ids
3178  *   IDs array given by app to retrieve specific statistics. May be NULL to
3179  *   retrieve names of all available statistics or, if @p xstats_names is
3180  *   NULL as well, just the number of available statistics.
3181  * @return
3182  *   - A positive value lower or equal to size: success. The return value
3183  *     is the number of entries filled in the stats table.
3184  *   - A positive value higher than size: success. The given statistics table
3185  *     is too small. The return value corresponds to the size that should
3186  *     be given to succeed. The entries in the table are not valid and
3187  *     shall not be used by the caller.
3188  *   - A negative value on error.
3189  */
3190 int
3191 rte_eth_xstats_get_names_by_id(uint16_t port_id,
3192 	struct rte_eth_xstat_name *xstats_names, unsigned int size,
3193 	uint64_t *ids);
3194 
3195 /**
3196  * Retrieve extended statistics of an Ethernet device.
3197  *
3198  * @param port_id
3199  *   The port identifier of the Ethernet device.
3200  * @param ids
3201  *   IDs array given by app to retrieve specific statistics. May be NULL to
3202  *   retrieve all available statistics or, if @p values is NULL as well,
3203  *   just the number of available statistics.
3204  * @param values
3205  *   Array to be filled in with requested device statistics.
3206  *   Must not be NULL if ids are specified (not NULL).
3207  * @param size
3208  *   Number of elements in @p values array (if not NULL) and in @p ids
3209  *   array (if not NULL). Must be 0 if both array pointers are NULL.
3210  * @return
3211  *   - A positive value lower or equal to size: success. The return value
3212  *     is the number of entries filled in the stats table.
3213  *   - A positive value higher than size: success: The given statistics table
3214  *     is too small. The return value corresponds to the size that should
3215  *     be given to succeed. The entries in the table are not valid and
3216  *     shall not be used by the caller.
3217  *   - A negative value on error.
3218  */
3219 int rte_eth_xstats_get_by_id(uint16_t port_id, const uint64_t *ids,
3220 			     uint64_t *values, unsigned int size);
3221 
3222 /**
3223  * Gets the ID of a statistic from its name.
3224  *
3225  * This function searches for the statistics using string compares, and
3226  * as such should not be used on the fast-path. For fast-path retrieval of
3227  * specific statistics, store the ID as provided in *id* from this function,
3228  * and pass the ID to rte_eth_xstats_get()
3229  *
3230  * @param port_id The port to look up statistics from
3231  * @param xstat_name The name of the statistic to return
3232  * @param[out] id A pointer to an app-supplied uint64_t which should be
3233  *                set to the ID of the stat if the stat exists.
3234  * @return
3235  *    0 on success
3236  *    -ENODEV for invalid port_id,
3237  *    -EIO if device is removed,
3238  *    -EINVAL if the xstat_name doesn't exist in port_id
3239  *    -ENOMEM if bad parameter.
3240  */
3241 int rte_eth_xstats_get_id_by_name(uint16_t port_id, const char *xstat_name,
3242 		uint64_t *id);
3243 
3244 /**
3245  * Reset extended statistics of an Ethernet device.
3246  *
3247  * @param port_id
3248  *   The port identifier of the Ethernet device.
3249  * @return
3250  *   - (0) if device notified to reset extended stats.
3251  *   - (-ENOTSUP) if pmd doesn't support both
3252  *     extended stats and basic stats reset.
3253  *   - (-ENODEV) if *port_id* invalid.
3254  *   - (<0): Error code of the driver xstats reset function.
3255  */
3256 int rte_eth_xstats_reset(uint16_t port_id);
3257 
3258 /**
3259  *  Set a mapping for the specified transmit queue to the specified per-queue
3260  *  statistics counter.
3261  *
3262  * @param port_id
3263  *   The port identifier of the Ethernet device.
3264  * @param tx_queue_id
3265  *   The index of the transmit queue for which a queue stats mapping is required.
3266  *   The value must be in the range [0, nb_tx_queue - 1] previously supplied
3267  *   to rte_eth_dev_configure().
3268  * @param stat_idx
3269  *   The per-queue packet statistics functionality number that the transmit
3270  *   queue is to be assigned.
3271  *   The value must be in the range [0, RTE_ETHDEV_QUEUE_STAT_CNTRS - 1].
3272  *   Max RTE_ETHDEV_QUEUE_STAT_CNTRS being 256.
3273  * @return
3274  *   Zero if successful. Non-zero otherwise.
3275  */
3276 int rte_eth_dev_set_tx_queue_stats_mapping(uint16_t port_id,
3277 		uint16_t tx_queue_id, uint8_t stat_idx);
3278 
3279 /**
3280  *  Set a mapping for the specified receive queue to the specified per-queue
3281  *  statistics counter.
3282  *
3283  * @param port_id
3284  *   The port identifier of the Ethernet device.
3285  * @param rx_queue_id
3286  *   The index of the receive queue for which a queue stats mapping is required.
3287  *   The value must be in the range [0, nb_rx_queue - 1] previously supplied
3288  *   to rte_eth_dev_configure().
3289  * @param stat_idx
3290  *   The per-queue packet statistics functionality number that the receive
3291  *   queue is to be assigned.
3292  *   The value must be in the range [0, RTE_ETHDEV_QUEUE_STAT_CNTRS - 1].
3293  *   Max RTE_ETHDEV_QUEUE_STAT_CNTRS being 256.
3294  * @return
3295  *   Zero if successful. Non-zero otherwise.
3296  */
3297 int rte_eth_dev_set_rx_queue_stats_mapping(uint16_t port_id,
3298 					   uint16_t rx_queue_id,
3299 					   uint8_t stat_idx);
3300 
3301 /**
3302  * Retrieve the Ethernet address of an Ethernet device.
3303  *
3304  * @param port_id
3305  *   The port identifier of the Ethernet device.
3306  * @param mac_addr
3307  *   A pointer to a structure of type *ether_addr* to be filled with
3308  *   the Ethernet address of the Ethernet device.
3309  * @return
3310  *   - (0) if successful
3311  *   - (-ENODEV) if *port_id* invalid.
3312  *   - (-EINVAL) if bad parameter.
3313  */
3314 int rte_eth_macaddr_get(uint16_t port_id, struct rte_ether_addr *mac_addr);
3315 
3316 /**
3317  * @warning
3318  * @b EXPERIMENTAL: this API may change without prior notice
3319  *
3320  * Retrieve the Ethernet addresses of an Ethernet device.
3321  *
3322  * @param port_id
3323  *   The port identifier of the Ethernet device.
3324  * @param ma
3325  *   A pointer to an array of structures of type *ether_addr* to be filled with
3326  *   the Ethernet addresses of the Ethernet device.
3327  * @param num
3328  *   Number of elements in the @p ma array.
3329  *   Note that  rte_eth_dev_info::max_mac_addrs can be used to retrieve
3330  *   max number of Ethernet addresses for given port.
3331  * @return
3332  *   - number of retrieved addresses if successful
3333  *   - (-ENODEV) if *port_id* invalid.
3334  *   - (-EINVAL) if bad parameter.
3335  */
3336 __rte_experimental
3337 int rte_eth_macaddrs_get(uint16_t port_id, struct rte_ether_addr *ma,
3338 	unsigned int num);
3339 
3340 /**
3341  * Retrieve the contextual information of an Ethernet device.
3342  *
3343  * This function returns the Ethernet device information based
3344  * on the values stored internally in the device specific data.
3345  * For example: number of queues, descriptor limits, device
3346  * capabilities and offload flags.
3347  *
3348  * @param port_id
3349  *   The port identifier of the Ethernet device.
3350  * @param dev_info
3351  *   A pointer to a structure of type *rte_eth_dev_info* to be filled with
3352  *   the contextual information of the Ethernet device.
3353  * @return
3354  *   - (0) if successful.
3355  *   - (-ENOTSUP) if support for dev_infos_get() does not exist for the device.
3356  *   - (-ENODEV) if *port_id* invalid.
3357  *   - (-EINVAL) if bad parameter.
3358  */
3359 int rte_eth_dev_info_get(uint16_t port_id, struct rte_eth_dev_info *dev_info);
3360 
3361 /**
3362  * @warning
3363  * @b EXPERIMENTAL: this API may change without prior notice.
3364  *
3365  * Retrieve the configuration of an Ethernet device.
3366  *
3367  * @param port_id
3368  *   The port identifier of the Ethernet device.
3369  * @param dev_conf
3370  *   Location for Ethernet device configuration to be filled in.
3371  * @return
3372  *   - (0) if successful.
3373  *   - (-ENODEV) if *port_id* invalid.
3374  *   - (-EINVAL) if bad parameter.
3375  */
3376 __rte_experimental
3377 int rte_eth_dev_conf_get(uint16_t port_id, struct rte_eth_conf *dev_conf);
3378 
3379 /**
3380  * Retrieve the firmware version of a device.
3381  *
3382  * @param port_id
3383  *   The port identifier of the device.
3384  * @param fw_version
3385  *   A pointer to a string array storing the firmware version of a device,
3386  *   the string includes terminating null. This pointer is allocated by caller.
3387  * @param fw_size
3388  *   The size of the string array pointed by fw_version, which should be
3389  *   large enough to store firmware version of the device.
3390  * @return
3391  *   - (0) if successful.
3392  *   - (-ENOTSUP) if operation is not supported.
3393  *   - (-ENODEV) if *port_id* invalid.
3394  *   - (-EIO) if device is removed.
3395  *   - (-EINVAL) if bad parameter.
3396  *   - (>0) if *fw_size* is not enough to store firmware version, return
3397  *          the size of the non truncated string.
3398  */
3399 int rte_eth_dev_fw_version_get(uint16_t port_id,
3400 			       char *fw_version, size_t fw_size);
3401 
3402 /**
3403  * Retrieve the supported packet types of an Ethernet device.
3404  *
3405  * When a packet type is announced as supported, it *must* be recognized by
3406  * the PMD. For instance, if RTE_PTYPE_L2_ETHER, RTE_PTYPE_L2_ETHER_VLAN
3407  * and RTE_PTYPE_L3_IPV4 are announced, the PMD must return the following
3408  * packet types for these packets:
3409  * - Ether/IPv4              -> RTE_PTYPE_L2_ETHER | RTE_PTYPE_L3_IPV4
3410  * - Ether/VLAN/IPv4         -> RTE_PTYPE_L2_ETHER_VLAN | RTE_PTYPE_L3_IPV4
3411  * - Ether/[anything else]   -> RTE_PTYPE_L2_ETHER
3412  * - Ether/VLAN/[anything else] -> RTE_PTYPE_L2_ETHER_VLAN
3413  *
3414  * When a packet is received by a PMD, the most precise type must be
3415  * returned among the ones supported. However a PMD is allowed to set
3416  * packet type that is not in the supported list, at the condition that it
3417  * is more precise. Therefore, a PMD announcing no supported packet types
3418  * can still set a matching packet type in a received packet.
3419  *
3420  * @note
3421  *   Better to invoke this API after the device is already started or Rx burst
3422  *   function is decided, to obtain correct supported ptypes.
3423  * @note
3424  *   if a given PMD does not report what ptypes it supports, then the supported
3425  *   ptype count is reported as 0.
3426  * @param port_id
3427  *   The port identifier of the Ethernet device.
3428  * @param ptype_mask
3429  *   A hint of what kind of packet type which the caller is interested in.
3430  * @param ptypes
3431  *   An array pointer to store adequate packet types, allocated by caller.
3432  * @param num
3433  *  Size of the array pointed by param ptypes.
3434  * @return
3435  *   - (>=0) Number of supported ptypes. If the number of types exceeds num,
3436  *           only num entries will be filled into the ptypes array, but the full
3437  *           count of supported ptypes will be returned.
3438  *   - (-ENODEV) if *port_id* invalid.
3439  *   - (-EINVAL) if bad parameter.
3440  */
3441 int rte_eth_dev_get_supported_ptypes(uint16_t port_id, uint32_t ptype_mask,
3442 				     uint32_t *ptypes, int num);
3443 /**
3444  * Inform Ethernet device about reduced range of packet types to handle.
3445  *
3446  * Application can use this function to set only specific ptypes that it's
3447  * interested. This information can be used by the PMD to optimize Rx path.
3448  *
3449  * The function accepts an array `set_ptypes` allocated by the caller to
3450  * store the packet types set by the driver, the last element of the array
3451  * is set to RTE_PTYPE_UNKNOWN. The size of the `set_ptype` array should be
3452  * `rte_eth_dev_get_supported_ptypes() + 1` else it might only be filled
3453  * partially.
3454  *
3455  * @param port_id
3456  *   The port identifier of the Ethernet device.
3457  * @param ptype_mask
3458  *   The ptype family that application is interested in should be bitwise OR of
3459  *   RTE_PTYPE_*_MASK or 0.
3460  * @param set_ptypes
3461  *   An array pointer to store set packet types, allocated by caller. The
3462  *   function marks the end of array with RTE_PTYPE_UNKNOWN.
3463  * @param num
3464  *   Size of the array pointed by param ptypes.
3465  *   Should be rte_eth_dev_get_supported_ptypes() + 1 to accommodate the
3466  *   set ptypes.
3467  * @return
3468  *   - (0) if Success.
3469  *   - (-ENODEV) if *port_id* invalid.
3470  *   - (-EINVAL) if *ptype_mask* is invalid (or) set_ptypes is NULL and
3471  *     num > 0.
3472  */
3473 int rte_eth_dev_set_ptypes(uint16_t port_id, uint32_t ptype_mask,
3474 			   uint32_t *set_ptypes, unsigned int num);
3475 
3476 /**
3477  * Retrieve the MTU of an Ethernet device.
3478  *
3479  * @param port_id
3480  *   The port identifier of the Ethernet device.
3481  * @param mtu
3482  *   A pointer to a uint16_t where the retrieved MTU is to be stored.
3483  * @return
3484  *   - (0) if successful.
3485  *   - (-ENODEV) if *port_id* invalid.
3486  *   - (-EINVAL) if bad parameter.
3487  */
3488 int rte_eth_dev_get_mtu(uint16_t port_id, uint16_t *mtu);
3489 
3490 /**
3491  * Change the MTU of an Ethernet device.
3492  *
3493  * @param port_id
3494  *   The port identifier of the Ethernet device.
3495  * @param mtu
3496  *   A uint16_t for the MTU to be applied.
3497  * @return
3498  *   - (0) if successful.
3499  *   - (-ENOTSUP) if operation is not supported.
3500  *   - (-ENODEV) if *port_id* invalid.
3501  *   - (-EIO) if device is removed.
3502  *   - (-EINVAL) if *mtu* invalid, validation of mtu can occur within
3503  *     rte_eth_dev_set_mtu if dev_infos_get is supported by the device or
3504  *     when the mtu is set using dev->dev_ops->mtu_set.
3505  *   - (-EBUSY) if operation is not allowed when the port is running
3506  */
3507 int rte_eth_dev_set_mtu(uint16_t port_id, uint16_t mtu);
3508 
3509 /**
3510  * Enable/Disable hardware filtering by an Ethernet device of received
3511  * VLAN packets tagged with a given VLAN Tag Identifier.
3512  *
3513  * @param port_id
3514  *   The port identifier of the Ethernet device.
3515  * @param vlan_id
3516  *   The VLAN Tag Identifier whose filtering must be enabled or disabled.
3517  * @param on
3518  *   If > 0, enable VLAN filtering of VLAN packets tagged with *vlan_id*.
3519  *   Otherwise, disable VLAN filtering of VLAN packets tagged with *vlan_id*.
3520  * @return
3521  *   - (0) if successful.
3522  *   - (-ENOTSUP) if hardware-assisted VLAN filtering not configured.
3523  *   - (-ENODEV) if *port_id* invalid.
3524  *   - (-EIO) if device is removed.
3525  *   - (-ENOSYS) if VLAN filtering on *port_id* disabled.
3526  *   - (-EINVAL) if *vlan_id* > 4095.
3527  */
3528 int rte_eth_dev_vlan_filter(uint16_t port_id, uint16_t vlan_id, int on);
3529 
3530 /**
3531  * Enable/Disable hardware VLAN Strip by a Rx queue of an Ethernet device.
3532  *
3533  * @param port_id
3534  *   The port identifier of the Ethernet device.
3535  * @param rx_queue_id
3536  *   The index of the receive queue for which a queue stats mapping is required.
3537  *   The value must be in the range [0, nb_rx_queue - 1] previously supplied
3538  *   to rte_eth_dev_configure().
3539  * @param on
3540  *   If 1, Enable VLAN Stripping of the receive queue of the Ethernet port.
3541  *   If 0, Disable VLAN Stripping of the receive queue of the Ethernet port.
3542  * @return
3543  *   - (0) if successful.
3544  *   - (-ENOTSUP) if hardware-assisted VLAN stripping not configured.
3545  *   - (-ENODEV) if *port_id* invalid.
3546  *   - (-EINVAL) if *rx_queue_id* invalid.
3547  */
3548 int rte_eth_dev_set_vlan_strip_on_queue(uint16_t port_id, uint16_t rx_queue_id,
3549 		int on);
3550 
3551 /**
3552  * Set the Outer VLAN Ether Type by an Ethernet device, it can be inserted to
3553  * the VLAN header.
3554  *
3555  * @param port_id
3556  *   The port identifier of the Ethernet device.
3557  * @param vlan_type
3558  *   The VLAN type.
3559  * @param tag_type
3560  *   The Tag Protocol ID
3561  * @return
3562  *   - (0) if successful.
3563  *   - (-ENOTSUP) if hardware-assisted VLAN TPID setup is not supported.
3564  *   - (-ENODEV) if *port_id* invalid.
3565  *   - (-EIO) if device is removed.
3566  */
3567 int rte_eth_dev_set_vlan_ether_type(uint16_t port_id,
3568 				    enum rte_vlan_type vlan_type,
3569 				    uint16_t tag_type);
3570 
3571 /**
3572  * Set VLAN offload configuration on an Ethernet device.
3573  *
3574  * @param port_id
3575  *   The port identifier of the Ethernet device.
3576  * @param offload_mask
3577  *   The VLAN Offload bit mask can be mixed use with "OR"
3578  *       RTE_ETH_VLAN_STRIP_OFFLOAD
3579  *       RTE_ETH_VLAN_FILTER_OFFLOAD
3580  *       RTE_ETH_VLAN_EXTEND_OFFLOAD
3581  *       RTE_ETH_QINQ_STRIP_OFFLOAD
3582  * @return
3583  *   - (0) if successful.
3584  *   - (-ENOTSUP) if hardware-assisted VLAN filtering not configured.
3585  *   - (-ENODEV) if *port_id* invalid.
3586  *   - (-EIO) if device is removed.
3587  */
3588 int rte_eth_dev_set_vlan_offload(uint16_t port_id, int offload_mask);
3589 
3590 /**
3591  * Read VLAN Offload configuration from an Ethernet device
3592  *
3593  * @param port_id
3594  *   The port identifier of the Ethernet device.
3595  * @return
3596  *   - (>0) if successful. Bit mask to indicate
3597  *       RTE_ETH_VLAN_STRIP_OFFLOAD
3598  *       RTE_ETH_VLAN_FILTER_OFFLOAD
3599  *       RTE_ETH_VLAN_EXTEND_OFFLOAD
3600  *       RTE_ETH_QINQ_STRIP_OFFLOAD
3601  *   - (-ENODEV) if *port_id* invalid.
3602  */
3603 int rte_eth_dev_get_vlan_offload(uint16_t port_id);
3604 
3605 /**
3606  * Set port based Tx VLAN insertion on or off.
3607  *
3608  * @param port_id
3609  *  The port identifier of the Ethernet device.
3610  * @param pvid
3611  *  Port based Tx VLAN identifier together with user priority.
3612  * @param on
3613  *  Turn on or off the port based Tx VLAN insertion.
3614  *
3615  * @return
3616  *   - (0) if successful.
3617  *   - negative if failed.
3618  */
3619 int rte_eth_dev_set_vlan_pvid(uint16_t port_id, uint16_t pvid, int on);
3620 
3621 /**
3622  * @warning
3623  * @b EXPERIMENTAL: this API may change without prior notice.
3624  *
3625  * Set Rx queue available descriptors threshold.
3626  *
3627  * @param port_id
3628  *  The port identifier of the Ethernet device.
3629  * @param queue_id
3630  *  The index of the receive queue.
3631  * @param avail_thresh
3632  *  The available descriptors threshold is percentage of Rx queue size
3633  *  which describes the availability of Rx queue for hardware.
3634  *  If the Rx queue availability is below it,
3635  *  the event RTE_ETH_EVENT_RX_AVAIL_THRESH is triggered.
3636  *  [1-99] to set a new available descriptors threshold.
3637  *  0 to disable threshold monitoring.
3638  *
3639  * @return
3640  *   - 0 if successful.
3641  *   - (-ENODEV) if @p port_id is invalid.
3642  *   - (-EINVAL) if bad parameter.
3643  *   - (-ENOTSUP) if available Rx descriptors threshold is not supported.
3644  *   - (-EIO) if device is removed.
3645  */
3646 __rte_experimental
3647 int rte_eth_rx_avail_thresh_set(uint16_t port_id, uint16_t queue_id,
3648 			       uint8_t avail_thresh);
3649 
3650 /**
3651  * @warning
3652  * @b EXPERIMENTAL: this API may change without prior notice.
3653  *
3654  * Find Rx queue with RTE_ETH_EVENT_RX_AVAIL_THRESH event pending.
3655  *
3656  * @param port_id
3657  *  The port identifier of the Ethernet device.
3658  * @param[inout] queue_id
3659  *  On input starting Rx queue index to search from.
3660  *  If the queue_id is bigger than maximum queue ID of the port,
3661  *  search is started from 0. So that application can keep calling
3662  *  this function to handle all pending events with a simple increment
3663  *  of queue_id on the next call.
3664  *  On output if return value is 1, Rx queue index with the event pending.
3665  * @param[out] avail_thresh
3666  *  Location for available descriptors threshold of the found Rx queue.
3667  *
3668  * @return
3669  *   - 1 if an Rx queue with pending event is found.
3670  *   - 0 if no Rx queue with pending event is found.
3671  *   - (-ENODEV) if @p port_id is invalid.
3672  *   - (-EINVAL) if bad parameter (e.g. @p queue_id is NULL).
3673  *   - (-ENOTSUP) if operation is not supported.
3674  *   - (-EIO) if device is removed.
3675  */
3676 __rte_experimental
3677 int rte_eth_rx_avail_thresh_query(uint16_t port_id, uint16_t *queue_id,
3678 				 uint8_t *avail_thresh);
3679 
3680 typedef void (*buffer_tx_error_fn)(struct rte_mbuf **unsent, uint16_t count,
3681 		void *userdata);
3682 
3683 /**
3684  * Structure used to buffer packets for future Tx
3685  * Used by APIs rte_eth_tx_buffer and rte_eth_tx_buffer_flush
3686  */
3687 struct rte_eth_dev_tx_buffer {
3688 	buffer_tx_error_fn error_callback;
3689 	void *error_userdata;
3690 	uint16_t size;           /**< Size of buffer for buffered Tx */
3691 	uint16_t length;         /**< Number of packets in the array */
3692 	/** Pending packets to be sent on explicit flush or when full */
3693 	struct rte_mbuf *pkts[];
3694 };
3695 
3696 /**
3697  * Calculate the size of the Tx buffer.
3698  *
3699  * @param sz
3700  *   Number of stored packets.
3701  */
3702 #define RTE_ETH_TX_BUFFER_SIZE(sz) \
3703 	(sizeof(struct rte_eth_dev_tx_buffer) + (sz) * sizeof(struct rte_mbuf *))
3704 
3705 /**
3706  * Initialize default values for buffered transmitting
3707  *
3708  * @param buffer
3709  *   Tx buffer to be initialized.
3710  * @param size
3711  *   Buffer size
3712  * @return
3713  *   0 if no error
3714  */
3715 int
3716 rte_eth_tx_buffer_init(struct rte_eth_dev_tx_buffer *buffer, uint16_t size);
3717 
3718 /**
3719  * Configure a callback for buffered packets which cannot be sent
3720  *
3721  * Register a specific callback to be called when an attempt is made to send
3722  * all packets buffered on an Ethernet port, but not all packets can
3723  * successfully be sent. The callback registered here will be called only
3724  * from calls to rte_eth_tx_buffer() and rte_eth_tx_buffer_flush() APIs.
3725  * The default callback configured for each queue by default just frees the
3726  * packets back to the calling mempool. If additional behaviour is required,
3727  * for example, to count dropped packets, or to retry transmission of packets
3728  * which cannot be sent, this function should be used to register a suitable
3729  * callback function to implement the desired behaviour.
3730  * The example callback "rte_eth_count_unsent_packet_callback()" is also
3731  * provided as reference.
3732  *
3733  * @param buffer
3734  *   The port identifier of the Ethernet device.
3735  * @param callback
3736  *   The function to be used as the callback.
3737  * @param userdata
3738  *   Arbitrary parameter to be passed to the callback function
3739  * @return
3740  *   0 on success, or -EINVAL if bad parameter
3741  */
3742 int
3743 rte_eth_tx_buffer_set_err_callback(struct rte_eth_dev_tx_buffer *buffer,
3744 		buffer_tx_error_fn callback, void *userdata);
3745 
3746 /**
3747  * Callback function for silently dropping unsent buffered packets.
3748  *
3749  * This function can be passed to rte_eth_tx_buffer_set_err_callback() to
3750  * adjust the default behavior when buffered packets cannot be sent. This
3751  * function drops any unsent packets silently and is used by Tx buffered
3752  * operations as default behavior.
3753  *
3754  * NOTE: this function should not be called directly, instead it should be used
3755  *       as a callback for packet buffering.
3756  *
3757  * NOTE: when configuring this function as a callback with
3758  *       rte_eth_tx_buffer_set_err_callback(), the final, userdata parameter
3759  *       should point to an uint64_t value.
3760  *
3761  * @param pkts
3762  *   The previously buffered packets which could not be sent
3763  * @param unsent
3764  *   The number of unsent packets in the pkts array
3765  * @param userdata
3766  *   Not used
3767  */
3768 void
3769 rte_eth_tx_buffer_drop_callback(struct rte_mbuf **pkts, uint16_t unsent,
3770 		void *userdata);
3771 
3772 /**
3773  * Callback function for tracking unsent buffered packets.
3774  *
3775  * This function can be passed to rte_eth_tx_buffer_set_err_callback() to
3776  * adjust the default behavior when buffered packets cannot be sent. This
3777  * function drops any unsent packets, but also updates a user-supplied counter
3778  * to track the overall number of packets dropped. The counter should be an
3779  * uint64_t variable.
3780  *
3781  * NOTE: this function should not be called directly, instead it should be used
3782  *       as a callback for packet buffering.
3783  *
3784  * NOTE: when configuring this function as a callback with
3785  *       rte_eth_tx_buffer_set_err_callback(), the final, userdata parameter
3786  *       should point to an uint64_t value.
3787  *
3788  * @param pkts
3789  *   The previously buffered packets which could not be sent
3790  * @param unsent
3791  *   The number of unsent packets in the pkts array
3792  * @param userdata
3793  *   Pointer to an uint64_t value, which will be incremented by unsent
3794  */
3795 void
3796 rte_eth_tx_buffer_count_callback(struct rte_mbuf **pkts, uint16_t unsent,
3797 		void *userdata);
3798 
3799 /**
3800  * Request the driver to free mbufs currently cached by the driver. The
3801  * driver will only free the mbuf if it is no longer in use. It is the
3802  * application's responsibility to ensure rte_eth_tx_buffer_flush(..) is
3803  * called if needed.
3804  *
3805  * @param port_id
3806  *   The port identifier of the Ethernet device.
3807  * @param queue_id
3808  *   The index of the transmit queue through which output packets must be
3809  *   sent.
3810  *   The value must be in the range [0, nb_tx_queue - 1] previously supplied
3811  *   to rte_eth_dev_configure().
3812  * @param free_cnt
3813  *   Maximum number of packets to free. Use 0 to indicate all possible packets
3814  *   should be freed. Note that a packet may be using multiple mbufs.
3815  * @return
3816  *   Failure: < 0
3817  *     -ENODEV: Invalid interface
3818  *     -EIO: device is removed
3819  *     -ENOTSUP: Driver does not support function
3820  *   Success: >= 0
3821  *     0-n: Number of packets freed. More packets may still remain in ring that
3822  *     are in use.
3823  */
3824 int
3825 rte_eth_tx_done_cleanup(uint16_t port_id, uint16_t queue_id, uint32_t free_cnt);
3826 
3827 /**
3828  * Subtypes for MACsec offload event (@ref RTE_ETH_EVENT_MACSEC)
3829  * raised by Ethernet device.
3830  */
3831 enum rte_eth_event_macsec_subtype {
3832 	/** Notifies unknown MACsec subevent. */
3833 	RTE_ETH_SUBEVENT_MACSEC_UNKNOWN,
3834 	/**
3835 	 * Subevent of RTE_ETH_EVENT_MACSEC_SECTAG_VAL_ERR sectag validation events
3836 	 *	Validation check: SecTag.TCI.V = 1
3837 	 */
3838 	RTE_ETH_SUBEVENT_MACSEC_RX_SECTAG_V_EQ1,
3839 	/**
3840 	 * Subevent of RTE_ETH_EVENT_MACSEC_SECTAG_VAL_ERR sectag validation events
3841 	 *	Validation check: SecTag.TCI.E = 0 && SecTag.TCI.C = 1
3842 	 */
3843 	RTE_ETH_SUBEVENT_MACSEC_RX_SECTAG_E_EQ0_C_EQ1,
3844 	/**
3845 	 * Subevent of RTE_ETH_EVENT_MACSEC_SECTAG_VAL_ERR sectag validation events
3846 	 *	Validation check: SecTag.SL >= 'd48
3847 	 */
3848 	RTE_ETH_SUBEVENT_MACSEC_RX_SECTAG_SL_GTE48,
3849 	/**
3850 	 * Subevent of RTE_ETH_EVENT_MACSEC_SECTAG_VAL_ERR sectag validation events
3851 	 *	Validation check: SecTag.TCI.ES = 1 && SecTag.TCI.SC = 1
3852 	 */
3853 	RTE_ETH_SUBEVENT_MACSEC_RX_SECTAG_ES_EQ1_SC_EQ1,
3854 	/**
3855 	 * Subevent of RTE_ETH_EVENT_MACSEC_SECTAG_VAL_ERR sectag validation events
3856 	 *	Validation check: SecTag.TCI.SC = 1 && SecTag.TCI.SCB = 1
3857 	 */
3858 	RTE_ETH_SUBEVENT_MACSEC_RX_SECTAG_SC_EQ1_SCB_EQ1,
3859 };
3860 
3861 /**
3862  * Event types for MACsec offload event (@ref RTE_ETH_EVENT_MACSEC)
3863  * raised by eth device.
3864  */
3865 enum rte_eth_event_macsec_type {
3866 	/** Notifies unknown MACsec event. */
3867 	RTE_ETH_EVENT_MACSEC_UNKNOWN,
3868 	/** Notifies Sectag validation failure events. */
3869 	RTE_ETH_EVENT_MACSEC_SECTAG_VAL_ERR,
3870 	/** Notifies Rx SA hard expiry events. */
3871 	RTE_ETH_EVENT_MACSEC_RX_SA_PN_HARD_EXP,
3872 	/** Notifies Rx SA soft expiry events. */
3873 	RTE_ETH_EVENT_MACSEC_RX_SA_PN_SOFT_EXP,
3874 	/** Notifies Tx SA hard expiry events. */
3875 	RTE_ETH_EVENT_MACSEC_TX_SA_PN_HARD_EXP,
3876 	/** Notifies Tx SA soft events. */
3877 	RTE_ETH_EVENT_MACSEC_TX_SA_PN_SOFT_EXP,
3878 	/** Notifies Invalid SA event. */
3879 	RTE_ETH_EVENT_MACSEC_SA_NOT_VALID,
3880 };
3881 
3882 /**
3883  * Descriptor for @ref RTE_ETH_EVENT_MACSEC event.
3884  * Used by ethdev to send extra information of the MACsec offload event.
3885  */
3886 struct rte_eth_event_macsec_desc {
3887 	/** Type of RTE_ETH_EVENT_MACSEC_* event. */
3888 	enum rte_eth_event_macsec_type type;
3889 	/** Type of RTE_ETH_SUBEVENT_MACSEC_* subevent. */
3890 	enum rte_eth_event_macsec_subtype subtype;
3891 	/**
3892 	 * Event specific metadata.
3893 	 *
3894 	 * For the following events, *userdata* registered
3895 	 * with the *rte_security_session* would be returned
3896 	 * as metadata.
3897 	 *
3898 	 * @see struct rte_security_session_conf
3899 	 */
3900 	uint64_t metadata;
3901 };
3902 
3903 /**
3904  * Subtypes for IPsec offload event(@ref RTE_ETH_EVENT_IPSEC) raised by
3905  * eth device.
3906  */
3907 enum rte_eth_event_ipsec_subtype {
3908 	/**  PMD specific error start */
3909 	RTE_ETH_EVENT_IPSEC_PMD_ERROR_START = -256,
3910 	/**  PMD specific error end */
3911 	RTE_ETH_EVENT_IPSEC_PMD_ERROR_END = -1,
3912 	/** Unknown event type */
3913 	RTE_ETH_EVENT_IPSEC_UNKNOWN = 0,
3914 	/** Sequence number overflow */
3915 	RTE_ETH_EVENT_IPSEC_ESN_OVERFLOW,
3916 	/** Soft time expiry of SA */
3917 	RTE_ETH_EVENT_IPSEC_SA_TIME_EXPIRY,
3918 	/**
3919 	 * Soft byte expiry of SA determined by
3920 	 * @ref rte_security_ipsec_lifetime::bytes_soft_limit
3921 	 */
3922 	RTE_ETH_EVENT_IPSEC_SA_BYTE_EXPIRY,
3923 	/**
3924 	 * Soft packet expiry of SA determined by
3925 	 * @ref rte_security_ipsec_lifetime::packets_soft_limit
3926 	 */
3927 	RTE_ETH_EVENT_IPSEC_SA_PKT_EXPIRY,
3928 	/**
3929 	 * Hard byte expiry of SA determined by
3930 	 * @ref rte_security_ipsec_lifetime::bytes_hard_limit
3931 	 */
3932 	RTE_ETH_EVENT_IPSEC_SA_BYTE_HARD_EXPIRY,
3933 	/**
3934 	 * Hard packet expiry of SA determined by
3935 	 * @ref rte_security_ipsec_lifetime::packets_hard_limit
3936 	 */
3937 	RTE_ETH_EVENT_IPSEC_SA_PKT_HARD_EXPIRY,
3938 	/** Max value of this enum */
3939 	RTE_ETH_EVENT_IPSEC_MAX
3940 };
3941 
3942 /**
3943  * Descriptor for @ref RTE_ETH_EVENT_IPSEC event. Used by eth dev to send extra
3944  * information of the IPsec offload event.
3945  */
3946 struct rte_eth_event_ipsec_desc {
3947 	/** Type of RTE_ETH_EVENT_IPSEC_* event */
3948 	enum rte_eth_event_ipsec_subtype subtype;
3949 	/**
3950 	 * Event specific metadata.
3951 	 *
3952 	 * For the following events, *userdata* registered
3953 	 * with the *rte_security_session* would be returned
3954 	 * as metadata,
3955 	 *
3956 	 * - @ref RTE_ETH_EVENT_IPSEC_ESN_OVERFLOW
3957 	 * - @ref RTE_ETH_EVENT_IPSEC_SA_TIME_EXPIRY
3958 	 * - @ref RTE_ETH_EVENT_IPSEC_SA_BYTE_EXPIRY
3959 	 * - @ref RTE_ETH_EVENT_IPSEC_SA_PKT_EXPIRY
3960 	 * - @ref RTE_ETH_EVENT_IPSEC_SA_BYTE_HARD_EXPIRY
3961 	 * - @ref RTE_ETH_EVENT_IPSEC_SA_PKT_HARD_EXPIRY
3962 	 *
3963 	 * @see struct rte_security_session_conf
3964 	 *
3965 	 */
3966 	uint64_t metadata;
3967 };
3968 
3969 /**
3970  * The eth device event type for interrupt, and maybe others in the future.
3971  */
3972 enum rte_eth_event_type {
3973 	RTE_ETH_EVENT_UNKNOWN,  /**< unknown event type */
3974 	RTE_ETH_EVENT_INTR_LSC, /**< lsc interrupt event */
3975 	/** queue state event (enabled/disabled) */
3976 	RTE_ETH_EVENT_QUEUE_STATE,
3977 	/** reset interrupt event, sent to VF on PF reset */
3978 	RTE_ETH_EVENT_INTR_RESET,
3979 	RTE_ETH_EVENT_VF_MBOX,  /**< message from the VF received by PF */
3980 	RTE_ETH_EVENT_MACSEC,   /**< MACsec offload related event */
3981 	RTE_ETH_EVENT_INTR_RMV, /**< device removal event */
3982 	RTE_ETH_EVENT_NEW,      /**< port is probed */
3983 	RTE_ETH_EVENT_DESTROY,  /**< port is released */
3984 	RTE_ETH_EVENT_IPSEC,    /**< IPsec offload related event */
3985 	RTE_ETH_EVENT_FLOW_AGED,/**< New aged-out flows is detected */
3986 	/**
3987 	 * Number of available Rx descriptors is smaller than the threshold.
3988 	 * @see rte_eth_rx_avail_thresh_set()
3989 	 */
3990 	RTE_ETH_EVENT_RX_AVAIL_THRESH,
3991 	/** Port recovering from a hardware or firmware error.
3992 	 * If PMD supports proactive error recovery,
3993 	 * it should trigger this event to notify application
3994 	 * that it detected an error and the recovery is being started.
3995 	 * Upon receiving the event, the application should not invoke any control path API
3996 	 * (such as rte_eth_dev_configure/rte_eth_dev_stop...) until receiving
3997 	 * RTE_ETH_EVENT_RECOVERY_SUCCESS or RTE_ETH_EVENT_RECOVERY_FAILED event.
3998 	 * The PMD will set the data path pointers to dummy functions,
3999 	 * and re-set the data path pointers to non-dummy functions
4000 	 * before reporting RTE_ETH_EVENT_RECOVERY_SUCCESS event.
4001 	 * It means that the application cannot send or receive any packets
4002 	 * during this period.
4003 	 * @note Before the PMD reports the recovery result,
4004 	 * the PMD may report the RTE_ETH_EVENT_ERR_RECOVERING event again,
4005 	 * because a larger error may occur during the recovery.
4006 	 */
4007 	RTE_ETH_EVENT_ERR_RECOVERING,
4008 	/** Port recovers successfully from the error.
4009 	 * The PMD already re-configured the port,
4010 	 * and the effect is the same as a restart operation.
4011 	 * a) The following operation will be retained: (alphabetically)
4012 	 *    - DCB configuration
4013 	 *    - FEC configuration
4014 	 *    - Flow control configuration
4015 	 *    - LRO configuration
4016 	 *    - LSC configuration
4017 	 *    - MTU
4018 	 *    - MAC address (default and those supplied by MAC address array)
4019 	 *    - Promiscuous and allmulticast mode
4020 	 *    - PTP configuration
4021 	 *    - Queue (Rx/Tx) settings
4022 	 *    - Queue statistics mappings
4023 	 *    - RSS configuration by rte_eth_dev_rss_xxx() family
4024 	 *    - Rx checksum configuration
4025 	 *    - Rx interrupt settings
4026 	 *    - Traffic management configuration
4027 	 *    - VLAN configuration (including filtering, tpid, strip, pvid)
4028 	 *    - VMDq configuration
4029 	 * b) The following configuration maybe retained
4030 	 *    or not depending on the device capabilities:
4031 	 *    - flow rules
4032 	 *      (@see RTE_ETH_DEV_CAPA_FLOW_RULE_KEEP)
4033 	 *    - shared flow objects
4034 	 *      (@see RTE_ETH_DEV_CAPA_FLOW_SHARED_OBJECT_KEEP)
4035 	 * c) Any other configuration will not be stored
4036 	 *    and will need to be re-configured.
4037 	 */
4038 	RTE_ETH_EVENT_RECOVERY_SUCCESS,
4039 	/** Port recovery failed.
4040 	 * It means that the port should not be usable anymore.
4041 	 * The application should close the port.
4042 	 */
4043 	RTE_ETH_EVENT_RECOVERY_FAILED,
4044 	RTE_ETH_EVENT_MAX       /**< max value of this enum */
4045 };
4046 
4047 /** User application callback to be registered for interrupts. */
4048 typedef int (*rte_eth_dev_cb_fn)(uint16_t port_id,
4049 		enum rte_eth_event_type event, void *cb_arg, void *ret_param);
4050 
4051 /**
4052  * Register a callback function for port event.
4053  *
4054  * @param port_id
4055  *  Port ID.
4056  *  RTE_ETH_ALL means register the event for all port ids.
4057  * @param event
4058  *  Event interested.
4059  * @param cb_fn
4060  *  User supplied callback function to be called.
4061  * @param cb_arg
4062  *  Pointer to the parameters for the registered callback.
4063  *
4064  * @return
4065  *  - On success, zero.
4066  *  - On failure, a negative value.
4067  */
4068 int rte_eth_dev_callback_register(uint16_t port_id,
4069 			enum rte_eth_event_type event,
4070 		rte_eth_dev_cb_fn cb_fn, void *cb_arg);
4071 
4072 /**
4073  * Unregister a callback function for port event.
4074  *
4075  * @param port_id
4076  *  Port ID.
4077  *  RTE_ETH_ALL means unregister the event for all port ids.
4078  * @param event
4079  *  Event interested.
4080  * @param cb_fn
4081  *  User supplied callback function to be called.
4082  * @param cb_arg
4083  *  Pointer to the parameters for the registered callback. -1 means to
4084  *  remove all for the same callback address and same event.
4085  *
4086  * @return
4087  *  - On success, zero.
4088  *  - On failure, a negative value.
4089  */
4090 int rte_eth_dev_callback_unregister(uint16_t port_id,
4091 			enum rte_eth_event_type event,
4092 		rte_eth_dev_cb_fn cb_fn, void *cb_arg);
4093 
4094 /**
4095  * When there is no Rx packet coming in Rx Queue for a long time, we can
4096  * sleep lcore related to Rx Queue for power saving, and enable Rx interrupt
4097  * to be triggered when Rx packet arrives.
4098  *
4099  * The rte_eth_dev_rx_intr_enable() function enables Rx queue
4100  * interrupt on specific Rx queue of a port.
4101  *
4102  * @param port_id
4103  *   The port identifier of the Ethernet device.
4104  * @param queue_id
4105  *   The index of the receive queue from which to retrieve input packets.
4106  *   The value must be in the range [0, nb_rx_queue - 1] previously supplied
4107  *   to rte_eth_dev_configure().
4108  * @return
4109  *   - (0) if successful.
4110  *   - (-ENOTSUP) if underlying hardware OR driver doesn't support
4111  *     that operation.
4112  *   - (-ENODEV) if *port_id* invalid.
4113  *   - (-EIO) if device is removed.
4114  */
4115 int rte_eth_dev_rx_intr_enable(uint16_t port_id, uint16_t queue_id);
4116 
4117 /**
4118  * When lcore wakes up from Rx interrupt indicating packet coming, disable Rx
4119  * interrupt and returns to polling mode.
4120  *
4121  * The rte_eth_dev_rx_intr_disable() function disables Rx queue
4122  * interrupt on specific Rx queue of a port.
4123  *
4124  * @param port_id
4125  *   The port identifier of the Ethernet device.
4126  * @param queue_id
4127  *   The index of the receive queue from which to retrieve input packets.
4128  *   The value must be in the range [0, nb_rx_queue - 1] previously supplied
4129  *   to rte_eth_dev_configure().
4130  * @return
4131  *   - (0) if successful.
4132  *   - (-ENOTSUP) if underlying hardware OR driver doesn't support
4133  *     that operation.
4134  *   - (-ENODEV) if *port_id* invalid.
4135  *   - (-EIO) if device is removed.
4136  */
4137 int rte_eth_dev_rx_intr_disable(uint16_t port_id, uint16_t queue_id);
4138 
4139 /**
4140  * Rx Interrupt control per port.
4141  *
4142  * @param port_id
4143  *   The port identifier of the Ethernet device.
4144  * @param epfd
4145  *   Epoll instance fd which the intr vector associated to.
4146  *   Using RTE_EPOLL_PER_THREAD allows to use per thread epoll instance.
4147  * @param op
4148  *   The operation be performed for the vector.
4149  *   Operation type of {RTE_INTR_EVENT_ADD, RTE_INTR_EVENT_DEL}.
4150  * @param data
4151  *   User raw data.
4152  * @return
4153  *   - On success, zero.
4154  *   - On failure, a negative value.
4155  */
4156 int rte_eth_dev_rx_intr_ctl(uint16_t port_id, int epfd, int op, void *data);
4157 
4158 /**
4159  * Rx Interrupt control per queue.
4160  *
4161  * @param port_id
4162  *   The port identifier of the Ethernet device.
4163  * @param queue_id
4164  *   The index of the receive queue from which to retrieve input packets.
4165  *   The value must be in the range [0, nb_rx_queue - 1] previously supplied
4166  *   to rte_eth_dev_configure().
4167  * @param epfd
4168  *   Epoll instance fd which the intr vector associated to.
4169  *   Using RTE_EPOLL_PER_THREAD allows to use per thread epoll instance.
4170  * @param op
4171  *   The operation be performed for the vector.
4172  *   Operation type of {RTE_INTR_EVENT_ADD, RTE_INTR_EVENT_DEL}.
4173  * @param data
4174  *   User raw data.
4175  * @return
4176  *   - On success, zero.
4177  *   - On failure, a negative value.
4178  */
4179 int rte_eth_dev_rx_intr_ctl_q(uint16_t port_id, uint16_t queue_id,
4180 			      int epfd, int op, void *data);
4181 
4182 /**
4183  * Get interrupt fd per Rx queue.
4184  *
4185  * @param port_id
4186  *   The port identifier of the Ethernet device.
4187  * @param queue_id
4188  *   The index of the receive queue from which to retrieve input packets.
4189  *   The value must be in the range [0, nb_rx_queue - 1] previously supplied
4190  *   to rte_eth_dev_configure().
4191  * @return
4192  *   - (>=0) the interrupt fd associated to the requested Rx queue if
4193  *           successful.
4194  *   - (-1) on error.
4195  */
4196 int
4197 rte_eth_dev_rx_intr_ctl_q_get_fd(uint16_t port_id, uint16_t queue_id);
4198 
4199 /**
4200  * Turn on the LED on the Ethernet device.
4201  * This function turns on the LED on the Ethernet device.
4202  *
4203  * @param port_id
4204  *   The port identifier of the Ethernet device.
4205  * @return
4206  *   - (0) if successful.
4207  *   - (-ENOTSUP) if underlying hardware OR driver doesn't support
4208  *     that operation.
4209  *   - (-ENODEV) if *port_id* invalid.
4210  *   - (-EIO) if device is removed.
4211  */
4212 int  rte_eth_led_on(uint16_t port_id);
4213 
4214 /**
4215  * Turn off the LED on the Ethernet device.
4216  * This function turns off the LED on the Ethernet device.
4217  *
4218  * @param port_id
4219  *   The port identifier of the Ethernet device.
4220  * @return
4221  *   - (0) if successful.
4222  *   - (-ENOTSUP) if underlying hardware OR driver doesn't support
4223  *     that operation.
4224  *   - (-ENODEV) if *port_id* invalid.
4225  *   - (-EIO) if device is removed.
4226  */
4227 int  rte_eth_led_off(uint16_t port_id);
4228 
4229 /**
4230  * @warning
4231  * @b EXPERIMENTAL: this API may change, or be removed, without prior notice
4232  *
4233  * Get Forward Error Correction(FEC) capability.
4234  *
4235  * @param port_id
4236  *   The port identifier of the Ethernet device.
4237  * @param speed_fec_capa
4238  *   speed_fec_capa is out only with per-speed capabilities.
4239  *   If set to NULL, the function returns the required number
4240  *   of required array entries.
4241  * @param num
4242  *   a number of elements in an speed_fec_capa array.
4243  *
4244  * @return
4245  *   - A non-negative value lower or equal to num: success. The return value
4246  *     is the number of entries filled in the fec capa array.
4247  *   - A non-negative value higher than num: error, the given fec capa array
4248  *     is too small. The return value corresponds to the num that should
4249  *     be given to succeed. The entries in fec capa array are not valid and
4250  *     shall not be used by the caller.
4251  *   - (-ENOTSUP) if underlying hardware OR driver doesn't support.
4252  *     that operation.
4253  *   - (-EIO) if device is removed.
4254  *   - (-ENODEV)  if *port_id* invalid.
4255  *   - (-EINVAL)  if *num* or *speed_fec_capa* invalid
4256  */
4257 __rte_experimental
4258 int rte_eth_fec_get_capability(uint16_t port_id,
4259 			       struct rte_eth_fec_capa *speed_fec_capa,
4260 			       unsigned int num);
4261 
4262 /**
4263  * @warning
4264  * @b EXPERIMENTAL: this API may change, or be removed, without prior notice
4265  *
4266  * Get current Forward Error Correction(FEC) mode.
4267  * If link is down and AUTO is enabled, AUTO is returned, otherwise,
4268  * configured FEC mode is returned.
4269  * If link is up, current FEC mode is returned.
4270  *
4271  * @param port_id
4272  *   The port identifier of the Ethernet device.
4273  * @param fec_capa
4274  *   A bitmask with the current FEC mode.
4275  * @return
4276  *   - (0) if successful.
4277  *   - (-ENOTSUP) if underlying hardware OR driver doesn't support.
4278  *     that operation.
4279  *   - (-EIO) if device is removed.
4280  *   - (-ENODEV)  if *port_id* invalid.
4281  */
4282 __rte_experimental
4283 int rte_eth_fec_get(uint16_t port_id, uint32_t *fec_capa);
4284 
4285 /**
4286  * @warning
4287  * @b EXPERIMENTAL: this API may change, or be removed, without prior notice
4288  *
4289  * Set Forward Error Correction(FEC) mode.
4290  *
4291  * @param port_id
4292  *   The port identifier of the Ethernet device.
4293  * @param fec_capa
4294  *   A bitmask of allowed FEC modes.
4295  *   If only the AUTO bit is set, the decision on which FEC
4296  *   mode to use will be made by HW/FW or driver.
4297  *   If the AUTO bit is set with some FEC modes, only specified
4298  *   FEC modes can be set.
4299  *   If AUTO bit is clear, specify FEC mode to be used
4300  *   (only one valid mode per speed may be set).
4301  * @return
4302  *   - (0) if successful.
4303  *   - (-EINVAL) if the FEC mode is not valid.
4304  *   - (-ENOTSUP) if underlying hardware OR driver doesn't support.
4305  *   - (-EIO) if device is removed.
4306  *   - (-ENODEV)  if *port_id* invalid.
4307  */
4308 __rte_experimental
4309 int rte_eth_fec_set(uint16_t port_id, uint32_t fec_capa);
4310 
4311 /**
4312  * Get current status of the Ethernet link flow control for Ethernet device
4313  *
4314  * @param port_id
4315  *   The port identifier of the Ethernet device.
4316  * @param fc_conf
4317  *   The pointer to the structure where to store the flow control parameters.
4318  * @return
4319  *   - (0) if successful.
4320  *   - (-ENOTSUP) if hardware doesn't support flow control.
4321  *   - (-ENODEV)  if *port_id* invalid.
4322  *   - (-EIO)  if device is removed.
4323  *   - (-EINVAL) if bad parameter.
4324  */
4325 int rte_eth_dev_flow_ctrl_get(uint16_t port_id,
4326 			      struct rte_eth_fc_conf *fc_conf);
4327 
4328 /**
4329  * Configure the Ethernet link flow control for Ethernet device
4330  *
4331  * @param port_id
4332  *   The port identifier of the Ethernet device.
4333  * @param fc_conf
4334  *   The pointer to the structure of the flow control parameters.
4335  * @return
4336  *   - (0) if successful.
4337  *   - (-ENOTSUP) if hardware doesn't support flow control mode.
4338  *   - (-ENODEV)  if *port_id* invalid.
4339  *   - (-EINVAL)  if bad parameter
4340  *   - (-EIO)     if flow control setup failure or device is removed.
4341  */
4342 int rte_eth_dev_flow_ctrl_set(uint16_t port_id,
4343 			      struct rte_eth_fc_conf *fc_conf);
4344 
4345 /**
4346  * Configure the Ethernet priority flow control under DCB environment
4347  * for Ethernet device.
4348  *
4349  * @param port_id
4350  * The port identifier of the Ethernet device.
4351  * @param pfc_conf
4352  * The pointer to the structure of the priority flow control parameters.
4353  * @return
4354  *   - (0) if successful.
4355  *   - (-ENOTSUP) if hardware doesn't support priority flow control mode.
4356  *   - (-ENODEV)  if *port_id* invalid.
4357  *   - (-EINVAL)  if bad parameter
4358  *   - (-EIO)     if flow control setup failure or device is removed.
4359  */
4360 int rte_eth_dev_priority_flow_ctrl_set(uint16_t port_id,
4361 				struct rte_eth_pfc_conf *pfc_conf);
4362 
4363 /**
4364  * Add a MAC address to the set used for filtering incoming packets.
4365  *
4366  * @param port_id
4367  *   The port identifier of the Ethernet device.
4368  * @param mac_addr
4369  *   The MAC address to add.
4370  * @param pool
4371  *   VMDq pool index to associate address with (if VMDq is enabled). If VMDq is
4372  *   not enabled, this should be set to 0.
4373  * @return
4374  *   - (0) if successfully added or *mac_addr* was already added.
4375  *   - (-ENOTSUP) if hardware doesn't support this feature.
4376  *   - (-ENODEV) if *port* is invalid.
4377  *   - (-EIO) if device is removed.
4378  *   - (-ENOSPC) if no more MAC addresses can be added.
4379  *   - (-EINVAL) if MAC address is invalid.
4380  */
4381 int rte_eth_dev_mac_addr_add(uint16_t port_id, struct rte_ether_addr *mac_addr,
4382 				uint32_t pool);
4383 
4384 /**
4385  * @warning
4386  * @b EXPERIMENTAL: this API may change without prior notice.
4387  *
4388  * Retrieve the information for queue based PFC.
4389  *
4390  * @param port_id
4391  *   The port identifier of the Ethernet device.
4392  * @param pfc_queue_info
4393  *   A pointer to a structure of type *rte_eth_pfc_queue_info* to be filled with
4394  *   the information about queue based PFC.
4395  * @return
4396  *   - (0) if successful.
4397  *   - (-ENOTSUP) if support for priority_flow_ctrl_queue_info_get does not exist.
4398  *   - (-ENODEV) if *port_id* invalid.
4399  *   - (-EINVAL) if bad parameter.
4400  */
4401 __rte_experimental
4402 int rte_eth_dev_priority_flow_ctrl_queue_info_get(uint16_t port_id,
4403 		struct rte_eth_pfc_queue_info *pfc_queue_info);
4404 
4405 /**
4406  * @warning
4407  * @b EXPERIMENTAL: this API may change without prior notice.
4408  *
4409  * Configure the queue based priority flow control for a given queue
4410  * for Ethernet device.
4411  *
4412  * @note When an ethdev port switches to queue based PFC mode, the
4413  * unconfigured queues shall be configured by the driver with
4414  * default values such as lower priority value for TC etc.
4415  *
4416  * @param port_id
4417  *   The port identifier of the Ethernet device.
4418  * @param pfc_queue_conf
4419  *   The pointer to the structure of the priority flow control parameters
4420  *   for the queue.
4421  * @return
4422  *   - (0) if successful.
4423  *   - (-ENOTSUP) if hardware doesn't support queue based PFC mode.
4424  *   - (-ENODEV)  if *port_id* invalid.
4425  *   - (-EINVAL)  if bad parameter
4426  *   - (-EIO)     if flow control setup queue failure
4427  */
4428 __rte_experimental
4429 int rte_eth_dev_priority_flow_ctrl_queue_configure(uint16_t port_id,
4430 		struct rte_eth_pfc_queue_conf *pfc_queue_conf);
4431 
4432 /**
4433  * Remove a MAC address from the internal array of addresses.
4434  *
4435  * @param port_id
4436  *   The port identifier of the Ethernet device.
4437  * @param mac_addr
4438  *   MAC address to remove.
4439  * @return
4440  *   - (0) if successful, or *mac_addr* didn't exist.
4441  *   - (-ENOTSUP) if hardware doesn't support.
4442  *   - (-ENODEV) if *port* invalid.
4443  *   - (-EADDRINUSE) if attempting to remove the default MAC address.
4444  *   - (-EINVAL) if MAC address is invalid.
4445  */
4446 int rte_eth_dev_mac_addr_remove(uint16_t port_id,
4447 				struct rte_ether_addr *mac_addr);
4448 
4449 /**
4450  * Set the default MAC address.
4451  * It replaces the address at index 0 of the MAC address list.
4452  * If the address was already in the MAC address list,
4453  * please remove it first.
4454  *
4455  * @param port_id
4456  *   The port identifier of the Ethernet device.
4457  * @param mac_addr
4458  *   New default MAC address.
4459  * @return
4460  *   - (0) if successful, or *mac_addr* didn't exist.
4461  *   - (-ENOTSUP) if hardware doesn't support.
4462  *   - (-ENODEV) if *port* invalid.
4463  *   - (-EINVAL) if MAC address is invalid.
4464  *   - (-EEXIST) if MAC address was already in the address list.
4465  */
4466 int rte_eth_dev_default_mac_addr_set(uint16_t port_id,
4467 		struct rte_ether_addr *mac_addr);
4468 
4469 /**
4470  * Update Redirection Table(RETA) of Receive Side Scaling of Ethernet device.
4471  *
4472  * @param port_id
4473  *   The port identifier of the Ethernet device.
4474  * @param reta_conf
4475  *   RETA to update.
4476  * @param reta_size
4477  *   Redirection table size. The table size can be queried by
4478  *   rte_eth_dev_info_get().
4479  * @return
4480  *   - (0) if successful.
4481  *   - (-ENODEV) if *port_id* is invalid.
4482  *   - (-ENOTSUP) if hardware doesn't support.
4483  *   - (-EINVAL) if bad parameter.
4484  *   - (-EIO) if device is removed.
4485  */
4486 int rte_eth_dev_rss_reta_update(uint16_t port_id,
4487 				struct rte_eth_rss_reta_entry64 *reta_conf,
4488 				uint16_t reta_size);
4489 
4490 /**
4491  * Query Redirection Table(RETA) of Receive Side Scaling of Ethernet device.
4492  *
4493  * @param port_id
4494  *   The port identifier of the Ethernet device.
4495  * @param reta_conf
4496  *   RETA to query. For each requested reta entry, corresponding bit
4497  *   in mask must be set.
4498  * @param reta_size
4499  *   Redirection table size. The table size can be queried by
4500  *   rte_eth_dev_info_get().
4501  * @return
4502  *   - (0) if successful.
4503  *   - (-ENODEV) if *port_id* is invalid.
4504  *   - (-ENOTSUP) if hardware doesn't support.
4505  *   - (-EINVAL) if bad parameter.
4506  *   - (-EIO) if device is removed.
4507  */
4508 int rte_eth_dev_rss_reta_query(uint16_t port_id,
4509 			       struct rte_eth_rss_reta_entry64 *reta_conf,
4510 			       uint16_t reta_size);
4511 
4512 /**
4513  * Updates unicast hash table for receiving packet with the given destination
4514  * MAC address, and the packet is routed to all VFs for which the Rx mode is
4515  * accept packets that match the unicast hash table.
4516  *
4517  * @param port_id
4518  *   The port identifier of the Ethernet device.
4519  * @param addr
4520  *   Unicast MAC address.
4521  * @param on
4522  *    1 - Set an unicast hash bit for receiving packets with the MAC address.
4523  *    0 - Clear an unicast hash bit.
4524  * @return
4525  *   - (0) if successful.
4526  *   - (-ENOTSUP) if hardware doesn't support.
4527  *   - (-ENODEV) if *port_id* invalid.
4528  *   - (-EIO) if device is removed.
4529  *   - (-EINVAL) if bad parameter.
4530  */
4531 int rte_eth_dev_uc_hash_table_set(uint16_t port_id, struct rte_ether_addr *addr,
4532 				  uint8_t on);
4533 
4534 /**
4535  * Updates all unicast hash bitmaps for receiving packet with any Unicast
4536  * Ethernet MAC addresses,the packet is routed to all VFs for which the Rx
4537  * mode is accept packets that match the unicast hash table.
4538  *
4539  * @param port_id
4540  *   The port identifier of the Ethernet device.
4541  * @param on
4542  *    1 - Set all unicast hash bitmaps for receiving all the Ethernet
4543  *         MAC addresses
4544  *    0 - Clear all unicast hash bitmaps
4545  * @return
4546  *   - (0) if successful.
4547  *   - (-ENOTSUP) if hardware doesn't support.
4548  *   - (-ENODEV) if *port_id* invalid.
4549  *   - (-EIO) if device is removed.
4550  *   - (-EINVAL) if bad parameter.
4551  */
4552 int rte_eth_dev_uc_all_hash_table_set(uint16_t port_id, uint8_t on);
4553 
4554 /**
4555  * Set the rate limitation for a queue on an Ethernet device.
4556  *
4557  * @param port_id
4558  *   The port identifier of the Ethernet device.
4559  * @param queue_idx
4560  *   The queue ID.
4561  * @param tx_rate
4562  *   The Tx rate in Mbps. Allocated from the total port link speed.
4563  * @return
4564  *   - (0) if successful.
4565  *   - (-ENOTSUP) if hardware doesn't support this feature.
4566  *   - (-ENODEV) if *port_id* invalid.
4567  *   - (-EIO) if device is removed.
4568  *   - (-EINVAL) if bad parameter.
4569  */
4570 int rte_eth_set_queue_rate_limit(uint16_t port_id, uint16_t queue_idx,
4571 			uint32_t tx_rate);
4572 
4573 /**
4574  * Configuration of Receive Side Scaling hash computation of Ethernet device.
4575  *
4576  * @param port_id
4577  *   The port identifier of the Ethernet device.
4578  * @param rss_conf
4579  *   The new configuration to use for RSS hash computation on the port.
4580  * @return
4581  *   - (0) if successful.
4582  *   - (-ENODEV) if port identifier is invalid.
4583  *   - (-EIO) if device is removed.
4584  *   - (-ENOTSUP) if hardware doesn't support.
4585  *   - (-EINVAL) if bad parameter.
4586  */
4587 int rte_eth_dev_rss_hash_update(uint16_t port_id,
4588 				struct rte_eth_rss_conf *rss_conf);
4589 
4590 /**
4591  * Retrieve current configuration of Receive Side Scaling hash computation
4592  * of Ethernet device.
4593  *
4594  * @param port_id
4595  *   The port identifier of the Ethernet device.
4596  * @param rss_conf
4597  *   Where to store the current RSS hash configuration of the Ethernet device.
4598  * @return
4599  *   - (0) if successful.
4600  *   - (-ENODEV) if port identifier is invalid.
4601  *   - (-EIO) if device is removed.
4602  *   - (-ENOTSUP) if hardware doesn't support RSS.
4603  *   - (-EINVAL) if bad parameter.
4604  */
4605 int
4606 rte_eth_dev_rss_hash_conf_get(uint16_t port_id,
4607 			      struct rte_eth_rss_conf *rss_conf);
4608 
4609 /**
4610  * Add UDP tunneling port for a type of tunnel.
4611  *
4612  * Some NICs may require such configuration to properly parse a tunnel
4613  * with any standard or custom UDP port.
4614  * The packets with this UDP port will be parsed for this type of tunnel.
4615  * The device parser will also check the rest of the tunnel headers
4616  * before classifying the packet.
4617  *
4618  * With some devices, this API will affect packet classification, i.e.:
4619  *     - mbuf.packet_type reported on Rx
4620  *     - rte_flow rules with tunnel items
4621  *
4622  * @param port_id
4623  *   The port identifier of the Ethernet device.
4624  * @param tunnel_udp
4625  *   UDP tunneling configuration.
4626  *
4627  * @return
4628  *   - (0) if successful.
4629  *   - (-ENODEV) if port identifier is invalid.
4630  *   - (-EIO) if device is removed.
4631  *   - (-ENOTSUP) if hardware doesn't support tunnel type.
4632  */
4633 int
4634 rte_eth_dev_udp_tunnel_port_add(uint16_t port_id,
4635 				struct rte_eth_udp_tunnel *tunnel_udp);
4636 
4637 /**
4638  * Delete UDP tunneling port for a type of tunnel.
4639  *
4640  * The packets with this UDP port will not be classified as this type of tunnel
4641  * anymore if the device use such mapping for tunnel packet classification.
4642  *
4643  * @see rte_eth_dev_udp_tunnel_port_add
4644  *
4645  * @param port_id
4646  *   The port identifier of the Ethernet device.
4647  * @param tunnel_udp
4648  *   UDP tunneling configuration.
4649  *
4650  * @return
4651  *   - (0) if successful.
4652  *   - (-ENODEV) if port identifier is invalid.
4653  *   - (-EIO) if device is removed.
4654  *   - (-ENOTSUP) if hardware doesn't support tunnel type.
4655  */
4656 int
4657 rte_eth_dev_udp_tunnel_port_delete(uint16_t port_id,
4658 				   struct rte_eth_udp_tunnel *tunnel_udp);
4659 
4660 /**
4661  * Get DCB information on an Ethernet device.
4662  *
4663  * @param port_id
4664  *   The port identifier of the Ethernet device.
4665  * @param dcb_info
4666  *   DCB information.
4667  * @return
4668  *   - (0) if successful.
4669  *   - (-ENODEV) if port identifier is invalid.
4670  *   - (-EIO) if device is removed.
4671  *   - (-ENOTSUP) if hardware doesn't support.
4672  *   - (-EINVAL) if bad parameter.
4673  */
4674 int rte_eth_dev_get_dcb_info(uint16_t port_id,
4675 			     struct rte_eth_dcb_info *dcb_info);
4676 
4677 struct rte_eth_rxtx_callback;
4678 
4679 /**
4680  * Add a callback to be called on packet Rx on a given port and queue.
4681  *
4682  * This API configures a function to be called for each burst of
4683  * packets received on a given NIC port queue. The return value is a pointer
4684  * that can be used to later remove the callback using
4685  * rte_eth_remove_rx_callback().
4686  *
4687  * Multiple functions are called in the order that they are added.
4688  *
4689  * @param port_id
4690  *   The port identifier of the Ethernet device.
4691  * @param queue_id
4692  *   The queue on the Ethernet device on which the callback is to be added.
4693  * @param fn
4694  *   The callback function
4695  * @param user_param
4696  *   A generic pointer parameter which will be passed to each invocation of the
4697  *   callback function on this port and queue. Inter-thread synchronization
4698  *   of any user data changes is the responsibility of the user.
4699  *
4700  * @return
4701  *   NULL on error.
4702  *   On success, a pointer value which can later be used to remove the callback.
4703  */
4704 const struct rte_eth_rxtx_callback *
4705 rte_eth_add_rx_callback(uint16_t port_id, uint16_t queue_id,
4706 		rte_rx_callback_fn fn, void *user_param);
4707 
4708 /**
4709  * Add a callback that must be called first on packet Rx on a given port
4710  * and queue.
4711  *
4712  * This API configures a first function to be called for each burst of
4713  * packets received on a given NIC port queue. The return value is a pointer
4714  * that can be used to later remove the callback using
4715  * rte_eth_remove_rx_callback().
4716  *
4717  * Multiple functions are called in the order that they are added.
4718  *
4719  * @param port_id
4720  *   The port identifier of the Ethernet device.
4721  * @param queue_id
4722  *   The queue on the Ethernet device on which the callback is to be added.
4723  * @param fn
4724  *   The callback function
4725  * @param user_param
4726  *   A generic pointer parameter which will be passed to each invocation of the
4727  *   callback function on this port and queue. Inter-thread synchronization
4728  *   of any user data changes is the responsibility of the user.
4729  *
4730  * @return
4731  *   NULL on error.
4732  *   On success, a pointer value which can later be used to remove the callback.
4733  */
4734 const struct rte_eth_rxtx_callback *
4735 rte_eth_add_first_rx_callback(uint16_t port_id, uint16_t queue_id,
4736 		rte_rx_callback_fn fn, void *user_param);
4737 
4738 /**
4739  * Add a callback to be called on packet Tx on a given port and queue.
4740  *
4741  * This API configures a function to be called for each burst of
4742  * packets sent on a given NIC port queue. The return value is a pointer
4743  * that can be used to later remove the callback using
4744  * rte_eth_remove_tx_callback().
4745  *
4746  * Multiple functions are called in the order that they are added.
4747  *
4748  * @param port_id
4749  *   The port identifier of the Ethernet device.
4750  * @param queue_id
4751  *   The queue on the Ethernet device on which the callback is to be added.
4752  * @param fn
4753  *   The callback function
4754  * @param user_param
4755  *   A generic pointer parameter which will be passed to each invocation of the
4756  *   callback function on this port and queue. Inter-thread synchronization
4757  *   of any user data changes is the responsibility of the user.
4758  *
4759  * @return
4760  *   NULL on error.
4761  *   On success, a pointer value which can later be used to remove the callback.
4762  */
4763 const struct rte_eth_rxtx_callback *
4764 rte_eth_add_tx_callback(uint16_t port_id, uint16_t queue_id,
4765 		rte_tx_callback_fn fn, void *user_param);
4766 
4767 /**
4768  * Remove an Rx packet callback from a given port and queue.
4769  *
4770  * This function is used to removed callbacks that were added to a NIC port
4771  * queue using rte_eth_add_rx_callback().
4772  *
4773  * Note: the callback is removed from the callback list but it isn't freed
4774  * since the it may still be in use. The memory for the callback can be
4775  * subsequently freed back by the application by calling rte_free():
4776  *
4777  * - Immediately - if the port is stopped, or the user knows that no
4778  *   callbacks are in flight e.g. if called from the thread doing Rx/Tx
4779  *   on that queue.
4780  *
4781  * - After a short delay - where the delay is sufficient to allow any
4782  *   in-flight callbacks to complete. Alternately, the RCU mechanism can be
4783  *   used to detect when data plane threads have ceased referencing the
4784  *   callback memory.
4785  *
4786  * @param port_id
4787  *   The port identifier of the Ethernet device.
4788  * @param queue_id
4789  *   The queue on the Ethernet device from which the callback is to be removed.
4790  * @param user_cb
4791  *   User supplied callback created via rte_eth_add_rx_callback().
4792  *
4793  * @return
4794  *   - 0: Success. Callback was removed.
4795  *   - -ENODEV:  If *port_id* is invalid.
4796  *   - -ENOTSUP: Callback support is not available.
4797  *   - -EINVAL:  The queue_id is out of range, or the callback
4798  *               is NULL or not found for the port/queue.
4799  */
4800 int rte_eth_remove_rx_callback(uint16_t port_id, uint16_t queue_id,
4801 		const struct rte_eth_rxtx_callback *user_cb);
4802 
4803 /**
4804  * Remove a Tx packet callback from a given port and queue.
4805  *
4806  * This function is used to removed callbacks that were added to a NIC port
4807  * queue using rte_eth_add_tx_callback().
4808  *
4809  * Note: the callback is removed from the callback list but it isn't freed
4810  * since the it may still be in use. The memory for the callback can be
4811  * subsequently freed back by the application by calling rte_free():
4812  *
4813  * - Immediately - if the port is stopped, or the user knows that no
4814  *   callbacks are in flight e.g. if called from the thread doing Rx/Tx
4815  *   on that queue.
4816  *
4817  * - After a short delay - where the delay is sufficient to allow any
4818  *   in-flight callbacks to complete. Alternately, the RCU mechanism can be
4819  *   used to detect when data plane threads have ceased referencing the
4820  *   callback memory.
4821  *
4822  * @param port_id
4823  *   The port identifier of the Ethernet device.
4824  * @param queue_id
4825  *   The queue on the Ethernet device from which the callback is to be removed.
4826  * @param user_cb
4827  *   User supplied callback created via rte_eth_add_tx_callback().
4828  *
4829  * @return
4830  *   - 0: Success. Callback was removed.
4831  *   - -ENODEV:  If *port_id* is invalid.
4832  *   - -ENOTSUP: Callback support is not available.
4833  *   - -EINVAL:  The queue_id is out of range, or the callback
4834  *               is NULL or not found for the port/queue.
4835  */
4836 int rte_eth_remove_tx_callback(uint16_t port_id, uint16_t queue_id,
4837 		const struct rte_eth_rxtx_callback *user_cb);
4838 
4839 /**
4840  * Retrieve information about given port's Rx queue.
4841  *
4842  * @param port_id
4843  *   The port identifier of the Ethernet device.
4844  * @param queue_id
4845  *   The Rx queue on the Ethernet device for which information
4846  *   will be retrieved.
4847  * @param qinfo
4848  *   A pointer to a structure of type *rte_eth_rxq_info_info* to be filled with
4849  *   the information of the Ethernet device.
4850  *
4851  * @return
4852  *   - 0: Success
4853  *   - -ENODEV:  If *port_id* is invalid.
4854  *   - -ENOTSUP: routine is not supported by the device PMD.
4855  *   - -EINVAL:  The queue_id is out of range, or the queue
4856  *               is hairpin queue.
4857  */
4858 int rte_eth_rx_queue_info_get(uint16_t port_id, uint16_t queue_id,
4859 	struct rte_eth_rxq_info *qinfo);
4860 
4861 /**
4862  * Retrieve information about given port's Tx queue.
4863  *
4864  * @param port_id
4865  *   The port identifier of the Ethernet device.
4866  * @param queue_id
4867  *   The Tx queue on the Ethernet device for which information
4868  *   will be retrieved.
4869  * @param qinfo
4870  *   A pointer to a structure of type *rte_eth_txq_info_info* to be filled with
4871  *   the information of the Ethernet device.
4872  *
4873  * @return
4874  *   - 0: Success
4875  *   - -ENODEV:  If *port_id* is invalid.
4876  *   - -ENOTSUP: routine is not supported by the device PMD.
4877  *   - -EINVAL:  The queue_id is out of range, or the queue
4878  *               is hairpin queue.
4879  */
4880 int rte_eth_tx_queue_info_get(uint16_t port_id, uint16_t queue_id,
4881 	struct rte_eth_txq_info *qinfo);
4882 
4883 /**
4884  * @warning
4885  * @b EXPERIMENTAL: this API may change, or be removed, without prior notice
4886  *
4887  * Retrieve information about given ports's Rx queue for recycling mbufs.
4888  *
4889  * @param port_id
4890  *   The port identifier of the Ethernet device.
4891  * @param queue_id
4892  *   The Rx queue on the Ethernet devicefor which information
4893  *   will be retrieved.
4894  * @param recycle_rxq_info
4895  *   A pointer to a structure of type *rte_eth_recycle_rxq_info* to be filled.
4896  *
4897  * @return
4898  *   - 0: Success
4899  *   - -ENODEV:  If *port_id* is invalid.
4900  *   - -ENOTSUP: routine is not supported by the device PMD.
4901  *   - -EINVAL:  The queue_id is out of range.
4902  */
4903 __rte_experimental
4904 int rte_eth_recycle_rx_queue_info_get(uint16_t port_id,
4905 		uint16_t queue_id,
4906 		struct rte_eth_recycle_rxq_info *recycle_rxq_info);
4907 
4908 /**
4909  * Retrieve information about the Rx packet burst mode.
4910  *
4911  * @param port_id
4912  *   The port identifier of the Ethernet device.
4913  * @param queue_id
4914  *   The Rx queue on the Ethernet device for which information
4915  *   will be retrieved.
4916  * @param mode
4917  *   A pointer to a structure of type *rte_eth_burst_mode* to be filled
4918  *   with the information of the packet burst mode.
4919  *
4920  * @return
4921  *   - 0: Success
4922  *   - -ENODEV:  If *port_id* is invalid.
4923  *   - -ENOTSUP: routine is not supported by the device PMD.
4924  *   - -EINVAL:  The queue_id is out of range.
4925  */
4926 int rte_eth_rx_burst_mode_get(uint16_t port_id, uint16_t queue_id,
4927 	struct rte_eth_burst_mode *mode);
4928 
4929 /**
4930  * Retrieve information about the Tx packet burst mode.
4931  *
4932  * @param port_id
4933  *   The port identifier of the Ethernet device.
4934  * @param queue_id
4935  *   The Tx queue on the Ethernet device for which information
4936  *   will be retrieved.
4937  * @param mode
4938  *   A pointer to a structure of type *rte_eth_burst_mode* to be filled
4939  *   with the information of the packet burst mode.
4940  *
4941  * @return
4942  *   - 0: Success
4943  *   - -ENODEV:  If *port_id* is invalid.
4944  *   - -ENOTSUP: routine is not supported by the device PMD.
4945  *   - -EINVAL:  The queue_id is out of range.
4946  */
4947 int rte_eth_tx_burst_mode_get(uint16_t port_id, uint16_t queue_id,
4948 	struct rte_eth_burst_mode *mode);
4949 
4950 /**
4951  * @warning
4952  * @b EXPERIMENTAL: this API may change without prior notice.
4953  *
4954  * Retrieve the monitor condition for a given receive queue.
4955  *
4956  * @param port_id
4957  *   The port identifier of the Ethernet device.
4958  * @param queue_id
4959  *   The Rx queue on the Ethernet device for which information
4960  *   will be retrieved.
4961  * @param pmc
4962  *   The pointer to power-optimized monitoring condition structure.
4963  *
4964  * @return
4965  *   - 0: Success.
4966  *   -ENOTSUP: Operation not supported.
4967  *   -EINVAL: Invalid parameters.
4968  *   -ENODEV: Invalid port ID.
4969  */
4970 __rte_experimental
4971 int rte_eth_get_monitor_addr(uint16_t port_id, uint16_t queue_id,
4972 		struct rte_power_monitor_cond *pmc);
4973 
4974 /**
4975  * Retrieve device registers and register attributes (number of registers and
4976  * register size)
4977  *
4978  * @param port_id
4979  *   The port identifier of the Ethernet device.
4980  * @param info
4981  *   Pointer to rte_dev_reg_info structure to fill in. If info->data is
4982  *   NULL the function fills in the width and length fields. If non-NULL
4983  *   the registers are put into the buffer pointed at by the data field.
4984  * @return
4985  *   - (0) if successful.
4986  *   - (-ENOTSUP) if hardware doesn't support.
4987  *   - (-EINVAL) if bad parameter.
4988  *   - (-ENODEV) if *port_id* invalid.
4989  *   - (-EIO) if device is removed.
4990  *   - others depends on the specific operations implementation.
4991  */
4992 int rte_eth_dev_get_reg_info(uint16_t port_id, struct rte_dev_reg_info *info);
4993 
4994 /**
4995  * Retrieve size of device EEPROM
4996  *
4997  * @param port_id
4998  *   The port identifier of the Ethernet device.
4999  * @return
5000  *   - (>=0) EEPROM size if successful.
5001  *   - (-ENOTSUP) if hardware doesn't support.
5002  *   - (-ENODEV) if *port_id* invalid.
5003  *   - (-EIO) if device is removed.
5004  *   - others depends on the specific operations implementation.
5005  */
5006 int rte_eth_dev_get_eeprom_length(uint16_t port_id);
5007 
5008 /**
5009  * Retrieve EEPROM and EEPROM attribute
5010  *
5011  * @param port_id
5012  *   The port identifier of the Ethernet device.
5013  * @param info
5014  *   The template includes buffer for return EEPROM data and
5015  *   EEPROM attributes to be filled.
5016  * @return
5017  *   - (0) if successful.
5018  *   - (-ENOTSUP) if hardware doesn't support.
5019  *   - (-EINVAL) if bad parameter.
5020  *   - (-ENODEV) if *port_id* invalid.
5021  *   - (-EIO) if device is removed.
5022  *   - others depends on the specific operations implementation.
5023  */
5024 int rte_eth_dev_get_eeprom(uint16_t port_id, struct rte_dev_eeprom_info *info);
5025 
5026 /**
5027  * Program EEPROM with provided data
5028  *
5029  * @param port_id
5030  *   The port identifier of the Ethernet device.
5031  * @param info
5032  *   The template includes EEPROM data for programming and
5033  *   EEPROM attributes to be filled
5034  * @return
5035  *   - (0) if successful.
5036  *   - (-ENOTSUP) if hardware doesn't support.
5037  *   - (-ENODEV) if *port_id* invalid.
5038  *   - (-EINVAL) if bad parameter.
5039  *   - (-EIO) if device is removed.
5040  *   - others depends on the specific operations implementation.
5041  */
5042 int rte_eth_dev_set_eeprom(uint16_t port_id, struct rte_dev_eeprom_info *info);
5043 
5044 /**
5045  * @warning
5046  * @b EXPERIMENTAL: this API may change without prior notice.
5047  *
5048  * Retrieve the type and size of plugin module EEPROM
5049  *
5050  * @param port_id
5051  *   The port identifier of the Ethernet device.
5052  * @param modinfo
5053  *   The type and size of plugin module EEPROM.
5054  * @return
5055  *   - (0) if successful.
5056  *   - (-ENOTSUP) if hardware doesn't support.
5057  *   - (-ENODEV) if *port_id* invalid.
5058  *   - (-EINVAL) if bad parameter.
5059  *   - (-EIO) if device is removed.
5060  *   - others depends on the specific operations implementation.
5061  */
5062 __rte_experimental
5063 int
5064 rte_eth_dev_get_module_info(uint16_t port_id,
5065 			    struct rte_eth_dev_module_info *modinfo);
5066 
5067 /**
5068  * @warning
5069  * @b EXPERIMENTAL: this API may change without prior notice.
5070  *
5071  * Retrieve the data of plugin module EEPROM
5072  *
5073  * @param port_id
5074  *   The port identifier of the Ethernet device.
5075  * @param info
5076  *   The template includes the plugin module EEPROM attributes, and the
5077  *   buffer for return plugin module EEPROM data.
5078  * @return
5079  *   - (0) if successful.
5080  *   - (-ENOTSUP) if hardware doesn't support.
5081  *   - (-EINVAL) if bad parameter.
5082  *   - (-ENODEV) if *port_id* invalid.
5083  *   - (-EIO) if device is removed.
5084  *   - others depends on the specific operations implementation.
5085  */
5086 __rte_experimental
5087 int
5088 rte_eth_dev_get_module_eeprom(uint16_t port_id,
5089 			      struct rte_dev_eeprom_info *info);
5090 
5091 /**
5092  * Set the list of multicast addresses to filter on an Ethernet device.
5093  *
5094  * @param port_id
5095  *   The port identifier of the Ethernet device.
5096  * @param mc_addr_set
5097  *   The array of multicast addresses to set. Equal to NULL when the function
5098  *   is invoked to flush the set of filtered addresses.
5099  * @param nb_mc_addr
5100  *   The number of multicast addresses in the *mc_addr_set* array. Equal to 0
5101  *   when the function is invoked to flush the set of filtered addresses.
5102  * @return
5103  *   - (0) if successful.
5104  *   - (-ENODEV) if *port_id* invalid.
5105  *   - (-EIO) if device is removed.
5106  *   - (-ENOTSUP) if PMD of *port_id* doesn't support multicast filtering.
5107  *   - (-ENOSPC) if *port_id* has not enough multicast filtering resources.
5108  *   - (-EINVAL) if bad parameter.
5109  */
5110 int rte_eth_dev_set_mc_addr_list(uint16_t port_id,
5111 				 struct rte_ether_addr *mc_addr_set,
5112 				 uint32_t nb_mc_addr);
5113 
5114 /**
5115  * Enable IEEE1588/802.1AS timestamping for an Ethernet device.
5116  *
5117  * @param port_id
5118  *   The port identifier of the Ethernet device.
5119  *
5120  * @return
5121  *   - 0: Success.
5122  *   - -ENODEV: The port ID is invalid.
5123  *   - -EIO: if device is removed.
5124  *   - -ENOTSUP: The function is not supported by the Ethernet driver.
5125  */
5126 int rte_eth_timesync_enable(uint16_t port_id);
5127 
5128 /**
5129  * Disable IEEE1588/802.1AS timestamping for an Ethernet device.
5130  *
5131  * @param port_id
5132  *   The port identifier of the Ethernet device.
5133  *
5134  * @return
5135  *   - 0: Success.
5136  *   - -ENODEV: The port ID is invalid.
5137  *   - -EIO: if device is removed.
5138  *   - -ENOTSUP: The function is not supported by the Ethernet driver.
5139  */
5140 int rte_eth_timesync_disable(uint16_t port_id);
5141 
5142 /**
5143  * Read an IEEE1588/802.1AS Rx timestamp from an Ethernet device.
5144  *
5145  * @param port_id
5146  *   The port identifier of the Ethernet device.
5147  * @param timestamp
5148  *   Pointer to the timestamp struct.
5149  * @param flags
5150  *   Device specific flags. Used to pass the Rx timesync register index to
5151  *   i40e. Unused in igb/ixgbe, pass 0 instead.
5152  *
5153  * @return
5154  *   - 0: Success.
5155  *   - -EINVAL: No timestamp is available.
5156  *   - -ENODEV: The port ID is invalid.
5157  *   - -EIO: if device is removed.
5158  *   - -ENOTSUP: The function is not supported by the Ethernet driver.
5159  */
5160 int rte_eth_timesync_read_rx_timestamp(uint16_t port_id,
5161 		struct timespec *timestamp, uint32_t flags);
5162 
5163 /**
5164  * Read an IEEE1588/802.1AS Tx timestamp from an Ethernet device.
5165  *
5166  * @param port_id
5167  *   The port identifier of the Ethernet device.
5168  * @param timestamp
5169  *   Pointer to the timestamp struct.
5170  *
5171  * @return
5172  *   - 0: Success.
5173  *   - -EINVAL: No timestamp is available.
5174  *   - -ENODEV: The port ID is invalid.
5175  *   - -EIO: if device is removed.
5176  *   - -ENOTSUP: The function is not supported by the Ethernet driver.
5177  */
5178 int rte_eth_timesync_read_tx_timestamp(uint16_t port_id,
5179 		struct timespec *timestamp);
5180 
5181 /**
5182  * Adjust the timesync clock on an Ethernet device.
5183  *
5184  * This is usually used in conjunction with other Ethdev timesync functions to
5185  * synchronize the device time using the IEEE1588/802.1AS protocol.
5186  *
5187  * @param port_id
5188  *   The port identifier of the Ethernet device.
5189  * @param delta
5190  *   The adjustment in nanoseconds.
5191  *
5192  * @return
5193  *   - 0: Success.
5194  *   - -ENODEV: The port ID is invalid.
5195  *   - -EIO: if device is removed.
5196  *   - -ENOTSUP: The function is not supported by the Ethernet driver.
5197  */
5198 int rte_eth_timesync_adjust_time(uint16_t port_id, int64_t delta);
5199 
5200 /**
5201  * Read the time from the timesync clock on an Ethernet device.
5202  *
5203  * This is usually used in conjunction with other Ethdev timesync functions to
5204  * synchronize the device time using the IEEE1588/802.1AS protocol.
5205  *
5206  * @param port_id
5207  *   The port identifier of the Ethernet device.
5208  * @param time
5209  *   Pointer to the timespec struct that holds the time.
5210  *
5211  * @return
5212  *   - 0: Success.
5213  *   - -EINVAL: Bad parameter.
5214  */
5215 int rte_eth_timesync_read_time(uint16_t port_id, struct timespec *time);
5216 
5217 /**
5218  * Set the time of the timesync clock on an Ethernet device.
5219  *
5220  * This is usually used in conjunction with other Ethdev timesync functions to
5221  * synchronize the device time using the IEEE1588/802.1AS protocol.
5222  *
5223  * @param port_id
5224  *   The port identifier of the Ethernet device.
5225  * @param time
5226  *   Pointer to the timespec struct that holds the time.
5227  *
5228  * @return
5229  *   - 0: Success.
5230  *   - -EINVAL: No timestamp is available.
5231  *   - -ENODEV: The port ID is invalid.
5232  *   - -EIO: if device is removed.
5233  *   - -ENOTSUP: The function is not supported by the Ethernet driver.
5234  */
5235 int rte_eth_timesync_write_time(uint16_t port_id, const struct timespec *time);
5236 
5237 /**
5238  * @warning
5239  * @b EXPERIMENTAL: this API may change without prior notice.
5240  *
5241  * Read the current clock counter of an Ethernet device
5242  *
5243  * This returns the current raw clock value of an Ethernet device. It is
5244  * a raw amount of ticks, with no given time reference.
5245  * The value returned here is from the same clock than the one
5246  * filling timestamp field of Rx packets when using hardware timestamp
5247  * offload. Therefore it can be used to compute a precise conversion of
5248  * the device clock to the real time.
5249  *
5250  * E.g, a simple heuristic to derivate the frequency would be:
5251  * uint64_t start, end;
5252  * rte_eth_read_clock(port, start);
5253  * rte_delay_ms(100);
5254  * rte_eth_read_clock(port, end);
5255  * double freq = (end - start) * 10;
5256  *
5257  * Compute a common reference with:
5258  * uint64_t base_time_sec = current_time();
5259  * uint64_t base_clock;
5260  * rte_eth_read_clock(port, base_clock);
5261  *
5262  * Then, convert the raw mbuf timestamp with:
5263  * base_time_sec + (double)(*timestamp_dynfield(mbuf) - base_clock) / freq;
5264  *
5265  * This simple example will not provide a very good accuracy. One must
5266  * at least measure multiple times the frequency and do a regression.
5267  * To avoid deviation from the system time, the common reference can
5268  * be repeated from time to time. The integer division can also be
5269  * converted by a multiplication and a shift for better performance.
5270  *
5271  * @param port_id
5272  *   The port identifier of the Ethernet device.
5273  * @param clock
5274  *   Pointer to the uint64_t that holds the raw clock value.
5275  *
5276  * @return
5277  *   - 0: Success.
5278  *   - -ENODEV: The port ID is invalid.
5279  *   - -ENOTSUP: The function is not supported by the Ethernet driver.
5280  *   - -EINVAL: if bad parameter.
5281  */
5282 __rte_experimental
5283 int
5284 rte_eth_read_clock(uint16_t port_id, uint64_t *clock);
5285 
5286 /**
5287  * Get the port ID from device name.
5288  * The device name should be specified as below:
5289  * - PCIe address (Domain:Bus:Device.Function), for example- 0000:2:00.0
5290  * - SoC device name, for example- fsl-gmac0
5291  * - vdev dpdk name, for example- net_[pcap0|null0|tap0]
5292  *
5293  * @param name
5294  *   PCI address or name of the device.
5295  * @param port_id
5296  *   Pointer to port identifier of the device.
5297  * @return
5298  *   - (0) if successful and port_id is filled.
5299  *   - (-ENODEV or -EINVAL) on failure.
5300  */
5301 int
5302 rte_eth_dev_get_port_by_name(const char *name, uint16_t *port_id);
5303 
5304 /**
5305  * Get the device name from port ID.
5306  * The device name is specified as below:
5307  * - PCIe address (Domain:Bus:Device.Function), for example- 0000:02:00.0
5308  * - SoC device name, for example- fsl-gmac0
5309  * - vdev dpdk name, for example- net_[pcap0|null0|tun0|tap0]
5310  *
5311  * @param port_id
5312  *   Port identifier of the device.
5313  * @param name
5314  *   Buffer of size RTE_ETH_NAME_MAX_LEN to store the name.
5315  * @return
5316  *   - (0) if successful.
5317  *   - (-ENODEV) if *port_id* is invalid.
5318  *   - (-EINVAL) on failure.
5319  */
5320 int
5321 rte_eth_dev_get_name_by_port(uint16_t port_id, char *name);
5322 
5323 /**
5324  * Check that numbers of Rx and Tx descriptors satisfy descriptors limits from
5325  * the Ethernet device information, otherwise adjust them to boundaries.
5326  *
5327  * @param port_id
5328  *   The port identifier of the Ethernet device.
5329  * @param nb_rx_desc
5330  *   A pointer to a uint16_t where the number of receive
5331  *   descriptors stored.
5332  * @param nb_tx_desc
5333  *   A pointer to a uint16_t where the number of transmit
5334  *   descriptors stored.
5335  * @return
5336  *   - (0) if successful.
5337  *   - (-ENOTSUP, -ENODEV or -EINVAL) on failure.
5338  */
5339 int rte_eth_dev_adjust_nb_rx_tx_desc(uint16_t port_id,
5340 				     uint16_t *nb_rx_desc,
5341 				     uint16_t *nb_tx_desc);
5342 
5343 /**
5344  * Test if a port supports specific mempool ops.
5345  *
5346  * @param port_id
5347  *   Port identifier of the Ethernet device.
5348  * @param [in] pool
5349  *   The name of the pool operations to test.
5350  * @return
5351  *   - 0: best mempool ops choice for this port.
5352  *   - 1: mempool ops are supported for this port.
5353  *   - -ENOTSUP: mempool ops not supported for this port.
5354  *   - -ENODEV: Invalid port Identifier.
5355  *   - -EINVAL: Pool param is null.
5356  */
5357 int
5358 rte_eth_dev_pool_ops_supported(uint16_t port_id, const char *pool);
5359 
5360 /**
5361  * Get the security context for the Ethernet device.
5362  *
5363  * @param port_id
5364  *   Port identifier of the Ethernet device
5365  * @return
5366  *   - NULL on error.
5367  *   - pointer to security context on success.
5368  */
5369 void *
5370 rte_eth_dev_get_sec_ctx(uint16_t port_id);
5371 
5372 /**
5373  * @warning
5374  * @b EXPERIMENTAL: this API may change, or be removed, without prior notice
5375  *
5376  * Query the device hairpin capabilities.
5377  *
5378  * @param port_id
5379  *   The port identifier of the Ethernet device.
5380  * @param cap
5381  *   Pointer to a structure that will hold the hairpin capabilities.
5382  * @return
5383  *   - (0) if successful.
5384  *   - (-ENOTSUP) if hardware doesn't support.
5385  *   - (-EINVAL) if bad parameter.
5386  */
5387 __rte_experimental
5388 int rte_eth_dev_hairpin_capability_get(uint16_t port_id,
5389 				       struct rte_eth_hairpin_cap *cap);
5390 
5391 /**
5392  * @warning
5393  * @b EXPERIMENTAL: this structure may change without prior notice.
5394  *
5395  * Ethernet device representor ID range entry
5396  */
5397 struct rte_eth_representor_range {
5398 	enum rte_eth_representor_type type; /**< Representor type */
5399 	int controller; /**< Controller index */
5400 	int pf; /**< Physical function index */
5401 	__extension__
5402 	union {
5403 		int vf; /**< VF start index */
5404 		int sf; /**< SF start index */
5405 	};
5406 	uint32_t id_base; /**< Representor ID start index */
5407 	uint32_t id_end;  /**< Representor ID end index */
5408 	char name[RTE_DEV_NAME_MAX_LEN]; /**< Representor name */
5409 };
5410 
5411 /**
5412  * @warning
5413  * @b EXPERIMENTAL: this structure may change without prior notice.
5414  *
5415  * Ethernet device representor information
5416  */
5417 struct rte_eth_representor_info {
5418 	uint16_t controller; /**< Controller ID of caller device. */
5419 	uint16_t pf; /**< Physical function ID of caller device. */
5420 	uint32_t nb_ranges_alloc; /**< Size of the ranges array. */
5421 	uint32_t nb_ranges; /**< Number of initialized ranges. */
5422 	struct rte_eth_representor_range ranges[];/**< Representor ID range. */
5423 };
5424 
5425 /**
5426  * Retrieve the representor info of the device.
5427  *
5428  * Get device representor info to be able to calculate a unique
5429  * representor ID. @see rte_eth_representor_id_get helper.
5430  *
5431  * @param port_id
5432  *   The port identifier of the device.
5433  * @param info
5434  *   A pointer to a representor info structure.
5435  *   NULL to return number of range entries and allocate memory
5436  *   for next call to store detail.
5437  *   The number of ranges that were written into this structure
5438  *   will be placed into its nb_ranges field. This number cannot be
5439  *   larger than the nb_ranges_alloc that by the user before calling
5440  *   this function. It can be smaller than the value returned by the
5441  *   function, however.
5442  * @return
5443  *   - (-ENOTSUP) if operation is not supported.
5444  *   - (-ENODEV) if *port_id* invalid.
5445  *   - (-EIO) if device is removed.
5446  *   - (>=0) number of available representor range entries.
5447  */
5448 __rte_experimental
5449 int rte_eth_representor_info_get(uint16_t port_id,
5450 				 struct rte_eth_representor_info *info);
5451 
5452 /** The NIC is able to deliver flag (if set) with packets to the PMD. */
5453 #define RTE_ETH_RX_METADATA_USER_FLAG RTE_BIT64(0)
5454 
5455 /** The NIC is able to deliver mark ID with packets to the PMD. */
5456 #define RTE_ETH_RX_METADATA_USER_MARK RTE_BIT64(1)
5457 
5458 /** The NIC is able to deliver tunnel ID with packets to the PMD. */
5459 #define RTE_ETH_RX_METADATA_TUNNEL_ID RTE_BIT64(2)
5460 
5461 /**
5462  * Negotiate the NIC's ability to deliver specific kinds of metadata to the PMD.
5463  *
5464  * Invoke this API before the first rte_eth_dev_configure() invocation
5465  * to let the PMD make preparations that are inconvenient to do later.
5466  *
5467  * The negotiation process is as follows:
5468  *
5469  * - the application requests features intending to use at least some of them;
5470  * - the PMD responds with the guaranteed subset of the requested feature set;
5471  * - the application can retry negotiation with another set of features;
5472  * - the application can pass zero to clear the negotiation result;
5473  * - the last negotiated result takes effect upon
5474  *   the ethdev configure and start.
5475  *
5476  * @note
5477  *   The PMD is supposed to first consider enabling the requested feature set
5478  *   in its entirety. Only if it fails to do so, does it have the right to
5479  *   respond with a smaller set of the originally requested features.
5480  *
5481  * @note
5482  *   Return code (-ENOTSUP) does not necessarily mean that the requested
5483  *   features are unsupported. In this case, the application should just
5484  *   assume that these features can be used without prior negotiations.
5485  *
5486  * @param port_id
5487  *   Port (ethdev) identifier
5488  *
5489  * @param[inout] features
5490  *   Feature selection buffer
5491  *
5492  * @return
5493  *   - (-EBUSY) if the port can't handle this in its current state;
5494  *   - (-ENOTSUP) if the method itself is not supported by the PMD;
5495  *   - (-ENODEV) if *port_id* is invalid;
5496  *   - (-EINVAL) if *features* is NULL;
5497  *   - (-EIO) if the device is removed;
5498  *   - (0) on success
5499  */
5500 int rte_eth_rx_metadata_negotiate(uint16_t port_id, uint64_t *features);
5501 
5502 /** Flag to offload IP reassembly for IPv4 packets. */
5503 #define RTE_ETH_DEV_REASSEMBLY_F_IPV4 (RTE_BIT32(0))
5504 /** Flag to offload IP reassembly for IPv6 packets. */
5505 #define RTE_ETH_DEV_REASSEMBLY_F_IPV6 (RTE_BIT32(1))
5506 
5507 /**
5508  * A structure used to get/set IP reassembly configuration. It is also used
5509  * to get the maximum capability values that a PMD can support.
5510  *
5511  * If rte_eth_ip_reassembly_capability_get() returns 0, IP reassembly can be
5512  * enabled using rte_eth_ip_reassembly_conf_set() and params values lower than
5513  * capability params can be set in the PMD.
5514  */
5515 struct rte_eth_ip_reassembly_params {
5516 	/** Maximum time in ms which PMD can wait for other fragments. */
5517 	uint32_t timeout_ms;
5518 	/** Maximum number of fragments that can be reassembled. */
5519 	uint16_t max_frags;
5520 	/**
5521 	 * Flags to enable reassembly of packet types -
5522 	 * RTE_ETH_DEV_REASSEMBLY_F_xxx.
5523 	 */
5524 	uint16_t flags;
5525 };
5526 
5527 /**
5528  * @warning
5529  * @b EXPERIMENTAL: this API may change without prior notice
5530  *
5531  * Get IP reassembly capabilities supported by the PMD. This is the first API
5532  * to be called for enabling the IP reassembly offload feature. PMD will return
5533  * the maximum values of parameters that PMD can support and user can call
5534  * rte_eth_ip_reassembly_conf_set() with param values lower than capability.
5535  *
5536  * @param port_id
5537  *   The port identifier of the device.
5538  * @param capa
5539  *   A pointer to rte_eth_ip_reassembly_params structure.
5540  * @return
5541  *   - (-ENOTSUP) if offload configuration is not supported by device.
5542  *   - (-ENODEV) if *port_id* invalid.
5543  *   - (-EIO) if device is removed.
5544  *   - (-EINVAL) if device is not configured or *capa* passed is NULL.
5545  *   - (0) on success.
5546  */
5547 __rte_experimental
5548 int rte_eth_ip_reassembly_capability_get(uint16_t port_id,
5549 		struct rte_eth_ip_reassembly_params *capa);
5550 
5551 /**
5552  * @warning
5553  * @b EXPERIMENTAL: this API may change without prior notice
5554  *
5555  * Get IP reassembly configuration parameters currently set in PMD.
5556  * The API will return error if the configuration is not already
5557  * set using rte_eth_ip_reassembly_conf_set() before calling this API or if
5558  * the device is not configured.
5559  *
5560  * @param port_id
5561  *   The port identifier of the device.
5562  * @param conf
5563  *   A pointer to rte_eth_ip_reassembly_params structure.
5564  * @return
5565  *   - (-ENOTSUP) if offload configuration is not supported by device.
5566  *   - (-ENODEV) if *port_id* invalid.
5567  *   - (-EIO) if device is removed.
5568  *   - (-EINVAL) if device is not configured or if *conf* passed is NULL or if
5569  *              configuration is not set using rte_eth_ip_reassembly_conf_set().
5570  *   - (0) on success.
5571  */
5572 __rte_experimental
5573 int rte_eth_ip_reassembly_conf_get(uint16_t port_id,
5574 		struct rte_eth_ip_reassembly_params *conf);
5575 
5576 /**
5577  * @warning
5578  * @b EXPERIMENTAL: this API may change without prior notice
5579  *
5580  * Set IP reassembly configuration parameters if the PMD supports IP reassembly
5581  * offload. User should first call rte_eth_ip_reassembly_capability_get() to
5582  * check the maximum values supported by the PMD before setting the
5583  * configuration. The use of this API is mandatory to enable this feature and
5584  * should be called before rte_eth_dev_start().
5585  *
5586  * In datapath, PMD cannot guarantee that IP reassembly is always successful.
5587  * Hence, PMD shall register mbuf dynamic field and dynamic flag using
5588  * rte_eth_ip_reassembly_dynfield_register() to denote incomplete IP reassembly.
5589  * If dynfield is not successfully registered, error will be returned and
5590  * IP reassembly offload cannot be used.
5591  *
5592  * @param port_id
5593  *   The port identifier of the device.
5594  * @param conf
5595  *   A pointer to rte_eth_ip_reassembly_params structure.
5596  * @return
5597  *   - (-ENOTSUP) if offload configuration is not supported by device.
5598  *   - (-ENODEV) if *port_id* invalid.
5599  *   - (-EIO) if device is removed.
5600  *   - (-EINVAL) if device is not configured or if device is already started or
5601  *               if *conf* passed is NULL or if mbuf dynfield is not registered
5602  *               successfully by the PMD.
5603  *   - (0) on success.
5604  */
5605 __rte_experimental
5606 int rte_eth_ip_reassembly_conf_set(uint16_t port_id,
5607 		const struct rte_eth_ip_reassembly_params *conf);
5608 
5609 /**
5610  * In case of IP reassembly offload failure, packet will be updated with
5611  * dynamic flag - RTE_MBUF_DYNFLAG_IP_REASSEMBLY_INCOMPLETE_NAME and packets
5612  * will be returned without alteration.
5613  * The application can retrieve the attached fragments using mbuf dynamic field
5614  * RTE_MBUF_DYNFIELD_IP_REASSEMBLY_NAME.
5615  */
5616 typedef struct {
5617 	/**
5618 	 * Next fragment packet. Application should fetch dynamic field of
5619 	 * each fragment until a NULL is received and nb_frags is 0.
5620 	 */
5621 	struct rte_mbuf *next_frag;
5622 	/** Time spent(in ms) by HW in waiting for further fragments. */
5623 	uint16_t time_spent;
5624 	/** Number of more fragments attached in mbuf dynamic fields. */
5625 	uint16_t nb_frags;
5626 } rte_eth_ip_reassembly_dynfield_t;
5627 
5628 /**
5629  * @warning
5630  * @b EXPERIMENTAL: this API may change, or be removed, without prior notice
5631  *
5632  * Dump private info from device to a file. Provided data and the order depends
5633  * on the PMD.
5634  *
5635  * @param port_id
5636  *   The port identifier of the Ethernet device.
5637  * @param file
5638  *   A pointer to a file for output.
5639  * @return
5640  *   - (0) on success.
5641  *   - (-ENODEV) if *port_id* is invalid.
5642  *   - (-EINVAL) if null file.
5643  *   - (-ENOTSUP) if the device does not support this function.
5644  *   - (-EIO) if device is removed.
5645  */
5646 __rte_experimental
5647 int rte_eth_dev_priv_dump(uint16_t port_id, FILE *file);
5648 
5649 /**
5650  * @warning
5651  * @b EXPERIMENTAL: this API may change, or be removed, without prior notice
5652  *
5653  * Dump ethdev Rx descriptor info to a file.
5654  *
5655  * This API is used for debugging, not a dataplane API.
5656  *
5657  * @param port_id
5658  *   The port identifier of the Ethernet device.
5659  * @param queue_id
5660  *   A Rx queue identifier on this port.
5661  * @param offset
5662  *  The offset of the descriptor starting from tail. (0 is the next
5663  *  packet to be received by the driver).
5664  * @param num
5665  *   The number of the descriptors to dump.
5666  * @param file
5667  *   A pointer to a file for output.
5668  * @return
5669  *   - On success, zero.
5670  *   - On failure, a negative value.
5671  */
5672 __rte_experimental
5673 int rte_eth_rx_descriptor_dump(uint16_t port_id, uint16_t queue_id,
5674 			       uint16_t offset, uint16_t num, FILE *file);
5675 
5676 /**
5677  * @warning
5678  * @b EXPERIMENTAL: this API may change, or be removed, without prior notice
5679  *
5680  * Dump ethdev Tx descriptor info to a file.
5681  *
5682  * This API is used for debugging, not a dataplane API.
5683  *
5684  * @param port_id
5685  *   The port identifier of the Ethernet device.
5686  * @param queue_id
5687  *   A Tx queue identifier on this port.
5688  * @param offset
5689  *  The offset of the descriptor starting from tail. (0 is the place where
5690  *  the next packet will be send).
5691  * @param num
5692  *   The number of the descriptors to dump.
5693  * @param file
5694  *   A pointer to a file for output.
5695  * @return
5696  *   - On success, zero.
5697  *   - On failure, a negative value.
5698  */
5699 __rte_experimental
5700 int rte_eth_tx_descriptor_dump(uint16_t port_id, uint16_t queue_id,
5701 			       uint16_t offset, uint16_t num, FILE *file);
5702 
5703 
5704 /* Congestion management */
5705 
5706 /** Enumerate list of ethdev congestion management objects */
5707 enum rte_eth_cman_obj {
5708 	/** Congestion management based on Rx queue depth */
5709 	RTE_ETH_CMAN_OBJ_RX_QUEUE = RTE_BIT32(0),
5710 	/**
5711 	 * Congestion management based on mempool depth associated with Rx queue
5712 	 * @see rte_eth_rx_queue_setup()
5713 	 */
5714 	RTE_ETH_CMAN_OBJ_RX_QUEUE_MEMPOOL = RTE_BIT32(1),
5715 };
5716 
5717 /**
5718  * @warning
5719  * @b EXPERIMENTAL: this structure may change, or be removed, without prior notice
5720  *
5721  * A structure used to retrieve information of ethdev congestion management.
5722  */
5723 struct rte_eth_cman_info {
5724 	/**
5725 	 * Set of supported congestion management modes
5726 	 * @see enum rte_cman_mode
5727 	 */
5728 	uint64_t modes_supported;
5729 	/**
5730 	 * Set of supported congestion management objects
5731 	 * @see enum rte_eth_cman_obj
5732 	 */
5733 	uint64_t objs_supported;
5734 	/**
5735 	 * Reserved for future fields. Always returned as 0 when
5736 	 * rte_eth_cman_info_get() is invoked
5737 	 */
5738 	uint8_t rsvd[8];
5739 };
5740 
5741 /**
5742  * @warning
5743  * @b EXPERIMENTAL: this structure may change, or be removed, without prior notice
5744  *
5745  * A structure used to configure the ethdev congestion management.
5746  */
5747 struct rte_eth_cman_config {
5748 	/** Congestion management object */
5749 	enum rte_eth_cman_obj obj;
5750 	/** Congestion management mode */
5751 	enum rte_cman_mode mode;
5752 	union {
5753 		/**
5754 		 * Rx queue to configure congestion management.
5755 		 *
5756 		 * Valid when object is RTE_ETH_CMAN_OBJ_RX_QUEUE or
5757 		 * RTE_ETH_CMAN_OBJ_RX_QUEUE_MEMPOOL.
5758 		 */
5759 		uint16_t rx_queue;
5760 		/**
5761 		 * Reserved for future fields.
5762 		 * It must be set to 0 when rte_eth_cman_config_set() is invoked
5763 		 * and will be returned as 0 when rte_eth_cman_config_get() is
5764 		 * invoked.
5765 		 */
5766 		uint8_t rsvd_obj_params[4];
5767 	} obj_param;
5768 	union {
5769 		/**
5770 		 * RED configuration parameters.
5771 		 *
5772 		 * Valid when mode is RTE_CMAN_RED.
5773 		 */
5774 		struct rte_cman_red_params red;
5775 		/**
5776 		 * Reserved for future fields.
5777 		 * It must be set to 0 when rte_eth_cman_config_set() is invoked
5778 		 * and will be returned as 0 when rte_eth_cman_config_get() is
5779 		 * invoked.
5780 		 */
5781 		uint8_t rsvd_mode_params[4];
5782 	} mode_param;
5783 };
5784 
5785 /**
5786  * @warning
5787  * @b EXPERIMENTAL: this API may change, or be removed, without prior notice
5788  *
5789  * Retrieve the information for ethdev congestion management
5790  *
5791  * @param port_id
5792  *   The port identifier of the Ethernet device.
5793  * @param info
5794  *   A pointer to a structure of type *rte_eth_cman_info* to be filled with
5795  *   the information about congestion management.
5796  * @return
5797  *   - (0) if successful.
5798  *   - (-ENOTSUP) if support for cman_info_get does not exist.
5799  *   - (-ENODEV) if *port_id* invalid.
5800  *   - (-EINVAL) if bad parameter.
5801  */
5802 __rte_experimental
5803 int rte_eth_cman_info_get(uint16_t port_id, struct rte_eth_cman_info *info);
5804 
5805 /**
5806  * @warning
5807  * @b EXPERIMENTAL: this API may change, or be removed, without prior notice
5808  *
5809  * Initialize the ethdev congestion management configuration structure with default values.
5810  *
5811  * @param port_id
5812  *   The port identifier of the Ethernet device.
5813  * @param config
5814  *   A pointer to a structure of type *rte_eth_cman_config* to be initialized
5815  *   with default value.
5816  * @return
5817  *   - (0) if successful.
5818  *   - (-ENOTSUP) if support for cman_config_init does not exist.
5819  *   - (-ENODEV) if *port_id* invalid.
5820  *   - (-EINVAL) if bad parameter.
5821  */
5822 __rte_experimental
5823 int rte_eth_cman_config_init(uint16_t port_id, struct rte_eth_cman_config *config);
5824 
5825 /**
5826  * @warning
5827  * @b EXPERIMENTAL: this API may change, or be removed, without prior notice
5828  *
5829  * Configure ethdev congestion management
5830  *
5831  * @param port_id
5832  *   The port identifier of the Ethernet device.
5833  * @param config
5834  *   A pointer to a structure of type *rte_eth_cman_config* to be configured.
5835  * @return
5836  *   - (0) if successful.
5837  *   - (-ENOTSUP) if support for cman_config_set does not exist.
5838  *   - (-ENODEV) if *port_id* invalid.
5839  *   - (-EINVAL) if bad parameter.
5840  */
5841 __rte_experimental
5842 int rte_eth_cman_config_set(uint16_t port_id, const struct rte_eth_cman_config *config);
5843 
5844 /**
5845  * @warning
5846  * @b EXPERIMENTAL: this API may change, or be removed, without prior notice
5847  *
5848  * Retrieve the applied ethdev congestion management parameters for the given port.
5849  *
5850  * @param port_id
5851  *   The port identifier of the Ethernet device.
5852  * @param config
5853  *   A pointer to a structure of type *rte_eth_cman_config* to retrieve
5854  *   congestion management parameters for the given object.
5855  *   Application must fill all parameters except mode_param parameter in
5856  *   struct rte_eth_cman_config.
5857  *
5858  * @return
5859  *   - (0) if successful.
5860  *   - (-ENOTSUP) if support for cman_config_get does not exist.
5861  *   - (-ENODEV) if *port_id* invalid.
5862  *   - (-EINVAL) if bad parameter.
5863  */
5864 __rte_experimental
5865 int rte_eth_cman_config_get(uint16_t port_id, struct rte_eth_cman_config *config);
5866 
5867 #include <rte_ethdev_core.h>
5868 
5869 /**
5870  * @internal
5871  * Helper routine for rte_eth_rx_burst().
5872  * Should be called at exit from PMD's rte_eth_rx_bulk implementation.
5873  * Does necessary post-processing - invokes Rx callbacks if any, etc.
5874  *
5875  * @param port_id
5876  *  The port identifier of the Ethernet device.
5877  * @param queue_id
5878  *  The index of the receive queue from which to retrieve input packets.
5879  * @param rx_pkts
5880  *   The address of an array of pointers to *rte_mbuf* structures that
5881  *   have been retrieved from the device.
5882  * @param nb_rx
5883  *   The number of packets that were retrieved from the device.
5884  * @param nb_pkts
5885  *   The number of elements in @p rx_pkts array.
5886  * @param opaque
5887  *   Opaque pointer of Rx queue callback related data.
5888  *
5889  * @return
5890  *  The number of packets effectively supplied to the @p rx_pkts array.
5891  */
5892 uint16_t rte_eth_call_rx_callbacks(uint16_t port_id, uint16_t queue_id,
5893 		struct rte_mbuf **rx_pkts, uint16_t nb_rx, uint16_t nb_pkts,
5894 		void *opaque);
5895 
5896 /**
5897  *
5898  * Retrieve a burst of input packets from a receive queue of an Ethernet
5899  * device. The retrieved packets are stored in *rte_mbuf* structures whose
5900  * pointers are supplied in the *rx_pkts* array.
5901  *
5902  * The rte_eth_rx_burst() function loops, parsing the Rx ring of the
5903  * receive queue, up to *nb_pkts* packets, and for each completed Rx
5904  * descriptor in the ring, it performs the following operations:
5905  *
5906  * - Initialize the *rte_mbuf* data structure associated with the
5907  *   Rx descriptor according to the information provided by the NIC into
5908  *   that Rx descriptor.
5909  *
5910  * - Store the *rte_mbuf* data structure into the next entry of the
5911  *   *rx_pkts* array.
5912  *
5913  * - Replenish the Rx descriptor with a new *rte_mbuf* buffer
5914  *   allocated from the memory pool associated with the receive queue at
5915  *   initialization time.
5916  *
5917  * When retrieving an input packet that was scattered by the controller
5918  * into multiple receive descriptors, the rte_eth_rx_burst() function
5919  * appends the associated *rte_mbuf* buffers to the first buffer of the
5920  * packet.
5921  *
5922  * The rte_eth_rx_burst() function returns the number of packets
5923  * actually retrieved, which is the number of *rte_mbuf* data structures
5924  * effectively supplied into the *rx_pkts* array.
5925  * A return value equal to *nb_pkts* indicates that the Rx queue contained
5926  * at least *rx_pkts* packets, and this is likely to signify that other
5927  * received packets remain in the input queue. Applications implementing
5928  * a "retrieve as much received packets as possible" policy can check this
5929  * specific case and keep invoking the rte_eth_rx_burst() function until
5930  * a value less than *nb_pkts* is returned.
5931  *
5932  * This receive method has the following advantages:
5933  *
5934  * - It allows a run-to-completion network stack engine to retrieve and
5935  *   to immediately process received packets in a fast burst-oriented
5936  *   approach, avoiding the overhead of unnecessary intermediate packet
5937  *   queue/dequeue operations.
5938  *
5939  * - Conversely, it also allows an asynchronous-oriented processing
5940  *   method to retrieve bursts of received packets and to immediately
5941  *   queue them for further parallel processing by another logical core,
5942  *   for instance. However, instead of having received packets being
5943  *   individually queued by the driver, this approach allows the caller
5944  *   of the rte_eth_rx_burst() function to queue a burst of retrieved
5945  *   packets at a time and therefore dramatically reduce the cost of
5946  *   enqueue/dequeue operations per packet.
5947  *
5948  * - It allows the rte_eth_rx_burst() function of the driver to take
5949  *   advantage of burst-oriented hardware features (CPU cache,
5950  *   prefetch instructions, and so on) to minimize the number of CPU
5951  *   cycles per packet.
5952  *
5953  * To summarize, the proposed receive API enables many
5954  * burst-oriented optimizations in both synchronous and asynchronous
5955  * packet processing environments with no overhead in both cases.
5956  *
5957  * @note
5958  *   Some drivers using vector instructions require that *nb_pkts* is
5959  *   divisible by 4 or 8, depending on the driver implementation.
5960  *
5961  * The rte_eth_rx_burst() function does not provide any error
5962  * notification to avoid the corresponding overhead. As a hint, the
5963  * upper-level application might check the status of the device link once
5964  * being systematically returned a 0 value for a given number of tries.
5965  *
5966  * @param port_id
5967  *   The port identifier of the Ethernet device.
5968  * @param queue_id
5969  *   The index of the receive queue from which to retrieve input packets.
5970  *   The value must be in the range [0, nb_rx_queue - 1] previously supplied
5971  *   to rte_eth_dev_configure().
5972  * @param rx_pkts
5973  *   The address of an array of pointers to *rte_mbuf* structures that
5974  *   must be large enough to store *nb_pkts* pointers in it.
5975  * @param nb_pkts
5976  *   The maximum number of packets to retrieve.
5977  *   The value must be divisible by 8 in order to work with any driver.
5978  * @return
5979  *   The number of packets actually retrieved, which is the number
5980  *   of pointers to *rte_mbuf* structures effectively supplied to the
5981  *   *rx_pkts* array.
5982  */
5983 static inline uint16_t
5984 rte_eth_rx_burst(uint16_t port_id, uint16_t queue_id,
5985 		 struct rte_mbuf **rx_pkts, const uint16_t nb_pkts)
5986 {
5987 	uint16_t nb_rx;
5988 	struct rte_eth_fp_ops *p;
5989 	void *qd;
5990 
5991 #ifdef RTE_ETHDEV_DEBUG_RX
5992 	if (port_id >= RTE_MAX_ETHPORTS ||
5993 			queue_id >= RTE_MAX_QUEUES_PER_PORT) {
5994 		RTE_ETHDEV_LOG(ERR,
5995 			"Invalid port_id=%u or queue_id=%u\n",
5996 			port_id, queue_id);
5997 		return 0;
5998 	}
5999 #endif
6000 
6001 	/* fetch pointer to queue data */
6002 	p = &rte_eth_fp_ops[port_id];
6003 	qd = p->rxq.data[queue_id];
6004 
6005 #ifdef RTE_ETHDEV_DEBUG_RX
6006 	RTE_ETH_VALID_PORTID_OR_ERR_RET(port_id, 0);
6007 
6008 	if (qd == NULL) {
6009 		RTE_ETHDEV_LOG(ERR, "Invalid Rx queue_id=%u for port_id=%u\n",
6010 			queue_id, port_id);
6011 		return 0;
6012 	}
6013 #endif
6014 
6015 	nb_rx = p->rx_pkt_burst(qd, rx_pkts, nb_pkts);
6016 
6017 #ifdef RTE_ETHDEV_RXTX_CALLBACKS
6018 	{
6019 		void *cb;
6020 
6021 		/* __ATOMIC_RELEASE memory order was used when the
6022 		 * call back was inserted into the list.
6023 		 * Since there is a clear dependency between loading
6024 		 * cb and cb->fn/cb->next, __ATOMIC_ACQUIRE memory order is
6025 		 * not required.
6026 		 */
6027 		cb = __atomic_load_n((void **)&p->rxq.clbk[queue_id],
6028 				__ATOMIC_RELAXED);
6029 		if (unlikely(cb != NULL))
6030 			nb_rx = rte_eth_call_rx_callbacks(port_id, queue_id,
6031 					rx_pkts, nb_rx, nb_pkts, cb);
6032 	}
6033 #endif
6034 
6035 	rte_ethdev_trace_rx_burst(port_id, queue_id, (void **)rx_pkts, nb_rx);
6036 	return nb_rx;
6037 }
6038 
6039 /**
6040  * Get the number of used descriptors of a Rx queue
6041  *
6042  * Since it's a dataplane function, no check is performed on port_id and
6043  * queue_id. The caller must therefore ensure that the port is enabled
6044  * and the queue is configured and running.
6045  *
6046  * @param port_id
6047  *  The port identifier of the Ethernet device.
6048  * @param queue_id
6049  *  The queue ID on the specific port.
6050  * @return
6051  *  The number of used descriptors in the specific queue, or:
6052  *   - (-ENODEV) if *port_id* is invalid.
6053  *   - (-EINVAL) if *queue_id* is invalid
6054  *   - (-ENOTSUP) if the device does not support this function
6055  */
6056 static inline int
6057 rte_eth_rx_queue_count(uint16_t port_id, uint16_t queue_id)
6058 {
6059 	struct rte_eth_fp_ops *p;
6060 	void *qd;
6061 
6062 #ifdef RTE_ETHDEV_DEBUG_RX
6063 	if (port_id >= RTE_MAX_ETHPORTS ||
6064 			queue_id >= RTE_MAX_QUEUES_PER_PORT) {
6065 		RTE_ETHDEV_LOG(ERR,
6066 			"Invalid port_id=%u or queue_id=%u\n",
6067 			port_id, queue_id);
6068 		return -EINVAL;
6069 	}
6070 #endif
6071 
6072 	/* fetch pointer to queue data */
6073 	p = &rte_eth_fp_ops[port_id];
6074 	qd = p->rxq.data[queue_id];
6075 
6076 #ifdef RTE_ETHDEV_DEBUG_RX
6077 	RTE_ETH_VALID_PORTID_OR_ERR_RET(port_id, -ENODEV);
6078 	if (qd == NULL)
6079 		return -EINVAL;
6080 #endif
6081 
6082 	if (*p->rx_queue_count == NULL)
6083 		return -ENOTSUP;
6084 	return (int)(*p->rx_queue_count)(qd);
6085 }
6086 
6087 /**@{@name Rx hardware descriptor states
6088  * @see rte_eth_rx_descriptor_status
6089  */
6090 #define RTE_ETH_RX_DESC_AVAIL    0 /**< Desc available for hw. */
6091 #define RTE_ETH_RX_DESC_DONE     1 /**< Desc done, filled by hw. */
6092 #define RTE_ETH_RX_DESC_UNAVAIL  2 /**< Desc used by driver or hw. */
6093 /**@}*/
6094 
6095 /**
6096  * Check the status of a Rx descriptor in the queue
6097  *
6098  * It should be called in a similar context than the Rx function:
6099  * - on a dataplane core
6100  * - not concurrently on the same queue
6101  *
6102  * Since it's a dataplane function, no check is performed on port_id and
6103  * queue_id. The caller must therefore ensure that the port is enabled
6104  * and the queue is configured and running.
6105  *
6106  * Note: accessing to a random descriptor in the ring may trigger cache
6107  * misses and have a performance impact.
6108  *
6109  * @param port_id
6110  *  A valid port identifier of the Ethernet device which.
6111  * @param queue_id
6112  *  A valid Rx queue identifier on this port.
6113  * @param offset
6114  *  The offset of the descriptor starting from tail (0 is the next
6115  *  packet to be received by the driver).
6116  *
6117  * @return
6118  *  - (RTE_ETH_RX_DESC_AVAIL): Descriptor is available for the hardware to
6119  *    receive a packet.
6120  *  - (RTE_ETH_RX_DESC_DONE): Descriptor is done, it is filled by hw, but
6121  *    not yet processed by the driver (i.e. in the receive queue).
6122  *  - (RTE_ETH_RX_DESC_UNAVAIL): Descriptor is unavailable, either hold by
6123  *    the driver and not yet returned to hw, or reserved by the hw.
6124  *  - (-EINVAL) bad descriptor offset.
6125  *  - (-ENOTSUP) if the device does not support this function.
6126  *  - (-ENODEV) bad port or queue (only if compiled with debug).
6127  */
6128 static inline int
6129 rte_eth_rx_descriptor_status(uint16_t port_id, uint16_t queue_id,
6130 	uint16_t offset)
6131 {
6132 	struct rte_eth_fp_ops *p;
6133 	void *qd;
6134 
6135 #ifdef RTE_ETHDEV_DEBUG_RX
6136 	if (port_id >= RTE_MAX_ETHPORTS ||
6137 			queue_id >= RTE_MAX_QUEUES_PER_PORT) {
6138 		RTE_ETHDEV_LOG(ERR,
6139 			"Invalid port_id=%u or queue_id=%u\n",
6140 			port_id, queue_id);
6141 		return -EINVAL;
6142 	}
6143 #endif
6144 
6145 	/* fetch pointer to queue data */
6146 	p = &rte_eth_fp_ops[port_id];
6147 	qd = p->rxq.data[queue_id];
6148 
6149 #ifdef RTE_ETHDEV_DEBUG_RX
6150 	RTE_ETH_VALID_PORTID_OR_ERR_RET(port_id, -ENODEV);
6151 	if (qd == NULL)
6152 		return -ENODEV;
6153 #endif
6154 	if (*p->rx_descriptor_status == NULL)
6155 		return -ENOTSUP;
6156 	return (*p->rx_descriptor_status)(qd, offset);
6157 }
6158 
6159 /**@{@name Tx hardware descriptor states
6160  * @see rte_eth_tx_descriptor_status
6161  */
6162 #define RTE_ETH_TX_DESC_FULL    0 /**< Desc filled for hw, waiting xmit. */
6163 #define RTE_ETH_TX_DESC_DONE    1 /**< Desc done, packet is transmitted. */
6164 #define RTE_ETH_TX_DESC_UNAVAIL 2 /**< Desc used by driver or hw. */
6165 /**@}*/
6166 
6167 /**
6168  * Check the status of a Tx descriptor in the queue.
6169  *
6170  * It should be called in a similar context than the Tx function:
6171  * - on a dataplane core
6172  * - not concurrently on the same queue
6173  *
6174  * Since it's a dataplane function, no check is performed on port_id and
6175  * queue_id. The caller must therefore ensure that the port is enabled
6176  * and the queue is configured and running.
6177  *
6178  * Note: accessing to a random descriptor in the ring may trigger cache
6179  * misses and have a performance impact.
6180  *
6181  * @param port_id
6182  *  A valid port identifier of the Ethernet device which.
6183  * @param queue_id
6184  *  A valid Tx queue identifier on this port.
6185  * @param offset
6186  *  The offset of the descriptor starting from tail (0 is the place where
6187  *  the next packet will be send).
6188  *
6189  * @return
6190  *  - (RTE_ETH_TX_DESC_FULL) Descriptor is being processed by the hw, i.e.
6191  *    in the transmit queue.
6192  *  - (RTE_ETH_TX_DESC_DONE) Hardware is done with this descriptor, it can
6193  *    be reused by the driver.
6194  *  - (RTE_ETH_TX_DESC_UNAVAIL): Descriptor is unavailable, reserved by the
6195  *    driver or the hardware.
6196  *  - (-EINVAL) bad descriptor offset.
6197  *  - (-ENOTSUP) if the device does not support this function.
6198  *  - (-ENODEV) bad port or queue (only if compiled with debug).
6199  */
6200 static inline int rte_eth_tx_descriptor_status(uint16_t port_id,
6201 	uint16_t queue_id, uint16_t offset)
6202 {
6203 	struct rte_eth_fp_ops *p;
6204 	void *qd;
6205 
6206 #ifdef RTE_ETHDEV_DEBUG_TX
6207 	if (port_id >= RTE_MAX_ETHPORTS ||
6208 			queue_id >= RTE_MAX_QUEUES_PER_PORT) {
6209 		RTE_ETHDEV_LOG(ERR,
6210 			"Invalid port_id=%u or queue_id=%u\n",
6211 			port_id, queue_id);
6212 		return -EINVAL;
6213 	}
6214 #endif
6215 
6216 	/* fetch pointer to queue data */
6217 	p = &rte_eth_fp_ops[port_id];
6218 	qd = p->txq.data[queue_id];
6219 
6220 #ifdef RTE_ETHDEV_DEBUG_TX
6221 	RTE_ETH_VALID_PORTID_OR_ERR_RET(port_id, -ENODEV);
6222 	if (qd == NULL)
6223 		return -ENODEV;
6224 #endif
6225 	if (*p->tx_descriptor_status == NULL)
6226 		return -ENOTSUP;
6227 	return (*p->tx_descriptor_status)(qd, offset);
6228 }
6229 
6230 /**
6231  * @internal
6232  * Helper routine for rte_eth_tx_burst().
6233  * Should be called before entry PMD's rte_eth_tx_bulk implementation.
6234  * Does necessary pre-processing - invokes Tx callbacks if any, etc.
6235  *
6236  * @param port_id
6237  *   The port identifier of the Ethernet device.
6238  * @param queue_id
6239  *   The index of the transmit queue through which output packets must be
6240  *   sent.
6241  * @param tx_pkts
6242  *   The address of an array of *nb_pkts* pointers to *rte_mbuf* structures
6243  *   which contain the output packets.
6244  * @param nb_pkts
6245  *   The maximum number of packets to transmit.
6246  * @return
6247  *   The number of output packets to transmit.
6248  */
6249 uint16_t rte_eth_call_tx_callbacks(uint16_t port_id, uint16_t queue_id,
6250 	struct rte_mbuf **tx_pkts, uint16_t nb_pkts, void *opaque);
6251 
6252 /**
6253  * Send a burst of output packets on a transmit queue of an Ethernet device.
6254  *
6255  * The rte_eth_tx_burst() function is invoked to transmit output packets
6256  * on the output queue *queue_id* of the Ethernet device designated by its
6257  * *port_id*.
6258  * The *nb_pkts* parameter is the number of packets to send which are
6259  * supplied in the *tx_pkts* array of *rte_mbuf* structures, each of them
6260  * allocated from a pool created with rte_pktmbuf_pool_create().
6261  * The rte_eth_tx_burst() function loops, sending *nb_pkts* packets,
6262  * up to the number of transmit descriptors available in the Tx ring of the
6263  * transmit queue.
6264  * For each packet to send, the rte_eth_tx_burst() function performs
6265  * the following operations:
6266  *
6267  * - Pick up the next available descriptor in the transmit ring.
6268  *
6269  * - Free the network buffer previously sent with that descriptor, if any.
6270  *
6271  * - Initialize the transmit descriptor with the information provided
6272  *   in the *rte_mbuf data structure.
6273  *
6274  * In the case of a segmented packet composed of a list of *rte_mbuf* buffers,
6275  * the rte_eth_tx_burst() function uses several transmit descriptors
6276  * of the ring.
6277  *
6278  * The rte_eth_tx_burst() function returns the number of packets it
6279  * actually sent. A return value equal to *nb_pkts* means that all packets
6280  * have been sent, and this is likely to signify that other output packets
6281  * could be immediately transmitted again. Applications that implement a
6282  * "send as many packets to transmit as possible" policy can check this
6283  * specific case and keep invoking the rte_eth_tx_burst() function until
6284  * a value less than *nb_pkts* is returned.
6285  *
6286  * It is the responsibility of the rte_eth_tx_burst() function to
6287  * transparently free the memory buffers of packets previously sent.
6288  * This feature is driven by the *tx_free_thresh* value supplied to the
6289  * rte_eth_dev_configure() function at device configuration time.
6290  * When the number of free Tx descriptors drops below this threshold, the
6291  * rte_eth_tx_burst() function must [attempt to] free the *rte_mbuf*  buffers
6292  * of those packets whose transmission was effectively completed.
6293  *
6294  * If the PMD is RTE_ETH_TX_OFFLOAD_MT_LOCKFREE capable, multiple threads can
6295  * invoke this function concurrently on the same Tx queue without SW lock.
6296  * @see rte_eth_dev_info_get, struct rte_eth_txconf::offloads
6297  *
6298  * @see rte_eth_tx_prepare to perform some prior checks or adjustments
6299  * for offloads.
6300  *
6301  * @note This function must not modify mbufs (including packets data)
6302  * unless the refcnt is 1.
6303  * An exception is the bonding PMD, which does not have "Tx prepare" support,
6304  * in this case, mbufs may be modified.
6305  *
6306  * @param port_id
6307  *   The port identifier of the Ethernet device.
6308  * @param queue_id
6309  *   The index of the transmit queue through which output packets must be
6310  *   sent.
6311  *   The value must be in the range [0, nb_tx_queue - 1] previously supplied
6312  *   to rte_eth_dev_configure().
6313  * @param tx_pkts
6314  *   The address of an array of *nb_pkts* pointers to *rte_mbuf* structures
6315  *   which contain the output packets.
6316  * @param nb_pkts
6317  *   The maximum number of packets to transmit.
6318  * @return
6319  *   The number of output packets actually stored in transmit descriptors of
6320  *   the transmit ring. The return value can be less than the value of the
6321  *   *tx_pkts* parameter when the transmit ring is full or has been filled up.
6322  */
6323 static inline uint16_t
6324 rte_eth_tx_burst(uint16_t port_id, uint16_t queue_id,
6325 		 struct rte_mbuf **tx_pkts, uint16_t nb_pkts)
6326 {
6327 	struct rte_eth_fp_ops *p;
6328 	void *qd;
6329 
6330 #ifdef RTE_ETHDEV_DEBUG_TX
6331 	if (port_id >= RTE_MAX_ETHPORTS ||
6332 			queue_id >= RTE_MAX_QUEUES_PER_PORT) {
6333 		RTE_ETHDEV_LOG(ERR,
6334 			"Invalid port_id=%u or queue_id=%u\n",
6335 			port_id, queue_id);
6336 		return 0;
6337 	}
6338 #endif
6339 
6340 	/* fetch pointer to queue data */
6341 	p = &rte_eth_fp_ops[port_id];
6342 	qd = p->txq.data[queue_id];
6343 
6344 #ifdef RTE_ETHDEV_DEBUG_TX
6345 	RTE_ETH_VALID_PORTID_OR_ERR_RET(port_id, 0);
6346 
6347 	if (qd == NULL) {
6348 		RTE_ETHDEV_LOG(ERR, "Invalid Tx queue_id=%u for port_id=%u\n",
6349 			queue_id, port_id);
6350 		return 0;
6351 	}
6352 #endif
6353 
6354 #ifdef RTE_ETHDEV_RXTX_CALLBACKS
6355 	{
6356 		void *cb;
6357 
6358 		/* __ATOMIC_RELEASE memory order was used when the
6359 		 * call back was inserted into the list.
6360 		 * Since there is a clear dependency between loading
6361 		 * cb and cb->fn/cb->next, __ATOMIC_ACQUIRE memory order is
6362 		 * not required.
6363 		 */
6364 		cb = __atomic_load_n((void **)&p->txq.clbk[queue_id],
6365 				__ATOMIC_RELAXED);
6366 		if (unlikely(cb != NULL))
6367 			nb_pkts = rte_eth_call_tx_callbacks(port_id, queue_id,
6368 					tx_pkts, nb_pkts, cb);
6369 	}
6370 #endif
6371 
6372 	nb_pkts = p->tx_pkt_burst(qd, tx_pkts, nb_pkts);
6373 
6374 	rte_ethdev_trace_tx_burst(port_id, queue_id, (void **)tx_pkts, nb_pkts);
6375 	return nb_pkts;
6376 }
6377 
6378 /**
6379  * Process a burst of output packets on a transmit queue of an Ethernet device.
6380  *
6381  * The rte_eth_tx_prepare() function is invoked to prepare output packets to be
6382  * transmitted on the output queue *queue_id* of the Ethernet device designated
6383  * by its *port_id*.
6384  * The *nb_pkts* parameter is the number of packets to be prepared which are
6385  * supplied in the *tx_pkts* array of *rte_mbuf* structures, each of them
6386  * allocated from a pool created with rte_pktmbuf_pool_create().
6387  * For each packet to send, the rte_eth_tx_prepare() function performs
6388  * the following operations:
6389  *
6390  * - Check if packet meets devices requirements for Tx offloads.
6391  *
6392  * - Check limitations about number of segments.
6393  *
6394  * - Check additional requirements when debug is enabled.
6395  *
6396  * - Update and/or reset required checksums when Tx offload is set for packet.
6397  *
6398  * Since this function can modify packet data, provided mbufs must be safely
6399  * writable (e.g. modified data cannot be in shared segment).
6400  *
6401  * The rte_eth_tx_prepare() function returns the number of packets ready to be
6402  * sent. A return value equal to *nb_pkts* means that all packets are valid and
6403  * ready to be sent, otherwise stops processing on the first invalid packet and
6404  * leaves the rest packets untouched.
6405  *
6406  * When this functionality is not implemented in the driver, all packets are
6407  * are returned untouched.
6408  *
6409  * @param port_id
6410  *   The port identifier of the Ethernet device.
6411  *   The value must be a valid port ID.
6412  * @param queue_id
6413  *   The index of the transmit queue through which output packets must be
6414  *   sent.
6415  *   The value must be in the range [0, nb_tx_queue - 1] previously supplied
6416  *   to rte_eth_dev_configure().
6417  * @param tx_pkts
6418  *   The address of an array of *nb_pkts* pointers to *rte_mbuf* structures
6419  *   which contain the output packets.
6420  * @param nb_pkts
6421  *   The maximum number of packets to process.
6422  * @return
6423  *   The number of packets correct and ready to be sent. The return value can be
6424  *   less than the value of the *tx_pkts* parameter when some packet doesn't
6425  *   meet devices requirements with rte_errno set appropriately:
6426  *   - EINVAL: offload flags are not correctly set
6427  *   - ENOTSUP: the offload feature is not supported by the hardware
6428  *   - ENODEV: if *port_id* is invalid (with debug enabled only)
6429  */
6430 
6431 #ifndef RTE_ETHDEV_TX_PREPARE_NOOP
6432 
6433 static inline uint16_t
6434 rte_eth_tx_prepare(uint16_t port_id, uint16_t queue_id,
6435 		struct rte_mbuf **tx_pkts, uint16_t nb_pkts)
6436 {
6437 	struct rte_eth_fp_ops *p;
6438 	void *qd;
6439 
6440 #ifdef RTE_ETHDEV_DEBUG_TX
6441 	if (port_id >= RTE_MAX_ETHPORTS ||
6442 			queue_id >= RTE_MAX_QUEUES_PER_PORT) {
6443 		RTE_ETHDEV_LOG(ERR,
6444 			"Invalid port_id=%u or queue_id=%u\n",
6445 			port_id, queue_id);
6446 		rte_errno = ENODEV;
6447 		return 0;
6448 	}
6449 #endif
6450 
6451 	/* fetch pointer to queue data */
6452 	p = &rte_eth_fp_ops[port_id];
6453 	qd = p->txq.data[queue_id];
6454 
6455 #ifdef RTE_ETHDEV_DEBUG_TX
6456 	if (!rte_eth_dev_is_valid_port(port_id)) {
6457 		RTE_ETHDEV_LOG(ERR, "Invalid Tx port_id=%u\n", port_id);
6458 		rte_errno = ENODEV;
6459 		return 0;
6460 	}
6461 	if (qd == NULL) {
6462 		RTE_ETHDEV_LOG(ERR, "Invalid Tx queue_id=%u for port_id=%u\n",
6463 			queue_id, port_id);
6464 		rte_errno = EINVAL;
6465 		return 0;
6466 	}
6467 #endif
6468 
6469 	if (!p->tx_pkt_prepare)
6470 		return nb_pkts;
6471 
6472 	return p->tx_pkt_prepare(qd, tx_pkts, nb_pkts);
6473 }
6474 
6475 #else
6476 
6477 /*
6478  * Native NOOP operation for compilation targets which doesn't require any
6479  * preparations steps, and functional NOOP may introduce unnecessary performance
6480  * drop.
6481  *
6482  * Generally this is not a good idea to turn it on globally and didn't should
6483  * be used if behavior of tx_preparation can change.
6484  */
6485 
6486 static inline uint16_t
6487 rte_eth_tx_prepare(__rte_unused uint16_t port_id,
6488 		__rte_unused uint16_t queue_id,
6489 		__rte_unused struct rte_mbuf **tx_pkts, uint16_t nb_pkts)
6490 {
6491 	return nb_pkts;
6492 }
6493 
6494 #endif
6495 
6496 /**
6497  * Send any packets queued up for transmission on a port and HW queue
6498  *
6499  * This causes an explicit flush of packets previously buffered via the
6500  * rte_eth_tx_buffer() function. It returns the number of packets successfully
6501  * sent to the NIC, and calls the error callback for any unsent packets. Unless
6502  * explicitly set up otherwise, the default callback simply frees the unsent
6503  * packets back to the owning mempool.
6504  *
6505  * @param port_id
6506  *   The port identifier of the Ethernet device.
6507  * @param queue_id
6508  *   The index of the transmit queue through which output packets must be
6509  *   sent.
6510  *   The value must be in the range [0, nb_tx_queue - 1] previously supplied
6511  *   to rte_eth_dev_configure().
6512  * @param buffer
6513  *   Buffer of packets to be transmit.
6514  * @return
6515  *   The number of packets successfully sent to the Ethernet device. The error
6516  *   callback is called for any packets which could not be sent.
6517  */
6518 static inline uint16_t
6519 rte_eth_tx_buffer_flush(uint16_t port_id, uint16_t queue_id,
6520 		struct rte_eth_dev_tx_buffer *buffer)
6521 {
6522 	uint16_t sent;
6523 	uint16_t to_send = buffer->length;
6524 
6525 	if (to_send == 0)
6526 		return 0;
6527 
6528 	sent = rte_eth_tx_burst(port_id, queue_id, buffer->pkts, to_send);
6529 
6530 	buffer->length = 0;
6531 
6532 	/* All packets sent, or to be dealt with by callback below */
6533 	if (unlikely(sent != to_send))
6534 		buffer->error_callback(&buffer->pkts[sent],
6535 				       (uint16_t)(to_send - sent),
6536 				       buffer->error_userdata);
6537 
6538 	return sent;
6539 }
6540 
6541 /**
6542  * Buffer a single packet for future transmission on a port and queue
6543  *
6544  * This function takes a single mbuf/packet and buffers it for later
6545  * transmission on the particular port and queue specified. Once the buffer is
6546  * full of packets, an attempt will be made to transmit all the buffered
6547  * packets. In case of error, where not all packets can be transmitted, a
6548  * callback is called with the unsent packets as a parameter. If no callback
6549  * is explicitly set up, the unsent packets are just freed back to the owning
6550  * mempool. The function returns the number of packets actually sent i.e.
6551  * 0 if no buffer flush occurred, otherwise the number of packets successfully
6552  * flushed
6553  *
6554  * @param port_id
6555  *   The port identifier of the Ethernet device.
6556  * @param queue_id
6557  *   The index of the transmit queue through which output packets must be
6558  *   sent.
6559  *   The value must be in the range [0, nb_tx_queue - 1] previously supplied
6560  *   to rte_eth_dev_configure().
6561  * @param buffer
6562  *   Buffer used to collect packets to be sent.
6563  * @param tx_pkt
6564  *   Pointer to the packet mbuf to be sent.
6565  * @return
6566  *   0 = packet has been buffered for later transmission
6567  *   N > 0 = packet has been buffered, and the buffer was subsequently flushed,
6568  *     causing N packets to be sent, and the error callback to be called for
6569  *     the rest.
6570  */
6571 static __rte_always_inline uint16_t
6572 rte_eth_tx_buffer(uint16_t port_id, uint16_t queue_id,
6573 		struct rte_eth_dev_tx_buffer *buffer, struct rte_mbuf *tx_pkt)
6574 {
6575 	buffer->pkts[buffer->length++] = tx_pkt;
6576 	if (buffer->length < buffer->size)
6577 		return 0;
6578 
6579 	return rte_eth_tx_buffer_flush(port_id, queue_id, buffer);
6580 }
6581 
6582 /**
6583  * @warning
6584  * @b EXPERIMENTAL: this API may change, or be removed, without prior notice
6585  *
6586  * Recycle used mbufs from a transmit queue of an Ethernet device, and move
6587  * these mbufs into a mbuf ring for a receive queue of an Ethernet device.
6588  * This can bypass mempool path to save CPU cycles.
6589  *
6590  * The rte_eth_recycle_mbufs() function loops, with rte_eth_rx_burst() and
6591  * rte_eth_tx_burst() functions, freeing Tx used mbufs and replenishing Rx
6592  * descriptors. The number of recycling mbufs depends on the request of Rx mbuf
6593  * ring, with the constraint of enough used mbufs from Tx mbuf ring.
6594  *
6595  * For each recycling mbufs, the rte_eth_recycle_mbufs() function performs the
6596  * following operations:
6597  *
6598  * - Copy used *rte_mbuf* buffer pointers from Tx mbuf ring into Rx mbuf ring.
6599  *
6600  * - Replenish the Rx descriptors with the recycling *rte_mbuf* mbufs freed
6601  *   from the Tx mbuf ring.
6602  *
6603  * This function spilts Rx and Tx path with different callback functions. The
6604  * callback function recycle_tx_mbufs_reuse is for Tx driver. The callback
6605  * function recycle_rx_descriptors_refill is for Rx driver. rte_eth_recycle_mbufs()
6606  * can support the case that Rx Ethernet device is different from Tx Ethernet device.
6607  *
6608  * It is the responsibility of users to select the Rx/Tx queue pair to recycle
6609  * mbufs. Before call this function, users must call rte_eth_recycle_rxq_info_get
6610  * function to retrieve selected Rx queue information.
6611  * @see rte_eth_recycle_rxq_info_get, struct rte_eth_recycle_rxq_info
6612  *
6613  * Currently, the rte_eth_recycle_mbufs() function can support to feed 1 Rx queue from
6614  * 2 Tx queues in the same thread. Do not pair the Rx queue and Tx queue in different
6615  * threads, in order to avoid memory error rewriting.
6616  *
6617  * @param rx_port_id
6618  *   Port identifying the receive side.
6619  * @param rx_queue_id
6620  *   The index of the receive queue identifying the receive side.
6621  *   The value must be in the range [0, nb_rx_queue - 1] previously supplied
6622  *   to rte_eth_dev_configure().
6623  * @param tx_port_id
6624  *   Port identifying the transmit side.
6625  * @param tx_queue_id
6626  *   The index of the transmit queue identifying the transmit side.
6627  *   The value must be in the range [0, nb_tx_queue - 1] previously supplied
6628  *   to rte_eth_dev_configure().
6629  * @param recycle_rxq_info
6630  *   A pointer to a structure of type *rte_eth_recycle_rxq_info* which contains
6631  *   the information of the Rx queue mbuf ring.
6632  * @return
6633  *   The number of recycling mbufs.
6634  */
6635 __rte_experimental
6636 static inline uint16_t
6637 rte_eth_recycle_mbufs(uint16_t rx_port_id, uint16_t rx_queue_id,
6638 		uint16_t tx_port_id, uint16_t tx_queue_id,
6639 		struct rte_eth_recycle_rxq_info *recycle_rxq_info)
6640 {
6641 	struct rte_eth_fp_ops *p1, *p2;
6642 	void *qd1, *qd2;
6643 	uint16_t nb_mbufs;
6644 
6645 #ifdef RTE_ETHDEV_DEBUG_TX
6646 	if (tx_port_id >= RTE_MAX_ETHPORTS ||
6647 			tx_queue_id >= RTE_MAX_QUEUES_PER_PORT) {
6648 		RTE_ETHDEV_LOG(ERR,
6649 				"Invalid tx_port_id=%u or tx_queue_id=%u\n",
6650 				tx_port_id, tx_queue_id);
6651 		return 0;
6652 	}
6653 #endif
6654 
6655 	/* fetch pointer to Tx queue data */
6656 	p1 = &rte_eth_fp_ops[tx_port_id];
6657 	qd1 = p1->txq.data[tx_queue_id];
6658 
6659 #ifdef RTE_ETHDEV_DEBUG_TX
6660 	RTE_ETH_VALID_PORTID_OR_ERR_RET(tx_port_id, 0);
6661 
6662 	if (qd1 == NULL) {
6663 		RTE_ETHDEV_LOG(ERR, "Invalid Tx queue_id=%u for port_id=%u\n",
6664 				tx_queue_id, tx_port_id);
6665 		return 0;
6666 	}
6667 #endif
6668 	if (p1->recycle_tx_mbufs_reuse == NULL)
6669 		return 0;
6670 
6671 #ifdef RTE_ETHDEV_DEBUG_RX
6672 	if (rx_port_id >= RTE_MAX_ETHPORTS ||
6673 			rx_queue_id >= RTE_MAX_QUEUES_PER_PORT) {
6674 		RTE_ETHDEV_LOG(ERR, "Invalid rx_port_id=%u or rx_queue_id=%u\n",
6675 				rx_port_id, rx_queue_id);
6676 		return 0;
6677 	}
6678 #endif
6679 
6680 	/* fetch pointer to Rx queue data */
6681 	p2 = &rte_eth_fp_ops[rx_port_id];
6682 	qd2 = p2->rxq.data[rx_queue_id];
6683 
6684 #ifdef RTE_ETHDEV_DEBUG_RX
6685 	RTE_ETH_VALID_PORTID_OR_ERR_RET(rx_port_id, 0);
6686 
6687 	if (qd2 == NULL) {
6688 		RTE_ETHDEV_LOG(ERR, "Invalid Rx queue_id=%u for port_id=%u\n",
6689 				rx_queue_id, rx_port_id);
6690 		return 0;
6691 	}
6692 #endif
6693 	if (p2->recycle_rx_descriptors_refill == NULL)
6694 		return 0;
6695 
6696 	/* Copy used *rte_mbuf* buffer pointers from Tx mbuf ring
6697 	 * into Rx mbuf ring.
6698 	 */
6699 	nb_mbufs = p1->recycle_tx_mbufs_reuse(qd1, recycle_rxq_info);
6700 
6701 	/* If no recycling mbufs, return 0. */
6702 	if (nb_mbufs == 0)
6703 		return 0;
6704 
6705 	/* Replenish the Rx descriptors with the recycling
6706 	 * into Rx mbuf ring.
6707 	 */
6708 	p2->recycle_rx_descriptors_refill(qd2, nb_mbufs);
6709 
6710 	return nb_mbufs;
6711 }
6712 
6713 /**
6714  * @warning
6715  * @b EXPERIMENTAL: this API may change without prior notice
6716  *
6717  * Get supported header protocols to split on Rx.
6718  *
6719  * When a packet type is announced to be split,
6720  * it *must* be supported by the PMD.
6721  * For instance, if eth-ipv4, eth-ipv4-udp is announced,
6722  * the PMD must return the following packet types for these packets:
6723  * - Ether/IPv4             -> RTE_PTYPE_L2_ETHER | RTE_PTYPE_L3_IPV4
6724  * - Ether/IPv4/UDP         -> RTE_PTYPE_L2_ETHER | RTE_PTYPE_L3_IPV4 | RTE_PTYPE_L4_UDP
6725  *
6726  * @param port_id
6727  *   The port identifier of the device.
6728  * @param[out] ptypes
6729  *   An array pointer to store supported protocol headers, allocated by caller.
6730  *   These ptypes are composed with RTE_PTYPE_*.
6731  * @param num
6732  *   Size of the array pointed by param ptypes.
6733  * @return
6734  *   - (>=0) Number of supported ptypes. If the number of types exceeds num,
6735  *           only num entries will be filled into the ptypes array,
6736  *           but the full count of supported ptypes will be returned.
6737  *   - (-ENOTSUP) if header protocol is not supported by device.
6738  *   - (-ENODEV) if *port_id* invalid.
6739  *   - (-EINVAL) if bad parameter.
6740  */
6741 __rte_experimental
6742 int rte_eth_buffer_split_get_supported_hdr_ptypes(uint16_t port_id, uint32_t *ptypes, int num);
6743 
6744 #ifdef __cplusplus
6745 }
6746 #endif
6747 
6748 #endif /* _RTE_ETHDEV_H_ */
6749