xref: /dpdk/drivers/net/mlx5/mlx5_trigger.c (revision e11bdd37745229bf26b557305c07d118c3dbaad7)
1 /* SPDX-License-Identifier: BSD-3-Clause
2  * Copyright 2015 6WIND S.A.
3  * Copyright 2015 Mellanox Technologies, Ltd
4  */
5 
6 #include <unistd.h>
7 
8 #include <rte_ether.h>
9 #include <rte_ethdev_driver.h>
10 #include <rte_interrupts.h>
11 #include <rte_alarm.h>
12 
13 #include "mlx5.h"
14 #include "mlx5_mr.h"
15 #include "mlx5_rxtx.h"
16 #include "mlx5_utils.h"
17 #include "rte_pmd_mlx5.h"
18 
19 /**
20  * Stop traffic on Tx queues.
21  *
22  * @param dev
23  *   Pointer to Ethernet device structure.
24  */
25 static void
26 mlx5_txq_stop(struct rte_eth_dev *dev)
27 {
28 	struct mlx5_priv *priv = dev->data->dev_private;
29 	unsigned int i;
30 
31 	for (i = 0; i != priv->txqs_n; ++i)
32 		mlx5_txq_release(dev, i);
33 }
34 
35 /**
36  * Start traffic on Tx queues.
37  *
38  * @param dev
39  *   Pointer to Ethernet device structure.
40  *
41  * @return
42  *   0 on success, a negative errno value otherwise and rte_errno is set.
43  */
44 static int
45 mlx5_txq_start(struct rte_eth_dev *dev)
46 {
47 	struct mlx5_priv *priv = dev->data->dev_private;
48 	unsigned int i;
49 	int ret;
50 
51 	for (i = 0; i != priv->txqs_n; ++i) {
52 		struct mlx5_txq_ctrl *txq_ctrl = mlx5_txq_get(dev, i);
53 
54 		if (!txq_ctrl)
55 			continue;
56 		if (txq_ctrl->type == MLX5_TXQ_TYPE_HAIRPIN) {
57 			txq_ctrl->obj = mlx5_txq_obj_new
58 				(dev, i, MLX5_TXQ_OBJ_TYPE_DEVX_HAIRPIN);
59 		} else {
60 			txq_alloc_elts(txq_ctrl);
61 			txq_ctrl->obj = mlx5_txq_obj_new
62 				(dev, i, MLX5_TXQ_OBJ_TYPE_IBV);
63 		}
64 		if (!txq_ctrl->obj) {
65 			rte_errno = ENOMEM;
66 			goto error;
67 		}
68 	}
69 	return 0;
70 error:
71 	ret = rte_errno; /* Save rte_errno before cleanup. */
72 	do {
73 		mlx5_txq_release(dev, i);
74 	} while (i-- != 0);
75 	rte_errno = ret; /* Restore rte_errno. */
76 	return -rte_errno;
77 }
78 
79 /**
80  * Stop traffic on Rx queues.
81  *
82  * @param dev
83  *   Pointer to Ethernet device structure.
84  */
85 static void
86 mlx5_rxq_stop(struct rte_eth_dev *dev)
87 {
88 	struct mlx5_priv *priv = dev->data->dev_private;
89 	unsigned int i;
90 
91 	for (i = 0; i != priv->rxqs_n; ++i)
92 		mlx5_rxq_release(dev, i);
93 }
94 
95 /**
96  * Start traffic on Rx queues.
97  *
98  * @param dev
99  *   Pointer to Ethernet device structure.
100  *
101  * @return
102  *   0 on success, a negative errno value otherwise and rte_errno is set.
103  */
104 static int
105 mlx5_rxq_start(struct rte_eth_dev *dev)
106 {
107 	struct mlx5_priv *priv = dev->data->dev_private;
108 	unsigned int i;
109 	int ret = 0;
110 	enum mlx5_rxq_obj_type obj_type = MLX5_RXQ_OBJ_TYPE_IBV;
111 	struct mlx5_rxq_data *rxq = NULL;
112 
113 	for (i = 0; i < priv->rxqs_n; ++i) {
114 		rxq = (*priv->rxqs)[i];
115 
116 		if (rxq && rxq->lro) {
117 			obj_type =  MLX5_RXQ_OBJ_TYPE_DEVX_RQ;
118 			break;
119 		}
120 	}
121 	/* Allocate/reuse/resize mempool for Multi-Packet RQ. */
122 	if (mlx5_mprq_alloc_mp(dev)) {
123 		/* Should not release Rx queues but return immediately. */
124 		return -rte_errno;
125 	}
126 	for (i = 0; i != priv->rxqs_n; ++i) {
127 		struct mlx5_rxq_ctrl *rxq_ctrl = mlx5_rxq_get(dev, i);
128 		struct rte_mempool *mp;
129 
130 		if (!rxq_ctrl)
131 			continue;
132 		if (rxq_ctrl->type == MLX5_RXQ_TYPE_HAIRPIN) {
133 			rxq_ctrl->obj = mlx5_rxq_obj_new
134 				(dev, i, MLX5_RXQ_OBJ_TYPE_DEVX_HAIRPIN);
135 			if (!rxq_ctrl->obj)
136 				goto error;
137 			continue;
138 		}
139 		/* Pre-register Rx mempool. */
140 		mp = mlx5_rxq_mprq_enabled(&rxq_ctrl->rxq) ?
141 		     rxq_ctrl->rxq.mprq_mp : rxq_ctrl->rxq.mp;
142 		DRV_LOG(DEBUG,
143 			"port %u Rx queue %u registering"
144 			" mp %s having %u chunks",
145 			dev->data->port_id, rxq_ctrl->rxq.idx,
146 			mp->name, mp->nb_mem_chunks);
147 		mlx5_mr_update_mp(dev, &rxq_ctrl->rxq.mr_ctrl, mp);
148 		ret = rxq_alloc_elts(rxq_ctrl);
149 		if (ret)
150 			goto error;
151 		rxq_ctrl->obj = mlx5_rxq_obj_new(dev, i, obj_type);
152 		if (!rxq_ctrl->obj)
153 			goto error;
154 		if (obj_type == MLX5_RXQ_OBJ_TYPE_IBV)
155 			rxq_ctrl->wqn = rxq_ctrl->obj->wq->wq_num;
156 		else if (obj_type == MLX5_RXQ_OBJ_TYPE_DEVX_RQ)
157 			rxq_ctrl->wqn = rxq_ctrl->obj->rq->id;
158 	}
159 	return 0;
160 error:
161 	ret = rte_errno; /* Save rte_errno before cleanup. */
162 	do {
163 		mlx5_rxq_release(dev, i);
164 	} while (i-- != 0);
165 	rte_errno = ret; /* Restore rte_errno. */
166 	return -rte_errno;
167 }
168 
169 /**
170  * Binds Tx queues to Rx queues for hairpin.
171  *
172  * Binds Tx queues to the target Rx queues.
173  *
174  * @param dev
175  *   Pointer to Ethernet device structure.
176  *
177  * @return
178  *   0 on success, a negative errno value otherwise and rte_errno is set.
179  */
180 static int
181 mlx5_hairpin_bind(struct rte_eth_dev *dev)
182 {
183 	struct mlx5_priv *priv = dev->data->dev_private;
184 	struct mlx5_devx_modify_sq_attr sq_attr = { 0 };
185 	struct mlx5_devx_modify_rq_attr rq_attr = { 0 };
186 	struct mlx5_txq_ctrl *txq_ctrl;
187 	struct mlx5_rxq_ctrl *rxq_ctrl;
188 	struct mlx5_devx_obj *sq;
189 	struct mlx5_devx_obj *rq;
190 	unsigned int i;
191 	int ret = 0;
192 
193 	for (i = 0; i != priv->txqs_n; ++i) {
194 		txq_ctrl = mlx5_txq_get(dev, i);
195 		if (!txq_ctrl)
196 			continue;
197 		if (txq_ctrl->type != MLX5_TXQ_TYPE_HAIRPIN) {
198 			mlx5_txq_release(dev, i);
199 			continue;
200 		}
201 		if (!txq_ctrl->obj) {
202 			rte_errno = ENOMEM;
203 			DRV_LOG(ERR, "port %u no txq object found: %d",
204 				dev->data->port_id, i);
205 			mlx5_txq_release(dev, i);
206 			return -rte_errno;
207 		}
208 		sq = txq_ctrl->obj->sq;
209 		rxq_ctrl = mlx5_rxq_get(dev,
210 					txq_ctrl->hairpin_conf.peers[0].queue);
211 		if (!rxq_ctrl) {
212 			mlx5_txq_release(dev, i);
213 			rte_errno = EINVAL;
214 			DRV_LOG(ERR, "port %u no rxq object found: %d",
215 				dev->data->port_id,
216 				txq_ctrl->hairpin_conf.peers[0].queue);
217 			return -rte_errno;
218 		}
219 		if (rxq_ctrl->type != MLX5_RXQ_TYPE_HAIRPIN ||
220 		    rxq_ctrl->hairpin_conf.peers[0].queue != i) {
221 			rte_errno = ENOMEM;
222 			DRV_LOG(ERR, "port %u Tx queue %d can't be binded to "
223 				"Rx queue %d", dev->data->port_id,
224 				i, txq_ctrl->hairpin_conf.peers[0].queue);
225 			goto error;
226 		}
227 		rq = rxq_ctrl->obj->rq;
228 		if (!rq) {
229 			rte_errno = ENOMEM;
230 			DRV_LOG(ERR, "port %u hairpin no matching rxq: %d",
231 				dev->data->port_id,
232 				txq_ctrl->hairpin_conf.peers[0].queue);
233 			goto error;
234 		}
235 		sq_attr.state = MLX5_SQC_STATE_RDY;
236 		sq_attr.sq_state = MLX5_SQC_STATE_RST;
237 		sq_attr.hairpin_peer_rq = rq->id;
238 		sq_attr.hairpin_peer_vhca = priv->config.hca_attr.vhca_id;
239 		ret = mlx5_devx_cmd_modify_sq(sq, &sq_attr);
240 		if (ret)
241 			goto error;
242 		rq_attr.state = MLX5_SQC_STATE_RDY;
243 		rq_attr.rq_state = MLX5_SQC_STATE_RST;
244 		rq_attr.hairpin_peer_sq = sq->id;
245 		rq_attr.hairpin_peer_vhca = priv->config.hca_attr.vhca_id;
246 		ret = mlx5_devx_cmd_modify_rq(rq, &rq_attr);
247 		if (ret)
248 			goto error;
249 		mlx5_txq_release(dev, i);
250 		mlx5_rxq_release(dev, txq_ctrl->hairpin_conf.peers[0].queue);
251 	}
252 	return 0;
253 error:
254 	mlx5_txq_release(dev, i);
255 	mlx5_rxq_release(dev, txq_ctrl->hairpin_conf.peers[0].queue);
256 	return -rte_errno;
257 }
258 
259 /**
260  * DPDK callback to start the device.
261  *
262  * Simulate device start by attaching all configured flows.
263  *
264  * @param dev
265  *   Pointer to Ethernet device structure.
266  *
267  * @return
268  *   0 on success, a negative errno value otherwise and rte_errno is set.
269  */
270 int
271 mlx5_dev_start(struct rte_eth_dev *dev)
272 {
273 	int ret;
274 	int fine_inline;
275 
276 	DRV_LOG(DEBUG, "port %u starting device", dev->data->port_id);
277 	fine_inline = rte_mbuf_dynflag_lookup
278 		(RTE_PMD_MLX5_FINE_GRANULARITY_INLINE, NULL);
279 	if (fine_inline > 0)
280 		rte_net_mlx5_dynf_inline_mask = 1UL << fine_inline;
281 	else
282 		rte_net_mlx5_dynf_inline_mask = 0;
283 	if (dev->data->nb_rx_queues > 0) {
284 		ret = mlx5_dev_configure_rss_reta(dev);
285 		if (ret) {
286 			DRV_LOG(ERR, "port %u reta config failed: %s",
287 				dev->data->port_id, strerror(rte_errno));
288 			return -rte_errno;
289 		}
290 	}
291 	ret = mlx5_txq_start(dev);
292 	if (ret) {
293 		DRV_LOG(ERR, "port %u Tx queue allocation failed: %s",
294 			dev->data->port_id, strerror(rte_errno));
295 		return -rte_errno;
296 	}
297 	ret = mlx5_rxq_start(dev);
298 	if (ret) {
299 		DRV_LOG(ERR, "port %u Rx queue allocation failed: %s",
300 			dev->data->port_id, strerror(rte_errno));
301 		mlx5_txq_stop(dev);
302 		return -rte_errno;
303 	}
304 	ret = mlx5_hairpin_bind(dev);
305 	if (ret) {
306 		DRV_LOG(ERR, "port %u hairpin binding failed: %s",
307 			dev->data->port_id, strerror(rte_errno));
308 		mlx5_txq_stop(dev);
309 		return -rte_errno;
310 	}
311 	/* Set started flag here for the following steps like control flow. */
312 	dev->data->dev_started = 1;
313 	ret = mlx5_rx_intr_vec_enable(dev);
314 	if (ret) {
315 		DRV_LOG(ERR, "port %u Rx interrupt vector creation failed",
316 			dev->data->port_id);
317 		goto error;
318 	}
319 	mlx5_stats_init(dev);
320 	ret = mlx5_traffic_enable(dev);
321 	if (ret) {
322 		DRV_LOG(ERR, "port %u failed to set defaults flows",
323 			dev->data->port_id);
324 		goto error;
325 	}
326 	/* Set a mask and offset of dynamic metadata flows into Rx queues*/
327 	mlx5_flow_rxq_dynf_metadata_set(dev);
328 	/*
329 	 * In non-cached mode, it only needs to start the default mreg copy
330 	 * action and no flow created by application exists anymore.
331 	 * But it is worth wrapping the interface for further usage.
332 	 */
333 	ret = mlx5_flow_start_default(dev);
334 	if (ret) {
335 		DRV_LOG(DEBUG, "port %u failed to start default actions: %s",
336 			dev->data->port_id, strerror(rte_errno));
337 		goto error;
338 	}
339 	rte_wmb();
340 	dev->tx_pkt_burst = mlx5_select_tx_function(dev);
341 	dev->rx_pkt_burst = mlx5_select_rx_function(dev);
342 	/* Enable datapath on secondary process. */
343 	mlx5_mp_req_start_rxtx(dev);
344 	mlx5_dev_interrupt_handler_install(dev);
345 	return 0;
346 error:
347 	ret = rte_errno; /* Save rte_errno before cleanup. */
348 	/* Rollback. */
349 	dev->data->dev_started = 0;
350 	mlx5_flow_stop_default(dev);
351 	mlx5_traffic_disable(dev);
352 	mlx5_txq_stop(dev);
353 	mlx5_rxq_stop(dev);
354 	rte_errno = ret; /* Restore rte_errno. */
355 	return -rte_errno;
356 }
357 
358 /**
359  * DPDK callback to stop the device.
360  *
361  * Simulate device stop by detaching all configured flows.
362  *
363  * @param dev
364  *   Pointer to Ethernet device structure.
365  */
366 void
367 mlx5_dev_stop(struct rte_eth_dev *dev)
368 {
369 	struct mlx5_priv *priv = dev->data->dev_private;
370 
371 	dev->data->dev_started = 0;
372 	/* Prevent crashes when queues are still in use. */
373 	dev->rx_pkt_burst = removed_rx_burst;
374 	dev->tx_pkt_burst = removed_tx_burst;
375 	rte_wmb();
376 	/* Disable datapath on secondary process. */
377 	mlx5_mp_req_stop_rxtx(dev);
378 	usleep(1000 * priv->rxqs_n);
379 	DRV_LOG(DEBUG, "port %u stopping device", dev->data->port_id);
380 	mlx5_flow_stop_default(dev);
381 	/* Control flows for default traffic can be removed firstly. */
382 	mlx5_traffic_disable(dev);
383 	/* All RX queue flags will be cleared in the flush interface. */
384 	mlx5_flow_list_flush(dev, &priv->flows, true);
385 	mlx5_rx_intr_vec_disable(dev);
386 	mlx5_dev_interrupt_handler_uninstall(dev);
387 	mlx5_txq_stop(dev);
388 	mlx5_rxq_stop(dev);
389 }
390 
391 /**
392  * Enable traffic flows configured by control plane
393  *
394  * @param dev
395  *   Pointer to Ethernet device private data.
396  * @param dev
397  *   Pointer to Ethernet device structure.
398  *
399  * @return
400  *   0 on success, a negative errno value otherwise and rte_errno is set.
401  */
402 int
403 mlx5_traffic_enable(struct rte_eth_dev *dev)
404 {
405 	struct mlx5_priv *priv = dev->data->dev_private;
406 	struct rte_flow_item_eth bcast = {
407 		.dst.addr_bytes = "\xff\xff\xff\xff\xff\xff",
408 	};
409 	struct rte_flow_item_eth ipv6_multi_spec = {
410 		.dst.addr_bytes = "\x33\x33\x00\x00\x00\x00",
411 	};
412 	struct rte_flow_item_eth ipv6_multi_mask = {
413 		.dst.addr_bytes = "\xff\xff\x00\x00\x00\x00",
414 	};
415 	struct rte_flow_item_eth unicast = {
416 		.src.addr_bytes = "\x00\x00\x00\x00\x00\x00",
417 	};
418 	struct rte_flow_item_eth unicast_mask = {
419 		.dst.addr_bytes = "\xff\xff\xff\xff\xff\xff",
420 	};
421 	const unsigned int vlan_filter_n = priv->vlan_filter_n;
422 	const struct rte_ether_addr cmp = {
423 		.addr_bytes = "\x00\x00\x00\x00\x00\x00",
424 	};
425 	unsigned int i;
426 	unsigned int j;
427 	int ret;
428 
429 	/*
430 	 * Hairpin txq default flow should be created no matter if it is
431 	 * isolation mode. Or else all the packets to be sent will be sent
432 	 * out directly without the TX flow actions, e.g. encapsulation.
433 	 */
434 	for (i = 0; i != priv->txqs_n; ++i) {
435 		struct mlx5_txq_ctrl *txq_ctrl = mlx5_txq_get(dev, i);
436 		if (!txq_ctrl)
437 			continue;
438 		if (txq_ctrl->type == MLX5_TXQ_TYPE_HAIRPIN) {
439 			ret = mlx5_ctrl_flow_source_queue(dev, i);
440 			if (ret) {
441 				mlx5_txq_release(dev, i);
442 				goto error;
443 			}
444 		}
445 		mlx5_txq_release(dev, i);
446 	}
447 	if (priv->config.dv_esw_en && !priv->config.vf) {
448 		if (mlx5_flow_create_esw_table_zero_flow(dev))
449 			priv->fdb_def_rule = 1;
450 		else
451 			DRV_LOG(INFO, "port %u FDB default rule cannot be"
452 				" configured - only Eswitch group 0 flows are"
453 				" supported.", dev->data->port_id);
454 	}
455 	if (priv->isolated)
456 		return 0;
457 	if (dev->data->promiscuous) {
458 		struct rte_flow_item_eth promisc = {
459 			.dst.addr_bytes = "\x00\x00\x00\x00\x00\x00",
460 			.src.addr_bytes = "\x00\x00\x00\x00\x00\x00",
461 			.type = 0,
462 		};
463 
464 		ret = mlx5_ctrl_flow(dev, &promisc, &promisc);
465 		if (ret)
466 			goto error;
467 	}
468 	if (dev->data->all_multicast) {
469 		struct rte_flow_item_eth multicast = {
470 			.dst.addr_bytes = "\x01\x00\x00\x00\x00\x00",
471 			.src.addr_bytes = "\x00\x00\x00\x00\x00\x00",
472 			.type = 0,
473 		};
474 
475 		ret = mlx5_ctrl_flow(dev, &multicast, &multicast);
476 		if (ret)
477 			goto error;
478 	} else {
479 		/* Add broadcast/multicast flows. */
480 		for (i = 0; i != vlan_filter_n; ++i) {
481 			uint16_t vlan = priv->vlan_filter[i];
482 
483 			struct rte_flow_item_vlan vlan_spec = {
484 				.tci = rte_cpu_to_be_16(vlan),
485 			};
486 			struct rte_flow_item_vlan vlan_mask =
487 				rte_flow_item_vlan_mask;
488 
489 			ret = mlx5_ctrl_flow_vlan(dev, &bcast, &bcast,
490 						  &vlan_spec, &vlan_mask);
491 			if (ret)
492 				goto error;
493 			ret = mlx5_ctrl_flow_vlan(dev, &ipv6_multi_spec,
494 						  &ipv6_multi_mask,
495 						  &vlan_spec, &vlan_mask);
496 			if (ret)
497 				goto error;
498 		}
499 		if (!vlan_filter_n) {
500 			ret = mlx5_ctrl_flow(dev, &bcast, &bcast);
501 			if (ret)
502 				goto error;
503 			ret = mlx5_ctrl_flow(dev, &ipv6_multi_spec,
504 					     &ipv6_multi_mask);
505 			if (ret)
506 				goto error;
507 		}
508 	}
509 	/* Add MAC address flows. */
510 	for (i = 0; i != MLX5_MAX_MAC_ADDRESSES; ++i) {
511 		struct rte_ether_addr *mac = &dev->data->mac_addrs[i];
512 
513 		if (!memcmp(mac, &cmp, sizeof(*mac)))
514 			continue;
515 		memcpy(&unicast.dst.addr_bytes,
516 		       mac->addr_bytes,
517 		       RTE_ETHER_ADDR_LEN);
518 		for (j = 0; j != vlan_filter_n; ++j) {
519 			uint16_t vlan = priv->vlan_filter[j];
520 
521 			struct rte_flow_item_vlan vlan_spec = {
522 				.tci = rte_cpu_to_be_16(vlan),
523 			};
524 			struct rte_flow_item_vlan vlan_mask =
525 				rte_flow_item_vlan_mask;
526 
527 			ret = mlx5_ctrl_flow_vlan(dev, &unicast,
528 						  &unicast_mask,
529 						  &vlan_spec,
530 						  &vlan_mask);
531 			if (ret)
532 				goto error;
533 		}
534 		if (!vlan_filter_n) {
535 			ret = mlx5_ctrl_flow(dev, &unicast, &unicast_mask);
536 			if (ret)
537 				goto error;
538 		}
539 	}
540 	return 0;
541 error:
542 	ret = rte_errno; /* Save rte_errno before cleanup. */
543 	mlx5_flow_list_flush(dev, &priv->ctrl_flows, false);
544 	rte_errno = ret; /* Restore rte_errno. */
545 	return -rte_errno;
546 }
547 
548 
549 /**
550  * Disable traffic flows configured by control plane
551  *
552  * @param dev
553  *   Pointer to Ethernet device private data.
554  */
555 void
556 mlx5_traffic_disable(struct rte_eth_dev *dev)
557 {
558 	struct mlx5_priv *priv = dev->data->dev_private;
559 
560 	mlx5_flow_list_flush(dev, &priv->ctrl_flows, false);
561 }
562 
563 /**
564  * Restart traffic flows configured by control plane
565  *
566  * @param dev
567  *   Pointer to Ethernet device private data.
568  *
569  * @return
570  *   0 on success, a negative errno value otherwise and rte_errno is set.
571  */
572 int
573 mlx5_traffic_restart(struct rte_eth_dev *dev)
574 {
575 	if (dev->data->dev_started) {
576 		mlx5_traffic_disable(dev);
577 		return mlx5_traffic_enable(dev);
578 	}
579 	return 0;
580 }
581