xref: /dpdk/drivers/event/octeontx/ssovf_worker.c (revision cf55f04a0c99fc8571afbb7a1a3133af9d33c0e1)
1 /* SPDX-License-Identifier: BSD-3-Clause
2  * Copyright(c) 2017 Cavium, Inc
3  */
4 
5 #include "ssovf_worker.h"
6 
7 static __rte_always_inline void
8 ssows_new_event(struct ssows *ws, const struct rte_event *ev)
9 {
10 	const uint64_t event_ptr = ev->u64;
11 	const uint32_t tag = (uint32_t)ev->event;
12 	const uint8_t new_tt = ev->sched_type;
13 	const uint8_t grp = ev->queue_id;
14 
15 	ssows_add_work(ws, event_ptr, tag, new_tt, grp);
16 }
17 
18 static __rte_always_inline void
19 ssows_fwd_swtag(struct ssows *ws, const struct rte_event *ev, const uint8_t grp)
20 {
21 	const uint8_t cur_tt = ws->cur_tt;
22 	const uint8_t new_tt = ev->sched_type;
23 	const uint32_t tag = (uint32_t)ev->event;
24 	/*
25 	 * cur_tt/new_tt     SSO_SYNC_ORDERED SSO_SYNC_ATOMIC SSO_SYNC_UNTAGGED
26 	 *
27 	 * SSO_SYNC_ORDERED        norm           norm             untag
28 	 * SSO_SYNC_ATOMIC         norm           norm		   untag
29 	 * SSO_SYNC_UNTAGGED       full           full             NOOP
30 	 */
31 	if (unlikely(cur_tt == SSO_SYNC_UNTAGGED)) {
32 		if (new_tt != SSO_SYNC_UNTAGGED) {
33 			ssows_swtag_full(ws, ev->u64, tag,
34 				new_tt, grp);
35 		}
36 	} else {
37 		if (likely(new_tt != SSO_SYNC_UNTAGGED))
38 			ssows_swtag_norm(ws, tag, new_tt);
39 		else
40 			ssows_swtag_untag(ws);
41 	}
42 	ws->swtag_req = 1;
43 }
44 
45 #define OCT_EVENT_TYPE_GRP_FWD (RTE_EVENT_TYPE_MAX - 1)
46 
47 static __rte_always_inline void
48 ssows_fwd_group(struct ssows *ws, const struct rte_event *ev, const uint8_t grp)
49 {
50 	const uint64_t event_ptr = ev->u64;
51 	const uint32_t tag = (uint32_t)ev->event;
52 	const uint8_t cur_tt = ws->cur_tt;
53 	const uint8_t new_tt = ev->sched_type;
54 
55 	if (cur_tt == SSO_SYNC_ORDERED) {
56 		/* Create unique tag based on custom event type and new grp */
57 		uint32_t newtag = OCT_EVENT_TYPE_GRP_FWD << 28;
58 
59 		newtag |= grp << 20;
60 		newtag |= tag;
61 		ssows_swtag_norm(ws, newtag, SSO_SYNC_ATOMIC);
62 		rte_smp_wmb();
63 		ssows_swtag_wait(ws);
64 	} else {
65 		rte_smp_wmb();
66 	}
67 	ssows_add_work(ws, event_ptr, tag, new_tt, grp);
68 }
69 
70 static __rte_always_inline void
71 ssows_forward_event(struct ssows *ws, const struct rte_event *ev)
72 {
73 	const uint8_t grp = ev->queue_id;
74 
75 	/* Group hasn't changed, Use SWTAG to forward the event */
76 	if (ws->cur_grp == grp)
77 		ssows_fwd_swtag(ws, ev, grp);
78 	else
79 	/*
80 	 * Group has been changed for group based work pipelining,
81 	 * Use deschedule/add_work operation to transfer the event to
82 	 * new group/core
83 	 */
84 		ssows_fwd_group(ws, ev, grp);
85 }
86 
87 static __rte_always_inline void
88 ssows_release_event(struct ssows *ws)
89 {
90 	if (likely(ws->cur_tt != SSO_SYNC_UNTAGGED))
91 		ssows_swtag_untag(ws);
92 }
93 
94 #define R(name, f2, f1, f0, flags)					     \
95 static uint16_t __rte_noinline	__rte_hot				     \
96 ssows_deq_ ##name(void *port, struct rte_event *ev, uint64_t timeout_ticks)  \
97 {									     \
98 	struct ssows *ws = port;					     \
99 									     \
100 	RTE_SET_USED(timeout_ticks);					     \
101 									     \
102 	if (ws->swtag_req) {						     \
103 		ws->swtag_req = 0;					     \
104 		ssows_swtag_wait(ws);					     \
105 		return 1;						     \
106 	} else {							     \
107 		return ssows_get_work(ws, ev, flags);		             \
108 	}								     \
109 }									     \
110 									     \
111 static uint16_t __rte_hot						     \
112 ssows_deq_burst_ ##name(void *port, struct rte_event ev[],		     \
113 			 uint16_t nb_events, uint64_t timeout_ticks)	     \
114 {									     \
115 	RTE_SET_USED(nb_events);					     \
116 									     \
117 	return ssows_deq_ ##name(port, ev, timeout_ticks);		     \
118 }									     \
119 									     \
120 static uint16_t __rte_hot						     \
121 ssows_deq_timeout_ ##name(void *port, struct rte_event *ev,		     \
122 			  uint64_t timeout_ticks)			     \
123 {									     \
124 	struct ssows *ws = port;					     \
125 	uint64_t iter;							     \
126 	uint16_t ret = 1;						     \
127 									     \
128 	if (ws->swtag_req) {						     \
129 		ws->swtag_req = 0;					     \
130 		ssows_swtag_wait(ws);					     \
131 	} else {							     \
132 		ret = ssows_get_work(ws, ev, flags);			     \
133 		for (iter = 1; iter < timeout_ticks && (ret == 0); iter++)   \
134 			ret = ssows_get_work(ws, ev, flags);		     \
135 	}								     \
136 	return ret;							     \
137 }									     \
138 									     \
139 static uint16_t __rte_hot						     \
140 ssows_deq_timeout_burst_ ##name(void *port, struct rte_event ev[],	     \
141 				uint16_t nb_events, uint64_t timeout_ticks)  \
142 {									     \
143 	RTE_SET_USED(nb_events);					     \
144 									     \
145 	return ssows_deq_timeout_ ##name(port, ev, timeout_ticks);	     \
146 }
147 
148 SSO_RX_ADPTR_ENQ_FASTPATH_FUNC
149 #undef R
150 
151 __rte_always_inline uint16_t __rte_hot
152 ssows_enq(void *port, const struct rte_event *ev)
153 {
154 	struct ssows *ws = port;
155 	uint16_t ret = 1;
156 
157 	switch (ev->op) {
158 	case RTE_EVENT_OP_NEW:
159 		rte_smp_wmb();
160 		ssows_new_event(ws, ev);
161 		break;
162 	case RTE_EVENT_OP_FORWARD:
163 		ssows_forward_event(ws, ev);
164 		break;
165 	case RTE_EVENT_OP_RELEASE:
166 		ssows_release_event(ws);
167 		break;
168 	default:
169 		ret = 0;
170 	}
171 	return ret;
172 }
173 
174 uint16_t __rte_hot
175 ssows_enq_burst(void *port, const struct rte_event ev[], uint16_t nb_events)
176 {
177 	RTE_SET_USED(nb_events);
178 	return ssows_enq(port, ev);
179 }
180 
181 uint16_t __rte_hot
182 ssows_enq_new_burst(void *port, const struct rte_event ev[], uint16_t nb_events)
183 {
184 	uint16_t i;
185 	struct ssows *ws = port;
186 
187 	rte_smp_wmb();
188 	for (i = 0; i < nb_events; i++)
189 		ssows_new_event(ws,  &ev[i]);
190 
191 	return nb_events;
192 }
193 
194 uint16_t __rte_hot
195 ssows_enq_fwd_burst(void *port, const struct rte_event ev[], uint16_t nb_events)
196 {
197 	struct ssows *ws = port;
198 	RTE_SET_USED(nb_events);
199 
200 	ssows_forward_event(ws,  ev);
201 
202 	return 1;
203 }
204 
205 void
206 ssows_flush_events(struct ssows *ws, uint8_t queue_id,
207 				ssows_handle_event_t fn, void *arg)
208 {
209 	uint32_t reg_off;
210 	struct rte_event ev;
211 	uint64_t enable, aq_cnt = 1, cq_ds_cnt = 1;
212 	uint64_t get_work0, get_work1;
213 	uint64_t sched_type_queue;
214 	uint8_t *base = ssovf_bar(OCTEONTX_SSO_GROUP, queue_id, 0);
215 
216 	enable = ssovf_read64(base + SSO_VHGRP_QCTL);
217 	if (!enable)
218 		return;
219 
220 	reg_off = SSOW_VHWS_OP_GET_WORK0;
221 	reg_off |= 1 << 17; /* Grouped */
222 	reg_off |= 1 << 16; /* WAIT */
223 	reg_off |= queue_id << 4; /* INDEX_GGRP_MASK(group number) */
224 	while (aq_cnt || cq_ds_cnt) {
225 		aq_cnt = ssovf_read64(base + SSO_VHGRP_AQ_CNT);
226 		cq_ds_cnt = ssovf_read64(base + SSO_VHGRP_INT_CNT);
227 		/* Extract cq and ds count */
228 		cq_ds_cnt &= 0x1FFF1FFF0000;
229 
230 		ssovf_load_pair(get_work0, get_work1, ws->base + reg_off);
231 
232 		sched_type_queue = (get_work0 >> 32) & 0xfff;
233 		ws->cur_tt = sched_type_queue & 0x3;
234 		ws->cur_grp = sched_type_queue >> 2;
235 		sched_type_queue = sched_type_queue << 38;
236 		ev.event = sched_type_queue | (get_work0 & 0xffffffff);
237 		if (get_work1 && ev.event_type == RTE_EVENT_TYPE_ETHDEV)
238 			ev.mbuf = ssovf_octeontx_wqe_to_pkt(get_work1,
239 					(ev.event >> 20) & 0x7F,
240 					OCCTX_RX_OFFLOAD_NONE |
241 					OCCTX_RX_MULTI_SEG_F,
242 					ws->lookup_mem);
243 		else
244 			ev.u64 = get_work1;
245 
246 		if (fn != NULL && ev.u64 != 0)
247 			fn(arg, ev);
248 	}
249 }
250 
251 void
252 ssows_reset(struct ssows *ws)
253 {
254 	uint64_t tag;
255 	uint64_t pend_tag;
256 	uint8_t pend_tt;
257 	uint8_t tt;
258 
259 	tag = ssovf_read64(ws->base + SSOW_VHWS_TAG);
260 	pend_tag = ssovf_read64(ws->base + SSOW_VHWS_PENDTAG);
261 
262 	if (pend_tag & (1ULL << 63)) { /* Tagswitch pending */
263 		pend_tt = (pend_tag >> 32) & 0x3;
264 		if (pend_tt == SSO_SYNC_ORDERED || pend_tt == SSO_SYNC_ATOMIC)
265 			ssows_desched(ws);
266 	} else {
267 		tt = (tag >> 32) & 0x3;
268 		if (tt == SSO_SYNC_ORDERED || tt == SSO_SYNC_ATOMIC)
269 			ssows_swtag_untag(ws);
270 	}
271 }
272 
273 static __rte_always_inline uint16_t
274 __sso_event_tx_adapter_enqueue(void *port, struct rte_event ev[],
275 			       uint16_t nb_events, uint64_t *cmd,
276 			       const uint16_t flag)
277 {
278 	uint16_t port_id;
279 	uint16_t queue_id;
280 	struct rte_mbuf *m;
281 	struct rte_eth_dev *ethdev;
282 	struct ssows *ws = port;
283 	struct octeontx_txq *txq;
284 
285 	switch (ev->sched_type) {
286 	case SSO_SYNC_ORDERED:
287 		ssows_swtag_norm(ws, ev->event, SSO_SYNC_ATOMIC);
288 		rte_cio_wmb();
289 		ssows_swtag_wait(ws);
290 		break;
291 	case SSO_SYNC_UNTAGGED:
292 		ssows_swtag_full(ws, ev->u64, ev->event, SSO_SYNC_ATOMIC,
293 				ev->queue_id);
294 		rte_cio_wmb();
295 		ssows_swtag_wait(ws);
296 		break;
297 	case SSO_SYNC_ATOMIC:
298 		rte_cio_wmb();
299 		break;
300 	}
301 
302 	m = ev[0].mbuf;
303 	port_id = m->port;
304 	queue_id = rte_event_eth_tx_adapter_txq_get(m);
305 	ethdev = &rte_eth_devices[port_id];
306 	txq = ethdev->data->tx_queues[queue_id];
307 
308 	return __octeontx_xmit_pkts(txq, &m, nb_events, cmd, flag);
309 }
310 
311 #define T(name, f3, f2, f1, f0, sz, flags)				     \
312 static uint16_t __rte_noinline	__rte_hot				     \
313 sso_event_tx_adapter_enqueue_ ## name(void *port, struct rte_event ev[],     \
314 				  uint16_t nb_events)			     \
315 {									     \
316 	uint64_t cmd[sz];						     \
317 	return __sso_event_tx_adapter_enqueue(port, ev, nb_events, cmd,	     \
318 					      flags);			     \
319 }
320 
321 SSO_TX_ADPTR_ENQ_FASTPATH_FUNC
322 #undef T
323 
324 void
325 ssovf_fastpath_fns_set(struct rte_eventdev *dev)
326 {
327 	struct ssovf_evdev *edev = ssovf_pmd_priv(dev);
328 
329 	dev->enqueue       = ssows_enq;
330 	dev->enqueue_burst = ssows_enq_burst;
331 	dev->enqueue_new_burst = ssows_enq_new_burst;
332 	dev->enqueue_forward_burst = ssows_enq_fwd_burst;
333 
334 	const event_tx_adapter_enqueue ssow_txa_enqueue[2][2][2][2] = {
335 #define T(name, f3, f2, f1, f0, sz, flags)				\
336 	[f3][f2][f1][f0] =  sso_event_tx_adapter_enqueue_ ##name,
337 
338 SSO_TX_ADPTR_ENQ_FASTPATH_FUNC
339 #undef T
340 	};
341 
342 	dev->txa_enqueue = ssow_txa_enqueue
343 		[!!(edev->tx_offload_flags & OCCTX_TX_OFFLOAD_MBUF_NOFF_F)]
344 		[!!(edev->tx_offload_flags & OCCTX_TX_OFFLOAD_OL3_OL4_CSUM_F)]
345 		[!!(edev->tx_offload_flags & OCCTX_TX_OFFLOAD_L3_L4_CSUM_F)]
346 		[!!(edev->tx_offload_flags & OCCTX_TX_MULTI_SEG_F)];
347 
348 	dev->txa_enqueue_same_dest = dev->txa_enqueue;
349 
350 	/* Assigning dequeue func pointers */
351 	const event_dequeue_t ssow_deq[2][2][2] = {
352 #define R(name, f2, f1, f0, flags)					\
353 	[f2][f1][f0] =  ssows_deq_ ##name,
354 
355 SSO_RX_ADPTR_ENQ_FASTPATH_FUNC
356 #undef R
357 	};
358 
359 	dev->dequeue = ssow_deq
360 		[!!(edev->rx_offload_flags & OCCTX_RX_VLAN_FLTR_F)]
361 		[!!(edev->rx_offload_flags & OCCTX_RX_OFFLOAD_CSUM_F)]
362 		[!!(edev->rx_offload_flags & OCCTX_RX_MULTI_SEG_F)];
363 
364 	const event_dequeue_burst_t ssow_deq_burst[2][2][2] = {
365 #define R(name, f2, f1, f0, flags)					\
366 	[f2][f1][f0] =  ssows_deq_burst_ ##name,
367 
368 SSO_RX_ADPTR_ENQ_FASTPATH_FUNC
369 #undef R
370 	};
371 
372 	dev->dequeue_burst = ssow_deq_burst
373 		[!!(edev->rx_offload_flags & OCCTX_RX_VLAN_FLTR_F)]
374 		[!!(edev->rx_offload_flags & OCCTX_RX_OFFLOAD_CSUM_F)]
375 		[!!(edev->rx_offload_flags & OCCTX_RX_MULTI_SEG_F)];
376 
377 	if (edev->is_timeout_deq) {
378 		const event_dequeue_t ssow_deq_timeout[2][2][2] = {
379 #define R(name, f2, f1, f0, flags)					\
380 	[f2][f1][f0] =  ssows_deq_timeout_ ##name,
381 
382 SSO_RX_ADPTR_ENQ_FASTPATH_FUNC
383 #undef R
384 		};
385 
386 	dev->dequeue = ssow_deq_timeout
387 		[!!(edev->rx_offload_flags & OCCTX_RX_VLAN_FLTR_F)]
388 		[!!(edev->rx_offload_flags & OCCTX_RX_OFFLOAD_CSUM_F)]
389 		[!!(edev->rx_offload_flags & OCCTX_RX_MULTI_SEG_F)];
390 
391 	const event_dequeue_burst_t ssow_deq_timeout_burst[2][2][2] = {
392 #define R(name, f2, f1, f0, flags)					\
393 	[f2][f1][f0] =  ssows_deq_timeout_burst_ ##name,
394 
395 SSO_RX_ADPTR_ENQ_FASTPATH_FUNC
396 #undef R
397 		};
398 
399 	dev->dequeue_burst = ssow_deq_timeout_burst
400 		[!!(edev->rx_offload_flags & OCCTX_RX_VLAN_FLTR_F)]
401 		[!!(edev->rx_offload_flags & OCCTX_RX_OFFLOAD_CSUM_F)]
402 		[!!(edev->rx_offload_flags & OCCTX_RX_MULTI_SEG_F)];
403 	}
404 }
405 
406 static void
407 octeontx_create_rx_ol_flags_array(void *mem)
408 {
409 	uint16_t idx, errcode, errlev;
410 	uint32_t val, *ol_flags;
411 
412 	/* Skip ptype array memory */
413 	ol_flags = (uint32_t *)mem;
414 
415 	for (idx = 0; idx < BIT(ERRCODE_ERRLEN_WIDTH); idx++) {
416 		errcode = idx & 0xff;
417 		errlev = (idx & 0x700) >> 8;
418 
419 		val = PKT_RX_IP_CKSUM_UNKNOWN;
420 		val |= PKT_RX_L4_CKSUM_UNKNOWN;
421 		val |= PKT_RX_OUTER_L4_CKSUM_UNKNOWN;
422 
423 		switch (errlev) {
424 		case OCCTX_ERRLEV_RE:
425 			if (errcode) {
426 				val |= PKT_RX_IP_CKSUM_BAD;
427 				val |= PKT_RX_L4_CKSUM_BAD;
428 			} else {
429 				val |= PKT_RX_IP_CKSUM_GOOD;
430 				val |= PKT_RX_L4_CKSUM_GOOD;
431 			}
432 			break;
433 		case OCCTX_ERRLEV_LC:
434 			if (errcode == OCCTX_EC_IP4_CSUM) {
435 				val |= PKT_RX_IP_CKSUM_BAD;
436 				val |= PKT_RX_EIP_CKSUM_BAD;
437 			} else {
438 				val |= PKT_RX_IP_CKSUM_GOOD;
439 			}
440 			break;
441 		case OCCTX_ERRLEV_LD:
442 			/* Check if parsed packet is neither IPv4 or IPV6 */
443 			if (errcode == OCCTX_EC_IP4_NOT)
444 				break;
445 			val |= PKT_RX_IP_CKSUM_GOOD;
446 			if (errcode == OCCTX_EC_L4_CSUM)
447 				val |= PKT_RX_OUTER_L4_CKSUM_BAD;
448 			else
449 				val |= PKT_RX_L4_CKSUM_GOOD;
450 			break;
451 		case OCCTX_ERRLEV_LE:
452 			if (errcode == OCCTX_EC_IP4_CSUM)
453 				val |= PKT_RX_IP_CKSUM_BAD;
454 			else
455 				val |= PKT_RX_IP_CKSUM_GOOD;
456 			break;
457 		case OCCTX_ERRLEV_LF:
458 			/* Check if parsed packet is neither IPv4 or IPV6 */
459 			if (errcode == OCCTX_EC_IP4_NOT)
460 				break;
461 			val |= PKT_RX_IP_CKSUM_GOOD;
462 			if (errcode == OCCTX_EC_L4_CSUM)
463 				val |= PKT_RX_L4_CKSUM_BAD;
464 			else
465 				val |= PKT_RX_L4_CKSUM_GOOD;
466 			break;
467 		}
468 
469 		ol_flags[idx] = val;
470 	}
471 }
472 
473 void *
474 octeontx_fastpath_lookup_mem_get(void)
475 {
476 	const char name[] = OCCTX_FASTPATH_LOOKUP_MEM;
477 	const struct rte_memzone *mz;
478 	void *mem;
479 
480 	mz = rte_memzone_lookup(name);
481 	if (mz != NULL)
482 		return mz->addr;
483 
484 	/* Request for the first time */
485 	mz = rte_memzone_reserve_aligned(name, LOOKUP_ARRAY_SZ,
486 					 SOCKET_ID_ANY, 0, OCCTX_ALIGN);
487 	if (mz != NULL) {
488 		mem = mz->addr;
489 		/* Form the rx ol_flags based on errcode */
490 		octeontx_create_rx_ol_flags_array(mem);
491 		return mem;
492 	}
493 	return NULL;
494 }
495