1 /* SPDX-License-Identifier: BSD-3-Clause 2 * 3 * Copyright 2016 Freescale Semiconductor, Inc. All rights reserved. 4 * Copyright 2017 NXP 5 * 6 */ 7 8 /* System headers */ 9 #include <inttypes.h> 10 #include <unistd.h> 11 #include <stdio.h> 12 #include <limits.h> 13 #include <sched.h> 14 #include <pthread.h> 15 16 #include <rte_byteorder.h> 17 #include <rte_common.h> 18 #include <rte_interrupts.h> 19 #include <rte_log.h> 20 #include <rte_debug.h> 21 #include <rte_pci.h> 22 #include <rte_atomic.h> 23 #include <rte_branch_prediction.h> 24 #include <rte_memory.h> 25 #include <rte_tailq.h> 26 #include <rte_eal.h> 27 #include <rte_alarm.h> 28 #include <rte_ether.h> 29 #include <rte_ethdev_driver.h> 30 #include <rte_malloc.h> 31 #include <rte_ring.h> 32 #include <rte_ip.h> 33 #include <rte_tcp.h> 34 #include <rte_udp.h> 35 #include <rte_net.h> 36 #include <rte_eventdev.h> 37 38 #include "dpaa_ethdev.h" 39 #include "dpaa_rxtx.h" 40 #include <rte_dpaa_bus.h> 41 #include <dpaa_mempool.h> 42 43 #include <qman.h> 44 #include <fsl_usd.h> 45 #include <fsl_qman.h> 46 #include <fsl_bman.h> 47 #include <of.h> 48 #include <netcfg.h> 49 50 #define DPAA_MBUF_TO_CONTIG_FD(_mbuf, _fd, _bpid) \ 51 do { \ 52 (_fd)->cmd = 0; \ 53 (_fd)->opaque_addr = 0; \ 54 (_fd)->opaque = QM_FD_CONTIG << DPAA_FD_FORMAT_SHIFT; \ 55 (_fd)->opaque |= ((_mbuf)->data_off) << DPAA_FD_OFFSET_SHIFT; \ 56 (_fd)->opaque |= (_mbuf)->pkt_len; \ 57 (_fd)->addr = (_mbuf)->buf_iova; \ 58 (_fd)->bpid = _bpid; \ 59 } while (0) 60 61 #if (defined RTE_LIBRTE_DPAA_DEBUG_DRIVER) 62 static void dpaa_display_frame(const struct qm_fd *fd) 63 { 64 int ii; 65 char *ptr; 66 67 printf("%s::bpid %x addr %08x%08x, format %d off %d, len %d stat %x\n", 68 __func__, fd->bpid, fd->addr_hi, fd->addr_lo, fd->format, 69 fd->offset, fd->length20, fd->status); 70 71 ptr = (char *)rte_dpaa_mem_ptov(fd->addr); 72 ptr += fd->offset; 73 printf("%02x ", *ptr); 74 for (ii = 1; ii < fd->length20; ii++) { 75 printf("%02x ", *ptr); 76 if ((ii % 16) == 0) 77 printf("\n"); 78 ptr++; 79 } 80 printf("\n"); 81 } 82 #else 83 #define dpaa_display_frame(a) 84 #endif 85 86 static inline void dpaa_slow_parsing(struct rte_mbuf *m __rte_unused, 87 uint64_t prs __rte_unused) 88 { 89 DPAA_DP_LOG(DEBUG, "Slow parsing"); 90 /*TBD:XXX: to be implemented*/ 91 } 92 93 static inline void dpaa_eth_packet_info(struct rte_mbuf *m, void *fd_virt_addr) 94 { 95 struct annotations_t *annot = GET_ANNOTATIONS(fd_virt_addr); 96 uint64_t prs = *((uintptr_t *)(&annot->parse)) & DPAA_PARSE_MASK; 97 98 DPAA_DP_LOG(DEBUG, " Parsing mbuf: %p with annotations: %p", m, annot); 99 100 switch (prs) { 101 case DPAA_PKT_TYPE_IPV4: 102 m->packet_type = RTE_PTYPE_L2_ETHER | 103 RTE_PTYPE_L3_IPV4; 104 break; 105 case DPAA_PKT_TYPE_IPV6: 106 m->packet_type = RTE_PTYPE_L2_ETHER | 107 RTE_PTYPE_L3_IPV6; 108 break; 109 case DPAA_PKT_TYPE_ETHER: 110 m->packet_type = RTE_PTYPE_L2_ETHER; 111 break; 112 case DPAA_PKT_TYPE_IPV4_FRAG: 113 case DPAA_PKT_TYPE_IPV4_FRAG_UDP: 114 case DPAA_PKT_TYPE_IPV4_FRAG_TCP: 115 case DPAA_PKT_TYPE_IPV4_FRAG_SCTP: 116 m->packet_type = RTE_PTYPE_L2_ETHER | 117 RTE_PTYPE_L3_IPV4 | RTE_PTYPE_L4_FRAG; 118 break; 119 case DPAA_PKT_TYPE_IPV6_FRAG: 120 case DPAA_PKT_TYPE_IPV6_FRAG_UDP: 121 case DPAA_PKT_TYPE_IPV6_FRAG_TCP: 122 case DPAA_PKT_TYPE_IPV6_FRAG_SCTP: 123 m->packet_type = RTE_PTYPE_L2_ETHER | 124 RTE_PTYPE_L3_IPV6 | RTE_PTYPE_L4_FRAG; 125 break; 126 case DPAA_PKT_TYPE_IPV4_EXT: 127 m->packet_type = RTE_PTYPE_L2_ETHER | 128 RTE_PTYPE_L3_IPV4_EXT; 129 break; 130 case DPAA_PKT_TYPE_IPV6_EXT: 131 m->packet_type = RTE_PTYPE_L2_ETHER | 132 RTE_PTYPE_L3_IPV6_EXT; 133 break; 134 case DPAA_PKT_TYPE_IPV4_TCP: 135 m->packet_type = RTE_PTYPE_L2_ETHER | 136 RTE_PTYPE_L3_IPV4 | RTE_PTYPE_L4_TCP; 137 break; 138 case DPAA_PKT_TYPE_IPV6_TCP: 139 m->packet_type = RTE_PTYPE_L2_ETHER | 140 RTE_PTYPE_L3_IPV6 | RTE_PTYPE_L4_TCP; 141 break; 142 case DPAA_PKT_TYPE_IPV4_UDP: 143 m->packet_type = RTE_PTYPE_L2_ETHER | 144 RTE_PTYPE_L3_IPV4 | RTE_PTYPE_L4_UDP; 145 break; 146 case DPAA_PKT_TYPE_IPV6_UDP: 147 m->packet_type = RTE_PTYPE_L2_ETHER | 148 RTE_PTYPE_L3_IPV6 | RTE_PTYPE_L4_UDP; 149 break; 150 case DPAA_PKT_TYPE_IPV4_EXT_UDP: 151 m->packet_type = RTE_PTYPE_L2_ETHER | 152 RTE_PTYPE_L3_IPV4_EXT | RTE_PTYPE_L4_UDP; 153 break; 154 case DPAA_PKT_TYPE_IPV6_EXT_UDP: 155 m->packet_type = RTE_PTYPE_L2_ETHER | 156 RTE_PTYPE_L3_IPV6_EXT | RTE_PTYPE_L4_UDP; 157 break; 158 case DPAA_PKT_TYPE_IPV4_EXT_TCP: 159 m->packet_type = RTE_PTYPE_L2_ETHER | 160 RTE_PTYPE_L3_IPV4_EXT | RTE_PTYPE_L4_TCP; 161 break; 162 case DPAA_PKT_TYPE_IPV6_EXT_TCP: 163 m->packet_type = RTE_PTYPE_L2_ETHER | 164 RTE_PTYPE_L3_IPV6_EXT | RTE_PTYPE_L4_TCP; 165 break; 166 case DPAA_PKT_TYPE_IPV4_SCTP: 167 m->packet_type = RTE_PTYPE_L2_ETHER | 168 RTE_PTYPE_L3_IPV4 | RTE_PTYPE_L4_SCTP; 169 break; 170 case DPAA_PKT_TYPE_IPV6_SCTP: 171 m->packet_type = RTE_PTYPE_L2_ETHER | 172 RTE_PTYPE_L3_IPV6 | RTE_PTYPE_L4_SCTP; 173 break; 174 case DPAA_PKT_TYPE_NONE: 175 m->packet_type = 0; 176 break; 177 /* More switch cases can be added */ 178 default: 179 dpaa_slow_parsing(m, prs); 180 } 181 182 m->tx_offload = annot->parse.ip_off[0]; 183 m->tx_offload |= (annot->parse.l4_off - annot->parse.ip_off[0]) 184 << DPAA_PKT_L3_LEN_SHIFT; 185 186 /* Set the hash values */ 187 m->hash.rss = (uint32_t)(annot->hash); 188 /* All packets with Bad checksum are dropped by interface (and 189 * corresponding notification issued to RX error queues). 190 */ 191 m->ol_flags = PKT_RX_RSS_HASH | PKT_RX_IP_CKSUM_GOOD; 192 193 /* Check if Vlan is present */ 194 if (prs & DPAA_PARSE_VLAN_MASK) 195 m->ol_flags |= PKT_RX_VLAN; 196 /* Packet received without stripping the vlan */ 197 } 198 199 static inline void dpaa_checksum(struct rte_mbuf *mbuf) 200 { 201 struct ether_hdr *eth_hdr = rte_pktmbuf_mtod(mbuf, struct ether_hdr *); 202 char *l3_hdr = (char *)eth_hdr + mbuf->l2_len; 203 struct ipv4_hdr *ipv4_hdr = (struct ipv4_hdr *)l3_hdr; 204 struct ipv6_hdr *ipv6_hdr = (struct ipv6_hdr *)l3_hdr; 205 206 DPAA_DP_LOG(DEBUG, "Calculating checksum for mbuf: %p", mbuf); 207 208 if (((mbuf->packet_type & RTE_PTYPE_L3_MASK) == RTE_PTYPE_L3_IPV4) || 209 ((mbuf->packet_type & RTE_PTYPE_L3_MASK) == 210 RTE_PTYPE_L3_IPV4_EXT)) { 211 ipv4_hdr = (struct ipv4_hdr *)l3_hdr; 212 ipv4_hdr->hdr_checksum = 0; 213 ipv4_hdr->hdr_checksum = rte_ipv4_cksum(ipv4_hdr); 214 } else if (((mbuf->packet_type & RTE_PTYPE_L3_MASK) == 215 RTE_PTYPE_L3_IPV6) || 216 ((mbuf->packet_type & RTE_PTYPE_L3_MASK) == 217 RTE_PTYPE_L3_IPV6_EXT)) 218 ipv6_hdr = (struct ipv6_hdr *)l3_hdr; 219 220 if ((mbuf->packet_type & RTE_PTYPE_L4_MASK) == RTE_PTYPE_L4_TCP) { 221 struct tcp_hdr *tcp_hdr = (struct tcp_hdr *)(l3_hdr + 222 mbuf->l3_len); 223 tcp_hdr->cksum = 0; 224 if (eth_hdr->ether_type == htons(ETHER_TYPE_IPv4)) 225 tcp_hdr->cksum = rte_ipv4_udptcp_cksum(ipv4_hdr, 226 tcp_hdr); 227 else /* assume ethertype == ETHER_TYPE_IPv6 */ 228 tcp_hdr->cksum = rte_ipv6_udptcp_cksum(ipv6_hdr, 229 tcp_hdr); 230 } else if ((mbuf->packet_type & RTE_PTYPE_L4_MASK) == 231 RTE_PTYPE_L4_UDP) { 232 struct udp_hdr *udp_hdr = (struct udp_hdr *)(l3_hdr + 233 mbuf->l3_len); 234 udp_hdr->dgram_cksum = 0; 235 if (eth_hdr->ether_type == htons(ETHER_TYPE_IPv4)) 236 udp_hdr->dgram_cksum = rte_ipv4_udptcp_cksum(ipv4_hdr, 237 udp_hdr); 238 else /* assume ethertype == ETHER_TYPE_IPv6 */ 239 udp_hdr->dgram_cksum = rte_ipv6_udptcp_cksum(ipv6_hdr, 240 udp_hdr); 241 } 242 } 243 244 static inline void dpaa_checksum_offload(struct rte_mbuf *mbuf, 245 struct qm_fd *fd, char *prs_buf) 246 { 247 struct dpaa_eth_parse_results_t *prs; 248 249 DPAA_DP_LOG(DEBUG, " Offloading checksum for mbuf: %p", mbuf); 250 251 prs = GET_TX_PRS(prs_buf); 252 prs->l3r = 0; 253 prs->l4r = 0; 254 if (((mbuf->packet_type & RTE_PTYPE_L3_MASK) == RTE_PTYPE_L3_IPV4) || 255 ((mbuf->packet_type & RTE_PTYPE_L3_MASK) == 256 RTE_PTYPE_L3_IPV4_EXT)) 257 prs->l3r = DPAA_L3_PARSE_RESULT_IPV4; 258 else if (((mbuf->packet_type & RTE_PTYPE_L3_MASK) == 259 RTE_PTYPE_L3_IPV6) || 260 ((mbuf->packet_type & RTE_PTYPE_L3_MASK) == 261 RTE_PTYPE_L3_IPV6_EXT)) 262 prs->l3r = DPAA_L3_PARSE_RESULT_IPV6; 263 264 if ((mbuf->packet_type & RTE_PTYPE_L4_MASK) == RTE_PTYPE_L4_TCP) 265 prs->l4r = DPAA_L4_PARSE_RESULT_TCP; 266 else if ((mbuf->packet_type & RTE_PTYPE_L4_MASK) == RTE_PTYPE_L4_UDP) 267 prs->l4r = DPAA_L4_PARSE_RESULT_UDP; 268 269 prs->ip_off[0] = mbuf->l2_len; 270 prs->l4_off = mbuf->l3_len + mbuf->l2_len; 271 /* Enable L3 (and L4, if TCP or UDP) HW checksum*/ 272 fd->cmd = DPAA_FD_CMD_RPD | DPAA_FD_CMD_DTC; 273 } 274 275 static inline void 276 dpaa_unsegmented_checksum(struct rte_mbuf *mbuf, struct qm_fd *fd_arr) 277 { 278 if (!mbuf->packet_type) { 279 struct rte_net_hdr_lens hdr_lens; 280 281 mbuf->packet_type = rte_net_get_ptype(mbuf, &hdr_lens, 282 RTE_PTYPE_L2_MASK | RTE_PTYPE_L3_MASK 283 | RTE_PTYPE_L4_MASK); 284 mbuf->l2_len = hdr_lens.l2_len; 285 mbuf->l3_len = hdr_lens.l3_len; 286 } 287 if (mbuf->data_off < (DEFAULT_TX_ICEOF + 288 sizeof(struct dpaa_eth_parse_results_t))) { 289 DPAA_DP_LOG(DEBUG, "Checksum offload Err: " 290 "Not enough Headroom " 291 "space for correct Checksum offload." 292 "So Calculating checksum in Software."); 293 dpaa_checksum(mbuf); 294 } else { 295 dpaa_checksum_offload(mbuf, fd_arr, mbuf->buf_addr); 296 } 297 } 298 299 struct rte_mbuf * 300 dpaa_eth_sg_to_mbuf(const struct qm_fd *fd, uint32_t ifid) 301 { 302 struct dpaa_bp_info *bp_info = DPAA_BPID_TO_POOL_INFO(fd->bpid); 303 struct rte_mbuf *first_seg, *prev_seg, *cur_seg, *temp; 304 struct qm_sg_entry *sgt, *sg_temp; 305 void *vaddr, *sg_vaddr; 306 int i = 0; 307 uint8_t fd_offset = fd->offset; 308 309 vaddr = DPAA_MEMPOOL_PTOV(bp_info, qm_fd_addr(fd)); 310 if (!vaddr) { 311 DPAA_PMD_ERR("unable to convert physical address"); 312 return NULL; 313 } 314 sgt = vaddr + fd_offset; 315 sg_temp = &sgt[i++]; 316 hw_sg_to_cpu(sg_temp); 317 temp = (struct rte_mbuf *)((char *)vaddr - bp_info->meta_data_size); 318 sg_vaddr = DPAA_MEMPOOL_PTOV(bp_info, qm_sg_entry_get64(sg_temp)); 319 320 first_seg = (struct rte_mbuf *)((char *)sg_vaddr - 321 bp_info->meta_data_size); 322 first_seg->data_off = sg_temp->offset; 323 first_seg->data_len = sg_temp->length; 324 first_seg->pkt_len = sg_temp->length; 325 rte_mbuf_refcnt_set(first_seg, 1); 326 327 first_seg->port = ifid; 328 first_seg->nb_segs = 1; 329 first_seg->ol_flags = 0; 330 prev_seg = first_seg; 331 while (i < DPAA_SGT_MAX_ENTRIES) { 332 sg_temp = &sgt[i++]; 333 hw_sg_to_cpu(sg_temp); 334 sg_vaddr = DPAA_MEMPOOL_PTOV(bp_info, 335 qm_sg_entry_get64(sg_temp)); 336 cur_seg = (struct rte_mbuf *)((char *)sg_vaddr - 337 bp_info->meta_data_size); 338 cur_seg->data_off = sg_temp->offset; 339 cur_seg->data_len = sg_temp->length; 340 first_seg->pkt_len += sg_temp->length; 341 first_seg->nb_segs += 1; 342 rte_mbuf_refcnt_set(cur_seg, 1); 343 prev_seg->next = cur_seg; 344 if (sg_temp->final) { 345 cur_seg->next = NULL; 346 break; 347 } 348 prev_seg = cur_seg; 349 } 350 DPAA_DP_LOG(DEBUG, "Received an SG frame len =%d, num_sg =%d", 351 first_seg->pkt_len, first_seg->nb_segs); 352 353 dpaa_eth_packet_info(first_seg, vaddr); 354 rte_pktmbuf_free_seg(temp); 355 356 return first_seg; 357 } 358 359 static inline struct rte_mbuf * 360 dpaa_eth_fd_to_mbuf(const struct qm_fd *fd, uint32_t ifid) 361 { 362 struct rte_mbuf *mbuf; 363 struct dpaa_bp_info *bp_info = DPAA_BPID_TO_POOL_INFO(fd->bpid); 364 void *ptr; 365 uint8_t format = 366 (fd->opaque & DPAA_FD_FORMAT_MASK) >> DPAA_FD_FORMAT_SHIFT; 367 uint16_t offset; 368 uint32_t length; 369 370 if (unlikely(format == qm_fd_sg)) 371 return dpaa_eth_sg_to_mbuf(fd, ifid); 372 373 ptr = DPAA_MEMPOOL_PTOV(bp_info, qm_fd_addr(fd)); 374 375 rte_prefetch0((void *)((uint8_t *)ptr + DEFAULT_RX_ICEOF)); 376 377 offset = (fd->opaque & DPAA_FD_OFFSET_MASK) >> DPAA_FD_OFFSET_SHIFT; 378 length = fd->opaque & DPAA_FD_LENGTH_MASK; 379 380 DPAA_DP_LOG(DEBUG, " FD--->MBUF off %d len = %d", offset, length); 381 382 /* Ignoring case when format != qm_fd_contig */ 383 dpaa_display_frame(fd); 384 385 mbuf = (struct rte_mbuf *)((char *)ptr - bp_info->meta_data_size); 386 387 mbuf->data_off = offset; 388 mbuf->data_len = length; 389 mbuf->pkt_len = length; 390 391 mbuf->port = ifid; 392 mbuf->nb_segs = 1; 393 mbuf->ol_flags = 0; 394 mbuf->next = NULL; 395 rte_mbuf_refcnt_set(mbuf, 1); 396 dpaa_eth_packet_info(mbuf, mbuf->buf_addr); 397 398 return mbuf; 399 } 400 401 /* Specific for LS1043 */ 402 void 403 dpaa_rx_cb_no_prefetch(struct qman_fq **fq, struct qm_dqrr_entry **dqrr, 404 void **bufs, int num_bufs) 405 { 406 struct rte_mbuf *mbuf; 407 struct dpaa_bp_info *bp_info; 408 const struct qm_fd *fd; 409 void *ptr; 410 struct dpaa_if *dpaa_intf; 411 uint16_t offset, i; 412 uint32_t length; 413 uint8_t format; 414 415 bp_info = DPAA_BPID_TO_POOL_INFO(dqrr[0]->fd.bpid); 416 ptr = rte_dpaa_mem_ptov(qm_fd_addr(&dqrr[0]->fd)); 417 rte_prefetch0((void *)((uint8_t *)ptr + DEFAULT_RX_ICEOF)); 418 bufs[0] = (struct rte_mbuf *)((char *)ptr - bp_info->meta_data_size); 419 420 for (i = 0; i < num_bufs; i++) { 421 if (i < num_bufs - 1) { 422 bp_info = DPAA_BPID_TO_POOL_INFO(dqrr[i + 1]->fd.bpid); 423 ptr = rte_dpaa_mem_ptov(qm_fd_addr(&dqrr[i + 1]->fd)); 424 rte_prefetch0((void *)((uint8_t *)ptr + 425 DEFAULT_RX_ICEOF)); 426 bufs[i + 1] = (struct rte_mbuf *)((char *)ptr - 427 bp_info->meta_data_size); 428 } 429 430 fd = &dqrr[i]->fd; 431 dpaa_intf = fq[0]->dpaa_intf; 432 433 format = (fd->opaque & DPAA_FD_FORMAT_MASK) >> 434 DPAA_FD_FORMAT_SHIFT; 435 if (unlikely(format == qm_fd_sg)) { 436 bufs[i] = dpaa_eth_sg_to_mbuf(fd, dpaa_intf->ifid); 437 continue; 438 } 439 440 offset = (fd->opaque & DPAA_FD_OFFSET_MASK) >> 441 DPAA_FD_OFFSET_SHIFT; 442 length = fd->opaque & DPAA_FD_LENGTH_MASK; 443 444 mbuf = bufs[i]; 445 mbuf->data_off = offset; 446 mbuf->data_len = length; 447 mbuf->pkt_len = length; 448 mbuf->port = dpaa_intf->ifid; 449 450 mbuf->nb_segs = 1; 451 mbuf->ol_flags = 0; 452 mbuf->next = NULL; 453 rte_mbuf_refcnt_set(mbuf, 1); 454 dpaa_eth_packet_info(mbuf, mbuf->buf_addr); 455 } 456 } 457 458 void 459 dpaa_rx_cb(struct qman_fq **fq, struct qm_dqrr_entry **dqrr, 460 void **bufs, int num_bufs) 461 { 462 struct rte_mbuf *mbuf; 463 const struct qm_fd *fd; 464 struct dpaa_if *dpaa_intf; 465 uint16_t offset, i; 466 uint32_t length; 467 uint8_t format; 468 469 for (i = 0; i < num_bufs; i++) { 470 fd = &dqrr[i]->fd; 471 dpaa_intf = fq[0]->dpaa_intf; 472 473 format = (fd->opaque & DPAA_FD_FORMAT_MASK) >> 474 DPAA_FD_FORMAT_SHIFT; 475 if (unlikely(format == qm_fd_sg)) { 476 bufs[i] = dpaa_eth_sg_to_mbuf(fd, dpaa_intf->ifid); 477 continue; 478 } 479 480 offset = (fd->opaque & DPAA_FD_OFFSET_MASK) >> 481 DPAA_FD_OFFSET_SHIFT; 482 length = fd->opaque & DPAA_FD_LENGTH_MASK; 483 484 mbuf = bufs[i]; 485 mbuf->data_off = offset; 486 mbuf->data_len = length; 487 mbuf->pkt_len = length; 488 mbuf->port = dpaa_intf->ifid; 489 490 mbuf->nb_segs = 1; 491 mbuf->ol_flags = 0; 492 mbuf->next = NULL; 493 rte_mbuf_refcnt_set(mbuf, 1); 494 dpaa_eth_packet_info(mbuf, mbuf->buf_addr); 495 } 496 } 497 498 void dpaa_rx_cb_prepare(struct qm_dqrr_entry *dq, void **bufs) 499 { 500 struct dpaa_bp_info *bp_info = DPAA_BPID_TO_POOL_INFO(dq->fd.bpid); 501 void *ptr = rte_dpaa_mem_ptov(qm_fd_addr(&dq->fd)); 502 503 /* In case of LS1046, annotation stashing is disabled due to L2 cache 504 * being bottleneck in case of multicore scanario for this platform. 505 * So we prefetch the annoation beforehand, so that it is available 506 * in cache when accessed. 507 */ 508 rte_prefetch0((void *)((uint8_t *)ptr + DEFAULT_RX_ICEOF)); 509 510 *bufs = (struct rte_mbuf *)((char *)ptr - bp_info->meta_data_size); 511 } 512 513 static uint16_t 514 dpaa_eth_queue_portal_rx(struct qman_fq *fq, 515 struct rte_mbuf **bufs, 516 uint16_t nb_bufs) 517 { 518 int ret; 519 520 if (unlikely(fq->qp == NULL)) { 521 ret = rte_dpaa_portal_fq_init((void *)0, fq); 522 if (ret) { 523 DPAA_PMD_ERR("Failure in affining portal %d", ret); 524 return 0; 525 } 526 } 527 528 return qman_portal_poll_rx(nb_bufs, (void **)bufs, fq->qp); 529 } 530 531 enum qman_cb_dqrr_result 532 dpaa_rx_cb_parallel(void *event, 533 struct qman_portal *qm __always_unused, 534 struct qman_fq *fq, 535 const struct qm_dqrr_entry *dqrr, 536 void **bufs) 537 { 538 u32 ifid = ((struct dpaa_if *)fq->dpaa_intf)->ifid; 539 struct rte_mbuf *mbuf; 540 struct rte_event *ev = (struct rte_event *)event; 541 542 mbuf = dpaa_eth_fd_to_mbuf(&dqrr->fd, ifid); 543 ev->event_ptr = (void *)mbuf; 544 ev->flow_id = fq->ev.flow_id; 545 ev->sub_event_type = fq->ev.sub_event_type; 546 ev->event_type = RTE_EVENT_TYPE_ETHDEV; 547 ev->op = RTE_EVENT_OP_NEW; 548 ev->sched_type = fq->ev.sched_type; 549 ev->queue_id = fq->ev.queue_id; 550 ev->priority = fq->ev.priority; 551 ev->impl_opaque = (uint8_t)DPAA_INVALID_MBUF_SEQN; 552 mbuf->seqn = DPAA_INVALID_MBUF_SEQN; 553 *bufs = mbuf; 554 555 return qman_cb_dqrr_consume; 556 } 557 558 enum qman_cb_dqrr_result 559 dpaa_rx_cb_atomic(void *event, 560 struct qman_portal *qm __always_unused, 561 struct qman_fq *fq, 562 const struct qm_dqrr_entry *dqrr, 563 void **bufs) 564 { 565 u8 index; 566 u32 ifid = ((struct dpaa_if *)fq->dpaa_intf)->ifid; 567 struct rte_mbuf *mbuf; 568 struct rte_event *ev = (struct rte_event *)event; 569 570 mbuf = dpaa_eth_fd_to_mbuf(&dqrr->fd, ifid); 571 ev->event_ptr = (void *)mbuf; 572 ev->flow_id = fq->ev.flow_id; 573 ev->sub_event_type = fq->ev.sub_event_type; 574 ev->event_type = RTE_EVENT_TYPE_ETHDEV; 575 ev->op = RTE_EVENT_OP_NEW; 576 ev->sched_type = fq->ev.sched_type; 577 ev->queue_id = fq->ev.queue_id; 578 ev->priority = fq->ev.priority; 579 580 /* Save active dqrr entries */ 581 index = DQRR_PTR2IDX(dqrr); 582 DPAA_PER_LCORE_DQRR_SIZE++; 583 DPAA_PER_LCORE_DQRR_HELD |= 1 << index; 584 DPAA_PER_LCORE_DQRR_MBUF(index) = mbuf; 585 ev->impl_opaque = index + 1; 586 mbuf->seqn = (uint32_t)index + 1; 587 *bufs = mbuf; 588 589 return qman_cb_dqrr_defer; 590 } 591 592 uint16_t dpaa_eth_queue_rx(void *q, 593 struct rte_mbuf **bufs, 594 uint16_t nb_bufs) 595 { 596 struct qman_fq *fq = q; 597 struct qm_dqrr_entry *dq; 598 uint32_t num_rx = 0, ifid = ((struct dpaa_if *)fq->dpaa_intf)->ifid; 599 int num_rx_bufs, ret; 600 uint32_t vdqcr_flags = 0; 601 602 if (likely(fq->is_static)) 603 return dpaa_eth_queue_portal_rx(fq, bufs, nb_bufs); 604 605 if (unlikely(!RTE_PER_LCORE(dpaa_io))) { 606 ret = rte_dpaa_portal_init((void *)0); 607 if (ret) { 608 DPAA_PMD_ERR("Failure in affining portal"); 609 return 0; 610 } 611 } 612 613 /* Until request for four buffers, we provide exact number of buffers. 614 * Otherwise we do not set the QM_VDQCR_EXACT flag. 615 * Not setting QM_VDQCR_EXACT flag can provide two more buffers than 616 * requested, so we request two less in this case. 617 */ 618 if (nb_bufs < 4) { 619 vdqcr_flags = QM_VDQCR_EXACT; 620 num_rx_bufs = nb_bufs; 621 } else { 622 num_rx_bufs = nb_bufs > DPAA_MAX_DEQUEUE_NUM_FRAMES ? 623 (DPAA_MAX_DEQUEUE_NUM_FRAMES - 2) : (nb_bufs - 2); 624 } 625 ret = qman_set_vdq(fq, num_rx_bufs, vdqcr_flags); 626 if (ret) 627 return 0; 628 629 do { 630 dq = qman_dequeue(fq); 631 if (!dq) 632 continue; 633 bufs[num_rx++] = dpaa_eth_fd_to_mbuf(&dq->fd, ifid); 634 qman_dqrr_consume(fq, dq); 635 } while (fq->flags & QMAN_FQ_STATE_VDQCR); 636 637 return num_rx; 638 } 639 640 static void *dpaa_get_pktbuf(struct dpaa_bp_info *bp_info) 641 { 642 int ret; 643 size_t buf = 0; 644 struct bm_buffer bufs; 645 646 ret = bman_acquire(bp_info->bp, &bufs, 1, 0); 647 if (ret <= 0) { 648 DPAA_PMD_WARN("Failed to allocate buffers %d", ret); 649 return (void *)buf; 650 } 651 652 DPAA_DP_LOG(DEBUG, "got buffer 0x%" PRIx64 " from pool %d", 653 (uint64_t)bufs.addr, bufs.bpid); 654 655 buf = (size_t)DPAA_MEMPOOL_PTOV(bp_info, bufs.addr) 656 - bp_info->meta_data_size; 657 if (!buf) 658 goto out; 659 660 out: 661 return (void *)buf; 662 } 663 664 static struct rte_mbuf *dpaa_get_dmable_mbuf(struct rte_mbuf *mbuf, 665 struct dpaa_if *dpaa_intf) 666 { 667 struct rte_mbuf *dpaa_mbuf; 668 669 /* allocate pktbuffer on bpid for dpaa port */ 670 dpaa_mbuf = dpaa_get_pktbuf(dpaa_intf->bp_info); 671 if (!dpaa_mbuf) 672 return NULL; 673 674 memcpy((uint8_t *)(dpaa_mbuf->buf_addr) + RTE_PKTMBUF_HEADROOM, (void *) 675 ((uint8_t *)(mbuf->buf_addr) + mbuf->data_off), mbuf->pkt_len); 676 677 /* Copy only the required fields */ 678 dpaa_mbuf->data_off = RTE_PKTMBUF_HEADROOM; 679 dpaa_mbuf->pkt_len = mbuf->pkt_len; 680 dpaa_mbuf->ol_flags = mbuf->ol_flags; 681 dpaa_mbuf->packet_type = mbuf->packet_type; 682 dpaa_mbuf->tx_offload = mbuf->tx_offload; 683 rte_pktmbuf_free(mbuf); 684 return dpaa_mbuf; 685 } 686 687 int 688 dpaa_eth_mbuf_to_sg_fd(struct rte_mbuf *mbuf, 689 struct qm_fd *fd, 690 uint32_t bpid) 691 { 692 struct rte_mbuf *cur_seg = mbuf, *prev_seg = NULL; 693 struct dpaa_bp_info *bp_info = DPAA_BPID_TO_POOL_INFO(bpid); 694 struct rte_mbuf *temp, *mi; 695 struct qm_sg_entry *sg_temp, *sgt; 696 int i = 0; 697 698 DPAA_DP_LOG(DEBUG, "Creating SG FD to transmit"); 699 700 temp = rte_pktmbuf_alloc(bp_info->mp); 701 if (!temp) { 702 DPAA_PMD_ERR("Failure in allocation of mbuf"); 703 return -1; 704 } 705 if (temp->buf_len < ((mbuf->nb_segs * sizeof(struct qm_sg_entry)) 706 + temp->data_off)) { 707 DPAA_PMD_ERR("Insufficient space in mbuf for SG entries"); 708 return -1; 709 } 710 711 fd->cmd = 0; 712 fd->opaque_addr = 0; 713 714 if (mbuf->ol_flags & DPAA_TX_CKSUM_OFFLOAD_MASK) { 715 if (!mbuf->packet_type) { 716 struct rte_net_hdr_lens hdr_lens; 717 718 mbuf->packet_type = rte_net_get_ptype(mbuf, &hdr_lens, 719 RTE_PTYPE_L2_MASK | RTE_PTYPE_L3_MASK 720 | RTE_PTYPE_L4_MASK); 721 mbuf->l2_len = hdr_lens.l2_len; 722 mbuf->l3_len = hdr_lens.l3_len; 723 } 724 if (temp->data_off < DEFAULT_TX_ICEOF 725 + sizeof(struct dpaa_eth_parse_results_t)) 726 temp->data_off = DEFAULT_TX_ICEOF 727 + sizeof(struct dpaa_eth_parse_results_t); 728 dcbz_64(temp->buf_addr); 729 dpaa_checksum_offload(mbuf, fd, temp->buf_addr); 730 } 731 732 sgt = temp->buf_addr + temp->data_off; 733 fd->format = QM_FD_SG; 734 fd->addr = temp->buf_iova; 735 fd->offset = temp->data_off; 736 fd->bpid = bpid; 737 fd->length20 = mbuf->pkt_len; 738 739 while (i < DPAA_SGT_MAX_ENTRIES) { 740 sg_temp = &sgt[i++]; 741 sg_temp->opaque = 0; 742 sg_temp->val = 0; 743 sg_temp->addr = cur_seg->buf_iova; 744 sg_temp->offset = cur_seg->data_off; 745 sg_temp->length = cur_seg->data_len; 746 if (RTE_MBUF_DIRECT(cur_seg)) { 747 if (rte_mbuf_refcnt_read(cur_seg) > 1) { 748 /*If refcnt > 1, invalid bpid is set to ensure 749 * buffer is not freed by HW. 750 */ 751 sg_temp->bpid = 0xff; 752 rte_mbuf_refcnt_update(cur_seg, -1); 753 } else { 754 sg_temp->bpid = 755 DPAA_MEMPOOL_TO_BPID(cur_seg->pool); 756 } 757 cur_seg = cur_seg->next; 758 } else { 759 /* Get owner MBUF from indirect buffer */ 760 mi = rte_mbuf_from_indirect(cur_seg); 761 if (rte_mbuf_refcnt_read(mi) > 1) { 762 /*If refcnt > 1, invalid bpid is set to ensure 763 * owner buffer is not freed by HW. 764 */ 765 sg_temp->bpid = 0xff; 766 } else { 767 sg_temp->bpid = DPAA_MEMPOOL_TO_BPID(mi->pool); 768 rte_mbuf_refcnt_update(mi, 1); 769 } 770 prev_seg = cur_seg; 771 cur_seg = cur_seg->next; 772 prev_seg->next = NULL; 773 rte_pktmbuf_free(prev_seg); 774 } 775 if (cur_seg == NULL) { 776 sg_temp->final = 1; 777 cpu_to_hw_sg(sg_temp); 778 break; 779 } 780 cpu_to_hw_sg(sg_temp); 781 } 782 return 0; 783 } 784 785 /* Handle mbufs which are not segmented (non SG) */ 786 static inline void 787 tx_on_dpaa_pool_unsegmented(struct rte_mbuf *mbuf, 788 struct dpaa_bp_info *bp_info, 789 struct qm_fd *fd_arr) 790 { 791 struct rte_mbuf *mi = NULL; 792 793 if (RTE_MBUF_DIRECT(mbuf)) { 794 if (rte_mbuf_refcnt_read(mbuf) > 1) { 795 /* In case of direct mbuf and mbuf being cloned, 796 * BMAN should _not_ release buffer. 797 */ 798 DPAA_MBUF_TO_CONTIG_FD(mbuf, fd_arr, 0xff); 799 /* Buffer should be releasd by EAL */ 800 rte_mbuf_refcnt_update(mbuf, -1); 801 } else { 802 /* In case of direct mbuf and no cloning, mbuf can be 803 * released by BMAN. 804 */ 805 DPAA_MBUF_TO_CONTIG_FD(mbuf, fd_arr, bp_info->bpid); 806 } 807 } else { 808 /* This is data-containing core mbuf: 'mi' */ 809 mi = rte_mbuf_from_indirect(mbuf); 810 if (rte_mbuf_refcnt_read(mi) > 1) { 811 /* In case of indirect mbuf, and mbuf being cloned, 812 * BMAN should _not_ release it and let EAL release 813 * it through pktmbuf_free below. 814 */ 815 DPAA_MBUF_TO_CONTIG_FD(mbuf, fd_arr, 0xff); 816 } else { 817 /* In case of indirect mbuf, and no cloning, core mbuf 818 * should be released by BMAN. 819 * Increate refcnt of core mbuf so that when 820 * pktmbuf_free is called and mbuf is released, EAL 821 * doesn't try to release core mbuf which would have 822 * been released by BMAN. 823 */ 824 rte_mbuf_refcnt_update(mi, 1); 825 DPAA_MBUF_TO_CONTIG_FD(mbuf, fd_arr, bp_info->bpid); 826 } 827 rte_pktmbuf_free(mbuf); 828 } 829 830 if (mbuf->ol_flags & DPAA_TX_CKSUM_OFFLOAD_MASK) 831 dpaa_unsegmented_checksum(mbuf, fd_arr); 832 } 833 834 /* Handle all mbufs on dpaa BMAN managed pool */ 835 static inline uint16_t 836 tx_on_dpaa_pool(struct rte_mbuf *mbuf, 837 struct dpaa_bp_info *bp_info, 838 struct qm_fd *fd_arr) 839 { 840 DPAA_DP_LOG(DEBUG, "BMAN offloaded buffer, mbuf: %p", mbuf); 841 842 if (mbuf->nb_segs == 1) { 843 /* Case for non-segmented buffers */ 844 tx_on_dpaa_pool_unsegmented(mbuf, bp_info, fd_arr); 845 } else if (mbuf->nb_segs > 1 && 846 mbuf->nb_segs <= DPAA_SGT_MAX_ENTRIES) { 847 if (dpaa_eth_mbuf_to_sg_fd(mbuf, fd_arr, bp_info->bpid)) { 848 DPAA_PMD_DEBUG("Unable to create Scatter Gather FD"); 849 return 1; 850 } 851 } else { 852 DPAA_PMD_DEBUG("Number of Segments not supported"); 853 return 1; 854 } 855 856 return 0; 857 } 858 859 /* Handle all mbufs on an external pool (non-dpaa) */ 860 static inline uint16_t 861 tx_on_external_pool(struct qman_fq *txq, struct rte_mbuf *mbuf, 862 struct qm_fd *fd_arr) 863 { 864 struct dpaa_if *dpaa_intf = txq->dpaa_intf; 865 struct rte_mbuf *dmable_mbuf; 866 867 DPAA_DP_LOG(DEBUG, "Non-BMAN offloaded buffer." 868 "Allocating an offloaded buffer"); 869 dmable_mbuf = dpaa_get_dmable_mbuf(mbuf, dpaa_intf); 870 if (!dmable_mbuf) { 871 DPAA_DP_LOG(DEBUG, "no dpaa buffers."); 872 return 1; 873 } 874 875 DPAA_MBUF_TO_CONTIG_FD(dmable_mbuf, fd_arr, dpaa_intf->bp_info->bpid); 876 if (mbuf->ol_flags & DPAA_TX_CKSUM_OFFLOAD_MASK) 877 dpaa_unsegmented_checksum(mbuf, fd_arr); 878 879 return 0; 880 } 881 882 uint16_t 883 dpaa_eth_queue_tx(void *q, struct rte_mbuf **bufs, uint16_t nb_bufs) 884 { 885 struct rte_mbuf *mbuf, *mi = NULL; 886 struct rte_mempool *mp; 887 struct dpaa_bp_info *bp_info; 888 struct qm_fd fd_arr[DPAA_TX_BURST_SIZE]; 889 uint32_t frames_to_send, loop, sent = 0; 890 uint16_t state; 891 int ret; 892 uint32_t seqn, index, flags[DPAA_TX_BURST_SIZE] = {0}; 893 894 if (unlikely(!RTE_PER_LCORE(dpaa_io))) { 895 ret = rte_dpaa_portal_init((void *)0); 896 if (ret) { 897 DPAA_PMD_ERR("Failure in affining portal"); 898 return 0; 899 } 900 } 901 902 DPAA_DP_LOG(DEBUG, "Transmitting %d buffers on queue: %p", nb_bufs, q); 903 904 while (nb_bufs) { 905 frames_to_send = (nb_bufs > DPAA_TX_BURST_SIZE) ? 906 DPAA_TX_BURST_SIZE : nb_bufs; 907 for (loop = 0; loop < frames_to_send; loop++) { 908 mbuf = *(bufs++); 909 seqn = mbuf->seqn; 910 if (seqn != DPAA_INVALID_MBUF_SEQN) { 911 index = seqn - 1; 912 if (DPAA_PER_LCORE_DQRR_HELD & (1 << index)) { 913 flags[loop] = 914 ((index & QM_EQCR_DCA_IDXMASK) << 8); 915 flags[loop] |= QMAN_ENQUEUE_FLAG_DCA; 916 DPAA_PER_LCORE_DQRR_SIZE--; 917 DPAA_PER_LCORE_DQRR_HELD &= 918 ~(1 << index); 919 } 920 } 921 922 if (likely(RTE_MBUF_DIRECT(mbuf))) { 923 mp = mbuf->pool; 924 bp_info = DPAA_MEMPOOL_TO_POOL_INFO(mp); 925 if (likely(mp->ops_index == 926 bp_info->dpaa_ops_index && 927 mbuf->nb_segs == 1 && 928 rte_mbuf_refcnt_read(mbuf) == 1)) { 929 DPAA_MBUF_TO_CONTIG_FD(mbuf, 930 &fd_arr[loop], bp_info->bpid); 931 if (mbuf->ol_flags & 932 DPAA_TX_CKSUM_OFFLOAD_MASK) 933 dpaa_unsegmented_checksum(mbuf, 934 &fd_arr[loop]); 935 continue; 936 } 937 } else { 938 mi = rte_mbuf_from_indirect(mbuf); 939 mp = mi->pool; 940 } 941 942 bp_info = DPAA_MEMPOOL_TO_POOL_INFO(mp); 943 if (likely(mp->ops_index == bp_info->dpaa_ops_index)) { 944 state = tx_on_dpaa_pool(mbuf, bp_info, 945 &fd_arr[loop]); 946 if (unlikely(state)) { 947 /* Set frames_to_send & nb_bufs so 948 * that packets are transmitted till 949 * previous frame. 950 */ 951 frames_to_send = loop; 952 nb_bufs = loop; 953 goto send_pkts; 954 } 955 } else { 956 state = tx_on_external_pool(q, mbuf, 957 &fd_arr[loop]); 958 if (unlikely(state)) { 959 /* Set frames_to_send & nb_bufs so 960 * that packets are transmitted till 961 * previous frame. 962 */ 963 frames_to_send = loop; 964 nb_bufs = loop; 965 goto send_pkts; 966 } 967 } 968 } 969 970 send_pkts: 971 loop = 0; 972 while (loop < frames_to_send) { 973 loop += qman_enqueue_multi(q, &fd_arr[loop], 974 &flags[loop], 975 frames_to_send - loop); 976 } 977 nb_bufs -= frames_to_send; 978 sent += frames_to_send; 979 } 980 981 DPAA_DP_LOG(DEBUG, "Transmitted %d buffers on queue: %p", sent, q); 982 983 return sent; 984 } 985 986 uint16_t dpaa_eth_tx_drop_all(void *q __rte_unused, 987 struct rte_mbuf **bufs __rte_unused, 988 uint16_t nb_bufs __rte_unused) 989 { 990 DPAA_DP_LOG(DEBUG, "Drop all packets"); 991 992 /* Drop all incoming packets. No need to free packets here 993 * because the rte_eth f/w frees up the packets through tx_buffer 994 * callback in case this functions returns count less than nb_bufs 995 */ 996 return 0; 997 } 998