net/dpaa: optimize the Tx burst
[dpdk.git] / drivers / net / dpaa / dpaa_rxtx.c
1 /* SPDX-License-Identifier: BSD-3-Clause
2  *
3  *   Copyright 2016 Freescale Semiconductor, Inc. All rights reserved.
4  *   Copyright 2017 NXP
5  *
6  */
7
8 /* System headers */
9 #include <inttypes.h>
10 #include <unistd.h>
11 #include <stdio.h>
12 #include <limits.h>
13 #include <sched.h>
14 #include <pthread.h>
15
16 #include <rte_byteorder.h>
17 #include <rte_common.h>
18 #include <rte_interrupts.h>
19 #include <rte_log.h>
20 #include <rte_debug.h>
21 #include <rte_pci.h>
22 #include <rte_atomic.h>
23 #include <rte_branch_prediction.h>
24 #include <rte_memory.h>
25 #include <rte_tailq.h>
26 #include <rte_eal.h>
27 #include <rte_alarm.h>
28 #include <rte_ether.h>
29 #include <rte_ethdev.h>
30 #include <rte_malloc.h>
31 #include <rte_ring.h>
32 #include <rte_ip.h>
33 #include <rte_tcp.h>
34 #include <rte_udp.h>
35 #include <rte_net.h>
36
37 #include "dpaa_ethdev.h"
38 #include "dpaa_rxtx.h"
39 #include <rte_dpaa_bus.h>
40 #include <dpaa_mempool.h>
41
42 #include <fsl_usd.h>
43 #include <fsl_qman.h>
44 #include <fsl_bman.h>
45 #include <of.h>
46 #include <netcfg.h>
47
/* Describe '_mbuf' in frame descriptor '_fd' as one contiguous buffer.
 * 'cmd' and 'opaque_addr' are cleared first; format, data offset and packet
 * length are then packed into 'opaque', followed by the buffer address and
 * the pool id '_bpid'. '_mbuf' and '_fd' are evaluated more than once.
 */
#define DPAA_MBUF_TO_CONTIG_FD(_mbuf, _fd, _bpid) \
        do { \
                (_fd)->cmd = 0; \
                (_fd)->opaque_addr = 0; \
                (_fd)->opaque = (QM_FD_CONTIG << DPAA_FD_FORMAT_SHIFT) | \
                        (((_mbuf)->data_off) << DPAA_FD_OFFSET_SHIFT) | \
                        (_mbuf)->pkt_len; \
                (_fd)->addr = (_mbuf)->buf_iova; \
                (_fd)->bpid = (_bpid); \
        } while (0)
58
#if (defined RTE_LIBRTE_DPAA_DEBUG_DRIVER)
/* Debug helper: print the fields of frame descriptor 'fd' followed by a hex
 * dump of the frame data, 16 bytes per line.
 *
 * The dump covers exactly fd->length20 bytes starting at fd->offset inside
 * the buffer. Bytes are read as unsigned so values >= 0x80 are shown as two
 * hex digits. Nothing is dumped when the buffer address cannot be translated.
 */
void dpaa_display_frame(const struct qm_fd *fd)
{
        uint32_t ii;
        const uint8_t *ptr;

        printf("%s::bpid %x addr %08x%08x, format %d off %d, len %d stat %x\n",
               __func__, fd->bpid, fd->addr_hi, fd->addr_lo, fd->format,
                fd->offset, fd->length20, fd->status);

        ptr = (const uint8_t *)rte_dpaa_mem_ptov(fd->addr);
        if (!ptr)
                return;
        ptr += fd->offset;

        for (ii = 0; ii < fd->length20; ii++) {
                printf("%02x ", ptr[ii]);
                /* Break the line after every 16th byte */
                if (((ii + 1) % 16) == 0)
                        printf("\n");
        }
        printf("\n");
}
#else
#define dpaa_display_frame(a)
#endif
83
84 static inline void dpaa_slow_parsing(struct rte_mbuf *m __rte_unused,
85                                      uint64_t prs __rte_unused)
86 {
87         DPAA_DP_LOG(DEBUG, "Slow parsing");
88         /*TBD:XXX: to be implemented*/
89 }
90
91 static inline void dpaa_eth_packet_info(struct rte_mbuf *m,
92                                         uint64_t fd_virt_addr)
93 {
94         struct annotations_t *annot = GET_ANNOTATIONS(fd_virt_addr);
95         uint64_t prs = *((uint64_t *)(&annot->parse)) & DPAA_PARSE_MASK;
96
97         DPAA_DP_LOG(DEBUG, " Parsing mbuf: %p with annotations: %p", m, annot);
98
99         switch (prs) {
100         case DPAA_PKT_TYPE_NONE:
101                 m->packet_type = 0;
102                 break;
103         case DPAA_PKT_TYPE_ETHER:
104                 m->packet_type = RTE_PTYPE_L2_ETHER;
105                 break;
106         case DPAA_PKT_TYPE_IPV4:
107                 m->packet_type = RTE_PTYPE_L2_ETHER |
108                         RTE_PTYPE_L3_IPV4;
109                 break;
110         case DPAA_PKT_TYPE_IPV6:
111                 m->packet_type = RTE_PTYPE_L2_ETHER |
112                         RTE_PTYPE_L3_IPV6;
113                 break;
114         case DPAA_PKT_TYPE_IPV4_FRAG:
115         case DPAA_PKT_TYPE_IPV4_FRAG_UDP:
116         case DPAA_PKT_TYPE_IPV4_FRAG_TCP:
117         case DPAA_PKT_TYPE_IPV4_FRAG_SCTP:
118                 m->packet_type = RTE_PTYPE_L2_ETHER |
119                         RTE_PTYPE_L3_IPV4 | RTE_PTYPE_L4_FRAG;
120                 break;
121         case DPAA_PKT_TYPE_IPV6_FRAG:
122         case DPAA_PKT_TYPE_IPV6_FRAG_UDP:
123         case DPAA_PKT_TYPE_IPV6_FRAG_TCP:
124         case DPAA_PKT_TYPE_IPV6_FRAG_SCTP:
125                 m->packet_type = RTE_PTYPE_L2_ETHER |
126                         RTE_PTYPE_L3_IPV6 | RTE_PTYPE_L4_FRAG;
127                 break;
128         case DPAA_PKT_TYPE_IPV4_EXT:
129                 m->packet_type = RTE_PTYPE_L2_ETHER |
130                         RTE_PTYPE_L3_IPV4_EXT;
131                 break;
132         case DPAA_PKT_TYPE_IPV6_EXT:
133                 m->packet_type = RTE_PTYPE_L2_ETHER |
134                         RTE_PTYPE_L3_IPV6_EXT;
135                 break;
136         case DPAA_PKT_TYPE_IPV4_TCP:
137                 m->packet_type = RTE_PTYPE_L2_ETHER |
138                         RTE_PTYPE_L3_IPV4 | RTE_PTYPE_L4_TCP;
139                 break;
140         case DPAA_PKT_TYPE_IPV6_TCP:
141                 m->packet_type = RTE_PTYPE_L2_ETHER |
142                         RTE_PTYPE_L3_IPV6 | RTE_PTYPE_L4_TCP;
143                 break;
144         case DPAA_PKT_TYPE_IPV4_UDP:
145                 m->packet_type = RTE_PTYPE_L2_ETHER |
146                         RTE_PTYPE_L3_IPV4 | RTE_PTYPE_L4_UDP;
147                 break;
148         case DPAA_PKT_TYPE_IPV6_UDP:
149                 m->packet_type = RTE_PTYPE_L2_ETHER |
150                         RTE_PTYPE_L3_IPV6 | RTE_PTYPE_L4_UDP;
151                 break;
152         case DPAA_PKT_TYPE_IPV4_EXT_UDP:
153                 m->packet_type = RTE_PTYPE_L2_ETHER |
154                         RTE_PTYPE_L3_IPV4_EXT | RTE_PTYPE_L4_UDP;
155                 break;
156         case DPAA_PKT_TYPE_IPV6_EXT_UDP:
157                 m->packet_type = RTE_PTYPE_L2_ETHER |
158                         RTE_PTYPE_L3_IPV6_EXT | RTE_PTYPE_L4_UDP;
159                 break;
160         case DPAA_PKT_TYPE_IPV4_EXT_TCP:
161                 m->packet_type = RTE_PTYPE_L2_ETHER |
162                         RTE_PTYPE_L3_IPV4_EXT | RTE_PTYPE_L4_TCP;
163                 break;
164         case DPAA_PKT_TYPE_IPV6_EXT_TCP:
165                 m->packet_type = RTE_PTYPE_L2_ETHER |
166                         RTE_PTYPE_L3_IPV6_EXT | RTE_PTYPE_L4_TCP;
167                 break;
168         case DPAA_PKT_TYPE_IPV4_SCTP:
169                 m->packet_type = RTE_PTYPE_L2_ETHER |
170                         RTE_PTYPE_L3_IPV4 | RTE_PTYPE_L4_SCTP;
171                 break;
172         case DPAA_PKT_TYPE_IPV6_SCTP:
173                 m->packet_type = RTE_PTYPE_L2_ETHER |
174                         RTE_PTYPE_L3_IPV6 | RTE_PTYPE_L4_SCTP;
175                 break;
176         /* More switch cases can be added */
177         default:
178                 dpaa_slow_parsing(m, prs);
179         }
180
181         m->tx_offload = annot->parse.ip_off[0];
182         m->tx_offload |= (annot->parse.l4_off - annot->parse.ip_off[0])
183                                         << DPAA_PKT_L3_LEN_SHIFT;
184
185         /* Set the hash values */
186         m->hash.rss = (uint32_t)(rte_be_to_cpu_64(annot->hash));
187         m->ol_flags = PKT_RX_RSS_HASH;
188         /* All packets with Bad checksum are dropped by interface (and
189          * corresponding notification issued to RX error queues).
190          */
191         m->ol_flags |= PKT_RX_IP_CKSUM_GOOD;
192
193         /* Check if Vlan is present */
194         if (prs & DPAA_PARSE_VLAN_MASK)
195                 m->ol_flags |= PKT_RX_VLAN;
196         /* Packet received without stripping the vlan */
197 }
198
199 static inline void dpaa_checksum(struct rte_mbuf *mbuf)
200 {
201         struct ether_hdr *eth_hdr = rte_pktmbuf_mtod(mbuf, struct ether_hdr *);
202         char *l3_hdr = (char *)eth_hdr + mbuf->l2_len;
203         struct ipv4_hdr *ipv4_hdr = (struct ipv4_hdr *)l3_hdr;
204         struct ipv6_hdr *ipv6_hdr = (struct ipv6_hdr *)l3_hdr;
205
206         DPAA_DP_LOG(DEBUG, "Calculating checksum for mbuf: %p", mbuf);
207
208         if (((mbuf->packet_type & RTE_PTYPE_L3_MASK) == RTE_PTYPE_L3_IPV4) ||
209             ((mbuf->packet_type & RTE_PTYPE_L3_MASK) ==
210             RTE_PTYPE_L3_IPV4_EXT)) {
211                 ipv4_hdr = (struct ipv4_hdr *)l3_hdr;
212                 ipv4_hdr->hdr_checksum = 0;
213                 ipv4_hdr->hdr_checksum = rte_ipv4_cksum(ipv4_hdr);
214         } else if (((mbuf->packet_type & RTE_PTYPE_L3_MASK) ==
215                    RTE_PTYPE_L3_IPV6) ||
216                    ((mbuf->packet_type & RTE_PTYPE_L3_MASK) ==
217                    RTE_PTYPE_L3_IPV6_EXT))
218                 ipv6_hdr = (struct ipv6_hdr *)l3_hdr;
219
220         if ((mbuf->packet_type & RTE_PTYPE_L4_MASK) == RTE_PTYPE_L4_TCP) {
221                 struct tcp_hdr *tcp_hdr = (struct tcp_hdr *)(l3_hdr +
222                                           mbuf->l3_len);
223                 tcp_hdr->cksum = 0;
224                 if (eth_hdr->ether_type == htons(ETHER_TYPE_IPv4))
225                         tcp_hdr->cksum = rte_ipv4_udptcp_cksum(ipv4_hdr,
226                                                                tcp_hdr);
227                 else /* assume ethertype == ETHER_TYPE_IPv6 */
228                         tcp_hdr->cksum = rte_ipv6_udptcp_cksum(ipv6_hdr,
229                                                                tcp_hdr);
230         } else if ((mbuf->packet_type & RTE_PTYPE_L4_MASK) ==
231                    RTE_PTYPE_L4_UDP) {
232                 struct udp_hdr *udp_hdr = (struct udp_hdr *)(l3_hdr +
233                                                              mbuf->l3_len);
234                 udp_hdr->dgram_cksum = 0;
235                 if (eth_hdr->ether_type == htons(ETHER_TYPE_IPv4))
236                         udp_hdr->dgram_cksum = rte_ipv4_udptcp_cksum(ipv4_hdr,
237                                                                      udp_hdr);
238                 else /* assume ethertype == ETHER_TYPE_IPv6 */
239                         udp_hdr->dgram_cksum = rte_ipv6_udptcp_cksum(ipv6_hdr,
240                                                                      udp_hdr);
241         }
242 }
243
244 static inline void dpaa_checksum_offload(struct rte_mbuf *mbuf,
245                                          struct qm_fd *fd, char *prs_buf)
246 {
247         struct dpaa_eth_parse_results_t *prs;
248
249         DPAA_DP_LOG(DEBUG, " Offloading checksum for mbuf: %p", mbuf);
250
251         prs = GET_TX_PRS(prs_buf);
252         prs->l3r = 0;
253         prs->l4r = 0;
254         if (((mbuf->packet_type & RTE_PTYPE_L3_MASK) == RTE_PTYPE_L3_IPV4) ||
255            ((mbuf->packet_type & RTE_PTYPE_L3_MASK) ==
256            RTE_PTYPE_L3_IPV4_EXT))
257                 prs->l3r = DPAA_L3_PARSE_RESULT_IPV4;
258         else if (((mbuf->packet_type & RTE_PTYPE_L3_MASK) ==
259                    RTE_PTYPE_L3_IPV6) ||
260                  ((mbuf->packet_type & RTE_PTYPE_L3_MASK) ==
261                 RTE_PTYPE_L3_IPV6_EXT))
262                 prs->l3r = DPAA_L3_PARSE_RESULT_IPV6;
263
264         if ((mbuf->packet_type & RTE_PTYPE_L4_MASK) == RTE_PTYPE_L4_TCP)
265                 prs->l4r = DPAA_L4_PARSE_RESULT_TCP;
266         else if ((mbuf->packet_type & RTE_PTYPE_L4_MASK) == RTE_PTYPE_L4_UDP)
267                 prs->l4r = DPAA_L4_PARSE_RESULT_UDP;
268
269         prs->ip_off[0] = mbuf->l2_len;
270         prs->l4_off = mbuf->l3_len + mbuf->l2_len;
271         /* Enable L3 (and L4, if TCP or UDP) HW checksum*/
272         fd->cmd = DPAA_FD_CMD_RPD | DPAA_FD_CMD_DTC;
273 }
274
275 static inline void
276 dpaa_unsegmented_checksum(struct rte_mbuf *mbuf, struct qm_fd *fd_arr)
277 {
278         if (!mbuf->packet_type) {
279                 struct rte_net_hdr_lens hdr_lens;
280
281                 mbuf->packet_type = rte_net_get_ptype(mbuf, &hdr_lens,
282                                 RTE_PTYPE_L2_MASK | RTE_PTYPE_L3_MASK
283                                 | RTE_PTYPE_L4_MASK);
284                 mbuf->l2_len = hdr_lens.l2_len;
285                 mbuf->l3_len = hdr_lens.l3_len;
286         }
287         if (mbuf->data_off < (DEFAULT_TX_ICEOF +
288             sizeof(struct dpaa_eth_parse_results_t))) {
289                 DPAA_DP_LOG(DEBUG, "Checksum offload Err: "
290                         "Not enough Headroom "
291                         "space for correct Checksum offload."
292                         "So Calculating checksum in Software.");
293                 dpaa_checksum(mbuf);
294         } else {
295                 dpaa_checksum_offload(mbuf, fd_arr, mbuf->buf_addr);
296         }
297 }
298
299 struct rte_mbuf *
300 dpaa_eth_sg_to_mbuf(struct qm_fd *fd, uint32_t ifid)
301 {
302         struct dpaa_bp_info *bp_info = DPAA_BPID_TO_POOL_INFO(fd->bpid);
303         struct rte_mbuf *first_seg, *prev_seg, *cur_seg, *temp;
304         struct qm_sg_entry *sgt, *sg_temp;
305         void *vaddr, *sg_vaddr;
306         int i = 0;
307         uint8_t fd_offset = fd->offset;
308
309         DPAA_DP_LOG(DEBUG, "Received an SG frame");
310
311         vaddr = rte_dpaa_mem_ptov(qm_fd_addr(fd));
312         if (!vaddr) {
313                 DPAA_PMD_ERR("unable to convert physical address");
314                 return NULL;
315         }
316         sgt = vaddr + fd_offset;
317         sg_temp = &sgt[i++];
318         hw_sg_to_cpu(sg_temp);
319         temp = (struct rte_mbuf *)((char *)vaddr - bp_info->meta_data_size);
320         sg_vaddr = rte_dpaa_mem_ptov(qm_sg_entry_get64(sg_temp));
321
322         first_seg = (struct rte_mbuf *)((char *)sg_vaddr -
323                                                 bp_info->meta_data_size);
324         first_seg->data_off = sg_temp->offset;
325         first_seg->data_len = sg_temp->length;
326         first_seg->pkt_len = sg_temp->length;
327         rte_mbuf_refcnt_set(first_seg, 1);
328
329         first_seg->port = ifid;
330         first_seg->nb_segs = 1;
331         first_seg->ol_flags = 0;
332         prev_seg = first_seg;
333         while (i < DPAA_SGT_MAX_ENTRIES) {
334                 sg_temp = &sgt[i++];
335                 hw_sg_to_cpu(sg_temp);
336                 sg_vaddr = rte_dpaa_mem_ptov(qm_sg_entry_get64(sg_temp));
337                 cur_seg = (struct rte_mbuf *)((char *)sg_vaddr -
338                                                       bp_info->meta_data_size);
339                 cur_seg->data_off = sg_temp->offset;
340                 cur_seg->data_len = sg_temp->length;
341                 first_seg->pkt_len += sg_temp->length;
342                 first_seg->nb_segs += 1;
343                 rte_mbuf_refcnt_set(cur_seg, 1);
344                 prev_seg->next = cur_seg;
345                 if (sg_temp->final) {
346                         cur_seg->next = NULL;
347                         break;
348                 }
349                 prev_seg = cur_seg;
350         }
351
352         dpaa_eth_packet_info(first_seg, (uint64_t)vaddr);
353         rte_pktmbuf_free_seg(temp);
354
355         return first_seg;
356 }
357
358 static inline struct rte_mbuf *dpaa_eth_fd_to_mbuf(struct qm_fd *fd,
359                                                         uint32_t ifid)
360 {
361         struct dpaa_bp_info *bp_info = DPAA_BPID_TO_POOL_INFO(fd->bpid);
362         struct rte_mbuf *mbuf;
363         void *ptr;
364         uint8_t format =
365                 (fd->opaque & DPAA_FD_FORMAT_MASK) >> DPAA_FD_FORMAT_SHIFT;
366         uint16_t offset =
367                 (fd->opaque & DPAA_FD_OFFSET_MASK) >> DPAA_FD_OFFSET_SHIFT;
368         uint32_t length = fd->opaque & DPAA_FD_LENGTH_MASK;
369
370         DPAA_DP_LOG(DEBUG, " FD--->MBUF");
371
372         if (unlikely(format == qm_fd_sg))
373                 return dpaa_eth_sg_to_mbuf(fd, ifid);
374
375         /* Ignoring case when format != qm_fd_contig */
376         dpaa_display_frame(fd);
377         ptr = rte_dpaa_mem_ptov(fd->addr);
378         /* Ignoring case when ptr would be NULL. That is only possible incase
379          * of a corrupted packet
380          */
381
382         mbuf = (struct rte_mbuf *)((char *)ptr - bp_info->meta_data_size);
383         /* Prefetch the Parse results and packet data to L1 */
384         rte_prefetch0((void *)((uint8_t *)ptr + DEFAULT_RX_ICEOF));
385         rte_prefetch0((void *)((uint8_t *)ptr + offset));
386
387         mbuf->data_off = offset;
388         mbuf->data_len = length;
389         mbuf->pkt_len = length;
390
391         mbuf->port = ifid;
392         mbuf->nb_segs = 1;
393         mbuf->ol_flags = 0;
394         mbuf->next = NULL;
395         rte_mbuf_refcnt_set(mbuf, 1);
396         dpaa_eth_packet_info(mbuf, (uint64_t)mbuf->buf_addr);
397
398         return mbuf;
399 }
400
401 uint16_t dpaa_eth_queue_rx(void *q,
402                            struct rte_mbuf **bufs,
403                            uint16_t nb_bufs)
404 {
405         struct qman_fq *fq = q;
406         struct qm_dqrr_entry *dq;
407         uint32_t num_rx = 0, ifid = ((struct dpaa_if *)fq->dpaa_intf)->ifid;
408         int ret;
409
410         ret = rte_dpaa_portal_init((void *)0);
411         if (ret) {
412                 DPAA_PMD_ERR("Failure in affining portal");
413                 return 0;
414         }
415
416         ret = qman_set_vdq(fq, (nb_bufs > DPAA_MAX_DEQUEUE_NUM_FRAMES) ?
417                                 DPAA_MAX_DEQUEUE_NUM_FRAMES : nb_bufs);
418         if (ret)
419                 return 0;
420
421         do {
422                 dq = qman_dequeue(fq);
423                 if (!dq)
424                         continue;
425                 bufs[num_rx++] = dpaa_eth_fd_to_mbuf(&dq->fd, ifid);
426                 qman_dqrr_consume(fq, dq);
427         } while (fq->flags & QMAN_FQ_STATE_VDQCR);
428
429         return num_rx;
430 }
431
432 static void *dpaa_get_pktbuf(struct dpaa_bp_info *bp_info)
433 {
434         int ret;
435         uint64_t buf = 0;
436         struct bm_buffer bufs;
437
438         ret = bman_acquire(bp_info->bp, &bufs, 1, 0);
439         if (ret <= 0) {
440                 DPAA_PMD_WARN("Failed to allocate buffers %d", ret);
441                 return (void *)buf;
442         }
443
444         DPAA_DP_LOG(DEBUG, "got buffer 0x%lx from pool %d",
445                     (uint64_t)bufs.addr, bufs.bpid);
446
447         buf = (uint64_t)rte_dpaa_mem_ptov(bufs.addr) - bp_info->meta_data_size;
448         if (!buf)
449                 goto out;
450
451 out:
452         return (void *)buf;
453 }
454
455 static struct rte_mbuf *dpaa_get_dmable_mbuf(struct rte_mbuf *mbuf,
456                                              struct dpaa_if *dpaa_intf)
457 {
458         struct rte_mbuf *dpaa_mbuf;
459
460         /* allocate pktbuffer on bpid for dpaa port */
461         dpaa_mbuf = dpaa_get_pktbuf(dpaa_intf->bp_info);
462         if (!dpaa_mbuf)
463                 return NULL;
464
465         memcpy((uint8_t *)(dpaa_mbuf->buf_addr) + mbuf->data_off, (void *)
466                 ((uint8_t *)(mbuf->buf_addr) + mbuf->data_off), mbuf->pkt_len);
467
468         /* Copy only the required fields */
469         dpaa_mbuf->data_off = mbuf->data_off;
470         dpaa_mbuf->pkt_len = mbuf->pkt_len;
471         dpaa_mbuf->ol_flags = mbuf->ol_flags;
472         dpaa_mbuf->packet_type = mbuf->packet_type;
473         dpaa_mbuf->tx_offload = mbuf->tx_offload;
474         rte_pktmbuf_free(mbuf);
475         return dpaa_mbuf;
476 }
477
478 int
479 dpaa_eth_mbuf_to_sg_fd(struct rte_mbuf *mbuf,
480                 struct qm_fd *fd,
481                 uint32_t bpid)
482 {
483         struct rte_mbuf *cur_seg = mbuf, *prev_seg = NULL;
484         struct dpaa_bp_info *bp_info = DPAA_BPID_TO_POOL_INFO(bpid);
485         struct rte_mbuf *temp, *mi;
486         struct qm_sg_entry *sg_temp, *sgt;
487         int i = 0;
488
489         DPAA_DP_LOG(DEBUG, "Creating SG FD to transmit");
490
491         temp = rte_pktmbuf_alloc(bp_info->mp);
492         if (!temp) {
493                 DPAA_PMD_ERR("Failure in allocation of mbuf");
494                 return -1;
495         }
496         if (temp->buf_len < ((mbuf->nb_segs * sizeof(struct qm_sg_entry))
497                                 + temp->data_off)) {
498                 DPAA_PMD_ERR("Insufficient space in mbuf for SG entries");
499                 return -1;
500         }
501
502         fd->cmd = 0;
503         fd->opaque_addr = 0;
504
505         if (mbuf->ol_flags & DPAA_TX_CKSUM_OFFLOAD_MASK) {
506                 if (!mbuf->packet_type) {
507                         struct rte_net_hdr_lens hdr_lens;
508
509                         mbuf->packet_type = rte_net_get_ptype(mbuf, &hdr_lens,
510                                         RTE_PTYPE_L2_MASK | RTE_PTYPE_L3_MASK
511                                         | RTE_PTYPE_L4_MASK);
512                         mbuf->l2_len = hdr_lens.l2_len;
513                         mbuf->l3_len = hdr_lens.l3_len;
514                 }
515                 if (temp->data_off < DEFAULT_TX_ICEOF
516                         + sizeof(struct dpaa_eth_parse_results_t))
517                         temp->data_off = DEFAULT_TX_ICEOF
518                                 + sizeof(struct dpaa_eth_parse_results_t);
519                 dcbz_64(temp->buf_addr);
520                 dpaa_checksum_offload(mbuf, fd, temp->buf_addr);
521         }
522
523         sgt = temp->buf_addr + temp->data_off;
524         fd->format = QM_FD_SG;
525         fd->addr = temp->buf_iova;
526         fd->offset = temp->data_off;
527         fd->bpid = bpid;
528         fd->length20 = mbuf->pkt_len;
529
530         while (i < DPAA_SGT_MAX_ENTRIES) {
531                 sg_temp = &sgt[i++];
532                 sg_temp->opaque = 0;
533                 sg_temp->val = 0;
534                 sg_temp->addr = cur_seg->buf_iova;
535                 sg_temp->offset = cur_seg->data_off;
536                 sg_temp->length = cur_seg->data_len;
537                 if (RTE_MBUF_DIRECT(cur_seg)) {
538                         if (rte_mbuf_refcnt_read(cur_seg) > 1) {
539                                 /*If refcnt > 1, invalid bpid is set to ensure
540                                  * buffer is not freed by HW.
541                                  */
542                                 sg_temp->bpid = 0xff;
543                                 rte_mbuf_refcnt_update(cur_seg, -1);
544                         } else {
545                                 sg_temp->bpid =
546                                         DPAA_MEMPOOL_TO_BPID(cur_seg->pool);
547                         }
548                         cur_seg = cur_seg->next;
549                 } else {
550                         /* Get owner MBUF from indirect buffer */
551                         mi = rte_mbuf_from_indirect(cur_seg);
552                         if (rte_mbuf_refcnt_read(mi) > 1) {
553                                 /*If refcnt > 1, invalid bpid is set to ensure
554                                  * owner buffer is not freed by HW.
555                                  */
556                                 sg_temp->bpid = 0xff;
557                         } else {
558                                 sg_temp->bpid = DPAA_MEMPOOL_TO_BPID(mi->pool);
559                                 rte_mbuf_refcnt_update(mi, 1);
560                         }
561                         prev_seg = cur_seg;
562                         cur_seg = cur_seg->next;
563                         prev_seg->next = NULL;
564                         rte_pktmbuf_free(prev_seg);
565                 }
566                 if (cur_seg == NULL) {
567                         sg_temp->final = 1;
568                         cpu_to_hw_sg(sg_temp);
569                         break;
570                 }
571                 cpu_to_hw_sg(sg_temp);
572         }
573         return 0;
574 }
575
576 /* Handle mbufs which are not segmented (non SG) */
577 static inline void
578 tx_on_dpaa_pool_unsegmented(struct rte_mbuf *mbuf,
579                             struct dpaa_bp_info *bp_info,
580                             struct qm_fd *fd_arr)
581 {
582         struct rte_mbuf *mi = NULL;
583
584         if (RTE_MBUF_DIRECT(mbuf)) {
585                 if (rte_mbuf_refcnt_read(mbuf) > 1) {
586                         /* In case of direct mbuf and mbuf being cloned,
587                          * BMAN should _not_ release buffer.
588                          */
589                         DPAA_MBUF_TO_CONTIG_FD(mbuf, fd_arr, 0xff);
590                         /* Buffer should be releasd by EAL */
591                         rte_mbuf_refcnt_update(mbuf, -1);
592                 } else {
593                         /* In case of direct mbuf and no cloning, mbuf can be
594                          * released by BMAN.
595                          */
596                         DPAA_MBUF_TO_CONTIG_FD(mbuf, fd_arr, bp_info->bpid);
597                 }
598         } else {
599                 /* This is data-containing core mbuf: 'mi' */
600                 mi = rte_mbuf_from_indirect(mbuf);
601                 if (rte_mbuf_refcnt_read(mi) > 1) {
602                         /* In case of indirect mbuf, and mbuf being cloned,
603                          * BMAN should _not_ release it and let EAL release
604                          * it through pktmbuf_free below.
605                          */
606                         DPAA_MBUF_TO_CONTIG_FD(mbuf, fd_arr, 0xff);
607                 } else {
608                         /* In case of indirect mbuf, and no cloning, core mbuf
609                          * should be released by BMAN.
610                          * Increate refcnt of core mbuf so that when
611                          * pktmbuf_free is called and mbuf is released, EAL
612                          * doesn't try to release core mbuf which would have
613                          * been released by BMAN.
614                          */
615                         rte_mbuf_refcnt_update(mi, 1);
616                         DPAA_MBUF_TO_CONTIG_FD(mbuf, fd_arr, bp_info->bpid);
617                 }
618                 rte_pktmbuf_free(mbuf);
619         }
620
621         if (mbuf->ol_flags & DPAA_TX_CKSUM_OFFLOAD_MASK)
622                 dpaa_unsegmented_checksum(mbuf, fd_arr);
623 }
624
625 /* Handle all mbufs on dpaa BMAN managed pool */
626 static inline uint16_t
627 tx_on_dpaa_pool(struct rte_mbuf *mbuf,
628                 struct dpaa_bp_info *bp_info,
629                 struct qm_fd *fd_arr)
630 {
631         DPAA_DP_LOG(DEBUG, "BMAN offloaded buffer, mbuf: %p", mbuf);
632
633         if (mbuf->nb_segs == 1) {
634                 /* Case for non-segmented buffers */
635                 tx_on_dpaa_pool_unsegmented(mbuf, bp_info, fd_arr);
636         } else if (mbuf->nb_segs > 1 &&
637                    mbuf->nb_segs <= DPAA_SGT_MAX_ENTRIES) {
638                 if (dpaa_eth_mbuf_to_sg_fd(mbuf, fd_arr, bp_info->bpid)) {
639                         DPAA_PMD_DEBUG("Unable to create Scatter Gather FD");
640                         return 1;
641                 }
642         } else {
643                 DPAA_PMD_DEBUG("Number of Segments not supported");
644                 return 1;
645         }
646
647         return 0;
648 }
649
650 /* Handle all mbufs on an external pool (non-dpaa) */
651 static inline uint16_t
652 tx_on_external_pool(struct qman_fq *txq, struct rte_mbuf *mbuf,
653                     struct qm_fd *fd_arr)
654 {
655         struct dpaa_if *dpaa_intf = txq->dpaa_intf;
656         struct rte_mbuf *dmable_mbuf;
657
658         DPAA_DP_LOG(DEBUG, "Non-BMAN offloaded buffer."
659                     "Allocating an offloaded buffer");
660         dmable_mbuf = dpaa_get_dmable_mbuf(mbuf, dpaa_intf);
661         if (!dmable_mbuf) {
662                 DPAA_DP_LOG(DEBUG, "no dpaa buffers.");
663                 return 1;
664         }
665
666         DPAA_MBUF_TO_CONTIG_FD(dmable_mbuf, fd_arr, dpaa_intf->bp_info->bpid);
667
668         return 0;
669 }
670
671 uint16_t
672 dpaa_eth_queue_tx(void *q, struct rte_mbuf **bufs, uint16_t nb_bufs)
673 {
674         struct rte_mbuf *mbuf, *mi = NULL;
675         struct rte_mempool *mp;
676         struct dpaa_bp_info *bp_info;
677         struct qm_fd fd_arr[DPAA_TX_BURST_SIZE];
678         uint32_t frames_to_send, loop, sent = 0;
679         uint16_t state;
680         int ret;
681
682         ret = rte_dpaa_portal_init((void *)0);
683         if (ret) {
684                 DPAA_PMD_ERR("Failure in affining portal");
685                 return 0;
686         }
687
688         DPAA_DP_LOG(DEBUG, "Transmitting %d buffers on queue: %p", nb_bufs, q);
689
690         while (nb_bufs) {
691                 frames_to_send = (nb_bufs > DPAA_TX_BURST_SIZE) ?
692                                 DPAA_TX_BURST_SIZE : nb_bufs;
693                 for (loop = 0; loop < frames_to_send; loop++) {
694                         mbuf = *(bufs++);
695                         if (likely(RTE_MBUF_DIRECT(mbuf))) {
696                                 mp = mbuf->pool;
697                                 bp_info = DPAA_MEMPOOL_TO_POOL_INFO(mp);
698                                 if (likely(mp->ops_index ==
699                                                 bp_info->dpaa_ops_index &&
700                                         mbuf->nb_segs == 1 &&
701                                         rte_mbuf_refcnt_read(mbuf) == 1)) {
702                                         DPAA_MBUF_TO_CONTIG_FD(mbuf,
703                                                 &fd_arr[loop], bp_info->bpid);
704                                         if (mbuf->ol_flags &
705                                                 DPAA_TX_CKSUM_OFFLOAD_MASK)
706                                                 dpaa_unsegmented_checksum(mbuf,
707                                                         &fd_arr[loop]);
708                                         continue;
709                                 }
710                         } else {
711                                 mi = rte_mbuf_from_indirect(mbuf);
712                                 mp = mi->pool;
713                         }
714
715                         bp_info = DPAA_MEMPOOL_TO_POOL_INFO(mp);
716                         if (likely(mp->ops_index == bp_info->dpaa_ops_index)) {
717                                 state = tx_on_dpaa_pool(mbuf, bp_info,
718                                                         &fd_arr[loop]);
719                                 if (unlikely(state)) {
720                                         /* Set frames_to_send & nb_bufs so
721                                          * that packets are transmitted till
722                                          * previous frame.
723                                          */
724                                         frames_to_send = loop;
725                                         nb_bufs = loop;
726                                         goto send_pkts;
727                                 }
728                         } else {
729                                 state = tx_on_external_pool(q, mbuf,
730                                                             &fd_arr[loop]);
731                                 if (unlikely(state)) {
732                                         /* Set frames_to_send & nb_bufs so
733                                          * that packets are transmitted till
734                                          * previous frame.
735                                          */
736                                         frames_to_send = loop;
737                                         nb_bufs = loop;
738                                         goto send_pkts;
739                                 }
740                         }
741                 }
742
743 send_pkts:
744                 loop = 0;
745                 while (loop < frames_to_send) {
746                         loop += qman_enqueue_multi(q, &fd_arr[loop],
747                                         frames_to_send - loop);
748                 }
749                 nb_bufs -= frames_to_send;
750                 sent += frames_to_send;
751         }
752
753         DPAA_DP_LOG(DEBUG, "Transmitted %d buffers on queue: %p", sent, q);
754
755         return sent;
756 }
757
758 uint16_t dpaa_eth_tx_drop_all(void *q  __rte_unused,
759                               struct rte_mbuf **bufs __rte_unused,
760                 uint16_t nb_bufs __rte_unused)
761 {
762         DPAA_DP_LOG(DEBUG, "Drop all packets");
763
764         /* Drop all incoming packets. No need to free packets here
765          * because the rte_eth f/w frees up the packets through tx_buffer
766          * callback in case this functions returns count less than nb_bufs
767          */
768         return 0;
769 }