net/dpaa2: support Tx confirmation mode
[dpdk.git] / drivers / net / dpaa2 / dpaa2_rxtx.c
index 816ea00..1c14b73 100644 (file)
@@ -1,7 +1,7 @@
 /* SPDX-License-Identifier: BSD-3-Clause
  *
  *   Copyright (c) 2016 Freescale Semiconductor, Inc. All rights reserved.
- *   Copyright 2016-2018 NXP
+ *   Copyright 2016-2019 NXP
  *
  */
 
@@ -370,8 +370,9 @@ eth_mbuf_to_sg_fd(struct rte_mbuf *mbuf,
        DPAA2_SET_FD_LEN(fd, mbuf->pkt_len);
        DPAA2_SET_ONLY_FD_BPID(fd, bpid);
        DPAA2_SET_FD_OFFSET(fd, temp->data_off);
-       DPAA2_SET_FD_ASAL(fd, DPAA2_ASAL_VAL);
        DPAA2_FD_SET_FORMAT(fd, qbman_fd_sg);
+       DPAA2_RESET_FD_FRC(fd);
+       DPAA2_RESET_FD_CTRL(fd);
        /*Set Scatter gather table and Scatter gather entries*/
        sgt = (struct qbman_sge *)(
                        (size_t)DPAA2_IOVA_TO_VADDR(DPAA2_GET_FD_ADDR(fd))
@@ -509,7 +510,7 @@ dpaa2_dev_prefetch_rx(void *queue, struct rte_mbuf **bufs, uint16_t nb_pkts)
        const struct qbman_fd *fd, *next_fd;
        struct qbman_pull_desc pulldesc;
        struct queue_storage_info_t *q_storage = dpaa2_q->q_storage;
-       struct rte_eth_dev *dev = dpaa2_q->dev;
+       struct rte_eth_dev_data *eth_data = dpaa2_q->eth_data;
 
        if (unlikely(!DPAA2_PER_LCORE_ETHRX_DPIO)) {
                ret = dpaa2_affine_qbman_ethrx_swp();
@@ -518,6 +519,11 @@ dpaa2_dev_prefetch_rx(void *queue, struct rte_mbuf **bufs, uint16_t nb_pkts)
                        return 0;
                }
        }
+
+       if (unlikely(!rte_dpaa2_bpid_info &&
+                    rte_eal_process_type() == RTE_PROC_SECONDARY))
+               rte_dpaa2_bpid_info = dpaa2_q->bp_array;
+
        swp = DPAA2_PER_LCORE_ETHRX_PORTAL;
        pull_size = (nb_pkts > dpaa2_dqrr_size) ? dpaa2_dqrr_size : nb_pkts;
        if (unlikely(!q_storage->active_dqs)) {
@@ -608,9 +614,10 @@ dpaa2_dev_prefetch_rx(void *queue, struct rte_mbuf **bufs, uint16_t nb_pkts)
                        bufs[num_rx] = eth_sg_fd_to_mbuf(fd);
                else
                        bufs[num_rx] = eth_fd_to_mbuf(fd);
-               bufs[num_rx]->port = dev->data->port_id;
+               bufs[num_rx]->port = eth_data->port_id;
 
-               if (dev->data->dev_conf.rxmode.offloads & DEV_RX_OFFLOAD_VLAN_STRIP)
+               if (eth_data->dev_conf.rxmode.offloads &
+                               DEV_RX_OFFLOAD_VLAN_STRIP)
                        rte_vlan_strip(bufs[num_rx]);
 
                dq_storage++;
@@ -693,6 +700,242 @@ dpaa2_dev_process_atomic_event(struct qbman_swp *swp __attribute__((unused)),
        DPAA2_PER_LCORE_DQRR_MBUF(dqrr_index) = ev->mbuf;
 }
 
+void __attribute__((hot))
+dpaa2_dev_process_ordered_event(struct qbman_swp *swp,
+                               const struct qbman_fd *fd,
+                               const struct qbman_result *dq,
+                               struct dpaa2_queue *rxq,
+                               struct rte_event *ev)
+{
+       /* Start fetching the data at FD address + PTA size + 16 early */
+       rte_prefetch0((void *)(size_t)(DPAA2_GET_FD_ADDR(fd) +
+               DPAA2_FD_PTA_SIZE + 16));
+
+       ev->event_type = RTE_EVENT_TYPE_ETHDEV;
+       ev->op = RTE_EVENT_OP_NEW;
+       ev->queue_id = rxq->ev.queue_id;
+       ev->flow_id = rxq->ev.flow_id;
+       ev->sub_event_type = rxq->ev.sub_event_type;
+       ev->sched_type = rxq->ev.sched_type;
+       ev->priority = rxq->ev.priority;
+       ev->mbuf = eth_fd_to_mbuf(fd);
+
+       /* seqn carries the ORP flag, ORP id and sequence number to Tx */
+       ev->mbuf->seqn = DPAA2_ENQUEUE_FLAG_ORP |
+               (qbman_result_DQ_odpid(dq) << DPAA2_EQCR_OPRID_SHIFT) |
+               (qbman_result_DQ_seqnum(dq) << DPAA2_EQCR_SEQNUM_SHIFT);
+       qbman_swp_dqrr_consume(swp, dq);
+}
+
+uint16_t
+dpaa2_dev_rx(void *queue, struct rte_mbuf **bufs, uint16_t nb_pkts)
+{
+       /* Dequeue up to nb_pkts frames from the FQ into bufs; returns count */
+       struct dpaa2_queue *dpaa2_q = (struct dpaa2_queue *)queue;
+       struct qbman_result *dq_storage;
+       uint32_t fqid = dpaa2_q->fqid;
+       int ret, num_rx = 0, next_pull = nb_pkts, num_pulled;
+       uint8_t pending, status;
+       struct qbman_swp *swp;
+       const struct qbman_fd *fd, *next_fd;
+       struct qbman_pull_desc pulldesc;
+       struct rte_eth_dev_data *eth_data = dpaa2_q->eth_data;
+
+       if (unlikely(!DPAA2_PER_LCORE_DPIO)) {
+               ret = dpaa2_affine_qbman_swp();
+               if (ret) {
+                       DPAA2_PMD_ERR("Failure in affining portal\n");
+                       return 0;
+               }
+       }
+       swp = DPAA2_PER_LCORE_PORTAL;
+
+       do {
+               dq_storage = dpaa2_q->q_storage->dq_storage[0];
+               qbman_pull_desc_clear(&pulldesc);
+               qbman_pull_desc_set_fq(&pulldesc, fqid);
+               qbman_pull_desc_set_storage(&pulldesc, dq_storage,
+                               (size_t)(DPAA2_VADDR_TO_IOVA(dq_storage)), 1);
+
+               if (next_pull > dpaa2_dqrr_size) {
+                       qbman_pull_desc_set_numframes(&pulldesc,
+                               dpaa2_dqrr_size);
+                       next_pull -= dpaa2_dqrr_size;
+               } else {
+                       qbman_pull_desc_set_numframes(&pulldesc, next_pull);
+                       next_pull = 0;
+               }
+
+               while (1) {
+                       if (qbman_swp_pull(swp, &pulldesc)) {
+                               DPAA2_PMD_DP_DEBUG(
+                                       "VDQ command is not issued.QBMAN is busy\n");
+                               /* Portal was busy, try again */
+                               continue;
+                       }
+                       break;
+               }
+
+               rte_prefetch0((void *)((size_t)(dq_storage + 1)));
+               /* Busy-wait until the pull command issued above has completed. */
+               while (!qbman_check_command_complete(dq_storage))
+                       ;
+
+               num_pulled = 0;
+               pending = 1;
+               do {
+                       /* Loop until the dq_storage is updated with
+                        * new token by QBMAN
+                        */
+                       while (!qbman_check_new_result(dq_storage))
+                               ;
+                       rte_prefetch0((void *)((size_t)(dq_storage + 2)));
+                       /* The pull-complete entry ends this VDQ, so stop
+                        * after it; it may not carry a valid frame.
+                        */
+                       if (qbman_result_DQ_is_pull_complete(dq_storage)) {
+                               pending = 0;
+                               /* Check for valid frame. */
+                               status = qbman_result_DQ_flags(dq_storage);
+                               if (unlikely((status &
+                                       QBMAN_DQ_STAT_VALIDFRAME) == 0))
+                                       continue;
+                       }
+                       fd = qbman_result_DQ_fd(dq_storage);
+
+                       next_fd = qbman_result_DQ_fd(dq_storage + 1);
+                       /* Prefetch Annotation address for the parse results */
+                       rte_prefetch0(
+                               (void *)(size_t)(DPAA2_GET_FD_ADDR(next_fd)
+                                       + DPAA2_FD_PTA_SIZE + 16));
+
+                       if (unlikely(DPAA2_FD_GET_FORMAT(fd) == qbman_fd_sg))
+                               bufs[num_rx] = eth_sg_fd_to_mbuf(fd);
+                       else
+                               bufs[num_rx] = eth_fd_to_mbuf(fd);
+                       bufs[num_rx]->port = eth_data->port_id;
+
+               if (eth_data->dev_conf.rxmode.offloads &
+                               DEV_RX_OFFLOAD_VLAN_STRIP) {
+                       rte_vlan_strip(bufs[num_rx]);
+               }
+
+                       dq_storage++;
+                       num_rx++;
+                       num_pulled++;
+               } while (pending);
+       /* Last VDQ provided all packets and more packets are requested */
+       } while (next_pull && num_pulled == dpaa2_dqrr_size);
+
+       dpaa2_q->rx_pkts += num_rx;
+
+       return num_rx;
+}
+
+uint16_t dpaa2_dev_tx_conf(void *queue)
+{
+       /* Drain Tx confirmations from the FQ and release their buffers */
+       struct dpaa2_queue *dpaa2_q = (struct dpaa2_queue *)queue;
+       struct qbman_result *dq_storage;
+       uint32_t fqid = dpaa2_q->fqid;
+       int ret, num_tx_conf = 0, num_pulled;
+       uint8_t pending, status;
+       struct qbman_swp *swp;
+       const struct qbman_fd *fd, *next_fd;
+       struct qbman_pull_desc pulldesc;
+       struct qbman_release_desc releasedesc;
+       uint32_t bpid;
+       uint64_t buf;
+
+       if (unlikely(!DPAA2_PER_LCORE_DPIO)) {
+               ret = dpaa2_affine_qbman_swp();
+               if (ret) {
+                       DPAA2_PMD_ERR("Failure in affining portal\n");
+                       return 0;
+               }
+       }
+       swp = DPAA2_PER_LCORE_PORTAL;
+
+       do {
+               dq_storage = dpaa2_q->q_storage->dq_storage[0];
+               qbman_pull_desc_clear(&pulldesc);
+               qbman_pull_desc_set_fq(&pulldesc, fqid);
+               qbman_pull_desc_set_storage(&pulldesc, dq_storage,
+                               (size_t)(DPAA2_VADDR_TO_IOVA(dq_storage)), 1);
+
+               qbman_pull_desc_set_numframes(&pulldesc, dpaa2_dqrr_size);
+
+               while (1) {
+                       if (qbman_swp_pull(swp, &pulldesc)) {
+                               DPAA2_PMD_DP_DEBUG("VDQ command is not issued."
+                                                  "QBMAN is busy\n");
+                               /* Portal was busy, try again */
+                               continue;
+                       }
+                       break;
+               }
+
+               rte_prefetch0((void *)((size_t)(dq_storage + 1)));
+               /* Busy-wait until the pull command issued above has completed. */
+               while (!qbman_check_command_complete(dq_storage))
+                       ;
+
+               num_pulled = 0;
+               pending = 1;
+               do {
+                       /* Loop until the dq_storage is updated with
+                        * new token by QBMAN
+                        */
+                       while (!qbman_check_new_result(dq_storage))
+                               ;
+                       rte_prefetch0((void *)((size_t)(dq_storage + 2)));
+                       /* The pull-complete entry ends this VDQ, so stop
+                        * after it; it may not carry a valid frame.
+                        */
+                       if (qbman_result_DQ_is_pull_complete(dq_storage)) {
+                               pending = 0;
+                               /* Check for valid frame. */
+                               status = qbman_result_DQ_flags(dq_storage);
+                               if (unlikely((status &
+                                       QBMAN_DQ_STAT_VALIDFRAME) == 0))
+                                       continue;
+                       }
+                       fd = qbman_result_DQ_fd(dq_storage);
+
+                       next_fd = qbman_result_DQ_fd(dq_storage + 1);
+                       /* Prefetch at the next FD's address + PTA size + 16 */
+                       rte_prefetch0((void *)(size_t)
+                               (DPAA2_GET_FD_ADDR(next_fd) +
+                                DPAA2_FD_PTA_SIZE + 16));
+
+                       bpid = DPAA2_GET_FD_BPID(fd);
+
+                       /* Create a release descriptor required for releasing
+                        * buffers into QBMAN
+                        */
+                       qbman_release_desc_clear(&releasedesc);
+                       qbman_release_desc_set_bpid(&releasedesc, bpid);
+
+                       buf = DPAA2_GET_FD_ADDR(fd);
+                       /* feed them to bman */
+                       do {
+                               ret = qbman_swp_release(swp, &releasedesc,
+                                                       &buf, 1);
+                       } while (ret == -EBUSY);
+
+                       dq_storage++;
+                       num_tx_conf++;
+                       num_pulled++;
+               } while (pending);
+
+       /* A full batch was dequeued, so the FQ may hold more: pull again */
+       } while (num_pulled == dpaa2_dqrr_size);
+
+       dpaa2_q->rx_pkts += num_tx_conf;
+
+       return num_tx_conf;
+}
+
 /*
  * Callback to handle sending packets through WRIOP based interface
  */
@@ -711,8 +954,8 @@ dpaa2_dev_tx(void *queue, struct rte_mbuf **bufs, uint16_t nb_pkts)
        struct qbman_swp *swp;
        uint16_t num_tx = 0;
        uint16_t bpid;
-       struct rte_eth_dev *dev = dpaa2_q->dev;
-       struct dpaa2_dev_priv *priv = dev->data->dev_private;
+       struct rte_eth_dev_data *eth_data = dpaa2_q->eth_data;
+       struct dpaa2_dev_priv *priv = eth_data->dev_private;
        uint32_t flags[MAX_TX_RING_SLOTS] = {0};
 
        if (unlikely(!DPAA2_PER_LCORE_DPIO)) {
@@ -724,13 +967,14 @@ dpaa2_dev_tx(void *queue, struct rte_mbuf **bufs, uint16_t nb_pkts)
        }
        swp = DPAA2_PER_LCORE_PORTAL;
 
-       DPAA2_PMD_DP_DEBUG("===> dev =%p, fqid =%d\n", dev, dpaa2_q->fqid);
+       DPAA2_PMD_DP_DEBUG("===> eth_data =%p, fqid =%d\n",
+                       eth_data, dpaa2_q->fqid);
 
        /*Prepare enqueue descriptor*/
        qbman_eq_desc_clear(&eqdesc);
        qbman_eq_desc_set_no_orp(&eqdesc, DPAA2_EQ_RESP_ERR_FQ);
-       qbman_eq_desc_set_qd(&eqdesc, priv->qdid,
-                            dpaa2_q->flow_id, dpaa2_q->tc_index);
+       qbman_eq_desc_set_fq(&eqdesc, dpaa2_q->fqid);
+
        /*Clear the unused FD fields before sending*/
        while (nb_pkts) {
                /*Check if the queue is congested*/
@@ -767,7 +1011,7 @@ dpaa2_dev_tx(void *queue, struct rte_mbuf **bufs, uint16_t nb_pkts)
                                    rte_mbuf_refcnt_read((*bufs)) == 1)) {
                                        if (unlikely(((*bufs)->ol_flags
                                                & PKT_TX_VLAN_PKT) ||
-                                               (dev->data->dev_conf.txmode.offloads
+                                               (eth_data->dev_conf.txmode.offloads
                                                & DEV_TX_OFFLOAD_VLAN_INSERT))) {
                                                ret = rte_vlan_insert(bufs);
                                                if (ret)
@@ -789,7 +1033,7 @@ dpaa2_dev_tx(void *queue, struct rte_mbuf **bufs, uint16_t nb_pkts)
                        }
 
                        if (unlikely(((*bufs)->ol_flags & PKT_TX_VLAN_PKT) ||
-                               (dev->data->dev_conf.txmode.offloads
+                               (eth_data->dev_conf.txmode.offloads
                                & DEV_TX_OFFLOAD_VLAN_INSERT))) {
                                int ret = rte_vlan_insert(bufs);
                                if (ret)
@@ -857,6 +1101,232 @@ skip_tx:
        return num_tx;
 }
 
+void
+dpaa2_dev_free_eqresp_buf(uint16_t eqresp_ci)
+{
+       /* Convert the FD stored in enqueue-response slot 'eqresp_ci' of the
+        * per-lcore DPIO device back to an mbuf and free that mbuf.
+        */
+       struct dpaa2_dpio_dev *portal = DPAA2_PER_LCORE_DPIO;
+
+       rte_pktmbuf_free(eth_fd_to_mbuf(
+               qbman_result_eqresp_fd(&portal->eqresp[eqresp_ci])));
+}
+
+static void
+dpaa2_set_enqueue_descriptor(struct dpaa2_queue *dpaa2_q,
+                            struct rte_mbuf *m,
+                            struct qbman_eq_desc *eqdesc)
+{
+       struct dpaa2_dev_priv *priv = dpaa2_q->eth_data->dev_private;
+       struct dpaa2_dpio_dev *portal = DPAA2_PER_LCORE_DPIO;
+       struct eqresp_metadata *meta;
+       uint16_t orp_id, seq_no;
+       uint8_t dqrr_idx;
+
+       qbman_eq_desc_set_fq(eqdesc, dpaa2_q->fqid);
+
+       if (!(m->seqn & DPAA2_ENQUEUE_FLAG_ORP)) {
+               /* No ORP flag: seqn is a held DQRR index + 1; use DCA */
+               dqrr_idx = m->seqn - 1;
+               qbman_eq_desc_set_dca(eqdesc, 1, dqrr_idx, 0);
+               DPAA2_PER_LCORE_DQRR_SIZE--;
+               DPAA2_PER_LCORE_DQRR_HELD &= ~(1 << dqrr_idx);
+               m->seqn = DPAA2_INVALID_MBUF_SEQN;
+               return;
+       }
+
+       orp_id = (m->seqn & DPAA2_EQCR_OPRID_MASK) >> DPAA2_EQCR_OPRID_SHIFT;
+       seq_no = (m->seqn & DPAA2_EQCR_SEQNUM_MASK) >> DPAA2_EQCR_SEQNUM_SHIFT;
+       m->seqn = DPAA2_INVALID_MBUF_SEQN;
+
+       if (priv->en_loose_ordered) {
+               qbman_eq_desc_set_orp(eqdesc, 0, orp_id, seq_no, 0);
+               return;
+       }
+
+       /* Strict ordering: ask for a response in the next eqresp slot */
+       qbman_eq_desc_set_orp(eqdesc, 1, orp_id, seq_no, 0);
+       qbman_eq_desc_set_response(eqdesc, (uint64_t)
+               DPAA2_VADDR_TO_IOVA(&portal->eqresp[portal->eqresp_pi]), 1);
+       qbman_eq_desc_set_token(eqdesc, 1);
+       meta = &portal->eqresp_meta[portal->eqresp_pi];
+       meta->dpaa2_q = dpaa2_q;
+       meta->mp = m->pool;
+       /* Advance the producer index, wrapping at MAX_EQ_RESP_ENTRIES */
+       if (portal->eqresp_pi + 1 < MAX_EQ_RESP_ENTRIES)
+               portal->eqresp_pi++;
+       else
+               portal->eqresp_pi = 0;
+}
+
+/* Callback to handle sending ordered packets through WRIOP based interface */
+uint16_t
+dpaa2_dev_tx_ordered(void *queue, struct rte_mbuf **bufs, uint16_t nb_pkts)
+{
+       /* Returns the number of frames enqueued, which may be < nb_pkts */
+       struct dpaa2_queue *dpaa2_q = (struct dpaa2_queue *)queue;
+       struct rte_eth_dev_data *eth_data = dpaa2_q->eth_data;
+       struct dpaa2_dev_priv *priv = eth_data->dev_private;
+       struct dpaa2_queue *order_sendq = (struct dpaa2_queue *)priv->tx_vq[0];
+       struct qbman_fd fd_arr[MAX_TX_RING_SLOTS];
+       struct rte_mbuf *mi;
+       struct rte_mempool *mp;
+       struct qbman_eq_desc eqdesc[MAX_TX_RING_SLOTS];
+       struct qbman_swp *swp;
+       uint32_t frames_to_send, num_free_eq_desc;
+       uint32_t loop, retry_count;
+       int32_t ret;
+       uint16_t num_tx = 0;
+       uint16_t bpid;
+
+       if (unlikely(!DPAA2_PER_LCORE_DPIO)) {
+               ret = dpaa2_affine_qbman_swp();
+               if (ret) {
+                       DPAA2_PMD_ERR("Failure in affining portal");
+                       return 0;
+               }
+       }
+       swp = DPAA2_PER_LCORE_PORTAL;
+
+       DPAA2_PMD_DP_DEBUG("===> eth_data =%p, fqid =%d\n",
+                          eth_data, dpaa2_q->fqid);
+
+       /* This would also handle normal and atomic queues as any type
+        * of packet can be enqueued when ordered queues are being used.
+        */
+       while (nb_pkts) {
+               /*Check if the queue is congested*/
+               retry_count = 0;
+               while (qbman_result_SCN_state(dpaa2_q->cscn)) {
+                       retry_count++;
+                       /* Retry for some time before giving up */
+                       if (retry_count > CONG_RETRY_COUNT)
+                               goto skip_tx;
+               }
+
+               frames_to_send = (nb_pkts > dpaa2_eqcr_size) ?
+                       dpaa2_eqcr_size : nb_pkts;
+
+               if (!priv->en_loose_ordered) {
+                       if ((*bufs)->seqn & DPAA2_ENQUEUE_FLAG_ORP) {
+                               num_free_eq_desc = dpaa2_free_eq_descriptors();
+                               if (num_free_eq_desc < frames_to_send)
+                                       frames_to_send = num_free_eq_desc;
+                       }
+               }
+
+               for (loop = 0; loop < frames_to_send; loop++) {
+                       /*Prepare enqueue descriptor*/
+                       qbman_eq_desc_clear(&eqdesc[loop]);
+
+                       if ((*bufs)->seqn) {
+                               /* Use only queue 0 for Tx in case of atomic/
+                                * ordered packets as packets can get unordered
+                                * when being transmitted out from the interface
+                                */
+                               dpaa2_set_enqueue_descriptor(order_sendq,
+                                                            (*bufs),
+                                                            &eqdesc[loop]);
+                       } else {
+                               qbman_eq_desc_set_no_orp(&eqdesc[loop],
+                                                        DPAA2_EQ_RESP_ERR_FQ);
+                               qbman_eq_desc_set_fq(&eqdesc[loop],
+                                                    dpaa2_q->fqid);
+                       }
+
+                       if (likely(RTE_MBUF_DIRECT(*bufs))) {
+                               mp = (*bufs)->pool;
+                               /* Check the basic scenario and set
+                                * the FD appropriately here itself.
+                                */
+                               if (likely(mp && mp->ops_index ==
+                                   priv->bp_list->dpaa2_ops_index &&
+                                   (*bufs)->nb_segs == 1 &&
+                                   rte_mbuf_refcnt_read((*bufs)) == 1)) {
+                                       if (unlikely((*bufs)->ol_flags
+                                               & PKT_TX_VLAN_PKT)) {
+                                         ret = rte_vlan_insert(bufs);
+                                         if (ret)
+                                               goto send_n_return;
+                                       }
+                                       DPAA2_MBUF_TO_CONTIG_FD((*bufs),
+                                               &fd_arr[loop],
+                                               mempool_to_bpid(mp));
+                                       bufs++;
+                                       continue;
+                               }
+                       } else {
+                               mi = rte_mbuf_from_indirect(*bufs);
+                               mp = mi->pool;
+                       }
+                       /* Not a hw_pkt pool allocated frame */
+                       if (unlikely(!mp || !priv->bp_list)) {
+                               DPAA2_PMD_ERR("Err: No buffer pool attached");
+                               goto send_n_return;
+                       }
+
+                       if (mp->ops_index != priv->bp_list->dpaa2_ops_index) {
+                               DPAA2_PMD_WARN("Non DPAA2 buffer pool");
+                               /* alloc should be from the default buffer pool
+                                * attached to this interface
+                                */
+                               bpid = priv->bp_list->buf_pool.bpid;
+
+                               if (unlikely((*bufs)->nb_segs > 1)) {
+                                       DPAA2_PMD_ERR(
+                                               "S/G not supp for non hw offload buffer");
+                                       goto send_n_return;
+                               }
+                               if (eth_copy_mbuf_to_fd(*bufs,
+                                                       &fd_arr[loop], bpid)) {
+                                       goto send_n_return;
+                               }
+                               /* free the original packet */
+                               rte_pktmbuf_free(*bufs);
+                       } else {
+                               bpid = mempool_to_bpid(mp);
+                               if (unlikely((*bufs)->nb_segs > 1)) {
+                                       if (eth_mbuf_to_sg_fd(*bufs,
+                                                             &fd_arr[loop],
+                                                             bpid))
+                                               goto send_n_return;
+                               } else {
+                                       eth_mbuf_to_fd(*bufs,
+                                                      &fd_arr[loop], bpid);
+                               }
+                       }
+                       bufs++;
+               }
+               loop = 0;
+               while (loop < frames_to_send) {
+                       loop += qbman_swp_enqueue_multiple_desc(swp,
+                                       &eqdesc[loop], &fd_arr[loop],
+                                       frames_to_send - loop);
+               }
+
+               num_tx += frames_to_send;
+               nb_pkts -= frames_to_send;
+       }
+       dpaa2_q->tx_pkts += num_tx;
+       return num_tx;
+
+send_n_return:
+       /* send the prepared fds, each with its own (matching) descriptor */
+       if (loop) {
+               unsigned int i = 0;
+
+               while (i < loop) {
+                       i += qbman_swp_enqueue_multiple_desc(swp, &eqdesc[i],
+                                                       &fd_arr[i], loop - i);
+               }
+               num_tx += loop;
+       }
+skip_tx:
+       dpaa2_q->tx_pkts += num_tx;
+       return num_tx;
+}
+
 /**
  * Dummy DPDK callback for TX.
  *
@@ -881,3 +1351,164 @@ dummy_dev_tx(void *queue, struct rte_mbuf **bufs, uint16_t nb_pkts)
        (void)nb_pkts;
        return 0;
 }
+
+#if defined(RTE_TOOLCHAIN_GCC)
+#pragma GCC diagnostic push
+#pragma GCC diagnostic ignored "-Wcast-qual"
+#elif defined(RTE_TOOLCHAIN_CLANG)
+#pragma clang diagnostic push
+#pragma clang diagnostic ignored "-Wcast-qual"
+#endif
+
+/* Loop back every received frame: re-enqueue it on the first Tx queue. */
+uint16_t
+dpaa2_dev_loopback_rx(void *queue,
+                     struct rte_mbuf **bufs __rte_unused,
+                     uint16_t nb_pkts)
+{
+       /* Frames are not handed to the caller: bufs is unused, returns 0 */
+       struct dpaa2_queue *dpaa2_q = (struct dpaa2_queue *)queue;
+       struct qbman_result *dq_storage, *dq_storage1 = NULL;
+       uint32_t fqid = dpaa2_q->fqid;
+       int ret, num_rx = 0, num_tx = 0, pull_size;
+       uint8_t pending, status;
+       struct qbman_swp *swp;
+       struct qbman_fd *fd[DPAA2_LX2_DQRR_RING_SIZE];
+       struct qbman_pull_desc pulldesc;
+       struct qbman_eq_desc eqdesc;
+       struct queue_storage_info_t *q_storage = dpaa2_q->q_storage;
+       struct rte_eth_dev_data *eth_data = dpaa2_q->eth_data;
+       struct dpaa2_dev_priv *priv = eth_data->dev_private;
+       struct dpaa2_queue *tx_q = priv->tx_vq[0];
+       /* todo - currently we are using 1st TX queue only for loopback*/
+
+       if (unlikely(!DPAA2_PER_LCORE_ETHRX_DPIO)) {
+               ret = dpaa2_affine_qbman_ethrx_swp();
+               if (ret) {
+                       DPAA2_PMD_ERR("Failure in affining portal");
+                       return 0;
+               }
+       }
+       swp = DPAA2_PER_LCORE_ETHRX_PORTAL;
+       pull_size = (nb_pkts > dpaa2_dqrr_size) ? dpaa2_dqrr_size : nb_pkts;
+       if (unlikely(!q_storage->active_dqs)) {
+               q_storage->toggle = 0;
+               dq_storage = q_storage->dq_storage[q_storage->toggle];
+               q_storage->last_num_pkts = pull_size;
+               qbman_pull_desc_clear(&pulldesc);
+               qbman_pull_desc_set_numframes(&pulldesc,
+                                             q_storage->last_num_pkts);
+               qbman_pull_desc_set_fq(&pulldesc, fqid);
+               qbman_pull_desc_set_storage(&pulldesc, dq_storage,
+                       (size_t)(DPAA2_VADDR_TO_IOVA(dq_storage)), 1);
+               if (check_swp_active_dqs(DPAA2_PER_LCORE_ETHRX_DPIO->index)) {
+                       while (!qbman_check_command_complete(
+                              get_swp_active_dqs(
+                              DPAA2_PER_LCORE_ETHRX_DPIO->index)))
+                               ;
+                       clear_swp_active_dqs(DPAA2_PER_LCORE_ETHRX_DPIO->index);
+               }
+               while (1) {
+                       if (qbman_swp_pull(swp, &pulldesc)) {
+                               DPAA2_PMD_DP_DEBUG(
+                                       "VDQ command not issued.QBMAN busy\n");
+                               /* Portal was busy, try again */
+                               continue;
+                       }
+                       break;
+               }
+               q_storage->active_dqs = dq_storage;
+               q_storage->active_dpio_id = DPAA2_PER_LCORE_ETHRX_DPIO->index;
+               set_swp_active_dqs(DPAA2_PER_LCORE_ETHRX_DPIO->index,
+                                  dq_storage);
+       }
+
+       dq_storage = q_storage->active_dqs;
+       rte_prefetch0((void *)(size_t)(dq_storage));
+       rte_prefetch0((void *)(size_t)(dq_storage + 1));
+
+       /* Prepare next pull descriptor. This will give space for the
+        * prefetching done on DQRR entries
+        */
+       q_storage->toggle ^= 1;
+       dq_storage1 = q_storage->dq_storage[q_storage->toggle];
+       qbman_pull_desc_clear(&pulldesc);
+       qbman_pull_desc_set_numframes(&pulldesc, pull_size);
+       qbman_pull_desc_set_fq(&pulldesc, fqid);
+       qbman_pull_desc_set_storage(&pulldesc, dq_storage1,
+               (size_t)(DPAA2_VADDR_TO_IOVA(dq_storage1)), 1);
+
+       /*Prepare enqueue descriptor*/
+       qbman_eq_desc_clear(&eqdesc);
+       qbman_eq_desc_set_no_orp(&eqdesc, DPAA2_EQ_RESP_ERR_FQ);
+       qbman_eq_desc_set_response(&eqdesc, 0, 0);
+       qbman_eq_desc_set_fq(&eqdesc, tx_q->fqid);
+
+       /* Check if the previous issued command is completed.
+        * Also seems like the SWP is shared between the Ethernet Driver
+        * and the SEC driver.
+        */
+       while (!qbman_check_command_complete(dq_storage))
+               ;
+       if (dq_storage == get_swp_active_dqs(q_storage->active_dpio_id))
+               clear_swp_active_dqs(q_storage->active_dpio_id);
+
+       pending = 1;
+
+       do {
+               /* Loop until the dq_storage is updated with
+                * new token by QBMAN
+                */
+               while (!qbman_check_new_result(dq_storage))
+                       ;
+               rte_prefetch0((void *)((size_t)(dq_storage + 2)));
+               /* The pull-complete entry ends this VDQ, so stop
+                * after it; it may not carry a valid frame.
+                */
+               if (qbman_result_DQ_is_pull_complete(dq_storage)) {
+                       pending = 0;
+                       /* Check for valid frame. */
+                       status = qbman_result_DQ_flags(dq_storage);
+                       if (unlikely((status & QBMAN_DQ_STAT_VALIDFRAME) == 0))
+                               continue;
+               }
+               fd[num_rx] = (struct qbman_fd *)qbman_result_DQ_fd(dq_storage);
+
+               dq_storage++;
+               num_rx++;
+       } while (pending);
+
+       while (num_tx < num_rx) {
+               num_tx += qbman_swp_enqueue_multiple_fd(swp, &eqdesc,
+                               &fd[num_tx], 0, num_rx - num_tx);
+       }
+
+       if (check_swp_active_dqs(DPAA2_PER_LCORE_ETHRX_DPIO->index)) {
+               while (!qbman_check_command_complete(
+                      get_swp_active_dqs(DPAA2_PER_LCORE_ETHRX_DPIO->index)))
+                       ;
+               clear_swp_active_dqs(DPAA2_PER_LCORE_ETHRX_DPIO->index);
+       }
+       /* issue a volatile dequeue command for next pull */
+       while (1) {
+               if (qbman_swp_pull(swp, &pulldesc)) {
+                       DPAA2_PMD_DP_DEBUG("VDQ command is not issued."
+                                         "QBMAN is busy (2)\n");
+                       continue;
+               }
+               break;
+       }
+       q_storage->active_dqs = dq_storage1;
+       q_storage->active_dpio_id = DPAA2_PER_LCORE_ETHRX_DPIO->index;
+       set_swp_active_dqs(DPAA2_PER_LCORE_ETHRX_DPIO->index, dq_storage1);
+
+       dpaa2_q->rx_pkts += num_rx;
+       dpaa2_q->tx_pkts += num_tx;
+
+       return 0;
+}
+#if defined(RTE_TOOLCHAIN_GCC)
+#pragma GCC diagnostic pop
+#elif defined(RTE_TOOLCHAIN_CLANG)
+#pragma clang diagnostic pop
+#endif