net/bnxt: remove references to Thor
diff --git a/drivers/net/bnxt/bnxt_rxr.c b/drivers/net/bnxt/bnxt_rxr.c
index ee1acb1..e9c4fff 100644
--- a/drivers/net/bnxt/bnxt_rxr.c
+++ b/drivers/net/bnxt/bnxt_rxr.c
@@ -12,6 +12,7 @@
 #include <rte_memory.h>
 
 #include "bnxt.h"
+#include "bnxt_reps.h"
 #include "bnxt_ring.h"
 #include "bnxt_rxr.h"
 #include "bnxt_rxq.h"
@@ -41,7 +42,7 @@ static inline int bnxt_alloc_rx_data(struct bnxt_rx_queue *rxq,
                                     uint16_t prod)
 {
        struct rx_prod_pkt_bd *rxbd = &rxr->rx_desc_ring[prod];
-       struct bnxt_sw_rx_bd *rx_buf = &rxr->rx_buf_ring[prod];
+       struct rte_mbuf **rx_buf = &rxr->rx_buf_ring[prod];
        struct rte_mbuf *mbuf;
 
        mbuf = __bnxt_alloc_rx_data(rxq->mb_pool);
@@ -50,7 +51,7 @@ static inline int bnxt_alloc_rx_data(struct bnxt_rx_queue *rxq,
                return -ENOMEM;
        }
 
-       rx_buf->mbuf = mbuf;
+       *rx_buf = mbuf;
        mbuf->data_off = RTE_PKTMBUF_HEADROOM;
 
        rxbd->address = rte_cpu_to_le_64(rte_mbuf_data_iova_default(mbuf));
@@ -63,7 +64,7 @@ static inline int bnxt_alloc_ag_data(struct bnxt_rx_queue *rxq,
                                     uint16_t prod)
 {
        struct rx_prod_pkt_bd *rxbd = &rxr->ag_desc_ring[prod];
-       struct bnxt_sw_rx_bd *rx_buf = &rxr->ag_buf_ring[prod];
+       struct rte_mbuf **rx_buf = &rxr->ag_buf_ring[prod];
        struct rte_mbuf *mbuf;
 
        if (rxbd == NULL) {
@@ -82,7 +83,7 @@ static inline int bnxt_alloc_ag_data(struct bnxt_rx_queue *rxq,
                return -ENOMEM;
        }
 
-       rx_buf->mbuf = mbuf;
+       *rx_buf = mbuf;
        mbuf->data_off = RTE_PKTMBUF_HEADROOM;
 
        rxbd->address = rte_cpu_to_le_64(rte_mbuf_data_iova_default(mbuf));
@@ -94,15 +95,15 @@ static inline void bnxt_reuse_rx_mbuf(struct bnxt_rx_ring_info *rxr,
                               struct rte_mbuf *mbuf)
 {
        uint16_t prod = RING_NEXT(rxr->rx_ring_struct, rxr->rx_prod);
-       struct bnxt_sw_rx_bd *prod_rx_buf;
+       struct rte_mbuf **prod_rx_buf;
        struct rx_prod_pkt_bd *prod_bd;
 
        prod_rx_buf = &rxr->rx_buf_ring[prod];
 
-       RTE_ASSERT(prod_rx_buf->mbuf == NULL);
+       RTE_ASSERT(*prod_rx_buf == NULL);
        RTE_ASSERT(mbuf != NULL);
 
-       prod_rx_buf->mbuf = mbuf;
+       *prod_rx_buf = mbuf;
 
        prod_bd = &rxr->rx_desc_ring[prod];
 
@@ -115,13 +116,14 @@ static inline
 struct rte_mbuf *bnxt_consume_rx_buf(struct bnxt_rx_ring_info *rxr,
                                     uint16_t cons)
 {
-       struct bnxt_sw_rx_bd *cons_rx_buf;
+       struct rte_mbuf **cons_rx_buf;
        struct rte_mbuf *mbuf;
 
        cons_rx_buf = &rxr->rx_buf_ring[cons];
-       RTE_ASSERT(cons_rx_buf->mbuf != NULL);
-       mbuf = cons_rx_buf->mbuf;
-       cons_rx_buf->mbuf = NULL;
+       RTE_ASSERT(*cons_rx_buf != NULL);
+       mbuf = *cons_rx_buf;
+       *cons_rx_buf = NULL;
+
        return mbuf;
 }
 
@@ -148,6 +150,7 @@ static void bnxt_tpa_start(struct bnxt_rx_queue *rxq,
        tpa_info->mbuf = mbuf;
        tpa_info->len = rte_le_to_cpu_32(tpa_start->len);
 
+       mbuf->data_off = RTE_PKTMBUF_HEADROOM;
        mbuf->nb_segs = 1;
        mbuf->next = NULL;
        mbuf->pkt_len = rte_le_to_cpu_32(tpa_start->len);
@@ -222,13 +225,13 @@ static int bnxt_rx_pages(struct bnxt_rx_queue *rxq,
        uint16_t cp_cons, ag_cons;
        struct rx_pkt_cmpl *rxcmp;
        struct rte_mbuf *last = mbuf;
-       bool is_thor_tpa = tpa_info && BNXT_CHIP_THOR(rxq->bp);
+       bool is_p5_tpa = tpa_info && BNXT_CHIP_P5(rxq->bp);
 
        for (i = 0; i < agg_buf; i++) {
-               struct bnxt_sw_rx_bd *ag_buf;
+               struct rte_mbuf **ag_buf;
                struct rte_mbuf *ag_mbuf;
 
-               if (is_thor_tpa) {
+               if (is_p5_tpa) {
                        rxcmp = (void *)&tpa_info->agg_arr[i];
                } else {
                        *tmp_raw_cons = NEXT_RAW_CMP(*tmp_raw_cons);
@@ -244,7 +247,7 @@ static int bnxt_rx_pages(struct bnxt_rx_queue *rxq,
                ag_cons = rxcmp->opaque;
                RTE_ASSERT(ag_cons <= rxr->ag_ring_struct->ring_mask);
                ag_buf = &rxr->ag_buf_ring[ag_cons];
-               ag_mbuf = ag_buf->mbuf;
+               ag_mbuf = *ag_buf;
                RTE_ASSERT(ag_mbuf != NULL);
 
                ag_mbuf->data_len = rte_le_to_cpu_16(rxcmp->len);
@@ -255,7 +258,7 @@ static int bnxt_rx_pages(struct bnxt_rx_queue *rxq,
                last->next = ag_mbuf;
                last = ag_mbuf;
 
-               ag_buf->mbuf = NULL;
+               *ag_buf = NULL;
 
                /*
                 * As aggregation buffer consumed out of order in TPA module,
@@ -282,7 +285,7 @@ static inline struct rte_mbuf *bnxt_tpa_end(
        uint8_t payload_offset;
        struct bnxt_tpa_info *tpa_info;
 
-       if (BNXT_CHIP_THOR(rxq->bp)) {
+       if (BNXT_CHIP_P5(rxq->bp)) {
                struct rx_tpa_v2_end_cmpl *th_tpa_end;
                struct rx_tpa_v2_end_cmpl_hi *th_tpa_end1;
 
@@ -303,7 +306,6 @@ static inline struct rte_mbuf *bnxt_tpa_end(
        mbuf = tpa_info->mbuf;
        RTE_ASSERT(mbuf != NULL);
 
-       rte_prefetch0(mbuf);
        if (agg_bufs) {
                bnxt_rx_pages(rxq, mbuf, raw_cp_cons, agg_bufs, tpa_info);
        }
@@ -320,71 +322,186 @@ static inline struct rte_mbuf *bnxt_tpa_end(
        return mbuf;
 }
 
+uint32_t bnxt_ptype_table[BNXT_PTYPE_TBL_DIM] __rte_cache_aligned;
+
+static void __rte_cold
+bnxt_init_ptype_table(void)
+{
+       uint32_t *pt = bnxt_ptype_table;
+       static bool initialized;
+       int ip6, tun, type;
+       uint32_t l3;
+       int i;
+
+       if (initialized)
+               return;
+
+       for (i = 0; i < BNXT_PTYPE_TBL_DIM; i++) {
+               if (i & (RX_PKT_CMPL_FLAGS2_META_FORMAT_VLAN >> 2))
+                       pt[i] = RTE_PTYPE_L2_ETHER_VLAN;
+               else
+                       pt[i] = RTE_PTYPE_L2_ETHER;
+
+               ip6 = i & (RX_PKT_CMPL_FLAGS2_IP_TYPE >> 7);
+               tun = i & (RX_PKT_CMPL_FLAGS2_T_IP_CS_CALC >> 2);
+               type = (i & 0x38) << 9;
+
+               if (!tun && !ip6)
+                       l3 = RTE_PTYPE_L3_IPV4_EXT_UNKNOWN;
+               else if (!tun && ip6)
+                       l3 = RTE_PTYPE_L3_IPV6_EXT_UNKNOWN;
+               else if (tun && !ip6)
+                       l3 = RTE_PTYPE_INNER_L3_IPV4_EXT_UNKNOWN;
+               else
+                       l3 = RTE_PTYPE_INNER_L3_IPV6_EXT_UNKNOWN;
+
+               switch (type) {
+               case RX_PKT_CMPL_FLAGS_ITYPE_ICMP:
+                       if (tun)
+                               pt[i] |= l3 | RTE_PTYPE_INNER_L4_ICMP;
+                       else
+                               pt[i] |= l3 | RTE_PTYPE_L4_ICMP;
+                       break;
+               case RX_PKT_CMPL_FLAGS_ITYPE_TCP:
+                       if (tun)
+                               pt[i] |= l3 | RTE_PTYPE_INNER_L4_TCP;
+                       else
+                               pt[i] |= l3 | RTE_PTYPE_L4_TCP;
+                       break;
+               case RX_PKT_CMPL_FLAGS_ITYPE_UDP:
+                       if (tun)
+                               pt[i] |= l3 | RTE_PTYPE_INNER_L4_UDP;
+                       else
+                               pt[i] |= l3 | RTE_PTYPE_L4_UDP;
+                       break;
+               case RX_PKT_CMPL_FLAGS_ITYPE_IP:
+                       pt[i] |= l3;
+                       break;
+               }
+       }
+       initialized = true;
+}
+
 static uint32_t
 bnxt_parse_pkt_type(struct rx_pkt_cmpl *rxcmp, struct rx_pkt_cmpl_hi *rxcmp1)
 {
-       uint32_t l3, pkt_type = 0;
-       uint32_t t_ipcs = 0, ip6 = 0, vlan = 0;
-       uint32_t flags_type;
-
-       vlan = !!(rxcmp1->flags2 &
-               rte_cpu_to_le_32(RX_PKT_CMPL_FLAGS2_META_FORMAT_VLAN));
-       pkt_type |= vlan ? RTE_PTYPE_L2_ETHER_VLAN : RTE_PTYPE_L2_ETHER;
-
-       t_ipcs = !!(rxcmp1->flags2 &
-               rte_cpu_to_le_32(RX_PKT_CMPL_FLAGS2_T_IP_CS_CALC));
-       ip6 = !!(rxcmp1->flags2 &
-                rte_cpu_to_le_32(RX_PKT_CMPL_FLAGS2_IP_TYPE));
-
-       flags_type = rxcmp->flags_type &
-               rte_cpu_to_le_32(RX_PKT_CMPL_FLAGS_ITYPE_MASK);
-
-       if (!t_ipcs && !ip6)
-               l3 = RTE_PTYPE_L3_IPV4_EXT_UNKNOWN;
-       else if (!t_ipcs && ip6)
-               l3 = RTE_PTYPE_L3_IPV6_EXT_UNKNOWN;
-       else if (t_ipcs && !ip6)
-               l3 = RTE_PTYPE_INNER_L3_IPV4_EXT_UNKNOWN;
-       else
-               l3 = RTE_PTYPE_INNER_L3_IPV6_EXT_UNKNOWN;
+       uint32_t flags_type, flags2;
+       uint8_t index;
 
-       switch (flags_type) {
-       case RTE_LE32(RX_PKT_CMPL_FLAGS_ITYPE_ICMP):
-               if (!t_ipcs)
-                       pkt_type |= l3 | RTE_PTYPE_L4_ICMP;
-               else
-                       pkt_type |= l3 | RTE_PTYPE_INNER_L4_ICMP;
-               break;
+       flags_type = rte_le_to_cpu_16(rxcmp->flags_type);
+       flags2 = rte_le_to_cpu_32(rxcmp1->flags2);
 
-       case RTE_LE32(RX_PKT_CMPL_FLAGS_ITYPE_TCP):
-               if (!t_ipcs)
-                       pkt_type |= l3 | RTE_PTYPE_L4_TCP;
-               else
-                       pkt_type |= l3 | RTE_PTYPE_INNER_L4_TCP;
-               break;
+       /*
+        * Index format:
+        *     bit 0: RX_PKT_CMPL_FLAGS2_T_IP_CS_CALC
+        *     bit 1: RX_PKT_CMPL_FLAGS2_IP_TYPE
+        *     bit 2: RX_PKT_CMPL_FLAGS2_META_FORMAT_VLAN
+        *     bits 3-6: RX_PKT_CMPL_FLAGS_ITYPE
+        */
+       index = ((flags_type & RX_PKT_CMPL_FLAGS_ITYPE_MASK) >> 9) |
+               ((flags2 & (RX_PKT_CMPL_FLAGS2_META_FORMAT_VLAN |
+                          RX_PKT_CMPL_FLAGS2_T_IP_CS_CALC)) >> 2) |
+               ((flags2 & RX_PKT_CMPL_FLAGS2_IP_TYPE) >> 7);
 
-       case RTE_LE32(RX_PKT_CMPL_FLAGS_ITYPE_UDP):
-               if (!t_ipcs)
-                       pkt_type |= l3 | RTE_PTYPE_L4_UDP;
-               else
-                       pkt_type |= l3 | RTE_PTYPE_INNER_L4_UDP;
-               break;
+       return bnxt_ptype_table[index];
+}
 
-       case RTE_LE32(RX_PKT_CMPL_FLAGS_ITYPE_IP):
-               pkt_type |= l3;
-               break;
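
For reference, a minimal standalone sketch of the index packing described in the comment above. This is not part of the patch; the helper name and the literal macro values are assumptions mirroring the completion-record layout in bnxt_hsi.h and should be verified against that header.

#include <stdint.h>

/* Assumed flag values (illustrative, not copied from bnxt_hsi.h). */
#define ITYPE_MASK		0xf000u	/* RX_PKT_CMPL_FLAGS_ITYPE_MASK, bits 12-15 */
#define META_FORMAT_VLAN	0x0010u	/* RX_PKT_CMPL_FLAGS2_META_FORMAT_VLAN */
#define T_IP_CS_CALC		0x0004u	/* RX_PKT_CMPL_FLAGS2_T_IP_CS_CALC */
#define IP_TYPE			0x0100u	/* RX_PKT_CMPL_FLAGS2_IP_TYPE */

/* Pack the completion flags into the 7-bit ptype table index:
 * bit 0 = tunnel, bit 1 = IPv6, bit 2 = VLAN, bits 3-6 = itype.
 */
static inline uint8_t
ptype_index(uint16_t flags_type, uint32_t flags2)
{
	return ((flags_type & ITYPE_MASK) >> 9) |
	       ((flags2 & (META_FORMAT_VLAN | T_IP_CS_CALC)) >> 2) |
	       ((flags2 & IP_TYPE) >> 7);
}

/* Worked example: a VLAN-tagged, tunneled IPv6 TCP completion (assuming the
 * TCP itype value of 2) gives index 0x17, for which bnxt_init_ptype_table()
 * stores RTE_PTYPE_L2_ETHER_VLAN | RTE_PTYPE_INNER_L3_IPV6_EXT_UNKNOWN |
 * RTE_PTYPE_INNER_L4_TCP.
 */
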
+uint32_t
+bnxt_ol_flags_table[BNXT_OL_FLAGS_TBL_DIM] __rte_cache_aligned;
+
+uint32_t
+bnxt_ol_flags_err_table[BNXT_OL_FLAGS_ERR_TBL_DIM] __rte_cache_aligned;
+
+static void __rte_cold
+bnxt_init_ol_flags_tables(void)
+{
+       static bool initialized;
+       uint32_t *pt;
+       int i;
+
+       if (initialized)
+               return;
+
+       /* Initialize ol_flags table. */
+       pt = bnxt_ol_flags_table;
+       for (i = 0; i < BNXT_OL_FLAGS_TBL_DIM; i++) {
+               pt[i] = 0;
+               if (i & RX_PKT_CMPL_FLAGS2_META_FORMAT_VLAN)
+                       pt[i] |= PKT_RX_VLAN | PKT_RX_VLAN_STRIPPED;
+
+               if (i & RX_PKT_CMPL_FLAGS2_IP_CS_CALC)
+                       pt[i] |= PKT_RX_IP_CKSUM_GOOD;
+
+               if (i & RX_PKT_CMPL_FLAGS2_L4_CS_CALC)
+                       pt[i] |= PKT_RX_L4_CKSUM_GOOD;
+
+               if (i & RX_PKT_CMPL_FLAGS2_T_L4_CS_CALC)
+                       pt[i] |= PKT_RX_OUTER_L4_CKSUM_GOOD;
+       }
+
+       /* Initialize checksum error table. */
+       pt = bnxt_ol_flags_err_table;
+       for (i = 0; i < BNXT_OL_FLAGS_ERR_TBL_DIM; i++) {
+               pt[i] = 0;
+               if (i & (RX_PKT_CMPL_ERRORS_IP_CS_ERROR >> 4))
+                       pt[i] |= PKT_RX_IP_CKSUM_BAD;
+
+               if (i & (RX_PKT_CMPL_ERRORS_L4_CS_ERROR >> 4))
+                       pt[i] |= PKT_RX_L4_CKSUM_BAD;
+
+               if (i & (RX_PKT_CMPL_ERRORS_T_IP_CS_ERROR >> 4))
+                       pt[i] |= PKT_RX_EIP_CKSUM_BAD;
+
+               if (i & (RX_PKT_CMPL_ERRORS_T_L4_CS_ERROR >> 4))
+                       pt[i] |= PKT_RX_OUTER_L4_CKSUM_BAD;
        }
 
-       return pkt_type;
+       initialized = true;
+}
+
+static void
+bnxt_set_ol_flags(struct rx_pkt_cmpl *rxcmp, struct rx_pkt_cmpl_hi *rxcmp1,
+                 struct rte_mbuf *mbuf)
+{
+       uint16_t flags_type, errors, flags;
+       uint64_t ol_flags;
+
+       flags_type = rte_le_to_cpu_16(rxcmp->flags_type);
+
+       flags = rte_le_to_cpu_32(rxcmp1->flags2) &
+                               (RX_PKT_CMPL_FLAGS2_IP_CS_CALC |
+                                RX_PKT_CMPL_FLAGS2_L4_CS_CALC |
+                                RX_PKT_CMPL_FLAGS2_T_IP_CS_CALC |
+                                RX_PKT_CMPL_FLAGS2_T_L4_CS_CALC |
+                                RX_PKT_CMPL_FLAGS2_META_FORMAT_VLAN);
+
+       errors = rte_le_to_cpu_16(rxcmp1->errors_v2) &
+                               (RX_PKT_CMPL_ERRORS_IP_CS_ERROR |
+                                RX_PKT_CMPL_ERRORS_L4_CS_ERROR |
+                                RX_PKT_CMPL_ERRORS_T_IP_CS_ERROR |
+                                RX_PKT_CMPL_ERRORS_T_L4_CS_ERROR);
+       errors = (errors >> 4) & flags;
+
+       ol_flags = bnxt_ol_flags_table[flags & ~errors];
+
+       if (errors)
+               ol_flags |= bnxt_ol_flags_err_table[errors];
+
+       if (flags_type & RX_PKT_CMPL_FLAGS_RSS_VALID) {
+               mbuf->hash.rss = rte_le_to_cpu_32(rxcmp->rss_hash);
+               ol_flags |= PKT_RX_RSS_HASH;
+       }
+
+       mbuf->ol_flags = ol_flags;
 }
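
A self-contained sketch of the lookups performed in bnxt_set_ol_flags() above, mainly to show why the right-shift by 4 lines up the checksum-error bits with the *_CS_CALC bits. It is not part of the patch; the helper name and the bit positions are assumptions mirroring bnxt_hsi.h (calc flags in bits 0-3 of flags2, VLAN in bit 4, matching error flags in bits 4-7 of errors_v2).

static uint64_t
example_ol_flags(uint32_t flags2, uint16_t errors_v2)
{
	uint16_t flags = flags2 & 0x1f;		/* CS_CALC bits plus VLAN bit */
	/* Keep only the four checksum-error bits, align them with the calc
	 * bits, and drop errors for checksums the hardware never computed.
	 */
	uint16_t errors = ((errors_v2 & 0xf0) >> 4) & flags;
	uint64_t ol = bnxt_ol_flags_table[flags & ~errors];	/* GOOD/VLAN flags */

	if (errors)
		ol |= bnxt_ol_flags_err_table[errors];		/* BAD flags */

	return ol;
}

For example, flags2 = IP_CS_CALC | L4_CS_CALC with only the L4 checksum-error bit set in errors_v2 yields errors = 0x2, so the result is PKT_RX_IP_CKSUM_GOOD | PKT_RX_L4_CKSUM_BAD.
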
 
 #ifdef RTE_LIBRTE_IEEE1588
 static void
-bnxt_get_rx_ts_thor(struct bnxt *bp, uint32_t rx_ts_cmpl)
+bnxt_get_rx_ts_p5(struct bnxt *bp, uint32_t rx_ts_cmpl)
 {
        uint64_t systime_cycles = 0;
 
-       if (!BNXT_CHIP_THOR(bp))
+       if (!BNXT_CHIP_P5(bp))
                return;
 
        /* On Thor, Rx timestamps are provided directly in the
@@ -402,9 +519,9 @@ bnxt_get_rx_ts_thor(struct bnxt *bp, uint32_t rx_ts_cmpl)
 }
 #endif
 
-static void
+static uint32_t
 bnxt_ulp_set_mark_in_mbuf(struct bnxt *bp, struct rx_pkt_cmpl_hi *rxcmp1,
-                         struct rte_mbuf *mbuf)
+                         struct rte_mbuf *mbuf, uint32_t *vfr_flag)
 {
        uint32_t cfa_code;
        uint32_t meta_fmt;
@@ -412,8 +529,12 @@ bnxt_ulp_set_mark_in_mbuf(struct bnxt *bp, struct rx_pkt_cmpl_hi *rxcmp1,
        bool gfid = false;
        uint32_t mark_id;
        uint32_t flags2;
+       uint32_t gfid_support = 0;
        int rc;
 
+       if (BNXT_GFID_ENABLED(bp))
+               gfid_support = 1;
+
        cfa_code = rte_le_to_cpu_16(rxcmp1->cfa_code);
        flags2 = rte_le_to_cpu_32(rxcmp1->flags2);
        meta = rte_le_to_cpu_32(rxcmp1->metadata);
@@ -427,8 +548,14 @@ bnxt_ulp_set_mark_in_mbuf(struct bnxt *bp, struct rx_pkt_cmpl_hi *rxcmp1,
 
        switch (meta_fmt) {
        case 0:
-               /* Not an LFID or GFID, a flush cmd. */
-               goto skip_mark;
+               if (gfid_support) {
+                       /* Not an LFID or GFID, a flush cmd. */
+                       goto skip_mark;
+               } else {
+                       /* LFID mode, no vlan scenario */
+                       gfid = false;
+               }
+               break;
        case 4:
        case 5:
                /*
@@ -437,13 +564,19 @@ bnxt_ulp_set_mark_in_mbuf(struct bnxt *bp, struct rx_pkt_cmpl_hi *rxcmp1,
                 * collisions with EEM.  Simply return without setting the mark
                 * in the mbuf.
                 */
-               if (BNXT_CFA_META_EM_TEST(meta))
-                       goto skip_mark;
-               /*
-                * It is a TCAM entry, so it is an LFID. The TCAM IDX and Mode
-                * can also be determined by decoding the meta_data.  We are not
-                * using these for now.
-                */
+               if (BNXT_CFA_META_EM_TEST(meta)) {
+                       /* This is EM hit {EM(1), GFID[27:16], 19'd0 or vtag } */
+                       gfid = true;
+                       meta >>= BNXT_RX_META_CFA_CODE_SHIFT;
+                       cfa_code |= meta << BNXT_CFA_CODE_META_SHIFT;
+               } else {
+                       /*
+                        * It is a TCAM entry, so it is an LFID.
+                        * The TCAM IDX and Mode can also be determined
+                        * by decoding the meta_data. We are not
+                        * using these for now.
+                        */
+               }
                break;
        case 6:
        case 7:
@@ -465,22 +598,25 @@ bnxt_ulp_set_mark_in_mbuf(struct bnxt *bp, struct rx_pkt_cmpl_hi *rxcmp1,
                break;
        }
 
-       if (cfa_code) {
-               rc = ulp_mark_db_mark_get(bp->ulp_ctx, gfid,
-                                         cfa_code, &mark_id);
-               if (!rc) {
-                       /* Got the mark, write it to the mbuf and return */
-                       mbuf->hash.fdir.hi = mark_id;
-                       mbuf->udata64 = (cfa_code & 0xffffffffull) << 32;
-                       mbuf->hash.fdir.id = rxcmp1->cfa_code;
-                       mbuf->ol_flags |= PKT_RX_FDIR | PKT_RX_FDIR_ID;
-                       return;
-               }
+       rc = ulp_mark_db_mark_get(bp->ulp_ctx, gfid,
+                                 cfa_code, vfr_flag, &mark_id);
+       if (!rc) {
+               /* VF to VFR Rx path. So, skip mark_id injection in mbuf */
+               if (vfr_flag && *vfr_flag)
+                       return mark_id;
+               /* Got the mark, write it to the mbuf and return */
+               mbuf->hash.fdir.hi = mark_id;
+               *bnxt_cfa_code_dynfield(mbuf) = cfa_code & 0xffffffffull;
+               mbuf->hash.fdir.id = rxcmp1->cfa_code;
+               mbuf->ol_flags |= PKT_RX_FDIR | PKT_RX_FDIR_ID;
+               return mark_id;
        }
 
 skip_mark:
        mbuf->hash.fdir.hi = 0;
        mbuf->hash.fdir.id = 0;
+
+       return 0;
 }
 
 void bnxt_set_mark_in_mbuf(struct bnxt *bp,
@@ -523,7 +659,7 @@ void bnxt_set_mark_in_mbuf(struct bnxt *bp,
 }
 
 static int bnxt_rx_pkt(struct rte_mbuf **rx_pkt,
-                           struct bnxt_rx_queue *rxq, uint32_t *raw_cons)
+                      struct bnxt_rx_queue *rxq, uint32_t *raw_cons)
 {
        struct bnxt_cp_ring_info *cpr = rxq->cp_ring;
        struct bnxt_rx_ring_info *rxr = rxq->rx_ring;
@@ -536,8 +672,7 @@ static int bnxt_rx_pkt(struct rte_mbuf **rx_pkt,
        int rc = 0;
        uint8_t agg_buf = 0;
        uint16_t cmp_type;
-       uint32_t flags2_f = 0;
-       uint16_t flags_type;
+       uint32_t vfr_flag = 0, mark_id = 0;
        struct bnxt *bp = rxq->bp;
 
        rxcmp = (struct rx_pkt_cmpl *)
@@ -598,87 +733,33 @@ static int bnxt_rx_pkt(struct rte_mbuf **rx_pkt,
        if (mbuf == NULL)
                return -EBUSY;
 
-       rte_prefetch0(mbuf);
-
        mbuf->data_off = RTE_PKTMBUF_HEADROOM;
        mbuf->nb_segs = 1;
        mbuf->next = NULL;
        mbuf->pkt_len = rxcmp->len;
        mbuf->data_len = mbuf->pkt_len;
        mbuf->port = rxq->port_id;
-       mbuf->ol_flags = 0;
 
-       flags_type = rte_le_to_cpu_16(rxcmp->flags_type);
-       if (flags_type & RX_PKT_CMPL_FLAGS_RSS_VALID) {
-               mbuf->hash.rss = rxcmp->rss_hash;
-               mbuf->ol_flags |= PKT_RX_RSS_HASH;
+       bnxt_set_ol_flags(rxcmp, rxcmp1, mbuf);
+
+#ifdef RTE_LIBRTE_IEEE1588
+       if (unlikely((rte_le_to_cpu_16(rxcmp->flags_type) &
+                     RX_PKT_CMPL_FLAGS_MASK) ==
+                     RX_PKT_CMPL_FLAGS_ITYPE_PTP_W_TIMESTAMP)) {
+               mbuf->ol_flags |= PKT_RX_IEEE1588_PTP | PKT_RX_IEEE1588_TMST;
+               bnxt_get_rx_ts_p5(rxq->bp, rxcmp1->reorder);
        }
+#endif
 
        if (BNXT_TRUFLOW_EN(bp))
-               bnxt_ulp_set_mark_in_mbuf(rxq->bp, rxcmp1, mbuf);
+               mark_id = bnxt_ulp_set_mark_in_mbuf(rxq->bp, rxcmp1, mbuf,
+                                                   &vfr_flag);
        else
                bnxt_set_mark_in_mbuf(rxq->bp, rxcmp1, mbuf);
 
-#ifdef RTE_LIBRTE_IEEE1588
-       if (unlikely((flags_type & RX_PKT_CMPL_FLAGS_MASK) ==
-                    RX_PKT_CMPL_FLAGS_ITYPE_PTP_W_TIMESTAMP)) {
-               mbuf->ol_flags |= PKT_RX_IEEE1588_PTP | PKT_RX_IEEE1588_TMST;
-               bnxt_get_rx_ts_thor(rxq->bp, rxcmp1->reorder);
-       }
-#endif
        if (agg_buf)
                bnxt_rx_pages(rxq, mbuf, &tmp_raw_cons, agg_buf, NULL);
 
-       if (rxcmp1->flags2 & RX_PKT_CMPL_FLAGS2_META_FORMAT_VLAN) {
-               mbuf->vlan_tci = rxcmp1->metadata &
-                       (RX_PKT_CMPL_METADATA_VID_MASK |
-                       RX_PKT_CMPL_METADATA_DE |
-                       RX_PKT_CMPL_METADATA_PRI_MASK);
-               mbuf->ol_flags |= PKT_RX_VLAN | PKT_RX_VLAN_STRIPPED;
-       }
-
-       flags2_f = flags2_0xf(rxcmp1);
-       /* IP Checksum */
-       if (likely(IS_IP_NONTUNNEL_PKT(flags2_f))) {
-               if (unlikely(RX_CMP_IP_CS_ERROR(rxcmp1)))
-                       mbuf->ol_flags |= PKT_RX_IP_CKSUM_BAD;
-               else if (unlikely(RX_CMP_IP_CS_UNKNOWN(rxcmp1)))
-                       mbuf->ol_flags |= PKT_RX_IP_CKSUM_UNKNOWN;
-               else
-                       mbuf->ol_flags |= PKT_RX_IP_CKSUM_GOOD;
-       } else if (IS_IP_TUNNEL_PKT(flags2_f)) {
-               if (unlikely(RX_CMP_IP_OUTER_CS_ERROR(rxcmp1) ||
-                            RX_CMP_IP_CS_ERROR(rxcmp1)))
-                       mbuf->ol_flags |= PKT_RX_IP_CKSUM_BAD;
-               else if (unlikely(RX_CMP_IP_CS_UNKNOWN(rxcmp1)))
-                       mbuf->ol_flags |= PKT_RX_IP_CKSUM_UNKNOWN;
-               else
-                       mbuf->ol_flags |= PKT_RX_IP_CKSUM_GOOD;
-       }
-
-       /* L4 Checksum */
-       if (likely(IS_L4_NONTUNNEL_PKT(flags2_f))) {
-               if (unlikely(RX_CMP_L4_INNER_CS_ERR2(rxcmp1)))
-                       mbuf->ol_flags |= PKT_RX_L4_CKSUM_BAD;
-               else
-                       mbuf->ol_flags |= PKT_RX_L4_CKSUM_GOOD;
-       } else if (IS_L4_TUNNEL_PKT(flags2_f)) {
-               if (unlikely(RX_CMP_L4_INNER_CS_ERR2(rxcmp1)))
-                       mbuf->ol_flags |= PKT_RX_L4_CKSUM_BAD;
-               else
-                       mbuf->ol_flags |= PKT_RX_L4_CKSUM_GOOD;
-               if (unlikely(RX_CMP_L4_OUTER_CS_ERR2(rxcmp1))) {
-                       mbuf->ol_flags |= PKT_RX_OUTER_L4_CKSUM_BAD;
-               } else if (unlikely(IS_L4_TUNNEL_PKT_ONLY_INNER_L4_CS
-                                   (flags2_f))) {
-                       mbuf->ol_flags |= PKT_RX_OUTER_L4_CKSUM_UNKNOWN;
-               } else {
-                       mbuf->ol_flags |= PKT_RX_OUTER_L4_CKSUM_GOOD;
-               }
-       } else if (unlikely(RX_CMP_L4_CS_UNKNOWN(rxcmp1))) {
-               mbuf->ol_flags |= PKT_RX_L4_CKSUM_UNKNOWN;
-       }
-
        mbuf->packet_type = bnxt_parse_pkt_type(rxcmp, rxcmp1);
 
 #ifdef BNXT_DEBUG
@@ -712,6 +793,19 @@ static int bnxt_rx_pkt(struct rte_mbuf **rx_pkt,
                goto rx;
        }
        rxr->rx_prod = prod;
+
+       if (BNXT_TRUFLOW_EN(bp) && (BNXT_VF_IS_TRUSTED(bp) || BNXT_PF(bp)) &&
+           vfr_flag) {
+               bnxt_vfr_recv(mark_id, rxq->queue_id, mbuf);
+               /* Now return an error so that nb_rx_pkts is not
+                * incremented.
+                * This packet was destined for the representor, so
+                * there is no need to count it here or to hand it to
+                * the parent Rx burst function.
+                */
+               rc = -ENODEV;
+               goto next_rx;
+       }
        /*
         * All MBUFs are allocated with the same size under DPDK,
         * no optimization for rx_copy_thresh
@@ -735,6 +829,7 @@ uint16_t bnxt_recv_pkts(void *rx_queue, struct rte_mbuf **rx_pkts,
        uint32_t raw_cons = cpr->cp_raw_cons;
        uint32_t cons;
        int nb_rx_pkts = 0;
+       int nb_rep_rx_pkts = 0;
        struct rx_pkt_cmpl *rxcmp;
        uint16_t prod = rxr->rx_prod;
        uint16_t ag_prod = rxr->ag_prod;
@@ -745,14 +840,30 @@ uint16_t bnxt_recv_pkts(void *rx_queue, struct rte_mbuf **rx_pkts,
                return 0;
 
        /* If Rx Q was stopped return */
-       if (unlikely(!rxq->rx_started ||
-                    !rte_spinlock_trylock(&rxq->lock)))
+       if (unlikely(!rxq->rx_started))
                return 0;
 
+#if defined(RTE_ARCH_X86) || defined(RTE_ARCH_ARM64)
+       /*
+        * Replenish buffers if needed when a transition has been made from
+        * vector- to non-vector- receive processing.
+        */
+       while (unlikely(rxq->rxrearm_nb)) {
+               if (!bnxt_alloc_rx_data(rxq, rxr, rxq->rxrearm_start)) {
+                       rxr->rx_prod = rxq->rxrearm_start;
+                       bnxt_db_write(&rxr->rx_db, rxr->rx_prod);
+                       rxq->rxrearm_start++;
+                       rxq->rxrearm_nb--;
+               } else {
+                       /* Retry allocation on next call. */
+                       break;
+               }
+       }
+#endif
+
        /* Handle RX burst request */
        while (1) {
                cons = RING_CMP(cpr->cp_ring_struct, raw_cons);
-               rte_prefetch0(&cpr->cp_desc_ring[cons]);
                rxcmp = (struct rx_pkt_cmpl *)&cpr->cp_desc_ring[cons];
 
                if (!CMP_VALID(rxcmp, raw_cons, cpr->cp_ring_struct))
@@ -768,6 +879,8 @@ uint16_t bnxt_recv_pkts(void *rx_queue, struct rte_mbuf **rx_pkts,
                                nb_rx_pkts++;
                        if (rc == -EBUSY)       /* partial completion */
                                break;
+                       if (rc == -ENODEV)      /* completion for representor */
+                               nb_rep_rx_pkts++;
                } else if (!BNXT_NUM_ASYNC_CPR(rxq->bp)) {
                        evt =
                        bnxt_event_hwrm_resp_handler(rxq->bp,
@@ -786,7 +899,7 @@ uint16_t bnxt_recv_pkts(void *rx_queue, struct rte_mbuf **rx_pkts,
        }
 
        cpr->cp_raw_cons = raw_cons;
-       if (!nb_rx_pkts && !evt) {
+       if (!nb_rx_pkts && !nb_rep_rx_pkts && !evt) {
                /*
                 * For PMD, there is no need to keep on pushing to REARM
                 * the doorbell if there are no new completions
@@ -810,10 +923,10 @@ uint16_t bnxt_recv_pkts(void *rx_queue, struct rte_mbuf **rx_pkts,
 
                for (; cnt;
                        i = RING_NEXT(rxr->rx_ring_struct, i), cnt--) {
-                       struct bnxt_sw_rx_bd *rx_buf = &rxr->rx_buf_ring[i];
+                       struct rte_mbuf **rx_buf = &rxr->rx_buf_ring[i];
 
                        /* Buffer already allocated for this index. */
-                       if (rx_buf->mbuf != NULL)
+                       if (*rx_buf != NULL && *rx_buf != &rxq->fake_mbuf)
                                continue;
 
                        /* This slot is empty. Alloc buffer for Rx */
@@ -828,8 +941,6 @@ uint16_t bnxt_recv_pkts(void *rx_queue, struct rte_mbuf **rx_pkts,
        }
 
 done:
-       rte_spinlock_unlock(&rxq->lock);
-
        return nb_rx_pkts;
 }
 
@@ -881,9 +992,12 @@ void bnxt_free_rx_rings(struct bnxt *bp)
 
 int bnxt_init_rx_ring_struct(struct bnxt_rx_queue *rxq, unsigned int socket_id)
 {
+       struct rte_eth_dev *eth_dev = rxq->bp->eth_dev;
+       struct rte_eth_rxmode *rxmode;
        struct bnxt_cp_ring_info *cpr;
        struct bnxt_rx_ring_info *rxr;
        struct bnxt_ring *ring;
+       bool use_agg_ring;
 
        rxq->rx_buf_size = BNXT_MAX_PKT_LEN + sizeof(struct rte_mbuf);
 
@@ -904,8 +1018,13 @@ int bnxt_init_rx_ring_struct(struct bnxt_rx_queue *rxq, unsigned int socket_id)
        ring->ring_mask = ring->ring_size - 1;
        ring->bd = (void *)rxr->rx_desc_ring;
        ring->bd_dma = rxr->rx_desc_mapping;
-       ring->vmem_size = ring->ring_size * sizeof(struct bnxt_sw_rx_bd);
+
+       /* Allocate extra rx ring entries for vector rx. */
+       ring->vmem_size = sizeof(struct rte_mbuf *) *
+                               (ring->ring_size + RTE_BNXT_DESCS_PER_LOOP);
+
        ring->vmem = (void **)&rxr->rx_buf_ring;
+       ring->fw_ring_id = INVALID_HW_RING_ID;
 
        cpr = rte_zmalloc_socket("bnxt_rx_ring",
                                 sizeof(struct bnxt_cp_ring_info),
@@ -920,13 +1039,28 @@ int bnxt_init_rx_ring_struct(struct bnxt_rx_queue *rxq, unsigned int socket_id)
        if (ring == NULL)
                return -ENOMEM;
        cpr->cp_ring_struct = ring;
-       ring->ring_size = rte_align32pow2(rxr->rx_ring_struct->ring_size *
-                                         (2 + AGG_RING_SIZE_FACTOR));
+
+       rxmode = &eth_dev->data->dev_conf.rxmode;
+       use_agg_ring = (rxmode->offloads & DEV_RX_OFFLOAD_SCATTER) ||
+                      (rxmode->offloads & DEV_RX_OFFLOAD_TCP_LRO) ||
+                      (rxmode->max_rx_pkt_len >
+                        (uint32_t)(rte_pktmbuf_data_room_size(rxq->mb_pool) -
+                                   RTE_PKTMBUF_HEADROOM));
+
+       /* Allocate two completion slots per entry in desc ring. */
+       ring->ring_size = rxr->rx_ring_struct->ring_size * 2;
+
+       /* Allocate additional slots if aggregation ring is in use. */
+       if (use_agg_ring)
+               ring->ring_size *= AGG_RING_SIZE_FACTOR;
+
+       ring->ring_size = rte_align32pow2(ring->ring_size);
        ring->ring_mask = ring->ring_size - 1;
        ring->bd = (void *)cpr->cp_desc_ring;
        ring->bd_dma = cpr->cp_desc_mapping;
        ring->vmem_size = 0;
        ring->vmem = NULL;
+       ring->fw_ring_id = INVALID_HW_RING_ID;
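
As a worked example of the completion-ring sizing above (a sketch, not part of the patch; the helper name is hypothetical, while AGG_RING_SIZE_FACTOR is the existing driver macro already used by the original sizing code): a 256-entry Rx ring without scatter or LRO gets a 512-entry completion ring, and a configuration that uses the aggregation ring multiplies that by AGG_RING_SIZE_FACTOR before rounding up to a power of two.

#include <stdbool.h>
#include <stdint.h>
#include <rte_common.h>	/* rte_align32pow2() */

/* Hypothetical helper mirroring the sizing rule above. */
static uint32_t
cp_ring_size(uint32_t rx_ring_size, bool use_agg_ring)
{
	/* Up to two completion records per received packet. */
	uint32_t size = rx_ring_size * 2;

	if (use_agg_ring)
		size *= AGG_RING_SIZE_FACTOR;	/* aggregation completions */

	return rte_align32pow2(size);
}
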
 
        /* Allocate Aggregator rings */
        ring = rte_zmalloc_socket("bnxt_rx_ring_struct",
@@ -940,8 +1074,9 @@ int bnxt_init_rx_ring_struct(struct bnxt_rx_queue *rxq, unsigned int socket_id)
        ring->ring_mask = ring->ring_size - 1;
        ring->bd = (void *)rxr->ag_desc_ring;
        ring->bd_dma = rxr->ag_desc_mapping;
-       ring->vmem_size = ring->ring_size * sizeof(struct bnxt_sw_rx_bd);
+       ring->vmem_size = ring->ring_size * sizeof(struct rte_mbuf *);
        ring->vmem = (void **)&rxr->ag_buf_ring;
+       ring->fw_ring_id = INVALID_HW_RING_ID;
 
        return 0;
 }
@@ -969,10 +1104,16 @@ int bnxt_init_one_rx_ring(struct bnxt_rx_queue *rxq)
        unsigned int i;
        uint16_t size;
 
+       /* Initialize packet type table. */
+       bnxt_init_ptype_table();
+
+       /* Initialize offload flags parsing table. */
+       bnxt_init_ol_flags_tables();
+
        size = rte_pktmbuf_data_room_size(rxq->mb_pool) - RTE_PKTMBUF_HEADROOM;
        size = RTE_MIN(BNXT_MAX_PKT_LEN, size);
 
-       type = RX_PROD_PKT_BD_TYPE_RX_PROD_PKT | RX_PROD_PKT_BD_FLAGS_EOP_PAD;
+       type = RX_PROD_PKT_BD_TYPE_RX_PROD_PKT;
 
        rxr = rxq->rx_ring;
        ring = rxr->rx_ring_struct;
@@ -980,7 +1121,7 @@ int bnxt_init_one_rx_ring(struct bnxt_rx_queue *rxq)
 
        prod = rxr->rx_prod;
        for (i = 0; i < ring->ring_size; i++) {
-               if (unlikely(!rxr->rx_buf_ring[i].mbuf)) {
+               if (unlikely(!rxr->rx_buf_ring[i])) {
                        if (bnxt_alloc_rx_data(rxq, rxr, prod) != 0) {
                                PMD_DRV_LOG(WARNING,
                                            "init'ed rx ring %d with %d/%d mbufs only\n",
@@ -992,13 +1133,19 @@ int bnxt_init_one_rx_ring(struct bnxt_rx_queue *rxq)
                prod = RING_NEXT(rxr->rx_ring_struct, prod);
        }
 
+       /* Initialize dummy mbuf pointers for vector mode rx. */
+       for (i = ring->ring_size;
+            i < ring->ring_size + RTE_BNXT_DESCS_PER_LOOP; i++) {
+               rxr->rx_buf_ring[i] = &rxq->fake_mbuf;
+       }
+
        ring = rxr->ag_ring_struct;
        type = RX_PROD_AGG_BD_TYPE_RX_PROD_AGG;
        bnxt_init_rxbds(ring, type, size);
        prod = rxr->ag_prod;
 
        for (i = 0; i < ring->ring_size; i++) {
-               if (unlikely(!rxr->ag_buf_ring[i].mbuf)) {
+               if (unlikely(!rxr->ag_buf_ring[i])) {
                        if (bnxt_alloc_ag_data(rxq, rxr, prod) != 0) {
                                PMD_DRV_LOG(WARNING,
                                            "init'ed AG ring %d with %d/%d mbufs only\n",