net/cnxk: support all multicast
diff --git a/drivers/net/cnxk/cnxk_ethdev.c b/drivers/net/cnxk/cnxk_ethdev.c
index 109fd35..516788c 100644
--- a/drivers/net/cnxk/cnxk_ethdev.c
+++ b/drivers/net/cnxk/cnxk_ethdev.c
@@ -37,8 +37,1083 @@ nix_get_speed_capa(struct cnxk_eth_dev *dev)
        return speed_capa;
 }
 
+static void
+nix_enable_mseg_on_jumbo(struct cnxk_eth_rxq_sp *rxq)
+{
+       struct rte_pktmbuf_pool_private *mbp_priv;
+       struct rte_eth_dev *eth_dev;
+       struct cnxk_eth_dev *dev;
+       uint32_t buffsz;
+
+       dev = rxq->dev;
+       eth_dev = dev->eth_dev;
+
+       /* Get rx buffer size */
+       mbp_priv = rte_mempool_get_priv(rxq->qconf.mp);
+       buffsz = mbp_priv->mbuf_data_room_size - RTE_PKTMBUF_HEADROOM;
+
+       if (eth_dev->data->dev_conf.rxmode.max_rx_pkt_len > buffsz) {
+               dev->rx_offloads |= DEV_RX_OFFLOAD_SCATTER;
+               dev->tx_offloads |= DEV_TX_OFFLOAD_MULTI_SEGS;
+       }
+}
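
For context, an application-side sketch (not part of this patch) of a jumbo-frame configuration that exceeds a typical 2 KB mempool data room and therefore triggers the scatter/multi-seg enablement above; the helper name, port id and queue counts are illustrative and the API is the DPDK 20.11-era one used throughout this file.

#include <rte_ethdev.h>

/* Hypothetical helper: configure one Rx/Tx queue pair for ~9 KB frames.
 * With a standard 2 KB data-room mempool, max_rx_pkt_len > buffsz, so
 * nix_enable_mseg_on_jumbo() enables Rx scatter and Tx multi-seg.
 */
static int
example_configure_jumbo(uint16_t port_id)
{
	struct rte_eth_conf conf = { 0 };

	conf.rxmode.max_rx_pkt_len = 9018;
	conf.rxmode.offloads = DEV_RX_OFFLOAD_JUMBO_FRAME;

	return rte_eth_dev_configure(port_id, 1, 1, &conf);
}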
+
+static int
+nix_recalc_mtu(struct rte_eth_dev *eth_dev)
+{
+       struct rte_eth_dev_data *data = eth_dev->data;
+       struct cnxk_eth_rxq_sp *rxq;
+       uint16_t mtu;
+       int rc;
+
+       rxq = ((struct cnxk_eth_rxq_sp *)data->rx_queues[0]) - 1;
+       /* Setup scatter mode if needed by jumbo */
+       nix_enable_mseg_on_jumbo(rxq);
+
+       /* Setup MTU based on max_rx_pkt_len */
+       mtu = data->dev_conf.rxmode.max_rx_pkt_len - CNXK_NIX_L2_OVERHEAD +
+                               CNXK_NIX_MAX_VTAG_ACT_SIZE;
+
+       rc = cnxk_nix_mtu_set(eth_dev, mtu);
+       if (rc)
+               plt_err("Failed to set default MTU size, rc=%d", rc);
+
+       return rc;
+}
+
+uint64_t
+cnxk_nix_rxq_mbuf_setup(struct cnxk_eth_dev *dev)
+{
+       uint16_t port_id = dev->eth_dev->data->port_id;
+       struct rte_mbuf mb_def;
+       uint64_t *tmp;
+
+       RTE_BUILD_BUG_ON(offsetof(struct rte_mbuf, data_off) % 8 != 0);
+       RTE_BUILD_BUG_ON(offsetof(struct rte_mbuf, refcnt) -
+                                offsetof(struct rte_mbuf, data_off) !=
+                        2);
+       RTE_BUILD_BUG_ON(offsetof(struct rte_mbuf, nb_segs) -
+                                offsetof(struct rte_mbuf, data_off) !=
+                        4);
+       RTE_BUILD_BUG_ON(offsetof(struct rte_mbuf, port) -
+                                offsetof(struct rte_mbuf, data_off) !=
+                        6);
+       mb_def.nb_segs = 1;
+       mb_def.data_off = RTE_PKTMBUF_HEADROOM;
+       mb_def.port = port_id;
+       rte_mbuf_refcnt_set(&mb_def, 1);
+
+       /* Prevent compiler reordering: rearm_data covers previous fields */
+       rte_compiler_barrier();
+       tmp = (uint64_t *)&mb_def.rearm_data;
+
+       return *tmp;
+}
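
The value returned above is the usual DPDK mbuf "rearm" trick: data_off, refcnt, nb_segs and port are packed into one 64-bit word (the build-time asserts pin their offsets) so a receive path can reinitialize all four with a single store. A minimal sketch of the consuming side, assuming only the standard rte_mbuf layout:

#include <rte_mbuf.h>

/* Illustrative consumer (not part of this patch): one 8-byte store at
 * rearm_data rewrites data_off, refcnt, nb_segs and port together.
 */
static inline void
example_mbuf_rearm(struct rte_mbuf *mbuf, uint64_t rearm_word)
{
	*(uint64_t *)&mbuf->rearm_data = rearm_word;
}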
+
+static inline uint8_t
+nix_sq_max_sqe_sz(struct cnxk_eth_dev *dev)
+{
+       /*
+        * A maximum of three segments can be supported with W8; choose
+        * NIX_MAXSQESZ_W16 for multi-segment offload.
+        */
+       if (dev->tx_offloads & DEV_TX_OFFLOAD_MULTI_SEGS)
+               return NIX_MAXSQESZ_W16;
+       else
+               return NIX_MAXSQESZ_W8;
+}
+
+int
+cnxk_nix_tx_queue_setup(struct rte_eth_dev *eth_dev, uint16_t qid,
+                       uint16_t nb_desc, uint16_t fp_tx_q_sz,
+                       const struct rte_eth_txconf *tx_conf)
+{
+       struct cnxk_eth_dev *dev = cnxk_eth_pmd_priv(eth_dev);
+       const struct eth_dev_ops *dev_ops = eth_dev->dev_ops;
+       struct cnxk_eth_txq_sp *txq_sp;
+       struct roc_nix_sq *sq;
+       size_t txq_sz;
+       int rc;
+
+       /* Free memory prior to re-allocation if needed. */
+       if (eth_dev->data->tx_queues[qid] != NULL) {
+               plt_nix_dbg("Freeing memory prior to re-allocation %d", qid);
+               dev_ops->tx_queue_release(eth_dev->data->tx_queues[qid]);
+               eth_dev->data->tx_queues[qid] = NULL;
+       }
+
+       /* Setup ROC SQ */
+       sq = &dev->sqs[qid];
+       sq->qid = qid;
+       sq->nb_desc = nb_desc;
+       sq->max_sqe_sz = nix_sq_max_sqe_sz(dev);
+
+       rc = roc_nix_sq_init(&dev->nix, sq);
+       if (rc) {
+               plt_err("Failed to init sq=%d, rc=%d", qid, rc);
+               return rc;
+       }
+
+       rc = -ENOMEM;
+       txq_sz = sizeof(struct cnxk_eth_txq_sp) + fp_tx_q_sz;
+       txq_sp = plt_zmalloc(txq_sz, PLT_CACHE_LINE_SIZE);
+       if (!txq_sp) {
+               plt_err("Failed to alloc tx queue mem");
+               rc |= roc_nix_sq_fini(sq);
+               return rc;
+       }
+
+       txq_sp->dev = dev;
+       txq_sp->qid = qid;
+       txq_sp->qconf.conf.tx = *tx_conf;
+       txq_sp->qconf.nb_desc = nb_desc;
+
+       plt_nix_dbg("sq=%d fc=%p offload=0x%" PRIx64 " lmt_addr=%p"
+                   " nb_sqb_bufs=%d sqes_per_sqb_log2=%d",
+                   qid, sq->fc, dev->tx_offloads, sq->lmt_addr,
+                   sq->nb_sqb_bufs, sq->sqes_per_sqb_log2);
+
+       /* Store start of fast path area */
+       eth_dev->data->tx_queues[qid] = txq_sp + 1;
+       eth_dev->data->tx_queue_state[qid] = RTE_ETH_QUEUE_STATE_STOPPED;
+       return 0;
+}
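
The pointer stored in tx_queues[qid] points just past the slow-path context ("txq_sp + 1"), so the release path can recover the context by stepping back one struct. The sketch below shows the conversion this layout implies; the real helper, cnxk_eth_txq_to_sp(), lives in the driver header and its exact definition is assumed here.

/* Assumed shape of the fast-path to slow-path conversion used by
 * cnxk_nix_tx_queue_release().
 */
static inline struct cnxk_eth_txq_sp *
example_txq_to_sp(void *txq)
{
	return ((struct cnxk_eth_txq_sp *)txq) - 1;
}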
+
+static void
+cnxk_nix_tx_queue_release(void *txq)
+{
+       struct cnxk_eth_txq_sp *txq_sp;
+       struct cnxk_eth_dev *dev;
+       struct roc_nix_sq *sq;
+       uint16_t qid;
+       int rc;
+
+       if (!txq)
+               return;
+
+       txq_sp = cnxk_eth_txq_to_sp(txq);
+       dev = txq_sp->dev;
+       qid = txq_sp->qid;
+
+       plt_nix_dbg("Releasing txq %u", qid);
+
+       /* Cleanup ROC SQ */
+       sq = &dev->sqs[qid];
+       rc = roc_nix_sq_fini(sq);
+       if (rc)
+               plt_err("Failed to cleanup sq, rc=%d", rc);
+
+       /* Finally free */
+       plt_free(txq_sp);
+}
+
+int
+cnxk_nix_rx_queue_setup(struct rte_eth_dev *eth_dev, uint16_t qid,
+                       uint16_t nb_desc, uint16_t fp_rx_q_sz,
+                       const struct rte_eth_rxconf *rx_conf,
+                       struct rte_mempool *mp)
+{
+       struct cnxk_eth_dev *dev = cnxk_eth_pmd_priv(eth_dev);
+       struct cnxk_eth_rxq_sp *rxq_sp;
+       struct rte_mempool_ops *ops;
+       const char *platform_ops;
+       struct roc_nix_rq *rq;
+       struct roc_nix_cq *cq;
+       uint16_t first_skip;
+       int rc = -EINVAL;
+       size_t rxq_sz;
+
+       /* Sanity checks */
+       if (rx_conf->rx_deferred_start == 1) {
+               plt_err("Deferred Rx start is not supported");
+               goto fail;
+       }
+
+       platform_ops = rte_mbuf_platform_mempool_ops();
+       /* This driver needs cnxk_npa mempool ops to work */
+       ops = rte_mempool_get_ops(mp->ops_index);
+       if (strncmp(ops->name, platform_ops, RTE_MEMPOOL_OPS_NAMESIZE)) {
+               plt_err("mempool ops should be of cnxk_npa type");
+               goto fail;
+       }
+
+       if (mp->pool_id == 0) {
+               plt_err("Invalid pool_id");
+               goto fail;
+       }
+
+       /* Free memory prior to re-allocation if needed */
+       if (eth_dev->data->rx_queues[qid] != NULL) {
+               const struct eth_dev_ops *dev_ops = eth_dev->dev_ops;
+
+               plt_nix_dbg("Freeing memory prior to re-allocation %d", qid);
+               dev_ops->rx_queue_release(eth_dev->data->rx_queues[qid]);
+               eth_dev->data->rx_queues[qid] = NULL;
+       }
+
+       /* Setup ROC CQ */
+       cq = &dev->cqs[qid];
+       cq->qid = qid;
+       cq->nb_desc = nb_desc;
+       rc = roc_nix_cq_init(&dev->nix, cq);
+       if (rc) {
+               plt_err("Failed to init roc cq for rq=%d, rc=%d", qid, rc);
+               goto fail;
+       }
+
+       /* Setup ROC RQ */
+       rq = &dev->rqs[qid];
+       rq->qid = qid;
+       rq->aura_handle = mp->pool_id;
+       rq->flow_tag_width = 32;
+       rq->sso_ena = false;
+
+       /* Calculate first mbuf skip */
+       first_skip = (sizeof(struct rte_mbuf));
+       first_skip += RTE_PKTMBUF_HEADROOM;
+       first_skip += rte_pktmbuf_priv_size(mp);
+       rq->first_skip = first_skip;
+       rq->later_skip = sizeof(struct rte_mbuf);
+       rq->lpb_size = mp->elt_size;
+
+       rc = roc_nix_rq_init(&dev->nix, rq, !!eth_dev->data->dev_started);
+       if (rc) {
+               plt_err("Failed to init roc rq for rq=%d, rc=%d", qid, rc);
+               goto cq_fini;
+       }
+
+       /* Allocate and setup fast path rx queue */
+       rc = -ENOMEM;
+       rxq_sz = sizeof(struct cnxk_eth_rxq_sp) + fp_rx_q_sz;
+       rxq_sp = plt_zmalloc(rxq_sz, PLT_CACHE_LINE_SIZE);
+       if (!rxq_sp) {
+               plt_err("Failed to alloc rx queue for rq=%d", qid);
+               goto rq_fini;
+       }
+
+       /* Setup slow path fields */
+       rxq_sp->dev = dev;
+       rxq_sp->qid = qid;
+       rxq_sp->qconf.conf.rx = *rx_conf;
+       rxq_sp->qconf.nb_desc = nb_desc;
+       rxq_sp->qconf.mp = mp;
+
+       plt_nix_dbg("rq=%d pool=%s nb_desc=%d->%d", qid, mp->name, nb_desc,
+                   cq->nb_desc);
+
+       /* Store start of fast path area */
+       eth_dev->data->rx_queues[qid] = rxq_sp + 1;
+       eth_dev->data->rx_queue_state[qid] = RTE_ETH_QUEUE_STATE_STOPPED;
+
+       return 0;
+rq_fini:
+       rc |= roc_nix_rq_fini(rq);
+cq_fini:
+       rc |= roc_nix_cq_fini(cq);
+fail:
+       return rc;
+}
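
For intuition, a worked example of the skip values with common defaults; the numbers assume a 128-byte struct rte_mbuf, the default 128-byte headroom and no mempool private area.

/*
 * Worked example (typical defaults, illustrative only):
 *   first_skip = sizeof(struct rte_mbuf) + RTE_PKTMBUF_HEADROOM + priv
 *              = 128 + 128 + 0 = 256 bytes
 *   later_skip = sizeof(struct rte_mbuf) = 128 bytes
 * i.e. the NIX writes payload after the headroom of the first mbuf and
 * directly after the mbuf header of each subsequent segment in a chain.
 */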
+
+static void
+cnxk_nix_rx_queue_release(void *rxq)
+{
+       struct cnxk_eth_rxq_sp *rxq_sp;
+       struct cnxk_eth_dev *dev;
+       struct roc_nix_rq *rq;
+       struct roc_nix_cq *cq;
+       uint16_t qid;
+       int rc;
+
+       if (!rxq)
+               return;
+
+       rxq_sp = cnxk_eth_rxq_to_sp(rxq);
+       dev = rxq_sp->dev;
+       qid = rxq_sp->qid;
+
+       plt_nix_dbg("Releasing rxq %u", qid);
+
+       /* Cleanup ROC RQ */
+       rq = &dev->rqs[qid];
+       rc = roc_nix_rq_fini(rq);
+       if (rc)
+               plt_err("Failed to cleanup rq, rc=%d", rc);
+
+       /* Cleanup ROC CQ */
+       cq = &dev->cqs[qid];
+       rc = roc_nix_cq_fini(cq);
+       if (rc)
+               plt_err("Failed to cleanup cq, rc=%d", rc);
+
+       /* Finally free fast path area */
+       plt_free(rxq_sp);
+}
+
+uint32_t
+cnxk_rss_ethdev_to_nix(struct cnxk_eth_dev *dev, uint64_t ethdev_rss,
+                      uint8_t rss_level)
+{
+       uint32_t flow_key_type[RSS_MAX_LEVELS][6] = {
+               {FLOW_KEY_TYPE_IPV4, FLOW_KEY_TYPE_IPV6, FLOW_KEY_TYPE_TCP,
+                FLOW_KEY_TYPE_UDP, FLOW_KEY_TYPE_SCTP, FLOW_KEY_TYPE_ETH_DMAC},
+               {FLOW_KEY_TYPE_INNR_IPV4, FLOW_KEY_TYPE_INNR_IPV6,
+                FLOW_KEY_TYPE_INNR_TCP, FLOW_KEY_TYPE_INNR_UDP,
+                FLOW_KEY_TYPE_INNR_SCTP, FLOW_KEY_TYPE_INNR_ETH_DMAC},
+               {FLOW_KEY_TYPE_IPV4 | FLOW_KEY_TYPE_INNR_IPV4,
+                FLOW_KEY_TYPE_IPV6 | FLOW_KEY_TYPE_INNR_IPV6,
+                FLOW_KEY_TYPE_TCP | FLOW_KEY_TYPE_INNR_TCP,
+                FLOW_KEY_TYPE_UDP | FLOW_KEY_TYPE_INNR_UDP,
+                FLOW_KEY_TYPE_SCTP | FLOW_KEY_TYPE_INNR_SCTP,
+                FLOW_KEY_TYPE_ETH_DMAC | FLOW_KEY_TYPE_INNR_ETH_DMAC}
+       };
+       uint32_t flowkey_cfg = 0;
+
+       dev->ethdev_rss_hf = ethdev_rss;
+
+       if (ethdev_rss & ETH_RSS_L2_PAYLOAD)
+               flowkey_cfg |= FLOW_KEY_TYPE_CH_LEN_90B;
+
+       if (ethdev_rss & ETH_RSS_C_VLAN)
+               flowkey_cfg |= FLOW_KEY_TYPE_VLAN;
+
+       if (ethdev_rss & ETH_RSS_L3_SRC_ONLY)
+               flowkey_cfg |= FLOW_KEY_TYPE_L3_SRC;
+
+       if (ethdev_rss & ETH_RSS_L3_DST_ONLY)
+               flowkey_cfg |= FLOW_KEY_TYPE_L3_DST;
+
+       if (ethdev_rss & ETH_RSS_L4_SRC_ONLY)
+               flowkey_cfg |= FLOW_KEY_TYPE_L4_SRC;
+
+       if (ethdev_rss & ETH_RSS_L4_DST_ONLY)
+               flowkey_cfg |= FLOW_KEY_TYPE_L4_DST;
+
+       if (ethdev_rss & RSS_IPV4_ENABLE)
+               flowkey_cfg |= flow_key_type[rss_level][RSS_IPV4_INDEX];
+
+       if (ethdev_rss & RSS_IPV6_ENABLE)
+               flowkey_cfg |= flow_key_type[rss_level][RSS_IPV6_INDEX];
+
+       if (ethdev_rss & ETH_RSS_TCP)
+               flowkey_cfg |= flow_key_type[rss_level][RSS_TCP_INDEX];
+
+       if (ethdev_rss & ETH_RSS_UDP)
+               flowkey_cfg |= flow_key_type[rss_level][RSS_UDP_INDEX];
+
+       if (ethdev_rss & ETH_RSS_SCTP)
+               flowkey_cfg |= flow_key_type[rss_level][RSS_SCTP_INDEX];
+
+       if (ethdev_rss & ETH_RSS_L2_PAYLOAD)
+               flowkey_cfg |= flow_key_type[rss_level][RSS_DMAC_INDEX];
+
+       if (ethdev_rss & RSS_IPV6_EX_ENABLE)
+               flowkey_cfg |= FLOW_KEY_TYPE_IPV6_EXT;
+
+       if (ethdev_rss & ETH_RSS_PORT)
+               flowkey_cfg |= FLOW_KEY_TYPE_PORT;
+
+       if (ethdev_rss & ETH_RSS_NVGRE)
+               flowkey_cfg |= FLOW_KEY_TYPE_NVGRE;
+
+       if (ethdev_rss & ETH_RSS_VXLAN)
+               flowkey_cfg |= FLOW_KEY_TYPE_VXLAN;
+
+       if (ethdev_rss & ETH_RSS_GENEVE)
+               flowkey_cfg |= FLOW_KEY_TYPE_GENEVE;
+
+       if (ethdev_rss & ETH_RSS_GTPU)
+               flowkey_cfg |= FLOW_KEY_TYPE_GTPU;
+
+       return flowkey_cfg;
+}
+
+static void
+nix_free_queue_mem(struct cnxk_eth_dev *dev)
+{
+       plt_free(dev->rqs);
+       plt_free(dev->cqs);
+       plt_free(dev->sqs);
+       dev->rqs = NULL;
+       dev->cqs = NULL;
+       dev->sqs = NULL;
+}
+
+static int
+nix_rss_default_setup(struct cnxk_eth_dev *dev)
+{
+       struct rte_eth_dev *eth_dev = dev->eth_dev;
+       uint8_t rss_hash_level;
+       uint32_t flowkey_cfg;
+       uint64_t rss_hf;
+
+       rss_hf = eth_dev->data->dev_conf.rx_adv_conf.rss_conf.rss_hf;
+       rss_hash_level = ETH_RSS_LEVEL(rss_hf);
+       if (rss_hash_level)
+               rss_hash_level -= 1;
+
+       flowkey_cfg = cnxk_rss_ethdev_to_nix(dev, rss_hf, rss_hash_level);
+       return roc_nix_rss_default_setup(&dev->nix, flowkey_cfg);
+}
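
An application-side sketch (not part of this patch) of requesting inner-header RSS: with ETH_RSS_LEVEL_INNERMOST set, ETH_RSS_LEVEL() above yields 2, which becomes rss_level 1 and selects the inner flow-key row in cnxk_rss_ethdev_to_nix().

#include <rte_ethdev.h>

/* Hypothetical RSS request: hash on inner IP/TCP/UDP headers. */
static const struct rte_eth_rss_conf example_rss_conf = {
	.rss_key = NULL,	/* keep the default key */
	.rss_hf = ETH_RSS_IP | ETH_RSS_TCP | ETH_RSS_UDP |
		  ETH_RSS_LEVEL_INNERMOST,
};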
+
+static int
+nix_store_queue_cfg_and_then_release(struct rte_eth_dev *eth_dev)
+{
+       struct cnxk_eth_dev *dev = cnxk_eth_pmd_priv(eth_dev);
+       const struct eth_dev_ops *dev_ops = eth_dev->dev_ops;
+       struct cnxk_eth_qconf *tx_qconf = NULL;
+       struct cnxk_eth_qconf *rx_qconf = NULL;
+       struct cnxk_eth_rxq_sp *rxq_sp;
+       struct cnxk_eth_txq_sp *txq_sp;
+       int i, nb_rxq, nb_txq;
+       void **txq, **rxq;
+
+       nb_rxq = RTE_MIN(dev->nb_rxq, eth_dev->data->nb_rx_queues);
+       nb_txq = RTE_MIN(dev->nb_txq, eth_dev->data->nb_tx_queues);
+
+       tx_qconf = malloc(nb_txq * sizeof(*tx_qconf));
+       if (tx_qconf == NULL) {
+               plt_err("Failed to allocate memory for tx_qconf");
+               goto fail;
+       }
+
+       rx_qconf = malloc(nb_rxq * sizeof(*rx_qconf));
+       if (rx_qconf == NULL) {
+               plt_err("Failed to allocate memory for rx_qconf");
+               goto fail;
+       }
+
+       txq = eth_dev->data->tx_queues;
+       for (i = 0; i < nb_txq; i++) {
+               if (txq[i] == NULL) {
+                       tx_qconf[i].valid = false;
+                       plt_info("txq[%d] is already released", i);
+                       continue;
+               }
+               txq_sp = cnxk_eth_txq_to_sp(txq[i]);
+               memcpy(&tx_qconf[i], &txq_sp->qconf, sizeof(*tx_qconf));
+               tx_qconf[i].valid = true;
+               dev_ops->tx_queue_release(txq[i]);
+               eth_dev->data->tx_queues[i] = NULL;
+       }
+
+       rxq = eth_dev->data->rx_queues;
+       for (i = 0; i < nb_rxq; i++) {
+               if (rxq[i] == NULL) {
+                       rx_qconf[i].valid = false;
+                       plt_info("rxq[%d] is already released", i);
+                       continue;
+               }
+               rxq_sp = cnxk_eth_rxq_to_sp(rxq[i]);
+               memcpy(&rx_qconf[i], &rxq_sp->qconf, sizeof(*rx_qconf));
+               rx_qconf[i].valid = true;
+               dev_ops->rx_queue_release(rxq[i]);
+               eth_dev->data->rx_queues[i] = NULL;
+       }
+
+       dev->tx_qconf = tx_qconf;
+       dev->rx_qconf = rx_qconf;
+       return 0;
+
+fail:
+       free(tx_qconf);
+       free(rx_qconf);
+       return -ENOMEM;
+}
+
+static int
+nix_restore_queue_cfg(struct rte_eth_dev *eth_dev)
+{
+       struct cnxk_eth_dev *dev = cnxk_eth_pmd_priv(eth_dev);
+       const struct eth_dev_ops *dev_ops = eth_dev->dev_ops;
+       struct cnxk_eth_qconf *tx_qconf = dev->tx_qconf;
+       struct cnxk_eth_qconf *rx_qconf = dev->rx_qconf;
+       int rc, i, nb_rxq, nb_txq;
+       void **txq, **rxq;
+
+       nb_rxq = RTE_MIN(dev->nb_rxq, eth_dev->data->nb_rx_queues);
+       nb_txq = RTE_MIN(dev->nb_txq, eth_dev->data->nb_tx_queues);
+
+       rc = -ENOMEM;
+       /* Setup tx & rx queues with the previous configuration so
+        * that the queues can be functional in cases where ports
+        * are started without reconfiguring queues.
+        *
+        * The usual reconfig sequence is as below:
+        * port_configure() {
+        *      if(reconfigure) {
+        *              queue_release()
+        *              queue_setup()
+        *      }
+        *      queue_configure() {
+        *              queue_release()
+        *              queue_setup()
+        *      }
+        * }
+        * port_start()
+        *
+        * In some applications' control path, queue_configure() would
+        * NOT be invoked for TXQs/RXQs in port_configure().
+        * In such cases, the queues can be functional after start as the
+        * queues are already set up in port_configure().
+        */
+       for (i = 0; i < nb_txq; i++) {
+               if (!tx_qconf[i].valid)
+                       continue;
+               rc = dev_ops->tx_queue_setup(eth_dev, i, tx_qconf[i].nb_desc, 0,
+                                            &tx_qconf[i].conf.tx);
+               if (rc) {
+                       plt_err("Failed to setup tx queue rc=%d", rc);
+                       txq = eth_dev->data->tx_queues;
+                       for (i -= 1; i >= 0; i--)
+                               dev_ops->tx_queue_release(txq[i]);
+                       goto fail;
+               }
+       }
+
+       free(tx_qconf);
+       tx_qconf = NULL;
+
+       for (i = 0; i < nb_rxq; i++) {
+               if (!rx_qconf[i].valid)
+                       continue;
+               rc = dev_ops->rx_queue_setup(eth_dev, i, rx_qconf[i].nb_desc, 0,
+                                            &rx_qconf[i].conf.rx,
+                                            rx_qconf[i].mp);
+               if (rc) {
+                       plt_err("Failed to setup rx queue rc=%d", rc);
+                       rxq = eth_dev->data->rx_queues;
+                       for (i -= 1; i >= 0; i--)
+                               dev_ops->rx_queue_release(rxq[i]);
+                       goto tx_queue_release;
+               }
+       }
+
+       free(rx_qconf);
+       rx_qconf = NULL;
+
+       return 0;
+
+tx_queue_release:
+       txq = eth_dev->data->tx_queues;
+       for (i = 0; i < eth_dev->data->nb_tx_queues; i++)
+               dev_ops->tx_queue_release(txq[i]);
+fail:
+       if (tx_qconf)
+               free(tx_qconf);
+       if (rx_qconf)
+               free(rx_qconf);
+
+       return rc;
+}
+
+static uint16_t
+nix_eth_nop_burst(void *queue, struct rte_mbuf **mbufs, uint16_t pkts)
+{
+       RTE_SET_USED(queue);
+       RTE_SET_USED(mbufs);
+       RTE_SET_USED(pkts);
+
+       return 0;
+}
+
+static void
+nix_set_nop_rxtx_function(struct rte_eth_dev *eth_dev)
+{
+       /* These dummy functions are required to support
+        * applications which reconfigure queues without
+        * stopping the tx burst and rx burst threads (e.g. the KNI app).
+        * When the queue context is saved, the txqs/rxqs are released,
+        * which would crash the app since rx/tx burst is still
+        * running on different lcores.
+        */
+       eth_dev->tx_pkt_burst = nix_eth_nop_burst;
+       eth_dev->rx_pkt_burst = nix_eth_nop_burst;
+       rte_mb();
+}
+
+static int
+nix_lso_tun_fmt_update(struct cnxk_eth_dev *dev)
+{
+       uint8_t udp_tun[ROC_NIX_LSO_TUN_MAX];
+       uint8_t tun[ROC_NIX_LSO_TUN_MAX];
+       struct roc_nix *nix = &dev->nix;
+       int rc;
+
+       rc = roc_nix_lso_fmt_get(nix, udp_tun, tun);
+       if (rc)
+               return rc;
+
+       dev->lso_tun_fmt = ((uint64_t)tun[ROC_NIX_LSO_TUN_V4V4] |
+                           (uint64_t)tun[ROC_NIX_LSO_TUN_V4V6] << 8 |
+                           (uint64_t)tun[ROC_NIX_LSO_TUN_V6V4] << 16 |
+                           (uint64_t)tun[ROC_NIX_LSO_TUN_V6V6] << 24);
+
+       dev->lso_tun_fmt |= ((uint64_t)udp_tun[ROC_NIX_LSO_TUN_V4V4] << 32 |
+                            (uint64_t)udp_tun[ROC_NIX_LSO_TUN_V4V6] << 40 |
+                            (uint64_t)udp_tun[ROC_NIX_LSO_TUN_V6V4] << 48 |
+                            (uint64_t)udp_tun[ROC_NIX_LSO_TUN_V6V6] << 56);
+       return 0;
+}
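
The eight 8-bit LSO format indices end up packed into the single lso_tun_fmt word: regular tunnel formats in bytes 0-3 and UDP tunnel formats in bytes 4-7, in V4V4/V4V6/V6V4/V6V6 order. A small sketch of the inverse lookup a transmit path could perform; the byte ordering simply mirrors the shifts above.

#include <stdint.h>

/* Illustrative unpack helper (not part of this patch): byte_idx 0-3
 * select the regular tunnel formats, 4-7 the UDP tunnel ones.
 */
static inline uint8_t
example_lso_tun_fmt_get(uint64_t lso_tun_fmt, unsigned int byte_idx)
{
	return (uint8_t)(lso_tun_fmt >> (byte_idx * 8));
}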
+
+static int
+nix_lso_fmt_setup(struct cnxk_eth_dev *dev)
+{
+       struct roc_nix *nix = &dev->nix;
+       int rc;
+
+       /* Nothing much to do if offload is not enabled */
+       if (!(dev->tx_offloads &
+             (DEV_TX_OFFLOAD_TCP_TSO | DEV_TX_OFFLOAD_VXLAN_TNL_TSO |
+              DEV_TX_OFFLOAD_GENEVE_TNL_TSO | DEV_TX_OFFLOAD_GRE_TNL_TSO)))
+               return 0;
+
+       /* Setup LSO formats in AF. It's a no-op if another ethdev has
+        * already set it up.
+        */
+       rc = roc_nix_lso_fmt_setup(nix);
+       if (rc)
+               return rc;
+
+       return nix_lso_tun_fmt_update(dev);
+}
+
+int
+cnxk_nix_configure(struct rte_eth_dev *eth_dev)
+{
+       struct cnxk_eth_dev *dev = cnxk_eth_pmd_priv(eth_dev);
+       struct rte_eth_dev_data *data = eth_dev->data;
+       struct rte_eth_conf *conf = &data->dev_conf;
+       struct rte_eth_rxmode *rxmode = &conf->rxmode;
+       struct rte_eth_txmode *txmode = &conf->txmode;
+       char ea_fmt[RTE_ETHER_ADDR_FMT_SIZE];
+       struct roc_nix *nix = &dev->nix;
+       struct rte_ether_addr *ea;
+       uint8_t nb_rxq, nb_txq;
+       uint64_t rx_cfg;
+       void *qs;
+       int rc;
+
+       rc = -EINVAL;
+
+       /* Sanity checks */
+       if (rte_eal_has_hugepages() == 0) {
+               plt_err("Huge page is not configured");
+               goto fail_configure;
+       }
+
+       if (conf->dcb_capability_en == 1) {
+               plt_err("dcb enable is not supported");
+               goto fail_configure;
+       }
+
+       if (conf->fdir_conf.mode != RTE_FDIR_MODE_NONE) {
+               plt_err("Flow director is not supported");
+               goto fail_configure;
+       }
+
+       if (rxmode->mq_mode != ETH_MQ_RX_NONE &&
+           rxmode->mq_mode != ETH_MQ_RX_RSS) {
+               plt_err("Unsupported mq rx mode %d", rxmode->mq_mode);
+               goto fail_configure;
+       }
+
+       if (txmode->mq_mode != ETH_MQ_TX_NONE) {
+               plt_err("Unsupported mq tx mode %d", txmode->mq_mode);
+               goto fail_configure;
+       }
+
+       /* Free the resources allocated from the previous configure */
+       if (dev->configured == 1) {
+               /* Unregister queue irq's */
+               roc_nix_unregister_queue_irqs(nix);
+
+               /* Unregister CQ irqs if present */
+               if (eth_dev->data->dev_conf.intr_conf.rxq)
+                       roc_nix_unregister_cq_irqs(nix);
+
+               /* Set no-op functions */
+               nix_set_nop_rxtx_function(eth_dev);
+               /* Store queue config for later */
+               rc = nix_store_queue_cfg_and_then_release(eth_dev);
+               if (rc)
+                       goto fail_configure;
+               roc_nix_tm_fini(nix);
+               roc_nix_lf_free(nix);
+       }
+
+       dev->rx_offloads = rxmode->offloads;
+       dev->tx_offloads = txmode->offloads;
+
+       /* Prepare rx cfg */
+       rx_cfg = ROC_NIX_LF_RX_CFG_DIS_APAD;
+       if (dev->rx_offloads &
+           (DEV_RX_OFFLOAD_TCP_CKSUM | DEV_RX_OFFLOAD_UDP_CKSUM)) {
+               rx_cfg |= ROC_NIX_LF_RX_CFG_CSUM_OL4;
+               rx_cfg |= ROC_NIX_LF_RX_CFG_CSUM_IL4;
+       }
+       rx_cfg |= (ROC_NIX_LF_RX_CFG_DROP_RE | ROC_NIX_LF_RX_CFG_L2_LEN_ERR |
+                  ROC_NIX_LF_RX_CFG_LEN_IL4 | ROC_NIX_LF_RX_CFG_LEN_IL3 |
+                  ROC_NIX_LF_RX_CFG_LEN_OL4 | ROC_NIX_LF_RX_CFG_LEN_OL3);
+
+       nb_rxq = RTE_MAX(data->nb_rx_queues, 1);
+       nb_txq = RTE_MAX(data->nb_tx_queues, 1);
+
+       /* Alloc a nix lf */
+       rc = roc_nix_lf_alloc(nix, nb_rxq, nb_txq, rx_cfg);
+       if (rc) {
+               plt_err("Failed to init nix_lf rc=%d", rc);
+               goto fail_configure;
+       }
+
+       nb_rxq = data->nb_rx_queues;
+       nb_txq = data->nb_tx_queues;
+       rc = -ENOMEM;
+       if (nb_rxq) {
+               /* Allocate memory for roc rq's and cq's */
+               qs = plt_zmalloc(sizeof(struct roc_nix_rq) * nb_rxq, 0);
+               if (!qs) {
+                       plt_err("Failed to alloc rqs");
+                       goto free_nix_lf;
+               }
+               dev->rqs = qs;
+
+               qs = plt_zmalloc(sizeof(struct roc_nix_cq) * nb_rxq, 0);
+               if (!qs) {
+                       plt_err("Failed to alloc cqs");
+                       goto free_nix_lf;
+               }
+               dev->cqs = qs;
+       }
+
+       if (nb_txq) {
+               /* Allocate memory for roc sq's */
+               qs = plt_zmalloc(sizeof(struct roc_nix_sq) * nb_txq, 0);
+               if (!qs) {
+                       plt_err("Failed to alloc sqs");
+                       goto free_nix_lf;
+               }
+               dev->sqs = qs;
+       }
+
+       /* Re-enable NIX LF error interrupts */
+       roc_nix_err_intr_ena_dis(nix, true);
+       roc_nix_ras_intr_ena_dis(nix, true);
+
+       if (nix->rx_ptp_ena) {
+               plt_err("Both PTP and switch header enabled");
+               goto free_nix_lf;
+       }
+
+       /* Setup LSO if needed */
+       rc = nix_lso_fmt_setup(dev);
+       if (rc) {
+               plt_err("Failed to setup nix lso format fields, rc=%d", rc);
+               goto free_nix_lf;
+       }
+
+       /* Configure RSS */
+       rc = nix_rss_default_setup(dev);
+       if (rc) {
+               plt_err("Failed to configure rss rc=%d", rc);
+               goto free_nix_lf;
+       }
+
+       /* Init the default TM scheduler hierarchy */
+       rc = roc_nix_tm_init(nix);
+       if (rc) {
+               plt_err("Failed to init traffic manager, rc=%d", rc);
+               goto free_nix_lf;
+       }
+
+       rc = roc_nix_tm_hierarchy_enable(nix, ROC_NIX_TM_DEFAULT, false);
+       if (rc) {
+               plt_err("Failed to enable default tm hierarchy, rc=%d", rc);
+               goto tm_fini;
+       }
+
+       /* Register queue IRQs */
+       rc = roc_nix_register_queue_irqs(nix);
+       if (rc) {
+               plt_err("Failed to register queue interrupts rc=%d", rc);
+               goto tm_fini;
+       }
+
+       /* Register cq IRQs */
+       if (eth_dev->data->dev_conf.intr_conf.rxq) {
+               if (eth_dev->data->nb_rx_queues > dev->nix.cints) {
+                       plt_err("Rx interrupt cannot be enabled, rxq > %d",
+                               dev->nix.cints);
+                       goto q_irq_fini;
+               }
+               /* The Rx interrupt feature cannot work with vector mode
+                * because vector mode does not process packets unless at
+                * least 4 pkts are received, while CQ interrupts are
+                * generated even for 1 pkt in the CQ.
+                */
+               dev->scalar_ena = true;
+
+               rc = roc_nix_register_cq_irqs(nix);
+               if (rc) {
+                       plt_err("Failed to register CQ interrupts rc=%d", rc);
+                       goto q_irq_fini;
+               }
+       }
+
+       /* Configure loop back mode */
+       rc = roc_nix_mac_loopback_enable(nix,
+                                        eth_dev->data->dev_conf.lpbk_mode);
+       if (rc) {
+               plt_err("Failed to configure cgx loop back mode rc=%d", rc);
+               goto cq_fini;
+       }
+
+       /*
+        * Restore the queue config when a reconfigure is followed by another
+        * reconfigure and the application does not invoke queue configure.
+        */
+       if (dev->configured == 1) {
+               rc = nix_restore_queue_cfg(eth_dev);
+               if (rc)
+                       goto cq_fini;
+       }
+
+       /* Update the mac address */
+       ea = eth_dev->data->mac_addrs;
+       memcpy(ea, dev->mac_addr, RTE_ETHER_ADDR_LEN);
+       if (rte_is_zero_ether_addr(ea))
+               rte_eth_random_addr((uint8_t *)ea);
+
+       rte_ether_format_addr(ea_fmt, RTE_ETHER_ADDR_FMT_SIZE, ea);
+
+       plt_nix_dbg("Configured port%d mac=%s nb_rxq=%d nb_txq=%d"
+                   " rx_offloads=0x%" PRIx64 " tx_offloads=0x%" PRIx64 "",
+                   eth_dev->data->port_id, ea_fmt, nb_rxq, nb_txq,
+                   dev->rx_offloads, dev->tx_offloads);
+
+       /* All good */
+       dev->configured = 1;
+       dev->nb_rxq = data->nb_rx_queues;
+       dev->nb_txq = data->nb_tx_queues;
+       return 0;
+
+cq_fini:
+       roc_nix_unregister_cq_irqs(nix);
+q_irq_fini:
+       roc_nix_unregister_queue_irqs(nix);
+tm_fini:
+       roc_nix_tm_fini(nix);
+free_nix_lf:
+       nix_free_queue_mem(dev);
+       rc |= roc_nix_lf_free(nix);
+fail_configure:
+       dev->configured = 0;
+       return rc;
+}
+
+static int
+cnxk_nix_tx_queue_start(struct rte_eth_dev *eth_dev, uint16_t qid)
+{
+       struct cnxk_eth_dev *dev = cnxk_eth_pmd_priv(eth_dev);
+       struct rte_eth_dev_data *data = eth_dev->data;
+       struct roc_nix_sq *sq = &dev->sqs[qid];
+       int rc = -EINVAL;
+
+       if (data->tx_queue_state[qid] == RTE_ETH_QUEUE_STATE_STARTED)
+               return 0;
+
+       rc = roc_nix_tm_sq_aura_fc(sq, true);
+       if (rc) {
+               plt_err("Failed to enable sq aura fc, txq=%u, rc=%d", qid, rc);
+               goto done;
+       }
+
+       data->tx_queue_state[qid] = RTE_ETH_QUEUE_STATE_STARTED;
+done:
+       return rc;
+}
+
+int
+cnxk_nix_tx_queue_stop(struct rte_eth_dev *eth_dev, uint16_t qid)
+{
+       struct cnxk_eth_dev *dev = cnxk_eth_pmd_priv(eth_dev);
+       struct rte_eth_dev_data *data = eth_dev->data;
+       struct roc_nix_sq *sq = &dev->sqs[qid];
+       int rc;
+
+       if (data->tx_queue_state[qid] == RTE_ETH_QUEUE_STATE_STOPPED)
+               return 0;
+
+       rc = roc_nix_tm_sq_aura_fc(sq, false);
+       if (rc) {
+               plt_err("Failed to disable sqb aura fc, txq=%u, rc=%d", qid,
+                       rc);
+               goto done;
+       }
+
+       data->tx_queue_state[qid] = RTE_ETH_QUEUE_STATE_STOPPED;
+done:
+       return rc;
+}
+
+static int
+cnxk_nix_rx_queue_start(struct rte_eth_dev *eth_dev, uint16_t qid)
+{
+       struct cnxk_eth_dev *dev = cnxk_eth_pmd_priv(eth_dev);
+       struct rte_eth_dev_data *data = eth_dev->data;
+       struct roc_nix_rq *rq = &dev->rqs[qid];
+       int rc;
+
+       if (data->rx_queue_state[qid] == RTE_ETH_QUEUE_STATE_STARTED)
+               return 0;
+
+       rc = roc_nix_rq_ena_dis(rq, true);
+       if (rc) {
+               plt_err("Failed to enable rxq=%u, rc=%d", qid, rc);
+               goto done;
+       }
+
+       data->rx_queue_state[qid] = RTE_ETH_QUEUE_STATE_STARTED;
+done:
+       return rc;
+}
+
+static int
+cnxk_nix_rx_queue_stop(struct rte_eth_dev *eth_dev, uint16_t qid)
+{
+       struct cnxk_eth_dev *dev = cnxk_eth_pmd_priv(eth_dev);
+       struct rte_eth_dev_data *data = eth_dev->data;
+       struct roc_nix_rq *rq = &dev->rqs[qid];
+       int rc;
+
+       if (data->rx_queue_state[qid] == RTE_ETH_QUEUE_STATE_STOPPED)
+               return 0;
+
+       rc = roc_nix_rq_ena_dis(rq, false);
+       if (rc) {
+               plt_err("Failed to disable rxq=%u, rc=%d", qid, rc);
+               goto done;
+       }
+
+       data->rx_queue_state[qid] = RTE_ETH_QUEUE_STATE_STOPPED;
+done:
+       return rc;
+}
+
+static int
+cnxk_nix_dev_stop(struct rte_eth_dev *eth_dev)
+{
+       struct cnxk_eth_dev *dev = cnxk_eth_pmd_priv(eth_dev);
+       const struct eth_dev_ops *dev_ops = eth_dev->dev_ops;
+       struct rte_mbuf *rx_pkts[32];
+       int count, i, j, rc;
+       void *rxq;
+
+       /* Disable switch hdr pkind */
+       roc_nix_switch_hdr_set(&dev->nix, 0);
+
+       /* Stop link change events */
+       if (!roc_nix_is_vf_or_sdp(&dev->nix))
+               roc_nix_mac_link_event_start_stop(&dev->nix, false);
+
+       /* Disable Rx via NPC */
+       roc_nix_npc_rx_ena_dis(&dev->nix, false);
+
+       /* Stop rx queues and free up pkts pending */
+       for (i = 0; i < eth_dev->data->nb_rx_queues; i++) {
+               rc = dev_ops->rx_queue_stop(eth_dev, i);
+               if (rc)
+                       continue;
+
+               rxq = eth_dev->data->rx_queues[i];
+               count = dev->rx_pkt_burst_no_offload(rxq, rx_pkts, 32);
+               while (count) {
+                       for (j = 0; j < count; j++)
+                               rte_pktmbuf_free(rx_pkts[j]);
+                       count = dev->rx_pkt_burst_no_offload(rxq, rx_pkts, 32);
+               }
+       }
+
+       /* Stop tx queues  */
+       for (i = 0; i < eth_dev->data->nb_tx_queues; i++)
+               dev_ops->tx_queue_stop(eth_dev, i);
+
+       return 0;
+}
+
+int
+cnxk_nix_dev_start(struct rte_eth_dev *eth_dev)
+{
+       struct cnxk_eth_dev *dev = cnxk_eth_pmd_priv(eth_dev);
+       int rc, i;
+
+       if (eth_dev->data->nb_rx_queues != 0) {
+               rc = nix_recalc_mtu(eth_dev);
+               if (rc)
+                       return rc;
+       }
+
+       /* Start rx queues */
+       for (i = 0; i < eth_dev->data->nb_rx_queues; i++) {
+               rc = cnxk_nix_rx_queue_start(eth_dev, i);
+               if (rc)
+                       return rc;
+       }
+
+       /* Start tx queues  */
+       for (i = 0; i < eth_dev->data->nb_tx_queues; i++) {
+               rc = cnxk_nix_tx_queue_start(eth_dev, i);
+               if (rc)
+                       return rc;
+       }
+
+       /* Enable Rx in NPC */
+       rc = roc_nix_npc_rx_ena_dis(&dev->nix, true);
+       if (rc) {
+               plt_err("Failed to enable NPC rx %d", rc);
+               return rc;
+       }
+
+       cnxk_nix_toggle_flag_link_cfg(dev, true);
+
+       /* Start link change events */
+       if (!roc_nix_is_vf_or_sdp(&dev->nix)) {
+               rc = roc_nix_mac_link_event_start_stop(&dev->nix, true);
+               if (rc) {
+                       plt_err("Failed to start cgx link event %d", rc);
+                       goto rx_disable;
+               }
+       }
+
+       cnxk_nix_toggle_flag_link_cfg(dev, false);
+
+       return 0;
+
+rx_disable:
+       roc_nix_npc_rx_ena_dis(&dev->nix, false);
+       cnxk_nix_toggle_flag_link_cfg(dev, false);
+       return rc;
+}
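
For reference, the standard ethdev bring-up sequence an application would use to exercise the configure, queue-setup and start paths implemented in this file (a minimal sketch; the helper name, queue sizes and mempool are illustrative and error handling is trimmed).

#include <rte_ethdev.h>

static int
example_port_bringup(uint16_t port_id, struct rte_mempool *mp)
{
	struct rte_eth_conf conf = { 0 };
	int rc;

	rc = rte_eth_dev_configure(port_id, 1, 1, &conf);
	if (rc)
		return rc;

	rc = rte_eth_rx_queue_setup(port_id, 0, 1024,
				    rte_eth_dev_socket_id(port_id), NULL, mp);
	if (rc)
		return rc;

	rc = rte_eth_tx_queue_setup(port_id, 0, 1024,
				    rte_eth_dev_socket_id(port_id), NULL);
	if (rc)
		return rc;

	return rte_eth_dev_start(port_id);
}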
+
 /* CNXK platform independent eth dev ops */
-struct eth_dev_ops cnxk_eth_dev_ops;
+struct eth_dev_ops cnxk_eth_dev_ops = {
+       .mtu_set = cnxk_nix_mtu_set,
+       .mac_addr_add = cnxk_nix_mac_addr_add,
+       .mac_addr_remove = cnxk_nix_mac_addr_del,
+       .mac_addr_set = cnxk_nix_mac_addr_set,
+       .dev_infos_get = cnxk_nix_info_get,
+       .link_update = cnxk_nix_link_update,
+       .tx_queue_release = cnxk_nix_tx_queue_release,
+       .rx_queue_release = cnxk_nix_rx_queue_release,
+       .dev_stop = cnxk_nix_dev_stop,
+       .tx_queue_start = cnxk_nix_tx_queue_start,
+       .rx_queue_start = cnxk_nix_rx_queue_start,
+       .rx_queue_stop = cnxk_nix_rx_queue_stop,
+       .dev_supported_ptypes_get = cnxk_nix_supported_ptypes_get,
+       .promiscuous_enable = cnxk_nix_promisc_enable,
+       .promiscuous_disable = cnxk_nix_promisc_disable,
+       .allmulticast_enable = cnxk_nix_allmulticast_enable,
+       .allmulticast_disable = cnxk_nix_allmulticast_disable,
+};
 
 static int
 cnxk_eth_dev_init(struct rte_eth_dev *eth_dev)
@@ -72,7 +1147,12 @@ cnxk_eth_dev_init(struct rte_eth_dev *eth_dev)
                goto error;
        }
 
+       /* Register link status update callback */
+       roc_nix_mac_link_cb_register(nix, cnxk_eth_dev_link_status_cb);
+
        dev->eth_dev = eth_dev;
+       dev->configured = 0;
+       dev->ptype_disable = 0;
 
        /* For vfs, returned max_entries will be 0. but to keep default mac
         * address, one entry must be allocated. so setting up to 1.
@@ -154,8 +1234,14 @@ cnxk_eth_dev_uninit(struct rte_eth_dev *eth_dev, bool mbox_close)
        if (rte_eal_process_type() != RTE_PROC_PRIMARY)
                return 0;
 
+       /* Clear the flag since we are closing down */
+       dev->configured = 0;
+
        roc_nix_npc_rx_ena_dis(nix, false);
 
+       /* Disable link status events */
+       roc_nix_mac_link_event_start_stop(nix, false);
+
        /* Free up SQs */
        for (i = 0; i < eth_dev->data->nb_tx_queues; i++) {
                dev_ops->tx_queue_release(eth_dev->data->tx_queues[i]);
@@ -180,6 +1266,9 @@ cnxk_eth_dev_uninit(struct rte_eth_dev *eth_dev, bool mbox_close)
        if (eth_dev->data->dev_conf.intr_conf.rxq)
                roc_nix_unregister_cq_irqs(nix);
 
+       /* Free ROC RQ's, SQ's and CQ's memory */
+       nix_free_queue_mem(dev);
+
        /* Free nix lf resources */
        rc = roc_nix_lf_free(nix);
        if (rc)