net/ice: support RSS RETA configuration in DCF mode
[dpdk.git] / drivers / net / ice / ice_dcf_ethdev.c
1 /* SPDX-License-Identifier: BSD-3-Clause
2  * Copyright(c) 2020 Intel Corporation
3  */
4
5 #include <errno.h>
6 #include <stdbool.h>
7 #include <sys/queue.h>
8 #include <sys/types.h>
9 #include <unistd.h>
10
11 #include <rte_interrupts.h>
12 #include <rte_debug.h>
13 #include <rte_pci.h>
14 #include <rte_atomic.h>
15 #include <rte_eal.h>
16 #include <rte_ether.h>
17 #include <ethdev_pci.h>
18 #include <rte_kvargs.h>
19 #include <rte_malloc.h>
20 #include <rte_memzone.h>
21 #include <rte_dev.h>
22
23 #include <iavf_devids.h>
24
25 #include "ice_generic_flow.h"
26 #include "ice_dcf_ethdev.h"
27 #include "ice_rxtx.h"
28
29 static int
30 ice_dcf_dev_udp_tunnel_port_add(struct rte_eth_dev *dev,
31                                 struct rte_eth_udp_tunnel *udp_tunnel);
32 static int
33 ice_dcf_dev_udp_tunnel_port_del(struct rte_eth_dev *dev,
34                                 struct rte_eth_udp_tunnel *udp_tunnel);
35
36 static int
37 ice_dcf_dev_init(struct rte_eth_dev *eth_dev);
38
39 static int
40 ice_dcf_dev_uninit(struct rte_eth_dev *eth_dev);
41
42 static uint16_t
43 ice_dcf_recv_pkts(__rte_unused void *rx_queue,
44                   __rte_unused struct rte_mbuf **bufs,
45                   __rte_unused uint16_t nb_pkts)
46 {
47         return 0;
48 }
49
50 static uint16_t
51 ice_dcf_xmit_pkts(__rte_unused void *tx_queue,
52                   __rte_unused struct rte_mbuf **bufs,
53                   __rte_unused uint16_t nb_pkts)
54 {
55         return 0;
56 }
57
58 static int
59 ice_dcf_init_rxq(struct rte_eth_dev *dev, struct ice_rx_queue *rxq)
60 {
61         struct ice_dcf_adapter *dcf_ad = dev->data->dev_private;
62         struct rte_eth_dev_data *dev_data = dev->data;
63         struct iavf_hw *hw = &dcf_ad->real_hw.avf;
64         uint16_t buf_size, max_pkt_len;
65
66         buf_size = rte_pktmbuf_data_room_size(rxq->mp) - RTE_PKTMBUF_HEADROOM;
67         rxq->rx_hdr_len = 0;
68         rxq->rx_buf_len = RTE_ALIGN(buf_size, (1 << ICE_RLAN_CTX_DBUF_S));
69         max_pkt_len = RTE_MIN(ICE_SUPPORT_CHAIN_NUM * rxq->rx_buf_len,
70                               dev->data->mtu + ICE_ETH_OVERHEAD);
71
72         /* Check maximum packet length is set correctly.  */
73         if (max_pkt_len <= RTE_ETHER_MIN_LEN ||
74             max_pkt_len > ICE_FRAME_SIZE_MAX) {
75                 PMD_DRV_LOG(ERR, "maximum packet length must be "
76                             "larger than %u and smaller than %u",
77                             (uint32_t)RTE_ETHER_MIN_LEN,
78                             (uint32_t)ICE_FRAME_SIZE_MAX);
79                 return -EINVAL;
80         }
81
82         rxq->max_pkt_len = max_pkt_len;
83         if ((dev_data->dev_conf.rxmode.offloads & RTE_ETH_RX_OFFLOAD_SCATTER) ||
84             (rxq->max_pkt_len + 2 * RTE_VLAN_HLEN) > buf_size) {
85                 dev_data->scattered_rx = 1;
86         }
87         rxq->qrx_tail = hw->hw_addr + IAVF_QRX_TAIL1(rxq->queue_id);
88         IAVF_PCI_REG_WRITE(rxq->qrx_tail, rxq->nb_rx_desc - 1);
89         IAVF_WRITE_FLUSH(hw);
90
91         return 0;
92 }
93
94 static int
95 ice_dcf_init_rx_queues(struct rte_eth_dev *dev)
96 {
97         struct ice_rx_queue **rxq =
98                 (struct ice_rx_queue **)dev->data->rx_queues;
99         int i, ret;
100
101         for (i = 0; i < dev->data->nb_rx_queues; i++) {
102                 if (!rxq[i] || !rxq[i]->q_set)
103                         continue;
104                 ret = ice_dcf_init_rxq(dev, rxq[i]);
105                 if (ret)
106                         return ret;
107         }
108
109         ice_set_rx_function(dev);
110         ice_set_tx_function(dev);
111
112         return 0;
113 }
114
115 #define IAVF_MISC_VEC_ID                RTE_INTR_VEC_ZERO_OFFSET
116 #define IAVF_RX_VEC_START               RTE_INTR_VEC_RXTX_OFFSET
117
118 #define IAVF_ITR_INDEX_DEFAULT          0
119 #define IAVF_QUEUE_ITR_INTERVAL_DEFAULT 32 /* 32 us */
120 #define IAVF_QUEUE_ITR_INTERVAL_MAX     8160 /* 8160 us */
121
122 static inline uint16_t
123 iavf_calc_itr_interval(int16_t interval)
124 {
125         if (interval < 0 || interval > IAVF_QUEUE_ITR_INTERVAL_MAX)
126                 interval = IAVF_QUEUE_ITR_INTERVAL_DEFAULT;
127
128         /* Convert to hardware count, as writing each 1 represents 2 us */
129         return interval / 2;
130 }
131
132 static int
133 ice_dcf_config_rx_queues_irqs(struct rte_eth_dev *dev,
134                                      struct rte_intr_handle *intr_handle)
135 {
136         struct ice_dcf_adapter *adapter = dev->data->dev_private;
137         struct ice_dcf_hw *hw = &adapter->real_hw;
138         uint16_t interval, i;
139         int vec;
140
141         if (rte_intr_cap_multiple(intr_handle) &&
142             dev->data->dev_conf.intr_conf.rxq) {
143                 if (rte_intr_efd_enable(intr_handle, dev->data->nb_rx_queues))
144                         return -1;
145         }
146
147         if (rte_intr_dp_is_en(intr_handle)) {
148                 if (rte_intr_vec_list_alloc(intr_handle, "intr_vec",
149                                                    dev->data->nb_rx_queues)) {
150                         PMD_DRV_LOG(ERR, "Failed to allocate %d rx intr_vec",
151                                     dev->data->nb_rx_queues);
152                         return -1;
153                 }
154         }
155
156         if (!dev->data->dev_conf.intr_conf.rxq ||
157             !rte_intr_dp_is_en(intr_handle)) {
158                 /* Rx interrupt disabled, Map interrupt only for writeback */
159                 hw->nb_msix = 1;
160                 if (hw->vf_res->vf_cap_flags &
161                     VIRTCHNL_VF_OFFLOAD_WB_ON_ITR) {
162                         /* If WB_ON_ITR supports, enable it */
163                         hw->msix_base = IAVF_RX_VEC_START;
164                         /* Set the ITR for index zero, to 2us to make sure that
165                          * we leave time for aggregation to occur, but don't
166                          * increase latency dramatically.
167                          */
168                         IAVF_WRITE_REG(&hw->avf,
169                                        IAVF_VFINT_DYN_CTLN1(hw->msix_base - 1),
170                                        (0 << IAVF_VFINT_DYN_CTLN1_ITR_INDX_SHIFT) |
171                                        IAVF_VFINT_DYN_CTLN1_WB_ON_ITR_MASK |
172                                        (2UL << IAVF_VFINT_DYN_CTLN1_INTERVAL_SHIFT));
173                 } else {
174                         /* If no WB_ON_ITR offload flags, need to set
175                          * interrupt for descriptor write back.
176                          */
177                         hw->msix_base = IAVF_MISC_VEC_ID;
178
179                         /* set ITR to max */
180                         interval =
181                         iavf_calc_itr_interval(IAVF_QUEUE_ITR_INTERVAL_MAX);
182                         IAVF_WRITE_REG(&hw->avf, IAVF_VFINT_DYN_CTL01,
183                                        IAVF_VFINT_DYN_CTL01_INTENA_MASK |
184                                        (IAVF_ITR_INDEX_DEFAULT <<
185                                         IAVF_VFINT_DYN_CTL01_ITR_INDX_SHIFT) |
186                                        (interval <<
187                                         IAVF_VFINT_DYN_CTL01_INTERVAL_SHIFT));
188                 }
189                 IAVF_WRITE_FLUSH(&hw->avf);
190                 /* map all queues to the same interrupt */
191                 for (i = 0; i < dev->data->nb_rx_queues; i++)
192                         hw->rxq_map[hw->msix_base] |= 1 << i;
193         } else {
194                 if (!rte_intr_allow_others(intr_handle)) {
195                         hw->nb_msix = 1;
196                         hw->msix_base = IAVF_MISC_VEC_ID;
197                         for (i = 0; i < dev->data->nb_rx_queues; i++) {
198                                 hw->rxq_map[hw->msix_base] |= 1 << i;
199                                 rte_intr_vec_list_index_set(intr_handle,
200                                                         i, IAVF_MISC_VEC_ID);
201                         }
202                         PMD_DRV_LOG(DEBUG,
203                                     "vector %u are mapping to all Rx queues",
204                                     hw->msix_base);
205                 } else {
206                         /* If Rx interrupt is required, and we can use
207                          * multi interrupts, then the vec is from 1
208                          */
209                         hw->nb_msix = RTE_MIN(hw->vf_res->max_vectors,
210                                       rte_intr_nb_efd_get(intr_handle));
211                         hw->msix_base = IAVF_MISC_VEC_ID;
212                         vec = IAVF_MISC_VEC_ID;
213                         for (i = 0; i < dev->data->nb_rx_queues; i++) {
214                                 hw->rxq_map[vec] |= 1 << i;
215                                 rte_intr_vec_list_index_set(intr_handle,
216                                                                    i, vec++);
217                                 if (vec >= hw->nb_msix)
218                                         vec = IAVF_RX_VEC_START;
219                         }
220                         PMD_DRV_LOG(DEBUG,
221                                     "%u vectors are mapping to %u Rx queues",
222                                     hw->nb_msix, dev->data->nb_rx_queues);
223                 }
224         }
225
226         if (ice_dcf_config_irq_map(hw)) {
227                 PMD_DRV_LOG(ERR, "config interrupt mapping failed");
228                 return -1;
229         }
230         return 0;
231 }
232
233 static int
234 alloc_rxq_mbufs(struct ice_rx_queue *rxq)
235 {
236         volatile union ice_rx_flex_desc *rxd;
237         struct rte_mbuf *mbuf = NULL;
238         uint64_t dma_addr;
239         uint16_t i;
240
241         for (i = 0; i < rxq->nb_rx_desc; i++) {
242                 mbuf = rte_mbuf_raw_alloc(rxq->mp);
243                 if (unlikely(!mbuf)) {
244                         PMD_DRV_LOG(ERR, "Failed to allocate mbuf for RX");
245                         return -ENOMEM;
246                 }
247
248                 rte_mbuf_refcnt_set(mbuf, 1);
249                 mbuf->next = NULL;
250                 mbuf->data_off = RTE_PKTMBUF_HEADROOM;
251                 mbuf->nb_segs = 1;
252                 mbuf->port = rxq->port_id;
253
254                 dma_addr =
255                         rte_cpu_to_le_64(rte_mbuf_data_iova_default(mbuf));
256
257                 rxd = &rxq->rx_ring[i];
258                 rxd->read.pkt_addr = dma_addr;
259                 rxd->read.hdr_addr = 0;
260 #ifndef RTE_LIBRTE_ICE_16BYTE_RX_DESC
261                 rxd->read.rsvd1 = 0;
262                 rxd->read.rsvd2 = 0;
263 #endif
264
265                 rxq->sw_ring[i].mbuf = (void *)mbuf;
266         }
267
268         return 0;
269 }
270
271 static int
272 ice_dcf_rx_queue_start(struct rte_eth_dev *dev, uint16_t rx_queue_id)
273 {
274         struct ice_dcf_adapter *ad = dev->data->dev_private;
275         struct iavf_hw *hw = &ad->real_hw.avf;
276         struct ice_rx_queue *rxq;
277         int err = 0;
278
279         if (rx_queue_id >= dev->data->nb_rx_queues)
280                 return -EINVAL;
281
282         rxq = dev->data->rx_queues[rx_queue_id];
283
284         err = alloc_rxq_mbufs(rxq);
285         if (err) {
286                 PMD_DRV_LOG(ERR, "Failed to allocate RX queue mbuf");
287                 return err;
288         }
289
290         rte_wmb();
291
292         /* Init the RX tail register. */
293         IAVF_PCI_REG_WRITE(rxq->qrx_tail, rxq->nb_rx_desc - 1);
294         IAVF_WRITE_FLUSH(hw);
295
296         /* Ready to switch the queue on */
297         err = ice_dcf_switch_queue(&ad->real_hw, rx_queue_id, true, true);
298         if (err) {
299                 PMD_DRV_LOG(ERR, "Failed to switch RX queue %u on",
300                             rx_queue_id);
301                 return err;
302         }
303
304         dev->data->rx_queue_state[rx_queue_id] = RTE_ETH_QUEUE_STATE_STARTED;
305
306         return 0;
307 }
308
309 static inline void
310 reset_rx_queue(struct ice_rx_queue *rxq)
311 {
312         uint16_t len;
313         uint32_t i;
314
315         if (!rxq)
316                 return;
317
318         len = rxq->nb_rx_desc + ICE_RX_MAX_BURST;
319
320         for (i = 0; i < len * sizeof(union ice_rx_flex_desc); i++)
321                 ((volatile char *)rxq->rx_ring)[i] = 0;
322
323         memset(&rxq->fake_mbuf, 0x0, sizeof(rxq->fake_mbuf));
324
325         for (i = 0; i < ICE_RX_MAX_BURST; i++)
326                 rxq->sw_ring[rxq->nb_rx_desc + i].mbuf = &rxq->fake_mbuf;
327
328         /* for rx bulk */
329         rxq->rx_nb_avail = 0;
330         rxq->rx_next_avail = 0;
331         rxq->rx_free_trigger = (uint16_t)(rxq->rx_free_thresh - 1);
332
333         rxq->rx_tail = 0;
334         rxq->nb_rx_hold = 0;
335         rxq->pkt_first_seg = NULL;
336         rxq->pkt_last_seg = NULL;
337 }
338
339 static inline void
340 reset_tx_queue(struct ice_tx_queue *txq)
341 {
342         struct ice_tx_entry *txe;
343         uint32_t i, size;
344         uint16_t prev;
345
346         if (!txq) {
347                 PMD_DRV_LOG(DEBUG, "Pointer to txq is NULL");
348                 return;
349         }
350
351         txe = txq->sw_ring;
352         size = sizeof(struct ice_tx_desc) * txq->nb_tx_desc;
353         for (i = 0; i < size; i++)
354                 ((volatile char *)txq->tx_ring)[i] = 0;
355
356         prev = (uint16_t)(txq->nb_tx_desc - 1);
357         for (i = 0; i < txq->nb_tx_desc; i++) {
358                 txq->tx_ring[i].cmd_type_offset_bsz =
359                         rte_cpu_to_le_64(IAVF_TX_DESC_DTYPE_DESC_DONE);
360                 txe[i].mbuf =  NULL;
361                 txe[i].last_id = i;
362                 txe[prev].next_id = i;
363                 prev = i;
364         }
365
366         txq->tx_tail = 0;
367         txq->nb_tx_used = 0;
368
369         txq->last_desc_cleaned = txq->nb_tx_desc - 1;
370         txq->nb_tx_free = txq->nb_tx_desc - 1;
371
372         txq->tx_next_dd = txq->tx_rs_thresh - 1;
373         txq->tx_next_rs = txq->tx_rs_thresh - 1;
374 }
375
376 static int
377 ice_dcf_rx_queue_stop(struct rte_eth_dev *dev, uint16_t rx_queue_id)
378 {
379         struct ice_dcf_adapter *ad = dev->data->dev_private;
380         struct ice_dcf_hw *hw = &ad->real_hw;
381         struct ice_rx_queue *rxq;
382         int err;
383
384         if (rx_queue_id >= dev->data->nb_rx_queues)
385                 return -EINVAL;
386
387         err = ice_dcf_switch_queue(hw, rx_queue_id, true, false);
388         if (err) {
389                 PMD_DRV_LOG(ERR, "Failed to switch RX queue %u off",
390                             rx_queue_id);
391                 return err;
392         }
393
394         rxq = dev->data->rx_queues[rx_queue_id];
395         rxq->rx_rel_mbufs(rxq);
396         reset_rx_queue(rxq);
397         dev->data->rx_queue_state[rx_queue_id] = RTE_ETH_QUEUE_STATE_STOPPED;
398
399         return 0;
400 }
401
402 static int
403 ice_dcf_tx_queue_start(struct rte_eth_dev *dev, uint16_t tx_queue_id)
404 {
405         struct ice_dcf_adapter *ad = dev->data->dev_private;
406         struct iavf_hw *hw = &ad->real_hw.avf;
407         struct ice_tx_queue *txq;
408         int err = 0;
409
410         if (tx_queue_id >= dev->data->nb_tx_queues)
411                 return -EINVAL;
412
413         txq = dev->data->tx_queues[tx_queue_id];
414
415         /* Init the RX tail register. */
416         txq->qtx_tail = hw->hw_addr + IAVF_QTX_TAIL1(tx_queue_id);
417         IAVF_PCI_REG_WRITE(txq->qtx_tail, 0);
418         IAVF_WRITE_FLUSH(hw);
419
420         /* Ready to switch the queue on */
421         err = ice_dcf_switch_queue(&ad->real_hw, tx_queue_id, false, true);
422
423         if (err) {
424                 PMD_DRV_LOG(ERR, "Failed to switch TX queue %u on",
425                             tx_queue_id);
426                 return err;
427         }
428
429         dev->data->tx_queue_state[tx_queue_id] = RTE_ETH_QUEUE_STATE_STARTED;
430
431         return 0;
432 }
433
434 static int
435 ice_dcf_tx_queue_stop(struct rte_eth_dev *dev, uint16_t tx_queue_id)
436 {
437         struct ice_dcf_adapter *ad = dev->data->dev_private;
438         struct ice_dcf_hw *hw = &ad->real_hw;
439         struct ice_tx_queue *txq;
440         int err;
441
442         if (tx_queue_id >= dev->data->nb_tx_queues)
443                 return -EINVAL;
444
445         err = ice_dcf_switch_queue(hw, tx_queue_id, false, false);
446         if (err) {
447                 PMD_DRV_LOG(ERR, "Failed to switch TX queue %u off",
448                             tx_queue_id);
449                 return err;
450         }
451
452         txq = dev->data->tx_queues[tx_queue_id];
453         txq->tx_rel_mbufs(txq);
454         reset_tx_queue(txq);
455         dev->data->tx_queue_state[tx_queue_id] = RTE_ETH_QUEUE_STATE_STOPPED;
456
457         return 0;
458 }
459
460 static int
461 ice_dcf_start_queues(struct rte_eth_dev *dev)
462 {
463         struct ice_rx_queue *rxq;
464         struct ice_tx_queue *txq;
465         int nb_rxq = 0;
466         int nb_txq, i;
467
468         for (nb_txq = 0; nb_txq < dev->data->nb_tx_queues; nb_txq++) {
469                 txq = dev->data->tx_queues[nb_txq];
470                 if (txq->tx_deferred_start)
471                         continue;
472                 if (ice_dcf_tx_queue_start(dev, nb_txq) != 0) {
473                         PMD_DRV_LOG(ERR, "Fail to start queue %u", nb_txq);
474                         goto tx_err;
475                 }
476         }
477
478         for (nb_rxq = 0; nb_rxq < dev->data->nb_rx_queues; nb_rxq++) {
479                 rxq = dev->data->rx_queues[nb_rxq];
480                 if (rxq->rx_deferred_start)
481                         continue;
482                 if (ice_dcf_rx_queue_start(dev, nb_rxq) != 0) {
483                         PMD_DRV_LOG(ERR, "Fail to start queue %u", nb_rxq);
484                         goto rx_err;
485                 }
486         }
487
488         return 0;
489
490         /* stop the started queues if failed to start all queues */
491 rx_err:
492         for (i = 0; i < nb_rxq; i++)
493                 ice_dcf_rx_queue_stop(dev, i);
494 tx_err:
495         for (i = 0; i < nb_txq; i++)
496                 ice_dcf_tx_queue_stop(dev, i);
497
498         return -1;
499 }
500
501 static int
502 ice_dcf_dev_start(struct rte_eth_dev *dev)
503 {
504         struct ice_dcf_adapter *dcf_ad = dev->data->dev_private;
505         struct rte_intr_handle *intr_handle = dev->intr_handle;
506         struct ice_adapter *ad = &dcf_ad->parent;
507         struct ice_dcf_hw *hw = &dcf_ad->real_hw;
508         int ret;
509
510         if (hw->resetting) {
511                 PMD_DRV_LOG(ERR,
512                             "The DCF has been reset by PF, please reinit first");
513                 return -EIO;
514         }
515
516         if (hw->tm_conf.root && !hw->tm_conf.committed) {
517                 PMD_DRV_LOG(ERR,
518                         "please call hierarchy_commit() before starting the port");
519                 return -EIO;
520         }
521
522         ad->pf.adapter_stopped = 0;
523
524         hw->num_queue_pairs = RTE_MAX(dev->data->nb_rx_queues,
525                                       dev->data->nb_tx_queues);
526
527         ret = ice_dcf_init_rx_queues(dev);
528         if (ret) {
529                 PMD_DRV_LOG(ERR, "Fail to init queues");
530                 return ret;
531         }
532
533         if (hw->vf_res->vf_cap_flags & VIRTCHNL_VF_OFFLOAD_RSS_PF) {
534                 ret = ice_dcf_init_rss(hw);
535                 if (ret) {
536                         PMD_DRV_LOG(ERR, "Failed to configure RSS");
537                         return ret;
538                 }
539         }
540
541         ret = ice_dcf_configure_queues(hw);
542         if (ret) {
543                 PMD_DRV_LOG(ERR, "Fail to config queues");
544                 return ret;
545         }
546
547         ret = ice_dcf_config_rx_queues_irqs(dev, intr_handle);
548         if (ret) {
549                 PMD_DRV_LOG(ERR, "Fail to config rx queues' irqs");
550                 return ret;
551         }
552
553         if (dev->data->dev_conf.intr_conf.rxq != 0) {
554                 rte_intr_disable(intr_handle);
555                 rte_intr_enable(intr_handle);
556         }
557
558         ret = ice_dcf_start_queues(dev);
559         if (ret) {
560                 PMD_DRV_LOG(ERR, "Failed to enable queues");
561                 return ret;
562         }
563
564         ret = ice_dcf_add_del_all_mac_addr(hw, true);
565         if (ret) {
566                 PMD_DRV_LOG(ERR, "Failed to add mac addr");
567                 return ret;
568         }
569
570         dev->data->dev_link.link_status = RTE_ETH_LINK_UP;
571
572         return 0;
573 }
574
575 static void
576 ice_dcf_stop_queues(struct rte_eth_dev *dev)
577 {
578         struct ice_dcf_adapter *ad = dev->data->dev_private;
579         struct ice_dcf_hw *hw = &ad->real_hw;
580         struct ice_rx_queue *rxq;
581         struct ice_tx_queue *txq;
582         int ret, i;
583
584         /* Stop All queues */
585         ret = ice_dcf_disable_queues(hw);
586         if (ret)
587                 PMD_DRV_LOG(WARNING, "Fail to stop queues");
588
589         for (i = 0; i < dev->data->nb_tx_queues; i++) {
590                 txq = dev->data->tx_queues[i];
591                 if (!txq)
592                         continue;
593                 txq->tx_rel_mbufs(txq);
594                 reset_tx_queue(txq);
595                 dev->data->tx_queue_state[i] = RTE_ETH_QUEUE_STATE_STOPPED;
596         }
597         for (i = 0; i < dev->data->nb_rx_queues; i++) {
598                 rxq = dev->data->rx_queues[i];
599                 if (!rxq)
600                         continue;
601                 rxq->rx_rel_mbufs(rxq);
602                 reset_rx_queue(rxq);
603                 dev->data->rx_queue_state[i] = RTE_ETH_QUEUE_STATE_STOPPED;
604         }
605 }
606
607 static int
608 ice_dcf_dev_stop(struct rte_eth_dev *dev)
609 {
610         struct ice_dcf_adapter *dcf_ad = dev->data->dev_private;
611         struct rte_intr_handle *intr_handle = dev->intr_handle;
612         struct ice_adapter *ad = &dcf_ad->parent;
613         struct ice_dcf_hw *hw = &dcf_ad->real_hw;
614
615         if (ad->pf.adapter_stopped == 1) {
616                 PMD_DRV_LOG(DEBUG, "Port is already stopped");
617                 return 0;
618         }
619
620         /* Stop the VF representors for this device */
621         ice_dcf_vf_repr_stop_all(dcf_ad);
622
623         ice_dcf_stop_queues(dev);
624
625         rte_intr_efd_disable(intr_handle);
626         rte_intr_vec_list_free(intr_handle);
627
628         ice_dcf_add_del_all_mac_addr(&dcf_ad->real_hw, false);
629         dev->data->dev_link.link_status = RTE_ETH_LINK_DOWN;
630         ad->pf.adapter_stopped = 1;
631         hw->tm_conf.committed = false;
632
633         return 0;
634 }
635
636 static int
637 ice_dcf_dev_configure(struct rte_eth_dev *dev)
638 {
639         struct ice_dcf_adapter *dcf_ad = dev->data->dev_private;
640         struct ice_adapter *ad = &dcf_ad->parent;
641
642         ad->rx_bulk_alloc_allowed = true;
643         ad->tx_simple_allowed = true;
644
645         if (dev->data->dev_conf.rxmode.mq_mode & RTE_ETH_MQ_RX_RSS_FLAG)
646                 dev->data->dev_conf.rxmode.offloads |= RTE_ETH_RX_OFFLOAD_RSS_HASH;
647
648         return 0;
649 }
650
651 static int
652 ice_dcf_dev_info_get(struct rte_eth_dev *dev,
653                      struct rte_eth_dev_info *dev_info)
654 {
655         struct ice_dcf_adapter *adapter = dev->data->dev_private;
656         struct ice_dcf_hw *hw = &adapter->real_hw;
657
658         dev_info->max_mac_addrs = 1;
659         dev_info->max_rx_queues = hw->vsi_res->num_queue_pairs;
660         dev_info->max_tx_queues = hw->vsi_res->num_queue_pairs;
661         dev_info->min_rx_bufsize = ICE_BUF_SIZE_MIN;
662         dev_info->max_rx_pktlen = ICE_FRAME_SIZE_MAX;
663         dev_info->hash_key_size = hw->vf_res->rss_key_size;
664         dev_info->reta_size = hw->vf_res->rss_lut_size;
665         dev_info->flow_type_rss_offloads = ICE_RSS_OFFLOAD_ALL;
666         dev_info->dev_capa &= ~RTE_ETH_DEV_CAPA_FLOW_RULE_KEEP;
667
668         dev_info->rx_offload_capa =
669                 RTE_ETH_RX_OFFLOAD_VLAN_STRIP |
670                 RTE_ETH_RX_OFFLOAD_IPV4_CKSUM |
671                 RTE_ETH_RX_OFFLOAD_UDP_CKSUM |
672                 RTE_ETH_RX_OFFLOAD_TCP_CKSUM |
673                 RTE_ETH_RX_OFFLOAD_OUTER_IPV4_CKSUM |
674                 RTE_ETH_RX_OFFLOAD_SCATTER |
675                 RTE_ETH_RX_OFFLOAD_VLAN_FILTER |
676                 RTE_ETH_RX_OFFLOAD_RSS_HASH;
677         dev_info->tx_offload_capa =
678                 RTE_ETH_TX_OFFLOAD_VLAN_INSERT |
679                 RTE_ETH_TX_OFFLOAD_IPV4_CKSUM |
680                 RTE_ETH_TX_OFFLOAD_UDP_CKSUM |
681                 RTE_ETH_TX_OFFLOAD_TCP_CKSUM |
682                 RTE_ETH_TX_OFFLOAD_SCTP_CKSUM |
683                 RTE_ETH_TX_OFFLOAD_OUTER_IPV4_CKSUM |
684                 RTE_ETH_TX_OFFLOAD_OUTER_UDP_CKSUM |
685                 RTE_ETH_TX_OFFLOAD_TCP_TSO |
686                 RTE_ETH_TX_OFFLOAD_VXLAN_TNL_TSO |
687                 RTE_ETH_TX_OFFLOAD_GRE_TNL_TSO |
688                 RTE_ETH_TX_OFFLOAD_IPIP_TNL_TSO |
689                 RTE_ETH_TX_OFFLOAD_GENEVE_TNL_TSO |
690                 RTE_ETH_TX_OFFLOAD_MULTI_SEGS;
691
692         dev_info->default_rxconf = (struct rte_eth_rxconf) {
693                 .rx_thresh = {
694                         .pthresh = ICE_DEFAULT_RX_PTHRESH,
695                         .hthresh = ICE_DEFAULT_RX_HTHRESH,
696                         .wthresh = ICE_DEFAULT_RX_WTHRESH,
697                 },
698                 .rx_free_thresh = ICE_DEFAULT_RX_FREE_THRESH,
699                 .rx_drop_en = 0,
700                 .offloads = 0,
701         };
702
703         dev_info->default_txconf = (struct rte_eth_txconf) {
704                 .tx_thresh = {
705                         .pthresh = ICE_DEFAULT_TX_PTHRESH,
706                         .hthresh = ICE_DEFAULT_TX_HTHRESH,
707                         .wthresh = ICE_DEFAULT_TX_WTHRESH,
708                 },
709                 .tx_free_thresh = ICE_DEFAULT_TX_FREE_THRESH,
710                 .tx_rs_thresh = ICE_DEFAULT_TX_RSBIT_THRESH,
711                 .offloads = 0,
712         };
713
714         dev_info->rx_desc_lim = (struct rte_eth_desc_lim) {
715                 .nb_max = ICE_MAX_RING_DESC,
716                 .nb_min = ICE_MIN_RING_DESC,
717                 .nb_align = ICE_ALIGN_RING_DESC,
718         };
719
720         dev_info->tx_desc_lim = (struct rte_eth_desc_lim) {
721                 .nb_max = ICE_MAX_RING_DESC,
722                 .nb_min = ICE_MIN_RING_DESC,
723                 .nb_align = ICE_ALIGN_RING_DESC,
724         };
725
726         return 0;
727 }
728
729 static int
730 ice_dcf_dev_promiscuous_enable(__rte_unused struct rte_eth_dev *dev)
731 {
732         return 0;
733 }
734
735 static int
736 ice_dcf_dev_promiscuous_disable(__rte_unused struct rte_eth_dev *dev)
737 {
738         return 0;
739 }
740
741 static int
742 ice_dcf_dev_allmulticast_enable(__rte_unused struct rte_eth_dev *dev)
743 {
744         return 0;
745 }
746
747 static int
748 ice_dcf_dev_allmulticast_disable(__rte_unused struct rte_eth_dev *dev)
749 {
750         return 0;
751 }
752
753 static int
754 ice_dcf_dev_flow_ops_get(struct rte_eth_dev *dev,
755                          const struct rte_flow_ops **ops)
756 {
757         if (!dev)
758                 return -EINVAL;
759
760         *ops = &ice_flow_ops;
761         return 0;
762 }
763
764 static int
765 ice_dcf_dev_rss_reta_update(struct rte_eth_dev *dev,
766                         struct rte_eth_rss_reta_entry64 *reta_conf,
767                         uint16_t reta_size)
768 {
769         struct ice_dcf_adapter *adapter = dev->data->dev_private;
770         struct ice_dcf_hw *hw = &adapter->real_hw;
771         uint8_t *lut;
772         uint16_t i, idx, shift;
773         int ret;
774
775         if (!(hw->vf_res->vf_cap_flags & VIRTCHNL_VF_OFFLOAD_RSS_PF))
776                 return -ENOTSUP;
777
778         if (reta_size != hw->vf_res->rss_lut_size) {
779                 PMD_DRV_LOG(ERR, "The size of hash lookup table configured "
780                         "(%d) doesn't match the number of hardware can "
781                         "support (%d)", reta_size, hw->vf_res->rss_lut_size);
782                 return -EINVAL;
783         }
784
785         lut = rte_zmalloc("rss_lut", reta_size, 0);
786         if (!lut) {
787                 PMD_DRV_LOG(ERR, "No memory can be allocated");
788                 return -ENOMEM;
789         }
790         /* store the old lut table temporarily */
791         rte_memcpy(lut, hw->rss_lut, reta_size);
792
793         for (i = 0; i < reta_size; i++) {
794                 idx = i / RTE_ETH_RETA_GROUP_SIZE;
795                 shift = i % RTE_ETH_RETA_GROUP_SIZE;
796                 if (reta_conf[idx].mask & (1ULL << shift))
797                         lut[i] = reta_conf[idx].reta[shift];
798         }
799
800         rte_memcpy(hw->rss_lut, lut, reta_size);
801         /* send virtchnnl ops to configure rss*/
802         ret = ice_dcf_configure_rss_lut(hw);
803         if (ret) /* revert back */
804                 rte_memcpy(hw->rss_lut, lut, reta_size);
805         rte_free(lut);
806
807         return ret;
808 }
809
810 static int
811 ice_dcf_dev_rss_reta_query(struct rte_eth_dev *dev,
812                        struct rte_eth_rss_reta_entry64 *reta_conf,
813                        uint16_t reta_size)
814 {
815         struct ice_dcf_adapter *adapter = dev->data->dev_private;
816         struct ice_dcf_hw *hw = &adapter->real_hw;
817         uint16_t i, idx, shift;
818
819         if (!(hw->vf_res->vf_cap_flags & VIRTCHNL_VF_OFFLOAD_RSS_PF))
820                 return -ENOTSUP;
821
822         if (reta_size != hw->vf_res->rss_lut_size) {
823                 PMD_DRV_LOG(ERR, "The size of hash lookup table configured "
824                         "(%d) doesn't match the number of hardware can "
825                         "support (%d)", reta_size, hw->vf_res->rss_lut_size);
826                 return -EINVAL;
827         }
828
829         for (i = 0; i < reta_size; i++) {
830                 idx = i / RTE_ETH_RETA_GROUP_SIZE;
831                 shift = i % RTE_ETH_RETA_GROUP_SIZE;
832                 if (reta_conf[idx].mask & (1ULL << shift))
833                         reta_conf[idx].reta[shift] = hw->rss_lut[i];
834         }
835
836         return 0;
837 }
838
839 #define ICE_DCF_32_BIT_WIDTH (CHAR_BIT * 4)
840 #define ICE_DCF_48_BIT_WIDTH (CHAR_BIT * 6)
841 #define ICE_DCF_48_BIT_MASK  RTE_LEN2MASK(ICE_DCF_48_BIT_WIDTH, uint64_t)
842
843 static void
844 ice_dcf_stat_update_48(uint64_t *offset, uint64_t *stat)
845 {
846         if (*stat >= *offset)
847                 *stat = *stat - *offset;
848         else
849                 *stat = (uint64_t)((*stat +
850                         ((uint64_t)1 << ICE_DCF_48_BIT_WIDTH)) - *offset);
851
852         *stat &= ICE_DCF_48_BIT_MASK;
853 }
854
855 static void
856 ice_dcf_stat_update_32(uint64_t *offset, uint64_t *stat)
857 {
858         if (*stat >= *offset)
859                 *stat = (uint64_t)(*stat - *offset);
860         else
861                 *stat = (uint64_t)((*stat +
862                         ((uint64_t)1 << ICE_DCF_32_BIT_WIDTH)) - *offset);
863 }
864
865 static void
866 ice_dcf_update_stats(struct virtchnl_eth_stats *oes,
867                      struct virtchnl_eth_stats *nes)
868 {
869         ice_dcf_stat_update_48(&oes->rx_bytes, &nes->rx_bytes);
870         ice_dcf_stat_update_48(&oes->rx_unicast, &nes->rx_unicast);
871         ice_dcf_stat_update_48(&oes->rx_multicast, &nes->rx_multicast);
872         ice_dcf_stat_update_48(&oes->rx_broadcast, &nes->rx_broadcast);
873         ice_dcf_stat_update_32(&oes->rx_discards, &nes->rx_discards);
874         ice_dcf_stat_update_48(&oes->tx_bytes, &nes->tx_bytes);
875         ice_dcf_stat_update_48(&oes->tx_unicast, &nes->tx_unicast);
876         ice_dcf_stat_update_48(&oes->tx_multicast, &nes->tx_multicast);
877         ice_dcf_stat_update_48(&oes->tx_broadcast, &nes->tx_broadcast);
878         ice_dcf_stat_update_32(&oes->tx_errors, &nes->tx_errors);
879         ice_dcf_stat_update_32(&oes->tx_discards, &nes->tx_discards);
880 }
881
882
883 static int
884 ice_dcf_stats_get(struct rte_eth_dev *dev, struct rte_eth_stats *stats)
885 {
886         struct ice_dcf_adapter *ad = dev->data->dev_private;
887         struct ice_dcf_hw *hw = &ad->real_hw;
888         struct virtchnl_eth_stats pstats;
889         int ret;
890
891         if (hw->resetting) {
892                 PMD_DRV_LOG(ERR,
893                             "The DCF has been reset by PF, please reinit first");
894                 return -EIO;
895         }
896
897         ret = ice_dcf_query_stats(hw, &pstats);
898         if (ret == 0) {
899                 ice_dcf_update_stats(&hw->eth_stats_offset, &pstats);
900                 stats->ipackets = pstats.rx_unicast + pstats.rx_multicast +
901                                 pstats.rx_broadcast - pstats.rx_discards;
902                 stats->opackets = pstats.tx_broadcast + pstats.tx_multicast +
903                                                 pstats.tx_unicast;
904                 stats->imissed = pstats.rx_discards;
905                 stats->oerrors = pstats.tx_errors + pstats.tx_discards;
906                 stats->ibytes = pstats.rx_bytes;
907                 stats->ibytes -= stats->ipackets * RTE_ETHER_CRC_LEN;
908                 stats->obytes = pstats.tx_bytes;
909         } else {
910                 PMD_DRV_LOG(ERR, "Get statistics failed");
911         }
912         return ret;
913 }
914
915 static int
916 ice_dcf_stats_reset(struct rte_eth_dev *dev)
917 {
918         struct ice_dcf_adapter *ad = dev->data->dev_private;
919         struct ice_dcf_hw *hw = &ad->real_hw;
920         struct virtchnl_eth_stats pstats;
921         int ret;
922
923         if (hw->resetting)
924                 return 0;
925
926         /* read stat values to clear hardware registers */
927         ret = ice_dcf_query_stats(hw, &pstats);
928         if (ret != 0)
929                 return ret;
930
931         /* set stats offset base on current values */
932         hw->eth_stats_offset = pstats;
933
934         return 0;
935 }
936
937 static void
938 ice_dcf_free_repr_info(struct ice_dcf_adapter *dcf_adapter)
939 {
940         if (dcf_adapter->repr_infos) {
941                 rte_free(dcf_adapter->repr_infos);
942                 dcf_adapter->repr_infos = NULL;
943         }
944 }
945
946 static int
947 ice_dcf_init_repr_info(struct ice_dcf_adapter *dcf_adapter)
948 {
949         dcf_adapter->repr_infos =
950                         rte_calloc("ice_dcf_rep_info",
951                                    dcf_adapter->real_hw.num_vfs,
952                                    sizeof(dcf_adapter->repr_infos[0]), 0);
953         if (!dcf_adapter->repr_infos) {
954                 PMD_DRV_LOG(ERR, "Failed to alloc memory for VF representors\n");
955                 return -ENOMEM;
956         }
957
958         return 0;
959 }
960
961 static int
962 ice_dcf_dev_close(struct rte_eth_dev *dev)
963 {
964         struct ice_dcf_adapter *adapter = dev->data->dev_private;
965
966         if (rte_eal_process_type() != RTE_PROC_PRIMARY)
967                 return 0;
968
969         (void)ice_dcf_dev_stop(dev);
970
971         ice_free_queues(dev);
972
973         ice_dcf_free_repr_info(adapter);
974         ice_dcf_uninit_parent_adapter(dev);
975         ice_dcf_uninit_hw(dev, &adapter->real_hw);
976
977         return 0;
978 }
979
980 int
981 ice_dcf_link_update(struct rte_eth_dev *dev,
982                     __rte_unused int wait_to_complete)
983 {
984         struct ice_dcf_adapter *ad = dev->data->dev_private;
985         struct ice_dcf_hw *hw = &ad->real_hw;
986         struct rte_eth_link new_link;
987
988         memset(&new_link, 0, sizeof(new_link));
989
990         /* Only read status info stored in VF, and the info is updated
991          * when receive LINK_CHANGE event from PF by virtchnl.
992          */
993         switch (hw->link_speed) {
994         case 10:
995                 new_link.link_speed = RTE_ETH_SPEED_NUM_10M;
996                 break;
997         case 100:
998                 new_link.link_speed = RTE_ETH_SPEED_NUM_100M;
999                 break;
1000         case 1000:
1001                 new_link.link_speed = RTE_ETH_SPEED_NUM_1G;
1002                 break;
1003         case 10000:
1004                 new_link.link_speed = RTE_ETH_SPEED_NUM_10G;
1005                 break;
1006         case 20000:
1007                 new_link.link_speed = RTE_ETH_SPEED_NUM_20G;
1008                 break;
1009         case 25000:
1010                 new_link.link_speed = RTE_ETH_SPEED_NUM_25G;
1011                 break;
1012         case 40000:
1013                 new_link.link_speed = RTE_ETH_SPEED_NUM_40G;
1014                 break;
1015         case 50000:
1016                 new_link.link_speed = RTE_ETH_SPEED_NUM_50G;
1017                 break;
1018         case 100000:
1019                 new_link.link_speed = RTE_ETH_SPEED_NUM_100G;
1020                 break;
1021         default:
1022                 new_link.link_speed = RTE_ETH_SPEED_NUM_NONE;
1023                 break;
1024         }
1025
1026         new_link.link_duplex = RTE_ETH_LINK_FULL_DUPLEX;
1027         new_link.link_status = hw->link_up ? RTE_ETH_LINK_UP :
1028                                              RTE_ETH_LINK_DOWN;
1029         new_link.link_autoneg = !(dev->data->dev_conf.link_speeds &
1030                                 RTE_ETH_LINK_SPEED_FIXED);
1031
1032         return rte_eth_linkstatus_set(dev, &new_link);
1033 }
1034
1035 bool
1036 ice_dcf_adminq_need_retry(struct ice_adapter *ad)
1037 {
1038         return ad->hw.dcf_enabled &&
1039                !__atomic_load_n(&ad->dcf_state_on, __ATOMIC_RELAXED);
1040 }
1041
1042 /* Add UDP tunneling port */
1043 static int
1044 ice_dcf_dev_udp_tunnel_port_add(struct rte_eth_dev *dev,
1045                                 struct rte_eth_udp_tunnel *udp_tunnel)
1046 {
1047         struct ice_dcf_adapter *adapter = dev->data->dev_private;
1048         struct ice_adapter *parent_adapter = &adapter->parent;
1049         struct ice_hw *parent_hw = &parent_adapter->hw;
1050         int ret = 0;
1051
1052         if (!udp_tunnel)
1053                 return -EINVAL;
1054
1055         switch (udp_tunnel->prot_type) {
1056         case RTE_ETH_TUNNEL_TYPE_VXLAN:
1057                 ret = ice_create_tunnel(parent_hw, TNL_VXLAN,
1058                                         udp_tunnel->udp_port);
1059                 break;
1060         case RTE_ETH_TUNNEL_TYPE_ECPRI:
1061                 ret = ice_create_tunnel(parent_hw, TNL_ECPRI,
1062                                         udp_tunnel->udp_port);
1063                 break;
1064         default:
1065                 PMD_DRV_LOG(ERR, "Invalid tunnel type");
1066                 ret = -EINVAL;
1067                 break;
1068         }
1069
1070         return ret;
1071 }
1072
1073 /* Delete UDP tunneling port */
1074 static int
1075 ice_dcf_dev_udp_tunnel_port_del(struct rte_eth_dev *dev,
1076                                 struct rte_eth_udp_tunnel *udp_tunnel)
1077 {
1078         struct ice_dcf_adapter *adapter = dev->data->dev_private;
1079         struct ice_adapter *parent_adapter = &adapter->parent;
1080         struct ice_hw *parent_hw = &parent_adapter->hw;
1081         int ret = 0;
1082
1083         if (!udp_tunnel)
1084                 return -EINVAL;
1085
1086         switch (udp_tunnel->prot_type) {
1087         case RTE_ETH_TUNNEL_TYPE_VXLAN:
1088         case RTE_ETH_TUNNEL_TYPE_ECPRI:
1089                 ret = ice_destroy_tunnel(parent_hw, udp_tunnel->udp_port, 0);
1090                 break;
1091         default:
1092                 PMD_DRV_LOG(ERR, "Invalid tunnel type");
1093                 ret = -EINVAL;
1094                 break;
1095         }
1096
1097         return ret;
1098 }
1099
1100 static int
1101 ice_dcf_tm_ops_get(struct rte_eth_dev *dev __rte_unused,
1102                 void *arg)
1103 {
1104         if (!arg)
1105                 return -EINVAL;
1106
1107         *(const void **)arg = &ice_dcf_tm_ops;
1108
1109         return 0;
1110 }
1111
1112 static inline void
1113 ice_dcf_reset_hw(struct rte_eth_dev *eth_dev, struct ice_dcf_hw *hw)
1114 {
1115         ice_dcf_uninit_hw(eth_dev, hw);
1116         ice_dcf_init_hw(eth_dev, hw);
1117 }
1118
1119 /* Check if reset has been triggered by PF */
1120 static inline bool
1121 ice_dcf_is_reset(struct rte_eth_dev *dev)
1122 {
1123         struct ice_dcf_adapter *ad = dev->data->dev_private;
1124         struct iavf_hw *hw = &ad->real_hw.avf;
1125
1126         return !(IAVF_READ_REG(hw, IAVF_VF_ARQLEN1) &
1127                  IAVF_VF_ARQLEN1_ARQENABLE_MASK);
1128 }
1129
1130 static int
1131 ice_dcf_dev_reset(struct rte_eth_dev *dev)
1132 {
1133         struct ice_dcf_adapter *ad = dev->data->dev_private;
1134         struct ice_dcf_hw *hw = &ad->real_hw;
1135         int ret;
1136
1137         if (ice_dcf_is_reset(dev)) {
1138                 if (!ad->real_hw.resetting)
1139                         ad->real_hw.resetting = true;
1140                 PMD_DRV_LOG(ERR, "The DCF has been reset by PF");
1141
1142                 /*
1143                  * Simply reset hw to trigger an additional DCF enable/disable
1144                  * cycle which help to workaround the issue that kernel driver
1145                  * may not clean up resource during previous reset.
1146                  */
1147                 ice_dcf_reset_hw(dev, hw);
1148         }
1149
1150         ret = ice_dcf_dev_uninit(dev);
1151         if (ret)
1152                 return ret;
1153
1154         ret = ice_dcf_dev_init(dev);
1155
1156         return ret;
1157 }
1158
1159 static const struct eth_dev_ops ice_dcf_eth_dev_ops = {
1160         .dev_start               = ice_dcf_dev_start,
1161         .dev_stop                = ice_dcf_dev_stop,
1162         .dev_close               = ice_dcf_dev_close,
1163         .dev_reset               = ice_dcf_dev_reset,
1164         .dev_configure           = ice_dcf_dev_configure,
1165         .dev_infos_get           = ice_dcf_dev_info_get,
1166         .rx_queue_setup          = ice_rx_queue_setup,
1167         .tx_queue_setup          = ice_tx_queue_setup,
1168         .rx_queue_release        = ice_dev_rx_queue_release,
1169         .tx_queue_release        = ice_dev_tx_queue_release,
1170         .rx_queue_start          = ice_dcf_rx_queue_start,
1171         .tx_queue_start          = ice_dcf_tx_queue_start,
1172         .rx_queue_stop           = ice_dcf_rx_queue_stop,
1173         .tx_queue_stop           = ice_dcf_tx_queue_stop,
1174         .link_update             = ice_dcf_link_update,
1175         .stats_get               = ice_dcf_stats_get,
1176         .stats_reset             = ice_dcf_stats_reset,
1177         .promiscuous_enable      = ice_dcf_dev_promiscuous_enable,
1178         .promiscuous_disable     = ice_dcf_dev_promiscuous_disable,
1179         .allmulticast_enable     = ice_dcf_dev_allmulticast_enable,
1180         .allmulticast_disable    = ice_dcf_dev_allmulticast_disable,
1181         .flow_ops_get            = ice_dcf_dev_flow_ops_get,
1182         .udp_tunnel_port_add     = ice_dcf_dev_udp_tunnel_port_add,
1183         .udp_tunnel_port_del     = ice_dcf_dev_udp_tunnel_port_del,
1184         .tm_ops_get              = ice_dcf_tm_ops_get,
1185         .reta_update             = ice_dcf_dev_rss_reta_update,
1186         .reta_query              = ice_dcf_dev_rss_reta_query,
1187 };
1188
1189 static int
1190 ice_dcf_dev_init(struct rte_eth_dev *eth_dev)
1191 {
1192         struct ice_dcf_adapter *adapter = eth_dev->data->dev_private;
1193         struct ice_adapter *parent_adapter = &adapter->parent;
1194
1195         eth_dev->dev_ops = &ice_dcf_eth_dev_ops;
1196         eth_dev->rx_pkt_burst = ice_dcf_recv_pkts;
1197         eth_dev->tx_pkt_burst = ice_dcf_xmit_pkts;
1198
1199         if (rte_eal_process_type() != RTE_PROC_PRIMARY)
1200                 return 0;
1201
1202         adapter->real_hw.vc_event_msg_cb = ice_dcf_handle_pf_event_msg;
1203         if (ice_dcf_init_hw(eth_dev, &adapter->real_hw) != 0) {
1204                 PMD_INIT_LOG(ERR, "Failed to init DCF hardware");
1205                 __atomic_store_n(&parent_adapter->dcf_state_on, false,
1206                                  __ATOMIC_RELAXED);
1207                 return -1;
1208         }
1209
1210         __atomic_store_n(&parent_adapter->dcf_state_on, true, __ATOMIC_RELAXED);
1211
1212         if (ice_dcf_init_parent_adapter(eth_dev) != 0) {
1213                 PMD_INIT_LOG(ERR, "Failed to init DCF parent adapter");
1214                 ice_dcf_uninit_hw(eth_dev, &adapter->real_hw);
1215                 return -1;
1216         }
1217
1218         return 0;
1219 }
1220
1221 static int
1222 ice_dcf_dev_uninit(struct rte_eth_dev *eth_dev)
1223 {
1224         ice_dcf_dev_close(eth_dev);
1225
1226         return 0;
1227 }
1228
1229 static int
1230 ice_dcf_cap_check_handler(__rte_unused const char *key,
1231                           const char *value, __rte_unused void *opaque)
1232 {
1233         if (strcmp(value, "dcf"))
1234                 return -1;
1235
1236         return 0;
1237 }
1238
1239 static int
1240 ice_dcf_cap_selected(struct rte_devargs *devargs)
1241 {
1242         struct rte_kvargs *kvlist;
1243         const char *key = "cap";
1244         int ret = 0;
1245
1246         if (devargs == NULL)
1247                 return 0;
1248
1249         kvlist = rte_kvargs_parse(devargs->args, NULL);
1250         if (kvlist == NULL)
1251                 return 0;
1252
1253         if (!rte_kvargs_count(kvlist, key))
1254                 goto exit;
1255
1256         /* dcf capability selected when there's a key-value pair: cap=dcf */
1257         if (rte_kvargs_process(kvlist, key,
1258                                ice_dcf_cap_check_handler, NULL) < 0)
1259                 goto exit;
1260
1261         ret = 1;
1262
1263 exit:
1264         rte_kvargs_free(kvlist);
1265         return ret;
1266 }
1267
1268 static int
1269 eth_ice_dcf_pci_probe(__rte_unused struct rte_pci_driver *pci_drv,
1270                       struct rte_pci_device *pci_dev)
1271 {
1272         struct rte_eth_devargs eth_da = { .nb_representor_ports = 0 };
1273         struct ice_dcf_vf_repr_param repr_param;
1274         char repr_name[RTE_ETH_NAME_MAX_LEN];
1275         struct ice_dcf_adapter *dcf_adapter;
1276         struct rte_eth_dev *dcf_ethdev;
1277         uint16_t dcf_vsi_id;
1278         int i, ret;
1279
1280         if (!ice_dcf_cap_selected(pci_dev->device.devargs))
1281                 return 1;
1282
1283         ret = rte_eth_devargs_parse(pci_dev->device.devargs->args, &eth_da);
1284         if (ret)
1285                 return ret;
1286
1287         ret = rte_eth_dev_pci_generic_probe(pci_dev,
1288                                             sizeof(struct ice_dcf_adapter),
1289                                             ice_dcf_dev_init);
1290         if (ret || !eth_da.nb_representor_ports)
1291                 return ret;
1292         if (eth_da.type != RTE_ETH_REPRESENTOR_VF)
1293                 return -ENOTSUP;
1294
1295         dcf_ethdev = rte_eth_dev_allocated(pci_dev->device.name);
1296         if (dcf_ethdev == NULL)
1297                 return -ENODEV;
1298
1299         dcf_adapter = dcf_ethdev->data->dev_private;
1300         ret = ice_dcf_init_repr_info(dcf_adapter);
1301         if (ret)
1302                 return ret;
1303
1304         if (eth_da.nb_representor_ports > dcf_adapter->real_hw.num_vfs ||
1305             eth_da.nb_representor_ports >= RTE_MAX_ETHPORTS) {
1306                 PMD_DRV_LOG(ERR, "the number of port representors is too large: %u",
1307                             eth_da.nb_representor_ports);
1308                 ice_dcf_free_repr_info(dcf_adapter);
1309                 return -EINVAL;
1310         }
1311
1312         dcf_vsi_id = dcf_adapter->real_hw.vsi_id | VIRTCHNL_DCF_VF_VSI_VALID;
1313
1314         repr_param.dcf_eth_dev = dcf_ethdev;
1315         repr_param.switch_domain_id = 0;
1316
1317         for (i = 0; i < eth_da.nb_representor_ports; i++) {
1318                 uint16_t vf_id = eth_da.representor_ports[i];
1319                 struct rte_eth_dev *vf_rep_eth_dev;
1320
1321                 if (vf_id >= dcf_adapter->real_hw.num_vfs) {
1322                         PMD_DRV_LOG(ERR, "VF ID %u is out of range (0 ~ %u)",
1323                                     vf_id, dcf_adapter->real_hw.num_vfs - 1);
1324                         ret = -EINVAL;
1325                         break;
1326                 }
1327
1328                 if (dcf_adapter->real_hw.vf_vsi_map[vf_id] == dcf_vsi_id) {
1329                         PMD_DRV_LOG(ERR, "VF ID %u is DCF's ID.\n", vf_id);
1330                         ret = -EINVAL;
1331                         break;
1332                 }
1333
1334                 repr_param.vf_id = vf_id;
1335                 snprintf(repr_name, sizeof(repr_name), "net_%s_representor_%u",
1336                          pci_dev->device.name, vf_id);
1337                 ret = rte_eth_dev_create(&pci_dev->device, repr_name,
1338                                          sizeof(struct ice_dcf_vf_repr),
1339                                          NULL, NULL, ice_dcf_vf_repr_init,
1340                                          &repr_param);
1341                 if (ret) {
1342                         PMD_DRV_LOG(ERR, "failed to create DCF VF representor %s",
1343                                     repr_name);
1344                         break;
1345                 }
1346
1347                 vf_rep_eth_dev = rte_eth_dev_allocated(repr_name);
1348                 if (!vf_rep_eth_dev) {
1349                         PMD_DRV_LOG(ERR,
1350                                     "Failed to find the ethdev for DCF VF representor: %s",
1351                                     repr_name);
1352                         ret = -ENODEV;
1353                         break;
1354                 }
1355
1356                 dcf_adapter->repr_infos[vf_id].vf_rep_eth_dev = vf_rep_eth_dev;
1357                 dcf_adapter->num_reprs++;
1358         }
1359
1360         return ret;
1361 }
1362
1363 static int
1364 eth_ice_dcf_pci_remove(struct rte_pci_device *pci_dev)
1365 {
1366         struct rte_eth_dev *eth_dev;
1367
1368         eth_dev = rte_eth_dev_allocated(pci_dev->device.name);
1369         if (!eth_dev)
1370                 return 0;
1371
1372         if (eth_dev->data->dev_flags & RTE_ETH_DEV_REPRESENTOR)
1373                 return rte_eth_dev_pci_generic_remove(pci_dev,
1374                                                       ice_dcf_vf_repr_uninit);
1375         else
1376                 return rte_eth_dev_pci_generic_remove(pci_dev,
1377                                                       ice_dcf_dev_uninit);
1378 }
1379
1380 static const struct rte_pci_id pci_id_ice_dcf_map[] = {
1381         { RTE_PCI_DEVICE(IAVF_INTEL_VENDOR_ID, IAVF_DEV_ID_ADAPTIVE_VF) },
1382         { .vendor_id = 0, /* sentinel */ },
1383 };
1384
1385 static struct rte_pci_driver rte_ice_dcf_pmd = {
1386         .id_table = pci_id_ice_dcf_map,
1387         .drv_flags = RTE_PCI_DRV_NEED_MAPPING,
1388         .probe = eth_ice_dcf_pci_probe,
1389         .remove = eth_ice_dcf_pci_remove,
1390 };
1391
1392 RTE_PMD_REGISTER_PCI(net_ice_dcf, rte_ice_dcf_pmd);
1393 RTE_PMD_REGISTER_PCI_TABLE(net_ice_dcf, pci_id_ice_dcf_map);
1394 RTE_PMD_REGISTER_KMOD_DEP(net_ice_dcf, "* igb_uio | vfio-pci");
1395 RTE_PMD_REGISTER_PARAM_STRING(net_ice_dcf, "cap=dcf");