d2fa1682561b6ad4654eecf01f861598f55c621a
[dpdk.git] / drivers / net / iavf / iavf_ethdev.c
1 /* SPDX-License-Identifier: BSD-3-Clause
2  * Copyright(c) 2017 Intel Corporation
3  */
4
5 #include <sys/queue.h>
6 #include <stdio.h>
7 #include <errno.h>
8 #include <stdint.h>
9 #include <string.h>
10 #include <unistd.h>
11 #include <stdarg.h>
12 #include <inttypes.h>
13 #include <rte_byteorder.h>
14 #include <rte_common.h>
15
16 #include <rte_interrupts.h>
17 #include <rte_debug.h>
18 #include <rte_pci.h>
19 #include <rte_atomic.h>
20 #include <rte_eal.h>
21 #include <rte_ether.h>
22 #include <rte_ethdev_driver.h>
23 #include <rte_ethdev_pci.h>
24 #include <rte_malloc.h>
25 #include <rte_memzone.h>
26 #include <rte_dev.h>
27
28 #include "iavf.h"
29 #include "iavf_rxtx.h"
30 #include "iavf_generic_flow.h"
31 #include "rte_pmd_iavf.h"
32
33 /* devargs */
34 #define IAVF_PROTO_XTR_ARG         "proto_xtr"
35
36 static const char * const iavf_valid_args[] = {
37         IAVF_PROTO_XTR_ARG,
38         NULL
39 };
40
41 static const struct rte_mbuf_dynfield iavf_proto_xtr_metadata_param = {
42         .name = "intel_pmd_dynfield_proto_xtr_metadata",
43         .size = sizeof(uint32_t),
44         .align = __alignof__(uint32_t),
45         .flags = 0,
46 };
47
48 struct iavf_proto_xtr_ol {
49         const struct rte_mbuf_dynflag param;
50         uint64_t *ol_flag;
51         bool required;
52 };
53
54 static struct iavf_proto_xtr_ol iavf_proto_xtr_params[] = {
55         [IAVF_PROTO_XTR_VLAN] = {
56                 .param = { .name = "intel_pmd_dynflag_proto_xtr_vlan" },
57                 .ol_flag = &rte_pmd_ifd_dynflag_proto_xtr_vlan_mask },
58         [IAVF_PROTO_XTR_IPV4] = {
59                 .param = { .name = "intel_pmd_dynflag_proto_xtr_ipv4" },
60                 .ol_flag = &rte_pmd_ifd_dynflag_proto_xtr_ipv4_mask },
61         [IAVF_PROTO_XTR_IPV6] = {
62                 .param = { .name = "intel_pmd_dynflag_proto_xtr_ipv6" },
63                 .ol_flag = &rte_pmd_ifd_dynflag_proto_xtr_ipv6_mask },
64         [IAVF_PROTO_XTR_IPV6_FLOW] = {
65                 .param = { .name = "intel_pmd_dynflag_proto_xtr_ipv6_flow" },
66                 .ol_flag = &rte_pmd_ifd_dynflag_proto_xtr_ipv6_flow_mask },
67         [IAVF_PROTO_XTR_TCP] = {
68                 .param = { .name = "intel_pmd_dynflag_proto_xtr_tcp" },
69                 .ol_flag = &rte_pmd_ifd_dynflag_proto_xtr_tcp_mask },
70         [IAVF_PROTO_XTR_IP_OFFSET] = {
71                 .param = { .name = "intel_pmd_dynflag_proto_xtr_ip_offset" },
72                 .ol_flag = &rte_pmd_ifd_dynflag_proto_xtr_ip_offset_mask },
73 };
74
75 static int iavf_dev_configure(struct rte_eth_dev *dev);
76 static int iavf_dev_start(struct rte_eth_dev *dev);
77 static int iavf_dev_stop(struct rte_eth_dev *dev);
78 static int iavf_dev_close(struct rte_eth_dev *dev);
79 static int iavf_dev_reset(struct rte_eth_dev *dev);
80 static int iavf_dev_info_get(struct rte_eth_dev *dev,
81                              struct rte_eth_dev_info *dev_info);
82 static const uint32_t *iavf_dev_supported_ptypes_get(struct rte_eth_dev *dev);
83 static int iavf_dev_stats_get(struct rte_eth_dev *dev,
84                              struct rte_eth_stats *stats);
85 static int iavf_dev_stats_reset(struct rte_eth_dev *dev);
86 static int iavf_dev_xstats_get(struct rte_eth_dev *dev,
87                                  struct rte_eth_xstat *xstats, unsigned int n);
88 static int iavf_dev_xstats_get_names(struct rte_eth_dev *dev,
89                                        struct rte_eth_xstat_name *xstats_names,
90                                        unsigned int limit);
91 static int iavf_dev_promiscuous_enable(struct rte_eth_dev *dev);
92 static int iavf_dev_promiscuous_disable(struct rte_eth_dev *dev);
93 static int iavf_dev_allmulticast_enable(struct rte_eth_dev *dev);
94 static int iavf_dev_allmulticast_disable(struct rte_eth_dev *dev);
95 static int iavf_dev_add_mac_addr(struct rte_eth_dev *dev,
96                                 struct rte_ether_addr *addr,
97                                 uint32_t index,
98                                 uint32_t pool);
99 static void iavf_dev_del_mac_addr(struct rte_eth_dev *dev, uint32_t index);
100 static int iavf_dev_vlan_filter_set(struct rte_eth_dev *dev,
101                                    uint16_t vlan_id, int on);
102 static int iavf_dev_vlan_offload_set(struct rte_eth_dev *dev, int mask);
103 static int iavf_dev_rss_reta_update(struct rte_eth_dev *dev,
104                                    struct rte_eth_rss_reta_entry64 *reta_conf,
105                                    uint16_t reta_size);
106 static int iavf_dev_rss_reta_query(struct rte_eth_dev *dev,
107                                   struct rte_eth_rss_reta_entry64 *reta_conf,
108                                   uint16_t reta_size);
109 static int iavf_dev_rss_hash_update(struct rte_eth_dev *dev,
110                                    struct rte_eth_rss_conf *rss_conf);
111 static int iavf_dev_rss_hash_conf_get(struct rte_eth_dev *dev,
112                                      struct rte_eth_rss_conf *rss_conf);
113 static int iavf_dev_mtu_set(struct rte_eth_dev *dev, uint16_t mtu);
114 static int iavf_dev_set_default_mac_addr(struct rte_eth_dev *dev,
115                                          struct rte_ether_addr *mac_addr);
116 static int iavf_dev_rx_queue_intr_enable(struct rte_eth_dev *dev,
117                                         uint16_t queue_id);
118 static int iavf_dev_rx_queue_intr_disable(struct rte_eth_dev *dev,
119                                          uint16_t queue_id);
120 static int iavf_dev_filter_ctrl(struct rte_eth_dev *dev,
121                      enum rte_filter_type filter_type,
122                      enum rte_filter_op filter_op,
123                      void *arg);
124 static int iavf_set_mc_addr_list(struct rte_eth_dev *dev,
125                         struct rte_ether_addr *mc_addrs,
126                         uint32_t mc_addrs_num);
127
128 static const struct rte_pci_id pci_id_iavf_map[] = {
129         { RTE_PCI_DEVICE(IAVF_INTEL_VENDOR_ID, IAVF_DEV_ID_ADAPTIVE_VF) },
130         { .vendor_id = 0, /* sentinel */ },
131 };
132
133 struct rte_iavf_xstats_name_off {
134         char name[RTE_ETH_XSTATS_NAME_SIZE];
135         unsigned int offset;
136 };
137
138 static const struct rte_iavf_xstats_name_off rte_iavf_stats_strings[] = {
139         {"rx_bytes", offsetof(struct iavf_eth_stats, rx_bytes)},
140         {"rx_unicast_packets", offsetof(struct iavf_eth_stats, rx_unicast)},
141         {"rx_multicast_packets", offsetof(struct iavf_eth_stats, rx_multicast)},
142         {"rx_broadcast_packets", offsetof(struct iavf_eth_stats, rx_broadcast)},
143         {"rx_dropped_packets", offsetof(struct iavf_eth_stats, rx_discards)},
144         {"rx_unknown_protocol_packets", offsetof(struct iavf_eth_stats,
145                 rx_unknown_protocol)},
146         {"tx_bytes", offsetof(struct iavf_eth_stats, tx_bytes)},
147         {"tx_unicast_packets", offsetof(struct iavf_eth_stats, tx_unicast)},
148         {"tx_multicast_packets", offsetof(struct iavf_eth_stats, tx_multicast)},
149         {"tx_broadcast_packets", offsetof(struct iavf_eth_stats, tx_broadcast)},
150         {"tx_dropped_packets", offsetof(struct iavf_eth_stats, tx_discards)},
151         {"tx_error_packets", offsetof(struct iavf_eth_stats, tx_errors)},
152 };
153
154 #define IAVF_NB_XSTATS (sizeof(rte_iavf_stats_strings) / \
155                 sizeof(rte_iavf_stats_strings[0]))
156
157 static const struct eth_dev_ops iavf_eth_dev_ops = {
158         .dev_configure              = iavf_dev_configure,
159         .dev_start                  = iavf_dev_start,
160         .dev_stop                   = iavf_dev_stop,
161         .dev_close                  = iavf_dev_close,
162         .dev_reset                  = iavf_dev_reset,
163         .dev_infos_get              = iavf_dev_info_get,
164         .dev_supported_ptypes_get   = iavf_dev_supported_ptypes_get,
165         .link_update                = iavf_dev_link_update,
166         .stats_get                  = iavf_dev_stats_get,
167         .stats_reset                = iavf_dev_stats_reset,
168         .xstats_get                 = iavf_dev_xstats_get,
169         .xstats_get_names           = iavf_dev_xstats_get_names,
170         .xstats_reset               = iavf_dev_stats_reset,
171         .promiscuous_enable         = iavf_dev_promiscuous_enable,
172         .promiscuous_disable        = iavf_dev_promiscuous_disable,
173         .allmulticast_enable        = iavf_dev_allmulticast_enable,
174         .allmulticast_disable       = iavf_dev_allmulticast_disable,
175         .mac_addr_add               = iavf_dev_add_mac_addr,
176         .mac_addr_remove            = iavf_dev_del_mac_addr,
177         .set_mc_addr_list                       = iavf_set_mc_addr_list,
178         .vlan_filter_set            = iavf_dev_vlan_filter_set,
179         .vlan_offload_set           = iavf_dev_vlan_offload_set,
180         .rx_queue_start             = iavf_dev_rx_queue_start,
181         .rx_queue_stop              = iavf_dev_rx_queue_stop,
182         .tx_queue_start             = iavf_dev_tx_queue_start,
183         .tx_queue_stop              = iavf_dev_tx_queue_stop,
184         .rx_queue_setup             = iavf_dev_rx_queue_setup,
185         .rx_queue_release           = iavf_dev_rx_queue_release,
186         .tx_queue_setup             = iavf_dev_tx_queue_setup,
187         .tx_queue_release           = iavf_dev_tx_queue_release,
188         .mac_addr_set               = iavf_dev_set_default_mac_addr,
189         .reta_update                = iavf_dev_rss_reta_update,
190         .reta_query                 = iavf_dev_rss_reta_query,
191         .rss_hash_update            = iavf_dev_rss_hash_update,
192         .rss_hash_conf_get          = iavf_dev_rss_hash_conf_get,
193         .rxq_info_get               = iavf_dev_rxq_info_get,
194         .txq_info_get               = iavf_dev_txq_info_get,
195         .mtu_set                    = iavf_dev_mtu_set,
196         .rx_queue_intr_enable       = iavf_dev_rx_queue_intr_enable,
197         .rx_queue_intr_disable      = iavf_dev_rx_queue_intr_disable,
198         .filter_ctrl                = iavf_dev_filter_ctrl,
199         .tx_done_cleanup            = iavf_dev_tx_done_cleanup,
200 };
201
202 static int
203 iavf_set_mc_addr_list(struct rte_eth_dev *dev,
204                         struct rte_ether_addr *mc_addrs,
205                         uint32_t mc_addrs_num)
206 {
207         struct iavf_info *vf = IAVF_DEV_PRIVATE_TO_VF(dev->data->dev_private);
208         struct iavf_adapter *adapter =
209                 IAVF_DEV_PRIVATE_TO_ADAPTER(dev->data->dev_private);
210         int err, ret;
211
212         if (mc_addrs_num > IAVF_NUM_MACADDR_MAX) {
213                 PMD_DRV_LOG(ERR,
214                             "can't add more than a limited number (%u) of addresses.",
215                             (uint32_t)IAVF_NUM_MACADDR_MAX);
216                 return -EINVAL;
217         }
218
219         /* flush previous addresses */
220         err = iavf_add_del_mc_addr_list(adapter, vf->mc_addrs, vf->mc_addrs_num,
221                                         false);
222         if (err)
223                 return err;
224
225         /* add new ones */
226         err = iavf_add_del_mc_addr_list(adapter, mc_addrs, mc_addrs_num, true);
227
228         if (err) {
229                 /* if adding mac address list fails, should add the previous
230                  * addresses back.
231                  */
232                 ret = iavf_add_del_mc_addr_list(adapter, vf->mc_addrs,
233                                                 vf->mc_addrs_num, true);
234                 if (ret)
235                         return ret;
236         } else {
237                 vf->mc_addrs_num = mc_addrs_num;
238                 memcpy(vf->mc_addrs,
239                        mc_addrs, mc_addrs_num * sizeof(*mc_addrs));
240         }
241
242         return err;
243 }
244
245 static int
246 iavf_init_rss(struct iavf_adapter *adapter)
247 {
248         struct iavf_info *vf =  IAVF_DEV_PRIVATE_TO_VF(adapter);
249         struct rte_eth_rss_conf *rss_conf;
250         uint16_t i, j, nb_q;
251         int ret;
252
253         rss_conf = &adapter->eth_dev->data->dev_conf.rx_adv_conf.rss_conf;
254         nb_q = RTE_MIN(adapter->eth_dev->data->nb_rx_queues,
255                        vf->max_rss_qregion);
256
257         if (!(vf->vf_res->vf_cap_flags & VIRTCHNL_VF_OFFLOAD_RSS_PF)) {
258                 PMD_DRV_LOG(DEBUG, "RSS is not supported");
259                 return -ENOTSUP;
260         }
261         if (adapter->eth_dev->data->dev_conf.rxmode.mq_mode != ETH_MQ_RX_RSS) {
262                 PMD_DRV_LOG(WARNING, "RSS is enabled by PF by default");
263                 /* set all lut items to default queue */
264                 for (i = 0; i < vf->vf_res->rss_lut_size; i++)
265                         vf->rss_lut[i] = 0;
266                 ret = iavf_configure_rss_lut(adapter);
267                 return ret;
268         }
269
270         /* configure RSS key */
271         if (!rss_conf->rss_key) {
272                 /* Calculate the default hash key */
273                 for (i = 0; i <= vf->vf_res->rss_key_size; i++)
274                         vf->rss_key[i] = (uint8_t)rte_rand();
275         } else
276                 rte_memcpy(vf->rss_key, rss_conf->rss_key,
277                            RTE_MIN(rss_conf->rss_key_len,
278                                    vf->vf_res->rss_key_size));
279
280         /* init RSS LUT table */
281         for (i = 0, j = 0; i < vf->vf_res->rss_lut_size; i++, j++) {
282                 if (j >= nb_q)
283                         j = 0;
284                 vf->rss_lut[i] = j;
285         }
286         /* send virtchnnl ops to configure rss*/
287         ret = iavf_configure_rss_lut(adapter);
288         if (ret)
289                 return ret;
290         ret = iavf_configure_rss_key(adapter);
291         if (ret)
292                 return ret;
293
294         /* Set RSS hash configuration based on rss_conf->rss_hf. */
295         ret = iavf_rss_hash_set(adapter, rss_conf->rss_hf, true);
296         if (ret) {
297                 PMD_DRV_LOG(ERR, "fail to set default RSS");
298                 return ret;
299         }
300
301         return 0;
302 }
303
304 static int
305 iavf_queues_req_reset(struct rte_eth_dev *dev, uint16_t num)
306 {
307         struct iavf_adapter *ad =
308                 IAVF_DEV_PRIVATE_TO_ADAPTER(dev->data->dev_private);
309         struct iavf_info *vf =  IAVF_DEV_PRIVATE_TO_VF(ad);
310         int ret;
311
312         ret = iavf_request_queues(ad, num);
313         if (ret) {
314                 PMD_DRV_LOG(ERR, "request queues from PF failed");
315                 return ret;
316         }
317         PMD_DRV_LOG(INFO, "change queue pairs from %u to %u",
318                         vf->vsi_res->num_queue_pairs, num);
319
320         ret = iavf_dev_reset(dev);
321         if (ret) {
322                 PMD_DRV_LOG(ERR, "vf reset failed");
323                 return ret;
324         }
325
326         return 0;
327 }
328
329 static int
330 iavf_dev_configure(struct rte_eth_dev *dev)
331 {
332         struct iavf_adapter *ad =
333                 IAVF_DEV_PRIVATE_TO_ADAPTER(dev->data->dev_private);
334         struct iavf_info *vf =  IAVF_DEV_PRIVATE_TO_VF(ad);
335         struct rte_eth_conf *dev_conf = &dev->data->dev_conf;
336         uint16_t num_queue_pairs = RTE_MAX(dev->data->nb_rx_queues,
337                 dev->data->nb_tx_queues);
338         int ret;
339
340         ad->rx_bulk_alloc_allowed = true;
341         /* Initialize to TRUE. If any of Rx queues doesn't meet the
342          * vector Rx/Tx preconditions, it will be reset.
343          */
344         ad->rx_vec_allowed = true;
345         ad->tx_vec_allowed = true;
346
347         if (dev->data->dev_conf.rxmode.mq_mode & ETH_MQ_RX_RSS_FLAG)
348                 dev->data->dev_conf.rxmode.offloads |= DEV_RX_OFFLOAD_RSS_HASH;
349
350         /* Large VF setting */
351         if (num_queue_pairs > IAVF_MAX_NUM_QUEUES_DFLT) {
352                 if (!(vf->vf_res->vf_cap_flags &
353                                 VIRTCHNL_VF_LARGE_NUM_QPAIRS)) {
354                         PMD_DRV_LOG(ERR, "large VF is not supported");
355                         return -1;
356                 }
357
358                 if (num_queue_pairs > IAVF_MAX_NUM_QUEUES_LV) {
359                         PMD_DRV_LOG(ERR, "queue pairs number cannot be larger than %u",
360                                 IAVF_MAX_NUM_QUEUES_LV);
361                         return -1;
362                 }
363
364                 ret = iavf_queues_req_reset(dev, num_queue_pairs);
365                 if (ret)
366                         return ret;
367
368                 ret = iavf_get_max_rss_queue_region(ad);
369                 if (ret) {
370                         PMD_INIT_LOG(ERR, "get max rss queue region failed");
371                         return ret;
372                 }
373
374                 vf->lv_enabled = true;
375         } else {
376                 /* Check if large VF is already enabled. If so, disable and
377                  * release redundant queue resource.
378                  */
379                 if (vf->lv_enabled) {
380                         ret = iavf_queues_req_reset(dev, num_queue_pairs);
381                         if (ret)
382                                 return ret;
383
384                         vf->lv_enabled = false;
385                 }
386                 /* if large VF is not required, use default rss queue region */
387                 vf->max_rss_qregion = IAVF_MAX_NUM_QUEUES_DFLT;
388         }
389
390         /* Vlan stripping setting */
391         if (vf->vf_res->vf_cap_flags & VIRTCHNL_VF_OFFLOAD_VLAN) {
392                 if (dev_conf->rxmode.offloads & DEV_RX_OFFLOAD_VLAN_STRIP)
393                         iavf_enable_vlan_strip(ad);
394                 else
395                         iavf_disable_vlan_strip(ad);
396         }
397
398         if (vf->vf_res->vf_cap_flags & VIRTCHNL_VF_OFFLOAD_RSS_PF) {
399                 if (iavf_init_rss(ad) != 0) {
400                         PMD_DRV_LOG(ERR, "configure rss failed");
401                         return -1;
402                 }
403         }
404         return 0;
405 }
406
407 static int
408 iavf_init_rxq(struct rte_eth_dev *dev, struct iavf_rx_queue *rxq)
409 {
410         struct iavf_hw *hw = IAVF_DEV_PRIVATE_TO_HW(dev->data->dev_private);
411         struct rte_eth_dev_data *dev_data = dev->data;
412         uint16_t buf_size, max_pkt_len, len;
413
414         buf_size = rte_pktmbuf_data_room_size(rxq->mp) - RTE_PKTMBUF_HEADROOM;
415
416         /* Calculate the maximum packet length allowed */
417         len = rxq->rx_buf_len * IAVF_MAX_CHAINED_RX_BUFFERS;
418         max_pkt_len = RTE_MIN(len, dev->data->dev_conf.rxmode.max_rx_pkt_len);
419
420         /* Check if the jumbo frame and maximum packet length are set
421          * correctly.
422          */
423         if (dev->data->dev_conf.rxmode.offloads & DEV_RX_OFFLOAD_JUMBO_FRAME) {
424                 if (max_pkt_len <= RTE_ETHER_MAX_LEN ||
425                     max_pkt_len > IAVF_FRAME_SIZE_MAX) {
426                         PMD_DRV_LOG(ERR, "maximum packet length must be "
427                                     "larger than %u and smaller than %u, "
428                                     "as jumbo frame is enabled",
429                                     (uint32_t)RTE_ETHER_MAX_LEN,
430                                     (uint32_t)IAVF_FRAME_SIZE_MAX);
431                         return -EINVAL;
432                 }
433         } else {
434                 if (max_pkt_len < RTE_ETHER_MIN_LEN ||
435                     max_pkt_len > RTE_ETHER_MAX_LEN) {
436                         PMD_DRV_LOG(ERR, "maximum packet length must be "
437                                     "larger than %u and smaller than %u, "
438                                     "as jumbo frame is disabled",
439                                     (uint32_t)RTE_ETHER_MIN_LEN,
440                                     (uint32_t)RTE_ETHER_MAX_LEN);
441                         return -EINVAL;
442                 }
443         }
444
445         rxq->max_pkt_len = max_pkt_len;
446         if ((dev_data->dev_conf.rxmode.offloads & DEV_RX_OFFLOAD_SCATTER) ||
447             rxq->max_pkt_len > buf_size) {
448                 dev_data->scattered_rx = 1;
449         }
450         IAVF_PCI_REG_WRITE(rxq->qrx_tail, rxq->nb_rx_desc - 1);
451         IAVF_WRITE_FLUSH(hw);
452
453         return 0;
454 }
455
456 static int
457 iavf_init_queues(struct rte_eth_dev *dev)
458 {
459         struct iavf_rx_queue **rxq =
460                 (struct iavf_rx_queue **)dev->data->rx_queues;
461         int i, ret = IAVF_SUCCESS;
462
463         for (i = 0; i < dev->data->nb_rx_queues; i++) {
464                 if (!rxq[i] || !rxq[i]->q_set)
465                         continue;
466                 ret = iavf_init_rxq(dev, rxq[i]);
467                 if (ret != IAVF_SUCCESS)
468                         break;
469         }
470         /* set rx/tx function to vector/scatter/single-segment
471          * according to parameters
472          */
473         iavf_set_rx_function(dev);
474         iavf_set_tx_function(dev);
475
476         return ret;
477 }
478
479 static int iavf_config_rx_queues_irqs(struct rte_eth_dev *dev,
480                                      struct rte_intr_handle *intr_handle)
481 {
482         struct iavf_adapter *adapter =
483                 IAVF_DEV_PRIVATE_TO_ADAPTER(dev->data->dev_private);
484         struct iavf_info *vf = IAVF_DEV_PRIVATE_TO_VF(adapter);
485         struct iavf_hw *hw = IAVF_DEV_PRIVATE_TO_HW(adapter);
486         struct iavf_qv_map *qv_map;
487         uint16_t interval, i;
488         int vec;
489
490         if (rte_intr_cap_multiple(intr_handle) &&
491             dev->data->dev_conf.intr_conf.rxq) {
492                 if (rte_intr_efd_enable(intr_handle, dev->data->nb_rx_queues))
493                         return -1;
494         }
495
496         if (rte_intr_dp_is_en(intr_handle) && !intr_handle->intr_vec) {
497                 intr_handle->intr_vec =
498                         rte_zmalloc("intr_vec",
499                                     dev->data->nb_rx_queues * sizeof(int), 0);
500                 if (!intr_handle->intr_vec) {
501                         PMD_DRV_LOG(ERR, "Failed to allocate %d rx intr_vec",
502                                     dev->data->nb_rx_queues);
503                         return -1;
504                 }
505         }
506
507         qv_map = rte_zmalloc("qv_map",
508                 dev->data->nb_rx_queues * sizeof(struct iavf_qv_map), 0);
509         if (!qv_map) {
510                 PMD_DRV_LOG(ERR, "Failed to allocate %d queue-vector map",
511                                 dev->data->nb_rx_queues);
512                 return -1;
513         }
514
515         if (!dev->data->dev_conf.intr_conf.rxq ||
516             !rte_intr_dp_is_en(intr_handle)) {
517                 /* Rx interrupt disabled, Map interrupt only for writeback */
518                 vf->nb_msix = 1;
519                 if (vf->vf_res->vf_cap_flags &
520                     VIRTCHNL_VF_OFFLOAD_WB_ON_ITR) {
521                         /* If WB_ON_ITR supports, enable it */
522                         vf->msix_base = IAVF_RX_VEC_START;
523                         /* Set the ITR for index zero, to 2us to make sure that
524                          * we leave time for aggregation to occur, but don't
525                          * increase latency dramatically.
526                          */
527                         IAVF_WRITE_REG(hw,
528                                        IAVF_VFINT_DYN_CTLN1(vf->msix_base - 1),
529                                        (0 << IAVF_VFINT_DYN_CTLN1_ITR_INDX_SHIFT) |
530                                        IAVF_VFINT_DYN_CTLN1_WB_ON_ITR_MASK |
531                                        (2UL << IAVF_VFINT_DYN_CTLN1_INTERVAL_SHIFT));
532                         /* debug - check for success! the return value
533                          * should be 2, offset is 0x2800
534                          */
535                         /* IAVF_READ_REG(hw, IAVF_VFINT_ITRN1(0, 0)); */
536                 } else {
537                         /* If no WB_ON_ITR offload flags, need to set
538                          * interrupt for descriptor write back.
539                          */
540                         vf->msix_base = IAVF_MISC_VEC_ID;
541
542                         /* set ITR to max */
543                         interval = iavf_calc_itr_interval(
544                                         IAVF_QUEUE_ITR_INTERVAL_MAX);
545                         IAVF_WRITE_REG(hw, IAVF_VFINT_DYN_CTL01,
546                                        IAVF_VFINT_DYN_CTL01_INTENA_MASK |
547                                        (IAVF_ITR_INDEX_DEFAULT <<
548                                         IAVF_VFINT_DYN_CTL01_ITR_INDX_SHIFT) |
549                                        (interval <<
550                                         IAVF_VFINT_DYN_CTL01_INTERVAL_SHIFT));
551                 }
552                 IAVF_WRITE_FLUSH(hw);
553                 /* map all queues to the same interrupt */
554                 for (i = 0; i < dev->data->nb_rx_queues; i++) {
555                         qv_map[i].queue_id = i;
556                         qv_map[i].vector_id = vf->msix_base;
557                 }
558                 vf->qv_map = qv_map;
559         } else {
560                 if (!rte_intr_allow_others(intr_handle)) {
561                         vf->nb_msix = 1;
562                         vf->msix_base = IAVF_MISC_VEC_ID;
563                         for (i = 0; i < dev->data->nb_rx_queues; i++) {
564                                 qv_map[i].queue_id = i;
565                                 qv_map[i].vector_id = vf->msix_base;
566                                 intr_handle->intr_vec[i] = IAVF_MISC_VEC_ID;
567                         }
568                         vf->qv_map = qv_map;
569                         PMD_DRV_LOG(DEBUG,
570                                     "vector %u are mapping to all Rx queues",
571                                     vf->msix_base);
572                 } else {
573                         /* If Rx interrupt is reuquired, and we can use
574                          * multi interrupts, then the vec is from 1
575                          */
576                         vf->nb_msix = RTE_MIN(vf->vf_res->max_vectors,
577                                               intr_handle->nb_efd);
578                         vf->msix_base = IAVF_RX_VEC_START;
579                         vec = IAVF_RX_VEC_START;
580                         for (i = 0; i < dev->data->nb_rx_queues; i++) {
581                                 qv_map[i].queue_id = i;
582                                 qv_map[i].vector_id = vec;
583                                 intr_handle->intr_vec[i] = vec++;
584                                 if (vec >= vf->nb_msix)
585                                         vec = IAVF_RX_VEC_START;
586                         }
587                         vf->qv_map = qv_map;
588                         PMD_DRV_LOG(DEBUG,
589                                     "%u vectors are mapping to %u Rx queues",
590                                     vf->nb_msix, dev->data->nb_rx_queues);
591                 }
592         }
593
594         if (!vf->lv_enabled) {
595                 if (iavf_config_irq_map(adapter)) {
596                         PMD_DRV_LOG(ERR, "config interrupt mapping failed");
597                         return -1;
598                 }
599         } else {
600                 uint16_t num_qv_maps = dev->data->nb_rx_queues;
601                 uint16_t index = 0;
602
603                 while (num_qv_maps > IAVF_IRQ_MAP_NUM_PER_BUF) {
604                         if (iavf_config_irq_map_lv(adapter,
605                                         IAVF_IRQ_MAP_NUM_PER_BUF, index)) {
606                                 PMD_DRV_LOG(ERR, "config interrupt mapping for large VF failed");
607                                 return -1;
608                         }
609                         num_qv_maps -= IAVF_IRQ_MAP_NUM_PER_BUF;
610                         index += IAVF_IRQ_MAP_NUM_PER_BUF;
611                 }
612
613                 if (iavf_config_irq_map_lv(adapter, num_qv_maps, index)) {
614                         PMD_DRV_LOG(ERR, "config interrupt mapping for large VF failed");
615                         return -1;
616                 }
617         }
618         return 0;
619 }
620
621 static int
622 iavf_start_queues(struct rte_eth_dev *dev)
623 {
624         struct iavf_rx_queue *rxq;
625         struct iavf_tx_queue *txq;
626         int i;
627
628         for (i = 0; i < dev->data->nb_tx_queues; i++) {
629                 txq = dev->data->tx_queues[i];
630                 if (txq->tx_deferred_start)
631                         continue;
632                 if (iavf_dev_tx_queue_start(dev, i) != 0) {
633                         PMD_DRV_LOG(ERR, "Fail to start queue %u", i);
634                         return -1;
635                 }
636         }
637
638         for (i = 0; i < dev->data->nb_rx_queues; i++) {
639                 rxq = dev->data->rx_queues[i];
640                 if (rxq->rx_deferred_start)
641                         continue;
642                 if (iavf_dev_rx_queue_start(dev, i) != 0) {
643                         PMD_DRV_LOG(ERR, "Fail to start queue %u", i);
644                         return -1;
645                 }
646         }
647
648         return 0;
649 }
650
651 static int
652 iavf_dev_start(struct rte_eth_dev *dev)
653 {
654         struct iavf_adapter *adapter =
655                 IAVF_DEV_PRIVATE_TO_ADAPTER(dev->data->dev_private);
656         struct iavf_info *vf = IAVF_DEV_PRIVATE_TO_VF(dev->data->dev_private);
657         struct rte_intr_handle *intr_handle = dev->intr_handle;
658         uint16_t num_queue_pairs;
659         uint16_t index = 0;
660
661         PMD_INIT_FUNC_TRACE();
662
663         adapter->stopped = 0;
664
665         vf->max_pkt_len = dev->data->dev_conf.rxmode.max_rx_pkt_len;
666         vf->num_queue_pairs = RTE_MAX(dev->data->nb_rx_queues,
667                                       dev->data->nb_tx_queues);
668         num_queue_pairs = vf->num_queue_pairs;
669
670         if (iavf_init_queues(dev) != 0) {
671                 PMD_DRV_LOG(ERR, "failed to do Queue init");
672                 return -1;
673         }
674
675         /* If needed, send configure queues msg multiple times to make the
676          * adminq buffer length smaller than the 4K limitation.
677          */
678         while (num_queue_pairs > IAVF_CFG_Q_NUM_PER_BUF) {
679                 if (iavf_configure_queues(adapter,
680                                 IAVF_CFG_Q_NUM_PER_BUF, index) != 0) {
681                         PMD_DRV_LOG(ERR, "configure queues failed");
682                         goto err_queue;
683                 }
684                 num_queue_pairs -= IAVF_CFG_Q_NUM_PER_BUF;
685                 index += IAVF_CFG_Q_NUM_PER_BUF;
686         }
687
688         if (iavf_configure_queues(adapter, num_queue_pairs, index) != 0) {
689                 PMD_DRV_LOG(ERR, "configure queues failed");
690                 goto err_queue;
691         }
692
693         if (iavf_config_rx_queues_irqs(dev, intr_handle) != 0) {
694                 PMD_DRV_LOG(ERR, "configure irq failed");
695                 goto err_queue;
696         }
697         /* re-enable intr again, because efd assign may change */
698         if (dev->data->dev_conf.intr_conf.rxq != 0) {
699                 rte_intr_disable(intr_handle);
700                 rte_intr_enable(intr_handle);
701         }
702
703         /* Set all mac addrs */
704         iavf_add_del_all_mac_addr(adapter, true);
705
706         /* Set all multicast addresses */
707         iavf_add_del_mc_addr_list(adapter, vf->mc_addrs, vf->mc_addrs_num,
708                                   true);
709
710         if (iavf_start_queues(dev) != 0) {
711                 PMD_DRV_LOG(ERR, "enable queues failed");
712                 goto err_mac;
713         }
714
715         return 0;
716
717 err_mac:
718         iavf_add_del_all_mac_addr(adapter, false);
719 err_queue:
720         return -1;
721 }
722
723 static int
724 iavf_dev_stop(struct rte_eth_dev *dev)
725 {
726         struct iavf_info *vf = IAVF_DEV_PRIVATE_TO_VF(dev->data->dev_private);
727         struct iavf_adapter *adapter =
728                 IAVF_DEV_PRIVATE_TO_ADAPTER(dev->data->dev_private);
729         struct rte_intr_handle *intr_handle = dev->intr_handle;
730
731         PMD_INIT_FUNC_TRACE();
732
733         if (adapter->stopped == 1)
734                 return 0;
735
736         iavf_stop_queues(dev);
737
738         /* Disable the interrupt for Rx */
739         rte_intr_efd_disable(intr_handle);
740         /* Rx interrupt vector mapping free */
741         if (intr_handle->intr_vec) {
742                 rte_free(intr_handle->intr_vec);
743                 intr_handle->intr_vec = NULL;
744         }
745
746         /* remove all mac addrs */
747         iavf_add_del_all_mac_addr(adapter, false);
748
749         /* remove all multicast addresses */
750         iavf_add_del_mc_addr_list(adapter, vf->mc_addrs, vf->mc_addrs_num,
751                                   false);
752
753         adapter->stopped = 1;
754         dev->data->dev_started = 0;
755
756         return 0;
757 }
758
759 static int
760 iavf_dev_info_get(struct rte_eth_dev *dev, struct rte_eth_dev_info *dev_info)
761 {
762         struct iavf_info *vf = IAVF_DEV_PRIVATE_TO_VF(dev->data->dev_private);
763
764         dev_info->max_rx_queues = IAVF_MAX_NUM_QUEUES_LV;
765         dev_info->max_tx_queues = IAVF_MAX_NUM_QUEUES_LV;
766         dev_info->min_rx_bufsize = IAVF_BUF_SIZE_MIN;
767         dev_info->max_rx_pktlen = IAVF_FRAME_SIZE_MAX;
768         dev_info->max_mtu = dev_info->max_rx_pktlen - IAVF_ETH_OVERHEAD;
769         dev_info->min_mtu = RTE_ETHER_MIN_MTU;
770         dev_info->hash_key_size = vf->vf_res->rss_key_size;
771         dev_info->reta_size = vf->vf_res->rss_lut_size;
772         dev_info->flow_type_rss_offloads = IAVF_RSS_OFFLOAD_ALL;
773         dev_info->max_mac_addrs = IAVF_NUM_MACADDR_MAX;
774         dev_info->rx_offload_capa =
775                 DEV_RX_OFFLOAD_VLAN_STRIP |
776                 DEV_RX_OFFLOAD_QINQ_STRIP |
777                 DEV_RX_OFFLOAD_IPV4_CKSUM |
778                 DEV_RX_OFFLOAD_UDP_CKSUM |
779                 DEV_RX_OFFLOAD_TCP_CKSUM |
780                 DEV_RX_OFFLOAD_OUTER_IPV4_CKSUM |
781                 DEV_RX_OFFLOAD_SCATTER |
782                 DEV_RX_OFFLOAD_JUMBO_FRAME |
783                 DEV_RX_OFFLOAD_VLAN_FILTER |
784                 DEV_RX_OFFLOAD_RSS_HASH;
785         dev_info->tx_offload_capa =
786                 DEV_TX_OFFLOAD_VLAN_INSERT |
787                 DEV_TX_OFFLOAD_QINQ_INSERT |
788                 DEV_TX_OFFLOAD_IPV4_CKSUM |
789                 DEV_TX_OFFLOAD_UDP_CKSUM |
790                 DEV_TX_OFFLOAD_TCP_CKSUM |
791                 DEV_TX_OFFLOAD_SCTP_CKSUM |
792                 DEV_TX_OFFLOAD_OUTER_IPV4_CKSUM |
793                 DEV_TX_OFFLOAD_TCP_TSO |
794                 DEV_TX_OFFLOAD_VXLAN_TNL_TSO |
795                 DEV_TX_OFFLOAD_GRE_TNL_TSO |
796                 DEV_TX_OFFLOAD_IPIP_TNL_TSO |
797                 DEV_TX_OFFLOAD_GENEVE_TNL_TSO |
798                 DEV_TX_OFFLOAD_MULTI_SEGS |
799                 DEV_TX_OFFLOAD_MBUF_FAST_FREE;
800
801         dev_info->default_rxconf = (struct rte_eth_rxconf) {
802                 .rx_free_thresh = IAVF_DEFAULT_RX_FREE_THRESH,
803                 .rx_drop_en = 0,
804                 .offloads = 0,
805         };
806
807         dev_info->default_txconf = (struct rte_eth_txconf) {
808                 .tx_free_thresh = IAVF_DEFAULT_TX_FREE_THRESH,
809                 .tx_rs_thresh = IAVF_DEFAULT_TX_RS_THRESH,
810                 .offloads = 0,
811         };
812
813         dev_info->rx_desc_lim = (struct rte_eth_desc_lim) {
814                 .nb_max = IAVF_MAX_RING_DESC,
815                 .nb_min = IAVF_MIN_RING_DESC,
816                 .nb_align = IAVF_ALIGN_RING_DESC,
817         };
818
819         dev_info->tx_desc_lim = (struct rte_eth_desc_lim) {
820                 .nb_max = IAVF_MAX_RING_DESC,
821                 .nb_min = IAVF_MIN_RING_DESC,
822                 .nb_align = IAVF_ALIGN_RING_DESC,
823         };
824
825         return 0;
826 }
827
828 static const uint32_t *
829 iavf_dev_supported_ptypes_get(struct rte_eth_dev *dev __rte_unused)
830 {
831         static const uint32_t ptypes[] = {
832                 RTE_PTYPE_L2_ETHER,
833                 RTE_PTYPE_L3_IPV4_EXT_UNKNOWN,
834                 RTE_PTYPE_L4_FRAG,
835                 RTE_PTYPE_L4_ICMP,
836                 RTE_PTYPE_L4_NONFRAG,
837                 RTE_PTYPE_L4_SCTP,
838                 RTE_PTYPE_L4_TCP,
839                 RTE_PTYPE_L4_UDP,
840                 RTE_PTYPE_UNKNOWN
841         };
842         return ptypes;
843 }
844
845 int
846 iavf_dev_link_update(struct rte_eth_dev *dev,
847                     __rte_unused int wait_to_complete)
848 {
849         struct rte_eth_link new_link;
850         struct iavf_info *vf = IAVF_DEV_PRIVATE_TO_VF(dev->data->dev_private);
851
852         memset(&new_link, 0, sizeof(new_link));
853
854         /* Only read status info stored in VF, and the info is updated
855          *  when receive LINK_CHANGE evnet from PF by Virtchnnl.
856          */
857         switch (vf->link_speed) {
858         case 10:
859                 new_link.link_speed = ETH_SPEED_NUM_10M;
860                 break;
861         case 100:
862                 new_link.link_speed = ETH_SPEED_NUM_100M;
863                 break;
864         case 1000:
865                 new_link.link_speed = ETH_SPEED_NUM_1G;
866                 break;
867         case 10000:
868                 new_link.link_speed = ETH_SPEED_NUM_10G;
869                 break;
870         case 20000:
871                 new_link.link_speed = ETH_SPEED_NUM_20G;
872                 break;
873         case 25000:
874                 new_link.link_speed = ETH_SPEED_NUM_25G;
875                 break;
876         case 40000:
877                 new_link.link_speed = ETH_SPEED_NUM_40G;
878                 break;
879         case 50000:
880                 new_link.link_speed = ETH_SPEED_NUM_50G;
881                 break;
882         case 100000:
883                 new_link.link_speed = ETH_SPEED_NUM_100G;
884                 break;
885         default:
886                 new_link.link_speed = ETH_SPEED_NUM_NONE;
887                 break;
888         }
889
890         new_link.link_duplex = ETH_LINK_FULL_DUPLEX;
891         new_link.link_status = vf->link_up ? ETH_LINK_UP :
892                                              ETH_LINK_DOWN;
893         new_link.link_autoneg = !(dev->data->dev_conf.link_speeds &
894                                 ETH_LINK_SPEED_FIXED);
895
896         return rte_eth_linkstatus_set(dev, &new_link);
897 }
898
899 static int
900 iavf_dev_promiscuous_enable(struct rte_eth_dev *dev)
901 {
902         struct iavf_adapter *adapter =
903                 IAVF_DEV_PRIVATE_TO_ADAPTER(dev->data->dev_private);
904         struct iavf_info *vf = IAVF_DEV_PRIVATE_TO_VF(adapter);
905
906         return iavf_config_promisc(adapter,
907                                   true, vf->promisc_multicast_enabled);
908 }
909
910 static int
911 iavf_dev_promiscuous_disable(struct rte_eth_dev *dev)
912 {
913         struct iavf_adapter *adapter =
914                 IAVF_DEV_PRIVATE_TO_ADAPTER(dev->data->dev_private);
915         struct iavf_info *vf = IAVF_DEV_PRIVATE_TO_VF(adapter);
916
917         return iavf_config_promisc(adapter,
918                                   false, vf->promisc_multicast_enabled);
919 }
920
921 static int
922 iavf_dev_allmulticast_enable(struct rte_eth_dev *dev)
923 {
924         struct iavf_adapter *adapter =
925                 IAVF_DEV_PRIVATE_TO_ADAPTER(dev->data->dev_private);
926         struct iavf_info *vf = IAVF_DEV_PRIVATE_TO_VF(adapter);
927
928         return iavf_config_promisc(adapter,
929                                   vf->promisc_unicast_enabled, true);
930 }
931
932 static int
933 iavf_dev_allmulticast_disable(struct rte_eth_dev *dev)
934 {
935         struct iavf_adapter *adapter =
936                 IAVF_DEV_PRIVATE_TO_ADAPTER(dev->data->dev_private);
937         struct iavf_info *vf = IAVF_DEV_PRIVATE_TO_VF(adapter);
938
939         return iavf_config_promisc(adapter,
940                                   vf->promisc_unicast_enabled, false);
941 }
942
943 static int
944 iavf_dev_add_mac_addr(struct rte_eth_dev *dev, struct rte_ether_addr *addr,
945                      __rte_unused uint32_t index,
946                      __rte_unused uint32_t pool)
947 {
948         struct iavf_adapter *adapter =
949                 IAVF_DEV_PRIVATE_TO_ADAPTER(dev->data->dev_private);
950         struct iavf_info *vf = IAVF_DEV_PRIVATE_TO_VF(adapter);
951         int err;
952
953         if (rte_is_zero_ether_addr(addr)) {
954                 PMD_DRV_LOG(ERR, "Invalid Ethernet Address");
955                 return -EINVAL;
956         }
957
958         err = iavf_add_del_eth_addr(adapter, addr, true);
959         if (err) {
960                 PMD_DRV_LOG(ERR, "fail to add MAC address");
961                 return -EIO;
962         }
963
964         vf->mac_num++;
965
966         return 0;
967 }
968
969 static void
970 iavf_dev_del_mac_addr(struct rte_eth_dev *dev, uint32_t index)
971 {
972         struct iavf_adapter *adapter =
973                 IAVF_DEV_PRIVATE_TO_ADAPTER(dev->data->dev_private);
974         struct iavf_info *vf = IAVF_DEV_PRIVATE_TO_VF(adapter);
975         struct rte_ether_addr *addr;
976         int err;
977
978         addr = &dev->data->mac_addrs[index];
979
980         err = iavf_add_del_eth_addr(adapter, addr, false);
981         if (err)
982                 PMD_DRV_LOG(ERR, "fail to delete MAC address");
983
984         vf->mac_num--;
985 }
986
987 static int
988 iavf_dev_vlan_filter_set(struct rte_eth_dev *dev, uint16_t vlan_id, int on)
989 {
990         struct iavf_adapter *adapter =
991                 IAVF_DEV_PRIVATE_TO_ADAPTER(dev->data->dev_private);
992         struct iavf_info *vf = IAVF_DEV_PRIVATE_TO_VF(adapter);
993         int err;
994
995         if (!(vf->vf_res->vf_cap_flags & VIRTCHNL_VF_OFFLOAD_VLAN))
996                 return -ENOTSUP;
997
998         err = iavf_add_del_vlan(adapter, vlan_id, on);
999         if (err)
1000                 return -EIO;
1001         return 0;
1002 }
1003
1004 static int
1005 iavf_dev_vlan_offload_set(struct rte_eth_dev *dev, int mask)
1006 {
1007         struct iavf_adapter *adapter =
1008                 IAVF_DEV_PRIVATE_TO_ADAPTER(dev->data->dev_private);
1009         struct iavf_info *vf = IAVF_DEV_PRIVATE_TO_VF(adapter);
1010         struct rte_eth_conf *dev_conf = &dev->data->dev_conf;
1011         int err;
1012
1013         if (!(vf->vf_res->vf_cap_flags & VIRTCHNL_VF_OFFLOAD_VLAN))
1014                 return -ENOTSUP;
1015
1016         /* Vlan stripping setting */
1017         if (mask & ETH_VLAN_STRIP_MASK) {
1018                 /* Enable or disable VLAN stripping */
1019                 if (dev_conf->rxmode.offloads & DEV_RX_OFFLOAD_VLAN_STRIP)
1020                         err = iavf_enable_vlan_strip(adapter);
1021                 else
1022                         err = iavf_disable_vlan_strip(adapter);
1023
1024                 if (err)
1025                         return -EIO;
1026         }
1027         return 0;
1028 }
1029
1030 static int
1031 iavf_dev_rss_reta_update(struct rte_eth_dev *dev,
1032                         struct rte_eth_rss_reta_entry64 *reta_conf,
1033                         uint16_t reta_size)
1034 {
1035         struct iavf_adapter *adapter =
1036                 IAVF_DEV_PRIVATE_TO_ADAPTER(dev->data->dev_private);
1037         struct iavf_info *vf = IAVF_DEV_PRIVATE_TO_VF(adapter);
1038         uint8_t *lut;
1039         uint16_t i, idx, shift;
1040         int ret;
1041
1042         if (!(vf->vf_res->vf_cap_flags & VIRTCHNL_VF_OFFLOAD_RSS_PF))
1043                 return -ENOTSUP;
1044
1045         if (reta_size != vf->vf_res->rss_lut_size) {
1046                 PMD_DRV_LOG(ERR, "The size of hash lookup table configured "
1047                         "(%d) doesn't match the number of hardware can "
1048                         "support (%d)", reta_size, vf->vf_res->rss_lut_size);
1049                 return -EINVAL;
1050         }
1051
1052         lut = rte_zmalloc("rss_lut", reta_size, 0);
1053         if (!lut) {
1054                 PMD_DRV_LOG(ERR, "No memory can be allocated");
1055                 return -ENOMEM;
1056         }
1057         /* store the old lut table temporarily */
1058         rte_memcpy(lut, vf->rss_lut, reta_size);
1059
1060         for (i = 0; i < reta_size; i++) {
1061                 idx = i / RTE_RETA_GROUP_SIZE;
1062                 shift = i % RTE_RETA_GROUP_SIZE;
1063                 if (reta_conf[idx].mask & (1ULL << shift))
1064                         lut[i] = reta_conf[idx].reta[shift];
1065         }
1066
1067         rte_memcpy(vf->rss_lut, lut, reta_size);
1068         /* send virtchnnl ops to configure rss*/
1069         ret = iavf_configure_rss_lut(adapter);
1070         if (ret) /* revert back */
1071                 rte_memcpy(vf->rss_lut, lut, reta_size);
1072         rte_free(lut);
1073
1074         return ret;
1075 }
1076
1077 static int
1078 iavf_dev_rss_reta_query(struct rte_eth_dev *dev,
1079                        struct rte_eth_rss_reta_entry64 *reta_conf,
1080                        uint16_t reta_size)
1081 {
1082         struct iavf_adapter *adapter =
1083                 IAVF_DEV_PRIVATE_TO_ADAPTER(dev->data->dev_private);
1084         struct iavf_info *vf = IAVF_DEV_PRIVATE_TO_VF(adapter);
1085         uint16_t i, idx, shift;
1086
1087         if (!(vf->vf_res->vf_cap_flags & VIRTCHNL_VF_OFFLOAD_RSS_PF))
1088                 return -ENOTSUP;
1089
1090         if (reta_size != vf->vf_res->rss_lut_size) {
1091                 PMD_DRV_LOG(ERR, "The size of hash lookup table configured "
1092                         "(%d) doesn't match the number of hardware can "
1093                         "support (%d)", reta_size, vf->vf_res->rss_lut_size);
1094                 return -EINVAL;
1095         }
1096
1097         for (i = 0; i < reta_size; i++) {
1098                 idx = i / RTE_RETA_GROUP_SIZE;
1099                 shift = i % RTE_RETA_GROUP_SIZE;
1100                 if (reta_conf[idx].mask & (1ULL << shift))
1101                         reta_conf[idx].reta[shift] = vf->rss_lut[i];
1102         }
1103
1104         return 0;
1105 }
1106
1107 static int
1108 iavf_set_rss_key(struct iavf_adapter *adapter, uint8_t *key, uint8_t key_len)
1109 {
1110         struct iavf_info *vf = IAVF_DEV_PRIVATE_TO_VF(adapter);
1111
1112         /* HENA setting, it is enabled by default, no change */
1113         if (!key || key_len == 0) {
1114                 PMD_DRV_LOG(DEBUG, "No key to be configured");
1115                 return 0;
1116         } else if (key_len != vf->vf_res->rss_key_size) {
1117                 PMD_DRV_LOG(ERR, "The size of hash key configured "
1118                         "(%d) doesn't match the size of hardware can "
1119                         "support (%d)", key_len,
1120                         vf->vf_res->rss_key_size);
1121                 return -EINVAL;
1122         }
1123
1124         rte_memcpy(vf->rss_key, key, key_len);
1125
1126         return iavf_configure_rss_key(adapter);
1127 }
1128
1129 static int
1130 iavf_dev_rss_hash_update(struct rte_eth_dev *dev,
1131                         struct rte_eth_rss_conf *rss_conf)
1132 {
1133         struct iavf_adapter *adapter =
1134                 IAVF_DEV_PRIVATE_TO_ADAPTER(dev->data->dev_private);
1135         struct iavf_info *vf = IAVF_DEV_PRIVATE_TO_VF(adapter);
1136         int ret;
1137
1138         adapter->eth_dev->data->dev_conf.rx_adv_conf.rss_conf = *rss_conf;
1139
1140         if (!(vf->vf_res->vf_cap_flags & VIRTCHNL_VF_OFFLOAD_RSS_PF))
1141                 return -ENOTSUP;
1142
1143         /* Set hash key. */
1144         ret = iavf_set_rss_key(adapter, rss_conf->rss_key,
1145                                rss_conf->rss_key_len);
1146         if (ret)
1147                 return ret;
1148
1149         if (rss_conf->rss_hf == 0)
1150                 return 0;
1151
1152         /* Overwritten default RSS. */
1153         ret = iavf_set_hena(adapter, 0);
1154         if (ret)
1155                 PMD_DRV_LOG(ERR, "%s Remove rss vsi fail %d",
1156                             __func__, ret);
1157
1158         /* Set new RSS configuration. */
1159         ret = iavf_rss_hash_set(adapter, rss_conf->rss_hf, true);
1160         if (ret) {
1161                 PMD_DRV_LOG(ERR, "fail to set new RSS");
1162                 return ret;
1163         }
1164
1165         return 0;
1166 }
1167
1168 static int
1169 iavf_dev_rss_hash_conf_get(struct rte_eth_dev *dev,
1170                           struct rte_eth_rss_conf *rss_conf)
1171 {
1172         struct iavf_adapter *adapter =
1173                 IAVF_DEV_PRIVATE_TO_ADAPTER(dev->data->dev_private);
1174         struct iavf_info *vf = IAVF_DEV_PRIVATE_TO_VF(adapter);
1175
1176         if (!(vf->vf_res->vf_cap_flags & VIRTCHNL_VF_OFFLOAD_RSS_PF))
1177                 return -ENOTSUP;
1178
1179         rss_conf->rss_hf = vf->rss_hf;
1180
1181         if (!rss_conf->rss_key)
1182                 return 0;
1183
1184         rss_conf->rss_key_len = vf->vf_res->rss_key_size;
1185         rte_memcpy(rss_conf->rss_key, vf->rss_key, rss_conf->rss_key_len);
1186
1187         return 0;
1188 }
1189
1190 static int
1191 iavf_dev_mtu_set(struct rte_eth_dev *dev, uint16_t mtu)
1192 {
1193         uint32_t frame_size = mtu + IAVF_ETH_OVERHEAD;
1194         int ret = 0;
1195
1196         if (mtu < RTE_ETHER_MIN_MTU || frame_size > IAVF_FRAME_SIZE_MAX)
1197                 return -EINVAL;
1198
1199         /* mtu setting is forbidden if port is start */
1200         if (dev->data->dev_started) {
1201                 PMD_DRV_LOG(ERR, "port must be stopped before configuration");
1202                 return -EBUSY;
1203         }
1204
1205         if (frame_size > RTE_ETHER_MAX_LEN)
1206                 dev->data->dev_conf.rxmode.offloads |=
1207                                 DEV_RX_OFFLOAD_JUMBO_FRAME;
1208         else
1209                 dev->data->dev_conf.rxmode.offloads &=
1210                                 ~DEV_RX_OFFLOAD_JUMBO_FRAME;
1211
1212         dev->data->dev_conf.rxmode.max_rx_pkt_len = frame_size;
1213
1214         return ret;
1215 }
1216
1217 static int
1218 iavf_dev_set_default_mac_addr(struct rte_eth_dev *dev,
1219                              struct rte_ether_addr *mac_addr)
1220 {
1221         struct iavf_adapter *adapter =
1222                 IAVF_DEV_PRIVATE_TO_ADAPTER(dev->data->dev_private);
1223         struct iavf_hw *hw = IAVF_DEV_PRIVATE_TO_HW(adapter);
1224         struct rte_ether_addr *perm_addr, *old_addr;
1225         int ret;
1226
1227         old_addr = (struct rte_ether_addr *)hw->mac.addr;
1228         perm_addr = (struct rte_ether_addr *)hw->mac.perm_addr;
1229
1230         /* If the MAC address is configured by host, skip the setting */
1231         if (rte_is_valid_assigned_ether_addr(perm_addr))
1232                 return -EPERM;
1233
1234         ret = iavf_add_del_eth_addr(adapter, old_addr, false);
1235         if (ret)
1236                 PMD_DRV_LOG(ERR, "Fail to delete old MAC:"
1237                             " %02X:%02X:%02X:%02X:%02X:%02X",
1238                             old_addr->addr_bytes[0],
1239                             old_addr->addr_bytes[1],
1240                             old_addr->addr_bytes[2],
1241                             old_addr->addr_bytes[3],
1242                             old_addr->addr_bytes[4],
1243                             old_addr->addr_bytes[5]);
1244
1245         ret = iavf_add_del_eth_addr(adapter, mac_addr, true);
1246         if (ret)
1247                 PMD_DRV_LOG(ERR, "Fail to add new MAC:"
1248                             " %02X:%02X:%02X:%02X:%02X:%02X",
1249                             mac_addr->addr_bytes[0],
1250                             mac_addr->addr_bytes[1],
1251                             mac_addr->addr_bytes[2],
1252                             mac_addr->addr_bytes[3],
1253                             mac_addr->addr_bytes[4],
1254                             mac_addr->addr_bytes[5]);
1255
1256         if (ret)
1257                 return -EIO;
1258
1259         rte_ether_addr_copy(mac_addr, (struct rte_ether_addr *)hw->mac.addr);
1260         return 0;
1261 }
1262
1263 static void
1264 iavf_stat_update_48(uint64_t *offset, uint64_t *stat)
1265 {
1266         if (*stat >= *offset)
1267                 *stat = *stat - *offset;
1268         else
1269                 *stat = (uint64_t)((*stat +
1270                         ((uint64_t)1 << IAVF_48_BIT_WIDTH)) - *offset);
1271
1272         *stat &= IAVF_48_BIT_MASK;
1273 }
1274
1275 static void
1276 iavf_stat_update_32(uint64_t *offset, uint64_t *stat)
1277 {
1278         if (*stat >= *offset)
1279                 *stat = (uint64_t)(*stat - *offset);
1280         else
1281                 *stat = (uint64_t)((*stat +
1282                         ((uint64_t)1 << IAVF_32_BIT_WIDTH)) - *offset);
1283 }
1284
1285 static void
1286 iavf_update_stats(struct iavf_vsi *vsi, struct virtchnl_eth_stats *nes)
1287 {
1288         struct virtchnl_eth_stats *oes = &vsi->eth_stats_offset;
1289
1290         iavf_stat_update_48(&oes->rx_bytes, &nes->rx_bytes);
1291         iavf_stat_update_48(&oes->rx_unicast, &nes->rx_unicast);
1292         iavf_stat_update_48(&oes->rx_multicast, &nes->rx_multicast);
1293         iavf_stat_update_48(&oes->rx_broadcast, &nes->rx_broadcast);
1294         iavf_stat_update_32(&oes->rx_discards, &nes->rx_discards);
1295         iavf_stat_update_48(&oes->tx_bytes, &nes->tx_bytes);
1296         iavf_stat_update_48(&oes->tx_unicast, &nes->tx_unicast);
1297         iavf_stat_update_48(&oes->tx_multicast, &nes->tx_multicast);
1298         iavf_stat_update_48(&oes->tx_broadcast, &nes->tx_broadcast);
1299         iavf_stat_update_32(&oes->tx_errors, &nes->tx_errors);
1300         iavf_stat_update_32(&oes->tx_discards, &nes->tx_discards);
1301 }
1302
1303 static int
1304 iavf_dev_stats_get(struct rte_eth_dev *dev, struct rte_eth_stats *stats)
1305 {
1306         struct iavf_adapter *adapter =
1307                 IAVF_DEV_PRIVATE_TO_ADAPTER(dev->data->dev_private);
1308         struct iavf_info *vf = IAVF_DEV_PRIVATE_TO_VF(dev->data->dev_private);
1309         struct iavf_vsi *vsi = &vf->vsi;
1310         struct virtchnl_eth_stats *pstats = NULL;
1311         int ret;
1312
1313         ret = iavf_query_stats(adapter, &pstats);
1314         if (ret == 0) {
1315                 iavf_update_stats(vsi, pstats);
1316                 stats->ipackets = pstats->rx_unicast + pstats->rx_multicast +
1317                                 pstats->rx_broadcast - pstats->rx_discards;
1318                 stats->opackets = pstats->tx_broadcast + pstats->tx_multicast +
1319                                                 pstats->tx_unicast;
1320                 stats->imissed = pstats->rx_discards;
1321                 stats->oerrors = pstats->tx_errors + pstats->tx_discards;
1322                 stats->ibytes = pstats->rx_bytes;
1323                 stats->ibytes -= stats->ipackets * RTE_ETHER_CRC_LEN;
1324                 stats->obytes = pstats->tx_bytes;
1325         } else {
1326                 PMD_DRV_LOG(ERR, "Get statistics failed");
1327         }
1328         return ret;
1329 }
1330
1331 static int
1332 iavf_dev_stats_reset(struct rte_eth_dev *dev)
1333 {
1334         int ret;
1335         struct iavf_adapter *adapter =
1336                 IAVF_DEV_PRIVATE_TO_ADAPTER(dev->data->dev_private);
1337         struct iavf_info *vf = IAVF_DEV_PRIVATE_TO_VF(dev->data->dev_private);
1338         struct iavf_vsi *vsi = &vf->vsi;
1339         struct virtchnl_eth_stats *pstats = NULL;
1340
1341         /* read stat values to clear hardware registers */
1342         ret = iavf_query_stats(adapter, &pstats);
1343         if (ret != 0)
1344                 return ret;
1345
1346         /* set stats offset base on current values */
1347         vsi->eth_stats_offset = *pstats;
1348
1349         return 0;
1350 }
1351
1352 static int iavf_dev_xstats_get_names(__rte_unused struct rte_eth_dev *dev,
1353                                       struct rte_eth_xstat_name *xstats_names,
1354                                       __rte_unused unsigned int limit)
1355 {
1356         unsigned int i;
1357
1358         if (xstats_names != NULL)
1359                 for (i = 0; i < IAVF_NB_XSTATS; i++) {
1360                         snprintf(xstats_names[i].name,
1361                                 sizeof(xstats_names[i].name),
1362                                 "%s", rte_iavf_stats_strings[i].name);
1363                 }
1364         return IAVF_NB_XSTATS;
1365 }
1366
1367 static int iavf_dev_xstats_get(struct rte_eth_dev *dev,
1368                                  struct rte_eth_xstat *xstats, unsigned int n)
1369 {
1370         int ret;
1371         unsigned int i;
1372         struct iavf_adapter *adapter =
1373                 IAVF_DEV_PRIVATE_TO_ADAPTER(dev->data->dev_private);
1374         struct iavf_info *vf = IAVF_DEV_PRIVATE_TO_VF(dev->data->dev_private);
1375         struct iavf_vsi *vsi = &vf->vsi;
1376         struct virtchnl_eth_stats *pstats = NULL;
1377
1378         if (n < IAVF_NB_XSTATS)
1379                 return IAVF_NB_XSTATS;
1380
1381         ret = iavf_query_stats(adapter, &pstats);
1382         if (ret != 0)
1383                 return 0;
1384
1385         if (!xstats)
1386                 return 0;
1387
1388         iavf_update_stats(vsi, pstats);
1389
1390         /* loop over xstats array and values from pstats */
1391         for (i = 0; i < IAVF_NB_XSTATS; i++) {
1392                 xstats[i].id = i;
1393                 xstats[i].value = *(uint64_t *)(((char *)pstats) +
1394                         rte_iavf_stats_strings[i].offset);
1395         }
1396
1397         return IAVF_NB_XSTATS;
1398 }
1399
1400
1401 static int
1402 iavf_dev_rx_queue_intr_enable(struct rte_eth_dev *dev, uint16_t queue_id)
1403 {
1404         struct iavf_adapter *adapter =
1405                 IAVF_DEV_PRIVATE_TO_ADAPTER(dev->data->dev_private);
1406         struct rte_pci_device *pci_dev = RTE_ETH_DEV_TO_PCI(dev);
1407         struct iavf_hw *hw = IAVF_DEV_PRIVATE_TO_HW(adapter);
1408         uint16_t msix_intr;
1409
1410         msix_intr = pci_dev->intr_handle.intr_vec[queue_id];
1411         if (msix_intr == IAVF_MISC_VEC_ID) {
1412                 PMD_DRV_LOG(INFO, "MISC is also enabled for control");
1413                 IAVF_WRITE_REG(hw, IAVF_VFINT_DYN_CTL01,
1414                                IAVF_VFINT_DYN_CTL01_INTENA_MASK |
1415                                IAVF_VFINT_DYN_CTL01_CLEARPBA_MASK |
1416                                IAVF_VFINT_DYN_CTL01_ITR_INDX_MASK);
1417         } else {
1418                 IAVF_WRITE_REG(hw,
1419                                IAVF_VFINT_DYN_CTLN1
1420                                 (msix_intr - IAVF_RX_VEC_START),
1421                                IAVF_VFINT_DYN_CTLN1_INTENA_MASK |
1422                                IAVF_VFINT_DYN_CTL01_CLEARPBA_MASK |
1423                                IAVF_VFINT_DYN_CTLN1_ITR_INDX_MASK);
1424         }
1425
1426         IAVF_WRITE_FLUSH(hw);
1427
1428         rte_intr_ack(&pci_dev->intr_handle);
1429
1430         return 0;
1431 }
1432
1433 static int
1434 iavf_dev_rx_queue_intr_disable(struct rte_eth_dev *dev, uint16_t queue_id)
1435 {
1436         struct rte_pci_device *pci_dev = RTE_ETH_DEV_TO_PCI(dev);
1437         struct iavf_hw *hw = IAVF_DEV_PRIVATE_TO_HW(dev->data->dev_private);
1438         uint16_t msix_intr;
1439
1440         msix_intr = pci_dev->intr_handle.intr_vec[queue_id];
1441         if (msix_intr == IAVF_MISC_VEC_ID) {
1442                 PMD_DRV_LOG(ERR, "MISC is used for control, cannot disable it");
1443                 return -EIO;
1444         }
1445
1446         IAVF_WRITE_REG(hw,
1447                       IAVF_VFINT_DYN_CTLN1(msix_intr - IAVF_RX_VEC_START),
1448                       0);
1449
1450         IAVF_WRITE_FLUSH(hw);
1451         return 0;
1452 }
1453
1454 static int
1455 iavf_check_vf_reset_done(struct iavf_hw *hw)
1456 {
1457         int i, reset;
1458
1459         for (i = 0; i < IAVF_RESET_WAIT_CNT; i++) {
1460                 reset = IAVF_READ_REG(hw, IAVF_VFGEN_RSTAT) &
1461                         IAVF_VFGEN_RSTAT_VFR_STATE_MASK;
1462                 reset = reset >> IAVF_VFGEN_RSTAT_VFR_STATE_SHIFT;
1463                 if (reset == VIRTCHNL_VFR_VFACTIVE ||
1464                     reset == VIRTCHNL_VFR_COMPLETED)
1465                         break;
1466                 rte_delay_ms(20);
1467         }
1468
1469         if (i >= IAVF_RESET_WAIT_CNT)
1470                 return -1;
1471
1472         return 0;
1473 }
1474
1475 static int
1476 iavf_lookup_proto_xtr_type(const char *flex_name)
1477 {
1478         static struct {
1479                 const char *name;
1480                 enum iavf_proto_xtr_type type;
1481         } xtr_type_map[] = {
1482                 { "vlan",      IAVF_PROTO_XTR_VLAN      },
1483                 { "ipv4",      IAVF_PROTO_XTR_IPV4      },
1484                 { "ipv6",      IAVF_PROTO_XTR_IPV6      },
1485                 { "ipv6_flow", IAVF_PROTO_XTR_IPV6_FLOW },
1486                 { "tcp",       IAVF_PROTO_XTR_TCP       },
1487                 { "ip_offset", IAVF_PROTO_XTR_IP_OFFSET },
1488         };
1489         uint32_t i;
1490
1491         for (i = 0; i < RTE_DIM(xtr_type_map); i++) {
1492                 if (strcmp(flex_name, xtr_type_map[i].name) == 0)
1493                         return xtr_type_map[i].type;
1494         }
1495
1496         PMD_DRV_LOG(ERR, "wrong proto_xtr type, "
1497                     "it should be: vlan|ipv4|ipv6|ipv6_flow|tcp|ip_offset");
1498
1499         return -1;
1500 }
1501
1502 /**
1503  * Parse elem, the elem could be single number/range or '(' ')' group
1504  * 1) A single number elem, it's just a simple digit. e.g. 9
1505  * 2) A single range elem, two digits with a '-' between. e.g. 2-6
1506  * 3) A group elem, combines multiple 1) or 2) with '( )'. e.g (0,2-4,6)
1507  *    Within group elem, '-' used for a range separator;
1508  *                       ',' used for a single number.
1509  */
1510 static int
1511 iavf_parse_queue_set(const char *input, int xtr_type,
1512                      struct iavf_devargs *devargs)
1513 {
1514         const char *str = input;
1515         char *end = NULL;
1516         uint32_t min, max;
1517         uint32_t idx;
1518
1519         while (isblank(*str))
1520                 str++;
1521
1522         if (!isdigit(*str) && *str != '(')
1523                 return -1;
1524
1525         /* process single number or single range of number */
1526         if (*str != '(') {
1527                 errno = 0;
1528                 idx = strtoul(str, &end, 10);
1529                 if (errno || !end || idx >= IAVF_MAX_QUEUE_NUM)
1530                         return -1;
1531
1532                 while (isblank(*end))
1533                         end++;
1534
1535                 min = idx;
1536                 max = idx;
1537
1538                 /* process single <number>-<number> */
1539                 if (*end == '-') {
1540                         end++;
1541                         while (isblank(*end))
1542                                 end++;
1543                         if (!isdigit(*end))
1544                                 return -1;
1545
1546                         errno = 0;
1547                         idx = strtoul(end, &end, 10);
1548                         if (errno || !end || idx >= IAVF_MAX_QUEUE_NUM)
1549                                 return -1;
1550
1551                         max = idx;
1552                         while (isblank(*end))
1553                                 end++;
1554                 }
1555
1556                 if (*end != ':')
1557                         return -1;
1558
1559                 for (idx = RTE_MIN(min, max);
1560                      idx <= RTE_MAX(min, max); idx++)
1561                         devargs->proto_xtr[idx] = xtr_type;
1562
1563                 return 0;
1564         }
1565
1566         /* process set within bracket */
1567         str++;
1568         while (isblank(*str))
1569                 str++;
1570         if (*str == '\0')
1571                 return -1;
1572
1573         min = IAVF_MAX_QUEUE_NUM;
1574         do {
1575                 /* go ahead to the first digit */
1576                 while (isblank(*str))
1577                         str++;
1578                 if (!isdigit(*str))
1579                         return -1;
1580
1581                 /* get the digit value */
1582                 errno = 0;
1583                 idx = strtoul(str, &end, 10);
1584                 if (errno || !end || idx >= IAVF_MAX_QUEUE_NUM)
1585                         return -1;
1586
1587                 /* go ahead to separator '-',',' and ')' */
1588                 while (isblank(*end))
1589                         end++;
1590                 if (*end == '-') {
1591                         if (min == IAVF_MAX_QUEUE_NUM)
1592                                 min = idx;
1593                         else /* avoid continuous '-' */
1594                                 return -1;
1595                 } else if (*end == ',' || *end == ')') {
1596                         max = idx;
1597                         if (min == IAVF_MAX_QUEUE_NUM)
1598                                 min = idx;
1599
1600                         for (idx = RTE_MIN(min, max);
1601                              idx <= RTE_MAX(min, max); idx++)
1602                                 devargs->proto_xtr[idx] = xtr_type;
1603
1604                         min = IAVF_MAX_QUEUE_NUM;
1605                 } else {
1606                         return -1;
1607                 }
1608
1609                 str = end + 1;
1610         } while (*end != ')' && *end != '\0');
1611
1612         return 0;
1613 }
1614
1615 static int
1616 iavf_parse_queue_proto_xtr(const char *queues, struct iavf_devargs *devargs)
1617 {
1618         const char *queue_start;
1619         uint32_t idx;
1620         int xtr_type;
1621         char flex_name[32];
1622
1623         while (isblank(*queues))
1624                 queues++;
1625
1626         if (*queues != '[') {
1627                 xtr_type = iavf_lookup_proto_xtr_type(queues);
1628                 if (xtr_type < 0)
1629                         return -1;
1630
1631                 devargs->proto_xtr_dflt = xtr_type;
1632
1633                 return 0;
1634         }
1635
1636         queues++;
1637         do {
1638                 while (isblank(*queues))
1639                         queues++;
1640                 if (*queues == '\0')
1641                         return -1;
1642
1643                 queue_start = queues;
1644
1645                 /* go across a complete bracket */
1646                 if (*queue_start == '(') {
1647                         queues += strcspn(queues, ")");
1648                         if (*queues != ')')
1649                                 return -1;
1650                 }
1651
1652                 /* scan the separator ':' */
1653                 queues += strcspn(queues, ":");
1654                 if (*queues++ != ':')
1655                         return -1;
1656                 while (isblank(*queues))
1657                         queues++;
1658
1659                 for (idx = 0; ; idx++) {
1660                         if (isblank(queues[idx]) ||
1661                             queues[idx] == ',' ||
1662                             queues[idx] == ']' ||
1663                             queues[idx] == '\0')
1664                                 break;
1665
1666                         if (idx > sizeof(flex_name) - 2)
1667                                 return -1;
1668
1669                         flex_name[idx] = queues[idx];
1670                 }
1671                 flex_name[idx] = '\0';
1672                 xtr_type = iavf_lookup_proto_xtr_type(flex_name);
1673                 if (xtr_type < 0)
1674                         return -1;
1675
1676                 queues += idx;
1677
1678                 while (isblank(*queues) || *queues == ',' || *queues == ']')
1679                         queues++;
1680
1681                 if (iavf_parse_queue_set(queue_start, xtr_type, devargs) < 0)
1682                         return -1;
1683         } while (*queues != '\0');
1684
1685         return 0;
1686 }
1687
1688 static int
1689 iavf_handle_proto_xtr_arg(__rte_unused const char *key, const char *value,
1690                           void *extra_args)
1691 {
1692         struct iavf_devargs *devargs = extra_args;
1693
1694         if (!value || !extra_args)
1695                 return -EINVAL;
1696
1697         if (iavf_parse_queue_proto_xtr(value, devargs) < 0) {
1698                 PMD_DRV_LOG(ERR, "the proto_xtr's parameter is wrong : '%s'",
1699                             value);
1700                 return -1;
1701         }
1702
1703         return 0;
1704 }
1705
1706 static int iavf_parse_devargs(struct rte_eth_dev *dev)
1707 {
1708         struct iavf_adapter *ad =
1709                 IAVF_DEV_PRIVATE_TO_ADAPTER(dev->data->dev_private);
1710         struct rte_devargs *devargs = dev->device->devargs;
1711         struct rte_kvargs *kvlist;
1712         int ret;
1713
1714         if (!devargs)
1715                 return 0;
1716
1717         kvlist = rte_kvargs_parse(devargs->args, iavf_valid_args);
1718         if (!kvlist) {
1719                 PMD_INIT_LOG(ERR, "invalid kvargs key\n");
1720                 return -EINVAL;
1721         }
1722
1723         ad->devargs.proto_xtr_dflt = IAVF_PROTO_XTR_NONE;
1724         memset(ad->devargs.proto_xtr, IAVF_PROTO_XTR_NONE,
1725                sizeof(ad->devargs.proto_xtr));
1726
1727         ret = rte_kvargs_process(kvlist, IAVF_PROTO_XTR_ARG,
1728                                  &iavf_handle_proto_xtr_arg, &ad->devargs);
1729         if (ret)
1730                 goto bail;
1731
1732 bail:
1733         rte_kvargs_free(kvlist);
1734         return ret;
1735 }
1736
1737 static void
1738 iavf_init_proto_xtr(struct rte_eth_dev *dev)
1739 {
1740         struct iavf_info *vf = IAVF_DEV_PRIVATE_TO_VF(dev->data->dev_private);
1741         struct iavf_adapter *ad =
1742                         IAVF_DEV_PRIVATE_TO_ADAPTER(dev->data->dev_private);
1743         const struct iavf_proto_xtr_ol *xtr_ol;
1744         bool proto_xtr_enable = false;
1745         int offset;
1746         uint16_t i;
1747
1748         vf->proto_xtr = rte_zmalloc("vf proto xtr",
1749                                     vf->vsi_res->num_queue_pairs, 0);
1750         if (unlikely(!(vf->proto_xtr))) {
1751                 PMD_DRV_LOG(ERR, "no memory for setting up proto_xtr's table");
1752                 return;
1753         }
1754
1755         for (i = 0; i < vf->vsi_res->num_queue_pairs; i++) {
1756                 vf->proto_xtr[i] = ad->devargs.proto_xtr[i] !=
1757                                         IAVF_PROTO_XTR_NONE ?
1758                                         ad->devargs.proto_xtr[i] :
1759                                         ad->devargs.proto_xtr_dflt;
1760
1761                 if (vf->proto_xtr[i] != IAVF_PROTO_XTR_NONE) {
1762                         uint8_t type = vf->proto_xtr[i];
1763
1764                         iavf_proto_xtr_params[type].required = true;
1765                         proto_xtr_enable = true;
1766                 }
1767         }
1768
1769         if (likely(!proto_xtr_enable))
1770                 return;
1771
1772         offset = rte_mbuf_dynfield_register(&iavf_proto_xtr_metadata_param);
1773         if (unlikely(offset == -1)) {
1774                 PMD_DRV_LOG(ERR,
1775                             "failed to extract protocol metadata, error %d",
1776                             -rte_errno);
1777                 return;
1778         }
1779
1780         PMD_DRV_LOG(DEBUG,
1781                     "proto_xtr metadata offset in mbuf is : %d",
1782                     offset);
1783         rte_pmd_ifd_dynfield_proto_xtr_metadata_offs = offset;
1784
1785         for (i = 0; i < RTE_DIM(iavf_proto_xtr_params); i++) {
1786                 xtr_ol = &iavf_proto_xtr_params[i];
1787
1788                 uint8_t rxdid = iavf_proto_xtr_type_to_rxdid((uint8_t)i);
1789
1790                 if (!xtr_ol->required)
1791                         continue;
1792
1793                 if (!(vf->supported_rxdid & BIT(rxdid))) {
1794                         PMD_DRV_LOG(ERR,
1795                                     "rxdid[%u] is not supported in hardware",
1796                                     rxdid);
1797                         rte_pmd_ifd_dynfield_proto_xtr_metadata_offs = -1;
1798                         break;
1799                 }
1800
1801                 offset = rte_mbuf_dynflag_register(&xtr_ol->param);
1802                 if (unlikely(offset == -1)) {
1803                         PMD_DRV_LOG(ERR,
1804                                     "failed to register proto_xtr offload '%s', error %d",
1805                                     xtr_ol->param.name, -rte_errno);
1806
1807                         rte_pmd_ifd_dynfield_proto_xtr_metadata_offs = -1;
1808                         break;
1809                 }
1810
1811                 PMD_DRV_LOG(DEBUG,
1812                             "proto_xtr offload '%s' offset in mbuf is : %d",
1813                             xtr_ol->param.name, offset);
1814                 *xtr_ol->ol_flag = 1ULL << offset;
1815         }
1816 }
1817
1818 static int
1819 iavf_init_vf(struct rte_eth_dev *dev)
1820 {
1821         int err, bufsz;
1822         struct iavf_adapter *adapter =
1823                 IAVF_DEV_PRIVATE_TO_ADAPTER(dev->data->dev_private);
1824         struct iavf_hw *hw = IAVF_DEV_PRIVATE_TO_HW(dev->data->dev_private);
1825         struct iavf_info *vf = IAVF_DEV_PRIVATE_TO_VF(dev->data->dev_private);
1826
1827         err = iavf_parse_devargs(dev);
1828         if (err) {
1829                 PMD_INIT_LOG(ERR, "Failed to parse devargs");
1830                 goto err;
1831         }
1832
1833         err = iavf_set_mac_type(hw);
1834         if (err) {
1835                 PMD_INIT_LOG(ERR, "set_mac_type failed: %d", err);
1836                 goto err;
1837         }
1838
1839         err = iavf_check_vf_reset_done(hw);
1840         if (err) {
1841                 PMD_INIT_LOG(ERR, "VF is still resetting");
1842                 goto err;
1843         }
1844
1845         iavf_init_adminq_parameter(hw);
1846         err = iavf_init_adminq(hw);
1847         if (err) {
1848                 PMD_INIT_LOG(ERR, "init_adminq failed: %d", err);
1849                 goto err;
1850         }
1851
1852         vf->aq_resp = rte_zmalloc("vf_aq_resp", IAVF_AQ_BUF_SZ, 0);
1853         if (!vf->aq_resp) {
1854                 PMD_INIT_LOG(ERR, "unable to allocate vf_aq_resp memory");
1855                 goto err_aq;
1856         }
1857         if (iavf_check_api_version(adapter) != 0) {
1858                 PMD_INIT_LOG(ERR, "check_api version failed");
1859                 goto err_api;
1860         }
1861
1862         bufsz = sizeof(struct virtchnl_vf_resource) +
1863                 (IAVF_MAX_VF_VSI * sizeof(struct virtchnl_vsi_resource));
1864         vf->vf_res = rte_zmalloc("vf_res", bufsz, 0);
1865         if (!vf->vf_res) {
1866                 PMD_INIT_LOG(ERR, "unable to allocate vf_res memory");
1867                 goto err_api;
1868         }
1869         if (iavf_get_vf_resource(adapter) != 0) {
1870                 PMD_INIT_LOG(ERR, "iavf_get_vf_config failed");
1871                 goto err_alloc;
1872         }
1873         /* Allocate memort for RSS info */
1874         if (vf->vf_res->vf_cap_flags & VIRTCHNL_VF_OFFLOAD_RSS_PF) {
1875                 vf->rss_key = rte_zmalloc("rss_key",
1876                                           vf->vf_res->rss_key_size, 0);
1877                 if (!vf->rss_key) {
1878                         PMD_INIT_LOG(ERR, "unable to allocate rss_key memory");
1879                         goto err_rss;
1880                 }
1881                 vf->rss_lut = rte_zmalloc("rss_lut",
1882                                           vf->vf_res->rss_lut_size, 0);
1883                 if (!vf->rss_lut) {
1884                         PMD_INIT_LOG(ERR, "unable to allocate rss_lut memory");
1885                         goto err_rss;
1886                 }
1887         }
1888
1889         if (vf->vf_res->vf_cap_flags & VIRTCHNL_VF_OFFLOAD_RX_FLEX_DESC) {
1890                 if (iavf_get_supported_rxdid(adapter) != 0) {
1891                         PMD_INIT_LOG(ERR, "failed to do get supported rxdid");
1892                         goto err_rss;
1893                 }
1894         }
1895
1896         iavf_init_proto_xtr(dev);
1897
1898         return 0;
1899 err_rss:
1900         rte_free(vf->rss_key);
1901         rte_free(vf->rss_lut);
1902 err_alloc:
1903         rte_free(vf->vf_res);
1904         vf->vsi_res = NULL;
1905 err_api:
1906         rte_free(vf->aq_resp);
1907 err_aq:
1908         iavf_shutdown_adminq(hw);
1909 err:
1910         return -1;
1911 }
1912
1913 /* Enable default admin queue interrupt setting */
1914 static inline void
1915 iavf_enable_irq0(struct iavf_hw *hw)
1916 {
1917         /* Enable admin queue interrupt trigger */
1918         IAVF_WRITE_REG(hw, IAVF_VFINT_ICR0_ENA1,
1919                        IAVF_VFINT_ICR0_ENA1_ADMINQ_MASK);
1920
1921         IAVF_WRITE_REG(hw, IAVF_VFINT_DYN_CTL01,
1922                        IAVF_VFINT_DYN_CTL01_INTENA_MASK |
1923                        IAVF_VFINT_DYN_CTL01_CLEARPBA_MASK |
1924                        IAVF_VFINT_DYN_CTL01_ITR_INDX_MASK);
1925
1926         IAVF_WRITE_FLUSH(hw);
1927 }
1928
1929 static inline void
1930 iavf_disable_irq0(struct iavf_hw *hw)
1931 {
1932         /* Disable all interrupt types */
1933         IAVF_WRITE_REG(hw, IAVF_VFINT_ICR0_ENA1, 0);
1934         IAVF_WRITE_REG(hw, IAVF_VFINT_DYN_CTL01,
1935                        IAVF_VFINT_DYN_CTL01_ITR_INDX_MASK);
1936         IAVF_WRITE_FLUSH(hw);
1937 }
1938
1939 static void
1940 iavf_dev_interrupt_handler(void *param)
1941 {
1942         struct rte_eth_dev *dev = (struct rte_eth_dev *)param;
1943         struct iavf_hw *hw = IAVF_DEV_PRIVATE_TO_HW(dev->data->dev_private);
1944
1945         iavf_disable_irq0(hw);
1946
1947         iavf_handle_virtchnl_msg(dev);
1948
1949         iavf_enable_irq0(hw);
1950 }
1951
1952 static int
1953 iavf_dev_filter_ctrl(struct rte_eth_dev *dev,
1954                      enum rte_filter_type filter_type,
1955                      enum rte_filter_op filter_op,
1956                      void *arg)
1957 {
1958         int ret = 0;
1959
1960         if (!dev)
1961                 return -EINVAL;
1962
1963         switch (filter_type) {
1964         case RTE_ETH_FILTER_GENERIC:
1965                 if (filter_op != RTE_ETH_FILTER_GET)
1966                         return -EINVAL;
1967                 *(const void **)arg = &iavf_flow_ops;
1968                 break;
1969         default:
1970                 PMD_DRV_LOG(WARNING, "Filter type (%d) not supported",
1971                             filter_type);
1972                 ret = -EINVAL;
1973                 break;
1974         }
1975
1976         return ret;
1977 }
1978
1979
1980 static int
1981 iavf_dev_init(struct rte_eth_dev *eth_dev)
1982 {
1983         struct iavf_adapter *adapter =
1984                 IAVF_DEV_PRIVATE_TO_ADAPTER(eth_dev->data->dev_private);
1985         struct iavf_hw *hw = IAVF_DEV_PRIVATE_TO_HW(adapter);
1986         struct rte_pci_device *pci_dev = RTE_ETH_DEV_TO_PCI(eth_dev);
1987         int ret = 0;
1988
1989         PMD_INIT_FUNC_TRACE();
1990
1991         /* assign ops func pointer */
1992         eth_dev->dev_ops = &iavf_eth_dev_ops;
1993         eth_dev->rx_queue_count = iavf_dev_rxq_count;
1994         eth_dev->rx_descriptor_status = iavf_dev_rx_desc_status;
1995         eth_dev->tx_descriptor_status = iavf_dev_tx_desc_status;
1996         eth_dev->rx_pkt_burst = &iavf_recv_pkts;
1997         eth_dev->tx_pkt_burst = &iavf_xmit_pkts;
1998         eth_dev->tx_pkt_prepare = &iavf_prep_pkts;
1999
2000         /* For secondary processes, we don't initialise any further as primary
2001          * has already done this work. Only check if we need a different RX
2002          * and TX function.
2003          */
2004         if (rte_eal_process_type() != RTE_PROC_PRIMARY) {
2005                 iavf_set_rx_function(eth_dev);
2006                 iavf_set_tx_function(eth_dev);
2007                 return 0;
2008         }
2009         rte_eth_copy_pci_info(eth_dev, pci_dev);
2010         eth_dev->data->dev_flags |= RTE_ETH_DEV_AUTOFILL_QUEUE_XSTATS;
2011
2012         hw->vendor_id = pci_dev->id.vendor_id;
2013         hw->device_id = pci_dev->id.device_id;
2014         hw->subsystem_vendor_id = pci_dev->id.subsystem_vendor_id;
2015         hw->subsystem_device_id = pci_dev->id.subsystem_device_id;
2016         hw->bus.bus_id = pci_dev->addr.bus;
2017         hw->bus.device = pci_dev->addr.devid;
2018         hw->bus.func = pci_dev->addr.function;
2019         hw->hw_addr = (void *)pci_dev->mem_resource[0].addr;
2020         hw->back = IAVF_DEV_PRIVATE_TO_ADAPTER(eth_dev->data->dev_private);
2021         adapter->eth_dev = eth_dev;
2022         adapter->stopped = 1;
2023
2024         if (iavf_init_vf(eth_dev) != 0) {
2025                 PMD_INIT_LOG(ERR, "Init vf failed");
2026                 return -1;
2027         }
2028
2029         /* set default ptype table */
2030         adapter->ptype_tbl = iavf_get_default_ptype_table();
2031
2032         /* copy mac addr */
2033         eth_dev->data->mac_addrs = rte_zmalloc(
2034                 "iavf_mac", RTE_ETHER_ADDR_LEN * IAVF_NUM_MACADDR_MAX, 0);
2035         if (!eth_dev->data->mac_addrs) {
2036                 PMD_INIT_LOG(ERR, "Failed to allocate %d bytes needed to"
2037                              " store MAC addresses",
2038                              RTE_ETHER_ADDR_LEN * IAVF_NUM_MACADDR_MAX);
2039                 return -ENOMEM;
2040         }
2041         /* If the MAC address is not configured by host,
2042          * generate a random one.
2043          */
2044         if (!rte_is_valid_assigned_ether_addr(
2045                         (struct rte_ether_addr *)hw->mac.addr))
2046                 rte_eth_random_addr(hw->mac.addr);
2047         rte_ether_addr_copy((struct rte_ether_addr *)hw->mac.addr,
2048                         &eth_dev->data->mac_addrs[0]);
2049
2050         /* register callback func to eal lib */
2051         rte_intr_callback_register(&pci_dev->intr_handle,
2052                                    iavf_dev_interrupt_handler,
2053                                    (void *)eth_dev);
2054
2055         /* enable uio intr after callback register */
2056         rte_intr_enable(&pci_dev->intr_handle);
2057
2058         /* configure and enable device interrupt */
2059         iavf_enable_irq0(hw);
2060
2061         ret = iavf_flow_init(adapter);
2062         if (ret) {
2063                 PMD_INIT_LOG(ERR, "Failed to initialize flow");
2064                 return ret;
2065         }
2066
2067         /* Set hena = 0 to ask PF to cleanup all existing RSS. */
2068         ret = iavf_set_hena(adapter, 0);
2069         if (ret) {
2070                 PMD_DRV_LOG(ERR, "fail to disable default PF RSS");
2071                 return ret;
2072         }
2073
2074         return 0;
2075 }
2076
2077 static int
2078 iavf_dev_close(struct rte_eth_dev *dev)
2079 {
2080         struct iavf_hw *hw = IAVF_DEV_PRIVATE_TO_HW(dev->data->dev_private);
2081         struct rte_pci_device *pci_dev = RTE_ETH_DEV_TO_PCI(dev);
2082         struct rte_intr_handle *intr_handle = &pci_dev->intr_handle;
2083         struct iavf_adapter *adapter =
2084                 IAVF_DEV_PRIVATE_TO_ADAPTER(dev->data->dev_private);
2085         struct iavf_info *vf = IAVF_DEV_PRIVATE_TO_VF(dev->data->dev_private);
2086         int ret;
2087
2088         if (rte_eal_process_type() != RTE_PROC_PRIMARY)
2089                 return 0;
2090
2091         ret = iavf_dev_stop(dev);
2092
2093         iavf_flow_flush(dev, NULL);
2094         iavf_flow_uninit(adapter);
2095
2096         /*
2097          * disable promiscuous mode before reset vf
2098          * it is a workaround solution when work with kernel driver
2099          * and it is not the normal way
2100          */
2101         if (vf->promisc_unicast_enabled || vf->promisc_multicast_enabled)
2102                 iavf_config_promisc(adapter, false, false);
2103
2104         iavf_shutdown_adminq(hw);
2105         /* disable uio intr before callback unregister */
2106         rte_intr_disable(intr_handle);
2107
2108         /* unregister callback func from eal lib */
2109         rte_intr_callback_unregister(intr_handle,
2110                                      iavf_dev_interrupt_handler, dev);
2111         iavf_disable_irq0(hw);
2112
2113         if (vf->vf_res->vf_cap_flags & VIRTCHNL_VF_OFFLOAD_RSS_PF) {
2114                 if (vf->rss_lut) {
2115                         rte_free(vf->rss_lut);
2116                         vf->rss_lut = NULL;
2117                 }
2118                 if (vf->rss_key) {
2119                         rte_free(vf->rss_key);
2120                         vf->rss_key = NULL;
2121                 }
2122         }
2123
2124         rte_free(vf->vf_res);
2125         vf->vsi_res = NULL;
2126         vf->vf_res = NULL;
2127
2128         rte_free(vf->aq_resp);
2129         vf->aq_resp = NULL;
2130
2131         vf->vf_reset = false;
2132
2133         return ret;
2134 }
2135
2136 static int
2137 iavf_dev_uninit(struct rte_eth_dev *dev)
2138 {
2139         if (rte_eal_process_type() != RTE_PROC_PRIMARY)
2140                 return -EPERM;
2141
2142         iavf_dev_close(dev);
2143
2144         return 0;
2145 }
2146
2147 /*
2148  * Reset VF device only to re-initialize resources in PMD layer
2149  */
2150 static int
2151 iavf_dev_reset(struct rte_eth_dev *dev)
2152 {
2153         int ret;
2154
2155         ret = iavf_dev_uninit(dev);
2156         if (ret)
2157                 return ret;
2158
2159         return iavf_dev_init(dev);
2160 }
2161
2162 static int
2163 iavf_dcf_cap_check_handler(__rte_unused const char *key,
2164                            const char *value, __rte_unused void *opaque)
2165 {
2166         if (strcmp(value, "dcf"))
2167                 return -1;
2168
2169         return 0;
2170 }
2171
2172 static int
2173 iavf_dcf_cap_selected(struct rte_devargs *devargs)
2174 {
2175         struct rte_kvargs *kvlist;
2176         const char *key = "cap";
2177         int ret = 0;
2178
2179         if (devargs == NULL)
2180                 return 0;
2181
2182         kvlist = rte_kvargs_parse(devargs->args, NULL);
2183         if (kvlist == NULL)
2184                 return 0;
2185
2186         if (!rte_kvargs_count(kvlist, key))
2187                 goto exit;
2188
2189         /* dcf capability selected when there's a key-value pair: cap=dcf */
2190         if (rte_kvargs_process(kvlist, key,
2191                                iavf_dcf_cap_check_handler, NULL) < 0)
2192                 goto exit;
2193
2194         ret = 1;
2195
2196 exit:
2197         rte_kvargs_free(kvlist);
2198         return ret;
2199 }
2200
2201 static int eth_iavf_pci_probe(struct rte_pci_driver *pci_drv __rte_unused,
2202                              struct rte_pci_device *pci_dev)
2203 {
2204         if (iavf_dcf_cap_selected(pci_dev->device.devargs))
2205                 return 1;
2206
2207         return rte_eth_dev_pci_generic_probe(pci_dev,
2208                 sizeof(struct iavf_adapter), iavf_dev_init);
2209 }
2210
2211 static int eth_iavf_pci_remove(struct rte_pci_device *pci_dev)
2212 {
2213         return rte_eth_dev_pci_generic_remove(pci_dev, iavf_dev_uninit);
2214 }
2215
2216 /* Adaptive virtual function driver struct */
2217 static struct rte_pci_driver rte_iavf_pmd = {
2218         .id_table = pci_id_iavf_map,
2219         .drv_flags = RTE_PCI_DRV_NEED_MAPPING | RTE_PCI_DRV_INTR_LSC,
2220         .probe = eth_iavf_pci_probe,
2221         .remove = eth_iavf_pci_remove,
2222 };
2223
2224 RTE_PMD_REGISTER_PCI(net_iavf, rte_iavf_pmd);
2225 RTE_PMD_REGISTER_PCI_TABLE(net_iavf, pci_id_iavf_map);
2226 RTE_PMD_REGISTER_KMOD_DEP(net_iavf, "* igb_uio | vfio-pci");
2227 RTE_PMD_REGISTER_PARAM_STRING(net_iavf, "cap=dcf");
2228 RTE_LOG_REGISTER(iavf_logtype_init, pmd.net.iavf.init, NOTICE);
2229 RTE_LOG_REGISTER(iavf_logtype_driver, pmd.net.iavf.driver, NOTICE);
2230 #ifdef RTE_LIBRTE_IAVF_DEBUG_RX
2231 RTE_LOG_REGISTER(iavf_logtype_rx, pmd.net.iavf.rx, DEBUG);
2232 #endif
2233 #ifdef RTE_LIBRTE_IAVF_DEBUG_TX
2234 RTE_LOG_REGISTER(iavf_logtype_tx, pmd.net.iavf.tx, DEBUG);
2235 #endif
2236 #ifdef RTE_LIBRTE_IAVF_DEBUG_TX_FREE
2237 RTE_LOG_REGISTER(iavf_logtype_tx_free, pmd.net.iavf.tx_free, DEBUG);
2238 #endif