ethdev: allow drivers to return error on close
[dpdk.git] / drivers / net / octeontx / octeontx_ethdev.c
1 /* SPDX-License-Identifier: BSD-3-Clause
2  * Copyright(c) 2017 Cavium, Inc
3  */
4
#include <errno.h>
#include <limits.h>
#include <stdio.h>
#include <stdarg.h>
#include <stdbool.h>
#include <stdint.h>
#include <stdlib.h>
#include <string.h>
#include <unistd.h>

#include <rte_alarm.h>
#include <rte_branch_prediction.h>
#include <rte_bus_vdev.h>
#include <rte_cycles.h>
#include <rte_debug.h>
#include <rte_devargs.h>
#include <rte_dev.h>
#include <rte_kvargs.h>
#include <rte_malloc.h>
#include <rte_mbuf_pool_ops.h>
#include <rte_prefetch.h>

#include "octeontx_ethdev.h"
#include "octeontx_rxtx.h"
#include "octeontx_logs.h"
26 #include "octeontx_logs.h"
27
28 struct evdev_priv_data {
29         OFFLOAD_FLAGS; /*Sequence should not be changed */
30 } __rte_cache_aligned;
31
/* Parameters collected from the vdev argument string. */
struct octeontx_vdev_init_params {
	/* Value of the OCTEONTX_VDEV_NR_PORT_ARG key. */
	uint8_t nr_port;
};
35
36 uint16_t
37 rte_octeontx_pchan_map[OCTEONTX_MAX_BGX_PORTS][OCTEONTX_MAX_LMAC_PER_BGX];
38
/*
 * Link mode codes compared against nic->speed when translating the port
 * mode into an ethdev link speed. The numeric values are spelled out so
 * that they cannot shift if an entry is ever inserted.
 */
enum octeontx_link_speed {
	OCTEONTX_LINK_SPEED_SGMII    = 0,
	OCTEONTX_LINK_SPEED_XAUI     = 1,
	OCTEONTX_LINK_SPEED_RXAUI    = 2,
	OCTEONTX_LINK_SPEED_10G_R    = 3,
	OCTEONTX_LINK_SPEED_40G_R    = 4,
	OCTEONTX_LINK_SPEED_RESERVE1 = 5,
	OCTEONTX_LINK_SPEED_QSGMII   = 6,
	OCTEONTX_LINK_SPEED_RESERVE2 = 7
};
49
50 RTE_LOG_REGISTER(otx_net_logtype_mbox, pmd.net.octeontx.mbox, NOTICE);
51 RTE_LOG_REGISTER(otx_net_logtype_init, pmd.net.octeontx.init, NOTICE);
52 RTE_LOG_REGISTER(otx_net_logtype_driver, pmd.net.octeontx.driver, NOTICE);
53
54 /* Parse integer from integer argument */
55 static int
56 parse_integer_arg(const char *key __rte_unused,
57                 const char *value, void *extra_args)
58 {
59         int *i = (int *)extra_args;
60
61         *i = atoi(value);
62         if (*i < 0) {
63                 octeontx_log_err("argument has to be positive.");
64                 return -1;
65         }
66
67         return 0;
68 }
69
70 static int
71 octeontx_parse_vdev_init_params(struct octeontx_vdev_init_params *params,
72                                 struct rte_vdev_device *dev)
73 {
74         struct rte_kvargs *kvlist = NULL;
75         int ret = 0;
76
77         static const char * const octeontx_vdev_valid_params[] = {
78                 OCTEONTX_VDEV_NR_PORT_ARG,
79                 NULL
80         };
81
82         const char *input_args = rte_vdev_device_args(dev);
83         if (params == NULL)
84                 return -EINVAL;
85
86
87         if (input_args) {
88                 kvlist = rte_kvargs_parse(input_args,
89                                 octeontx_vdev_valid_params);
90                 if (kvlist == NULL)
91                         return -1;
92
93                 ret = rte_kvargs_process(kvlist,
94                                         OCTEONTX_VDEV_NR_PORT_ARG,
95                                         &parse_integer_arg,
96                                         &params->nr_port);
97                 if (ret < 0)
98                         goto free_kvlist;
99         }
100
101 free_kvlist:
102         rte_kvargs_free(kvlist);
103         return ret;
104 }
105
106 static int
107 octeontx_port_open(struct octeontx_nic *nic)
108 {
109         octeontx_mbox_bgx_port_conf_t bgx_port_conf;
110         octeontx_mbox_bgx_port_fifo_cfg_t fifo_cfg;
111         int res;
112
113         res = 0;
114         memset(&bgx_port_conf, 0x0, sizeof(bgx_port_conf));
115         PMD_INIT_FUNC_TRACE();
116
117         res = octeontx_bgx_port_open(nic->port_id, &bgx_port_conf);
118         if (res < 0) {
119                 octeontx_log_err("failed to open port %d", res);
120                 return res;
121         }
122
123         nic->node = bgx_port_conf.node;
124         nic->port_ena = bgx_port_conf.enable;
125         nic->base_ichan = bgx_port_conf.base_chan;
126         nic->base_ochan = bgx_port_conf.base_chan;
127         nic->num_ichans = bgx_port_conf.num_chans;
128         nic->num_ochans = bgx_port_conf.num_chans;
129         nic->bgx_mtu = bgx_port_conf.mtu;
130         nic->bpen = bgx_port_conf.bpen;
131         nic->fcs_strip = bgx_port_conf.fcs_strip;
132         nic->bcast_mode = bgx_port_conf.bcast_mode;
133         nic->mcast_mode = bgx_port_conf.mcast_mode;
134         nic->speed      = bgx_port_conf.mode;
135
136         memset(&fifo_cfg, 0x0, sizeof(fifo_cfg));
137
138         res = octeontx_bgx_port_get_fifo_cfg(nic->port_id, &fifo_cfg);
139         if (res < 0) {
140                 octeontx_log_err("failed to get port %d fifo cfg", res);
141                 return res;
142         }
143
144         nic->fc.rx_fifosz = fifo_cfg.rx_fifosz;
145
146         memcpy(&nic->mac_addr[0], &bgx_port_conf.macaddr[0],
147                 RTE_ETHER_ADDR_LEN);
148
149         octeontx_log_dbg("port opened %d", nic->port_id);
150         return res;
151 }
152
153 static void
154 octeontx_link_status_print(struct rte_eth_dev *eth_dev,
155                            struct rte_eth_link *link)
156 {
157         if (link && link->link_status)
158                 octeontx_log_info("Port %u: Link Up - speed %u Mbps - %s",
159                           (eth_dev->data->port_id),
160                           link->link_speed,
161                           link->link_duplex == ETH_LINK_FULL_DUPLEX ?
162                           "full-duplex" : "half-duplex");
163         else
164                 octeontx_log_info("Port %d: Link Down",
165                                   (int)(eth_dev->data->port_id));
166 }
167
168 static void
169 octeontx_link_status_update(struct octeontx_nic *nic,
170                          struct rte_eth_link *link)
171 {
172         memset(link, 0, sizeof(*link));
173
174         link->link_status = nic->link_up ? ETH_LINK_UP : ETH_LINK_DOWN;
175
176         switch (nic->speed) {
177         case OCTEONTX_LINK_SPEED_SGMII:
178                 link->link_speed = ETH_SPEED_NUM_1G;
179                 break;
180
181         case OCTEONTX_LINK_SPEED_XAUI:
182                 link->link_speed = ETH_SPEED_NUM_10G;
183                 break;
184
185         case OCTEONTX_LINK_SPEED_RXAUI:
186         case OCTEONTX_LINK_SPEED_10G_R:
187                 link->link_speed = ETH_SPEED_NUM_10G;
188                 break;
189         case OCTEONTX_LINK_SPEED_QSGMII:
190                 link->link_speed = ETH_SPEED_NUM_5G;
191                 break;
192         case OCTEONTX_LINK_SPEED_40G_R:
193                 link->link_speed = ETH_SPEED_NUM_40G;
194                 break;
195
196         case OCTEONTX_LINK_SPEED_RESERVE1:
197         case OCTEONTX_LINK_SPEED_RESERVE2:
198         default:
199                 link->link_speed = ETH_SPEED_NUM_NONE;
200                 octeontx_log_err("incorrect link speed %d", nic->speed);
201                 break;
202         }
203
204         link->link_duplex = ETH_LINK_FULL_DUPLEX;
205         link->link_autoneg = ETH_LINK_AUTONEG;
206 }
207
208 static void
209 octeontx_link_status_poll(void *arg)
210 {
211         struct octeontx_nic *nic = arg;
212         struct rte_eth_link link;
213         struct rte_eth_dev *dev;
214         int res;
215
216         PMD_INIT_FUNC_TRACE();
217
218         dev = nic->dev;
219
220         res = octeontx_bgx_port_link_status(nic->port_id);
221         if (res < 0) {
222                 octeontx_log_err("Failed to get port %d link status",
223                                 nic->port_id);
224         } else {
225                 if (nic->link_up != (uint8_t)res) {
226                         nic->link_up = (uint8_t)res;
227                         octeontx_link_status_update(nic, &link);
228                         octeontx_link_status_print(dev, &link);
229                         rte_eth_linkstatus_set(dev, &link);
230                         rte_eth_dev_callback_process(dev,
231                                                      RTE_ETH_EVENT_INTR_LSC,
232                                                      NULL);
233                 }
234         }
235
236         res = rte_eal_alarm_set(OCCTX_INTR_POLL_INTERVAL_MS * 1000,
237                                 octeontx_link_status_poll, nic);
238         if (res < 0)
239                 octeontx_log_err("Failed to restart alarm for port %d, err: %d",
240                                 nic->port_id, res);
241 }
242
243 static void
244 octeontx_port_close(struct octeontx_nic *nic)
245 {
246         PMD_INIT_FUNC_TRACE();
247
248         rte_eal_alarm_cancel(octeontx_link_status_poll, nic);
249         octeontx_bgx_port_close(nic->port_id);
250         octeontx_log_dbg("port closed %d", nic->port_id);
251 }
252
253 static int
254 octeontx_port_start(struct octeontx_nic *nic)
255 {
256         PMD_INIT_FUNC_TRACE();
257
258         return octeontx_bgx_port_start(nic->port_id);
259 }
260
261 static int
262 octeontx_port_stop(struct octeontx_nic *nic)
263 {
264         PMD_INIT_FUNC_TRACE();
265
266         return octeontx_bgx_port_stop(nic->port_id);
267 }
268
269 static int
270 octeontx_port_promisc_set(struct octeontx_nic *nic, int en)
271 {
272         struct rte_eth_dev *dev;
273         int res;
274
275         res = 0;
276         PMD_INIT_FUNC_TRACE();
277         dev = nic->dev;
278
279         res = octeontx_bgx_port_promisc_set(nic->port_id, en);
280         if (res < 0) {
281                 octeontx_log_err("failed to set promiscuous mode %d",
282                                 nic->port_id);
283                 return res;
284         }
285
286         /* Set proper flag for the mode */
287         dev->data->promiscuous = (en != 0) ? 1 : 0;
288
289         octeontx_log_dbg("port %d : promiscuous mode %s",
290                         nic->port_id, en ? "set" : "unset");
291
292         return 0;
293 }
294
295 static int
296 octeontx_port_stats(struct octeontx_nic *nic, struct rte_eth_stats *stats)
297 {
298         octeontx_mbox_bgx_port_stats_t bgx_stats;
299         int res;
300
301         PMD_INIT_FUNC_TRACE();
302
303         res = octeontx_bgx_port_stats(nic->port_id, &bgx_stats);
304         if (res < 0) {
305                 octeontx_log_err("failed to get port stats %d", nic->port_id);
306                 return res;
307         }
308
309         stats->ipackets = bgx_stats.rx_packets;
310         stats->ibytes = bgx_stats.rx_bytes;
311         stats->imissed = bgx_stats.rx_dropped;
312         stats->ierrors = bgx_stats.rx_errors;
313         stats->opackets = bgx_stats.tx_packets;
314         stats->obytes = bgx_stats.tx_bytes;
315         stats->oerrors = bgx_stats.tx_errors;
316
317         octeontx_log_dbg("port%d stats inpkts=%" PRIx64 " outpkts=%" PRIx64 "",
318                         nic->port_id, stats->ipackets, stats->opackets);
319
320         return 0;
321 }
322
323 static int
324 octeontx_port_stats_clr(struct octeontx_nic *nic)
325 {
326         PMD_INIT_FUNC_TRACE();
327
328         return octeontx_bgx_port_stats_clr(nic->port_id);
329 }
330
331 static inline void
332 devconf_set_default_sane_values(struct rte_event_dev_config *dev_conf,
333                                 struct rte_event_dev_info *info)
334 {
335         memset(dev_conf, 0, sizeof(struct rte_event_dev_config));
336         dev_conf->dequeue_timeout_ns = info->min_dequeue_timeout_ns;
337
338         dev_conf->nb_event_ports = info->max_event_ports;
339         dev_conf->nb_event_queues = info->max_event_queues;
340
341         dev_conf->nb_event_queue_flows = info->max_event_queue_flows;
342         dev_conf->nb_event_port_dequeue_depth =
343                         info->max_event_port_dequeue_depth;
344         dev_conf->nb_event_port_enqueue_depth =
345                         info->max_event_port_enqueue_depth;
346         dev_conf->nb_event_port_enqueue_depth =
347                         info->max_event_port_enqueue_depth;
348         dev_conf->nb_events_limit =
349                         info->max_num_events;
350 }
351
352 static uint16_t
353 octeontx_tx_offload_flags(struct rte_eth_dev *eth_dev)
354 {
355         struct octeontx_nic *nic = octeontx_pmd_priv(eth_dev);
356         uint16_t flags = 0;
357
358         if (nic->tx_offloads & DEV_TX_OFFLOAD_OUTER_IPV4_CKSUM ||
359             nic->tx_offloads & DEV_TX_OFFLOAD_OUTER_UDP_CKSUM)
360                 flags |= OCCTX_TX_OFFLOAD_OL3_OL4_CSUM_F;
361
362         if (nic->tx_offloads & DEV_TX_OFFLOAD_IPV4_CKSUM ||
363             nic->tx_offloads & DEV_TX_OFFLOAD_TCP_CKSUM ||
364             nic->tx_offloads & DEV_TX_OFFLOAD_UDP_CKSUM ||
365             nic->tx_offloads & DEV_TX_OFFLOAD_SCTP_CKSUM)
366                 flags |= OCCTX_TX_OFFLOAD_L3_L4_CSUM_F;
367
368         if (!(nic->tx_offloads & DEV_TX_OFFLOAD_MBUF_FAST_FREE))
369                 flags |= OCCTX_TX_OFFLOAD_MBUF_NOFF_F;
370
371         if (nic->tx_offloads & DEV_TX_OFFLOAD_MULTI_SEGS)
372                 flags |= OCCTX_TX_MULTI_SEG_F;
373
374         return flags;
375 }
376
377 static uint16_t
378 octeontx_rx_offload_flags(struct rte_eth_dev *eth_dev)
379 {
380         struct octeontx_nic *nic = octeontx_pmd_priv(eth_dev);
381         uint16_t flags = 0;
382
383         if (nic->rx_offloads & (DEV_RX_OFFLOAD_TCP_CKSUM |
384                          DEV_RX_OFFLOAD_UDP_CKSUM))
385                 flags |= OCCTX_RX_OFFLOAD_CSUM_F;
386
387         if (nic->rx_offloads & (DEV_RX_OFFLOAD_IPV4_CKSUM |
388                                 DEV_RX_OFFLOAD_OUTER_IPV4_CKSUM))
389                 flags |= OCCTX_RX_OFFLOAD_CSUM_F;
390
391         if (nic->rx_offloads & DEV_RX_OFFLOAD_SCATTER) {
392                 flags |= OCCTX_RX_MULTI_SEG_F;
393                 eth_dev->data->scattered_rx = 1;
394                 /* If scatter mode is enabled, TX should also be in multi
395                  * seg mode, else memory leak will occur
396                  */
397                 nic->tx_offloads |= DEV_TX_OFFLOAD_MULTI_SEGS;
398         }
399
400         return flags;
401 }
402
403 static int
404 octeontx_dev_configure(struct rte_eth_dev *dev)
405 {
406         struct rte_eth_dev_data *data = dev->data;
407         struct rte_eth_conf *conf = &data->dev_conf;
408         struct rte_eth_rxmode *rxmode = &conf->rxmode;
409         struct rte_eth_txmode *txmode = &conf->txmode;
410         struct octeontx_nic *nic = octeontx_pmd_priv(dev);
411         int ret;
412
413         PMD_INIT_FUNC_TRACE();
414         RTE_SET_USED(conf);
415
416         if (!rte_eal_has_hugepages()) {
417                 octeontx_log_err("huge page is not configured");
418                 return -EINVAL;
419         }
420
421         if (txmode->mq_mode) {
422                 octeontx_log_err("tx mq_mode DCB or VMDq not supported");
423                 return -EINVAL;
424         }
425
426         if (rxmode->mq_mode != ETH_MQ_RX_NONE &&
427                 rxmode->mq_mode != ETH_MQ_RX_RSS) {
428                 octeontx_log_err("unsupported rx qmode %d", rxmode->mq_mode);
429                 return -EINVAL;
430         }
431
432         if (!(txmode->offloads & DEV_TX_OFFLOAD_MT_LOCKFREE)) {
433                 PMD_INIT_LOG(NOTICE, "cant disable lockfree tx");
434                 txmode->offloads |= DEV_TX_OFFLOAD_MT_LOCKFREE;
435         }
436
437         if (conf->link_speeds & ETH_LINK_SPEED_FIXED) {
438                 octeontx_log_err("setting link speed/duplex not supported");
439                 return -EINVAL;
440         }
441
442         if (conf->dcb_capability_en) {
443                 octeontx_log_err("DCB enable not supported");
444                 return -EINVAL;
445         }
446
447         if (conf->fdir_conf.mode != RTE_FDIR_MODE_NONE) {
448                 octeontx_log_err("flow director not supported");
449                 return -EINVAL;
450         }
451
452         nic->num_tx_queues = dev->data->nb_tx_queues;
453
454         ret = octeontx_pko_channel_open(nic->pko_vfid * PKO_VF_NUM_DQ,
455                                         nic->num_tx_queues,
456                                         nic->base_ochan);
457         if (ret) {
458                 octeontx_log_err("failed to open channel %d no-of-txq %d",
459                            nic->base_ochan, nic->num_tx_queues);
460                 return -EFAULT;
461         }
462
463         ret = octeontx_dev_vlan_offload_init(dev);
464         if (ret) {
465                 octeontx_log_err("failed to initialize vlan offload");
466                 return -EFAULT;
467         }
468
469         nic->pki.classifier_enable = false;
470         nic->pki.hash_enable = true;
471         nic->pki.initialized = false;
472
473         nic->rx_offloads |= rxmode->offloads;
474         nic->tx_offloads |= txmode->offloads;
475         nic->rx_offload_flags |= octeontx_rx_offload_flags(dev);
476         nic->tx_offload_flags |= octeontx_tx_offload_flags(dev);
477
478         return 0;
479 }
480
481 static int
482 octeontx_dev_close(struct rte_eth_dev *dev)
483 {
484         struct octeontx_txq *txq = NULL;
485         struct octeontx_nic *nic = octeontx_pmd_priv(dev);
486         unsigned int i;
487         int ret;
488
489         PMD_INIT_FUNC_TRACE();
490
491         rte_event_dev_close(nic->evdev);
492
493         octeontx_dev_flow_ctrl_fini(dev);
494
495         octeontx_dev_vlan_offload_fini(dev);
496
497         ret = octeontx_pko_channel_close(nic->base_ochan);
498         if (ret < 0) {
499                 octeontx_log_err("failed to close channel %d VF%d %d %d",
500                              nic->base_ochan, nic->port_id, nic->num_tx_queues,
501                              ret);
502         }
503         /* Free txq resources for this port */
504         for (i = 0; i < nic->num_tx_queues; i++) {
505                 txq = dev->data->tx_queues[i];
506                 if (!txq)
507                         continue;
508
509                 rte_free(txq);
510         }
511
512         /* Free MAC address table */
513         rte_free(dev->data->mac_addrs);
514         dev->data->mac_addrs = NULL;
515
516         octeontx_port_close(nic);
517
518         dev->tx_pkt_burst = NULL;
519         dev->rx_pkt_burst = NULL;
520
521         return 0;
522 }
523
524 static int
525 octeontx_dev_mtu_set(struct rte_eth_dev *eth_dev, uint16_t mtu)
526 {
527         uint32_t buffsz, frame_size = mtu + OCCTX_L2_OVERHEAD;
528         struct octeontx_nic *nic = octeontx_pmd_priv(eth_dev);
529         struct rte_eth_dev_data *data = eth_dev->data;
530         int rc = 0;
531
532         /* Check if MTU is within the allowed range */
533         if (frame_size < OCCTX_MIN_FRS || frame_size > OCCTX_MAX_FRS)
534                 return -EINVAL;
535
536         buffsz = data->min_rx_buf_size - RTE_PKTMBUF_HEADROOM;
537
538         /* Refuse MTU that requires the support of scattered packets
539          * when this feature has not been enabled before.
540          */
541         if (data->dev_started && frame_size > buffsz &&
542             !(nic->rx_offloads & DEV_RX_OFFLOAD_SCATTER)) {
543                 octeontx_log_err("Scatter mode is disabled");
544                 return -EINVAL;
545         }
546
547         /* Check <seg size> * <max_seg>  >= max_frame */
548         if ((nic->rx_offloads & DEV_RX_OFFLOAD_SCATTER) &&
549             (frame_size > buffsz * OCCTX_RX_NB_SEG_MAX))
550                 return -EINVAL;
551
552         rc = octeontx_pko_send_mtu(nic->port_id, frame_size);
553         if (rc)
554                 return rc;
555
556         rc = octeontx_bgx_port_mtu_set(nic->port_id, frame_size);
557         if (rc)
558                 return rc;
559
560         if (frame_size > RTE_ETHER_MAX_LEN)
561                 nic->rx_offloads |= DEV_RX_OFFLOAD_JUMBO_FRAME;
562         else
563                 nic->rx_offloads &= ~DEV_RX_OFFLOAD_JUMBO_FRAME;
564
565         /* Update max_rx_pkt_len */
566         data->dev_conf.rxmode.max_rx_pkt_len = frame_size;
567         octeontx_log_info("Received pkt beyond  maxlen %d will be dropped",
568                           frame_size);
569
570         return rc;
571 }
572
573 static int
574 octeontx_recheck_rx_offloads(struct octeontx_rxq *rxq)
575 {
576         struct rte_eth_dev *eth_dev = rxq->eth_dev;
577         struct octeontx_nic *nic = octeontx_pmd_priv(eth_dev);
578         struct rte_eth_dev_data *data = eth_dev->data;
579         struct rte_pktmbuf_pool_private *mbp_priv;
580         struct evdev_priv_data *evdev_priv;
581         struct rte_eventdev *dev;
582         uint32_t buffsz;
583
584         /* Get rx buffer size */
585         mbp_priv = rte_mempool_get_priv(rxq->pool);
586         buffsz = mbp_priv->mbuf_data_room_size - RTE_PKTMBUF_HEADROOM;
587
588         /* Setup scatter mode if needed by jumbo */
589         if (data->dev_conf.rxmode.max_rx_pkt_len > buffsz) {
590                 nic->rx_offloads |= DEV_RX_OFFLOAD_SCATTER;
591                 nic->rx_offload_flags |= octeontx_rx_offload_flags(eth_dev);
592                 nic->tx_offload_flags |= octeontx_tx_offload_flags(eth_dev);
593         }
594
595         /* Sharing offload flags via eventdev priv region */
596         dev = &rte_eventdevs[rxq->evdev];
597         evdev_priv = dev->data->dev_private;
598         evdev_priv->rx_offload_flags = nic->rx_offload_flags;
599         evdev_priv->tx_offload_flags = nic->tx_offload_flags;
600
601         /* Setup MTU based on max_rx_pkt_len */
602         nic->mtu = data->dev_conf.rxmode.max_rx_pkt_len - OCCTX_L2_OVERHEAD;
603
604         return 0;
605 }
606
607 static int
608 octeontx_dev_start(struct rte_eth_dev *dev)
609 {
610         struct octeontx_nic *nic = octeontx_pmd_priv(dev);
611         struct octeontx_rxq *rxq;
612         int ret, i;
613
614         PMD_INIT_FUNC_TRACE();
615         /* Rechecking if any new offload set to update
616          * rx/tx burst function pointer accordingly.
617          */
618         for (i = 0; i < dev->data->nb_rx_queues; i++) {
619                 rxq = dev->data->rx_queues[i];
620                 octeontx_recheck_rx_offloads(rxq);
621         }
622
623         /* Setting up the mtu based on max_rx_pkt_len */
624         ret = octeontx_dev_mtu_set(dev, nic->mtu);
625         if (ret) {
626                 octeontx_log_err("Failed to set default MTU size %d", ret);
627                 goto error;
628         }
629
630         /*
631          * Tx start
632          */
633         octeontx_set_tx_function(dev);
634         ret = octeontx_pko_channel_start(nic->base_ochan);
635         if (ret < 0) {
636                 octeontx_log_err("fail to conf VF%d no. txq %d chan %d ret %d",
637                            nic->port_id, nic->num_tx_queues, nic->base_ochan,
638                            ret);
639                 goto error;
640         }
641
642         /*
643          * Rx start
644          */
645         dev->rx_pkt_burst = octeontx_recv_pkts;
646         ret = octeontx_pki_port_start(nic->port_id);
647         if (ret < 0) {
648                 octeontx_log_err("fail to start Rx on port %d", nic->port_id);
649                 goto channel_stop_error;
650         }
651
652         /*
653          * Start port
654          */
655         ret = octeontx_port_start(nic);
656         if (ret < 0) {
657                 octeontx_log_err("failed start port %d", ret);
658                 goto pki_port_stop_error;
659         }
660
661         PMD_TX_LOG(DEBUG, "pko: start channel %d no.of txq %d port %d",
662                         nic->base_ochan, nic->num_tx_queues, nic->port_id);
663
664         ret = rte_event_dev_start(nic->evdev);
665         if (ret < 0) {
666                 octeontx_log_err("failed to start evdev: ret (%d)", ret);
667                 goto pki_port_stop_error;
668         }
669
670         /* Success */
671         return ret;
672
673 pki_port_stop_error:
674         octeontx_pki_port_stop(nic->port_id);
675 channel_stop_error:
676         octeontx_pko_channel_stop(nic->base_ochan);
677 error:
678         return ret;
679 }
680
681 static void
682 octeontx_dev_stop(struct rte_eth_dev *dev)
683 {
684         struct octeontx_nic *nic = octeontx_pmd_priv(dev);
685         int ret;
686
687         PMD_INIT_FUNC_TRACE();
688
689         rte_event_dev_stop(nic->evdev);
690
691         ret = octeontx_port_stop(nic);
692         if (ret < 0) {
693                 octeontx_log_err("failed to req stop port %d res=%d",
694                                         nic->port_id, ret);
695                 return;
696         }
697
698         ret = octeontx_pki_port_stop(nic->port_id);
699         if (ret < 0) {
700                 octeontx_log_err("failed to stop pki port %d res=%d",
701                                         nic->port_id, ret);
702                 return;
703         }
704
705         ret = octeontx_pko_channel_stop(nic->base_ochan);
706         if (ret < 0) {
707                 octeontx_log_err("failed to stop channel %d VF%d %d %d",
708                              nic->base_ochan, nic->port_id, nic->num_tx_queues,
709                              ret);
710                 return;
711         }
712 }
713
/* ethdev callback: turn promiscuous mode on for the port of @dev. */
static int
octeontx_dev_promisc_enable(struct rte_eth_dev *dev)
{
	struct octeontx_nic *nic;

	nic = octeontx_pmd_priv(dev);
	PMD_INIT_FUNC_TRACE();

	return octeontx_port_promisc_set(nic, 1);
}
722
/* ethdev callback: turn promiscuous mode off for the port of @dev. */
static int
octeontx_dev_promisc_disable(struct rte_eth_dev *dev)
{
	struct octeontx_nic *nic;

	nic = octeontx_pmd_priv(dev);
	PMD_INIT_FUNC_TRACE();

	return octeontx_port_promisc_set(nic, 0);
}
731
732 static int
733 octeontx_port_link_status(struct octeontx_nic *nic)
734 {
735         int res;
736
737         PMD_INIT_FUNC_TRACE();
738         res = octeontx_bgx_port_link_status(nic->port_id);
739         if (res < 0) {
740                 octeontx_log_err("failed to get port %d link status",
741                                 nic->port_id);
742                 return res;
743         }
744
745         if (nic->link_up != (uint8_t)res || nic->print_flag == -1) {
746                 nic->link_up = (uint8_t)res;
747                 nic->print_flag = 1;
748         }
749         octeontx_log_dbg("port %d link status %d", nic->port_id, nic->link_up);
750
751         return res;
752 }
753
754 /*
755  * Return 0 means link status changed, -1 means not changed
756  */
757 static int
758 octeontx_dev_link_update(struct rte_eth_dev *dev,
759                          int wait_to_complete __rte_unused)
760 {
761         struct octeontx_nic *nic = octeontx_pmd_priv(dev);
762         struct rte_eth_link link;
763         int res;
764
765         PMD_INIT_FUNC_TRACE();
766
767         res = octeontx_port_link_status(nic);
768         if (res < 0) {
769                 octeontx_log_err("failed to request link status %d", res);
770                 return res;
771         }
772
773         octeontx_link_status_update(nic, &link);
774         if (nic->print_flag) {
775                 octeontx_link_status_print(nic->dev, &link);
776                 nic->print_flag = 0;
777         }
778
779         return rte_eth_linkstatus_set(dev, &link);
780 }
781
/* ethdev callback: fill @stats from the counters of the port of @dev. */
static int
octeontx_dev_stats_get(struct rte_eth_dev *dev, struct rte_eth_stats *stats)
{
	struct octeontx_nic *nic;

	nic = octeontx_pmd_priv(dev);
	PMD_INIT_FUNC_TRACE();

	return octeontx_port_stats(nic, stats);
}
790
/* ethdev callback: clear the counters of the port of @dev. */
static int
octeontx_dev_stats_reset(struct rte_eth_dev *dev)
{
	struct octeontx_nic *nic;

	nic = octeontx_pmd_priv(dev);
	PMD_INIT_FUNC_TRACE();

	return octeontx_port_stats_clr(nic);
}
799
800 static void
801 octeontx_dev_mac_addr_del(struct rte_eth_dev *dev, uint32_t index)
802 {
803         struct octeontx_nic *nic = octeontx_pmd_priv(dev);
804         int ret;
805
806         ret = octeontx_bgx_port_mac_del(nic->port_id, index);
807         if (ret != 0)
808                 octeontx_log_err("failed to del MAC address filter on port %d",
809                                  nic->port_id);
810 }
811
812 static int
813 octeontx_dev_mac_addr_add(struct rte_eth_dev *dev,
814                           struct rte_ether_addr *mac_addr,
815                           uint32_t index,
816                           __rte_unused uint32_t vmdq)
817 {
818         struct octeontx_nic *nic = octeontx_pmd_priv(dev);
819         int ret;
820
821         ret = octeontx_bgx_port_mac_add(nic->port_id, mac_addr->addr_bytes,
822                                         index);
823         if (ret < 0) {
824                 octeontx_log_err("failed to add MAC address filter on port %d",
825                                  nic->port_id);
826                 return ret;
827         }
828
829         return 0;
830 }
831
832 static int
833 octeontx_dev_default_mac_addr_set(struct rte_eth_dev *dev,
834                                         struct rte_ether_addr *addr)
835 {
836         struct octeontx_nic *nic = octeontx_pmd_priv(dev);
837         int ret;
838
839         ret = octeontx_bgx_port_mac_set(nic->port_id, addr->addr_bytes);
840         if (ret == 0) {
841                 /* Update same mac address to BGX CAM table */
842                 ret = octeontx_bgx_port_mac_add(nic->port_id, addr->addr_bytes,
843                                                 0);
844         }
845         if (ret < 0) {
846                 octeontx_log_err("failed to set MAC address on port %d",
847                                  nic->port_id);
848         }
849
850         return ret;
851 }
852
853 static int
854 octeontx_dev_info(struct rte_eth_dev *dev,
855                 struct rte_eth_dev_info *dev_info)
856 {
857         struct octeontx_nic *nic = octeontx_pmd_priv(dev);
858
859         /* Autonegotiation may be disabled */
860         dev_info->speed_capa = ETH_LINK_SPEED_FIXED;
861         dev_info->speed_capa |= ETH_LINK_SPEED_10M | ETH_LINK_SPEED_100M |
862                         ETH_LINK_SPEED_1G | ETH_LINK_SPEED_10G |
863                         ETH_LINK_SPEED_40G;
864
865         /* Min/Max MTU supported */
866         dev_info->min_rx_bufsize = OCCTX_MIN_FRS;
867         dev_info->max_rx_pktlen = OCCTX_MAX_FRS;
868         dev_info->max_mtu = dev_info->max_rx_pktlen - OCCTX_L2_OVERHEAD;
869         dev_info->min_mtu = dev_info->min_rx_bufsize - OCCTX_L2_OVERHEAD;
870
871         dev_info->max_mac_addrs =
872                                 octeontx_bgx_port_mac_entries_get(nic->port_id);
873         dev_info->max_rx_pktlen = PKI_MAX_PKTLEN;
874         dev_info->max_rx_queues = 1;
875         dev_info->max_tx_queues = PKO_MAX_NUM_DQ;
876         dev_info->min_rx_bufsize = 0;
877
878         dev_info->default_rxconf = (struct rte_eth_rxconf) {
879                 .rx_free_thresh = 0,
880                 .rx_drop_en = 0,
881                 .offloads = OCTEONTX_RX_OFFLOADS,
882         };
883
884         dev_info->default_txconf = (struct rte_eth_txconf) {
885                 .tx_free_thresh = 0,
886                 .offloads = OCTEONTX_TX_OFFLOADS,
887         };
888
889         dev_info->rx_offload_capa = OCTEONTX_RX_OFFLOADS;
890         dev_info->tx_offload_capa = OCTEONTX_TX_OFFLOADS;
891         dev_info->rx_queue_offload_capa = OCTEONTX_RX_OFFLOADS;
892         dev_info->tx_queue_offload_capa = OCTEONTX_TX_OFFLOADS;
893
894         return 0;
895 }
896
897 static void
898 octeontx_dq_info_getter(octeontx_dq_t *dq, void *out)
899 {
900         ((octeontx_dq_t *)out)->lmtline_va = dq->lmtline_va;
901         ((octeontx_dq_t *)out)->ioreg_va = dq->ioreg_va;
902         ((octeontx_dq_t *)out)->fc_status_va = dq->fc_status_va;
903 }
904
905 static int
906 octeontx_vf_start_tx_queue(struct rte_eth_dev *dev, struct octeontx_nic *nic,
907                                 uint16_t qidx)
908 {
909         struct octeontx_txq *txq;
910         int res;
911
912         PMD_INIT_FUNC_TRACE();
913
914         if (dev->data->tx_queue_state[qidx] == RTE_ETH_QUEUE_STATE_STARTED)
915                 return 0;
916
917         txq = dev->data->tx_queues[qidx];
918
919         res = octeontx_pko_channel_query_dqs(nic->base_ochan,
920                                                 &txq->dq,
921                                                 sizeof(octeontx_dq_t),
922                                                 txq->queue_id,
923                                                 octeontx_dq_info_getter);
924         if (res < 0) {
925                 res = -EFAULT;
926                 goto close_port;
927         }
928
929         dev->data->tx_queue_state[qidx] = RTE_ETH_QUEUE_STATE_STARTED;
930         return res;
931
932 close_port:
933         (void)octeontx_port_stop(nic);
934         octeontx_pko_channel_stop(nic->base_ochan);
935         octeontx_pko_channel_close(nic->base_ochan);
936         dev->data->tx_queue_state[qidx] = RTE_ETH_QUEUE_STATE_STOPPED;
937         return res;
938 }
939
940 int
941 octeontx_dev_tx_queue_start(struct rte_eth_dev *dev, uint16_t qidx)
942 {
943         struct octeontx_nic *nic = octeontx_pmd_priv(dev);
944
945         PMD_INIT_FUNC_TRACE();
946         qidx = qidx % PKO_VF_NUM_DQ;
947         return octeontx_vf_start_tx_queue(dev, nic, qidx);
948 }
949
950 static inline int
951 octeontx_vf_stop_tx_queue(struct rte_eth_dev *dev, struct octeontx_nic *nic,
952                           uint16_t qidx)
953 {
954         int ret = 0;
955
956         RTE_SET_USED(nic);
957         PMD_INIT_FUNC_TRACE();
958
959         if (dev->data->tx_queue_state[qidx] == RTE_ETH_QUEUE_STATE_STOPPED)
960                 return 0;
961
962         dev->data->tx_queue_state[qidx] = RTE_ETH_QUEUE_STATE_STOPPED;
963         return ret;
964 }
965
966 int
967 octeontx_dev_tx_queue_stop(struct rte_eth_dev *dev, uint16_t qidx)
968 {
969         struct octeontx_nic *nic = octeontx_pmd_priv(dev);
970
971         PMD_INIT_FUNC_TRACE();
972         qidx = qidx % PKO_VF_NUM_DQ;
973
974         return octeontx_vf_stop_tx_queue(dev, nic, qidx);
975 }
976
977 static void
978 octeontx_dev_tx_queue_release(void *tx_queue)
979 {
980         struct octeontx_txq *txq = tx_queue;
981         int res;
982
983         PMD_INIT_FUNC_TRACE();
984
985         if (txq) {
986                 res = octeontx_dev_tx_queue_stop(txq->eth_dev, txq->queue_id);
987                 if (res < 0)
988                         octeontx_log_err("failed stop tx_queue(%d)\n",
989                                    txq->queue_id);
990
991                 rte_free(txq);
992         }
993 }
994
995 static int
996 octeontx_dev_tx_queue_setup(struct rte_eth_dev *dev, uint16_t qidx,
997                             uint16_t nb_desc, unsigned int socket_id,
998                             const struct rte_eth_txconf *tx_conf __rte_unused)
999 {
1000         struct octeontx_nic *nic = octeontx_pmd_priv(dev);
1001         struct octeontx_txq *txq = NULL;
1002         uint16_t dq_num;
1003         int res = 0;
1004
1005         RTE_SET_USED(nb_desc);
1006         RTE_SET_USED(socket_id);
1007
1008         dq_num = (nic->pko_vfid * PKO_VF_NUM_DQ) + qidx;
1009
1010         /* Socket id check */
1011         if (socket_id != (unsigned int)SOCKET_ID_ANY &&
1012                         socket_id != (unsigned int)nic->node)
1013                 PMD_TX_LOG(INFO, "socket_id expected %d, configured %d",
1014                                                 socket_id, nic->node);
1015
1016         /* Free memory prior to re-allocation if needed. */
1017         if (dev->data->tx_queues[qidx] != NULL) {
1018                 PMD_TX_LOG(DEBUG, "freeing memory prior to re-allocation %d",
1019                                 qidx);
1020                 octeontx_dev_tx_queue_release(dev->data->tx_queues[qidx]);
1021                 dev->data->tx_queues[qidx] = NULL;
1022         }
1023
1024         /* Allocating tx queue data structure */
1025         txq = rte_zmalloc_socket("ethdev TX queue", sizeof(struct octeontx_txq),
1026                                  RTE_CACHE_LINE_SIZE, nic->node);
1027         if (txq == NULL) {
1028                 octeontx_log_err("failed to allocate txq=%d", qidx);
1029                 res = -ENOMEM;
1030                 goto err;
1031         }
1032
1033         txq->eth_dev = dev;
1034         txq->queue_id = dq_num;
1035         dev->data->tx_queues[qidx] = txq;
1036         dev->data->tx_queue_state[qidx] = RTE_ETH_QUEUE_STATE_STOPPED;
1037
1038         res = octeontx_pko_channel_query_dqs(nic->base_ochan,
1039                                                 &txq->dq,
1040                                                 sizeof(octeontx_dq_t),
1041                                                 txq->queue_id,
1042                                                 octeontx_dq_info_getter);
1043         if (res < 0) {
1044                 res = -EFAULT;
1045                 goto err;
1046         }
1047
1048         PMD_TX_LOG(DEBUG, "[%d]:[%d] txq=%p nb_desc=%d lmtline=%p ioreg_va=%p fc_status_va=%p",
1049                         qidx, txq->queue_id, txq, nb_desc, txq->dq.lmtline_va,
1050                         txq->dq.ioreg_va,
1051                         txq->dq.fc_status_va);
1052
1053         return res;
1054
1055 err:
1056         if (txq)
1057                 rte_free(txq);
1058
1059         return res;
1060 }
1061
1062 static int
1063 octeontx_dev_rx_queue_setup(struct rte_eth_dev *dev, uint16_t qidx,
1064                                 uint16_t nb_desc, unsigned int socket_id,
1065                                 const struct rte_eth_rxconf *rx_conf,
1066                                 struct rte_mempool *mb_pool)
1067 {
1068         struct octeontx_nic *nic = octeontx_pmd_priv(dev);
1069         struct rte_mempool_ops *mp_ops = NULL;
1070         struct octeontx_rxq *rxq = NULL;
1071         pki_pktbuf_cfg_t pktbuf_conf;
1072         pki_hash_cfg_t pki_hash;
1073         pki_qos_cfg_t pki_qos;
1074         uintptr_t pool;
1075         int ret, port;
1076         uint16_t gaura;
1077         unsigned int ev_queues = (nic->ev_queues * nic->port_id) + qidx;
1078         unsigned int ev_ports = (nic->ev_ports * nic->port_id) + qidx;
1079
1080         RTE_SET_USED(nb_desc);
1081
1082         memset(&pktbuf_conf, 0, sizeof(pktbuf_conf));
1083         memset(&pki_hash, 0, sizeof(pki_hash));
1084         memset(&pki_qos, 0, sizeof(pki_qos));
1085
1086         mp_ops = rte_mempool_get_ops(mb_pool->ops_index);
1087         if (strcmp(mp_ops->name, "octeontx_fpavf")) {
1088                 octeontx_log_err("failed to find octeontx_fpavf mempool");
1089                 return -ENOTSUP;
1090         }
1091
1092         /* Handle forbidden configurations */
1093         if (nic->pki.classifier_enable) {
1094                 octeontx_log_err("cannot setup queue %d. "
1095                                         "Classifier option unsupported", qidx);
1096                 return -EINVAL;
1097         }
1098
1099         port = nic->port_id;
1100
1101         /* Rx deferred start is not supported */
1102         if (rx_conf->rx_deferred_start) {
1103                 octeontx_log_err("rx deferred start not supported");
1104                 return -EINVAL;
1105         }
1106
1107         /* Verify queue index */
1108         if (qidx >= dev->data->nb_rx_queues) {
1109                 octeontx_log_err("QID %d not supporteded (0 - %d available)\n",
1110                                 qidx, (dev->data->nb_rx_queues - 1));
1111                 return -ENOTSUP;
1112         }
1113
1114         /* Socket id check */
1115         if (socket_id != (unsigned int)SOCKET_ID_ANY &&
1116                         socket_id != (unsigned int)nic->node)
1117                 PMD_RX_LOG(INFO, "socket_id expected %d, configured %d",
1118                                                 socket_id, nic->node);
1119
1120         /* Allocating rx queue data structure */
1121         rxq = rte_zmalloc_socket("ethdev RX queue", sizeof(struct octeontx_rxq),
1122                                  RTE_CACHE_LINE_SIZE, nic->node);
1123         if (rxq == NULL) {
1124                 octeontx_log_err("failed to allocate rxq=%d", qidx);
1125                 return -ENOMEM;
1126         }
1127
1128         if (!nic->pki.initialized) {
1129                 pktbuf_conf.port_type = 0;
1130                 pki_hash.port_type = 0;
1131                 pki_qos.port_type = 0;
1132
1133                 pktbuf_conf.mmask.f_wqe_skip = 1;
1134                 pktbuf_conf.mmask.f_first_skip = 1;
1135                 pktbuf_conf.mmask.f_later_skip = 1;
1136                 pktbuf_conf.mmask.f_mbuff_size = 1;
1137                 pktbuf_conf.mmask.f_cache_mode = 1;
1138
1139                 pktbuf_conf.wqe_skip = OCTTX_PACKET_WQE_SKIP;
1140                 pktbuf_conf.first_skip = OCTTX_PACKET_FIRST_SKIP(mb_pool);
1141                 pktbuf_conf.later_skip = OCTTX_PACKET_LATER_SKIP;
1142                 pktbuf_conf.mbuff_size = (mb_pool->elt_size -
1143                                         RTE_PKTMBUF_HEADROOM -
1144                                         rte_pktmbuf_priv_size(mb_pool) -
1145                                         sizeof(struct rte_mbuf));
1146
1147                 pktbuf_conf.cache_mode = PKI_OPC_MODE_STF2_STT;
1148
1149                 ret = octeontx_pki_port_pktbuf_config(port, &pktbuf_conf);
1150                 if (ret != 0) {
1151                         octeontx_log_err("fail to configure pktbuf for port %d",
1152                                         port);
1153                         rte_free(rxq);
1154                         return ret;
1155                 }
1156                 PMD_RX_LOG(DEBUG, "Port %d Rx pktbuf configured:\n"
1157                                 "\tmbuf_size:\t0x%0x\n"
1158                                 "\twqe_skip:\t0x%0x\n"
1159                                 "\tfirst_skip:\t0x%0x\n"
1160                                 "\tlater_skip:\t0x%0x\n"
1161                                 "\tcache_mode:\t%s\n",
1162                                 port,
1163                                 pktbuf_conf.mbuff_size,
1164                                 pktbuf_conf.wqe_skip,
1165                                 pktbuf_conf.first_skip,
1166                                 pktbuf_conf.later_skip,
1167                                 (pktbuf_conf.cache_mode ==
1168                                                 PKI_OPC_MODE_STT) ?
1169                                 "STT" :
1170                                 (pktbuf_conf.cache_mode ==
1171                                                 PKI_OPC_MODE_STF) ?
1172                                 "STF" :
1173                                 (pktbuf_conf.cache_mode ==
1174                                                 PKI_OPC_MODE_STF1_STT) ?
1175                                 "STF1_STT" : "STF2_STT");
1176
1177                 if (nic->pki.hash_enable) {
1178                         pki_hash.tag_dlc = 1;
1179                         pki_hash.tag_slc = 1;
1180                         pki_hash.tag_dlf = 1;
1181                         pki_hash.tag_slf = 1;
1182                         pki_hash.tag_prt = 1;
1183                         octeontx_pki_port_hash_config(port, &pki_hash);
1184                 }
1185
1186                 pool = (uintptr_t)mb_pool->pool_id;
1187
1188                 /* Get the gaura Id */
1189                 gaura = octeontx_fpa_bufpool_gaura(pool);
1190
1191                 pki_qos.qpg_qos = PKI_QPG_QOS_NONE;
1192                 pki_qos.num_entry = 1;
1193                 pki_qos.drop_policy = 0;
1194                 pki_qos.tag_type = 0L;
1195                 pki_qos.qos_entry[0].port_add = 0;
1196                 pki_qos.qos_entry[0].gaura = gaura;
1197                 pki_qos.qos_entry[0].ggrp_ok = ev_queues;
1198                 pki_qos.qos_entry[0].ggrp_bad = ev_queues;
1199                 pki_qos.qos_entry[0].grptag_bad = 0;
1200                 pki_qos.qos_entry[0].grptag_ok = 0;
1201
1202                 ret = octeontx_pki_port_create_qos(port, &pki_qos);
1203                 if (ret < 0) {
1204                         octeontx_log_err("failed to create QOS port=%d, q=%d",
1205                                         port, qidx);
1206                         rte_free(rxq);
1207                         return ret;
1208                 }
1209                 nic->pki.initialized = true;
1210         }
1211
1212         rxq->port_id = nic->port_id;
1213         rxq->eth_dev = dev;
1214         rxq->queue_id = qidx;
1215         rxq->evdev = nic->evdev;
1216         rxq->ev_queues = ev_queues;
1217         rxq->ev_ports = ev_ports;
1218         rxq->pool = mb_pool;
1219
1220         octeontx_recheck_rx_offloads(rxq);
1221         dev->data->rx_queues[qidx] = rxq;
1222         dev->data->rx_queue_state[qidx] = RTE_ETH_QUEUE_STATE_STOPPED;
1223
1224         return 0;
1225 }
1226
/*
 * Release an Rx queue: the queue structure passed in @rxq is handed
 * straight to rte_free().
 */
static void
octeontx_dev_rx_queue_release(void *rxq)
{
	void *queue = rxq;

	rte_free(queue);
}
1232
1233 static const uint32_t *
1234 octeontx_dev_supported_ptypes_get(struct rte_eth_dev *dev)
1235 {
1236         static const uint32_t ptypes[] = {
1237                 RTE_PTYPE_L3_IPV4,
1238                 RTE_PTYPE_L3_IPV4_EXT,
1239                 RTE_PTYPE_L3_IPV6,
1240                 RTE_PTYPE_L3_IPV6_EXT,
1241                 RTE_PTYPE_L4_TCP,
1242                 RTE_PTYPE_L4_UDP,
1243                 RTE_PTYPE_L4_FRAG,
1244                 RTE_PTYPE_UNKNOWN
1245         };
1246
1247         if (dev->rx_pkt_burst == octeontx_recv_pkts)
1248                 return ptypes;
1249
1250         return NULL;
1251 }
1252
/*
 * Tell whether the mempool ops named @pool can be used with this driver.
 *
 * Returns 0 for "octeontx_fpavf" and -ENOTSUP for any other name.
 * @dev is not used.
 */
static int
octeontx_pool_ops(struct rte_eth_dev *dev, const char *pool)
{
	RTE_SET_USED(dev);

	return (strcmp(pool, "octeontx_fpavf") == 0) ? 0 : -ENOTSUP;
}
1263
1264 /* Initialize and register driver with DPDK Application */
1265 static const struct eth_dev_ops octeontx_dev_ops = {
1266         .dev_configure           = octeontx_dev_configure,
1267         .dev_infos_get           = octeontx_dev_info,
1268         .dev_close               = octeontx_dev_close,
1269         .dev_start               = octeontx_dev_start,
1270         .dev_stop                = octeontx_dev_stop,
1271         .promiscuous_enable      = octeontx_dev_promisc_enable,
1272         .promiscuous_disable     = octeontx_dev_promisc_disable,
1273         .link_update             = octeontx_dev_link_update,
1274         .stats_get               = octeontx_dev_stats_get,
1275         .stats_reset             = octeontx_dev_stats_reset,
1276         .mac_addr_remove         = octeontx_dev_mac_addr_del,
1277         .mac_addr_add            = octeontx_dev_mac_addr_add,
1278         .mac_addr_set            = octeontx_dev_default_mac_addr_set,
1279         .vlan_offload_set        = octeontx_dev_vlan_offload_set,
1280         .vlan_filter_set         = octeontx_dev_vlan_filter_set,
1281         .tx_queue_start          = octeontx_dev_tx_queue_start,
1282         .tx_queue_stop           = octeontx_dev_tx_queue_stop,
1283         .tx_queue_setup          = octeontx_dev_tx_queue_setup,
1284         .tx_queue_release        = octeontx_dev_tx_queue_release,
1285         .rx_queue_setup          = octeontx_dev_rx_queue_setup,
1286         .rx_queue_release        = octeontx_dev_rx_queue_release,
1287         .dev_set_link_up          = octeontx_dev_set_link_up,
1288         .dev_set_link_down        = octeontx_dev_set_link_down,
1289         .dev_supported_ptypes_get = octeontx_dev_supported_ptypes_get,
1290         .mtu_set                 = octeontx_dev_mtu_set,
1291         .pool_ops_supported      = octeontx_pool_ops,
1292         .flow_ctrl_get           = octeontx_dev_flow_ctrl_get,
1293         .flow_ctrl_set           = octeontx_dev_flow_ctrl_set,
1294 };
1295
1296 /* Create Ethdev interface per BGX LMAC ports */
1297 static int
1298 octeontx_create(struct rte_vdev_device *dev, int port, uint8_t evdev,
1299                         int socket_id)
1300 {
1301         int res;
1302         size_t pko_vfid;
1303         char octtx_name[OCTEONTX_MAX_NAME_LEN];
1304         struct octeontx_nic *nic = NULL;
1305         struct rte_eth_dev *eth_dev = NULL;
1306         struct rte_eth_dev_data *data;
1307         const char *name = rte_vdev_device_name(dev);
1308         int max_entries;
1309
1310         PMD_INIT_FUNC_TRACE();
1311
1312         sprintf(octtx_name, "%s_%d", name, port);
1313         if (rte_eal_process_type() != RTE_PROC_PRIMARY) {
1314                 eth_dev = rte_eth_dev_attach_secondary(octtx_name);
1315                 if (eth_dev == NULL)
1316                         return -ENODEV;
1317
1318                 eth_dev->dev_ops = &octeontx_dev_ops;
1319                 eth_dev->device = &dev->device;
1320                 octeontx_set_tx_function(eth_dev);
1321                 eth_dev->rx_pkt_burst = octeontx_recv_pkts;
1322                 rte_eth_dev_probing_finish(eth_dev);
1323                 return 0;
1324         }
1325
1326         /* Reserve an ethdev entry */
1327         eth_dev = rte_eth_dev_allocate(octtx_name);
1328         if (eth_dev == NULL) {
1329                 octeontx_log_err("failed to allocate rte_eth_dev");
1330                 res = -ENOMEM;
1331                 goto err;
1332         }
1333         data = eth_dev->data;
1334
1335         nic = rte_zmalloc_socket(octtx_name, sizeof(*nic), 0, socket_id);
1336         if (nic == NULL) {
1337                 octeontx_log_err("failed to allocate nic structure");
1338                 res = -ENOMEM;
1339                 goto err;
1340         }
1341         data->dev_private = nic;
1342         pko_vfid = octeontx_pko_get_vfid();
1343
1344         if (pko_vfid == SIZE_MAX) {
1345                 octeontx_log_err("failed to get pko vfid");
1346                 res = -ENODEV;
1347                 goto err;
1348         }
1349
1350         nic->pko_vfid = pko_vfid;
1351         nic->port_id = port;
1352         nic->evdev = evdev;
1353
1354         res = octeontx_port_open(nic);
1355         if (res < 0)
1356                 goto err;
1357
1358         /* Rx side port configuration */
1359         res = octeontx_pki_port_open(port);
1360         if (res != 0) {
1361                 octeontx_log_err("failed to open PKI port %d", port);
1362                 res = -ENODEV;
1363                 goto err;
1364         }
1365
1366         eth_dev->device = &dev->device;
1367         eth_dev->intr_handle = NULL;
1368         eth_dev->data->numa_node = dev->device.numa_node;
1369
1370         data->port_id = eth_dev->data->port_id;
1371
1372         nic->ev_queues = 1;
1373         nic->ev_ports = 1;
1374         nic->print_flag = -1;
1375
1376         data->dev_link.link_status = ETH_LINK_DOWN;
1377         data->dev_started = 0;
1378         data->promiscuous = 0;
1379         data->all_multicast = 0;
1380         data->scattered_rx = 0;
1381
1382         /* Get maximum number of supported MAC entries */
1383         max_entries = octeontx_bgx_port_mac_entries_get(nic->port_id);
1384         if (max_entries < 0) {
1385                 octeontx_log_err("Failed to get max entries for mac addr");
1386                 res = -ENOTSUP;
1387                 goto err;
1388         }
1389
1390         data->mac_addrs = rte_zmalloc_socket(octtx_name, max_entries *
1391                                              RTE_ETHER_ADDR_LEN, 0,
1392                                                         socket_id);
1393         if (data->mac_addrs == NULL) {
1394                 octeontx_log_err("failed to allocate memory for mac_addrs");
1395                 res = -ENOMEM;
1396                 goto err;
1397         }
1398
1399         eth_dev->dev_ops = &octeontx_dev_ops;
1400
1401         /* Finally save ethdev pointer to the NIC structure */
1402         nic->dev = eth_dev;
1403
1404         if (nic->port_id != data->port_id) {
1405                 octeontx_log_err("eth_dev->port_id (%d) is diff to orig (%d)",
1406                                 data->port_id, nic->port_id);
1407                 res = -EINVAL;
1408                 goto free_mac_addrs;
1409         }
1410
1411         res = rte_eal_alarm_set(OCCTX_INTR_POLL_INTERVAL_MS * 1000,
1412                                 octeontx_link_status_poll, nic);
1413         if (res) {
1414                 octeontx_log_err("Failed to start link polling alarm");
1415                 goto err;
1416         }
1417
1418         /* Update port_id mac to eth_dev */
1419         memcpy(data->mac_addrs, nic->mac_addr, RTE_ETHER_ADDR_LEN);
1420
1421         /* Update same mac address to BGX CAM table at index 0 */
1422         octeontx_bgx_port_mac_add(nic->port_id, nic->mac_addr, 0);
1423
1424         res = octeontx_dev_flow_ctrl_init(eth_dev);
1425         if (res < 0)
1426                 goto err;
1427
1428         PMD_INIT_LOG(DEBUG, "ethdev info: ");
1429         PMD_INIT_LOG(DEBUG, "port %d, port_ena %d ochan %d num_ochan %d tx_q %d",
1430                                 nic->port_id, nic->port_ena,
1431                                 nic->base_ochan, nic->num_ochans,
1432                                 nic->num_tx_queues);
1433         PMD_INIT_LOG(DEBUG, "speed %d mtu %d", nic->speed, nic->bgx_mtu);
1434
1435         rte_octeontx_pchan_map[(nic->base_ochan >> 8) & 0x7]
1436                 [(nic->base_ochan >> 4) & 0xF] = data->port_id;
1437
1438         rte_eth_dev_probing_finish(eth_dev);
1439         return data->port_id;
1440
1441 free_mac_addrs:
1442         rte_free(data->mac_addrs);
1443         data->mac_addrs = NULL;
1444 err:
1445         if (nic)
1446                 octeontx_port_close(nic);
1447
1448         rte_eth_dev_release_port(eth_dev);
1449
1450         return res;
1451 }
1452
1453 /* Un initialize octeontx device */
1454 static int
1455 octeontx_remove(struct rte_vdev_device *dev)
1456 {
1457         char octtx_name[OCTEONTX_MAX_NAME_LEN];
1458         struct rte_eth_dev *eth_dev = NULL;
1459         struct octeontx_nic *nic = NULL;
1460         int i;
1461
1462         if (dev == NULL)
1463                 return -EINVAL;
1464
1465         for (i = 0; i < OCTEONTX_VDEV_DEFAULT_MAX_NR_PORT; i++) {
1466                 sprintf(octtx_name, "eth_octeontx_%d", i);
1467
1468                 /* reserve an ethdev entry */
1469                 eth_dev = rte_eth_dev_allocated(octtx_name);
1470                 if (eth_dev == NULL)
1471                         return -ENODEV;
1472
1473                 if (rte_eal_process_type() != RTE_PROC_PRIMARY) {
1474                         rte_eth_dev_release_port(eth_dev);
1475                         continue;
1476                 }
1477
1478                 nic = octeontx_pmd_priv(eth_dev);
1479                 rte_event_dev_stop(nic->evdev);
1480                 PMD_INIT_LOG(INFO, "Closing octeontx device %s", octtx_name);
1481
1482                 rte_eth_dev_release_port(eth_dev);
1483                 rte_event_dev_close(nic->evdev);
1484         }
1485
1486         if (rte_eal_process_type() != RTE_PROC_PRIMARY)
1487                 return 0;
1488
1489         /* Free FC resource */
1490         octeontx_pko_fc_free();
1491
1492         return 0;
1493 }
1494
1495 /* Initialize octeontx device */
1496 static int
1497 octeontx_probe(struct rte_vdev_device *dev)
1498 {
1499         const char *dev_name;
1500         static int probe_once;
1501         uint8_t socket_id, qlist;
1502         int tx_vfcnt, port_id, evdev, qnum, pnum, res, i;
1503         struct rte_event_dev_config dev_conf;
1504         const char *eventdev_name = "event_octeontx";
1505         struct rte_event_dev_info info;
1506         struct rte_eth_dev *eth_dev;
1507
1508         struct octeontx_vdev_init_params init_params = {
1509                 OCTEONTX_VDEV_DEFAULT_MAX_NR_PORT
1510         };
1511
1512         dev_name = rte_vdev_device_name(dev);
1513
1514         if (rte_eal_process_type() == RTE_PROC_SECONDARY &&
1515             strlen(rte_vdev_device_args(dev)) == 0) {
1516                 eth_dev = rte_eth_dev_attach_secondary(dev_name);
1517                 if (!eth_dev) {
1518                         PMD_INIT_LOG(ERR, "Failed to probe %s", dev_name);
1519                         return -1;
1520                 }
1521                 /* TODO: request info from primary to set up Rx and Tx */
1522                 eth_dev->dev_ops = &octeontx_dev_ops;
1523                 eth_dev->device = &dev->device;
1524                 rte_eth_dev_probing_finish(eth_dev);
1525                 return 0;
1526         }
1527
1528         res = octeontx_parse_vdev_init_params(&init_params, dev);
1529         if (res < 0)
1530                 return -EINVAL;
1531
1532         if (init_params.nr_port > OCTEONTX_VDEV_DEFAULT_MAX_NR_PORT) {
1533                 octeontx_log_err("nr_port (%d) > max (%d)", init_params.nr_port,
1534                                 OCTEONTX_VDEV_DEFAULT_MAX_NR_PORT);
1535                 return -ENOTSUP;
1536         }
1537
1538         PMD_INIT_LOG(DEBUG, "initializing %s pmd", dev_name);
1539
1540         socket_id = rte_socket_id();
1541
1542         tx_vfcnt = octeontx_pko_vf_count();
1543
1544         if (tx_vfcnt < init_params.nr_port) {
1545                 octeontx_log_err("not enough PKO (%d) for port number (%d)",
1546                                 tx_vfcnt, init_params.nr_port);
1547                 return -EINVAL;
1548         }
1549         evdev = rte_event_dev_get_dev_id(eventdev_name);
1550         if (evdev < 0) {
1551                 octeontx_log_err("eventdev %s not found", eventdev_name);
1552                 return -ENODEV;
1553         }
1554
1555         res = rte_event_dev_info_get(evdev, &info);
1556         if (res < 0) {
1557                 octeontx_log_err("failed to eventdev info %d", res);
1558                 return -EINVAL;
1559         }
1560
1561         PMD_INIT_LOG(DEBUG, "max_queue %d max_port %d",
1562                         info.max_event_queues, info.max_event_ports);
1563
1564         if (octeontx_pko_init_fc(tx_vfcnt))
1565                 return -ENOMEM;
1566
1567         devconf_set_default_sane_values(&dev_conf, &info);
1568         res = rte_event_dev_configure(evdev, &dev_conf);
1569         if (res < 0)
1570                 goto parse_error;
1571
1572         rte_event_dev_attr_get(evdev, RTE_EVENT_DEV_ATTR_PORT_COUNT,
1573                         (uint32_t *)&pnum);
1574         rte_event_dev_attr_get(evdev, RTE_EVENT_DEV_ATTR_QUEUE_COUNT,
1575                         (uint32_t *)&qnum);
1576         if (pnum < qnum) {
1577                 octeontx_log_err("too few event ports (%d) for event_q(%d)",
1578                                 pnum, qnum);
1579                 res = -EINVAL;
1580                 goto parse_error;
1581         }
1582
1583         /* Enable all queues available */
1584         for (i = 0; i < qnum; i++) {
1585                 res = rte_event_queue_setup(evdev, i, NULL);
1586                 if (res < 0) {
1587                         octeontx_log_err("failed to setup event_q(%d): res %d",
1588                                         i, res);
1589                         goto parse_error;
1590                 }
1591         }
1592
1593         /* Enable all ports available */
1594         for (i = 0; i < pnum; i++) {
1595                 res = rte_event_port_setup(evdev, i, NULL);
1596                 if (res < 0) {
1597                         res = -ENODEV;
1598                         octeontx_log_err("failed to setup ev port(%d) res=%d",
1599                                                 i, res);
1600                         goto parse_error;
1601                 }
1602         }
1603
1604         /*
1605          * Do 1:1 links for ports & queues. All queues would be mapped to
1606          * one port. If there are more ports than queues, then some ports
1607          * won't be linked to any queue.
1608          */
1609         for (i = 0; i < qnum; i++) {
1610                 /* Link one queue to one event port */
1611                 qlist = i;
1612                 res = rte_event_port_link(evdev, i, &qlist, NULL, 1);
1613                 if (res < 0) {
1614                         res = -ENODEV;
1615                         octeontx_log_err("failed to link port (%d): res=%d",
1616                                         i, res);
1617                         goto parse_error;
1618                 }
1619         }
1620
1621         /* Create ethdev interface */
1622         for (i = 0; i < init_params.nr_port; i++) {
1623                 port_id = octeontx_create(dev, i, evdev, socket_id);
1624                 if (port_id < 0) {
1625                         octeontx_log_err("failed to create device %s",
1626                                         dev_name);
1627                         res = -ENODEV;
1628                         goto parse_error;
1629                 }
1630
1631                 PMD_INIT_LOG(INFO, "created ethdev %s for port %d", dev_name,
1632                                         port_id);
1633         }
1634
1635         if (probe_once) {
1636                 octeontx_log_err("interface %s not supported", dev_name);
1637                 octeontx_remove(dev);
1638                 res = -ENOTSUP;
1639                 goto parse_error;
1640         }
1641         rte_mbuf_set_platform_mempool_ops("octeontx_fpavf");
1642         probe_once = 1;
1643
1644         return 0;
1645
1646 parse_error:
1647         octeontx_pko_fc_free();
1648         return res;
1649 }
1650
1651 static struct rte_vdev_driver octeontx_pmd_drv = {
1652         .probe = octeontx_probe,
1653         .remove = octeontx_remove,
1654 };
1655
1656 RTE_PMD_REGISTER_VDEV(OCTEONTX_PMD, octeontx_pmd_drv);
1657 RTE_PMD_REGISTER_ALIAS(OCTEONTX_PMD, eth_octeontx);
1658 RTE_PMD_REGISTER_PARAM_STRING(OCTEONTX_PMD, "nr_port=<int> ");