/* SPDX-License-Identifier: (BSD-3-Clause OR GPL-2.0)
 * Copyright(c) 2018-2019 Pensando Systems, Inc. All rights reserved.
 */

#include <sys/queue.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <errno.h>
#include <stdint.h>
#include <stdarg.h>
#include <unistd.h>
#include <inttypes.h>

#include <rte_byteorder.h>
#include <rte_common.h>
#include <rte_cycles.h>
#include <rte_log.h>
#include <rte_debug.h>
#include <rte_interrupts.h>
#include <rte_pci.h>
#include <rte_memory.h>
#include <rte_memzone.h>
#include <rte_launch.h>
#include <rte_eal.h>
#include <rte_per_lcore.h>
#include <rte_lcore.h>
#include <rte_atomic.h>
#include <rte_branch_prediction.h>
#include <rte_mempool.h>
#include <rte_malloc.h>
#include <rte_mbuf.h>
#include <rte_ether.h>
#include <rte_ethdev_driver.h>
#include <rte_prefetch.h>
#include <rte_udp.h>
#include <rte_tcp.h>
#include <rte_sctp.h>
#include <rte_string_fns.h>
#include <rte_errno.h>
#include <rte_ip.h>
#include <rte_net.h>

#include "ionic_logs.h"
#include "ionic_mac_api.h"
#include "ionic_ethdev.h"
#include "ionic_lif.h"
#include "ionic_rxtx.h"

#define IONIC_RX_RING_DOORBELL_STRIDE           (32 - 1)

/*********************************************************************
 *
 *  TX functions
 *
 **********************************************************************/

void
ionic_txq_info_get(struct rte_eth_dev *dev, uint16_t queue_id,
                struct rte_eth_txq_info *qinfo)
{
        struct ionic_qcq *txq = dev->data->tx_queues[queue_id];
        struct ionic_queue *q = &txq->q;

        qinfo->nb_desc = q->num_descs;
        qinfo->conf.offloads = txq->offloads;
        qinfo->conf.tx_deferred_start = txq->flags & IONIC_QCQ_F_DEFERRED;
}

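/*
 * Walk the completion ring, advance the queue tail past all
 * descriptors the hardware has marked complete, and free the
 * transmitted mbuf chains recorded in the queue info array.
 */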
static inline void __rte_cold
ionic_tx_flush(struct ionic_cq *cq)
{
        struct ionic_queue *q = cq->bound_q;
        struct ionic_desc_info *q_desc_info;
        struct rte_mbuf *txm, *next;
        struct ionic_txq_comp *cq_desc_base = cq->base;
        struct ionic_txq_comp *cq_desc;
        uint32_t comp_index = (uint32_t)-1;

        cq_desc = &cq_desc_base[cq->tail_idx];
        while (color_match(cq_desc->color, cq->done_color)) {
                cq->tail_idx = (cq->tail_idx + 1) & (cq->num_descs - 1);

                /* Prefetch the next 4 descriptors (not really useful here) */
                if ((cq->tail_idx & 0x3) == 0)
                        rte_prefetch0(&cq_desc_base[cq->tail_idx]);

                if (cq->tail_idx == 0)
                        cq->done_color = !cq->done_color;

                comp_index = cq_desc->comp_index;

                cq_desc = &cq_desc_base[cq->tail_idx];
        }

        if (comp_index != (uint32_t)-1) {
                while (q->tail_idx != comp_index) {
                        q_desc_info = &q->info[q->tail_idx];

                        q->tail_idx = (q->tail_idx + 1) & (q->num_descs - 1);

                        /* Prefetch the next 4 descriptors */
                        if ((q->tail_idx & 0x3) == 0)
                                /* q desc info */
                                rte_prefetch0(&q->info[q->tail_idx]);

                        /*
                         * Note: you can just use rte_pktmbuf_free,
                         * but this loop is faster
                         */
                        txm = q_desc_info->cb_arg;
                        while (txm != NULL) {
                                next = txm->next;
                                rte_pktmbuf_free_seg(txm);
                                txm = next;
                        }
                }
        }
}

void __rte_cold
ionic_dev_tx_queue_release(void *tx_queue)
{
        struct ionic_qcq *txq = (struct ionic_qcq *)tx_queue;

        IONIC_PRINT_CALL();

        ionic_qcq_free(txq);
}

int __rte_cold
ionic_dev_tx_queue_stop(struct rte_eth_dev *eth_dev, uint16_t tx_queue_id)
{
        struct ionic_qcq *txq;

        IONIC_PRINT(DEBUG, "Stopping TX queue %u", tx_queue_id);

        txq = eth_dev->data->tx_queues[tx_queue_id];

        /*
         * Note: it would be better to post a NOP Tx descriptor and
         * wait for its completion before disabling the Tx queue
         */

        ionic_qcq_disable(txq);

        ionic_tx_flush(&txq->cq);

        ionic_lif_txq_deinit(txq);

        eth_dev->data->tx_queue_state[tx_queue_id] =
                RTE_ETH_QUEUE_STATE_STOPPED;

        return 0;
}

int __rte_cold
ionic_dev_tx_queue_setup(struct rte_eth_dev *eth_dev, uint16_t tx_queue_id,
                uint16_t nb_desc, uint32_t socket_id,
                const struct rte_eth_txconf *tx_conf)
{
        struct ionic_lif *lif = IONIC_ETH_DEV_TO_LIF(eth_dev);
        struct ionic_qcq *txq;
        uint64_t offloads;
        int err;

        if (tx_queue_id >= lif->ntxqcqs) {
                IONIC_PRINT(ERR, "Queue index %u not available "
                        "(max %u queues)",
                        tx_queue_id, lif->ntxqcqs);
                return -EINVAL;
        }

        offloads = tx_conf->offloads | eth_dev->data->dev_conf.txmode.offloads;
        IONIC_PRINT(DEBUG,
                "Configuring skt %u TX queue %u with %u buffers, offloads %jx",
                socket_id, tx_queue_id, nb_desc, offloads);

        /* Validate number of transmit descriptors */
        if (!rte_is_power_of_2(nb_desc) ||
                        nb_desc < IONIC_MIN_RING_DESC ||
                        nb_desc > IONIC_MAX_RING_DESC)
                return -EINVAL; /* or use IONIC_DEFAULT_RING_DESC */

        /* Free memory prior to re-allocation if needed... */
        if (eth_dev->data->tx_queues[tx_queue_id] != NULL) {
                void *tx_queue = eth_dev->data->tx_queues[tx_queue_id];
                ionic_dev_tx_queue_release(tx_queue);
                eth_dev->data->tx_queues[tx_queue_id] = NULL;
        }

        err = ionic_tx_qcq_alloc(lif, tx_queue_id, nb_desc, &txq);
        if (err) {
                IONIC_PRINT(ERR, "Queue allocation failure");
                return -EINVAL;
        }

        /* Do not start queue with rte_eth_dev_start() */
        if (tx_conf->tx_deferred_start)
                txq->flags |= IONIC_QCQ_F_DEFERRED;

        txq->offloads = offloads;

        eth_dev->data->tx_queues[tx_queue_id] = txq;

        return 0;
}

/*
 * Start Transmit Units for specified queue.
 */
int __rte_cold
ionic_dev_tx_queue_start(struct rte_eth_dev *eth_dev, uint16_t tx_queue_id)
{
        struct ionic_qcq *txq;
        int err;

        txq = eth_dev->data->tx_queues[tx_queue_id];

        IONIC_PRINT(DEBUG, "Starting TX queue %u, %u descs",
                tx_queue_id, txq->q.num_descs);

        err = ionic_lif_txq_init(txq);
        if (err)
                return err;

        ionic_qcq_enable(txq);

        eth_dev->data->tx_queue_state[tx_queue_id] =
                RTE_ETH_QUEUE_STATE_STARTED;

        return 0;
}

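/*
 * Seed the TCP checksum field with the IPv4/IPv6 pseudo-header sum
 * (computed with the IP length set to zero) so the hardware can
 * finish the checksum for each segment it produces.
 */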
static void
ionic_tx_tcp_pseudo_csum(struct rte_mbuf *txm)
{
        struct rte_ether_hdr *eth_hdr = rte_pktmbuf_mtod(txm,
                struct rte_ether_hdr *);
        char *l3_hdr = ((char *)eth_hdr) + txm->l2_len;
        struct rte_tcp_hdr *tcp_hdr = (struct rte_tcp_hdr *)
                (l3_hdr + txm->l3_len);

        if (txm->ol_flags & PKT_TX_IP_CKSUM) {
                struct rte_ipv4_hdr *ipv4_hdr = (struct rte_ipv4_hdr *)l3_hdr;
                ipv4_hdr->hdr_checksum = 0;
                tcp_hdr->cksum = 0;
                tcp_hdr->cksum = rte_ipv4_udptcp_cksum(ipv4_hdr, tcp_hdr);
        } else {
                struct rte_ipv6_hdr *ipv6_hdr = (struct rte_ipv6_hdr *)l3_hdr;
                tcp_hdr->cksum = 0;
                tcp_hdr->cksum = rte_ipv6_udptcp_cksum(ipv6_hdr, tcp_hdr);
        }
}

static void
ionic_tx_tcp_inner_pseudo_csum(struct rte_mbuf *txm)
{
        struct rte_ether_hdr *eth_hdr = rte_pktmbuf_mtod(txm,
                struct rte_ether_hdr *);
        char *l3_hdr = ((char *)eth_hdr) + txm->outer_l2_len +
                txm->outer_l3_len + txm->l2_len;
        struct rte_tcp_hdr *tcp_hdr = (struct rte_tcp_hdr *)
                (l3_hdr + txm->l3_len);

        if (txm->ol_flags & PKT_TX_IPV4) {
                struct rte_ipv4_hdr *ipv4_hdr = (struct rte_ipv4_hdr *)l3_hdr;
                ipv4_hdr->hdr_checksum = 0;
                tcp_hdr->cksum = 0;
                tcp_hdr->cksum = rte_ipv4_udptcp_cksum(ipv4_hdr, tcp_hdr);
        } else {
                struct rte_ipv6_hdr *ipv6_hdr = (struct rte_ipv6_hdr *)l3_hdr;
                tcp_hdr->cksum = 0;
                tcp_hdr->cksum = rte_ipv6_udptcp_cksum(ipv6_hdr, tcp_hdr);
        }
}

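/*
 * Fill in one TSO descriptor and post it to the queue. The mbuf is
 * attached as the completion callback argument only on the final
 * descriptor of the packet, so it is freed exactly once.
 */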
static void
ionic_tx_tso_post(struct ionic_queue *q, struct ionic_txq_desc *desc,
                struct rte_mbuf *txm,
                rte_iova_t addr, uint8_t nsge, uint16_t len,
                uint32_t hdrlen, uint32_t mss,
                bool encap,
                uint16_t vlan_tci, bool has_vlan,
                bool start, bool done)
{
        uint8_t flags = 0;
        flags |= has_vlan ? IONIC_TXQ_DESC_FLAG_VLAN : 0;
        flags |= encap ? IONIC_TXQ_DESC_FLAG_ENCAP : 0;
        flags |= start ? IONIC_TXQ_DESC_FLAG_TSO_SOT : 0;
        flags |= done ? IONIC_TXQ_DESC_FLAG_TSO_EOT : 0;

        desc->cmd = encode_txq_desc_cmd(IONIC_TXQ_DESC_OPCODE_TSO,
                flags, nsge, addr);
        desc->len = len;
        desc->vlan_tci = vlan_tci;
        desc->hdr_len = hdrlen;
        desc->mss = mss;

        ionic_q_post(q, done, NULL, done ? txm : NULL);
}

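/* Return the next TSO descriptor and its scatter-gather element list */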
static struct ionic_txq_desc *
ionic_tx_tso_next(struct ionic_queue *q, struct ionic_txq_sg_elem **elem)
{
        struct ionic_txq_desc *desc_base = q->base;
        struct ionic_txq_sg_desc *sg_desc_base = q->sg_base;
        struct ionic_txq_desc *desc = &desc_base[q->head_idx];
        struct ionic_txq_sg_desc *sg_desc = &sg_desc_base[q->head_idx];

        *elem = sg_desc->elems;
        return desc;
}

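/*
 * Segment a TSO packet into MSS-sized chunks: the first loop carves
 * descriptors out of the head mbuf, the second spreads the chained
 * mbuf frags across descriptors and SG elements, starting a fresh
 * descriptor whenever the current MSS window (frag_left) is consumed.
 */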
static int
ionic_tx_tso(struct ionic_queue *q, struct rte_mbuf *txm,
                uint64_t offloads __rte_unused, bool not_xmit_more)
{
        struct ionic_tx_stats *stats = IONIC_Q_TO_TX_STATS(q);
        struct ionic_txq_desc *desc;
        struct ionic_txq_sg_elem *elem;
        struct rte_mbuf *txm_seg;
        uint64_t desc_addr = 0;
        uint16_t desc_len = 0;
        uint8_t desc_nsge;
        uint32_t hdrlen;
        uint32_t mss = txm->tso_segsz;
        uint32_t frag_left = 0;
        uint32_t left;
        uint32_t seglen;
        uint32_t len;
        uint32_t offset = 0;
        bool start, done;
        bool encap;
        bool has_vlan = !!(txm->ol_flags & PKT_TX_VLAN_PKT);
        uint16_t vlan_tci = txm->vlan_tci;
        uint64_t ol_flags = txm->ol_flags;

        encap = ((ol_flags & PKT_TX_OUTER_IP_CKSUM) ||
                (ol_flags & PKT_TX_OUTER_UDP_CKSUM)) &&
                ((ol_flags & PKT_TX_OUTER_IPV4) ||
                (ol_flags & PKT_TX_OUTER_IPV6));

        /* Preload inner-most TCP csum field with IP pseudo hdr
         * calculated with IP length set to zero.  HW will later
         * add in length to each TCP segment resulting from the TSO.
         */

        if (encap) {
                ionic_tx_tcp_inner_pseudo_csum(txm);
                hdrlen = txm->outer_l2_len + txm->outer_l3_len +
                        txm->l2_len + txm->l3_len + txm->l4_len;
        } else {
                ionic_tx_tcp_pseudo_csum(txm);
                hdrlen = txm->l2_len + txm->l3_len + txm->l4_len;
        }

        seglen = hdrlen + mss;
        left = txm->data_len;

        desc = ionic_tx_tso_next(q, &elem);
        start = true;

        /* Chop data up into desc segments */

        while (left > 0) {
                len = RTE_MIN(seglen, left);
                frag_left = seglen - len;
                desc_addr = rte_cpu_to_le_64(rte_mbuf_data_iova_default(txm));
                desc_len = len;
                desc_nsge = 0;
                left -= len;
                offset += len;
                if (txm->nb_segs > 1 && frag_left > 0)
                        continue;
                done = (txm->nb_segs == 1 && left == 0);
                ionic_tx_tso_post(q, desc, txm,
                        desc_addr, desc_nsge, desc_len,
                        hdrlen, mss,
                        encap,
                        vlan_tci, has_vlan,
                        start, done && not_xmit_more);
                desc = ionic_tx_tso_next(q, &elem);
                start = false;
                seglen = mss;
        }

        /* Chop frags into desc segments */

        txm_seg = txm->next;
        while (txm_seg != NULL) {
                offset = 0;
                left = txm_seg->data_len;
                stats->frags++;

                while (left > 0) {
                        rte_iova_t data_iova;
                        data_iova = rte_mbuf_data_iova(txm_seg);
                        elem->addr = rte_cpu_to_le_64(data_iova) + offset;
                        if (frag_left > 0) {
                                len = RTE_MIN(frag_left, left);
                                frag_left -= len;
                                elem->len = len;
                                elem++;
                                desc_nsge++;
                        } else {
                                len = RTE_MIN(mss, left);
                                frag_left = mss - len;
                                data_iova = rte_mbuf_data_iova(txm_seg);
                                desc_addr = rte_cpu_to_le_64(data_iova);
                                desc_len = len;
                                desc_nsge = 0;
                        }
                        left -= len;
                        offset += len;
                        if (txm_seg->next != NULL && frag_left > 0)
                                continue;
                        done = (txm_seg->next == NULL && left == 0);
                        ionic_tx_tso_post(q, desc, txm_seg,
                                desc_addr, desc_nsge, desc_len,
                                hdrlen, mss,
                                encap,
                                vlan_tci, has_vlan,
                                start, done && not_xmit_more);
                        desc = ionic_tx_tso_next(q, &elem);
                        start = false;
                }

                txm_seg = txm_seg->next;
        }

        stats->tso++;

        return 0;
}

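/*
 * Post a single non-TSO packet: build one descriptor for the head
 * mbuf, request L3/L4 checksum offload as allowed by the configured
 * offloads, and place any chained mbufs in the SG element list.
 */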
static int
ionic_tx(struct ionic_queue *q, struct rte_mbuf *txm,
                uint64_t offloads, bool not_xmit_more)
{
        struct ionic_txq_desc *desc_base = q->base;
        struct ionic_txq_sg_desc *sg_desc_base = q->sg_base;
        struct ionic_txq_desc *desc = &desc_base[q->head_idx];
        struct ionic_txq_sg_desc *sg_desc = &sg_desc_base[q->head_idx];
        struct ionic_txq_sg_elem *elem = sg_desc->elems;
        struct ionic_tx_stats *stats = IONIC_Q_TO_TX_STATS(q);
        struct rte_mbuf *txm_seg;
        bool encap;
        bool has_vlan;
        uint64_t ol_flags = txm->ol_flags;
        uint64_t addr = rte_cpu_to_le_64(rte_mbuf_data_iova_default(txm));
        uint8_t opcode = IONIC_TXQ_DESC_OPCODE_CSUM_NONE;
        uint8_t flags = 0;

        if ((ol_flags & PKT_TX_IP_CKSUM) &&
                        (offloads & DEV_TX_OFFLOAD_IPV4_CKSUM)) {
                opcode = IONIC_TXQ_DESC_OPCODE_CSUM_HW;
                flags |= IONIC_TXQ_DESC_FLAG_CSUM_L3;
                if (((ol_flags & PKT_TX_TCP_CKSUM) &&
                                (offloads & DEV_TX_OFFLOAD_TCP_CKSUM)) ||
                                ((ol_flags & PKT_TX_UDP_CKSUM) &&
                                (offloads & DEV_TX_OFFLOAD_UDP_CKSUM)))
                        flags |= IONIC_TXQ_DESC_FLAG_CSUM_L4;
        } else {
                stats->no_csum++;
        }

        has_vlan = (ol_flags & PKT_TX_VLAN_PKT);
        encap = ((ol_flags & PKT_TX_OUTER_IP_CKSUM) ||
                        (ol_flags & PKT_TX_OUTER_UDP_CKSUM)) &&
                        ((ol_flags & PKT_TX_OUTER_IPV4) ||
                        (ol_flags & PKT_TX_OUTER_IPV6));

        flags |= has_vlan ? IONIC_TXQ_DESC_FLAG_VLAN : 0;
        flags |= encap ? IONIC_TXQ_DESC_FLAG_ENCAP : 0;

        desc->cmd = encode_txq_desc_cmd(opcode, flags, txm->nb_segs - 1, addr);
        desc->len = txm->data_len;
        desc->vlan_tci = txm->vlan_tci;

        txm_seg = txm->next;
        while (txm_seg != NULL) {
                elem->len = txm_seg->data_len;
                elem->addr = rte_cpu_to_le_64(rte_mbuf_data_iova(txm_seg));
                stats->frags++;
                elem++;
                txm_seg = txm_seg->next;
        }

        ionic_q_post(q, not_xmit_more, NULL, txm);

        return 0;
}

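/*
 * Burst transmit: reclaim completed buffers first, refuse the burst
 * outright if the ring lacks space for all packets, then post each
 * packet, ringing the doorbell only on the last one (or on error).
 */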
uint16_t
ionic_xmit_pkts(void *tx_queue, struct rte_mbuf **tx_pkts,
                uint16_t nb_pkts)
{
        struct ionic_qcq *txq = (struct ionic_qcq *)tx_queue;
        struct ionic_queue *q = &txq->q;
        struct ionic_cq *cq = &txq->cq;
        struct ionic_tx_stats *stats = IONIC_Q_TO_TX_STATS(q);
        uint32_t next_q_head_idx;
        uint32_t bytes_tx = 0;
        uint16_t nb_tx = 0;
        int err;
        bool last;

        /* Cleaning old buffers */
        ionic_tx_flush(cq);

        if (unlikely(ionic_q_space_avail(q) < nb_pkts)) {
                stats->stop += nb_pkts;
                return 0;
        }

        while (nb_tx < nb_pkts) {
                last = (nb_tx == (nb_pkts - 1));

                next_q_head_idx = (q->head_idx + 1) & (q->num_descs - 1);
                if ((next_q_head_idx & 0x3) == 0) {
                        struct ionic_txq_desc *desc_base = q->base;
                        rte_prefetch0(&desc_base[next_q_head_idx]);
                        rte_prefetch0(&q->info[next_q_head_idx]);
                }

                if (tx_pkts[nb_tx]->ol_flags & PKT_TX_TCP_SEG)
                        err = ionic_tx_tso(q, tx_pkts[nb_tx], txq->offloads,
                                last);
                else
                        err = ionic_tx(q, tx_pkts[nb_tx], txq->offloads, last);
                if (err) {
                        stats->drop += nb_pkts - nb_tx;
                        if (nb_tx > 0)
                                ionic_q_flush(q);
                        break;
                }

                bytes_tx += tx_pkts[nb_tx]->pkt_len;
                nb_tx++;
        }

        stats->packets += nb_tx;
        stats->bytes += bytes_tx;

        return nb_tx;
}

/*********************************************************************
 *
 *  TX prep functions
 *
 **********************************************************************/

#define IONIC_TX_OFFLOAD_MASK ( \
        PKT_TX_IPV4 |           \
        PKT_TX_IPV6 |           \
        PKT_TX_VLAN |           \
        PKT_TX_IP_CKSUM |       \
        PKT_TX_TCP_SEG |        \
        PKT_TX_L4_MASK)

#define IONIC_TX_OFFLOAD_NOTSUP_MASK \
        (PKT_TX_OFFLOAD_MASK ^ IONIC_TX_OFFLOAD_MASK)

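/*
 * Validate a burst before transmit: reject packets with more SG
 * elements than the hardware supports or with offload flags the
 * driver cannot honor, reporting the failure through rte_errno.
 */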
uint16_t
ionic_prep_pkts(void *tx_queue __rte_unused, struct rte_mbuf **tx_pkts,
                uint16_t nb_pkts)
{
        struct rte_mbuf *txm;
        uint64_t offloads;
        int i = 0;

        for (i = 0; i < nb_pkts; i++) {
                txm = tx_pkts[i];

                if (txm->nb_segs > IONIC_TX_MAX_SG_ELEMS) {
                        rte_errno = EINVAL;
                        break;
                }

                offloads = txm->ol_flags;

                if (offloads & IONIC_TX_OFFLOAD_NOTSUP_MASK) {
                        rte_errno = ENOTSUP;
                        break;
                }
        }

        return i;
}

/*********************************************************************
 *
 *  RX functions
 *
 **********************************************************************/

static void ionic_rx_recycle(struct ionic_queue *q, uint32_t q_desc_index,
                struct rte_mbuf *mbuf);

void
ionic_rxq_info_get(struct rte_eth_dev *dev, uint16_t queue_id,
                struct rte_eth_rxq_info *qinfo)
{
        struct ionic_qcq *rxq = dev->data->rx_queues[queue_id];
        struct ionic_queue *q = &rxq->q;

        qinfo->mp = rxq->mb_pool;
        qinfo->scattered_rx = dev->data->scattered_rx;
        qinfo->nb_desc = q->num_descs;
        qinfo->conf.rx_deferred_start = rxq->flags & IONIC_QCQ_F_DEFERRED;
        qinfo->conf.offloads = rxq->offloads;
}

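/* Return all buffers posted between tail and head to the mempool */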
static void __rte_cold
ionic_rx_empty(struct ionic_queue *q)
{
        struct ionic_qcq *rxq = IONIC_Q_TO_QCQ(q);
        struct ionic_desc_info *cur;
        struct rte_mbuf *mbuf;

        while (q->tail_idx != q->head_idx) {
                cur = &q->info[q->tail_idx];
                mbuf = cur->cb_arg;
                rte_mempool_put(rxq->mb_pool, mbuf);

                q->tail_idx = (q->tail_idx + 1) & (q->num_descs - 1);
        }
}

void __rte_cold
ionic_dev_rx_queue_release(void *rx_queue)
{
        struct ionic_qcq *rxq = (struct ionic_qcq *)rx_queue;

        IONIC_PRINT_CALL();

        ionic_rx_empty(&rxq->q);

        ionic_qcq_free(rxq);
}

int __rte_cold
ionic_dev_rx_queue_setup(struct rte_eth_dev *eth_dev,
                uint16_t rx_queue_id,
                uint16_t nb_desc,
                uint32_t socket_id,
                const struct rte_eth_rxconf *rx_conf,
                struct rte_mempool *mp)
{
        struct ionic_lif *lif = IONIC_ETH_DEV_TO_LIF(eth_dev);
        struct ionic_qcq *rxq;
        uint64_t offloads;
        int err;

        if (rx_queue_id >= lif->nrxqcqs) {
                IONIC_PRINT(ERR,
                        "Queue index %u not available (max %u queues)",
                        rx_queue_id, lif->nrxqcqs);
                return -EINVAL;
        }

        offloads = rx_conf->offloads | eth_dev->data->dev_conf.rxmode.offloads;
        IONIC_PRINT(DEBUG,
                "Configuring skt %u RX queue %u with %u buffers, offloads %jx",
                socket_id, rx_queue_id, nb_desc, offloads);

        /* Validate number of receive descriptors */
        if (!rte_is_power_of_2(nb_desc) ||
                        nb_desc < IONIC_MIN_RING_DESC ||
                        nb_desc > IONIC_MAX_RING_DESC) {
                IONIC_PRINT(ERR,
                        "Bad descriptor count (%u) for queue %u (min: %u, max: %u)",
                        nb_desc, rx_queue_id,
                        IONIC_MIN_RING_DESC, IONIC_MAX_RING_DESC);
                return -EINVAL; /* or use IONIC_DEFAULT_RING_DESC */
        }

        if (rx_conf->offloads & DEV_RX_OFFLOAD_SCATTER)
                eth_dev->data->scattered_rx = 1;

        /* Free memory prior to re-allocation if needed... */
        if (eth_dev->data->rx_queues[rx_queue_id] != NULL) {
                void *rx_queue = eth_dev->data->rx_queues[rx_queue_id];
                ionic_dev_rx_queue_release(rx_queue);
                eth_dev->data->rx_queues[rx_queue_id] = NULL;
        }

        err = ionic_rx_qcq_alloc(lif, rx_queue_id, nb_desc, &rxq);
        if (err) {
                IONIC_PRINT(ERR, "Queue %d allocation failure", rx_queue_id);
                return -EINVAL;
        }

        rxq->mb_pool = mp;

        /*
         * Note: the interface does not currently support
         * DEV_RX_OFFLOAD_KEEP_CRC; once the adapter can keep the CRC,
         * account for ETHER_CRC_LEN and subtract it from the length of
         * all received packets:
         * if (eth_dev->data->dev_conf.rxmode.offloads &
         *     DEV_RX_OFFLOAD_KEEP_CRC)
         *   rxq->crc_len = ETHER_CRC_LEN;
         */

        /* Do not start queue with rte_eth_dev_start() */
        if (rx_conf->rx_deferred_start)
                rxq->flags |= IONIC_QCQ_F_DEFERRED;

        rxq->offloads = offloads;

        eth_dev->data->rx_queues[rx_queue_id] = rxq;

        return 0;
}

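/*
 * Completion handler for one received packet: validate the completion
 * status and length, fix up the mbuf chain (lengths, segment count),
 * then translate the hardware flags into mbuf offload flags (RSS hash,
 * VLAN strip, checksum results) and a packet type.
 */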
static void
ionic_rx_clean(struct ionic_queue *q,
                uint32_t q_desc_index, uint32_t cq_desc_index,
                void *cb_arg, void *service_cb_arg)
{
        struct ionic_rxq_comp *cq_desc_base = q->bound_cq->base;
        struct ionic_rxq_comp *cq_desc = &cq_desc_base[cq_desc_index];
        struct rte_mbuf *rxm = cb_arg;
        struct rte_mbuf *rxm_seg;
        struct ionic_qcq *rxq = IONIC_Q_TO_QCQ(q);
        uint32_t max_frame_size =
                rxq->lif->eth_dev->data->dev_conf.rxmode.max_rx_pkt_len;
        uint64_t pkt_flags = 0;
        uint32_t pkt_type;
        struct ionic_rx_stats *stats = IONIC_Q_TO_RX_STATS(q);
        struct ionic_rx_service *recv_args = (struct ionic_rx_service *)
                service_cb_arg;
        uint32_t buf_size = (uint16_t)
                (rte_pktmbuf_data_room_size(rxq->mb_pool) -
                RTE_PKTMBUF_HEADROOM);
        uint32_t left;

        if (!recv_args) {
                stats->no_cb_arg++;
                /* Flush */
                rte_pktmbuf_free(rxm);
                /*
                 * Note: rte_mempool_put is faster with no segs
                 * rte_mempool_put(rxq->mb_pool, rxm);
                 */
                return;
        }

        if (cq_desc->status) {
                stats->bad_cq_status++;
                ionic_rx_recycle(q, q_desc_index, rxm);
                return;
        }

        if (recv_args->nb_rx >= recv_args->nb_pkts) {
                stats->no_room++;
                ionic_rx_recycle(q, q_desc_index, rxm);
                return;
        }

        if (cq_desc->len > max_frame_size ||
                        cq_desc->len == 0) {
                stats->bad_len++;
                ionic_rx_recycle(q, q_desc_index, rxm);
                return;
        }

        rxm->data_off = RTE_PKTMBUF_HEADROOM;
        rte_prefetch1((char *)rxm->buf_addr + rxm->data_off);
        rxm->nb_segs = 1; /* cq_desc->num_sg_elems */
        rxm->pkt_len = cq_desc->len;
        rxm->port = rxq->lif->port_id;

        left = cq_desc->len;

        rxm->data_len = RTE_MIN(buf_size, left);
        left -= rxm->data_len;

        rxm_seg = rxm->next;
        while (rxm_seg && left) {
                rxm_seg->data_len = RTE_MIN(buf_size, left);
                left -= rxm_seg->data_len;

                rxm_seg = rxm_seg->next;
                rxm->nb_segs++;
        }

        /* RSS */
        pkt_flags |= PKT_RX_RSS_HASH;
        rxm->hash.rss = cq_desc->rss_hash;

        /* Vlan Strip */
        if (cq_desc->csum_flags & IONIC_RXQ_COMP_CSUM_F_VLAN) {
                pkt_flags |= PKT_RX_VLAN | PKT_RX_VLAN_STRIPPED;
                rxm->vlan_tci = cq_desc->vlan_tci;
        }

        /* Checksum */
        if (cq_desc->csum_flags & IONIC_RXQ_COMP_CSUM_F_CALC) {
                if (cq_desc->csum_flags & IONIC_RXQ_COMP_CSUM_F_IP_OK)
                        pkt_flags |= PKT_RX_IP_CKSUM_GOOD;
                else if (cq_desc->csum_flags & IONIC_RXQ_COMP_CSUM_F_IP_BAD)
                        pkt_flags |= PKT_RX_IP_CKSUM_BAD;

                if ((cq_desc->csum_flags & IONIC_RXQ_COMP_CSUM_F_TCP_OK) ||
                        (cq_desc->csum_flags & IONIC_RXQ_COMP_CSUM_F_UDP_OK))
                        pkt_flags |= PKT_RX_L4_CKSUM_GOOD;
                else if ((cq_desc->csum_flags &
                                IONIC_RXQ_COMP_CSUM_F_TCP_BAD) ||
                                (cq_desc->csum_flags &
                                IONIC_RXQ_COMP_CSUM_F_UDP_BAD))
                        pkt_flags |= PKT_RX_L4_CKSUM_BAD;
        }

        rxm->ol_flags = pkt_flags;

        /* Packet Type */
        switch (cq_desc->pkt_type_color & IONIC_RXQ_COMP_PKT_TYPE_MASK) {
        case IONIC_PKT_TYPE_IPV4:
                pkt_type = RTE_PTYPE_L2_ETHER | RTE_PTYPE_L3_IPV4;
                break;
        case IONIC_PKT_TYPE_IPV6:
                pkt_type = RTE_PTYPE_L2_ETHER | RTE_PTYPE_L3_IPV6;
                break;
        case IONIC_PKT_TYPE_IPV4_TCP:
                pkt_type = RTE_PTYPE_L2_ETHER | RTE_PTYPE_L3_IPV4 |
                        RTE_PTYPE_L4_TCP;
                break;
        case IONIC_PKT_TYPE_IPV6_TCP:
                pkt_type = RTE_PTYPE_L2_ETHER | RTE_PTYPE_L3_IPV6 |
                        RTE_PTYPE_L4_TCP;
                break;
        case IONIC_PKT_TYPE_IPV4_UDP:
                pkt_type = RTE_PTYPE_L2_ETHER | RTE_PTYPE_L3_IPV4 |
                        RTE_PTYPE_L4_UDP;
                break;
        case IONIC_PKT_TYPE_IPV6_UDP:
                pkt_type = RTE_PTYPE_L2_ETHER | RTE_PTYPE_L3_IPV6 |
                        RTE_PTYPE_L4_UDP;
                break;
        default:
                {
                        struct rte_ether_hdr *eth_h = rte_pktmbuf_mtod(rxm,
                                struct rte_ether_hdr *);
                        uint16_t ether_type = eth_h->ether_type;
                        if (ether_type == rte_cpu_to_be_16(RTE_ETHER_TYPE_ARP))
                                pkt_type = RTE_PTYPE_L2_ETHER_ARP;
                        else
                                pkt_type = RTE_PTYPE_UNKNOWN;
                        break;
                }
        }

        rxm->packet_type = pkt_type;

        recv_args->rx_pkts[recv_args->nb_rx] = rxm;
        recv_args->nb_rx++;

        stats->packets++;
        stats->bytes += rxm->pkt_len;
}

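/*
 * Repost a dropped buffer to the ring: copy the address and length
 * from the old descriptor into the one at the head and post it.
 */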
static void
ionic_rx_recycle(struct ionic_queue *q, uint32_t q_desc_index,
                 struct rte_mbuf *mbuf)
{
        struct ionic_rxq_desc *desc_base = q->base;
        struct ionic_rxq_desc *old = &desc_base[q_desc_index];
        struct ionic_rxq_desc *new = &desc_base[q->head_idx];

        new->addr = old->addr;
        new->len = old->len;

        ionic_q_post(q, true, ionic_rx_clean, mbuf);
}

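/*
 * Fill the receive ring with fresh mbufs, chaining extra buffers
 * through the SG descriptor when a frame of the given length needs
 * more than one; the doorbell is rung once per stride of postings.
 */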
static int __rte_cold
ionic_rx_fill(struct ionic_qcq *rxq, uint32_t len)
{
        struct ionic_queue *q = &rxq->q;
        struct ionic_rxq_desc *desc_base = q->base;
        struct ionic_rxq_sg_desc *sg_desc_base = q->sg_base;
        struct ionic_rxq_desc *desc;
        struct ionic_rxq_sg_desc *sg_desc;
        struct ionic_rxq_sg_elem *elem;
        rte_iova_t dma_addr;
        uint32_t i, j, nsegs, buf_size, size;
        bool ring_doorbell;

        buf_size = (uint16_t)(rte_pktmbuf_data_room_size(rxq->mb_pool) -
                RTE_PKTMBUF_HEADROOM);

        /* Initialize software ring entries */
        for (i = ionic_q_space_avail(q); i; i--) {
                struct rte_mbuf *rxm = rte_mbuf_raw_alloc(rxq->mb_pool);
                struct rte_mbuf *prev_rxm_seg;

                if (rxm == NULL) {
                        IONIC_PRINT(ERR, "RX mbuf alloc failed");
                        return -ENOMEM;
                }

                nsegs = (len + buf_size - 1) / buf_size;

                desc = &desc_base[q->head_idx];
                dma_addr = rte_cpu_to_le_64(rte_mbuf_data_iova_default(rxm));
                desc->addr = dma_addr;
                desc->len = buf_size;
                size = buf_size;
                desc->opcode = (nsegs > 1) ? IONIC_RXQ_DESC_OPCODE_SG :
                        IONIC_RXQ_DESC_OPCODE_SIMPLE;
                rxm->next = NULL;

                prev_rxm_seg = rxm;
                sg_desc = &sg_desc_base[q->head_idx];
                elem = sg_desc->elems;
                for (j = 0; j < nsegs - 1 && j < IONIC_RX_MAX_SG_ELEMS; j++) {
                        struct rte_mbuf *rxm_seg;
                        rte_iova_t data_iova;

                        rxm_seg = rte_mbuf_raw_alloc(rxq->mb_pool);
                        if (rxm_seg == NULL) {
                                IONIC_PRINT(ERR, "RX mbuf alloc failed");
                                return -ENOMEM;
                        }

                        data_iova = rte_mbuf_data_iova(rxm_seg);
                        dma_addr = rte_cpu_to_le_64(data_iova);
                        elem->addr = dma_addr;
                        elem->len = buf_size;
                        size += buf_size;
                        elem++;
                        rxm_seg->next = NULL;
                        prev_rxm_seg->next = rxm_seg;
                        prev_rxm_seg = rxm_seg;
                }

                if (size < len)
                        IONIC_PRINT(ERR, "Rx SG size is not sufficient (%d < %d)",
                                size, len);

                ring_doorbell = ((q->head_idx + 1) &
                        IONIC_RX_RING_DOORBELL_STRIDE) == 0;

                ionic_q_post(q, ring_doorbell, ionic_rx_clean, rxm);
        }

        return 0;
}

/*
 * Start Receive Units for specified queue.
 */
int __rte_cold
ionic_dev_rx_queue_start(struct rte_eth_dev *eth_dev, uint16_t rx_queue_id)
{
        uint32_t frame_size = eth_dev->data->dev_conf.rxmode.max_rx_pkt_len;
        struct ionic_qcq *rxq;
        int err;

        rxq = eth_dev->data->rx_queues[rx_queue_id];

        IONIC_PRINT(DEBUG, "Starting RX queue %u, %u descs (size: %u)",
                rx_queue_id, rxq->q.num_descs, frame_size);

        err = ionic_lif_rxq_init(rxq);
        if (err)
                return err;

        /* Allocate buffers for descriptor rings */
        if (ionic_rx_fill(rxq, frame_size) != 0) {
                IONIC_PRINT(ERR, "Could not alloc mbuf for queue:%d",
                        rx_queue_id);
                return -1;
        }

        ionic_qcq_enable(rxq);

        eth_dev->data->rx_queue_state[rx_queue_id] =
                RTE_ETH_QUEUE_STATE_STARTED;

        return 0;
}

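/*
 * Service up to work_to_do completions: for each completion, advance
 * the queue tail up through the completed index and hand every
 * descriptor's mbuf to ionic_rx_clean along with the caller's
 * receive context.
 */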
static inline void __rte_cold
ionic_rxq_service(struct ionic_cq *cq, uint32_t work_to_do,
                void *service_cb_arg)
{
        struct ionic_queue *q = cq->bound_q;
        struct ionic_desc_info *q_desc_info;
        struct ionic_rxq_comp *cq_desc_base = cq->base;
        struct ionic_rxq_comp *cq_desc;
        bool more;
        uint32_t curr_q_tail_idx, curr_cq_tail_idx;
        uint32_t work_done = 0;

        if (work_to_do == 0)
                return;

        cq_desc = &cq_desc_base[cq->tail_idx];
        while (color_match(cq_desc->pkt_type_color, cq->done_color)) {
                curr_cq_tail_idx = cq->tail_idx;
                cq->tail_idx = (cq->tail_idx + 1) & (cq->num_descs - 1);

                if (cq->tail_idx == 0)
                        cq->done_color = !cq->done_color;

                /* Prefetch the next 4 descriptors */
                if ((cq->tail_idx & 0x3) == 0)
                        rte_prefetch0(&cq_desc_base[cq->tail_idx]);

                do {
                        more = (q->tail_idx != cq_desc->comp_index);

                        q_desc_info = &q->info[q->tail_idx];

                        curr_q_tail_idx = q->tail_idx;
                        q->tail_idx = (q->tail_idx + 1) & (q->num_descs - 1);

                        /* Prefetch the next 4 descriptors */
                        if ((q->tail_idx & 0x3) == 0)
                                /* q desc info */
                                rte_prefetch0(&q->info[q->tail_idx]);

                        ionic_rx_clean(q, curr_q_tail_idx, curr_cq_tail_idx,
                                q_desc_info->cb_arg, service_cb_arg);

                } while (more);

                if (++work_done == work_to_do)
                        break;

                cq_desc = &cq_desc_base[cq->tail_idx];
        }
}

/*
 * Stop Receive Units for specified queue.
 */
int __rte_cold
ionic_dev_rx_queue_stop(struct rte_eth_dev *eth_dev, uint16_t rx_queue_id)
{
        struct ionic_qcq *rxq;

        IONIC_PRINT(DEBUG, "Stopping RX queue %u", rx_queue_id);

        rxq = eth_dev->data->rx_queues[rx_queue_id];

        ionic_qcq_disable(rxq);

        /* Flush */
        ionic_rxq_service(&rxq->cq, -1, NULL);

        ionic_lif_rxq_deinit(rxq);

        eth_dev->data->rx_queue_state[rx_queue_id] =
                RTE_ETH_QUEUE_STATE_STOPPED;

        return 0;
}

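/*
 * Burst receive: service up to nb_pkts completions into rx_pkts,
 * then replenish the ring with fresh buffers.
 */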
uint16_t
ionic_recv_pkts(void *rx_queue, struct rte_mbuf **rx_pkts,
                uint16_t nb_pkts)
{
        struct ionic_qcq *rxq = (struct ionic_qcq *)rx_queue;
        uint32_t frame_size =
                rxq->lif->eth_dev->data->dev_conf.rxmode.max_rx_pkt_len;
        struct ionic_cq *cq = &rxq->cq;
        struct ionic_rx_service service_cb_arg;

        service_cb_arg.rx_pkts = rx_pkts;
        service_cb_arg.nb_pkts = nb_pkts;
        service_cb_arg.nb_rx = 0;

        ionic_rxq_service(cq, nb_pkts, &service_cb_arg);

        ionic_rx_fill(rxq, frame_size);

        return service_cb_arg.nb_rx;
}