drivers/net/sfc/sfc_ef10_essb_rx.c
/* SPDX-License-Identifier: BSD-3-Clause
 *
 * Copyright(c) 2019-2020 Xilinx, Inc.
 * Copyright(c) 2017-2019 Solarflare Communications Inc.
 *
 * This software was jointly developed between OKTET Labs (under contract
 * for Solarflare) and Solarflare Communications, Inc.
 */

/* EF10 equal stride packed stream receive native datapath implementation */

#include <stdbool.h>

#include <rte_byteorder.h>
#include <rte_mbuf.h>
#include <rte_io.h>

#include "efx_types.h"
#include "efx_regs_ef10.h"

#include "sfc_debug.h"
#include "sfc_tweak.h"
#include "sfc_dp_rx.h"
#include "sfc_kvargs.h"
#include "sfc_ef10.h"

/* Tunnels are not supported */
#define SFC_EF10_RX_EV_ENCAP_SUPPORT    0
#include "sfc_ef10_rx_ev.h"

#define sfc_ef10_essb_rx_err(dpq, ...) \
        SFC_DP_LOG(SFC_KVARG_DATAPATH_EF10_ESSB, ERR, dpq, __VA_ARGS__)

#define sfc_ef10_essb_rx_info(dpq, ...) \
        SFC_DP_LOG(SFC_KVARG_DATAPATH_EF10_ESSB, INFO, dpq, __VA_ARGS__)

/*
 * Fake length for RXQ descriptors in equal stride super-buffer mode
 * to make hardware happy.
 */
#define SFC_EF10_ESSB_RX_FAKE_BUF_SIZE  32

/**
 * Minimum number of Rx buffers that the datapath allows to use.
 *
 * Each HW Rx descriptor covers many Rx buffers. The number of buffers
 * in one HW Rx descriptor is equal to the size of a contiguous block
 * provided by the Rx buffers memory pool. The contiguous block size
 * depends on CONFIG_RTE_DRIVER_MEMPOOL_BUCKET_SIZE_KB and the rte_mbuf
 * data size specified at memory pool creation. A typical rte_mbuf data
 * size is about 2k, which makes a bit less than 32 buffers per
 * contiguous block with the default bucket size equal to 64k.
 * Since HW Rx descriptors are pushed by 8 (see SFC_EF10_RX_WPTR_ALIGN),
 * this makes about 256 the required minimum. It is doubled in the
 * advertised minimum to allow for at least 2 refill blocks.
 */
#define SFC_EF10_ESSB_RX_DESCS_MIN      512

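/*
 * Worked example for the typical numbers above (illustrative only):
 * with a 64k bucket and ~2k mbuf data size, one contiguous block
 * holds a bit fewer than 32 buffers; 8 pushed HW Rx descriptors
 * (SFC_EF10_RX_WPTR_ALIGN) * ~32 buffers ~= 256 buffers as the
 * required minimum, doubled to 512 in SFC_EF10_ESSB_RX_DESCS_MIN.
 */
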
/**
 * Value the number of Rx buffers should be aligned to.
 *
 * There are no extra requirements on alignment since the actual number
 * of pushed Rx buffers will be a multiple of the contiguous block size,
 * which is unknown beforehand.
 */
#define SFC_EF10_ESSB_RX_DESCS_ALIGN    1

/**
 * Maximum number of descriptors/buffers in the Rx ring.
 * It should guarantee that the corresponding event queue never
 * overfills.
 */
#define SFC_EF10_ESSB_RXQ_LIMIT(_nevs) \
        ((_nevs) - 1 /* head must not step on tail */ - \
         (SFC_EF10_EV_PER_CACHE_LINE - 1) /* max unused EvQ entries */ - \
         1 /* Rx error */ - 1 /* flush */)

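/*
 * Example evaluation (illustrative only, assuming
 * SFC_EF10_EV_PER_CACHE_LINE is 8): for a 2048-entry event queue,
 * SFC_EF10_ESSB_RXQ_LIMIT(2048) = 2048 - 1 - 7 - 1 - 1 = 2038
 * buffers at most may be outstanding.
 */
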
struct sfc_ef10_essb_rx_sw_desc {
        struct rte_mbuf                 *first_mbuf;
};

struct sfc_ef10_essb_rxq {
        /* Used on data path */
        unsigned int                    flags;
#define SFC_EF10_ESSB_RXQ_STARTED       0x1
#define SFC_EF10_ESSB_RXQ_NOT_RUNNING   0x2
#define SFC_EF10_ESSB_RXQ_EXCEPTION     0x4
        unsigned int                    rxq_ptr_mask;
        unsigned int                    block_size;
        unsigned int                    buf_stride;
        unsigned int                    bufs_ptr;
        unsigned int                    completed;
        unsigned int                    pending_id;
        unsigned int                    bufs_pending;
        unsigned int                    left_in_completed;
        unsigned int                    left_in_pending;
        unsigned int                    evq_read_ptr;
        unsigned int                    evq_ptr_mask;
        efx_qword_t                     *evq_hw_ring;
        struct sfc_ef10_essb_rx_sw_desc *sw_ring;
        uint16_t                        port_id;

        /* Used on refill */
        unsigned int                    added;
        unsigned int                    max_fill_level;
        unsigned int                    refill_threshold;
        struct rte_mempool              *refill_mb_pool;
        efx_qword_t                     *rxq_hw_ring;
        volatile void                   *doorbell;

        /* Datapath receive queue anchor */
        struct sfc_dp_rxq               dp;
};

static inline struct sfc_ef10_essb_rxq *
sfc_ef10_essb_rxq_by_dp_rxq(struct sfc_dp_rxq *dp_rxq)
{
        return container_of(dp_rxq, struct sfc_ef10_essb_rxq, dp);
}

static struct rte_mbuf *
sfc_ef10_essb_next_mbuf(const struct sfc_ef10_essb_rxq *rxq,
                        struct rte_mbuf *mbuf)
{
        struct rte_mbuf *m;

        m = (struct rte_mbuf *)((uintptr_t)mbuf + rxq->buf_stride);
        MBUF_RAW_ALLOC_CHECK(m);
        return m;
}

static struct rte_mbuf *
sfc_ef10_essb_mbuf_by_index(const struct sfc_ef10_essb_rxq *rxq,
                            struct rte_mbuf *mbuf, unsigned int idx)
{
        struct rte_mbuf *m;

        m = (struct rte_mbuf *)((uintptr_t)mbuf + idx * rxq->buf_stride);
        MBUF_RAW_ALLOC_CHECK(m);
        return m;
}

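/*
 * Usage sketch (illustrative only, not part of the datapath): the two
 * helpers above address mbufs arithmetically since all mbufs of one
 * contiguous block are laid out buf_stride bytes apart. The hypothetical
 * function below reaches the last mbuf of a block from its first mbuf.
 */
static __rte_unused struct rte_mbuf *
sfc_ef10_essb_example_last_mbuf(const struct sfc_ef10_essb_rxq *rxq,
                                struct rte_mbuf *first_mbuf)
{
        struct rte_mbuf *m = first_mbuf;
        unsigned int i;

        /* Step over block_size - 1 strides to reach the last mbuf */
        for (i = 1; i < rxq->block_size; ++i)
                m = sfc_ef10_essb_next_mbuf(rxq, m);

        /* Equivalent direct computation by index */
        SFC_ASSERT(m == sfc_ef10_essb_mbuf_by_index(rxq, first_mbuf,
                                                    rxq->block_size - 1));
        return m;
}
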
static struct rte_mbuf *
sfc_ef10_essb_maybe_next_completed(struct sfc_ef10_essb_rxq *rxq)
{
        const struct sfc_ef10_essb_rx_sw_desc *rxd;

        if (rxq->left_in_completed != 0) {
                rxd = &rxq->sw_ring[rxq->completed & rxq->rxq_ptr_mask];
                return sfc_ef10_essb_mbuf_by_index(rxq, rxd->first_mbuf,
                                rxq->block_size - rxq->left_in_completed);
        } else {
                rxq->completed++;
                rxd = &rxq->sw_ring[rxq->completed & rxq->rxq_ptr_mask];
                rxq->left_in_completed = rxq->block_size;
                return rxd->first_mbuf;
        }
}

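/*
 * Illustrative example of the bookkeeping above (numbers are
 * assumptions): with block_size 32 and left_in_completed 5, the
 * current block still has its last 5 mbufs to hand out, so the helper
 * returns the mbuf at index 32 - 5 = 27; once left_in_completed drops
 * to 0, it advances to the next block and returns its first mbuf.
 */
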
static void
sfc_ef10_essb_rx_qrefill(struct sfc_ef10_essb_rxq *rxq)
{
        const unsigned int rxq_ptr_mask = rxq->rxq_ptr_mask;
        unsigned int free_space;
        unsigned int bulks;
        void *mbuf_blocks[SFC_EF10_RX_WPTR_ALIGN];
        unsigned int added = rxq->added;

        free_space = rxq->max_fill_level - (added - rxq->completed);

        if (free_space < rxq->refill_threshold)
                return;

        bulks = free_space / RTE_DIM(mbuf_blocks);
        /* refill_threshold guarantees that bulks is positive */
        SFC_ASSERT(bulks > 0);

        do {
                unsigned int id;
                unsigned int i;

                if (unlikely(rte_mempool_get_contig_blocks(rxq->refill_mb_pool,
                                mbuf_blocks, RTE_DIM(mbuf_blocks)) < 0)) {
                        struct rte_eth_dev_data *dev_data =
                                rte_eth_devices[rxq->port_id].data;

                        /*
                         * It is hardly a safe way to increment the counter
                         * from different contexts, but all PMDs do it.
                         */
                        dev_data->rx_mbuf_alloc_failed += RTE_DIM(mbuf_blocks);
                        /* Return if we have posted nothing yet */
                        if (added == rxq->added)
                                return;
                        /* Push posted */
                        break;
                }

                for (i = 0, id = added & rxq_ptr_mask;
                     i < RTE_DIM(mbuf_blocks);
                     ++i, ++id) {
                        struct rte_mbuf *m = mbuf_blocks[i];
                        struct sfc_ef10_essb_rx_sw_desc *rxd;

                        SFC_ASSERT((id & ~rxq_ptr_mask) == 0);
                        rxd = &rxq->sw_ring[id];
                        rxd->first_mbuf = m;

                        /* RX_KER_BYTE_CNT is ignored by firmware */
                        EFX_POPULATE_QWORD_2(rxq->rxq_hw_ring[id],
                                             ESF_DZ_RX_KER_BYTE_CNT,
                                             SFC_EF10_ESSB_RX_FAKE_BUF_SIZE,
                                             ESF_DZ_RX_KER_BUF_ADDR,
                                             rte_mbuf_data_iova_default(m));
                }

                added += RTE_DIM(mbuf_blocks);

        } while (--bulks > 0);

        SFC_ASSERT(rxq->added != added);
        rxq->added = added;
        sfc_ef10_rx_qpush(rxq->doorbell, added, rxq_ptr_mask);
}

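/*
 * Refill arithmetic example (illustrative only, numbers are
 * assumptions): with max_fill_level 64, added - completed 40 and
 * refill_threshold 8, free_space is 24, so 24 / 8 = 3 bulks of
 * SFC_EF10_RX_WPTR_ALIGN contiguous blocks each are dequeued and
 * posted before a single doorbell push.
 */
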
static bool
sfc_ef10_essb_rx_event_get(struct sfc_ef10_essb_rxq *rxq, efx_qword_t *rx_ev)
{
        *rx_ev = rxq->evq_hw_ring[rxq->evq_read_ptr & rxq->evq_ptr_mask];

        if (!sfc_ef10_ev_present(*rx_ev))
                return false;

        if (unlikely(EFX_QWORD_FIELD(*rx_ev, FSF_AZ_EV_CODE) !=
                     FSE_AZ_EV_CODE_RX_EV)) {
                /*
                 * Do not move read_ptr to keep the event for exception
                 * handling
                 */
                rxq->flags |= SFC_EF10_ESSB_RXQ_EXCEPTION;
                sfc_ef10_essb_rx_err(&rxq->dp.dpq,
                                     "RxQ exception at EvQ read ptr %#x",
                                     rxq->evq_read_ptr);
                return false;
        }

        rxq->evq_read_ptr++;
        return true;
}

static void
sfc_ef10_essb_rx_process_ev(struct sfc_ef10_essb_rxq *rxq, efx_qword_t rx_ev)
{
        unsigned int ready;

        ready = (EFX_QWORD_FIELD(rx_ev, ESF_DZ_RX_DSC_PTR_LBITS) -
                 rxq->bufs_ptr) &
                EFX_MASK32(ESF_DZ_RX_DSC_PTR_LBITS);

        rxq->bufs_ptr += ready;
        rxq->bufs_pending += ready;

        SFC_ASSERT(ready > 0);
        do {
                const struct sfc_ef10_essb_rx_sw_desc *rxd;
                struct rte_mbuf *m;
                unsigned int todo_bufs;
                struct rte_mbuf *m0;

                rxd = &rxq->sw_ring[rxq->pending_id];
                m = sfc_ef10_essb_mbuf_by_index(rxq, rxd->first_mbuf,
                        rxq->block_size - rxq->left_in_pending);

                if (ready < rxq->left_in_pending) {
                        todo_bufs = ready;
                        ready = 0;
                        rxq->left_in_pending -= todo_bufs;
                } else {
                        todo_bufs = rxq->left_in_pending;
                        ready -= todo_bufs;
                        rxq->left_in_pending = rxq->block_size;
                        if (rxq->pending_id != rxq->rxq_ptr_mask)
                                rxq->pending_id++;
                        else
                                rxq->pending_id = 0;
                }

                SFC_ASSERT(todo_bufs > 0);
                --todo_bufs;

                sfc_ef10_rx_ev_to_offloads(rx_ev, m, ~0ull);

                /* Prefetch pseudo-header */
                rte_prefetch0((uint8_t *)m->buf_addr + RTE_PKTMBUF_HEADROOM);

                m0 = m;
                while (todo_bufs-- > 0) {
                        m = sfc_ef10_essb_next_mbuf(rxq, m);
                        m->ol_flags = m0->ol_flags;
                        m->packet_type = m0->packet_type;
                        /* Prefetch pseudo-header */
                        rte_prefetch0((uint8_t *)m->buf_addr +
                                      RTE_PKTMBUF_HEADROOM);
                }
        } while (ready > 0);
}

static unsigned int
sfc_ef10_essb_rx_get_pending(struct sfc_ef10_essb_rxq *rxq,
                             struct rte_mbuf **rx_pkts, uint16_t nb_pkts)
{
        unsigned int n_rx_pkts = 0;
        unsigned int todo_bufs;
        struct rte_mbuf *m;

        while ((todo_bufs = RTE_MIN(nb_pkts - n_rx_pkts,
                                    rxq->bufs_pending)) > 0) {
                m = sfc_ef10_essb_maybe_next_completed(rxq);

                todo_bufs = RTE_MIN(todo_bufs, rxq->left_in_completed);

                rxq->bufs_pending -= todo_bufs;
                rxq->left_in_completed -= todo_bufs;

                SFC_ASSERT(todo_bufs > 0);
                todo_bufs--;

                do {
                        const efx_qword_t *qwordp;
                        uint16_t pkt_len;

                        /* Buffers to be discarded have 0 in packet type */
                        if (unlikely(m->packet_type == 0)) {
                                rte_mbuf_raw_free(m);
                                goto next_buf;
                        }

                        rx_pkts[n_rx_pkts++] = m;

                        /* Parse pseudo-header */
                        qwordp = (const efx_qword_t *)
                                ((uint8_t *)m->buf_addr + RTE_PKTMBUF_HEADROOM);
                        pkt_len =
                                EFX_QWORD_FIELD(*qwordp,
                                                ES_EZ_ESSB_RX_PREFIX_DATA_LEN);

                        m->data_off = RTE_PKTMBUF_HEADROOM +
                                ES_EZ_ESSB_RX_PREFIX_LEN;
                        m->port = rxq->port_id;

                        rte_pktmbuf_pkt_len(m) = pkt_len;
                        rte_pktmbuf_data_len(m) = pkt_len;

                        m->ol_flags |=
                                (PKT_RX_RSS_HASH *
                                 !!EFX_TEST_QWORD_BIT(*qwordp,
                                        ES_EZ_ESSB_RX_PREFIX_HASH_VALID_LBN)) |
                                (PKT_RX_FDIR_ID *
                                 !!EFX_TEST_QWORD_BIT(*qwordp,
                                        ES_EZ_ESSB_RX_PREFIX_MARK_VALID_LBN)) |
                                (PKT_RX_FDIR *
                                 !!EFX_TEST_QWORD_BIT(*qwordp,
                                        ES_EZ_ESSB_RX_PREFIX_MATCH_FLAG_LBN));

                        /* EFX_QWORD_FIELD converts little-endian to CPU */
                        m->hash.rss =
                                EFX_QWORD_FIELD(*qwordp,
                                                ES_EZ_ESSB_RX_PREFIX_HASH);
                        m->hash.fdir.hi =
                                EFX_QWORD_FIELD(*qwordp,
                                                ES_EZ_ESSB_RX_PREFIX_MARK);

next_buf:
                        m = sfc_ef10_essb_next_mbuf(rxq, m);
                } while (todo_bufs-- > 0);
        }

        return n_rx_pkts;
}

static uint16_t
sfc_ef10_essb_recv_pkts(void *rx_queue, struct rte_mbuf **rx_pkts,
                        uint16_t nb_pkts)
{
        struct sfc_ef10_essb_rxq *rxq = sfc_ef10_essb_rxq_by_dp_rxq(rx_queue);
        const unsigned int evq_old_read_ptr = rxq->evq_read_ptr;
        uint16_t n_rx_pkts;
        efx_qword_t rx_ev;

        if (unlikely(rxq->flags & (SFC_EF10_ESSB_RXQ_NOT_RUNNING |
                                   SFC_EF10_ESSB_RXQ_EXCEPTION)))
                return 0;

        n_rx_pkts = sfc_ef10_essb_rx_get_pending(rxq, rx_pkts, nb_pkts);

        while (n_rx_pkts != nb_pkts &&
               sfc_ef10_essb_rx_event_get(rxq, &rx_ev)) {
                /*
                 * DROP_EVENT is internal to the NIC; software should
                 * never see it and, therefore, may ignore it.
                 */

                sfc_ef10_essb_rx_process_ev(rxq, rx_ev);
                n_rx_pkts += sfc_ef10_essb_rx_get_pending(rxq,
                                                          rx_pkts + n_rx_pkts,
                                                          nb_pkts - n_rx_pkts);
        }

        sfc_ef10_ev_qclear(rxq->evq_hw_ring, rxq->evq_ptr_mask,
                           evq_old_read_ptr, rxq->evq_read_ptr);

        /* It is not a problem if we refill in the case of exception */
        sfc_ef10_essb_rx_qrefill(rxq);

        return n_rx_pkts;
}

static sfc_dp_rx_qdesc_npending_t sfc_ef10_essb_rx_qdesc_npending;
static unsigned int
sfc_ef10_essb_rx_qdesc_npending(struct sfc_dp_rxq *dp_rxq)
{
        struct sfc_ef10_essb_rxq *rxq = sfc_ef10_essb_rxq_by_dp_rxq(dp_rxq);
        const unsigned int evq_old_read_ptr = rxq->evq_read_ptr;
        efx_qword_t rx_ev;

        if (unlikely(rxq->flags & (SFC_EF10_ESSB_RXQ_NOT_RUNNING |
                                   SFC_EF10_ESSB_RXQ_EXCEPTION)))
                return rxq->bufs_pending;

        while (sfc_ef10_essb_rx_event_get(rxq, &rx_ev)) {
                /*
                 * DROP_EVENT is internal to the NIC; software should
                 * never see it and, therefore, may ignore it.
                 */
                sfc_ef10_essb_rx_process_ev(rxq, rx_ev);
        }

        sfc_ef10_ev_qclear(rxq->evq_hw_ring, rxq->evq_ptr_mask,
                           evq_old_read_ptr, rxq->evq_read_ptr);

        return rxq->bufs_pending;
}

static sfc_dp_rx_qdesc_status_t sfc_ef10_essb_rx_qdesc_status;
static int
sfc_ef10_essb_rx_qdesc_status(struct sfc_dp_rxq *dp_rxq, uint16_t offset)
{
        struct sfc_ef10_essb_rxq *rxq = sfc_ef10_essb_rxq_by_dp_rxq(dp_rxq);
        unsigned int pending = sfc_ef10_essb_rx_qdesc_npending(dp_rxq);

        if (offset < pending)
                return RTE_ETH_RX_DESC_DONE;

        if (offset < (rxq->added - rxq->completed) * rxq->block_size +
                     rxq->left_in_completed - rxq->block_size)
                return RTE_ETH_RX_DESC_AVAIL;

        return RTE_ETH_RX_DESC_UNAVAIL;
}

static sfc_dp_rx_get_dev_info_t sfc_ef10_essb_rx_get_dev_info;
static void
sfc_ef10_essb_rx_get_dev_info(struct rte_eth_dev_info *dev_info)
{
        /*
         * The number of descriptors just defines the maximum number of
         * pushed descriptors (fill level).
         */
        dev_info->rx_desc_lim.nb_min = SFC_EF10_ESSB_RX_DESCS_MIN;
        dev_info->rx_desc_lim.nb_align = SFC_EF10_ESSB_RX_DESCS_ALIGN;
}

static sfc_dp_rx_pool_ops_supported_t sfc_ef10_essb_rx_pool_ops_supported;
static int
sfc_ef10_essb_rx_pool_ops_supported(const char *pool)
{
        SFC_ASSERT(pool != NULL);

        if (strcmp(pool, "bucket") == 0)
                return 0;

        return -ENOTSUP;
}

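/*
 * Usage sketch (illustrative only, not part of the driver): an
 * application must create its Rx mempool with the bucket ops so that
 * rte_mempool_get_contig_blocks() works and the check above passes.
 * The pool name, element count and cache size below are assumptions.
 */
static __rte_unused struct rte_mempool *
sfc_ef10_essb_example_mb_pool(int socket_id)
{
        /* 8192 mbufs, no per-lcore cache, default data room, bucket ops */
        return rte_pktmbuf_pool_create_by_ops("rx_bucket", 8192, 0, 0,
                                              RTE_MBUF_DEFAULT_BUF_SIZE,
                                              socket_id, "bucket");
}
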
static sfc_dp_rx_qsize_up_rings_t sfc_ef10_essb_rx_qsize_up_rings;
static int
sfc_ef10_essb_rx_qsize_up_rings(uint16_t nb_rx_desc,
                                struct sfc_dp_rx_hw_limits *limits,
                                struct rte_mempool *mb_pool,
                                unsigned int *rxq_entries,
                                unsigned int *evq_entries,
                                unsigned int *rxq_max_fill_level)
{
        int rc;
        struct rte_mempool_info mp_info;
        unsigned int nb_hw_rx_desc;
        unsigned int max_events;

        rc = rte_mempool_ops_get_info(mb_pool, &mp_info);
        if (rc != 0)
                return -rc;
        if (mp_info.contig_block_size == 0)
                return EINVAL;

        /*
         * Calculate the required number of hardware Rx descriptors,
         * each carrying contig block size Rx buffers.
         * It cannot be less than Rx write pointer alignment plus 1
         * in order to avoid cases when the ring is guaranteed to be
         * empty.
         */
        nb_hw_rx_desc = RTE_MAX(SFC_DIV_ROUND_UP(nb_rx_desc,
                                                 mp_info.contig_block_size),
                                SFC_EF10_RX_WPTR_ALIGN + 1);
        if (nb_hw_rx_desc <= limits->rxq_min_entries) {
                *rxq_entries = limits->rxq_min_entries;
        } else {
                *rxq_entries = rte_align32pow2(nb_hw_rx_desc);
                if (*rxq_entries > limits->rxq_max_entries)
                        return EINVAL;
        }

        max_events = RTE_ALIGN_FLOOR(nb_hw_rx_desc, SFC_EF10_RX_WPTR_ALIGN) *
                mp_info.contig_block_size +
                (SFC_EF10_EV_PER_CACHE_LINE - 1) /* max unused EvQ entries */ +
                1 /* Rx error */ + 1 /* flush */ + 1 /* head-tail space */;

        *evq_entries = rte_align32pow2(max_events);
        *evq_entries = RTE_MAX(*evq_entries, limits->evq_min_entries);
        *evq_entries = RTE_MIN(*evq_entries, limits->evq_max_entries);

        /*
         * Even the maximum event queue size may be insufficient to
         * handle so many Rx descriptors. If so, we should limit the
         * Rx queue fill level.
         */
        *rxq_max_fill_level = RTE_MIN(nb_rx_desc,
                                      SFC_EF10_ESSB_RXQ_LIMIT(*evq_entries));
        return 0;
}

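/*
 * Sizing example (illustrative only, numbers are assumptions): for
 * nb_rx_desc 2048 and contig_block_size 32, nb_hw_rx_desc is
 * max(2048 / 32, 8 + 1) = 64; if the hardware minimum allows it,
 * rxq_entries is rte_align32pow2(64) = 64; assuming
 * SFC_EF10_EV_PER_CACHE_LINE is 8, max_events is
 * 64 * 32 + 7 + 1 + 1 + 1 = 2058, so evq_entries is
 * rte_align32pow2(2058) = 4096 (clamped to the hardware limits).
 */
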
static sfc_dp_rx_qcreate_t sfc_ef10_essb_rx_qcreate;
static int
sfc_ef10_essb_rx_qcreate(uint16_t port_id, uint16_t queue_id,
                         const struct rte_pci_addr *pci_addr, int socket_id,
                         const struct sfc_dp_rx_qcreate_info *info,
                         struct sfc_dp_rxq **dp_rxqp)
{
        struct rte_mempool * const mp = info->refill_mb_pool;
        struct rte_mempool_info mp_info;
        struct sfc_ef10_essb_rxq *rxq;
        int rc;

        rc = rte_mempool_ops_get_info(mp, &mp_info);
        if (rc != 0) {
                /* Positive errno is used in the driver */
                rc = -rc;
                goto fail_get_contig_block_size;
        }

        /* Check if the mempool provides block dequeue */
        rc = EINVAL;
        if (mp_info.contig_block_size == 0)
                goto fail_no_block_dequeue;

        rc = ENOMEM;
        rxq = rte_zmalloc_socket("sfc-ef10-rxq", sizeof(*rxq),
                                 RTE_CACHE_LINE_SIZE, socket_id);
        if (rxq == NULL)
                goto fail_rxq_alloc;

        sfc_dp_queue_init(&rxq->dp.dpq, port_id, queue_id, pci_addr);

        rc = ENOMEM;
        rxq->sw_ring = rte_calloc_socket("sfc-ef10-rxq-sw_ring",
                                         info->rxq_entries,
                                         sizeof(*rxq->sw_ring),
                                         RTE_CACHE_LINE_SIZE, socket_id);
        if (rxq->sw_ring == NULL)
                goto fail_desc_alloc;

        rxq->block_size = mp_info.contig_block_size;
        rxq->buf_stride = mp->header_size + mp->elt_size + mp->trailer_size;
        rxq->rxq_ptr_mask = info->rxq_entries - 1;
        rxq->evq_ptr_mask = info->evq_entries - 1;
        rxq->evq_hw_ring = info->evq_hw_ring;
        rxq->port_id = port_id;

        rxq->max_fill_level = info->max_fill_level / mp_info.contig_block_size;
        rxq->refill_threshold =
                RTE_MAX(info->refill_threshold / mp_info.contig_block_size,
                        SFC_EF10_RX_WPTR_ALIGN);
        rxq->refill_mb_pool = mp;
        rxq->rxq_hw_ring = info->rxq_hw_ring;

        rxq->doorbell = (volatile uint8_t *)info->mem_bar +
                        ER_DZ_RX_DESC_UPD_REG_OFST +
                        (info->hw_index << info->vi_window_shift);

        sfc_ef10_essb_rx_info(&rxq->dp.dpq, "RxQ doorbell is %p",
                              rxq->doorbell);
        sfc_ef10_essb_rx_info(&rxq->dp.dpq,
                              "block size is %u, buf stride is %u",
                              rxq->block_size, rxq->buf_stride);
        sfc_ef10_essb_rx_info(&rxq->dp.dpq,
                              "max fill level is %u descs (%u bufs), "
                              "refill threshold %u descs (%u bufs)",
                              rxq->max_fill_level,
                              rxq->max_fill_level * rxq->block_size,
                              rxq->refill_threshold,
                              rxq->refill_threshold * rxq->block_size);

        *dp_rxqp = &rxq->dp;
        return 0;

fail_desc_alloc:
        rte_free(rxq);

fail_rxq_alloc:
fail_no_block_dequeue:
fail_get_contig_block_size:
        return rc;
}

static sfc_dp_rx_qdestroy_t sfc_ef10_essb_rx_qdestroy;
static void
sfc_ef10_essb_rx_qdestroy(struct sfc_dp_rxq *dp_rxq)
{
        struct sfc_ef10_essb_rxq *rxq = sfc_ef10_essb_rxq_by_dp_rxq(dp_rxq);

        rte_free(rxq->sw_ring);
        rte_free(rxq);
}

static sfc_dp_rx_qstart_t sfc_ef10_essb_rx_qstart;
static int
sfc_ef10_essb_rx_qstart(struct sfc_dp_rxq *dp_rxq, unsigned int evq_read_ptr)
{
        struct sfc_ef10_essb_rxq *rxq = sfc_ef10_essb_rxq_by_dp_rxq(dp_rxq);

        rxq->evq_read_ptr = evq_read_ptr;

        /* Initialize before refill */
        rxq->completed = rxq->pending_id = rxq->added = 0;
        rxq->left_in_completed = rxq->left_in_pending = rxq->block_size;
        rxq->bufs_ptr = UINT_MAX;
        rxq->bufs_pending = 0;

        sfc_ef10_essb_rx_qrefill(rxq);

        rxq->flags |= SFC_EF10_ESSB_RXQ_STARTED;
        rxq->flags &=
                ~(SFC_EF10_ESSB_RXQ_NOT_RUNNING | SFC_EF10_ESSB_RXQ_EXCEPTION);

        return 0;
}

static sfc_dp_rx_qstop_t sfc_ef10_essb_rx_qstop;
static void
sfc_ef10_essb_rx_qstop(struct sfc_dp_rxq *dp_rxq, unsigned int *evq_read_ptr)
{
        struct sfc_ef10_essb_rxq *rxq = sfc_ef10_essb_rxq_by_dp_rxq(dp_rxq);

        rxq->flags |= SFC_EF10_ESSB_RXQ_NOT_RUNNING;

        *evq_read_ptr = rxq->evq_read_ptr;
}

static sfc_dp_rx_qrx_ev_t sfc_ef10_essb_rx_qrx_ev;
static bool
sfc_ef10_essb_rx_qrx_ev(struct sfc_dp_rxq *dp_rxq, __rte_unused unsigned int id)
{
        __rte_unused struct sfc_ef10_essb_rxq *rxq;

        rxq = sfc_ef10_essb_rxq_by_dp_rxq(dp_rxq);
        SFC_ASSERT(rxq->flags & SFC_EF10_ESSB_RXQ_NOT_RUNNING);

        /*
         * It is safe to ignore the Rx event since we free all mbufs on
         * queue purge anyway.
         */

        return false;
}

static sfc_dp_rx_qpurge_t sfc_ef10_essb_rx_qpurge;
static void
sfc_ef10_essb_rx_qpurge(struct sfc_dp_rxq *dp_rxq)
{
        struct sfc_ef10_essb_rxq *rxq = sfc_ef10_essb_rxq_by_dp_rxq(dp_rxq);
        unsigned int i;
        const struct sfc_ef10_essb_rx_sw_desc *rxd;
        struct rte_mbuf *m;

        for (i = rxq->completed; i != rxq->added; ++i) {
                rxd = &rxq->sw_ring[i & rxq->rxq_ptr_mask];
                m = sfc_ef10_essb_mbuf_by_index(rxq, rxd->first_mbuf,
                                rxq->block_size - rxq->left_in_completed);
                while (rxq->left_in_completed > 0) {
                        rte_mbuf_raw_free(m);
                        m = sfc_ef10_essb_next_mbuf(rxq, m);
                        rxq->left_in_completed--;
                }
                rxq->left_in_completed = rxq->block_size;
        }

        rxq->flags &= ~SFC_EF10_ESSB_RXQ_STARTED;
}

struct sfc_dp_rx sfc_ef10_essb_rx = {
        .dp = {
                .name           = SFC_KVARG_DATAPATH_EF10_ESSB,
                .type           = SFC_DP_RX,
                .hw_fw_caps     = SFC_DP_HW_FW_CAP_EF10 |
                                  SFC_DP_HW_FW_CAP_RX_ES_SUPER_BUFFER,
        },
        .features               = SFC_DP_RX_FEAT_FLOW_FLAG |
                                  SFC_DP_RX_FEAT_FLOW_MARK,
        .dev_offload_capa       = DEV_RX_OFFLOAD_CHECKSUM |
                                  DEV_RX_OFFLOAD_RSS_HASH,
        .queue_offload_capa     = 0,
        .get_dev_info           = sfc_ef10_essb_rx_get_dev_info,
        .pool_ops_supported     = sfc_ef10_essb_rx_pool_ops_supported,
        .qsize_up_rings         = sfc_ef10_essb_rx_qsize_up_rings,
        .qcreate                = sfc_ef10_essb_rx_qcreate,
        .qdestroy               = sfc_ef10_essb_rx_qdestroy,
        .qstart                 = sfc_ef10_essb_rx_qstart,
        .qstop                  = sfc_ef10_essb_rx_qstop,
        .qrx_ev                 = sfc_ef10_essb_rx_qrx_ev,
        .qpurge                 = sfc_ef10_essb_rx_qpurge,
        .supported_ptypes_get   = sfc_ef10_supported_ptypes_get,
        .qdesc_npending         = sfc_ef10_essb_rx_qdesc_npending,
        .qdesc_status           = sfc_ef10_essb_rx_qdesc_status,
        .pkt_burst              = sfc_ef10_essb_recv_pkts,
};