1 /* SPDX-License-Identifier: BSD-3-Clause
3 * Copyright (c) 2012-2018 Solarflare Communications Inc.
9 #if EFSYS_OPT_MON_STATS
13 #if EFSYS_OPT_HUNTINGTON || EFSYS_OPT_MEDFORD
16 #define EFX_EV_QSTAT_INCR(_eep, _stat) \
18 (_eep)->ee_stat[_stat]++; \
19 _NOTE(CONSTANTCONDITION) \
22 #define EFX_EV_QSTAT_INCR(_eep, _stat)
26 * A non-interrupting event queue requires an interrupting event queue to
27 * refer to for wake-up events even if wake-ups are never used.
28 * It could even be a non-allocated event queue.
30 #define EFX_EF10_ALWAYS_INTERRUPTING_EVQ_INDEX (0)
32 static __checkReturn boolean_t
35 __in efx_qword_t *eqp,
36 __in const efx_ev_callbacks_t *eecp,
39 static __checkReturn boolean_t
42 __in efx_qword_t *eqp,
43 __in const efx_ev_callbacks_t *eecp,
46 static __checkReturn boolean_t
49 __in efx_qword_t *eqp,
50 __in const efx_ev_callbacks_t *eecp,
53 static __checkReturn boolean_t
56 __in efx_qword_t *eqp,
57 __in const efx_ev_callbacks_t *eecp,
60 static __checkReturn boolean_t
63 __in efx_qword_t *eqp,
64 __in const efx_ev_callbacks_t *eecp,
68 static __checkReturn efx_rc_t
71 __in uint32_t instance,
73 __in uint32_t timer_ns)
76 uint8_t payload[MAX(MC_CMD_SET_EVQ_TMR_IN_LEN,
77 MC_CMD_SET_EVQ_TMR_OUT_LEN)];
80 (void) memset(payload, 0, sizeof (payload));
81 req.emr_cmd = MC_CMD_SET_EVQ_TMR;
82 req.emr_in_buf = payload;
83 req.emr_in_length = MC_CMD_SET_EVQ_TMR_IN_LEN;
84 req.emr_out_buf = payload;
85 req.emr_out_length = MC_CMD_SET_EVQ_TMR_OUT_LEN;
87 MCDI_IN_SET_DWORD(req, SET_EVQ_TMR_IN_INSTANCE, instance);
88 MCDI_IN_SET_DWORD(req, SET_EVQ_TMR_IN_TMR_LOAD_REQ_NS, timer_ns);
89 MCDI_IN_SET_DWORD(req, SET_EVQ_TMR_IN_TMR_RELOAD_REQ_NS, timer_ns);
90 MCDI_IN_SET_DWORD(req, SET_EVQ_TMR_IN_TMR_MODE, mode);
92 efx_mcdi_execute(enp, &req);
94 if (req.emr_rc != 0) {
99 if (req.emr_out_length_used < MC_CMD_SET_EVQ_TMR_OUT_LEN) {
109 EFSYS_PROBE1(fail1, efx_rc_t, rc);
114 static __checkReturn efx_rc_t
117 __in unsigned int instance,
118 __in efsys_mem_t *esmp,
123 __in boolean_t low_latency)
127 MAX(MC_CMD_INIT_EVQ_IN_LEN(EFX_EVQ_NBUFS(EFX_EVQ_MAXNEVS)),
128 MC_CMD_INIT_EVQ_OUT_LEN)];
129 efx_qword_t *dma_addr;
133 boolean_t interrupting;
137 npages = EFX_EVQ_NBUFS(nevs);
138 if (MC_CMD_INIT_EVQ_IN_LEN(npages) > MC_CMD_INIT_EVQ_IN_LENMAX) {
143 (void) memset(payload, 0, sizeof (payload));
144 req.emr_cmd = MC_CMD_INIT_EVQ;
145 req.emr_in_buf = payload;
146 req.emr_in_length = MC_CMD_INIT_EVQ_IN_LEN(npages);
147 req.emr_out_buf = payload;
148 req.emr_out_length = MC_CMD_INIT_EVQ_OUT_LEN;
150 MCDI_IN_SET_DWORD(req, INIT_EVQ_IN_SIZE, nevs);
151 MCDI_IN_SET_DWORD(req, INIT_EVQ_IN_INSTANCE, instance);
152 MCDI_IN_SET_DWORD(req, INIT_EVQ_IN_IRQ_NUM, irq);
154 interrupting = ((flags & EFX_EVQ_FLAGS_NOTIFY_MASK) ==
155 EFX_EVQ_FLAGS_NOTIFY_INTERRUPT);
158 * On Huntington RX and TX event batching can only be requested together
159 * (even if the datapath firmware doesn't actually support RX
160 * batching). If event cut through is enabled no RX batching will occur.
162 * So always enable RX and TX event batching, and enable event cut
163 * through if we want low latency operation.
165 switch (flags & EFX_EVQ_FLAGS_TYPE_MASK) {
166 case EFX_EVQ_FLAGS_TYPE_AUTO:
167 ev_cut_through = low_latency ? 1 : 0;
169 case EFX_EVQ_FLAGS_TYPE_THROUGHPUT:
172 case EFX_EVQ_FLAGS_TYPE_LOW_LATENCY:
179 MCDI_IN_POPULATE_DWORD_6(req, INIT_EVQ_IN_FLAGS,
180 INIT_EVQ_IN_FLAG_INTERRUPTING, interrupting,
181 INIT_EVQ_IN_FLAG_RPTR_DOS, 0,
182 INIT_EVQ_IN_FLAG_INT_ARMD, 0,
183 INIT_EVQ_IN_FLAG_CUT_THRU, ev_cut_through,
184 INIT_EVQ_IN_FLAG_RX_MERGE, 1,
185 INIT_EVQ_IN_FLAG_TX_MERGE, 1);
187 /* If the value is zero then disable the timer */
189 MCDI_IN_SET_DWORD(req, INIT_EVQ_IN_TMR_MODE,
190 MC_CMD_INIT_EVQ_IN_TMR_MODE_DIS);
191 MCDI_IN_SET_DWORD(req, INIT_EVQ_IN_TMR_LOAD, 0);
192 MCDI_IN_SET_DWORD(req, INIT_EVQ_IN_TMR_RELOAD, 0);
196 if ((rc = efx_ev_usecs_to_ticks(enp, us, &ticks)) != 0)
199 MCDI_IN_SET_DWORD(req, INIT_EVQ_IN_TMR_MODE,
200 MC_CMD_INIT_EVQ_IN_TMR_INT_HLDOFF);
201 MCDI_IN_SET_DWORD(req, INIT_EVQ_IN_TMR_LOAD, ticks);
202 MCDI_IN_SET_DWORD(req, INIT_EVQ_IN_TMR_RELOAD, ticks);
205 MCDI_IN_SET_DWORD(req, INIT_EVQ_IN_COUNT_MODE,
206 MC_CMD_INIT_EVQ_IN_COUNT_MODE_DIS);
207 MCDI_IN_SET_DWORD(req, INIT_EVQ_IN_COUNT_THRSHLD, 0);
209 dma_addr = MCDI_IN2(req, efx_qword_t, INIT_EVQ_IN_DMA_ADDR);
210 addr = EFSYS_MEM_ADDR(esmp);
212 for (i = 0; i < npages; i++) {
213 EFX_POPULATE_QWORD_2(*dma_addr,
214 EFX_DWORD_1, (uint32_t)(addr >> 32),
215 EFX_DWORD_0, (uint32_t)(addr & 0xffffffff));
218 addr += EFX_BUF_SIZE;
221 efx_mcdi_execute(enp, &req);
223 if (req.emr_rc != 0) {
228 if (req.emr_out_length_used < MC_CMD_INIT_EVQ_OUT_LEN) {
233 /* NOTE: ignore the returned IRQ param as firmware does not set it. */
246 EFSYS_PROBE1(fail1, efx_rc_t, rc);
252 static __checkReturn efx_rc_t
253 efx_mcdi_init_evq_v2(
255 __in unsigned int instance,
256 __in efsys_mem_t *esmp,
264 MAX(MC_CMD_INIT_EVQ_V2_IN_LEN(EFX_EVQ_NBUFS(EFX_EVQ_MAXNEVS)),
265 MC_CMD_INIT_EVQ_V2_OUT_LEN)];
266 boolean_t interrupting;
267 unsigned int evq_type;
268 efx_qword_t *dma_addr;
274 npages = EFX_EVQ_NBUFS(nevs);
275 if (MC_CMD_INIT_EVQ_V2_IN_LEN(npages) > MC_CMD_INIT_EVQ_V2_IN_LENMAX) {
280 (void) memset(payload, 0, sizeof (payload));
281 req.emr_cmd = MC_CMD_INIT_EVQ;
282 req.emr_in_buf = payload;
283 req.emr_in_length = MC_CMD_INIT_EVQ_V2_IN_LEN(npages);
284 req.emr_out_buf = payload;
285 req.emr_out_length = MC_CMD_INIT_EVQ_V2_OUT_LEN;
287 MCDI_IN_SET_DWORD(req, INIT_EVQ_V2_IN_SIZE, nevs);
288 MCDI_IN_SET_DWORD(req, INIT_EVQ_V2_IN_INSTANCE, instance);
289 MCDI_IN_SET_DWORD(req, INIT_EVQ_V2_IN_IRQ_NUM, irq);
291 interrupting = ((flags & EFX_EVQ_FLAGS_NOTIFY_MASK) ==
292 EFX_EVQ_FLAGS_NOTIFY_INTERRUPT);
294 switch (flags & EFX_EVQ_FLAGS_TYPE_MASK) {
295 case EFX_EVQ_FLAGS_TYPE_AUTO:
296 evq_type = MC_CMD_INIT_EVQ_V2_IN_FLAG_TYPE_AUTO;
298 case EFX_EVQ_FLAGS_TYPE_THROUGHPUT:
299 evq_type = MC_CMD_INIT_EVQ_V2_IN_FLAG_TYPE_THROUGHPUT;
301 case EFX_EVQ_FLAGS_TYPE_LOW_LATENCY:
302 evq_type = MC_CMD_INIT_EVQ_V2_IN_FLAG_TYPE_LOW_LATENCY;
308 MCDI_IN_POPULATE_DWORD_4(req, INIT_EVQ_V2_IN_FLAGS,
309 INIT_EVQ_V2_IN_FLAG_INTERRUPTING, interrupting,
310 INIT_EVQ_V2_IN_FLAG_RPTR_DOS, 0,
311 INIT_EVQ_V2_IN_FLAG_INT_ARMD, 0,
312 INIT_EVQ_V2_IN_FLAG_TYPE, evq_type);
314 /* If the value is zero then disable the timer */
316 MCDI_IN_SET_DWORD(req, INIT_EVQ_V2_IN_TMR_MODE,
317 MC_CMD_INIT_EVQ_V2_IN_TMR_MODE_DIS);
318 MCDI_IN_SET_DWORD(req, INIT_EVQ_V2_IN_TMR_LOAD, 0);
319 MCDI_IN_SET_DWORD(req, INIT_EVQ_V2_IN_TMR_RELOAD, 0);
323 if ((rc = efx_ev_usecs_to_ticks(enp, us, &ticks)) != 0)
326 MCDI_IN_SET_DWORD(req, INIT_EVQ_V2_IN_TMR_MODE,
327 MC_CMD_INIT_EVQ_V2_IN_TMR_INT_HLDOFF);
328 MCDI_IN_SET_DWORD(req, INIT_EVQ_V2_IN_TMR_LOAD, ticks);
329 MCDI_IN_SET_DWORD(req, INIT_EVQ_V2_IN_TMR_RELOAD, ticks);
332 MCDI_IN_SET_DWORD(req, INIT_EVQ_V2_IN_COUNT_MODE,
333 MC_CMD_INIT_EVQ_V2_IN_COUNT_MODE_DIS);
334 MCDI_IN_SET_DWORD(req, INIT_EVQ_V2_IN_COUNT_THRSHLD, 0);
336 dma_addr = MCDI_IN2(req, efx_qword_t, INIT_EVQ_V2_IN_DMA_ADDR);
337 addr = EFSYS_MEM_ADDR(esmp);
339 for (i = 0; i < npages; i++) {
340 EFX_POPULATE_QWORD_2(*dma_addr,
341 EFX_DWORD_1, (uint32_t)(addr >> 32),
342 EFX_DWORD_0, (uint32_t)(addr & 0xffffffff));
345 addr += EFX_BUF_SIZE;
348 efx_mcdi_execute(enp, &req);
350 if (req.emr_rc != 0) {
355 if (req.emr_out_length_used < MC_CMD_INIT_EVQ_V2_OUT_LEN) {
360 /* NOTE: ignore the returned IRQ param as firmware does not set it. */
362 EFSYS_PROBE1(mcdi_evq_flags, uint32_t,
363 MCDI_OUT_DWORD(req, INIT_EVQ_V2_OUT_FLAGS));
376 EFSYS_PROBE1(fail1, efx_rc_t, rc);
381 static __checkReturn efx_rc_t
384 __in uint32_t instance)
387 uint8_t payload[MAX(MC_CMD_FINI_EVQ_IN_LEN,
388 MC_CMD_FINI_EVQ_OUT_LEN)];
391 (void) memset(payload, 0, sizeof (payload));
392 req.emr_cmd = MC_CMD_FINI_EVQ;
393 req.emr_in_buf = payload;
394 req.emr_in_length = MC_CMD_FINI_EVQ_IN_LEN;
395 req.emr_out_buf = payload;
396 req.emr_out_length = MC_CMD_FINI_EVQ_OUT_LEN;
398 MCDI_IN_SET_DWORD(req, FINI_EVQ_IN_INSTANCE, instance);
400 efx_mcdi_execute_quiet(enp, &req);
402 if (req.emr_rc != 0) {
411 * EALREADY is not an error, but indicates that the MC has rebooted and
412 * that the EVQ has already been destroyed.
415 EFSYS_PROBE1(fail1, efx_rc_t, rc);
422 __checkReturn efx_rc_t
426 _NOTE(ARGUNUSED(enp))
434 _NOTE(ARGUNUSED(enp))
437 __checkReturn efx_rc_t
440 __in unsigned int index,
441 __in efsys_mem_t *esmp,
448 efx_nic_cfg_t *encp = &(enp->en_nic_cfg);
452 _NOTE(ARGUNUSED(id)) /* buftbl id managed by MC */
453 EFX_STATIC_ASSERT(ISP2(EFX_EVQ_MAXNEVS));
454 EFX_STATIC_ASSERT(ISP2(EFX_EVQ_MINNEVS));
457 (ndescs < EFX_EVQ_MINNEVS) || (ndescs > EFX_EVQ_MAXNEVS)) {
462 if (index >= encp->enc_evq_limit) {
467 if (us > encp->enc_evq_timer_max_us) {
472 /* Set up the handler table */
473 eep->ee_rx = ef10_ev_rx;
474 eep->ee_tx = ef10_ev_tx;
475 eep->ee_driver = ef10_ev_driver;
476 eep->ee_drv_gen = ef10_ev_drv_gen;
477 eep->ee_mcdi = ef10_ev_mcdi;
479 /* Set up the event queue */
480 /* INIT_EVQ expects function-relative vector number */
481 if ((flags & EFX_EVQ_FLAGS_NOTIFY_MASK) ==
482 EFX_EVQ_FLAGS_NOTIFY_INTERRUPT) {
484 } else if (index == EFX_EF10_ALWAYS_INTERRUPTING_EVQ_INDEX) {
486 flags = (flags & ~EFX_EVQ_FLAGS_NOTIFY_MASK) |
487 EFX_EVQ_FLAGS_NOTIFY_INTERRUPT;
489 irq = EFX_EF10_ALWAYS_INTERRUPTING_EVQ_INDEX;
493 * Interrupts may be raised for events immediately after the queue is
494 * created. See bug58606.
497 if (encp->enc_init_evq_v2_supported) {
499 * On Medford the low latency license is required to enable RX
500 * and event cut through and to disable RX batching. If event
501 * queue type in flags is auto, we let the firmware decide the
502 * settings to use. If the adapter has a low latency license,
503 * it will choose the best settings for low latency, otherwise
504 * it will choose the best settings for throughput.
506 rc = efx_mcdi_init_evq_v2(enp, index, esmp, ndescs, irq, us,
512 * On Huntington we need to specify the settings to use.
513 * If event queue type in flags is auto, we favour throughput
514 * if the adapter is running virtualization supporting firmware
515 * (i.e. the full featured firmware variant)
516 * and latency otherwise. The Ethernet Virtual Bridging
517 * capability is used to make this decision. (Note though that
518 * the low latency firmware variant is also best for
519 * throughput and corresponding type should be specified
522 boolean_t low_latency = encp->enc_datapath_cap_evb ? 0 : 1;
523 rc = efx_mcdi_init_evq(enp, index, esmp, ndescs, irq, us, flags,
540 EFSYS_PROBE1(fail1, efx_rc_t, rc);
549 efx_nic_t *enp = eep->ee_enp;
551 EFSYS_ASSERT(enp->en_family == EFX_FAMILY_HUNTINGTON ||
552 enp->en_family == EFX_FAMILY_MEDFORD);
554 (void) efx_mcdi_fini_evq(enp, eep->ee_index);
557 __checkReturn efx_rc_t
560 __in unsigned int count)
562 efx_nic_t *enp = eep->ee_enp;
566 rptr = count & eep->ee_mask;
568 if (enp->en_nic_cfg.enc_bug35388_workaround) {
569 EFX_STATIC_ASSERT(EFX_EVQ_MINNEVS >
570 (1 << ERF_DD_EVQ_IND_RPTR_WIDTH));
571 EFX_STATIC_ASSERT(EFX_EVQ_MAXNEVS <
572 (1 << 2 * ERF_DD_EVQ_IND_RPTR_WIDTH));
574 EFX_POPULATE_DWORD_2(dword,
575 ERF_DD_EVQ_IND_RPTR_FLAGS,
576 EFE_DD_EVQ_IND_RPTR_FLAGS_HIGH,
578 (rptr >> ERF_DD_EVQ_IND_RPTR_WIDTH));
579 EFX_BAR_TBL_WRITED(enp, ER_DD_EVQ_INDIRECT, eep->ee_index,
582 EFX_POPULATE_DWORD_2(dword,
583 ERF_DD_EVQ_IND_RPTR_FLAGS,
584 EFE_DD_EVQ_IND_RPTR_FLAGS_LOW,
586 rptr & ((1 << ERF_DD_EVQ_IND_RPTR_WIDTH) - 1));
587 EFX_BAR_TBL_WRITED(enp, ER_DD_EVQ_INDIRECT, eep->ee_index,
590 EFX_POPULATE_DWORD_1(dword, ERF_DZ_EVQ_RPTR, rptr);
591 EFX_BAR_TBL_WRITED(enp, ER_DZ_EVQ_RPTR_REG, eep->ee_index,
598 static __checkReturn efx_rc_t
599 efx_mcdi_driver_event(
602 __in efx_qword_t data)
605 uint8_t payload[MAX(MC_CMD_DRIVER_EVENT_IN_LEN,
606 MC_CMD_DRIVER_EVENT_OUT_LEN)];
609 req.emr_cmd = MC_CMD_DRIVER_EVENT;
610 req.emr_in_buf = payload;
611 req.emr_in_length = MC_CMD_DRIVER_EVENT_IN_LEN;
612 req.emr_out_buf = payload;
613 req.emr_out_length = MC_CMD_DRIVER_EVENT_OUT_LEN;
615 MCDI_IN_SET_DWORD(req, DRIVER_EVENT_IN_EVQ, evq);
617 MCDI_IN_SET_DWORD(req, DRIVER_EVENT_IN_DATA_LO,
618 EFX_QWORD_FIELD(data, EFX_DWORD_0));
619 MCDI_IN_SET_DWORD(req, DRIVER_EVENT_IN_DATA_HI,
620 EFX_QWORD_FIELD(data, EFX_DWORD_1));
622 efx_mcdi_execute(enp, &req);
624 if (req.emr_rc != 0) {
632 EFSYS_PROBE1(fail1, efx_rc_t, rc);
642 efx_nic_t *enp = eep->ee_enp;
645 EFX_POPULATE_QWORD_3(event,
646 ESF_DZ_DRV_CODE, ESE_DZ_EV_CODE_DRV_GEN_EV,
647 ESF_DZ_DRV_SUB_CODE, 0,
648 ESF_DZ_DRV_SUB_DATA_DW0, (uint32_t)data);
650 (void) efx_mcdi_driver_event(enp, eep->ee_index, event);
653 __checkReturn efx_rc_t
656 __in unsigned int us)
658 efx_nic_t *enp = eep->ee_enp;
659 efx_nic_cfg_t *encp = &(enp->en_nic_cfg);
664 /* Check that hardware and MCDI use the same timer MODE values */
665 EFX_STATIC_ASSERT(FFE_CZ_TIMER_MODE_DIS ==
666 MC_CMD_SET_EVQ_TMR_IN_TIMER_MODE_DIS);
667 EFX_STATIC_ASSERT(FFE_CZ_TIMER_MODE_IMMED_START ==
668 MC_CMD_SET_EVQ_TMR_IN_TIMER_MODE_IMMED_START);
669 EFX_STATIC_ASSERT(FFE_CZ_TIMER_MODE_TRIG_START ==
670 MC_CMD_SET_EVQ_TMR_IN_TIMER_MODE_TRIG_START);
671 EFX_STATIC_ASSERT(FFE_CZ_TIMER_MODE_INT_HLDOFF ==
672 MC_CMD_SET_EVQ_TMR_IN_TIMER_MODE_INT_HLDOFF);
674 if (us > encp->enc_evq_timer_max_us) {
679 /* If the value is zero then disable the timer */
681 mode = FFE_CZ_TIMER_MODE_DIS;
683 mode = FFE_CZ_TIMER_MODE_INT_HLDOFF;
686 if (encp->enc_bug61265_workaround) {
687 uint32_t ns = us * 1000;
689 rc = efx_mcdi_set_evq_tmr(enp, eep->ee_index, mode, ns);
695 if ((rc = efx_ev_usecs_to_ticks(enp, us, &ticks)) != 0)
698 if (encp->enc_bug35388_workaround) {
699 EFX_POPULATE_DWORD_3(dword,
700 ERF_DD_EVQ_IND_TIMER_FLAGS,
701 EFE_DD_EVQ_IND_TIMER_FLAGS,
702 ERF_DD_EVQ_IND_TIMER_MODE, mode,
703 ERF_DD_EVQ_IND_TIMER_VAL, ticks);
704 EFX_BAR_TBL_WRITED(enp, ER_DD_EVQ_INDIRECT,
705 eep->ee_index, &dword, 0);
707 EFX_POPULATE_DWORD_2(dword,
708 ERF_DZ_TC_TIMER_MODE, mode,
709 ERF_DZ_TC_TIMER_VAL, ticks);
710 EFX_BAR_TBL_WRITED(enp, ER_DZ_EVQ_TMR_REG,
711 eep->ee_index, &dword, 0);
722 EFSYS_PROBE1(fail1, efx_rc_t, rc);
730 ef10_ev_qstats_update(
732 __inout_ecount(EV_NQSTATS) efsys_stat_t *stat)
736 for (id = 0; id < EV_NQSTATS; id++) {
737 efsys_stat_t *essp = &stat[id];
739 EFSYS_STAT_INCR(essp, eep->ee_stat[id]);
740 eep->ee_stat[id] = 0;
743 #endif /* EFSYS_OPT_QSTATS */
745 #if EFSYS_OPT_RX_PACKED_STREAM
747 static __checkReturn boolean_t
748 ef10_ev_rx_packed_stream(
750 __in efx_qword_t *eqp,
751 __in const efx_ev_callbacks_t *eecp,
755 uint32_t pkt_count_lbits;
757 boolean_t should_abort;
758 efx_evq_rxq_state_t *eersp;
759 unsigned int pkt_count;
760 unsigned int current_id;
761 boolean_t new_buffer;
763 pkt_count_lbits = EFX_QWORD_FIELD(*eqp, ESF_DZ_RX_DSC_PTR_LBITS);
764 label = EFX_QWORD_FIELD(*eqp, ESF_DZ_RX_QLABEL);
765 new_buffer = EFX_QWORD_FIELD(*eqp, ESF_DZ_RX_EV_ROTATE);
769 eersp = &eep->ee_rxq_state[label];
772 * RX_DSC_PTR_LBITS has least significant bits of the global
773 * (not per-buffer) packet counter. It is guaranteed that
774 * maximum number of completed packets fits in lbits-mask.
775 * So, modulo lbits-mask arithmetic should be used to calculate
776 * packet counter increment.
778 pkt_count = (pkt_count_lbits - eersp->eers_rx_stream_npackets) &
779 EFX_MASK32(ESF_DZ_RX_DSC_PTR_LBITS);
780 eersp->eers_rx_stream_npackets += pkt_count;
783 flags |= EFX_PKT_PACKED_STREAM_NEW_BUFFER;
784 eersp->eers_rx_packed_stream_credits++;
785 eersp->eers_rx_read_ptr++;
787 current_id = eersp->eers_rx_read_ptr & eersp->eers_rx_mask;
789 /* Check for errors that invalidate checksum and L3/L4 fields */
790 if (EFX_QWORD_FIELD(*eqp, ESF_DZ_RX_ECC_ERR) != 0) {
791 /* RX frame truncated (error flag is misnamed) */
792 EFX_EV_QSTAT_INCR(eep, EV_RX_FRM_TRUNC);
793 flags |= EFX_DISCARD;
796 if (EFX_QWORD_FIELD(*eqp, ESF_DZ_RX_ECRC_ERR) != 0) {
797 /* Bad Ethernet frame CRC */
798 EFX_EV_QSTAT_INCR(eep, EV_RX_ETH_CRC_ERR);
799 flags |= EFX_DISCARD;
803 if (EFX_QWORD_FIELD(*eqp, ESF_DZ_RX_PARSE_INCOMPLETE)) {
804 flags |= EFX_PKT_PACKED_STREAM_PARSE_INCOMPLETE;
808 if (EFX_QWORD_FIELD(*eqp, ESF_DZ_RX_IPCKSUM_ERR))
809 EFX_EV_QSTAT_INCR(eep, EV_RX_IPV4_HDR_CHKSUM_ERR);
811 if (EFX_QWORD_FIELD(*eqp, ESF_DZ_RX_TCPUDP_CKSUM_ERR))
812 EFX_EV_QSTAT_INCR(eep, EV_RX_TCP_UDP_CHKSUM_ERR);
815 /* If we're not discarding the packet then it is ok */
816 if (~flags & EFX_DISCARD)
817 EFX_EV_QSTAT_INCR(eep, EV_RX_OK);
819 EFSYS_ASSERT(eecp->eec_rx_ps != NULL);
820 should_abort = eecp->eec_rx_ps(arg, label, current_id, pkt_count,
823 return (should_abort);
826 #endif /* EFSYS_OPT_RX_PACKED_STREAM */
828 static __checkReturn boolean_t
831 __in efx_qword_t *eqp,
832 __in const efx_ev_callbacks_t *eecp,
835 efx_nic_t *enp = eep->ee_enp;
839 uint32_t eth_tag_class;
842 uint32_t next_read_lbits;
845 boolean_t should_abort;
846 efx_evq_rxq_state_t *eersp;
847 unsigned int desc_count;
848 unsigned int last_used_id;
850 EFX_EV_QSTAT_INCR(eep, EV_RX);
852 /* Discard events after RXQ/TXQ errors */
853 if (enp->en_reset_flags & (EFX_RESET_RXQ_ERR | EFX_RESET_TXQ_ERR))
856 /* Basic packet information */
857 label = EFX_QWORD_FIELD(*eqp, ESF_DZ_RX_QLABEL);
858 eersp = &eep->ee_rxq_state[label];
860 #if EFSYS_OPT_RX_PACKED_STREAM
862 * Packed stream events are very different,
863 * so handle them separately
865 if (eersp->eers_rx_packed_stream)
866 return (ef10_ev_rx_packed_stream(eep, eqp, eecp, arg));
869 size = EFX_QWORD_FIELD(*eqp, ESF_DZ_RX_BYTES);
870 next_read_lbits = EFX_QWORD_FIELD(*eqp, ESF_DZ_RX_DSC_PTR_LBITS);
871 eth_tag_class = EFX_QWORD_FIELD(*eqp, ESF_DZ_RX_ETH_TAG_CLASS);
872 mac_class = EFX_QWORD_FIELD(*eqp, ESF_DZ_RX_MAC_CLASS);
873 l3_class = EFX_QWORD_FIELD(*eqp, ESF_DZ_RX_L3_CLASS);
874 l4_class = EFX_QWORD_FIELD(*eqp, ESF_DZ_RX_L4_CLASS);
875 cont = EFX_QWORD_FIELD(*eqp, ESF_DZ_RX_CONT);
877 if (EFX_QWORD_FIELD(*eqp, ESF_DZ_RX_DROP_EVENT) != 0) {
878 /* Drop this event */
885 * This may be part of a scattered frame, or it may be a
886 * truncated frame if scatter is disabled on this RXQ.
887 * Overlength frames can be received if e.g. a VF is configured
888 * for 1500 MTU but connected to a port set to 9000 MTU
890 * FIXME: There is not yet any driver that supports scatter on
891 * Huntington. Scatter support is required for OSX.
893 flags |= EFX_PKT_CONT;
896 if (mac_class == ESE_DZ_MAC_CLASS_UCAST)
897 flags |= EFX_PKT_UNICAST;
899 /* Increment the count of descriptors read */
900 desc_count = (next_read_lbits - eersp->eers_rx_read_ptr) &
901 EFX_MASK32(ESF_DZ_RX_DSC_PTR_LBITS);
902 eersp->eers_rx_read_ptr += desc_count;
905 * FIXME: add error checking to make sure this is a batched event.
906 * This could also be an aborted scatter, see Bug36629.
908 if (desc_count > 1) {
909 EFX_EV_QSTAT_INCR(eep, EV_RX_BATCH);
910 flags |= EFX_PKT_PREFIX_LEN;
913 /* Calculate the index of the last descriptor consumed */
914 last_used_id = (eersp->eers_rx_read_ptr - 1) & eersp->eers_rx_mask;
916 /* Check for errors that invalidate checksum and L3/L4 fields */
917 if (EFX_QWORD_FIELD(*eqp, ESF_DZ_RX_ECC_ERR) != 0) {
918 /* RX frame truncated (error flag is misnamed) */
919 EFX_EV_QSTAT_INCR(eep, EV_RX_FRM_TRUNC);
920 flags |= EFX_DISCARD;
923 if (EFX_QWORD_FIELD(*eqp, ESF_DZ_RX_ECRC_ERR) != 0) {
924 /* Bad Ethernet frame CRC */
925 EFX_EV_QSTAT_INCR(eep, EV_RX_ETH_CRC_ERR);
926 flags |= EFX_DISCARD;
929 if (EFX_QWORD_FIELD(*eqp, ESF_DZ_RX_PARSE_INCOMPLETE)) {
931 * Hardware parse failed, due to malformed headers
932 * or headers that are too long for the parser.
933 * Headers and checksums must be validated by the host.
935 /* TODO: EFX_EV_QSTAT_INCR(eep, EV_RX_PARSE_INCOMPLETE); */
939 if ((eth_tag_class == ESE_DZ_ETH_TAG_CLASS_VLAN1) ||
940 (eth_tag_class == ESE_DZ_ETH_TAG_CLASS_VLAN2)) {
941 flags |= EFX_PKT_VLAN_TAGGED;
945 case ESE_DZ_L3_CLASS_IP4:
946 case ESE_DZ_L3_CLASS_IP4_FRAG:
947 flags |= EFX_PKT_IPV4;
948 if (EFX_QWORD_FIELD(*eqp, ESF_DZ_RX_IPCKSUM_ERR)) {
949 EFX_EV_QSTAT_INCR(eep, EV_RX_IPV4_HDR_CHKSUM_ERR);
951 flags |= EFX_CKSUM_IPV4;
954 if (l4_class == ESE_DZ_L4_CLASS_TCP) {
955 EFX_EV_QSTAT_INCR(eep, EV_RX_TCP_IPV4);
956 flags |= EFX_PKT_TCP;
957 } else if (l4_class == ESE_DZ_L4_CLASS_UDP) {
958 EFX_EV_QSTAT_INCR(eep, EV_RX_UDP_IPV4);
959 flags |= EFX_PKT_UDP;
961 EFX_EV_QSTAT_INCR(eep, EV_RX_OTHER_IPV4);
965 case ESE_DZ_L3_CLASS_IP6:
966 case ESE_DZ_L3_CLASS_IP6_FRAG:
967 flags |= EFX_PKT_IPV6;
969 if (l4_class == ESE_DZ_L4_CLASS_TCP) {
970 EFX_EV_QSTAT_INCR(eep, EV_RX_TCP_IPV6);
971 flags |= EFX_PKT_TCP;
972 } else if (l4_class == ESE_DZ_L4_CLASS_UDP) {
973 EFX_EV_QSTAT_INCR(eep, EV_RX_UDP_IPV6);
974 flags |= EFX_PKT_UDP;
976 EFX_EV_QSTAT_INCR(eep, EV_RX_OTHER_IPV6);
981 EFX_EV_QSTAT_INCR(eep, EV_RX_NON_IP);
985 if (flags & (EFX_PKT_TCP | EFX_PKT_UDP)) {
986 if (EFX_QWORD_FIELD(*eqp, ESF_DZ_RX_TCPUDP_CKSUM_ERR)) {
987 EFX_EV_QSTAT_INCR(eep, EV_RX_TCP_UDP_CHKSUM_ERR);
989 flags |= EFX_CKSUM_TCPUDP;
994 /* If we're not discarding the packet then it is ok */
995 if (~flags & EFX_DISCARD)
996 EFX_EV_QSTAT_INCR(eep, EV_RX_OK);
998 EFSYS_ASSERT(eecp->eec_rx != NULL);
999 should_abort = eecp->eec_rx(arg, label, last_used_id, size, flags);
1001 return (should_abort);
1004 static __checkReturn boolean_t
1006 __in efx_evq_t *eep,
1007 __in efx_qword_t *eqp,
1008 __in const efx_ev_callbacks_t *eecp,
1011 efx_nic_t *enp = eep->ee_enp;
1014 boolean_t should_abort;
1016 EFX_EV_QSTAT_INCR(eep, EV_TX);
1018 /* Discard events after RXQ/TXQ errors */
1019 if (enp->en_reset_flags & (EFX_RESET_RXQ_ERR | EFX_RESET_TXQ_ERR))
1022 if (EFX_QWORD_FIELD(*eqp, ESF_DZ_TX_DROP_EVENT) != 0) {
1023 /* Drop this event */
1027 /* Per-packet TX completion (was per-descriptor for Falcon/Siena) */
1028 id = EFX_QWORD_FIELD(*eqp, ESF_DZ_TX_DESCR_INDX);
1029 label = EFX_QWORD_FIELD(*eqp, ESF_DZ_TX_QLABEL);
1031 EFSYS_PROBE2(tx_complete, uint32_t, label, uint32_t, id);
1033 EFSYS_ASSERT(eecp->eec_tx != NULL);
1034 should_abort = eecp->eec_tx(arg, label, id);
1036 return (should_abort);
1039 static __checkReturn boolean_t
1041 __in efx_evq_t *eep,
1042 __in efx_qword_t *eqp,
1043 __in const efx_ev_callbacks_t *eecp,
1047 boolean_t should_abort;
1049 EFX_EV_QSTAT_INCR(eep, EV_DRIVER);
1050 should_abort = B_FALSE;
1052 code = EFX_QWORD_FIELD(*eqp, ESF_DZ_DRV_SUB_CODE);
1054 case ESE_DZ_DRV_TIMER_EV: {
1057 id = EFX_QWORD_FIELD(*eqp, ESF_DZ_DRV_TMR_ID);
1059 EFSYS_ASSERT(eecp->eec_timer != NULL);
1060 should_abort = eecp->eec_timer(arg, id);
1064 case ESE_DZ_DRV_WAKE_UP_EV: {
1067 id = EFX_QWORD_FIELD(*eqp, ESF_DZ_DRV_EVQ_ID);
1069 EFSYS_ASSERT(eecp->eec_wake_up != NULL);
1070 should_abort = eecp->eec_wake_up(arg, id);
1074 case ESE_DZ_DRV_START_UP_EV:
1075 EFSYS_ASSERT(eecp->eec_initialized != NULL);
1076 should_abort = eecp->eec_initialized(arg);
1080 EFSYS_PROBE3(bad_event, unsigned int, eep->ee_index,
1081 uint32_t, EFX_QWORD_FIELD(*eqp, EFX_DWORD_1),
1082 uint32_t, EFX_QWORD_FIELD(*eqp, EFX_DWORD_0));
1086 return (should_abort);
1089 static __checkReturn boolean_t
1091 __in efx_evq_t *eep,
1092 __in efx_qword_t *eqp,
1093 __in const efx_ev_callbacks_t *eecp,
1097 boolean_t should_abort;
1099 EFX_EV_QSTAT_INCR(eep, EV_DRV_GEN);
1100 should_abort = B_FALSE;
1102 data = EFX_QWORD_FIELD(*eqp, ESF_DZ_DRV_SUB_DATA_DW0);
1103 if (data >= ((uint32_t)1 << 16)) {
1104 EFSYS_PROBE3(bad_event, unsigned int, eep->ee_index,
1105 uint32_t, EFX_QWORD_FIELD(*eqp, EFX_DWORD_1),
1106 uint32_t, EFX_QWORD_FIELD(*eqp, EFX_DWORD_0));
1111 EFSYS_ASSERT(eecp->eec_software != NULL);
1112 should_abort = eecp->eec_software(arg, (uint16_t)data);
1114 return (should_abort);
1117 static __checkReturn boolean_t
1119 __in efx_evq_t *eep,
1120 __in efx_qword_t *eqp,
1121 __in const efx_ev_callbacks_t *eecp,
1124 efx_nic_t *enp = eep->ee_enp;
1126 boolean_t should_abort = B_FALSE;
1128 EFX_EV_QSTAT_INCR(eep, EV_MCDI_RESPONSE);
1130 code = EFX_QWORD_FIELD(*eqp, MCDI_EVENT_CODE);
1132 case MCDI_EVENT_CODE_BADSSERT:
1133 efx_mcdi_ev_death(enp, EINTR);
1136 case MCDI_EVENT_CODE_CMDDONE:
1137 efx_mcdi_ev_cpl(enp,
1138 MCDI_EV_FIELD(eqp, CMDDONE_SEQ),
1139 MCDI_EV_FIELD(eqp, CMDDONE_DATALEN),
1140 MCDI_EV_FIELD(eqp, CMDDONE_ERRNO));
1143 #if EFSYS_OPT_MCDI_PROXY_AUTH
1144 case MCDI_EVENT_CODE_PROXY_RESPONSE:
1146 * This event notifies a function that an authorization request
1147 * has been processed. If the request was authorized then the
1148 * function can now re-send the original MCDI request.
1149 * See SF-113652-SW "SR-IOV Proxied Network Access Control".
1151 efx_mcdi_ev_proxy_response(enp,
1152 MCDI_EV_FIELD(eqp, PROXY_RESPONSE_HANDLE),
1153 MCDI_EV_FIELD(eqp, PROXY_RESPONSE_RC));
1155 #endif /* EFSYS_OPT_MCDI_PROXY_AUTH */
1157 case MCDI_EVENT_CODE_LINKCHANGE: {
1158 efx_link_mode_t link_mode;
1160 ef10_phy_link_ev(enp, eqp, &link_mode);
1161 should_abort = eecp->eec_link_change(arg, link_mode);
1165 case MCDI_EVENT_CODE_SENSOREVT: {
1166 #if EFSYS_OPT_MON_STATS
1168 efx_mon_stat_value_t value;
1171 /* Decode monitor stat for MCDI sensor (if supported) */
1172 if ((rc = mcdi_mon_ev(enp, eqp, &id, &value)) == 0) {
1173 /* Report monitor stat change */
1174 should_abort = eecp->eec_monitor(arg, id, value);
1175 } else if (rc == ENOTSUP) {
1176 should_abort = eecp->eec_exception(arg,
1177 EFX_EXCEPTION_UNKNOWN_SENSOREVT,
1178 MCDI_EV_FIELD(eqp, DATA));
1180 EFSYS_ASSERT(rc == ENODEV); /* Wrong port */
1186 case MCDI_EVENT_CODE_SCHEDERR:
1187 /* Informational only */
1190 case MCDI_EVENT_CODE_REBOOT:
1191 /* Falcon/Siena only (should not be seen with Huntington). */
1192 efx_mcdi_ev_death(enp, EIO);
1195 case MCDI_EVENT_CODE_MC_REBOOT:
1196 /* MC_REBOOT event is used for Huntington (EF10) and later. */
1197 efx_mcdi_ev_death(enp, EIO);
1200 case MCDI_EVENT_CODE_MAC_STATS_DMA:
1201 #if EFSYS_OPT_MAC_STATS
1202 if (eecp->eec_mac_stats != NULL) {
1203 eecp->eec_mac_stats(arg,
1204 MCDI_EV_FIELD(eqp, MAC_STATS_DMA_GENERATION));
1209 case MCDI_EVENT_CODE_FWALERT: {
1210 uint32_t reason = MCDI_EV_FIELD(eqp, FWALERT_REASON);
1212 if (reason == MCDI_EVENT_FWALERT_REASON_SRAM_ACCESS)
1213 should_abort = eecp->eec_exception(arg,
1214 EFX_EXCEPTION_FWALERT_SRAM,
1215 MCDI_EV_FIELD(eqp, FWALERT_DATA));
1217 should_abort = eecp->eec_exception(arg,
1218 EFX_EXCEPTION_UNKNOWN_FWALERT,
1219 MCDI_EV_FIELD(eqp, DATA));
1223 case MCDI_EVENT_CODE_TX_ERR: {
1225 * After a TXQ error is detected, firmware sends a TX_ERR event.
1226 * This may be followed by TX completions (which we discard),
1227 * and then finally by a TX_FLUSH event. Firmware destroys the
1228 * TXQ automatically after sending the TX_FLUSH event.
1230 enp->en_reset_flags |= EFX_RESET_TXQ_ERR;
1232 EFSYS_PROBE2(tx_descq_err,
1233 uint32_t, EFX_QWORD_FIELD(*eqp, EFX_DWORD_1),
1234 uint32_t, EFX_QWORD_FIELD(*eqp, EFX_DWORD_0));
1236 /* Inform the driver that a reset is required. */
1237 eecp->eec_exception(arg, EFX_EXCEPTION_TX_ERROR,
1238 MCDI_EV_FIELD(eqp, TX_ERR_DATA));
1242 case MCDI_EVENT_CODE_TX_FLUSH: {
1243 uint32_t txq_index = MCDI_EV_FIELD(eqp, TX_FLUSH_TXQ);
1246 * EF10 firmware sends two TX_FLUSH events: one to the txq's
1247 * event queue, and one to evq 0 (with TX_FLUSH_TO_DRIVER set).
1248 * We want to wait for all completions, so ignore the events
1249 * with TX_FLUSH_TO_DRIVER.
1251 if (MCDI_EV_FIELD(eqp, TX_FLUSH_TO_DRIVER) != 0) {
1252 should_abort = B_FALSE;
1256 EFX_EV_QSTAT_INCR(eep, EV_DRIVER_TX_DESCQ_FLS_DONE);
1258 EFSYS_PROBE1(tx_descq_fls_done, uint32_t, txq_index);
1260 EFSYS_ASSERT(eecp->eec_txq_flush_done != NULL);
1261 should_abort = eecp->eec_txq_flush_done(arg, txq_index);
1265 case MCDI_EVENT_CODE_RX_ERR: {
1267 * After an RXQ error is detected, firmware sends an RX_ERR
1268 * event. This may be followed by RX events (which we discard),
1269 * and then finally by an RX_FLUSH event. Firmware destroys the
1270 * RXQ automatically after sending the RX_FLUSH event.
1272 enp->en_reset_flags |= EFX_RESET_RXQ_ERR;
1274 EFSYS_PROBE2(rx_descq_err,
1275 uint32_t, EFX_QWORD_FIELD(*eqp, EFX_DWORD_1),
1276 uint32_t, EFX_QWORD_FIELD(*eqp, EFX_DWORD_0));
1278 /* Inform the driver that a reset is required. */
1279 eecp->eec_exception(arg, EFX_EXCEPTION_RX_ERROR,
1280 MCDI_EV_FIELD(eqp, RX_ERR_DATA));
1284 case MCDI_EVENT_CODE_RX_FLUSH: {
1285 uint32_t rxq_index = MCDI_EV_FIELD(eqp, RX_FLUSH_RXQ);
1288 * EF10 firmware sends two RX_FLUSH events: one to the rxq's
1289 * event queue, and one to evq 0 (with RX_FLUSH_TO_DRIVER set).
1290 * We want to wait for all completions, so ignore the events
1291 * with RX_FLUSH_TO_DRIVER.
1293 if (MCDI_EV_FIELD(eqp, RX_FLUSH_TO_DRIVER) != 0) {
1294 should_abort = B_FALSE;
1298 EFX_EV_QSTAT_INCR(eep, EV_DRIVER_RX_DESCQ_FLS_DONE);
1300 EFSYS_PROBE1(rx_descq_fls_done, uint32_t, rxq_index);
1302 EFSYS_ASSERT(eecp->eec_rxq_flush_done != NULL);
1303 should_abort = eecp->eec_rxq_flush_done(arg, rxq_index);
1308 EFSYS_PROBE3(bad_event, unsigned int, eep->ee_index,
1309 uint32_t, EFX_QWORD_FIELD(*eqp, EFX_DWORD_1),
1310 uint32_t, EFX_QWORD_FIELD(*eqp, EFX_DWORD_0));
1314 return (should_abort);
1318 ef10_ev_rxlabel_init(
1319 __in efx_evq_t *eep,
1320 __in efx_rxq_t *erp,
1321 __in unsigned int label,
1322 __in efx_rxq_type_t type)
1324 efx_evq_rxq_state_t *eersp;
1325 #if EFSYS_OPT_RX_PACKED_STREAM
1326 boolean_t packed_stream = (type == EFX_RXQ_TYPE_PACKED_STREAM);
1329 _NOTE(ARGUNUSED(type))
1330 EFSYS_ASSERT3U(label, <, EFX_ARRAY_SIZE(eep->ee_rxq_state));
1331 eersp = &eep->ee_rxq_state[label];
1333 EFSYS_ASSERT3U(eersp->eers_rx_mask, ==, 0);
1335 #if EFSYS_OPT_RX_PACKED_STREAM
1337 * For packed stream modes, the very first event will
1338 * have a new buffer flag set, so it will be incremented,
1339 * yielding the correct pointer. That results in simpler
1340 * code than trying to detect start-of-the-world condition
1341 * in the event handler.
1343 eersp->eers_rx_read_ptr = packed_stream ? ~0 : 0;
1345 eersp->eers_rx_read_ptr = 0;
1347 eersp->eers_rx_mask = erp->er_mask;
1348 #if EFSYS_OPT_RX_PACKED_STREAM
1349 eersp->eers_rx_stream_npackets = 0;
1350 eersp->eers_rx_packed_stream = packed_stream;
1351 if (packed_stream) {
1352 eersp->eers_rx_packed_stream_credits = (eep->ee_mask + 1) /
1353 EFX_DIV_ROUND_UP(EFX_RX_PACKED_STREAM_MEM_PER_CREDIT,
1354 EFX_RX_PACKED_STREAM_MIN_PACKET_SPACE);
1355 EFSYS_ASSERT3U(eersp->eers_rx_packed_stream_credits, !=, 0);
1357 * A single credit is allocated to the queue when it is started.
1358 * It is immediately spent by the first packet which has NEW
1359 * BUFFER flag set, though, but still we shall take into
1360 * account, as to not wrap around the maximum number of credits
1363 eersp->eers_rx_packed_stream_credits--;
1364 EFSYS_ASSERT3U(eersp->eers_rx_packed_stream_credits, <=,
1365 EFX_RX_PACKED_STREAM_MAX_CREDITS);
1371 ef10_ev_rxlabel_fini(
1372 __in efx_evq_t *eep,
1373 __in unsigned int label)
1375 efx_evq_rxq_state_t *eersp;
1377 EFSYS_ASSERT3U(label, <, EFX_ARRAY_SIZE(eep->ee_rxq_state));
1378 eersp = &eep->ee_rxq_state[label];
1380 EFSYS_ASSERT3U(eersp->eers_rx_mask, !=, 0);
1382 eersp->eers_rx_read_ptr = 0;
1383 eersp->eers_rx_mask = 0;
1384 #if EFSYS_OPT_RX_PACKED_STREAM
1385 eersp->eers_rx_stream_npackets = 0;
1386 eersp->eers_rx_packed_stream = B_FALSE;
1387 eersp->eers_rx_packed_stream_credits = 0;
1391 #endif /* EFSYS_OPT_HUNTINGTON || EFSYS_OPT_MEDFORD */