1 /* SPDX-License-Identifier: BSD-3-Clause
2 * Copyright 2008-2017 Cisco Systems, Inc. All rights reserved.
3 * Copyright 2007 Nuova Systems, Inc. All rights reserved.
13 #include <rte_bus_pci.h>
14 #include <rte_memzone.h>
15 #include <rte_malloc.h>
17 #include <rte_string_fns.h>
18 #include <rte_ethdev_driver.h>
20 #include "enic_compat.h"
22 #include "wq_enet_desc.h"
23 #include "rq_enet_desc.h"
24 #include "cq_enet_desc.h"
25 #include "vnic_enet.h"
30 #include "vnic_intr.h"
33 static inline int enic_is_sriov_vf(struct enic *enic)
35 return enic->pdev->id.device_id == PCI_DEVICE_ID_CISCO_VIC_ENET_VF;
38 static int is_zero_addr(uint8_t *addr)
40 return !(addr[0] | addr[1] | addr[2] | addr[3] | addr[4] | addr[5]);
43 static int is_mcast_addr(uint8_t *addr)
48 static int is_eth_addr_valid(uint8_t *addr)
50 return !is_mcast_addr(addr) && !is_zero_addr(addr);
54 enic_rxmbuf_queue_release(__rte_unused struct enic *enic, struct vnic_rq *rq)
58 if (!rq || !rq->mbuf_ring) {
59 dev_debug(enic, "Pointer to rq or mbuf_ring is NULL");
63 for (i = 0; i < rq->ring.desc_count; i++) {
64 if (rq->mbuf_ring[i]) {
65 rte_pktmbuf_free_seg(rq->mbuf_ring[i]);
66 rq->mbuf_ring[i] = NULL;
71 static void enic_free_wq_buf(struct rte_mbuf **buf)
73 struct rte_mbuf *mbuf = *buf;
75 rte_pktmbuf_free_seg(mbuf);
79 static void enic_log_q_error(struct enic *enic)
84 for (i = 0; i < enic->wq_count; i++) {
85 error_status = vnic_wq_error_status(&enic->wq[i]);
87 dev_err(enic, "WQ[%d] error_status %d\n", i,
91 for (i = 0; i < enic_vnic_rq_count(enic); i++) {
92 if (!enic->rq[i].in_use)
94 error_status = vnic_rq_error_status(&enic->rq[i]);
96 dev_err(enic, "RQ[%d] error_status %d\n", i,
101 static void enic_clear_soft_stats(struct enic *enic)
103 struct enic_soft_stats *soft_stats = &enic->soft_stats;
104 rte_atomic64_clear(&soft_stats->rx_nombuf);
105 rte_atomic64_clear(&soft_stats->rx_packet_errors);
106 rte_atomic64_clear(&soft_stats->tx_oversized);
109 static void enic_init_soft_stats(struct enic *enic)
111 struct enic_soft_stats *soft_stats = &enic->soft_stats;
112 rte_atomic64_init(&soft_stats->rx_nombuf);
113 rte_atomic64_init(&soft_stats->rx_packet_errors);
114 rte_atomic64_init(&soft_stats->tx_oversized);
115 enic_clear_soft_stats(enic);
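/*
 * Note (illustrative, not part of the driver): these soft counters are
 * rte_atomic64_t values, so the fast-path code in enic_rxtx.c can bump
 * them without extra locking, e.g. on an mbuf allocation failure it
 * would do something along the lines of:
 *
 *	rte_atomic64_inc(&enic->soft_stats.rx_nombuf);
 *
 * enic_dev_stats_get() below folds them into the rte_eth_stats counters.
 */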
118 void enic_dev_stats_clear(struct enic *enic)
120 if (vnic_dev_stats_clear(enic->vdev))
121 dev_err(enic, "Error in clearing stats\n");
122 enic_clear_soft_stats(enic);
125 int enic_dev_stats_get(struct enic *enic, struct rte_eth_stats *r_stats)
127 struct vnic_stats *stats;
128 struct enic_soft_stats *soft_stats = &enic->soft_stats;
129 int64_t rx_truncated;
130 uint64_t rx_packet_errors;
131 int ret = vnic_dev_stats_dump(enic->vdev, &stats);
134 dev_err(enic, "Error in getting stats\n");
138 /* The number of truncated packets can only be calculated by
139 * subtracting a hardware counter from error packets received by
140 * the driver. Note: this causes transient inaccuracies in the
	 * ipackets count. Also, the lengths of truncated packets are
	 * counted in ibytes even though truncated packets are dropped,
	 * which can make ibytes slightly higher than it should be.
	 */
145 rx_packet_errors = rte_atomic64_read(&soft_stats->rx_packet_errors);
146 rx_truncated = rx_packet_errors - stats->rx.rx_errors;
148 r_stats->ipackets = stats->rx.rx_frames_ok - rx_truncated;
149 r_stats->opackets = stats->tx.tx_frames_ok;
151 r_stats->ibytes = stats->rx.rx_bytes_ok;
152 r_stats->obytes = stats->tx.tx_bytes_ok;
154 r_stats->ierrors = stats->rx.rx_errors + stats->rx.rx_drop;
155 r_stats->oerrors = stats->tx.tx_errors
156 + rte_atomic64_read(&soft_stats->tx_oversized);
158 r_stats->imissed = stats->rx.rx_no_bufs + rx_truncated;
160 r_stats->rx_nombuf = rte_atomic64_read(&soft_stats->rx_nombuf);
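/*
 * Usage sketch (application side, not part of the driver): the counters
 * assembled above surface through the standard ethdev stats API, e.g.
 *
 *	struct rte_eth_stats stats;
 *
 *	if (rte_eth_stats_get(port_id, &stats) == 0)
 *		printf("imissed=%" PRIu64 "\n", stats.imissed);
 *
 * where imissed includes both the rx_no_bufs hardware counter and the
 * truncated-packet estimate computed above.
 */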
164 int enic_del_mac_address(struct enic *enic, int mac_index)
166 struct rte_eth_dev *eth_dev = enic->rte_dev;
167 uint8_t *mac_addr = eth_dev->data->mac_addrs[mac_index].addr_bytes;
169 return vnic_dev_del_addr(enic->vdev, mac_addr);
172 int enic_set_mac_address(struct enic *enic, uint8_t *mac_addr)
176 if (!is_eth_addr_valid(mac_addr)) {
177 dev_err(enic, "invalid mac address\n");
181 err = vnic_dev_add_addr(enic->vdev, mac_addr);
183 dev_err(enic, "add mac addr failed\n");
188 enic_free_rq_buf(struct rte_mbuf **mbuf)
193 rte_pktmbuf_free(*mbuf);
197 void enic_init_vnic_resources(struct enic *enic)
199 unsigned int error_interrupt_enable = 1;
200 unsigned int error_interrupt_offset = 0;
201 unsigned int rxq_interrupt_enable = 0;
202 unsigned int rxq_interrupt_offset = ENICPMD_RXQ_INTR_OFFSET;
203 unsigned int index = 0;
205 struct vnic_rq *data_rq;
207 if (enic->rte_dev->data->dev_conf.intr_conf.rxq)
208 rxq_interrupt_enable = 1;
210 for (index = 0; index < enic->rq_count; index++) {
211 cq_idx = enic_cq_rq(enic, enic_rte_rq_idx_to_sop_idx(index));
213 vnic_rq_init(&enic->rq[enic_rte_rq_idx_to_sop_idx(index)],
			cq_idx,
			error_interrupt_enable,
216 error_interrupt_offset);
218 data_rq = &enic->rq[enic_rte_rq_idx_to_data_idx(index)];
220 vnic_rq_init(data_rq,
				     cq_idx,
				     error_interrupt_enable,
223 error_interrupt_offset);
225 vnic_cq_init(&enic->cq[cq_idx],
226 0 /* flow_control_enable */,
227 1 /* color_enable */,
230 1 /* cq_tail_color */,
231 rxq_interrupt_enable,
232 1 /* cq_entry_enable */,
233 0 /* cq_message_enable */,
234 rxq_interrupt_offset,
235 0 /* cq_message_addr */);
236 if (rxq_interrupt_enable)
237 rxq_interrupt_offset++;
240 for (index = 0; index < enic->wq_count; index++) {
241 vnic_wq_init(&enic->wq[index],
242 enic_cq_wq(enic, index),
243 error_interrupt_enable,
244 error_interrupt_offset);
245 /* Compute unsupported ol flags for enic_prep_pkts() */
246 enic->wq[index].tx_offload_notsup_mask =
247 PKT_TX_OFFLOAD_MASK ^ enic->tx_offload_mask;
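		/*
		 * Assuming tx_offload_mask only contains bits from
		 * PKT_TX_OFFLOAD_MASK, the XOR above leaves set exactly the
		 * mbuf ol_flags bits this adapter does not support, which is
		 * what enic_prep_pkts() checks offending packets against.
		 */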
249 cq_idx = enic_cq_wq(enic, index);
250 vnic_cq_init(&enic->cq[cq_idx],
251 0 /* flow_control_enable */,
252 1 /* color_enable */,
255 1 /* cq_tail_color */,
256 0 /* interrupt_enable */,
257 0 /* cq_entry_enable */,
258 1 /* cq_message_enable */,
259 0 /* interrupt offset */,
260 (u64)enic->wq[index].cqmsg_rz->iova);
263 for (index = 0; index < enic->intr_count; index++) {
264 vnic_intr_init(&enic->intr[index],
265 enic->config.intr_timer_usec,
266 enic->config.intr_timer_type,
267 /*mask_on_assertion*/1);
273 enic_alloc_rx_queue_mbufs(struct enic *enic, struct vnic_rq *rq)
276 struct rq_enet_desc *rqd = rq->ring.descs;
279 uint32_t max_rx_pkt_len;
285 dev_debug(enic, "queue %u, allocating %u rx queue mbufs\n", rq->index,
286 rq->ring.desc_count);
289 * If *not* using scatter and the mbuf size is greater than the
290 * requested max packet size (max_rx_pkt_len), then reduce the
291 * posted buffer size to max_rx_pkt_len. HW still receives packets
292 * larger than max_rx_pkt_len, but they will be truncated, which we
293 * drop in the rx handler. Not ideal, but better than returning
294 * large packets when the user is not expecting them.
296 max_rx_pkt_len = enic->rte_dev->data->dev_conf.rxmode.max_rx_pkt_len;
297 rq_buf_len = rte_pktmbuf_data_room_size(rq->mp) - RTE_PKTMBUF_HEADROOM;
298 if (max_rx_pkt_len < rq_buf_len && !rq->data_queue_enable)
299 rq_buf_len = max_rx_pkt_len;
300 for (i = 0; i < rq->ring.desc_count; i++, rqd++) {
301 mb = rte_mbuf_raw_alloc(rq->mp);
303 dev_err(enic, "RX mbuf alloc failed queue_id=%u\n",
304 (unsigned)rq->index);
308 mb->data_off = RTE_PKTMBUF_HEADROOM;
309 dma_addr = (dma_addr_t)(mb->buf_iova
310 + RTE_PKTMBUF_HEADROOM);
311 rq_enet_desc_enc(rqd, dma_addr,
312 (rq->is_sop ? RQ_ENET_TYPE_ONLY_SOP
313 : RQ_ENET_TYPE_NOT_SOP),
315 rq->mbuf_ring[i] = mb;
	/*
	 * Do not post the buffers to the NIC until we enable the RQ via
	 * enic_start_rq().
	 */
321 rq->need_initial_post = true;
322 /* Initialize fetch index while RQ is disabled */
323 iowrite32(0, &rq->ctrl->fetch_index);
328 * Post the Rx buffers for the first time. enic_alloc_rx_queue_mbufs() has
329 * allocated the buffers and filled the RQ descriptor ring. Just need to push
330 * the post index to the NIC.
333 enic_initial_post_rx(struct enic *enic, struct vnic_rq *rq)
335 if (!rq->in_use || !rq->need_initial_post)
338 /* make sure all prior writes are complete before doing the PIO write */
341 /* Post all but the last buffer to VIC. */
342 rq->posted_index = rq->ring.desc_count - 1;
346 dev_debug(enic, "port=%u, qidx=%u, Write %u posted idx, %u sw held\n",
347 enic->port_id, rq->index, rq->posted_index, rq->rx_nb_hold);
348 iowrite32(rq->posted_index, &rq->ctrl->posted_index);
350 rq->need_initial_post = false;
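/*
 * Note: fetch_index was zeroed while the RQ was still disabled (see
 * enic_alloc_rx_queue_mbufs() above), and posted_index is only written here
 * once the RQ has been enabled. Holding back one descriptor (desc_count - 1)
 * keeps the posted and fetch indexes from becoming equal on a completely
 * full ring, which is presumably how the VIC tells a full ring apart from an
 * empty one.
 */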
354 enic_alloc_consistent(void *priv, size_t size,
355 dma_addr_t *dma_handle, u8 *name)
358 const struct rte_memzone *rz;
360 struct enic *enic = (struct enic *)priv;
361 struct enic_memzone_entry *mze;
363 rz = rte_memzone_reserve_aligned((const char *)name, size,
364 SOCKET_ID_ANY, RTE_MEMZONE_IOVA_CONTIG, ENIC_ALIGN);
366 pr_err("%s : Failed to allocate memory requested for %s\n",
372 *dma_handle = (dma_addr_t)rz->iova;
374 mze = rte_malloc("enic memzone entry",
375 sizeof(struct enic_memzone_entry), 0);
378 pr_err("%s : Failed to allocate memory for memzone list\n",
380 rte_memzone_free(rz);
386 rte_spinlock_lock(&enic->memzone_list_lock);
387 LIST_INSERT_HEAD(&enic->memzone_list, mze, entries);
388 rte_spinlock_unlock(&enic->memzone_list_lock);
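	/*
	 * The list entry records the rte_memzone behind this allocation so
	 * that enic_free_consistent() below can map the (vaddr, dma_handle)
	 * pair handed back by the vNIC layer to the memzone and release it.
	 */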
394 enic_free_consistent(void *priv,
395 __rte_unused size_t size,
		     void *vaddr,
		     dma_addr_t dma_handle)
399 struct enic_memzone_entry *mze;
400 struct enic *enic = (struct enic *)priv;
402 rte_spinlock_lock(&enic->memzone_list_lock);
403 LIST_FOREACH(mze, &enic->memzone_list, entries) {
		if (mze->rz->addr == vaddr &&
		    mze->rz->iova == dma_handle)
			break;
	}

	if (mze == NULL) {
		rte_spinlock_unlock(&enic->memzone_list_lock);
		dev_warning(enic,
			"Tried to free memory, but couldn't find it in the memzone list\n");
		return;
	}
414 LIST_REMOVE(mze, entries);
415 rte_spinlock_unlock(&enic->memzone_list_lock);
416 rte_memzone_free(mze->rz);
420 int enic_link_update(struct enic *enic)
422 struct rte_eth_dev *eth_dev = enic->rte_dev;
423 struct rte_eth_link link;
425 memset(&link, 0, sizeof(link));
426 link.link_status = enic_get_link_status(enic);
427 link.link_duplex = ETH_LINK_FULL_DUPLEX;
428 link.link_speed = vnic_dev_port_speed(enic->vdev);
430 return rte_eth_linkstatus_set(eth_dev, &link);
434 enic_intr_handler(void *arg)
436 struct rte_eth_dev *dev = (struct rte_eth_dev *)arg;
437 struct enic *enic = pmd_priv(dev);
439 vnic_intr_return_all_credits(&enic->intr[ENICPMD_LSC_INTR_OFFSET]);
441 enic_link_update(enic);
442 _rte_eth_dev_callback_process(dev, RTE_ETH_EVENT_INTR_LSC, NULL);
443 enic_log_q_error(enic);
446 static int enic_rxq_intr_init(struct enic *enic)
448 struct rte_intr_handle *intr_handle;
449 uint32_t rxq_intr_count, i;
452 intr_handle = enic->rte_dev->intr_handle;
453 if (!enic->rte_dev->data->dev_conf.intr_conf.rxq)
456 * Rx queue interrupts only work when we have MSI-X interrupts,
457 * one per queue. Sharing one interrupt is technically
458 * possible with VIC, but it is not worth the complications it brings.
460 if (!rte_intr_cap_multiple(intr_handle)) {
461 dev_err(enic, "Rx queue interrupts require MSI-X interrupts"
462 " (vfio-pci driver)\n");
465 rxq_intr_count = enic->intr_count - ENICPMD_RXQ_INTR_OFFSET;
466 err = rte_intr_efd_enable(intr_handle, rxq_intr_count);
468 dev_err(enic, "Failed to enable event fds for Rx queue"
472 intr_handle->intr_vec = rte_zmalloc("enic_intr_vec",
473 rxq_intr_count * sizeof(int), 0);
474 if (intr_handle->intr_vec == NULL) {
475 dev_err(enic, "Failed to allocate intr_vec\n");
478 for (i = 0; i < rxq_intr_count; i++)
479 intr_handle->intr_vec[i] = i + ENICPMD_RXQ_INTR_OFFSET;
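	/*
	 * Rx queue i is tied to MSI-X vector i + ENICPMD_RXQ_INTR_OFFSET;
	 * the vector(s) below that offset stay reserved for the link-status
	 * and error interrupt handled by enic_intr_handler() above.
	 */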
483 static void enic_rxq_intr_deinit(struct enic *enic)
485 struct rte_intr_handle *intr_handle;
487 intr_handle = enic->rte_dev->intr_handle;
488 rte_intr_efd_disable(intr_handle);
489 if (intr_handle->intr_vec != NULL) {
490 rte_free(intr_handle->intr_vec);
491 intr_handle->intr_vec = NULL;
495 static void enic_prep_wq_for_simple_tx(struct enic *enic, uint16_t queue_idx)
497 struct wq_enet_desc *desc;
502 * Fill WQ descriptor fields that never change. Every descriptor is
503 * one packet, so set EOP. Also set CQ_ENTRY every ENIC_WQ_CQ_THRESH
504 * descriptors (i.e. request one completion update every 32 packets).
506 wq = &enic->wq[queue_idx];
507 desc = (struct wq_enet_desc *)wq->ring.descs;
508 for (i = 0; i < wq->ring.desc_count; i++, desc++) {
509 desc->header_length_flags = 1 << WQ_ENET_FLAGS_EOP_SHIFT;
510 if (i % ENIC_WQ_CQ_THRESH == ENIC_WQ_CQ_THRESH - 1)
511 desc->header_length_flags |=
512 (1 << WQ_ENET_FLAGS_CQ_ENTRY_SHIFT);
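		/*
		 * For example, with ENIC_WQ_CQ_THRESH == 32 this tags
		 * descriptors 31, 63, 95, ... so roughly one completion is
		 * generated for every 32 transmitted packets.
		 */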
/*
 * The 'strong' version is in enic_rxtx_vec_avx2.c. This weak version is
 * used when that file is not compiled.
 */
521 enic_use_vector_rx_handler(__rte_unused struct enic *enic)
526 static void pick_rx_handler(struct enic *enic)
528 struct rte_eth_dev *eth_dev;
	/*
	 * Preference order:
	 * 1. The vectorized handler if possible and requested.
	 * 2. The non-scatter, simplified handler if scatter Rx is not used.
	 * 3. The default handler as a fallback.
	 */
536 eth_dev = enic->rte_dev;
537 if (enic_use_vector_rx_handler(enic))
539 if (enic->rq_count > 0 && enic->rq[0].data_queue_enable == 0) {
540 ENICPMD_LOG(DEBUG, " use the non-scatter Rx handler");
541 eth_dev->rx_pkt_burst = &enic_noscatter_recv_pkts;
543 ENICPMD_LOG(DEBUG, " use the normal Rx handler");
544 eth_dev->rx_pkt_burst = &enic_recv_pkts;
548 int enic_enable(struct enic *enic)
552 struct rte_eth_dev *eth_dev = enic->rte_dev;
553 uint64_t simple_tx_offloads;
556 if (enic->enable_avx2_rx) {
557 struct rte_mbuf mb_def = { .buf_addr = 0 };
560 * mbuf_initializer contains const-after-init fields of
561 * receive mbufs (i.e. 64 bits of fields from rearm_data).
562 * It is currently used by the vectorized handler.
565 mb_def.data_off = RTE_PKTMBUF_HEADROOM;
566 mb_def.port = enic->port_id;
567 rte_mbuf_refcnt_set(&mb_def, 1);
568 rte_compiler_barrier();
569 p = (uintptr_t)&mb_def.rearm_data;
570 enic->mbuf_initializer = *(uint64_t *)p;
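		/*
		 * rearm_data covers the 64 bits of struct rte_mbuf holding
		 * data_off, refcnt, nb_segs and port, so the vector Rx path
		 * can re-arm a freshly received mbuf with a single 8-byte
		 * store of mbuf_initializer instead of writing each field.
		 */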
573 eth_dev->data->dev_link.link_speed = vnic_dev_port_speed(enic->vdev);
574 eth_dev->data->dev_link.link_duplex = ETH_LINK_FULL_DUPLEX;
576 /* vnic notification of link status has already been turned on in
577 * enic_dev_init() which is called during probe time. Here we are
578 * just turning on interrupt vector 0 if needed.
580 if (eth_dev->data->dev_conf.intr_conf.lsc)
581 vnic_dev_notify_set(enic->vdev, 0);
583 err = enic_rxq_intr_init(enic);
586 if (enic_clsf_init(enic))
587 dev_warning(enic, "Init of hash table for clsf failed."\
588 "Flow director feature will not work\n");
590 for (index = 0; index < enic->rq_count; index++) {
591 err = enic_alloc_rx_queue_mbufs(enic,
592 &enic->rq[enic_rte_rq_idx_to_sop_idx(index)]);
594 dev_err(enic, "Failed to alloc sop RX queue mbufs\n");
597 err = enic_alloc_rx_queue_mbufs(enic,
598 &enic->rq[enic_rte_rq_idx_to_data_idx(index)]);
				/* release the allocated mbufs for the sop rq */
601 enic_rxmbuf_queue_release(enic,
602 &enic->rq[enic_rte_rq_idx_to_sop_idx(index)]);
604 dev_err(enic, "Failed to alloc data RX queue mbufs\n");
610 * Use the simple TX handler if possible. Only checksum offloads
611 * and vlan insertion are supported.
613 simple_tx_offloads = enic->tx_offload_capa &
614 (DEV_TX_OFFLOAD_OUTER_IPV4_CKSUM |
615 DEV_TX_OFFLOAD_VLAN_INSERT |
616 DEV_TX_OFFLOAD_IPV4_CKSUM |
617 DEV_TX_OFFLOAD_UDP_CKSUM |
618 DEV_TX_OFFLOAD_TCP_CKSUM);
619 if ((eth_dev->data->dev_conf.txmode.offloads &
620 ~simple_tx_offloads) == 0) {
621 ENICPMD_LOG(DEBUG, " use the simple tx handler");
622 eth_dev->tx_pkt_burst = &enic_simple_xmit_pkts;
623 for (index = 0; index < enic->wq_count; index++)
624 enic_prep_wq_for_simple_tx(enic, index);
626 ENICPMD_LOG(DEBUG, " use the default tx handler");
627 eth_dev->tx_pkt_burst = &enic_xmit_pkts;
630 pick_rx_handler(enic);
632 for (index = 0; index < enic->wq_count; index++)
633 enic_start_wq(enic, index);
634 for (index = 0; index < enic->rq_count; index++)
635 enic_start_rq(enic, index);
637 vnic_dev_add_addr(enic->vdev, enic->mac_addr);
639 vnic_dev_enable_wait(enic->vdev);
641 /* Register and enable error interrupt */
642 rte_intr_callback_register(&(enic->pdev->intr_handle),
643 enic_intr_handler, (void *)enic->rte_dev);
645 rte_intr_enable(&(enic->pdev->intr_handle));
646 /* Unmask LSC interrupt */
647 vnic_intr_unmask(&enic->intr[ENICPMD_LSC_INTR_OFFSET]);
652 int enic_alloc_intr_resources(struct enic *enic)
657 dev_info(enic, "vNIC resources used: "\
658 "wq %d rq %d cq %d intr %d\n",
659 enic->wq_count, enic_vnic_rq_count(enic),
660 enic->cq_count, enic->intr_count);
662 for (i = 0; i < enic->intr_count; i++) {
663 err = vnic_intr_alloc(enic->vdev, &enic->intr[i], i);
665 enic_free_vnic_resources(enic);
672 void enic_free_rq(void *rxq)
674 struct vnic_rq *rq_sop, *rq_data;
680 rq_sop = (struct vnic_rq *)rxq;
681 enic = vnic_dev_priv(rq_sop->vdev);
682 rq_data = &enic->rq[rq_sop->data_queue_idx];
684 if (rq_sop->free_mbufs) {
685 struct rte_mbuf **mb;
688 mb = rq_sop->free_mbufs;
689 for (i = ENIC_RX_BURST_MAX - rq_sop->num_free_mbufs;
690 i < ENIC_RX_BURST_MAX; i++)
691 rte_pktmbuf_free(mb[i]);
692 rte_free(rq_sop->free_mbufs);
693 rq_sop->free_mbufs = NULL;
694 rq_sop->num_free_mbufs = 0;
697 enic_rxmbuf_queue_release(enic, rq_sop);
699 enic_rxmbuf_queue_release(enic, rq_data);
701 rte_free(rq_sop->mbuf_ring);
703 rte_free(rq_data->mbuf_ring);
705 rq_sop->mbuf_ring = NULL;
706 rq_data->mbuf_ring = NULL;
708 vnic_rq_free(rq_sop);
710 vnic_rq_free(rq_data);
712 vnic_cq_free(&enic->cq[enic_sop_rq_idx_to_cq_idx(rq_sop->index)]);
718 void enic_start_wq(struct enic *enic, uint16_t queue_idx)
720 struct rte_eth_dev *eth_dev = enic->rte_dev;
721 vnic_wq_enable(&enic->wq[queue_idx]);
722 eth_dev->data->tx_queue_state[queue_idx] = RTE_ETH_QUEUE_STATE_STARTED;
725 int enic_stop_wq(struct enic *enic, uint16_t queue_idx)
727 struct rte_eth_dev *eth_dev = enic->rte_dev;
730 ret = vnic_wq_disable(&enic->wq[queue_idx]);
734 eth_dev->data->tx_queue_state[queue_idx] = RTE_ETH_QUEUE_STATE_STOPPED;
738 void enic_start_rq(struct enic *enic, uint16_t queue_idx)
740 struct vnic_rq *rq_sop;
741 struct vnic_rq *rq_data;
742 rq_sop = &enic->rq[enic_rte_rq_idx_to_sop_idx(queue_idx)];
743 rq_data = &enic->rq[rq_sop->data_queue_idx];
744 struct rte_eth_dev *eth_dev = enic->rte_dev;
746 if (rq_data->in_use) {
747 vnic_rq_enable(rq_data);
748 enic_initial_post_rx(enic, rq_data);
751 vnic_rq_enable(rq_sop);
752 enic_initial_post_rx(enic, rq_sop);
753 eth_dev->data->rx_queue_state[queue_idx] = RTE_ETH_QUEUE_STATE_STARTED;
756 int enic_stop_rq(struct enic *enic, uint16_t queue_idx)
758 int ret1 = 0, ret2 = 0;
759 struct rte_eth_dev *eth_dev = enic->rte_dev;
760 struct vnic_rq *rq_sop;
761 struct vnic_rq *rq_data;
762 rq_sop = &enic->rq[enic_rte_rq_idx_to_sop_idx(queue_idx)];
763 rq_data = &enic->rq[rq_sop->data_queue_idx];
765 ret2 = vnic_rq_disable(rq_sop);
768 ret1 = vnic_rq_disable(rq_data);
775 eth_dev->data->rx_queue_state[queue_idx] = RTE_ETH_QUEUE_STATE_STOPPED;
779 int enic_alloc_rq(struct enic *enic, uint16_t queue_idx,
780 unsigned int socket_id, struct rte_mempool *mp,
781 uint16_t nb_desc, uint16_t free_thresh)
784 uint16_t sop_queue_idx = enic_rte_rq_idx_to_sop_idx(queue_idx);
785 uint16_t data_queue_idx = enic_rte_rq_idx_to_data_idx(queue_idx);
786 struct vnic_rq *rq_sop = &enic->rq[sop_queue_idx];
787 struct vnic_rq *rq_data = &enic->rq[data_queue_idx];
788 unsigned int mbuf_size, mbufs_per_pkt;
789 unsigned int nb_sop_desc, nb_data_desc;
790 uint16_t min_sop, max_sop, min_data, max_data;
791 uint32_t max_rx_pkt_len;
794 rq_sop->data_queue_idx = data_queue_idx;
796 rq_data->data_queue_idx = 0;
797 rq_sop->socket_id = socket_id;
799 rq_data->socket_id = socket_id;
802 rq_sop->rx_free_thresh = free_thresh;
803 rq_data->rx_free_thresh = free_thresh;
804 dev_debug(enic, "Set queue_id:%u free thresh:%u\n", queue_idx,
807 mbuf_size = (uint16_t)(rte_pktmbuf_data_room_size(mp) -
808 RTE_PKTMBUF_HEADROOM);
809 /* max_rx_pkt_len includes the ethernet header and CRC. */
810 max_rx_pkt_len = enic->rte_dev->data->dev_conf.rxmode.max_rx_pkt_len;
812 if (enic->rte_dev->data->dev_conf.rxmode.offloads &
813 DEV_RX_OFFLOAD_SCATTER) {
814 dev_info(enic, "Rq %u Scatter rx mode enabled\n", queue_idx);
815 /* ceil((max pkt len)/mbuf_size) */
816 mbufs_per_pkt = (max_rx_pkt_len + mbuf_size - 1) / mbuf_size;
818 dev_info(enic, "Scatter rx mode disabled\n");
820 if (max_rx_pkt_len > mbuf_size) {
821 dev_warning(enic, "The maximum Rx packet size (%u) is"
822 " larger than the mbuf size (%u), and"
823 " scatter is disabled. Larger packets will"
825 max_rx_pkt_len, mbuf_size);
829 if (mbufs_per_pkt > 1) {
830 dev_info(enic, "Rq %u Scatter rx mode in use\n", queue_idx);
831 rq_sop->data_queue_enable = 1;
834 * HW does not directly support rxmode.max_rx_pkt_len. HW always
835 * receives packet sizes up to the "max" MTU.
836 * If not using scatter, we can achieve the effect of dropping
837 * larger packets by reducing the size of posted buffers.
838 * See enic_alloc_rx_queue_mbufs().
		if (max_rx_pkt_len <
		    enic_mtu_to_max_rx_pktlen(enic->max_mtu)) {
842 dev_warning(enic, "rxmode.max_rx_pkt_len is ignored"
843 " when scatter rx mode is in use.\n");
846 dev_info(enic, "Rq %u Scatter rx mode not being used\n",
848 rq_sop->data_queue_enable = 0;
	/* number of descriptors has to be a multiple of 32 */
853 nb_sop_desc = (nb_desc / mbufs_per_pkt) & ENIC_ALIGN_DESCS_MASK;
854 nb_data_desc = (nb_desc - nb_sop_desc) & ENIC_ALIGN_DESCS_MASK;
856 rq_sop->max_mbufs_per_pkt = mbufs_per_pkt;
857 rq_data->max_mbufs_per_pkt = mbufs_per_pkt;
859 if (mbufs_per_pkt > 1) {
860 min_sop = ENIC_RX_BURST_MAX;
861 max_sop = ((enic->config.rq_desc_count /
862 (mbufs_per_pkt - 1)) & ENIC_ALIGN_DESCS_MASK);
863 min_data = min_sop * (mbufs_per_pkt - 1);
864 max_data = enic->config.rq_desc_count;
866 min_sop = ENIC_RX_BURST_MAX;
867 max_sop = enic->config.rq_desc_count;
872 if (nb_desc < (min_sop + min_data)) {
874 "Number of rx descs too low, adjusting to minimum\n");
875 nb_sop_desc = min_sop;
876 nb_data_desc = min_data;
877 } else if (nb_desc > (max_sop + max_data)) {
879 "Number of rx_descs too high, adjusting to maximum\n");
880 nb_sop_desc = max_sop;
881 nb_data_desc = max_data;
883 if (mbufs_per_pkt > 1) {
884 dev_info(enic, "For max packet size %u and mbuf size %u valid"
885 " rx descriptor range is %u to %u\n",
			 max_rx_pkt_len, mbuf_size, min_sop + min_data,
			 max_sop + max_data);
889 dev_info(enic, "Using %d rx descriptors (sop %d, data %d)\n",
890 nb_sop_desc + nb_data_desc, nb_sop_desc, nb_data_desc);
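	/*
	 * Worked example (scatter case): with mbuf_size = 2048 (data room
	 * minus headroom) and max_rx_pkt_len = 8000, mbufs_per_pkt =
	 * ceil(8000 / 2048) = 4. A request for nb_desc = 512 then starts from
	 * nb_sop_desc = 512 / 4 = 128 and nb_data_desc = 512 - 128 = 384
	 * (both already multiples of 32), subject to the min/max clamping
	 * above.
	 */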
892 /* Allocate sop queue resources */
893 rc = vnic_rq_alloc(enic->vdev, rq_sop, sop_queue_idx,
894 nb_sop_desc, sizeof(struct rq_enet_desc));
896 dev_err(enic, "error in allocation of sop rq\n");
899 nb_sop_desc = rq_sop->ring.desc_count;
901 if (rq_data->in_use) {
902 /* Allocate data queue resources */
903 rc = vnic_rq_alloc(enic->vdev, rq_data, data_queue_idx,
				   nb_data_desc,
				   sizeof(struct rq_enet_desc));
907 dev_err(enic, "error in allocation of data rq\n");
908 goto err_free_rq_sop;
910 nb_data_desc = rq_data->ring.desc_count;
912 rc = vnic_cq_alloc(enic->vdev, &enic->cq[queue_idx], queue_idx,
913 socket_id, nb_sop_desc + nb_data_desc,
914 sizeof(struct cq_enet_rq_desc));
916 dev_err(enic, "error in allocation of cq for rq\n");
917 goto err_free_rq_data;
920 /* Allocate the mbuf rings */
921 rq_sop->mbuf_ring = (struct rte_mbuf **)
922 rte_zmalloc_socket("rq->mbuf_ring",
923 sizeof(struct rte_mbuf *) * nb_sop_desc,
924 RTE_CACHE_LINE_SIZE, rq_sop->socket_id);
925 if (rq_sop->mbuf_ring == NULL)
928 if (rq_data->in_use) {
929 rq_data->mbuf_ring = (struct rte_mbuf **)
930 rte_zmalloc_socket("rq->mbuf_ring",
931 sizeof(struct rte_mbuf *) * nb_data_desc,
932 RTE_CACHE_LINE_SIZE, rq_sop->socket_id);
933 if (rq_data->mbuf_ring == NULL)
934 goto err_free_sop_mbuf;
937 rq_sop->free_mbufs = (struct rte_mbuf **)
938 rte_zmalloc_socket("rq->free_mbufs",
				       sizeof(struct rte_mbuf *) *
				       ENIC_RX_BURST_MAX,
941 RTE_CACHE_LINE_SIZE, rq_sop->socket_id);
942 if (rq_sop->free_mbufs == NULL)
943 goto err_free_data_mbuf;
944 rq_sop->num_free_mbufs = 0;
	rq_sop->tot_nb_desc = nb_desc; /* squirrel away for MTU update function */
951 rte_free(rq_data->mbuf_ring);
953 rte_free(rq_sop->mbuf_ring);
955 /* cleanup on error */
956 vnic_cq_free(&enic->cq[queue_idx]);
959 vnic_rq_free(rq_data);
961 vnic_rq_free(rq_sop);
966 void enic_free_wq(void *txq)
974 wq = (struct vnic_wq *)txq;
975 enic = vnic_dev_priv(wq->vdev);
976 rte_memzone_free(wq->cqmsg_rz);
978 vnic_cq_free(&enic->cq[enic->rq_count + wq->index]);
981 int enic_alloc_wq(struct enic *enic, uint16_t queue_idx,
982 unsigned int socket_id, uint16_t nb_desc)
985 struct vnic_wq *wq = &enic->wq[queue_idx];
986 unsigned int cq_index = enic_cq_wq(enic, queue_idx);
990 wq->socket_id = socket_id;
992 * rte_eth_tx_queue_setup() checks min, max, and alignment. So just
993 * print an info message for diagnostics.
995 dev_info(enic, "TX Queues - effective number of descs:%d\n", nb_desc);
997 /* Allocate queue resources */
998 err = vnic_wq_alloc(enic->vdev, &enic->wq[queue_idx], queue_idx,
1000 sizeof(struct wq_enet_desc));
1002 dev_err(enic, "error in allocation of wq\n");
1006 err = vnic_cq_alloc(enic->vdev, &enic->cq[cq_index], cq_index,
1008 sizeof(struct cq_enet_wq_desc));
1011 dev_err(enic, "error in allocation of cq for wq\n");
	/* set up CQ message */
1015 snprintf((char *)name, sizeof(name),
1016 "vnic_cqmsg-%s-%d-%d", enic->bdf_name, queue_idx,
1019 wq->cqmsg_rz = rte_memzone_reserve_aligned((const char *)name,
1020 sizeof(uint32_t), SOCKET_ID_ANY,
1021 RTE_MEMZONE_IOVA_CONTIG, ENIC_ALIGN);
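	/*
	 * cqmsg_rz is a small DMA-able area used as the completion "message"
	 * target: the WQ's completion queue is initialized with
	 * cq_message_enable = 1 and cq_message_addr = cqmsg_rz->iova in
	 * enic_init_vnic_resources(), so the VIC reports Tx completions by
	 * writing to this address rather than by posting CQ entries.
	 */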
1028 int enic_disable(struct enic *enic)
1033 for (i = 0; i < enic->intr_count; i++) {
1034 vnic_intr_mask(&enic->intr[i]);
1035 (void)vnic_intr_masked(&enic->intr[i]); /* flush write */
1037 enic_rxq_intr_deinit(enic);
1038 rte_intr_disable(&enic->pdev->intr_handle);
1039 rte_intr_callback_unregister(&enic->pdev->intr_handle,
1041 (void *)enic->rte_dev);
1043 vnic_dev_disable(enic->vdev);
1045 enic_clsf_destroy(enic);
1047 if (!enic_is_sriov_vf(enic))
1048 vnic_dev_del_addr(enic->vdev, enic->mac_addr);
1050 for (i = 0; i < enic->wq_count; i++) {
1051 err = vnic_wq_disable(&enic->wq[i]);
1055 for (i = 0; i < enic_vnic_rq_count(enic); i++) {
1056 if (enic->rq[i].in_use) {
1057 err = vnic_rq_disable(&enic->rq[i]);
1063 /* If we were using interrupts, set the interrupt vector to -1
	 * to disable interrupts. We are not disabling link notifications,
1065 * though, as we want the polling of link status to continue working.
1067 if (enic->rte_dev->data->dev_conf.intr_conf.lsc)
1068 vnic_dev_notify_set(enic->vdev, -1);
1070 vnic_dev_set_reset_flag(enic->vdev, 1);
1072 for (i = 0; i < enic->wq_count; i++)
1073 vnic_wq_clean(&enic->wq[i], enic_free_wq_buf);
1075 for (i = 0; i < enic_vnic_rq_count(enic); i++)
1076 if (enic->rq[i].in_use)
1077 vnic_rq_clean(&enic->rq[i], enic_free_rq_buf);
1078 for (i = 0; i < enic->cq_count; i++)
1079 vnic_cq_clean(&enic->cq[i]);
1080 for (i = 0; i < enic->intr_count; i++)
1081 vnic_intr_clean(&enic->intr[i]);
1086 static int enic_dev_wait(struct vnic_dev *vdev,
1087 int (*start)(struct vnic_dev *, int),
1088 int (*finished)(struct vnic_dev *, int *),
1095 err = start(vdev, arg);
1099 /* Wait for func to complete...2 seconds max */
1100 for (i = 0; i < 2000; i++) {
1101 err = finished(vdev, &done);
1111 static int enic_dev_open(struct enic *enic)
1114 int flags = CMD_OPENF_IG_DESCCACHE;
1116 err = enic_dev_wait(enic->vdev, vnic_dev_open,
1117 vnic_dev_open_done, flags);
1119 dev_err(enic_get_dev(enic),
1120 "vNIC device open failed, err %d\n", err);
1125 static int enic_set_rsskey(struct enic *enic, uint8_t *user_key)
1127 dma_addr_t rss_key_buf_pa;
1128 union vnic_rss_key *rss_key_buf_va = NULL;
1132 RTE_ASSERT(user_key != NULL);
1133 snprintf((char *)name, NAME_MAX, "rss_key-%s", enic->bdf_name);
1134 rss_key_buf_va = enic_alloc_consistent(enic, sizeof(union vnic_rss_key),
1135 &rss_key_buf_pa, name);
1136 if (!rss_key_buf_va)
1139 for (i = 0; i < ENIC_RSS_HASH_KEY_SIZE; i++)
1140 rss_key_buf_va->key[i / 10].b[i % 10] = user_key[i];
1142 err = enic_set_rss_key(enic,
			       rss_key_buf_pa,
			       sizeof(union vnic_rss_key));
1146 /* Save for later queries */
1148 rte_memcpy(&enic->rss_key, rss_key_buf_va,
1149 sizeof(union vnic_rss_key));
1151 enic_free_consistent(enic, sizeof(union vnic_rss_key),
1152 rss_key_buf_va, rss_key_buf_pa);
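/*
 * Layout note: the loop above scatters the ENIC_RSS_HASH_KEY_SIZE-byte key
 * into union vnic_rss_key as 10-byte sub-keys, i.e. byte i of the user key
 * lands in key[i / 10].b[i % 10] (byte 23, for example, goes to key[2].b[3]).
 */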
1157 int enic_set_rss_reta(struct enic *enic, union vnic_rss_cpu *rss_cpu)
1159 dma_addr_t rss_cpu_buf_pa;
1160 union vnic_rss_cpu *rss_cpu_buf_va = NULL;
1164 snprintf((char *)name, NAME_MAX, "rss_cpu-%s", enic->bdf_name);
1165 rss_cpu_buf_va = enic_alloc_consistent(enic, sizeof(union vnic_rss_cpu),
1166 &rss_cpu_buf_pa, name);
1167 if (!rss_cpu_buf_va)
1170 rte_memcpy(rss_cpu_buf_va, rss_cpu, sizeof(union vnic_rss_cpu));
1172 err = enic_set_rss_cpu(enic,
			       rss_cpu_buf_pa,
			       sizeof(union vnic_rss_cpu));
1176 enic_free_consistent(enic, sizeof(union vnic_rss_cpu),
1177 rss_cpu_buf_va, rss_cpu_buf_pa);
1179 /* Save for later queries */
1181 rte_memcpy(&enic->rss_cpu, rss_cpu, sizeof(union vnic_rss_cpu));
1185 static int enic_set_niccfg(struct enic *enic, u8 rss_default_cpu,
1186 u8 rss_hash_type, u8 rss_hash_bits, u8 rss_base_cpu, u8 rss_enable)
1188 const u8 tso_ipid_split_en = 0;
1191 err = enic_set_nic_cfg(enic,
1192 rss_default_cpu, rss_hash_type,
1193 rss_hash_bits, rss_base_cpu,
1194 rss_enable, tso_ipid_split_en,
1195 enic->ig_vlan_strip_en);
1200 /* Initialize RSS with defaults, called from dev_configure */
1201 int enic_init_rss_nic_cfg(struct enic *enic)
1203 static uint8_t default_rss_key[] = {
1204 85, 67, 83, 97, 119, 101, 115, 111, 109, 101,
1205 80, 65, 76, 79, 117, 110, 105, 113, 117, 101,
1206 76, 73, 78, 85, 88, 114, 111, 99, 107, 115,
1207 69, 78, 73, 67, 105, 115, 99, 111, 111, 108,
1209 struct rte_eth_rss_conf rss_conf;
1210 union vnic_rss_cpu rss_cpu;
1213 rss_conf = enic->rte_dev->data->dev_conf.rx_adv_conf.rss_conf;
1215 * If setting key for the first time, and the user gives us none, then
1216 * push the default key to NIC.
1218 if (rss_conf.rss_key == NULL) {
1219 rss_conf.rss_key = default_rss_key;
1220 rss_conf.rss_key_len = ENIC_RSS_HASH_KEY_SIZE;
1222 ret = enic_set_rss_conf(enic, &rss_conf);
1224 dev_err(enic, "Failed to configure RSS\n");
1227 if (enic->rss_enable) {
1228 /* If enabling RSS, use the default reta */
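		/*
		 * The table is packed four entries per word
		 * (cpu[i / 4].b[i % 4]), and entry i selects Rx queue
		 * i % rq_count translated to its SOP RQ index, so with
		 * rq_count == 2 the entries simply alternate between
		 * queue 0 and queue 1.
		 */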
1229 for (i = 0; i < ENIC_RSS_RETA_SIZE; i++) {
1230 rss_cpu.cpu[i / 4].b[i % 4] =
1231 enic_rte_rq_idx_to_sop_idx(i % enic->rq_count);
1233 ret = enic_set_rss_reta(enic, &rss_cpu);
1235 dev_err(enic, "Failed to set RSS indirection table\n");
1240 int enic_setup_finish(struct enic *enic)
1242 enic_init_soft_stats(enic);
1245 vnic_dev_packet_filter(enic->vdev,
1258 static int enic_rss_conf_valid(struct enic *enic,
1259 struct rte_eth_rss_conf *rss_conf)
1261 /* RSS is disabled per VIC settings. Ignore rss_conf. */
1262 if (enic->flow_type_rss_offloads == 0)
1264 if (rss_conf->rss_key != NULL &&
1265 rss_conf->rss_key_len != ENIC_RSS_HASH_KEY_SIZE) {
1266 dev_err(enic, "Given rss_key is %d bytes, it must be %d\n",
1267 rss_conf->rss_key_len, ENIC_RSS_HASH_KEY_SIZE);
1270 if (rss_conf->rss_hf != 0 &&
1271 (rss_conf->rss_hf & enic->flow_type_rss_offloads) == 0) {
1272 dev_err(enic, "Given rss_hf contains none of the supported"
1279 /* Set hash type and key according to rss_conf */
1280 int enic_set_rss_conf(struct enic *enic, struct rte_eth_rss_conf *rss_conf)
1282 struct rte_eth_dev *eth_dev;
1288 RTE_ASSERT(rss_conf != NULL);
1289 ret = enic_rss_conf_valid(enic, rss_conf);
1291 dev_err(enic, "RSS configuration (rss_conf) is invalid\n");
1295 eth_dev = enic->rte_dev;
1297 rss_hf = rss_conf->rss_hf & enic->flow_type_rss_offloads;
1298 if (enic->rq_count > 1 &&
1299 (eth_dev->data->dev_conf.rxmode.mq_mode & ETH_MQ_RX_RSS_FLAG) &&
1302 if (rss_hf & (ETH_RSS_IPV4 | ETH_RSS_FRAG_IPV4 |
1303 ETH_RSS_NONFRAG_IPV4_OTHER))
1304 rss_hash_type |= NIC_CFG_RSS_HASH_TYPE_IPV4;
1305 if (rss_hf & ETH_RSS_NONFRAG_IPV4_TCP)
1306 rss_hash_type |= NIC_CFG_RSS_HASH_TYPE_TCP_IPV4;
1307 if (rss_hf & ETH_RSS_NONFRAG_IPV4_UDP) {
1308 rss_hash_type |= NIC_CFG_RSS_HASH_TYPE_UDP_IPV4;
1309 if (enic->udp_rss_weak) {
1311 * 'TCP' is not a typo. The "weak" version of
1312 * UDP RSS requires both the TCP and UDP bits
1313 * be set. It does enable TCP RSS as well.
1315 rss_hash_type |= NIC_CFG_RSS_HASH_TYPE_TCP_IPV4;
1318 if (rss_hf & (ETH_RSS_IPV6 | ETH_RSS_IPV6_EX |
1319 ETH_RSS_FRAG_IPV6 | ETH_RSS_NONFRAG_IPV6_OTHER))
1320 rss_hash_type |= NIC_CFG_RSS_HASH_TYPE_IPV6;
1321 if (rss_hf & (ETH_RSS_NONFRAG_IPV6_TCP | ETH_RSS_IPV6_TCP_EX))
1322 rss_hash_type |= NIC_CFG_RSS_HASH_TYPE_TCP_IPV6;
1323 if (rss_hf & (ETH_RSS_NONFRAG_IPV6_UDP | ETH_RSS_IPV6_UDP_EX)) {
1324 rss_hash_type |= NIC_CFG_RSS_HASH_TYPE_UDP_IPV6;
1325 if (enic->udp_rss_weak)
1326 rss_hash_type |= NIC_CFG_RSS_HASH_TYPE_TCP_IPV6;
1333 /* Set the hash key if provided */
1334 if (rss_enable && rss_conf->rss_key) {
1335 ret = enic_set_rsskey(enic, rss_conf->rss_key);
1337 dev_err(enic, "Failed to set RSS key\n");
1342 ret = enic_set_niccfg(enic, ENIC_RSS_DEFAULT_CPU, rss_hash_type,
			      ENIC_RSS_HASH_BITS, ENIC_RSS_BASE_CPU,
			      rss_enable);
1346 enic->rss_hf = rss_hf;
1347 enic->rss_hash_type = rss_hash_type;
1348 enic->rss_enable = rss_enable;
1350 dev_err(enic, "Failed to update RSS configurations."
1351 " hash=0x%x\n", rss_hash_type);
1356 int enic_set_vlan_strip(struct enic *enic)
1359 * Unfortunately, VLAN strip on/off and RSS on/off are configured
1360 * together. So, re-do niccfg, preserving the current RSS settings.
1362 return enic_set_niccfg(enic, ENIC_RSS_DEFAULT_CPU, enic->rss_hash_type,
			       ENIC_RSS_HASH_BITS, ENIC_RSS_BASE_CPU,
			       enic->rss_enable);
1367 void enic_add_packet_filter(struct enic *enic)
1369 /* Args -> directed, multicast, broadcast, promisc, allmulti */
1370 vnic_dev_packet_filter(enic->vdev, 1, 1, 1,
1371 enic->promisc, enic->allmulti);
1374 int enic_get_link_status(struct enic *enic)
1376 return vnic_dev_link_status(enic->vdev);
1379 static void enic_dev_deinit(struct enic *enic)
1381 /* stop link status checking */
1382 vnic_dev_notify_unset(enic->vdev);
1384 /* mac_addrs is freed by rte_eth_dev_release_port() */
1386 rte_free(enic->intr);
1392 int enic_set_vnic_res(struct enic *enic)
1394 struct rte_eth_dev *eth_dev = enic->rte_dev;
1396 unsigned int required_rq, required_wq, required_cq, required_intr;
1398 /* Always use two vNIC RQs per eth_dev RQ, regardless of Rx scatter. */
1399 required_rq = eth_dev->data->nb_rx_queues * 2;
1400 required_wq = eth_dev->data->nb_tx_queues;
1401 required_cq = eth_dev->data->nb_rx_queues + eth_dev->data->nb_tx_queues;
1402 required_intr = 1; /* 1 for LSC even if intr_conf.lsc is 0 */
1403 if (eth_dev->data->dev_conf.intr_conf.rxq) {
1404 required_intr += eth_dev->data->nb_rx_queues;
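	/*
	 * Example: with 2 Rx queues, 2 Tx queues and intr_conf.rxq set, this
	 * works out to required_rq = 4, required_wq = 2, required_cq = 4 and
	 * required_intr = 1 + 2 = 3 (vector 0 for LSC/errors plus one per Rx
	 * queue).
	 */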
1407 if (enic->conf_rq_count < required_rq) {
1408 dev_err(dev, "Not enough Receive queues. Requested:%u which uses %d RQs on VIC, Configured:%u\n",
1409 eth_dev->data->nb_rx_queues,
1410 required_rq, enic->conf_rq_count);
1413 if (enic->conf_wq_count < required_wq) {
1414 dev_err(dev, "Not enough Transmit queues. Requested:%u, Configured:%u\n",
1415 eth_dev->data->nb_tx_queues, enic->conf_wq_count);
1419 if (enic->conf_cq_count < required_cq) {
1420 dev_err(dev, "Not enough Completion queues. Required:%u, Configured:%u\n",
1421 required_cq, enic->conf_cq_count);
1424 if (enic->conf_intr_count < required_intr) {
1425 dev_err(dev, "Not enough Interrupts to support Rx queue"
1426 " interrupts. Required:%u, Configured:%u\n",
1427 required_intr, enic->conf_intr_count);
1432 enic->rq_count = eth_dev->data->nb_rx_queues;
1433 enic->wq_count = eth_dev->data->nb_tx_queues;
1434 enic->cq_count = enic->rq_count + enic->wq_count;
1435 enic->intr_count = required_intr;
1441 /* Initialize the completion queue for an RQ */
1443 enic_reinit_rq(struct enic *enic, unsigned int rq_idx)
1445 struct vnic_rq *sop_rq, *data_rq;
1446 unsigned int cq_idx;
1449 sop_rq = &enic->rq[enic_rte_rq_idx_to_sop_idx(rq_idx)];
1450 data_rq = &enic->rq[enic_rte_rq_idx_to_data_idx(rq_idx)];
1453 vnic_cq_clean(&enic->cq[cq_idx]);
1454 vnic_cq_init(&enic->cq[cq_idx],
1455 0 /* flow_control_enable */,
1456 1 /* color_enable */,
1459 1 /* cq_tail_color */,
1460 0 /* interrupt_enable */,
1461 1 /* cq_entry_enable */,
1462 0 /* cq_message_enable */,
1463 0 /* interrupt offset */,
1464 0 /* cq_message_addr */);
1467 vnic_rq_init_start(sop_rq, enic_cq_rq(enic,
1468 enic_rte_rq_idx_to_sop_idx(rq_idx)), 0,
1469 sop_rq->ring.desc_count - 1, 1, 0);
1470 if (data_rq->in_use) {
1471 vnic_rq_init_start(data_rq,
				   enic_cq_rq(enic,
				   enic_rte_rq_idx_to_data_idx(rq_idx)), 0,
1474 data_rq->ring.desc_count - 1, 1, 0);
1477 rc = enic_alloc_rx_queue_mbufs(enic, sop_rq);
1481 if (data_rq->in_use) {
1482 rc = enic_alloc_rx_queue_mbufs(enic, data_rq);
1484 enic_rxmbuf_queue_release(enic, sop_rq);
1492 /* The Cisco NIC can send and receive packets up to a max packet size
1493 * determined by the NIC type and firmware. There is also an MTU
1494 * configured into the NIC via the CIMC/UCSM management interface
1495 * which can be overridden by this function (up to the max packet size).
1496 * Depending on the network setup, doing so may cause packet drops
1497 * and unexpected behavior.
1499 int enic_set_mtu(struct enic *enic, uint16_t new_mtu)
1501 unsigned int rq_idx;
1504 uint16_t old_mtu; /* previous setting */
1505 uint16_t config_mtu; /* Value configured into NIC via CIMC/UCSM */
1506 struct rte_eth_dev *eth_dev = enic->rte_dev;
1508 old_mtu = eth_dev->data->mtu;
1509 config_mtu = enic->config.mtu;
1511 if (rte_eal_process_type() != RTE_PROC_PRIMARY)
1512 return -E_RTE_SECONDARY;
1514 if (new_mtu > enic->max_mtu) {
1516 "MTU not updated: requested (%u) greater than max (%u)\n",
1517 new_mtu, enic->max_mtu);
1520 if (new_mtu < ENIC_MIN_MTU) {
1522 "MTU not updated: requested (%u) less than min (%u)\n",
1523 new_mtu, ENIC_MIN_MTU);
1526 if (new_mtu > config_mtu)
1528 "MTU (%u) is greater than value configured in NIC (%u)\n",
1529 new_mtu, config_mtu);
1531 /* Update the MTU and maximum packet length */
1532 eth_dev->data->mtu = new_mtu;
1533 eth_dev->data->dev_conf.rxmode.max_rx_pkt_len =
1534 enic_mtu_to_max_rx_pktlen(new_mtu);
1537 * If the device has not started (enic_enable), nothing to do.
	 * Later, enic_enable() will set up RQs reflecting the new maximum
	 * packet length.
	 */
1541 if (!eth_dev->data->dev_started)
1545 * The device has started, re-do RQs on the fly. In the process, we
1546 * pick up the new maximum packet length.
1548 * Some applications rely on the ability to change MTU without stopping
1549 * the device. So keep this behavior for now.
1551 rte_spinlock_lock(&enic->mtu_lock);
1553 /* Stop traffic on all RQs */
1554 for (rq_idx = 0; rq_idx < enic->rq_count * 2; rq_idx++) {
1555 rq = &enic->rq[rq_idx];
1556 if (rq->is_sop && rq->in_use) {
1557 rc = enic_stop_rq(enic,
1558 enic_sop_rq_idx_to_rte_idx(rq_idx));
1560 dev_err(enic, "Failed to stop Rq %u\n", rq_idx);
1566 /* replace Rx function with a no-op to avoid getting stale pkts */
1567 eth_dev->rx_pkt_burst = enic_dummy_recv_pkts;
1570 /* Allow time for threads to exit the real Rx function. */
1573 /* now it is safe to reconfigure the RQs */
1576 /* free and reallocate RQs with the new MTU */
1577 for (rq_idx = 0; rq_idx < enic->rq_count; rq_idx++) {
1578 rq = &enic->rq[enic_rte_rq_idx_to_sop_idx(rq_idx)];
1583 rc = enic_alloc_rq(enic, rq_idx, rq->socket_id, rq->mp,
1584 rq->tot_nb_desc, rq->rx_free_thresh);
1587 "Fatal MTU alloc error- No traffic will pass\n");
1591 rc = enic_reinit_rq(enic, rq_idx);
1594 "Fatal MTU RQ reinit- No traffic will pass\n");
1599 /* put back the real receive function */
1601 pick_rx_handler(enic);
1604 /* restart Rx traffic */
1605 for (rq_idx = 0; rq_idx < enic->rq_count; rq_idx++) {
1606 rq = &enic->rq[enic_rte_rq_idx_to_sop_idx(rq_idx)];
1607 if (rq->is_sop && rq->in_use)
1608 enic_start_rq(enic, rq_idx);
1612 dev_info(enic, "MTU changed from %u to %u\n", old_mtu, new_mtu);
1613 rte_spinlock_unlock(&enic->mtu_lock);
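/*
 * Usage sketch (application side, not part of the driver): this path is
 * normally reached through the ethdev API, e.g.
 *
 *	if (rte_eth_dev_set_mtu(port_id, 9000) != 0)
 *		rte_exit(EXIT_FAILURE, "failed to set MTU\n");
 *
 * which calls into enic_set_mtu() via the PMD's mtu_set dev op.
 */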
1617 static int enic_dev_init(struct enic *enic)
1620 struct rte_eth_dev *eth_dev = enic->rte_dev;
1622 vnic_dev_intr_coal_timer_info_default(enic->vdev);
	/* Get vNIC configuration */
1626 err = enic_get_vnic_config(enic);
1628 dev_err(dev, "Get vNIC configuration failed, aborting\n");
1632 /* Get available resource counts */
1633 enic_get_res_counts(enic);
1634 if (enic->conf_rq_count == 1) {
1635 dev_err(enic, "Running with only 1 RQ configured in the vNIC is not supported.\n");
1636 dev_err(enic, "Please configure 2 RQs in the vNIC for each Rx queue used by DPDK.\n");
1637 dev_err(enic, "See the ENIC PMD guide for more information.\n");
	/* Queue counts may be zero. rte_zmalloc returns NULL in that case. */
1641 enic->cq = rte_zmalloc("enic_vnic_cq", sizeof(struct vnic_cq) *
1642 enic->conf_cq_count, 8);
1643 enic->intr = rte_zmalloc("enic_vnic_intr", sizeof(struct vnic_intr) *
1644 enic->conf_intr_count, 8);
1645 enic->rq = rte_zmalloc("enic_vnic_rq", sizeof(struct vnic_rq) *
1646 enic->conf_rq_count, 8);
1647 enic->wq = rte_zmalloc("enic_vnic_wq", sizeof(struct vnic_wq) *
1648 enic->conf_wq_count, 8);
1649 if (enic->conf_cq_count > 0 && enic->cq == NULL) {
1650 dev_err(enic, "failed to allocate vnic_cq, aborting.\n");
1653 if (enic->conf_intr_count > 0 && enic->intr == NULL) {
1654 dev_err(enic, "failed to allocate vnic_intr, aborting.\n");
1657 if (enic->conf_rq_count > 0 && enic->rq == NULL) {
1658 dev_err(enic, "failed to allocate vnic_rq, aborting.\n");
1661 if (enic->conf_wq_count > 0 && enic->wq == NULL) {
1662 dev_err(enic, "failed to allocate vnic_wq, aborting.\n");
1666 /* Get the supported filters */
1667 enic_fdir_info(enic);
1669 eth_dev->data->mac_addrs = rte_zmalloc("enic_mac_addr",
1670 sizeof(struct rte_ether_addr) *
1671 ENIC_UNICAST_PERFECT_FILTERS, 0);
1672 if (!eth_dev->data->mac_addrs) {
1673 dev_err(enic, "mac addr storage alloc failed, aborting.\n");
1676 rte_ether_addr_copy((struct rte_ether_addr *)enic->mac_addr,
1677 eth_dev->data->mac_addrs);
1679 vnic_dev_set_reset_flag(enic->vdev, 0);
1681 LIST_INIT(&enic->flows);
1683 /* set up link status checking */
1684 vnic_dev_notify_set(enic->vdev, -1); /* No Intr for notify */
1686 enic->overlay_offload = false;
1687 if (enic->disable_overlay && enic->vxlan) {
1689 * Explicitly disable overlay offload as the setting is
1690 * sticky, and resetting vNIC does not disable it.
1692 if (vnic_dev_overlay_offload_ctrl(enic->vdev,
1693 OVERLAY_FEATURE_VXLAN,
1694 OVERLAY_OFFLOAD_DISABLE)) {
1695 dev_err(enic, "failed to disable overlay offload\n");
1697 dev_info(enic, "Overlay offload is disabled\n");
1700 if (!enic->disable_overlay && enic->vxlan &&
1701 /* 'VXLAN feature' enables VXLAN, NVGRE, and GENEVE. */
1702 vnic_dev_overlay_offload_ctrl(enic->vdev,
1703 OVERLAY_FEATURE_VXLAN,
1704 OVERLAY_OFFLOAD_ENABLE) == 0) {
1705 enic->tx_offload_capa |=
1706 DEV_TX_OFFLOAD_OUTER_IPV4_CKSUM |
1707 DEV_TX_OFFLOAD_GENEVE_TNL_TSO |
1708 DEV_TX_OFFLOAD_VXLAN_TNL_TSO;
1709 enic->tx_offload_mask |=
			PKT_TX_OUTER_IP_CKSUM |
			PKT_TX_TUNNEL_MASK;
1714 enic->overlay_offload = true;
1715 dev_info(enic, "Overlay offload is enabled\n");
1718 * Reset the vxlan port if HW vxlan parsing is available. It
		 * is always enabled regardless of whether overlay offload is
		 * enabled.
		 */
1723 enic->vxlan_port = ENIC_DEFAULT_VXLAN_PORT;
1725 * Reset the vxlan port to the default, as the NIC firmware
1726 * does not reset it automatically and keeps the old setting.
1728 if (vnic_dev_overlay_offload_cfg(enic->vdev,
1729 OVERLAY_CFG_VXLAN_PORT_UPDATE,
1730 ENIC_DEFAULT_VXLAN_PORT)) {
1731 dev_err(enic, "failed to update vxlan port\n");
1740 int enic_probe(struct enic *enic)
1742 struct rte_pci_device *pdev = enic->pdev;
1745 dev_debug(enic, "Initializing ENIC PMD\n");
1747 /* if this is a secondary process the hardware is already initialized */
1748 if (rte_eal_process_type() != RTE_PROC_PRIMARY)
1751 enic->bar0.vaddr = (void *)pdev->mem_resource[0].addr;
1752 enic->bar0.len = pdev->mem_resource[0].len;
1754 /* Register vNIC device */
1755 enic->vdev = vnic_dev_register(NULL, enic, enic->pdev, &enic->bar0, 1);
1757 dev_err(enic, "vNIC registration failed, aborting\n");
1761 LIST_INIT(&enic->memzone_list);
1762 rte_spinlock_init(&enic->memzone_list_lock);
1764 vnic_register_cbacks(enic->vdev,
1765 enic_alloc_consistent,
1766 enic_free_consistent);
1769 * Allocate the consistent memory for stats upfront so both primary and
1770 * secondary processes can dump stats.
1772 err = vnic_dev_alloc_stats_mem(enic->vdev);
1774 dev_err(enic, "Failed to allocate cmd memory, aborting\n");
1775 goto err_out_unregister;
1777 /* Issue device open to get device in known state */
1778 err = enic_dev_open(enic);
1780 dev_err(enic, "vNIC dev open failed, aborting\n");
1781 goto err_out_unregister;
1784 /* Set ingress vlan rewrite mode before vnic initialization */
1785 dev_debug(enic, "Set ig_vlan_rewrite_mode=%u\n",
1786 enic->ig_vlan_rewrite_mode);
1787 err = vnic_dev_set_ig_vlan_rewrite_mode(enic->vdev,
1788 enic->ig_vlan_rewrite_mode);
1791 "Failed to set ingress vlan rewrite mode, aborting.\n");
1792 goto err_out_dev_close;
1795 /* Issue device init to initialize the vnic-to-switch link.
1796 * We'll start with carrier off and wait for link UP
1797 * notification later to turn on carrier. We don't need
1798 * to wait here for the vnic-to-switch link initialization
1799 * to complete; link UP notification is the indication that
1800 * the process is complete.
1803 err = vnic_dev_init(enic->vdev, 0);
1805 dev_err(enic, "vNIC dev init failed, aborting\n");
1806 goto err_out_dev_close;
1809 err = enic_dev_init(enic);
1811 dev_err(enic, "Device initialization failed, aborting\n");
1812 goto err_out_dev_close;
1818 vnic_dev_close(enic->vdev);
1820 vnic_dev_unregister(enic->vdev);
1825 void enic_remove(struct enic *enic)
1827 enic_dev_deinit(enic);
1828 vnic_dev_close(enic->vdev);
1829 vnic_dev_unregister(enic->vdev);