1 /* SPDX-License-Identifier: BSD-3-Clause
2 * Copyright 2015 6WIND S.A.
3 * Copyright 2015 Mellanox Technologies, Ltd
9 #include <rte_ethdev_driver.h>
10 #include <rte_interrupts.h>
11 #include <rte_alarm.h>
15 #include "mlx5_rxtx.h"
16 #include "mlx5_utils.h"
17 #include "rte_pmd_mlx5.h"
20 * Stop traffic on Tx queues.
23 * Pointer to Ethernet device structure.
26 mlx5_txq_stop(struct rte_eth_dev *dev)
28 struct mlx5_priv *priv = dev->data->dev_private;
31 for (i = 0; i != priv->txqs_n; ++i)
32 mlx5_txq_release(dev, i);
36 * Start traffic on Tx queues.
39 * Pointer to Ethernet device structure.
42 * 0 on success, a negative errno value otherwise and rte_errno is set.
45 mlx5_txq_start(struct rte_eth_dev *dev)
47 struct mlx5_priv *priv = dev->data->dev_private;
51 for (i = 0; i != priv->txqs_n; ++i) {
52 struct mlx5_txq_ctrl *txq_ctrl = mlx5_txq_get(dev, i);
56 if (txq_ctrl->type == MLX5_TXQ_TYPE_HAIRPIN) {
57 txq_ctrl->obj = mlx5_txq_obj_new
58 (dev, i, MLX5_TXQ_OBJ_TYPE_DEVX_HAIRPIN);
60 txq_alloc_elts(txq_ctrl);
61 txq_ctrl->obj = mlx5_txq_obj_new
62 (dev, i, MLX5_TXQ_OBJ_TYPE_IBV);
71 ret = rte_errno; /* Save rte_errno before cleanup. */
73 mlx5_txq_release(dev, i);
75 rte_errno = ret; /* Restore rte_errno. */
80 * Stop traffic on Rx queues.
83 * Pointer to Ethernet device structure.
86 mlx5_rxq_stop(struct rte_eth_dev *dev)
88 struct mlx5_priv *priv = dev->data->dev_private;
91 for (i = 0; i != priv->rxqs_n; ++i)
92 mlx5_rxq_release(dev, i);
96 * Start traffic on Rx queues.
99 * Pointer to Ethernet device structure.
102 * 0 on success, a negative errno value otherwise and rte_errno is set.
105 mlx5_rxq_start(struct rte_eth_dev *dev)
107 struct mlx5_priv *priv = dev->data->dev_private;
110 enum mlx5_rxq_obj_type obj_type =
111 priv->config.dv_flow_en && priv->config.devx &&
112 priv->config.dest_tir ?
113 MLX5_RXQ_OBJ_TYPE_DEVX_RQ : MLX5_RXQ_OBJ_TYPE_IBV;
115 /* Allocate/reuse/resize mempool for Multi-Packet RQ. */
116 if (mlx5_mprq_alloc_mp(dev)) {
117 /* Should not release Rx queues but return immediately. */
120 for (i = 0; i != priv->rxqs_n; ++i) {
121 struct mlx5_rxq_ctrl *rxq_ctrl = mlx5_rxq_get(dev, i);
122 struct rte_mempool *mp;
126 if (rxq_ctrl->type == MLX5_RXQ_TYPE_HAIRPIN) {
127 rxq_ctrl->obj = mlx5_rxq_obj_new
128 (dev, i, MLX5_RXQ_OBJ_TYPE_DEVX_HAIRPIN);
133 /* Pre-register Rx mempool. */
134 mp = mlx5_rxq_mprq_enabled(&rxq_ctrl->rxq) ?
135 rxq_ctrl->rxq.mprq_mp : rxq_ctrl->rxq.mp;
137 "port %u Rx queue %u registering"
138 " mp %s having %u chunks",
139 dev->data->port_id, rxq_ctrl->rxq.idx,
140 mp->name, mp->nb_mem_chunks);
141 mlx5_mr_update_mp(dev, &rxq_ctrl->rxq.mr_ctrl, mp);
142 ret = rxq_alloc_elts(rxq_ctrl);
145 rxq_ctrl->obj = mlx5_rxq_obj_new(dev, i, obj_type);
148 if (obj_type == MLX5_RXQ_OBJ_TYPE_IBV)
149 rxq_ctrl->wqn = rxq_ctrl->obj->wq->wq_num;
150 else if (obj_type == MLX5_RXQ_OBJ_TYPE_DEVX_RQ)
151 rxq_ctrl->wqn = rxq_ctrl->obj->rq->id;
155 ret = rte_errno; /* Save rte_errno before cleanup. */
157 mlx5_rxq_release(dev, i);
159 rte_errno = ret; /* Restore rte_errno. */
164 * Binds Tx queues to Rx queues for hairpin.
166 * Binds Tx queues to the target Rx queues.
169 * Pointer to Ethernet device structure.
172 * 0 on success, a negative errno value otherwise and rte_errno is set.
175 mlx5_hairpin_bind(struct rte_eth_dev *dev)
177 struct mlx5_priv *priv = dev->data->dev_private;
178 struct mlx5_devx_modify_sq_attr sq_attr = { 0 };
179 struct mlx5_devx_modify_rq_attr rq_attr = { 0 };
180 struct mlx5_txq_ctrl *txq_ctrl;
181 struct mlx5_rxq_ctrl *rxq_ctrl;
182 struct mlx5_devx_obj *sq;
183 struct mlx5_devx_obj *rq;
187 for (i = 0; i != priv->txqs_n; ++i) {
188 txq_ctrl = mlx5_txq_get(dev, i);
191 if (txq_ctrl->type != MLX5_TXQ_TYPE_HAIRPIN) {
192 mlx5_txq_release(dev, i);
195 if (!txq_ctrl->obj) {
197 DRV_LOG(ERR, "port %u no txq object found: %d",
198 dev->data->port_id, i);
199 mlx5_txq_release(dev, i);
202 sq = txq_ctrl->obj->sq;
203 rxq_ctrl = mlx5_rxq_get(dev,
204 txq_ctrl->hairpin_conf.peers[0].queue);
206 mlx5_txq_release(dev, i);
208 DRV_LOG(ERR, "port %u no rxq object found: %d",
210 txq_ctrl->hairpin_conf.peers[0].queue);
213 if (rxq_ctrl->type != MLX5_RXQ_TYPE_HAIRPIN ||
214 rxq_ctrl->hairpin_conf.peers[0].queue != i) {
216 DRV_LOG(ERR, "port %u Tx queue %d can't be binded to "
217 "Rx queue %d", dev->data->port_id,
218 i, txq_ctrl->hairpin_conf.peers[0].queue);
221 rq = rxq_ctrl->obj->rq;
224 DRV_LOG(ERR, "port %u hairpin no matching rxq: %d",
226 txq_ctrl->hairpin_conf.peers[0].queue);
229 sq_attr.state = MLX5_SQC_STATE_RDY;
230 sq_attr.sq_state = MLX5_SQC_STATE_RST;
231 sq_attr.hairpin_peer_rq = rq->id;
232 sq_attr.hairpin_peer_vhca = priv->config.hca_attr.vhca_id;
233 ret = mlx5_devx_cmd_modify_sq(sq, &sq_attr);
236 rq_attr.state = MLX5_SQC_STATE_RDY;
237 rq_attr.rq_state = MLX5_SQC_STATE_RST;
238 rq_attr.hairpin_peer_sq = sq->id;
239 rq_attr.hairpin_peer_vhca = priv->config.hca_attr.vhca_id;
240 ret = mlx5_devx_cmd_modify_rq(rq, &rq_attr);
243 mlx5_txq_release(dev, i);
244 mlx5_rxq_release(dev, txq_ctrl->hairpin_conf.peers[0].queue);
248 mlx5_txq_release(dev, i);
249 mlx5_rxq_release(dev, txq_ctrl->hairpin_conf.peers[0].queue);
254 * DPDK callback to start the device.
256 * Simulate device start by attaching all configured flows.
259 * Pointer to Ethernet device structure.
262 * 0 on success, a negative errno value otherwise and rte_errno is set.
265 mlx5_dev_start(struct rte_eth_dev *dev)
270 DRV_LOG(DEBUG, "port %u starting device", dev->data->port_id);
271 fine_inline = rte_mbuf_dynflag_lookup
272 (RTE_PMD_MLX5_FINE_GRANULARITY_INLINE, NULL);
274 rte_net_mlx5_dynf_inline_mask = 1UL << fine_inline;
276 rte_net_mlx5_dynf_inline_mask = 0;
277 if (dev->data->nb_rx_queues > 0) {
278 ret = mlx5_dev_configure_rss_reta(dev);
280 DRV_LOG(ERR, "port %u reta config failed: %s",
281 dev->data->port_id, strerror(rte_errno));
285 ret = mlx5_txq_start(dev);
287 DRV_LOG(ERR, "port %u Tx queue allocation failed: %s",
288 dev->data->port_id, strerror(rte_errno));
291 ret = mlx5_rxq_start(dev);
293 DRV_LOG(ERR, "port %u Rx queue allocation failed: %s",
294 dev->data->port_id, strerror(rte_errno));
298 ret = mlx5_hairpin_bind(dev);
300 DRV_LOG(ERR, "port %u hairpin binding failed: %s",
301 dev->data->port_id, strerror(rte_errno));
305 /* Set started flag here for the following steps like control flow. */
306 dev->data->dev_started = 1;
307 ret = mlx5_rx_intr_vec_enable(dev);
309 DRV_LOG(ERR, "port %u Rx interrupt vector creation failed",
313 mlx5_stats_init(dev);
314 ret = mlx5_traffic_enable(dev);
316 DRV_LOG(ERR, "port %u failed to set defaults flows",
320 /* Set a mask and offset of dynamic metadata flows into Rx queues*/
321 mlx5_flow_rxq_dynf_metadata_set(dev);
323 * In non-cached mode, it only needs to start the default mreg copy
324 * action and no flow created by application exists anymore.
325 * But it is worth wrapping the interface for further usage.
327 ret = mlx5_flow_start_default(dev);
329 DRV_LOG(DEBUG, "port %u failed to start default actions: %s",
330 dev->data->port_id, strerror(rte_errno));
334 dev->tx_pkt_burst = mlx5_select_tx_function(dev);
335 dev->rx_pkt_burst = mlx5_select_rx_function(dev);
336 /* Enable datapath on secondary process. */
337 mlx5_mp_req_start_rxtx(dev);
338 mlx5_dev_interrupt_handler_install(dev);
341 ret = rte_errno; /* Save rte_errno before cleanup. */
343 dev->data->dev_started = 0;
344 mlx5_flow_stop_default(dev);
345 mlx5_traffic_disable(dev);
348 rte_errno = ret; /* Restore rte_errno. */
353 * DPDK callback to stop the device.
355 * Simulate device stop by detaching all configured flows.
358 * Pointer to Ethernet device structure.
361 mlx5_dev_stop(struct rte_eth_dev *dev)
363 struct mlx5_priv *priv = dev->data->dev_private;
365 dev->data->dev_started = 0;
366 /* Prevent crashes when queues are still in use. */
367 dev->rx_pkt_burst = removed_rx_burst;
368 dev->tx_pkt_burst = removed_tx_burst;
370 /* Disable datapath on secondary process. */
371 mlx5_mp_req_stop_rxtx(dev);
372 usleep(1000 * priv->rxqs_n);
373 DRV_LOG(DEBUG, "port %u stopping device", dev->data->port_id);
374 mlx5_flow_stop_default(dev);
375 /* Control flows for default traffic can be removed firstly. */
376 mlx5_traffic_disable(dev);
377 /* All RX queue flags will be cleared in the flush interface. */
378 mlx5_flow_list_flush(dev, &priv->flows, true);
379 mlx5_rx_intr_vec_disable(dev);
380 mlx5_dev_interrupt_handler_uninstall(dev);
386 * Enable traffic flows configured by control plane
389 * Pointer to Ethernet device private data.
391 * Pointer to Ethernet device structure.
394 * 0 on success, a negative errno value otherwise and rte_errno is set.
397 mlx5_traffic_enable(struct rte_eth_dev *dev)
399 struct mlx5_priv *priv = dev->data->dev_private;
400 struct rte_flow_item_eth bcast = {
401 .dst.addr_bytes = "\xff\xff\xff\xff\xff\xff",
403 struct rte_flow_item_eth ipv6_multi_spec = {
404 .dst.addr_bytes = "\x33\x33\x00\x00\x00\x00",
406 struct rte_flow_item_eth ipv6_multi_mask = {
407 .dst.addr_bytes = "\xff\xff\x00\x00\x00\x00",
409 struct rte_flow_item_eth unicast = {
410 .src.addr_bytes = "\x00\x00\x00\x00\x00\x00",
412 struct rte_flow_item_eth unicast_mask = {
413 .dst.addr_bytes = "\xff\xff\xff\xff\xff\xff",
415 const unsigned int vlan_filter_n = priv->vlan_filter_n;
416 const struct rte_ether_addr cmp = {
417 .addr_bytes = "\x00\x00\x00\x00\x00\x00",
424 * Hairpin txq default flow should be created no matter if it is
425 * isolation mode. Or else all the packets to be sent will be sent
426 * out directly without the TX flow actions, e.g. encapsulation.
428 for (i = 0; i != priv->txqs_n; ++i) {
429 struct mlx5_txq_ctrl *txq_ctrl = mlx5_txq_get(dev, i);
432 if (txq_ctrl->type == MLX5_TXQ_TYPE_HAIRPIN) {
433 ret = mlx5_ctrl_flow_source_queue(dev, i);
435 mlx5_txq_release(dev, i);
439 mlx5_txq_release(dev, i);
441 if (priv->config.dv_esw_en && !priv->config.vf) {
442 if (mlx5_flow_create_esw_table_zero_flow(dev))
443 priv->fdb_def_rule = 1;
445 DRV_LOG(INFO, "port %u FDB default rule cannot be"
446 " configured - only Eswitch group 0 flows are"
447 " supported.", dev->data->port_id);
451 if (dev->data->promiscuous) {
452 struct rte_flow_item_eth promisc = {
453 .dst.addr_bytes = "\x00\x00\x00\x00\x00\x00",
454 .src.addr_bytes = "\x00\x00\x00\x00\x00\x00",
458 ret = mlx5_ctrl_flow(dev, &promisc, &promisc);
462 if (dev->data->all_multicast) {
463 struct rte_flow_item_eth multicast = {
464 .dst.addr_bytes = "\x01\x00\x00\x00\x00\x00",
465 .src.addr_bytes = "\x00\x00\x00\x00\x00\x00",
469 ret = mlx5_ctrl_flow(dev, &multicast, &multicast);
473 /* Add broadcast/multicast flows. */
474 for (i = 0; i != vlan_filter_n; ++i) {
475 uint16_t vlan = priv->vlan_filter[i];
477 struct rte_flow_item_vlan vlan_spec = {
478 .tci = rte_cpu_to_be_16(vlan),
480 struct rte_flow_item_vlan vlan_mask =
481 rte_flow_item_vlan_mask;
483 ret = mlx5_ctrl_flow_vlan(dev, &bcast, &bcast,
484 &vlan_spec, &vlan_mask);
487 ret = mlx5_ctrl_flow_vlan(dev, &ipv6_multi_spec,
489 &vlan_spec, &vlan_mask);
493 if (!vlan_filter_n) {
494 ret = mlx5_ctrl_flow(dev, &bcast, &bcast);
497 ret = mlx5_ctrl_flow(dev, &ipv6_multi_spec,
503 /* Add MAC address flows. */
504 for (i = 0; i != MLX5_MAX_MAC_ADDRESSES; ++i) {
505 struct rte_ether_addr *mac = &dev->data->mac_addrs[i];
507 if (!memcmp(mac, &cmp, sizeof(*mac)))
509 memcpy(&unicast.dst.addr_bytes,
512 for (j = 0; j != vlan_filter_n; ++j) {
513 uint16_t vlan = priv->vlan_filter[j];
515 struct rte_flow_item_vlan vlan_spec = {
516 .tci = rte_cpu_to_be_16(vlan),
518 struct rte_flow_item_vlan vlan_mask =
519 rte_flow_item_vlan_mask;
521 ret = mlx5_ctrl_flow_vlan(dev, &unicast,
528 if (!vlan_filter_n) {
529 ret = mlx5_ctrl_flow(dev, &unicast, &unicast_mask);
536 ret = rte_errno; /* Save rte_errno before cleanup. */
537 mlx5_flow_list_flush(dev, &priv->ctrl_flows, false);
538 rte_errno = ret; /* Restore rte_errno. */
544 * Disable traffic flows configured by control plane
547 * Pointer to Ethernet device private data.
550 mlx5_traffic_disable(struct rte_eth_dev *dev)
552 struct mlx5_priv *priv = dev->data->dev_private;
554 mlx5_flow_list_flush(dev, &priv->ctrl_flows, false);
558 * Restart traffic flows configured by control plane
561 * Pointer to Ethernet device private data.
564 * 0 on success, a negative errno value otherwise and rte_errno is set.
567 mlx5_traffic_restart(struct rte_eth_dev *dev)
569 if (dev->data->dev_started) {
570 mlx5_traffic_disable(dev);
571 return mlx5_traffic_enable(dev);