4 * Copyright 2017 6WIND S.A.
5 * Copyright 2017 Mellanox
7 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following conditions
11 * * Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 * * Redistributions in binary form must reproduce the above copyright
14 * notice, this list of conditions and the following disclaimer in
15 * the documentation and/or other materials provided with the
17 * * Neither the name of 6WIND S.A. nor the names of its
18 * contributors may be used to endorse or promote products derived
19 * from this software without specific prior written permission.
21 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
22 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
23 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
24 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
25 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
26 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
27 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
28 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
29 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
30 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
31 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
36 * Interrupts handling for mlx4 driver.
44 /* Verbs headers do not support -pedantic. */
46 #pragma GCC diagnostic ignored "-Wpedantic"
48 #include <infiniband/verbs.h>
50 #pragma GCC diagnostic error "-Wpedantic"
53 #include <rte_alarm.h>
54 #include <rte_errno.h>
55 #include <rte_ethdev.h>
57 #include <rte_interrupts.h>
60 #include "mlx4_rxtx.h"
61 #include "mlx4_utils.h"
63 static int mlx4_link_status_check(struct priv *priv);
66 * Clean up Rx interrupts handler.
69 * Pointer to private structure.
72 mlx4_rx_intr_vec_disable(struct priv *priv)
74 struct rte_intr_handle *intr_handle = &priv->intr_handle;
76 rte_intr_free_epoll_fd(intr_handle);
77 free(intr_handle->intr_vec);
78 intr_handle->nb_efd = 0;
79 intr_handle->intr_vec = NULL;
83 * Allocate queue vector and fill epoll fd list for Rx interrupts.
86 * Pointer to private structure.
89 * 0 on success, negative errno value otherwise and rte_errno is set.
92 mlx4_rx_intr_vec_enable(struct priv *priv)
95 unsigned int rxqs_n = priv->dev->data->nb_rx_queues;
96 unsigned int n = RTE_MIN(rxqs_n, (uint32_t)RTE_MAX_RXTX_INTR_VEC_ID);
97 unsigned int count = 0;
98 struct rte_intr_handle *intr_handle = &priv->intr_handle;
100 mlx4_rx_intr_vec_disable(priv);
101 intr_handle->intr_vec = malloc(sizeof(intr_handle->intr_vec[rxqs_n]));
102 if (intr_handle->intr_vec == NULL) {
104 ERROR("failed to allocate memory for interrupt vector,"
105 " Rx interrupts will not be supported");
108 for (i = 0; i != n; ++i) {
109 struct rxq *rxq = priv->dev->data->rx_queues[i];
111 /* Skip queues that cannot request interrupts. */
112 if (!rxq || !rxq->channel) {
113 /* Use invalid intr_vec[] index to disable entry. */
114 intr_handle->intr_vec[i] =
115 RTE_INTR_VEC_RXTX_OFFSET +
116 RTE_MAX_RXTX_INTR_VEC_ID;
119 if (count >= RTE_MAX_RXTX_INTR_VEC_ID) {
121 ERROR("too many Rx queues for interrupt vector size"
122 " (%d), Rx interrupts cannot be enabled",
123 RTE_MAX_RXTX_INTR_VEC_ID);
124 mlx4_rx_intr_vec_disable(priv);
127 intr_handle->intr_vec[i] = RTE_INTR_VEC_RXTX_OFFSET + count;
128 intr_handle->efds[count] = rxq->channel->fd;
132 mlx4_rx_intr_vec_disable(priv);
134 intr_handle->nb_efd = count;
139 * Process scheduled link status check.
141 * If LSC interrupts are requested, process related callback.
144 * Pointer to private structure.
147 mlx4_link_status_alarm(struct priv *priv)
149 const struct rte_intr_conf *const intr_conf =
150 &priv->dev->data->dev_conf.intr_conf;
152 assert(priv->intr_alarm == 1);
153 priv->intr_alarm = 0;
154 if (intr_conf->lsc && !mlx4_link_status_check(priv))
155 _rte_eth_dev_callback_process(priv->dev,
156 RTE_ETH_EVENT_INTR_LSC,
163 * In case of inconsistency, another check is scheduled.
166 * Pointer to private structure.
169 * 0 on success (link status is consistent), negative errno value
170 * otherwise and rte_errno is set.
173 mlx4_link_status_check(struct priv *priv)
175 struct rte_eth_link *link = &priv->dev->data->dev_link;
176 int ret = mlx4_link_update(priv->dev, 0);
180 if ((!link->link_speed && link->link_status) ||
181 (link->link_speed && !link->link_status)) {
182 if (!priv->intr_alarm) {
183 /* Inconsistent status, check again later. */
184 ret = rte_eal_alarm_set(MLX4_INTR_ALARM_TIMEOUT,
186 mlx4_link_status_alarm,
190 priv->intr_alarm = 1;
192 rte_errno = EINPROGRESS;
199 * Handle interrupts from the NIC.
202 * Pointer to private structure.
205 mlx4_interrupt_handler(struct priv *priv)
208 static const enum rte_eth_event_type type[] = {
209 [LSC] = RTE_ETH_EVENT_INTR_LSC,
210 [RMV] = RTE_ETH_EVENT_INTR_RMV,
212 uint32_t caught[RTE_DIM(type)] = { 0 };
213 struct ibv_async_event event;
214 const struct rte_intr_conf *const intr_conf =
215 &priv->dev->data->dev_conf.intr_conf;
218 /* Read all message and acknowledge them. */
219 while (!ibv_get_async_event(priv->ctx, &event)) {
220 switch (event.event_type) {
221 case IBV_EVENT_PORT_ACTIVE:
222 case IBV_EVENT_PORT_ERR:
223 if (intr_conf->lsc && !mlx4_link_status_check(priv))
226 case IBV_EVENT_DEVICE_FATAL:
231 DEBUG("event type %d on physical port %d not handled",
232 event.event_type, event.element.port_num);
234 ibv_ack_async_event(&event);
236 for (i = 0; i != RTE_DIM(caught); ++i)
238 _rte_eth_dev_callback_process(priv->dev, type[i],
243 * MLX4 CQ notification .
246 * Pointer to receive queue structure.
248 * Is request solicited or not.
251 mlx4_arm_cq(struct rxq *rxq, int solicited)
253 struct mlx4_cq *cq = &rxq->mcq;
255 uint32_t sn = cq->arm_sn & MLX4_CQ_DB_GEQ_N_MASK;
256 uint32_t ci = cq->cons_index & MLX4_CQ_DB_CI_MASK;
257 uint32_t cmd = solicited ? MLX4_CQ_DB_REQ_NOT_SOL : MLX4_CQ_DB_REQ_NOT;
259 *cq->arm_db = rte_cpu_to_be_32(sn << 28 | cmd | ci);
261 * Make sure that the doorbell record in host memory is
262 * written before ringing the doorbell via PCI MMIO.
265 doorbell = sn << 28 | cmd | cq->cqn;
268 rte_write64(rte_cpu_to_be_64(doorbell), cq->cq_db_reg);
272 * Uninstall interrupt handler.
275 * Pointer to private structure.
278 * 0 on success, negative errno value otherwise and rte_errno is set.
281 mlx4_intr_uninstall(struct priv *priv)
283 int err = rte_errno; /* Make sure rte_errno remains unchanged. */
285 if (priv->intr_handle.fd != -1) {
286 rte_intr_callback_unregister(&priv->intr_handle,
288 mlx4_interrupt_handler,
290 priv->intr_handle.fd = -1;
292 rte_eal_alarm_cancel((void (*)(void *))mlx4_link_status_alarm, priv);
293 priv->intr_alarm = 0;
294 mlx4_rx_intr_vec_disable(priv);
300 * Install interrupt handler.
303 * Pointer to private structure.
306 * 0 on success, negative errno value otherwise and rte_errno is set.
309 mlx4_intr_install(struct priv *priv)
311 const struct rte_intr_conf *const intr_conf =
312 &priv->dev->data->dev_conf.intr_conf;
315 mlx4_intr_uninstall(priv);
316 if (intr_conf->rxq && mlx4_rx_intr_vec_enable(priv) < 0)
318 if (intr_conf->lsc | intr_conf->rmv) {
319 priv->intr_handle.fd = priv->ctx->async_fd;
320 rc = rte_intr_callback_register(&priv->intr_handle,
322 mlx4_interrupt_handler,
331 mlx4_intr_uninstall(priv);
336 * DPDK callback for Rx queue interrupt disable.
339 * Pointer to Ethernet device structure.
344 * 0 on success, negative errno value otherwise and rte_errno is set.
347 mlx4_rx_intr_disable(struct rte_eth_dev *dev, uint16_t idx)
349 struct rxq *rxq = dev->data->rx_queues[idx];
350 struct ibv_cq *ev_cq;
354 if (!rxq || !rxq->channel) {
357 ret = ibv_get_cq_event(rxq->cq->channel, &ev_cq, &ev_ctx);
358 if (ret || ev_cq != rxq->cq)
363 WARN("unable to disable interrupt on rx queue %d",
367 ibv_ack_cq_events(rxq->cq, 1);
373 * DPDK callback for Rx queue interrupt enable.
376 * Pointer to Ethernet device structure.
381 * 0 on success, negative errno value otherwise and rte_errno is set.
384 mlx4_rx_intr_enable(struct rte_eth_dev *dev, uint16_t idx)
386 struct rxq *rxq = dev->data->rx_queues[idx];
389 if (!rxq || !rxq->channel) {
392 WARN("unable to arm interrupt on rx queue %d", idx);