net/hns3: refactor multi-process initialization
[dpdk.git] / drivers / vdpa / mlx5 / mlx5_vdpa_virtq.c
index 17e71cf..cb37ba0 100644 (file)
@@ -4,6 +4,7 @@
 #include <string.h>
 #include <unistd.h>
 #include <sys/mman.h>
+#include <sys/eventfd.h>
 
 #include <rte_malloc.h>
 #include <rte_errno.h>
@@ -24,7 +25,8 @@ mlx5_vdpa_virtq_handler(void *cb_arg)
        int nbytes;
 
        do {
-               nbytes = read(virtq->intr_handle.fd, &buf, 8);
+               nbytes = read(rte_intr_fd_get(virtq->intr_handle), &buf,
+                             8);
                if (nbytes < 0) {
                        if (errno == EINTR ||
                            errno == EWOULDBLOCK ||
@@ -57,21 +59,23 @@ mlx5_vdpa_virtq_unset(struct mlx5_vdpa_virtq *virtq)
        int retries = MLX5_VDPA_INTR_RETRIES;
        int ret = -EAGAIN;
 
-       if (virtq->intr_handle.fd != -1) {
+       if (rte_intr_fd_get(virtq->intr_handle) != -1) {
                while (retries-- && ret == -EAGAIN) {
-                       ret = rte_intr_callback_unregister(&virtq->intr_handle,
+                       ret = rte_intr_callback_unregister(virtq->intr_handle,
                                                        mlx5_vdpa_virtq_handler,
                                                        virtq);
                        if (ret == -EAGAIN) {
                                DRV_LOG(DEBUG, "Try again to unregister fd %d "
-                                       "of virtq %d interrupt, retries = %d.",
-                                       virtq->intr_handle.fd,
-                                       (int)virtq->index, retries);
+                               "of virtq %d interrupt, retries = %d.",
+                               rte_intr_fd_get(virtq->intr_handle),
+                               (int)virtq->index, retries);
+
                                usleep(MLX5_VDPA_INTR_RETRIES_USEC);
                        }
                }
-               virtq->intr_handle.fd = -1;
+               rte_intr_fd_set(virtq->intr_handle, -1);
        }
+       rte_intr_instance_free(virtq->intr_handle);
        if (virtq->virtq) {
                ret = mlx5_vdpa_virtq_stop(virtq->priv, virtq->index);
                if (ret)
@@ -88,11 +92,6 @@ mlx5_vdpa_virtq_unset(struct mlx5_vdpa_virtq *virtq)
                        rte_free(virtq->umems[i].buf);
        }
        memset(&virtq->umems, 0, sizeof(virtq->umems));
-       if (virtq->counters) {
-               claim_zero(mlx5_devx_cmd_destroy(virtq->counters));
-               virtq->counters = NULL;
-       }
-       memset(&virtq->reset, 0, sizeof(virtq->reset));
        if (virtq->eqp.fw_qp)
                mlx5_vdpa_event_qp_destroy(&virtq->eqp);
        virtq->notifier_state = MLX5_VDPA_NOTIFIER_STATE_DISABLED;
@@ -103,12 +102,19 @@ void
 mlx5_vdpa_virtqs_release(struct mlx5_vdpa_priv *priv)
 {
        int i;
+       struct mlx5_vdpa_virtq *virtq;
 
-       for (i = 0; i < priv->nr_virtqs; i++)
-               mlx5_vdpa_virtq_unset(&priv->virtqs[i]);
-       if (priv->tis) {
-               claim_zero(mlx5_devx_cmd_destroy(priv->tis));
-               priv->tis = NULL;
+       for (i = 0; i < priv->nr_virtqs; i++) {
+               virtq = &priv->virtqs[i];
+               mlx5_vdpa_virtq_unset(virtq);
+               if (virtq->counters)
+                       claim_zero(mlx5_devx_cmd_destroy(virtq->counters));
+       }
+       for (i = 0; i < priv->num_lag_ports; i++) {
+               if (priv->tiss[i]) {
+                       claim_zero(mlx5_devx_cmd_destroy(priv->tiss[i]));
+                       priv->tiss[i] = NULL;
+               }
        }
        if (priv->td) {
                claim_zero(mlx5_devx_cmd_destroy(priv->td));
@@ -119,6 +125,7 @@ mlx5_vdpa_virtqs_release(struct mlx5_vdpa_priv *priv)
                priv->virtq_db_addr = NULL;
        }
        priv->features = 0;
+       memset(priv->virtqs, 0, sizeof(*virtq) * priv->nr_virtqs);
        priv->nr_virtqs = 0;
 }
 
@@ -138,7 +145,6 @@ mlx5_vdpa_virtq_modify(struct mlx5_vdpa_virtq *virtq, int state)
 int
 mlx5_vdpa_virtq_stop(struct mlx5_vdpa_priv *priv, int index)
 {
-       struct mlx5_devx_virtq_attr attr = {0};
        struct mlx5_vdpa_virtq *virtq = &priv->virtqs[index];
        int ret;
 
@@ -148,6 +154,17 @@ mlx5_vdpa_virtq_stop(struct mlx5_vdpa_priv *priv, int index)
        if (ret)
                return -1;
        virtq->stopped = true;
+       DRV_LOG(DEBUG, "vid %u virtq %u was stopped.", priv->vid, index);
+       return mlx5_vdpa_virtq_query(priv, index);
+}
+
+int
+mlx5_vdpa_virtq_query(struct mlx5_vdpa_priv *priv, int index)
+{
+       struct mlx5_devx_virtq_attr attr = {0};
+       struct mlx5_vdpa_virtq *virtq = &priv->virtqs[index];
+       int ret;
+
        if (mlx5_devx_cmd_query_virtq(virtq->virtq, &attr)) {
                DRV_LOG(ERR, "Failed to query virtq %d.", index);
                return -1;
@@ -162,7 +179,9 @@ mlx5_vdpa_virtq_stop(struct mlx5_vdpa_priv *priv, int index)
                DRV_LOG(ERR, "Failed to set virtq %d base.", index);
                return -1;
        }
-       DRV_LOG(DEBUG, "vid %u virtq %u was stopped.", priv->vid, index);
+       if (attr.state == MLX5_VIRTQ_STATE_ERROR)
+               DRV_LOG(WARNING, "vid %d vring %d hw error=%hhu",
+                       priv->vid, index, attr.error_type);
        return 0;
 }
 
@@ -195,6 +214,8 @@ mlx5_vdpa_virtq_setup(struct mlx5_vdpa_priv *priv, int index)
        unsigned int i;
        uint16_t last_avail_idx;
        uint16_t last_used_idx;
+       uint16_t event_num = MLX5_EVENT_TYPE_OBJECT_CHANGE;
+       uint64_t cookie;
 
        ret = rte_vhost_get_vhost_vring(priv->vid, index, &vq);
        if (ret)
@@ -231,8 +252,9 @@ mlx5_vdpa_virtq_setup(struct mlx5_vdpa_priv *priv, int index)
                        " need event QPs and event mechanism.", index);
        }
        if (priv->caps.queue_counters_valid) {
-               virtq->counters = mlx5_devx_cmd_create_virtio_q_counters
-                                                                   (priv->ctx);
+               if (!virtq->counters)
+                       virtq->counters = mlx5_devx_cmd_create_virtio_q_counters
+                                                             (priv->cdev->ctx);
                if (!virtq->counters) {
                        DRV_LOG(ERR, "Failed to create virtq couners for virtq"
                                " %d.", index);
@@ -251,7 +273,7 @@ mlx5_vdpa_virtq_setup(struct mlx5_vdpa_priv *priv, int index)
                                " %u.", i, index);
                        goto error;
                }
-               virtq->umems[i].obj = mlx5_glue->devx_umem_reg(priv->ctx,
+               virtq->umems[i].obj = mlx5_glue->devx_umem_reg(priv->cdev->ctx,
                                                        virtq->umems[i].buf,
                                                        virtq->umems[i].size,
                                                        IBV_ACCESS_LOCAL_WRITE);
@@ -302,10 +324,13 @@ mlx5_vdpa_virtq_setup(struct mlx5_vdpa_priv *priv, int index)
        attr.hw_used_index = last_used_idx;
        attr.q_size = vq.size;
        attr.mkey = priv->gpa_mkey_index;
-       attr.tis_id = priv->tis->id;
+       attr.tis_id = priv->tiss[(index / 2) % priv->num_lag_ports]->id;
        attr.queue_index = index;
-       attr.pd = priv->pdn;
-       virtq->virtq = mlx5_devx_cmd_create_virtq(priv->ctx, &attr);
+       attr.pd = priv->cdev->pdn;
+       attr.hw_latency_mode = priv->hw_latency_mode;
+       attr.hw_max_latency_us = priv->hw_max_latency_us;
+       attr.hw_max_pending_comp = priv->hw_max_pending_comp;
+       virtq->virtq = mlx5_devx_cmd_create_virtq(priv->cdev->ctx, &attr);
        virtq->priv = priv;
        if (!virtq->virtq)
                goto error;
@@ -315,24 +340,52 @@ mlx5_vdpa_virtq_setup(struct mlx5_vdpa_priv *priv, int index)
        virtq->priv = priv;
        rte_write32(virtq->index, priv->virtq_db_addr);
        /* Setup doorbell mapping. */
-       virtq->intr_handle.fd = vq.kickfd;
-       if (virtq->intr_handle.fd == -1) {
+       virtq->intr_handle =
+               rte_intr_instance_alloc(RTE_INTR_INSTANCE_F_SHARED);
+       if (virtq->intr_handle == NULL) {
+               DRV_LOG(ERR, "Fail to allocate intr_handle");
+               goto error;
+       }
+
+       if (rte_intr_fd_set(virtq->intr_handle, vq.kickfd))
+               goto error;
+
+       if (rte_intr_fd_get(virtq->intr_handle) == -1) {
                DRV_LOG(WARNING, "Virtq %d kickfd is invalid.", index);
        } else {
-               virtq->intr_handle.type = RTE_INTR_HANDLE_EXT;
-               if (rte_intr_callback_register(&virtq->intr_handle,
+               if (rte_intr_type_set(virtq->intr_handle, RTE_INTR_HANDLE_EXT))
+                       goto error;
+
+               if (rte_intr_callback_register(virtq->intr_handle,
                                               mlx5_vdpa_virtq_handler,
                                               virtq)) {
-                       virtq->intr_handle.fd = -1;
+                       rte_intr_fd_set(virtq->intr_handle, -1);
                        DRV_LOG(ERR, "Failed to register virtq %d interrupt.",
                                index);
                        goto error;
                } else {
                        DRV_LOG(DEBUG, "Register fd %d interrupt for virtq %d.",
-                               virtq->intr_handle.fd, index);
+                               rte_intr_fd_get(virtq->intr_handle),
+                               index);
                }
        }
+       /* Subscribe virtq error event. */
+       virtq->version++;
+       cookie = ((uint64_t)virtq->version << 32) + index;
+       ret = mlx5_glue->devx_subscribe_devx_event(priv->err_chnl,
+                                                  virtq->virtq->obj,
+                                                  sizeof(event_num),
+                                                  &event_num, cookie);
+       if (ret) {
+               DRV_LOG(ERR, "Failed to subscribe device %d virtq %d error event.",
+                       priv->vid, index);
+               rte_errno = errno;
+               goto error;
+       }
        virtq->stopped = false;
+       /* Initial notification to ask QEMU to handle completed buffers. */
+       if (virtq->eqp.cq.callfd != -1)
+               eventfd_write(virtq->eqp.cq.callfd, (eventfd_t)1);
        DRV_LOG(DEBUG, "vid %u virtq %u was created successfully.", priv->vid,
                index);
        return 0;
@@ -400,6 +453,7 @@ int
 mlx5_vdpa_virtqs_prepare(struct mlx5_vdpa_priv *priv)
 {
        struct mlx5_devx_tis_attr tis_attr = {0};
+       struct ibv_context *ctx = priv->cdev->ctx;
        uint32_t i;
        uint16_t nr_vring = rte_vhost_get_vring_num(priv->vid);
        int ret = rte_vhost_get_negotiated_features(priv->vid, &priv->features);
@@ -408,6 +462,13 @@ mlx5_vdpa_virtqs_prepare(struct mlx5_vdpa_priv *priv)
                DRV_LOG(ERR, "Failed to configure negotiated features.");
                return -1;
        }
+       if ((priv->features & (1ULL << VIRTIO_NET_F_CSUM)) == 0 &&
+           ((priv->features & (1ULL << VIRTIO_NET_F_HOST_TSO4)) > 0 ||
+            (priv->features & (1ULL << VIRTIO_NET_F_HOST_TSO6)) > 0)) {
+               /* Packet may be corrupted if TSO is enabled without CSUM. */
+               DRV_LOG(INFO, "TSO is enabled without CSUM, force CSUM.");
+               priv->features |= (1ULL << VIRTIO_NET_F_CSUM);
+       }
        if (nr_vring > priv->caps.max_num_virtio_queues * 2) {
                DRV_LOG(ERR, "Do not support more than %d virtqs(%d).",
                        (int)priv->caps.max_num_virtio_queues * 2,
@@ -416,7 +477,7 @@ mlx5_vdpa_virtqs_prepare(struct mlx5_vdpa_priv *priv)
        }
        /* Always map the entire page. */
        priv->virtq_db_addr = mmap(NULL, priv->var->length, PROT_READ |
-                                  PROT_WRITE, MAP_SHARED, priv->ctx->cmd_fd,
+                                  PROT_WRITE, MAP_SHARED, ctx->cmd_fd,
                                   priv->var->mmap_off);
        if (priv->virtq_db_addr == MAP_FAILED) {
                DRV_LOG(ERR, "Failed to map doorbell page %u.", errno);
@@ -426,16 +487,20 @@ mlx5_vdpa_virtqs_prepare(struct mlx5_vdpa_priv *priv)
                DRV_LOG(DEBUG, "VAR address of doorbell mapping is %p.",
                        priv->virtq_db_addr);
        }
-       priv->td = mlx5_devx_cmd_create_td(priv->ctx);
+       priv->td = mlx5_devx_cmd_create_td(ctx);
        if (!priv->td) {
                DRV_LOG(ERR, "Failed to create transport domain.");
                return -rte_errno;
        }
        tis_attr.transport_domain = priv->td->id;
-       priv->tis = mlx5_devx_cmd_create_tis(priv->ctx, &tis_attr);
-       if (!priv->tis) {
-               DRV_LOG(ERR, "Failed to create TIS.");
-               goto error;
+       for (i = 0; i < priv->num_lag_ports; i++) {
+               /* 0 means auto affinity; a non-zero value proposes a port. */
+               tis_attr.lag_tx_port_affinity = i + 1;
+               priv->tiss[i] = mlx5_devx_cmd_create_tis(ctx, &tis_attr);
+               if (!priv->tiss[i]) {
+                       DRV_LOG(ERR, "Failed to create TIS %u.", i);
+                       goto error;
+               }
        }
        priv->nr_virtqs = nr_vring;
        for (i = 0; i < nr_vring; i++)
@@ -456,9 +521,10 @@ mlx5_vdpa_virtq_is_modified(struct mlx5_vdpa_priv *priv,
 
        if (ret)
                return -1;
-       if (vq.size != virtq->vq_size || vq.kickfd != virtq->intr_handle.fd)
+       if (vq.size != virtq->vq_size || vq.kickfd !=
+           rte_intr_fd_get(virtq->intr_handle))
                return 1;
-       if (virtq->eqp.cq.cq) {
+       if (virtq->eqp.cq.cq_obj.cq) {
                if (vq.callfd != virtq->eqp.cq.callfd)
                        return 1;
        } else if (vq.callfd != -1) {
@@ -526,12 +592,11 @@ mlx5_vdpa_virtq_stats_get(struct mlx5_vdpa_priv *priv, int qid,
        struct mlx5_devx_virtio_q_couners_attr attr = {0};
        int ret;
 
-       if (!virtq->virtq || !virtq->enable) {
+       if (!virtq->counters) {
                DRV_LOG(ERR, "Failed to read virtq %d statistics - virtq "
                        "is invalid.", qid);
                return -EINVAL;
        }
-       MLX5_ASSERT(virtq->counters);
        ret = mlx5_devx_cmd_query_virtio_q_counters(virtq->counters, &attr);
        if (ret) {
                DRV_LOG(ERR, "Failed to read virtq %d stats from HW.", qid);
@@ -583,12 +648,11 @@ mlx5_vdpa_virtq_stats_reset(struct mlx5_vdpa_priv *priv, int qid)
        struct mlx5_vdpa_virtq *virtq = &priv->virtqs[qid];
        int ret;
 
-       if (!virtq->virtq || !virtq->enable) {
+       if (!virtq->counters) {
                DRV_LOG(ERR, "Failed to read virtq %d statistics - virtq "
                        "is invalid.", qid);
                return -EINVAL;
        }
-       MLX5_ASSERT(virtq->counters);
        ret = mlx5_devx_cmd_query_virtio_q_counters(virtq->counters,
                                                    &virtq->reset);
        if (ret)