net/mlx5: add 128B padding of Rx completion entry

author Yongseok Koh <yskoh@mellanox.com>

Thu, 25 Oct 2018 06:24:00 +0000 (06:24 +0000)

committer Ferruh Yigit <ferruh.yigit@intel.com>

Mon, 5 Nov 2018 14:01:25 +0000 (15:01 +0100)
author Yongseok Koh <yskoh@mellanox.com>
Thu, 25 Oct 2018 06:24:00 +0000 (06:24 +0000)
committer Ferruh Yigit <ferruh.yigit@intel.com>
Mon, 5 Nov 2018 14:01:25 +0000 (15:01 +0100)
diff --git a/doc/guides/nics/mlx5.rst b/doc/guides/nics/mlx5.rst

index 67696283e51bb35541648ff737875e4a9a021a08..1dc32829ffa033895efac32bb1c985509b95550d 100644 (file)
--- a/doc/guides/nics/mlx5.rst
+++ b/doc/guides/nics/mlx5.rst
@@ -246,6 +246,24 @@ Run-time configuration
    - x86_64 with ConnectX-4, ConnectX-4 LX, ConnectX-5 and Bluefield.
    - POWER8 and ARMv8 with ConnectX-4 LX, ConnectX-5 and Bluefield.
  
+- ``rxq_cqe_pad_en`` parameter [int]
+
+  A nonzero value enables 128B padding of CQE on RX side. The size of CQE
+  is aligned with the size of a cacheline of the core. If cacheline size is
+  128B, the CQE size is configured to be 128B even though the device writes
+  only 64B data on the cacheline. This is to avoid unnecessary cache
+  invalidation by device's two consecutive writes on to one cacheline.
+  However in some architecture, it is more beneficial to update entire
+  cacheline with padding the rest 64B rather than striding because
+  read-modify-write could drop performance a lot. On the other hand,
+  writing extra data will consume more PCIe bandwidth and could also drop
+  the maximum throughput. It is recommended to empirically set this
+  parameter. Disabled by default.
+
+  Supported on:
+
+  - CPU having 128B cacheline with ConnectX-5 and Bluefield.
+
  - ``mprq_en`` parameter [int]
  
    A nonzero value enables configuring Multi-Packet Rx queues. Rx queue is
diff --git a/drivers/net/mlx5/Makefile b/drivers/net/mlx5/Makefile

index 0beb139eacf8e1636c09791ca9eb8b1b71f025ef..ba433d35bbc573171a287acdf2acfca643cc0d45 100644 (file)
--- a/drivers/net/mlx5/Makefile
+++ b/drivers/net/mlx5/Makefile
@@ -137,6 +137,11 @@ mlx5_autoconf.h.new: $(RTE_SDK)/buildtools/auto-config-h.sh
                 infiniband/mlx5dv.h \
                 enum MLX5DV_CONTEXT_FLAGS_CQE_128B_COMP \
                 $(AUTOCONF_OUTPUT)
+       $Q sh -- '$<' '$@' \
+               HAVE_IBV_MLX5_MOD_CQE_128B_PAD \
+               infiniband/mlx5dv.h \
+               enum MLX5DV_CQ_INIT_ATTR_FLAGS_CQE_PAD \
+               $(AUTOCONF_OUTPUT)
         $Q sh -- '$<' '$@' \
                 HAVE_IBV_FLOW_DV_SUPPORT \
                 infiniband/mlx5dv.h \
diff --git a/drivers/net/mlx5/meson.build b/drivers/net/mlx5/meson.build

index e8cbe3eec1794d3f85fb55ec3705c2384c6c579d..f8e0c1b65b0a1bd474b65d473b5332bf89dc3a22 100644 (file)
--- a/drivers/net/mlx5/meson.build
+++ b/drivers/net/mlx5/meson.build
@@ -96,6 +96,8 @@ if build
                 'MLX5DV_CONTEXT_FLAGS_MPW_ALLOWED' ],
                 [ 'HAVE_IBV_MLX5_MOD_CQE_128B_COMP', 'infiniband/mlx5dv.h',
                 'MLX5DV_CONTEXT_FLAGS_CQE_128B_COMP' ],
+               [ 'HAVE_IBV_MLX5_MOD_CQE_128B_PAD', 'infiniband/mlx5dv.h',
+               'MLX5DV_CQ_INIT_ATTR_FLAGS_CQE_PAD' ],
                 [ 'HAVE_IBV_FLOW_DV_SUPPORT', 'infiniband/mlx5dv.h',
                 'MLX5DV_FLOW_ACTION_TAG' ],
                 [ 'HAVE_IBV_DEVICE_MPLS_SUPPORT', 'infiniband/verbs.h',
diff --git a/drivers/net/mlx5/mlx5.c b/drivers/net/mlx5/mlx5.c

index a277b5730e70d393c8ad7a9084e10ab510ecc444..ec6a482a9a1e3cf9c8d1f06695736f94179d8796 100644 (file)
--- a/drivers/net/mlx5/mlx5.c
+++ b/drivers/net/mlx5/mlx5.c
@@ -51,6 +51,9 @@
  /* Device parameter to enable RX completion queue compression. */
  #define MLX5_RXQ_CQE_COMP_EN "rxq_cqe_comp_en"
  
+/* Device parameter to enable RX completion entry padding to 128B. */
+#define MLX5_RXQ_CQE_PAD_EN "rxq_cqe_pad_en"
+
  /* Device parameter to enable Multi-Packet Rx queue. */
  #define MLX5_RX_MPRQ_EN "mprq_en"
  
@@ -479,6 +482,8 @@ mlx5_args_check(const char *key, const char *val, void *opaque)
         }
         if (strcmp(MLX5_RXQ_CQE_COMP_EN, key) == 0) {
                 config->cqe_comp = !!tmp;
+       } else if (strcmp(MLX5_RXQ_CQE_PAD_EN, key) == 0) {
+               config->cqe_pad = !!tmp;
         } else if (strcmp(MLX5_RX_MPRQ_EN, key) == 0) {
                 config->mprq.enabled = !!tmp;
         } else if (strcmp(MLX5_RX_MPRQ_LOG_STRIDE_NUM, key) == 0) {
@@ -531,6 +536,7 @@ mlx5_args(struct mlx5_dev_config *config, struct rte_devargs *devargs)
  {
         const char **params = (const char *[]){
                 MLX5_RXQ_CQE_COMP_EN,
+               MLX5_RXQ_CQE_PAD_EN,
                 MLX5_RX_MPRQ_EN,
                 MLX5_RX_MPRQ_LOG_STRIDE_NUM,
                 MLX5_RX_MPRQ_MAX_MEMCPY_LEN,
@@ -723,6 +729,7 @@ mlx5_dev_spawn(struct rte_device *dpdk_dev,
         struct mlx5dv_context dv_attr = { .comp_mask = 0 };
         struct mlx5_dev_config config = {
                 .vf = !!vf,
+               .cqe_pad = 0,
                 .mps = MLX5_ARG_UNSET,
                 .tx_vec_en = 1,
                 .rx_vec_en = 1,
@@ -743,6 +750,7 @@ mlx5_dev_spawn(struct rte_device *dpdk_dev,
         int err = 0;
         unsigned int mps;
         unsigned int cqe_comp;
+       unsigned int cqe_pad = 0;
         unsigned int tunnel_en = 0;
         unsigned int mpls_en = 0;
         unsigned int swp = 0;
@@ -863,6 +871,11 @@ mlx5_dev_spawn(struct rte_device *dpdk_dev,
         else
                 cqe_comp = 1;
         config.cqe_comp = cqe_comp;
+#ifdef HAVE_IBV_MLX5_MOD_CQE_128B_PAD
+       /* Whether device supports 128B Rx CQE padding. */
+       cqe_pad = RTE_CACHE_LINE_SIZE == 128 &&
+                 (dv_attr.flags & MLX5DV_CONTEXT_FLAGS_CQE_128B_PAD);
+#endif
  #ifdef HAVE_IBV_DEVICE_TUNNEL_SUPPORT
         if (dv_attr.comp_mask & MLX5DV_CONTEXT_MASK_TUNNEL_OFFLOADS) {
                 tunnel_en = ((dv_attr.tunnel_offloads_caps &
@@ -1079,6 +1092,12 @@ mlx5_dev_spawn(struct rte_device *dpdk_dev,
                 DRV_LOG(WARNING, "Rx CQE compression isn't supported");
                 config.cqe_comp = 0;
         }
+       if (config.cqe_pad && !cqe_pad) {
+               DRV_LOG(WARNING, "Rx CQE padding isn't supported");
+               config.cqe_pad = 0;
+       } else if (config.cqe_pad) {
+               DRV_LOG(INFO, "Rx CQE padding is enabled");
+       }
         if (config.mprq.enabled && mprq) {
                 if (config.mprq.stride_num_n > mprq_max_stride_num_n ||
                     config.mprq.stride_num_n < mprq_min_stride_num_n) {
diff --git a/drivers/net/mlx5/mlx5.h b/drivers/net/mlx5/mlx5.h

index 74d87c054bf49c5cfd28f5e7d3f8d7d8f2028fa7..24a3415c8d8a0bb8bf5dd8648d11f28cde9b0132 100644 (file)
--- a/drivers/net/mlx5/mlx5.h
+++ b/drivers/net/mlx5/mlx5.h
@@ -115,6 +115,7 @@ struct mlx5_dev_config {
         /* Whether tunnel stateless offloads are supported. */
         unsigned int mpls_en:1; /* MPLS over GRE/UDP is enabled. */
         unsigned int cqe_comp:1; /* CQE compression is enabled. */
+       unsigned int cqe_pad:1; /* CQE padding is enabled. */
         unsigned int tso:1; /* Whether TSO is supported. */
         unsigned int tx_vec_en:1; /* Tx vector is enabled. */
         unsigned int rx_vec_en:1; /* Rx vector is enabled. */
diff --git a/drivers/net/mlx5/mlx5_rxq.c b/drivers/net/mlx5/mlx5_rxq.c

index ed993ea6d96d6115a0b41ce13ec729a17f872c14..7db3f68a8172c639f5ff90a4e86f1d4db6eadd48 100644 (file)
--- a/drivers/net/mlx5/mlx5_rxq.c
+++ b/drivers/net/mlx5/mlx5_rxq.c
@@ -841,6 +841,12 @@ mlx5_rxq_ibv_new(struct rte_eth_dev *dev, uint16_t idx)
                         " timestamp",
                         dev->data->port_id);
         }
+#ifdef HAVE_IBV_MLX5_MOD_CQE_128B_PAD
+       if (config->cqe_pad) {
+               attr.cq.mlx5.comp_mask |= MLX5DV_CQ_INIT_ATTR_MASK_FLAGS;
+               attr.cq.mlx5.flags |= MLX5DV_CQ_INIT_ATTR_FLAGS_CQE_PAD;
+       }
+#endif
         tmpl->cq = mlx5_glue->cq_ex_to_cq
                 (mlx5_glue->dv_create_cq(priv->ctx, &attr.cq.ibv,
                                          &attr.cq.mlx5));
author	Yongseok Koh <yskoh@mellanox.com>
	Thu, 25 Oct 2018 06:24:00 +0000 (06:24 +0000)
committer	Ferruh Yigit <ferruh.yigit@intel.com>
	Mon, 5 Nov 2018 14:01:25 +0000 (15:01 +0100)
doc/guides/nics/mlx5.rst		patch \| blob \| history
drivers/net/mlx5/Makefile		patch \| blob \| history
drivers/net/mlx5/meson.build		patch \| blob \| history
drivers/net/mlx5/mlx5.c		patch \| blob \| history
drivers/net/mlx5/mlx5.h		patch \| blob \| history
drivers/net/mlx5/mlx5_rxq.c		patch \| blob \| history