net/mlx5: expose flow counters management
[dpdk.git] / drivers / net / mlx5 / mlx5_flow_dv.c
index e277b85..b273b6c 100644 (file)
@@ -102,6 +102,31 @@ flow_dv_attr_init(const struct rte_flow_item *item, union flow_dv_attr *attr)
        attr->valid = 1;
 }
 
+/**
+ * Convert an rte_color value to the corresponding mlx5 flow color.
+ *
+ * @param[in] rcol
+ *   Color to convert (enum rte_color).
+ *
+ * @return
+ *   Matching MLX5_FLOW_COLOR_* value, MLX5_FLOW_COLOR_UNDEFINED if none.
+ */
+static int
+rte_col_2_mlx5_col(enum rte_color rcol)
+{
+       switch (rcol) {
+       case RTE_COLOR_GREEN:
+               return MLX5_FLOW_COLOR_GREEN;
+       case RTE_COLOR_YELLOW:
+               return MLX5_FLOW_COLOR_YELLOW;
+       case RTE_COLOR_RED:
+               return MLX5_FLOW_COLOR_RED;
+       default:
+               break; /* Any other value maps to UNDEFINED below. */
+       }
+       return MLX5_FLOW_COLOR_UNDEFINED;
+}
+
 struct field_modify_info {
        uint32_t size; /* Size of field in protocol header, in bytes. */
        uint32_t offset; /* Offset of field in protocol header, in bytes. */
@@ -1059,6 +1084,103 @@ flow_dv_convert_action_mark(struct rte_eth_dev *dev,
                                             MLX5_MODIFICATION_TYPE_SET, error);
 }
 
+/**
+ * Get metadata register index for specified steering domain.
+ *
+ * @param[in] dev
+ *   Pointer to the rte_eth_dev structure.
+ * @param[in] attr
+ *   Attributes of flow: transfer is checked first, then egress, else Rx.
+ * @param[out] error
+ *   Pointer to the error structure.
+ *
+ * @return
+ *   Register index on success, a negative errno value otherwise
+ *   and rte_errno is set. Hold it in an int before testing the sign.
+ */
+static enum modify_reg
+flow_dv_get_metadata_reg(struct rte_eth_dev *dev,
+                        const struct rte_flow_attr *attr,
+                        struct rte_flow_error *error)
+{
+       int reg = /* Signed: an enum object may be unsigned. */
+               mlx5_flow_get_reg_id(dev, attr->transfer ?
+                                         MLX5_METADATA_FDB :
+                                           attr->egress ?
+                                           MLX5_METADATA_TX :
+                                           MLX5_METADATA_RX, 0, error);
+       if (reg < 0)
+               return rte_flow_error_set(error,
+                                         ENOTSUP, RTE_FLOW_ERROR_TYPE_ITEM,
+                                         NULL, "unavailable "
+                                         "metadata register");
+       return reg;
+}
+
+/**
+ * Convert SET_META action to DV specification.
+ *
+ * @param[in] dev
+ *   Pointer to the rte_eth_dev structure.
+ * @param[in,out] resource
+ *   Pointer to the modify-header resource.
+ * @param[in] attr
+ *   Attributes of flow that includes this item.
+ * @param[in] conf
+ *   Pointer to action specification.
+ * @param[out] error
+ *   Pointer to the error structure.
+ *
+ * @return
+ *   0 on success, a negative errno value otherwise and rte_errno is set.
+ */
+static int
+flow_dv_convert_action_set_meta
+                       (struct rte_eth_dev *dev,
+                        struct mlx5_flow_dv_modify_hdr_resource *resource,
+                        const struct rte_flow_attr *attr,
+                        const struct rte_flow_action_set_meta *conf,
+                        struct rte_flow_error *error)
+{
+       uint32_t data = conf->data;
+       uint32_t mask = conf->mask;
+       struct rte_flow_item item = {
+               .spec = &data,
+               .mask = &mask,
+       };
+       struct field_modify_info reg_c_x[] = {
+               [1] = {0, 0, 0},
+       };
+       enum modify_reg reg = flow_dv_get_metadata_reg(dev, attr, error);
+
+       if (reg < 0)
+               return reg;
+       /*
+        * In datapath code there is no endianness
+        * coversions for perfromance reasons, all
+        * pattern conversions are done in rte_flow.
+        */
+       if (reg == REG_C_0) {
+               struct mlx5_priv *priv = dev->data->dev_private;
+               uint32_t msk_c0 = priv->sh->dv_regc0_mask;
+               uint32_t shl_c0;
+
+               assert(msk_c0);
+#if RTE_BYTE_ORDER == RTE_BIG_ENDIAN
+               shl_c0 = rte_bsf32(msk_c0);
+#else
+               shl_c0 = sizeof(msk_c0) * CHAR_BIT - rte_fls_u32(msk_c0);
+#endif
+               mask <<= shl_c0;
+               data <<= shl_c0;
+               assert(!(~msk_c0 & rte_cpu_to_be_32(mask)));
+       }
+       reg_c_x[0] = (struct field_modify_info){4, 0, reg_to_field[reg]};
+       /* The routine expects parameters in memory as big-endian ones. */
+       return flow_dv_convert_modify_action(&item, reg_c_x, NULL, resource,
+                                            MLX5_MODIFICATION_TYPE_SET, error);
+}
+
 /**
  * Validate MARK item.
  *
@@ -1149,11 +1271,14 @@ flow_dv_validate_item_meta(struct rte_eth_dev *dev __rte_unused,
                           const struct rte_flow_attr *attr,
                           struct rte_flow_error *error)
 {
+       struct mlx5_priv *priv = dev->data->dev_private;
+       struct mlx5_dev_config *config = &priv->config;
        const struct rte_flow_item_meta *spec = item->spec;
        const struct rte_flow_item_meta *mask = item->mask;
-       const struct rte_flow_item_meta nic_mask = {
+       struct rte_flow_item_meta nic_mask = {
                .data = UINT32_MAX
        };
+       enum modify_reg reg;
        int ret;
 
        if (!spec)
@@ -1163,23 +1288,32 @@ flow_dv_validate_item_meta(struct rte_eth_dev *dev __rte_unused,
                                          "data cannot be empty");
        if (!spec->data)
                return rte_flow_error_set(error, EINVAL,
-                                         RTE_FLOW_ERROR_TYPE_ITEM_SPEC,
-                                         NULL,
+                                         RTE_FLOW_ERROR_TYPE_ITEM_SPEC, NULL,
                                          "data cannot be zero");
+       if (config->dv_xmeta_en != MLX5_XMETA_MODE_LEGACY) {
+               if (!mlx5_flow_ext_mreg_supported(dev))
+                       return rte_flow_error_set(error, ENOTSUP,
+                                         RTE_FLOW_ERROR_TYPE_ITEM, item,
+                                         "extended metadata register"
+                                         " isn't supported");
+               reg = flow_dv_get_metadata_reg(dev, attr, error);
+               if (reg < 0)
+                       return reg;
+               if (reg == REG_B)
+                       return rte_flow_error_set(error, ENOTSUP,
+                                         RTE_FLOW_ERROR_TYPE_ITEM, item,
+                                         "match on reg_b "
+                                         "isn't supported");
+               if (reg != REG_A)
+                       nic_mask.data = priv->sh->dv_meta_mask;
+       }
        if (!mask)
                mask = &rte_flow_item_meta_mask;
        ret = mlx5_flow_item_acceptable(item, (const uint8_t *)mask,
                                        (const uint8_t *)&nic_mask,
                                        sizeof(struct rte_flow_item_meta),
                                        error);
-       if (ret < 0)
-               return ret;
-       if (attr->ingress)
-               return rte_flow_error_set(error, ENOTSUP,
-                                         RTE_FLOW_ERROR_TYPE_ATTR_INGRESS,
-                                         NULL,
-                                         "pattern not supported for ingress");
-       return 0;
+       return ret;
 }
 
 /**
@@ -1734,6 +1868,67 @@ flow_dv_validate_action_mark(struct rte_eth_dev *dev,
        return 0;
 }
 
+/**
+ * Validate SET_META action.
+ *
+ * @param[in] dev
+ *   Pointer to the rte_eth_dev structure.
+ * @param[in] action
+ *   Pointer to the SET_META action.
+ * @param[in] action_flags
+ *   Holds the actions detected until now (unused here).
+ * @param[in] attr
+ *   Pointer to flow attributes, used to pick the metadata register.
+ * @param[out] error
+ *   Pointer to error structure.
+ *
+ * @return
+ *   0 on success, a negative errno value otherwise and rte_errno is set.
+ */
+static int
+flow_dv_validate_action_set_meta(struct rte_eth_dev *dev,
+                                const struct rte_flow_action *action,
+                                uint64_t action_flags __rte_unused,
+                                const struct rte_flow_attr *attr,
+                                struct rte_flow_error *error)
+{
+       const struct rte_flow_action_set_meta *conf;
+       uint32_t nic_mask = UINT32_MAX;
+       int reg; /* Signed, so a negative errno is detectable. */
+
+       if (!mlx5_flow_ext_mreg_supported(dev))
+               return rte_flow_error_set(error, ENOTSUP,
+                                         RTE_FLOW_ERROR_TYPE_ACTION, action,
+                                         "extended metadata register"
+                                         " isn't supported");
+       reg = flow_dv_get_metadata_reg(dev, attr, error);
+       if (reg < 0)
+               return reg;
+       if (reg != REG_A && reg != REG_B) {
+               struct mlx5_priv *priv = dev->data->dev_private;
+
+               nic_mask = priv->sh->dv_meta_mask;
+       }
+       if (!(action->conf))
+               return rte_flow_error_set(error, EINVAL,
+                                         RTE_FLOW_ERROR_TYPE_ACTION, action,
+                                         "configuration cannot be null");
+       conf = (const struct rte_flow_action_set_meta *)action->conf;
+       if (!conf->mask)
+               return rte_flow_error_set(error, EINVAL,
+                                         RTE_FLOW_ERROR_TYPE_ACTION, action,
+                                         "zero mask doesn't have any effect");
+       if (conf->mask & ~nic_mask)
+               return rte_flow_error_set(error, EINVAL,
+                                         RTE_FLOW_ERROR_TYPE_ACTION, action,
+                                         "meta data must be within reg C0");
+       if (!(conf->data & conf->mask))
+               return rte_flow_error_set(error, EINVAL,
+                                         RTE_FLOW_ERROR_TYPE_ACTION, action,
+                                         "zero value has no effect");
+       return 0;
+}
+
 /**
  * Validate SET_TAG action.
  *
@@ -3085,10 +3280,10 @@ flow_dv_validate_action_jump(const struct rte_flow_action *action,
                return rte_flow_error_set(error, EINVAL,
                                          RTE_FLOW_ERROR_TYPE_ATTR_GROUP, NULL,
                                          "target group index out of range");
-       if (attributes->group >= target_group)
+       if (attributes->group == target_group)
                return rte_flow_error_set(error, EINVAL,
                                          RTE_FLOW_ERROR_TYPE_ACTION, NULL,
-                                         "target group must be higher than"
+                                         "target group must be other than"
                                          " the current flow group");
        return 0;
 }
@@ -3916,8 +4111,11 @@ flow_dv_validate_attributes(struct rte_eth_dev *dev,
                                          NULL,
                                          "groups are not supported");
 #else
-       uint32_t max_group = attributes->transfer ? MLX5_MAX_TABLES_FDB :
-                                                   MLX5_MAX_TABLES;
+       uint32_t max_group = attributes->transfer ?
+                            MLX5_MAX_TABLES_FDB :
+                               external ?
+                               MLX5_MAX_TABLES_EXTERNAL :
+                               MLX5_MAX_TABLES;
        uint32_t table;
        int ret;
 
@@ -4289,6 +4487,17 @@ flow_dv_validate(struct rte_eth_dev *dev, const struct rte_flow_attr *attr,
                                ++actions_n;
                        }
                        break;
+               case RTE_FLOW_ACTION_TYPE_SET_META:
+                       ret = flow_dv_validate_action_set_meta(dev, actions,
+                                                              action_flags,
+                                                              attr, error);
+                       if (ret < 0)
+                               return ret;
+                       /* Count all modify-header actions as one action. */
+                       if (!(action_flags & MLX5_FLOW_MODIFY_HDR_ACTIONS))
+                               ++actions_n;
+                       action_flags |= MLX5_FLOW_ACTION_SET_META;
+                       break;
                case RTE_FLOW_ACTION_TYPE_SET_TAG:
                        ret = flow_dv_validate_action_set_tag(dev, actions,
                                                              action_flags,
@@ -4540,6 +4749,7 @@ flow_dv_validate(struct rte_eth_dev *dev, const struct rte_flow_attr *attr,
                                                MLX5_FLOW_ACTION_DEC_TCP_ACK;
                        break;
                case MLX5_RTE_FLOW_ACTION_TYPE_TAG:
+               case MLX5_RTE_FLOW_ACTION_TYPE_MARK:
                case MLX5_RTE_FLOW_ACTION_TYPE_COPY_MREG:
                        break;
                default:
@@ -5568,15 +5778,21 @@ flow_dv_translate_item_mark(struct rte_eth_dev *dev,
 /**
  * Add META item to matcher
  *
+ * @param[in] dev
+ *   The device to configure through.
  * @param[in, out] matcher
  *   Flow matcher.
  * @param[in, out] key
  *   Flow matcher value.
+ * @param[in] attr
+ *   Attributes of flow that includes this item.
  * @param[in] item
  *   Flow pattern to translate.
  */
 static void
-flow_dv_translate_item_meta(void *matcher, void *key,
+flow_dv_translate_item_meta(struct rte_eth_dev *dev,
+                           void *matcher, void *key,
+                           const struct rte_flow_attr *attr,
                            const struct rte_flow_item *item)
 {
        const struct rte_flow_item_meta *meta_m;
@@ -5586,10 +5802,34 @@ flow_dv_translate_item_meta(void *matcher, void *key,
        if (!meta_m)
                meta_m = &rte_flow_item_meta_mask;
        meta_v = (const void *)item->spec;
-       if (meta_v)
-               flow_dv_match_meta_reg(matcher, key, REG_A,
-                                      rte_cpu_to_be_32(meta_v->data),
-                                      rte_cpu_to_be_32(meta_m->data));
+       if (meta_v) {
+               enum modify_reg reg;
+               uint32_t value = meta_v->data;
+               uint32_t mask = meta_m->data;
+
+               reg = flow_dv_get_metadata_reg(dev, attr, NULL);
+               if (reg < 0)
+                       return;
+               /*
+                * In datapath code there is no endianness
+                * conversions for performance reasons, all
+                * pattern conversions are done in rte_flow.
+                */
+               value = rte_cpu_to_be_32(value);
+               mask = rte_cpu_to_be_32(mask);
+               if (reg == REG_C_0) {
+                       struct mlx5_priv *priv = dev->data->dev_private;
+                       uint32_t msk_c0 = priv->sh->dv_regc0_mask;
+                       uint32_t shl_c0 = rte_bsf32(msk_c0);
+
+                       msk_c0 = rte_cpu_to_be_32(msk_c0);
+                       value <<= shl_c0;
+                       mask <<= shl_c0;
+                       assert(msk_c0);
+                       assert(!(~msk_c0 & mask));
+               }
+               flow_dv_match_meta_reg(matcher, key, reg, value, mask);
+       }
 }
 
 /**
@@ -6346,6 +6586,8 @@ __flow_dv_translate(struct rte_eth_dev *dev,
                                action_flags |= MLX5_FLOW_ACTION_MARK_EXT;
                                break;
                        }
+                       /* Fall-through */
+               case MLX5_RTE_FLOW_ACTION_TYPE_MARK:
                        /* Legacy (non-extensive) MARK action. */
                        tag_resource.tag = mlx5_flow_mark_set
                              (((const struct rte_flow_action_mark *)
@@ -6357,6 +6599,14 @@ __flow_dv_translate(struct rte_eth_dev *dev,
                        dev_flow->dv.actions[actions_n++] =
                                dev_flow->dv.tag_resource->action;
                        break;
+               case RTE_FLOW_ACTION_TYPE_SET_META:
+                       if (flow_dv_convert_action_set_meta
+                               (dev, &mhdr_res, attr,
+                                (const struct rte_flow_action_set_meta *)
+                                 actions->conf, error))
+                               return -rte_errno;
+                       action_flags |= MLX5_FLOW_ACTION_SET_META;
+                       break;
                case RTE_FLOW_ACTION_TYPE_SET_TAG:
                        if (flow_dv_convert_action_set_tag
                                (dev, &mhdr_res,
@@ -6811,8 +7061,8 @@ cnt_err:
                        last_item = MLX5_FLOW_ITEM_MARK;
                        break;
                case RTE_FLOW_ITEM_TYPE_META:
-                       flow_dv_translate_item_meta(match_mask, match_value,
-                                                   items);
+                       flow_dv_translate_item_meta(dev, match_mask,
+                                                   match_value, attr, items);
                        last_item = MLX5_FLOW_ITEM_METADATA;
                        break;
                case RTE_FLOW_ITEM_TYPE_ICMP:
@@ -7349,6 +7599,452 @@ flow_dv_query(struct rte_eth_dev *dev,
        return ret;
 }
 
+/**
+ * Destroy the meter table set (lock free, caller holds the mutex).
+ * Only the RTE_MTR_DROPPED policer rule of each domain is destroyed here.
+ *
+ * @param[in] dev
+ *   Pointer to Ethernet device.
+ * @param[in] tbl
+ *   Pointer to the meter table set, NULL is tolerated.
+ *
+ * @return
+ *   Always 0.
+ */
+static int
+flow_dv_destroy_mtr_tbl(struct rte_eth_dev *dev,
+                       struct mlx5_meter_domains_infos *tbl)
+{
+       struct mlx5_priv *priv = dev->data->dev_private;
+       struct mlx5_meter_domains_infos *mtd =
+                               (struct mlx5_meter_domains_infos *)tbl;
+
+       if (!mtd || !priv->config.dv_flow_en)
+               return 0; /* Nothing is released in either case. */
+       if (mtd->ingress.policer_rules[RTE_MTR_DROPPED])
+               claim_zero(mlx5_glue->dv_destroy_flow
+                         (mtd->ingress.policer_rules[RTE_MTR_DROPPED]));
+       if (mtd->egress.policer_rules[RTE_MTR_DROPPED])
+               claim_zero(mlx5_glue->dv_destroy_flow
+                         (mtd->egress.policer_rules[RTE_MTR_DROPPED]));
+       if (mtd->transfer.policer_rules[RTE_MTR_DROPPED])
+               claim_zero(mlx5_glue->dv_destroy_flow
+                         (mtd->transfer.policer_rules[RTE_MTR_DROPPED]));
+       if (mtd->egress.color_matcher)
+               claim_zero(mlx5_glue->dv_destroy_flow_matcher
+                         (mtd->egress.color_matcher));
+       if (mtd->egress.any_matcher)
+               claim_zero(mlx5_glue->dv_destroy_flow_matcher
+                         (mtd->egress.any_matcher));
+       if (mtd->egress.tbl)
+               claim_zero(flow_dv_tbl_resource_release(mtd->egress.tbl));
+       if (mtd->ingress.color_matcher)
+               claim_zero(mlx5_glue->dv_destroy_flow_matcher
+                         (mtd->ingress.color_matcher));
+       if (mtd->ingress.any_matcher)
+               claim_zero(mlx5_glue->dv_destroy_flow_matcher
+                         (mtd->ingress.any_matcher));
+       if (mtd->ingress.tbl)
+               claim_zero(flow_dv_tbl_resource_release(mtd->ingress.tbl));
+       if (mtd->transfer.color_matcher)
+               claim_zero(mlx5_glue->dv_destroy_flow_matcher
+                         (mtd->transfer.color_matcher));
+       if (mtd->transfer.any_matcher)
+               claim_zero(mlx5_glue->dv_destroy_flow_matcher
+                         (mtd->transfer.any_matcher));
+       if (mtd->transfer.tbl)
+               claim_zero(flow_dv_tbl_resource_release(mtd->transfer.tbl));
+       if (mtd->drop_actn)
+               claim_zero(mlx5_glue->destroy_flow_action(mtd->drop_actn));
+       rte_free(mtd); /* The set itself is freed last. */
+       return 0;
+}
+
+/* Size of a meter rule actions array: count and jump or count and drop. */
+#define METER_ACTIONS 2
+
+/**
+ * Create the meter table and the suffix table of the specified domain.
+ *
+ * @param[in] dev
+ *   Pointer to Ethernet device.
+ * @param[in,out] mtb
+ *   Pointer to DV meter table set.
+ * @param[in] egress
+ *   Non-zero selects the egress domain, unless transfer is set.
+ * @param[in] transfer
+ *   Non-zero selects the transfer (FDB) domain, it is checked first.
+ * @param[in] color_reg_c_idx
+ *   Reg C index for color match.
+ *
+ * @return
+ *   0 on success, -1 otherwise; nothing is released here on failure.
+ */
+static int
+flow_dv_prepare_mtr_tables(struct rte_eth_dev *dev,
+                          struct mlx5_meter_domains_infos *mtb,
+                          uint8_t egress, uint8_t transfer,
+                          uint32_t color_reg_c_idx)
+{
+       struct mlx5_priv *priv = dev->data->dev_private;
+       struct mlx5_ibv_shared *sh = priv->sh;
+       struct mlx5_flow_dv_match_params mask = {
+               .size = sizeof(mask.buf),
+       };
+       struct mlx5_flow_dv_match_params value = {
+               .size = sizeof(value.buf),
+       };
+       struct mlx5dv_flow_matcher_attr dv_attr = {
+               .type = IBV_FLOW_ATTR_NORMAL,
+               .priority = 0,
+               .match_criteria_enable = 0,
+               .match_mask = (void *)&mask,
+       };
+       void *actions[METER_ACTIONS];
+       struct mlx5_flow_tbl_resource **sfx_tbl;
+       struct mlx5_meter_domain_info *dtb;
+       struct rte_flow_error error;
+       int i = 0;
+
+       if (transfer) {
+               sfx_tbl = &sh->fdb_mtr_sfx_tbl;
+               dtb = &mtb->transfer;
+       } else if (egress) {
+               sfx_tbl = &sh->tx_mtr_sfx_tbl;
+               dtb = &mtb->egress;
+       } else {
+               sfx_tbl = &sh->rx_mtr_sfx_tbl;
+               dtb = &mtb->ingress;
+       }
+       /* If the suffix table is missing, create it. */
+       if (!(*sfx_tbl)) {
+               *sfx_tbl = flow_dv_tbl_resource_get(dev,
+                                               MLX5_FLOW_TABLE_LEVEL_SUFFIX,
+                                               egress, transfer, &error);
+               if (!(*sfx_tbl)) {
+                       DRV_LOG(ERR, "Failed to create meter suffix table.");
+                       return -1;
+               }
+       }
+       /* Create the meter table with METER level. */
+       dtb->tbl = flow_dv_tbl_resource_get(dev, MLX5_FLOW_TABLE_LEVEL_METER,
+                                           egress, transfer, &error);
+       if (!dtb->tbl) {
+               DRV_LOG(ERR, "Failed to create meter policer table.");
+               return -1;
+       }
+       /* Create matchers, Any (priority 3) and Color (priority 0). */
+       dv_attr.priority = 3;
+       dv_attr.match_criteria_enable = 0;
+       dtb->any_matcher = mlx5_glue->dv_create_flow_matcher(sh->ctx,
+                                                            &dv_attr,
+                                                            dtb->tbl->obj);
+       if (!dtb->any_matcher) {
+               DRV_LOG(ERR, "Failed to create meter"
+                            " policer default matcher.");
+               goto error_exit;
+       }
+       dv_attr.priority = 0;
+       dv_attr.match_criteria_enable =
+                               1 << MLX5_MATCH_CRITERIA_ENABLE_MISC2_BIT;
+       flow_dv_match_meta_reg(mask.buf, value.buf, color_reg_c_idx,
+                              rte_col_2_mlx5_col(RTE_COLORS), UINT32_MAX);
+       dtb->color_matcher = mlx5_glue->dv_create_flow_matcher(sh->ctx,
+                                                              &dv_attr,
+                                                              dtb->tbl->obj);
+       if (!dtb->color_matcher) {
+               DRV_LOG(ERR, "Failed to create meter policer color matcher.");
+               goto error_exit;
+       }
+       actions[i++] = mtb->drop_actn;
+       /* Default rule: lowest priority, match any, actions: drop. */
+       dtb->policer_rules[RTE_MTR_DROPPED] =
+                       mlx5_glue->dv_create_flow(dtb->any_matcher,
+                                                (void *)&value, i, actions);
+       if (!dtb->policer_rules[RTE_MTR_DROPPED]) {
+               DRV_LOG(ERR, "Failed to create meter policer drop rule.");
+               goto error_exit;
+       }
+       return 0;
+error_exit:
+       return -1; /* Objects created so far are left in place. */
+}
+
+/**
+ * Create the meter table set: drop action plus egress, ingress and,
+ * when dv_esw_en is set, FDB tables. Lock free, caller holds the mutex.
+ *
+ * @param[in] dev
+ *   Pointer to Ethernet device.
+ *
+ * @return
+ *   Pointer to table set on success, NULL otherwise (ENOTSUP if !mtr_en).
+ */
+static struct mlx5_meter_domains_infos *
+flow_dv_create_mtr_tbl(struct rte_eth_dev *dev)
+{
+       struct mlx5_priv *priv = dev->data->dev_private;
+       struct mlx5_meter_domains_infos *mtb;
+       int ret;
+
+       if (!priv->mtr_en) {
+               rte_errno = ENOTSUP;
+               return NULL;
+       }
+       mtb = rte_calloc(__func__, 1, sizeof(*mtb), 0);
+       if (!mtb) {
+               DRV_LOG(ERR, "Failed to allocate memory for meter.");
+               return NULL;
+       }
+       /* Create drop action. */
+       mtb->drop_actn = mlx5_glue->dr_create_flow_action_drop();
+       if (!mtb->drop_actn) {
+               DRV_LOG(ERR, "Failed to create drop action.");
+               goto error_exit;
+       }
+       /* Egress meter table. */
+       ret = flow_dv_prepare_mtr_tables(dev, mtb, 1, 0, priv->mtr_color_reg);
+       if (ret) {
+               DRV_LOG(ERR, "Failed to prepare egress meter table.");
+               goto error_exit;
+       }
+       /* Ingress meter table. */
+       ret = flow_dv_prepare_mtr_tables(dev, mtb, 0, 0, priv->mtr_color_reg);
+       if (ret) {
+               DRV_LOG(ERR, "Failed to prepare ingress meter table.");
+               goto error_exit;
+       }
+       /* FDB meter table. */
+       if (priv->config.dv_esw_en) {
+               ret = flow_dv_prepare_mtr_tables(dev, mtb, 0, 1,
+                                                priv->mtr_color_reg);
+               if (ret) {
+                       DRV_LOG(ERR, "Failed to prepare fdb meter table.");
+                       goto error_exit;
+               }
+       }
+       return mtb;
+error_exit:
+       flow_dv_destroy_mtr_tbl(dev, mtb); /* Rolls back and frees mtb. */
+       return NULL;
+}
+
+/**
+ * Destroy the policer rules below RTE_MTR_DROPPED and the jump action.
+ *
+ * @param[in,out] dt
+ *   Pointer to domain table, released members are reset to NULL.
+ */
+static void
+flow_dv_destroy_domain_policer_rule(struct mlx5_meter_domain_info *dt)
+{
+       int i;
+
+       for (i = 0; i < RTE_MTR_DROPPED; i++) {
+               if (dt->policer_rules[i]) {
+                       claim_zero(mlx5_glue->dv_destroy_flow
+                                 (dt->policer_rules[i]));
+                       dt->policer_rules[i] = NULL;
+               }
+       }
+       if (dt->jump_actn) {
+               claim_zero(mlx5_glue->destroy_flow_action(dt->jump_actn));
+               dt->jump_actn = NULL;
+       }
+}
+
+/**
+ * Destroy policer rules of every domain selected in the attributes.
+ *
+ * @param[in] dev
+ *   Pointer to Ethernet device (unused).
+ * @param[in] fm
+ *   Pointer to flow meter structure, NULL or a NULL mfts is a no-op.
+ * @param[in] attr
+ *   Pointer to flow attributes: egress, ingress and transfer are read.
+ *
+ * @return
+ *   Always 0.
+ */
+static int
+flow_dv_destroy_policer_rules(struct rte_eth_dev *dev __rte_unused,
+                             const struct mlx5_flow_meter *fm,
+                             const struct rte_flow_attr *attr)
+{
+       struct mlx5_meter_domains_infos *mtb = fm ? fm->mfts : NULL;
+
+       if (!mtb)
+               return 0;
+       if (attr->egress)
+               flow_dv_destroy_domain_policer_rule(&mtb->egress);
+       if (attr->ingress)
+               flow_dv_destroy_domain_policer_rule(&mtb->ingress);
+       if (attr->transfer)
+               flow_dv_destroy_domain_policer_rule(&mtb->transfer);
+       return 0;
+}
+
+/**
+ * Create the per-color policer rules (drop or jump) of one domain.
+ *
+ * @param[in] fm
+ *   Pointer to flow meter structure.
+ * @param[in,out] dtb
+ *   Pointer to the domain meter table info, receives action and rules.
+ * @param[in] sfx_tb
+ *   Pointer to suffix table, the jump target; must not be NULL.
+ * @param[in] mtr_reg_c
+ *   Color match REG_C.
+ *
+ * @return
+ *   0 on success, -1 otherwise.
+ */
+static int
+flow_dv_create_policer_forward_rule(struct mlx5_flow_meter *fm,
+                                   struct mlx5_meter_domain_info *dtb,
+                                   struct mlx5_flow_tbl_resource *sfx_tb,
+                                   uint8_t mtr_reg_c)
+{
+       struct mlx5_flow_dv_match_params matcher = {
+               .size = sizeof(matcher.buf),
+       };
+       struct mlx5_flow_dv_match_params value = {
+               .size = sizeof(value.buf),
+       };
+       struct mlx5_meter_domains_infos *mtb = fm->mfts;
+       void *actions[METER_ACTIONS];
+       int i;
+
+       /* Create jump action, the suffix table is its destination. */
+       if (!sfx_tb)
+               return -1;
+       if (!dtb->jump_actn)
+               dtb->jump_actn =
+                       mlx5_glue->dr_create_flow_action_dest_flow_tbl
+                                                       (sfx_tb->obj);
+       if (!dtb->jump_actn) {
+               DRV_LOG(ERR, "Failed to create policer jump action.");
+               goto error;
+       }
+       for (i = 0; i < RTE_MTR_DROPPED; i++) {
+               int j = 0;
+
+               flow_dv_match_meta_reg(matcher.buf, value.buf, mtr_reg_c,
+                                      rte_col_2_mlx5_col(i), UINT32_MAX);
+               if (fm->params.action[i] == MTR_POLICER_ACTION_DROP)
+                       actions[j++] = mtb->drop_actn;
+               else
+                       actions[j++] = dtb->jump_actn;
+               dtb->policer_rules[i] =
+                       mlx5_glue->dv_create_flow(dtb->color_matcher,
+                                                (void *)&value,
+                                                 j, actions);
+               if (!dtb->policer_rules[i]) {
+                       DRV_LOG(ERR, "Failed to create policer rule.");
+                       goto error;
+               }
+       }
+       return 0;
+error:
+       rte_errno = errno; /* Rules created so far are not undone here. */
+       return -1;
+}
+
+/**
+ * Create policer rules for every domain selected in the attributes.
+ *
+ * @param[in] dev
+ *   Pointer to Ethernet device.
+ * @param[in] fm
+ *   Pointer to flow meter structure, its mfts table set is used.
+ * @param[in] attr
+ *   Pointer to flow attributes: egress, ingress and transfer are read.
+ *
+ * @return
+ *   0 on success, -1 otherwise (rules of these domains are destroyed).
+ */
+static int
+flow_dv_create_policer_rules(struct rte_eth_dev *dev,
+                            struct mlx5_flow_meter *fm,
+                            const struct rte_flow_attr *attr)
+{
+       struct mlx5_priv *priv = dev->data->dev_private;
+       struct mlx5_meter_domains_infos *mtb = fm->mfts;
+       int ret;
+
+       if (attr->egress) {
+               ret = flow_dv_create_policer_forward_rule(fm, &mtb->egress,
+                                               priv->sh->tx_mtr_sfx_tbl,
+                                               priv->mtr_color_reg);
+               if (ret) {
+                       DRV_LOG(ERR, "Failed to create egress policer.");
+                       goto error;
+               }
+       }
+       if (attr->ingress) {
+               ret = flow_dv_create_policer_forward_rule(fm, &mtb->ingress,
+                                               priv->sh->rx_mtr_sfx_tbl,
+                                               priv->mtr_color_reg);
+               if (ret) {
+                       DRV_LOG(ERR, "Failed to create ingress policer.");
+                       goto error;
+               }
+       }
+       if (attr->transfer) {
+               ret = flow_dv_create_policer_forward_rule(fm, &mtb->transfer,
+                                               priv->sh->fdb_mtr_sfx_tbl,
+                                               priv->mtr_color_reg);
+               if (ret) {
+                       DRV_LOG(ERR, "Failed to create transfer policer.");
+                       goto error;
+               }
+       }
+       return 0;
+error:
+       flow_dv_destroy_policer_rules(dev, fm, attr); /* Roll back. */
+       return -1;
+}
+
+/**
+ * Query a devx counter, reporting values relative to the stored baseline.
+ *
+ * @param[in] dev
+ *   Pointer to the Ethernet device structure.
+ * @param[in,out] cnt
+ *   Pointer to the flow counter, its hits/bytes hold the baseline.
+ * @param[in] clear
+ *   Set to make the queried raw values the new baseline.
+ * @param[out] pkts
+ *   Packets counted since the baseline.
+ * @param[out] bytes
+ *   Bytes counted since the baseline.
+ *
+ * @return
+ *   0 on success, -1 if devx is disabled or the query fails.
+ */
+static int
+flow_dv_counter_query(struct rte_eth_dev *dev,
+                     struct mlx5_flow_counter *cnt, bool clear,
+                     uint64_t *pkts, uint64_t *bytes)
+{
+       struct mlx5_priv *priv = dev->data->dev_private;
+       uint64_t inn_pkts, inn_bytes;
+       int ret;
+
+       if (!priv->config.devx)
+               return -1;
+       ret = _flow_dv_query_count(dev, cnt, &inn_pkts, &inn_bytes);
+       if (ret)
+               return -1;
+       *pkts = inn_pkts - cnt->hits;
+       *bytes = inn_bytes - cnt->bytes;
+       if (clear) {
+               cnt->hits = inn_pkts;
+               cnt->bytes = inn_bytes;
+       }
+       return 0;
+}
+
 /*
  * Mutex-protected thunk to lock-free  __flow_dv_translate().
  */
@@ -7406,6 +8102,31 @@ flow_dv_destroy(struct rte_eth_dev *dev, struct rte_flow *flow)
        flow_dv_shared_unlock(dev);
 }
 
+/*
+ * Allocate a counter with flow_dv_counter_alloc() under the shared lock.
+ */
+static struct mlx5_flow_counter *
+flow_dv_counter_allocate(struct rte_eth_dev *dev)
+{
+       struct mlx5_flow_counter *cnt;
+
+       flow_dv_shared_lock(dev);
+       cnt = flow_dv_counter_alloc(dev, 0, 0, 1);
+       flow_dv_shared_unlock(dev);
+       return cnt; /* Result of the allocator, passed through as is. */
+}
+
+/*
+ * Release a counter with flow_dv_counter_release() under the shared lock.
+ */
+static void
+flow_dv_counter_free(struct rte_eth_dev *dev, struct mlx5_flow_counter *cnt)
+{
+       flow_dv_shared_lock(dev);
+       flow_dv_counter_release(dev, cnt);
+       flow_dv_shared_unlock(dev);
+}
+
 const struct mlx5_flow_driver_ops mlx5_flow_dv_drv_ops = {
        .validate = flow_dv_validate,
        .prepare = flow_dv_prepare,
@@ -7414,6 +8135,13 @@ const struct mlx5_flow_driver_ops mlx5_flow_dv_drv_ops = {
        .remove = flow_dv_remove,
        .destroy = flow_dv_destroy,
        .query = flow_dv_query,
+       .create_mtr_tbls = flow_dv_create_mtr_tbl,
+       .destroy_mtr_tbls = flow_dv_destroy_mtr_tbl,
+       .create_policer_rules = flow_dv_create_policer_rules,
+       .destroy_policer_rules = flow_dv_destroy_policer_rules,
+       .counter_alloc = flow_dv_counter_allocate,
+       .counter_free = flow_dv_counter_free,
+       .counter_query = flow_dv_counter_query,
 };
 
 #endif /* HAVE_IBV_FLOW_DV_SUPPORT */