net/mlx5: support descriptor LWM for Rx queue
[dpdk.git] / drivers / net / mlx5 / mlx5_flow_dv.c
index 28911d6..65b02b2 100644 (file)
@@ -97,6 +97,10 @@ static int16_t
 flow_dv_get_esw_manager_vport_id(struct rte_eth_dev *dev)
 {
        struct mlx5_priv *priv = dev->data->dev_private;
+       struct mlx5_common_device *cdev = priv->sh->cdev;
+
+       if (cdev->config.hca_attr.esw_mgr_vport_id_valid)
+               return (int16_t)cdev->config.hca_attr.esw_mgr_vport_id;
 
        if (priv->pci_dev == NULL)
                return 0;
@@ -158,6 +162,7 @@ flow_dv_attr_init(const struct rte_flow_item *item, union flow_dv_attr *attr,
                case RTE_FLOW_ITEM_TYPE_VXLAN_GPE:
                case RTE_FLOW_ITEM_TYPE_GENEVE:
                case RTE_FLOW_ITEM_TYPE_MPLS:
+               case RTE_FLOW_ITEM_TYPE_GTP:
                        if (tunnel_decap)
                                attr->attr = 0;
                        break;
@@ -312,7 +317,8 @@ flow_dv_hlist_prepare(struct mlx5_dev_ctx_shared *sh, struct mlx5_hlist **phl,
                     mlx5_list_match_cb cb_match,
                     mlx5_list_remove_cb cb_remove,
                     mlx5_list_clone_cb cb_clone,
-                    mlx5_list_clone_free_cb cb_clone_free)
+                    mlx5_list_clone_free_cb cb_clone_free,
+                    struct rte_flow_error *error)
 {
        struct mlx5_hlist *hl;
        struct mlx5_hlist *expected = NULL;
@@ -327,7 +333,9 @@ flow_dv_hlist_prepare(struct mlx5_dev_ctx_shared *sh, struct mlx5_hlist **phl,
                        cb_clone_free);
        if (!hl) {
                DRV_LOG(ERR, "%s hash creation failed", name);
-               rte_errno = ENOMEM;
+               rte_flow_error_set(error, ENOMEM,
+                                  RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
+                                  "cannot allocate resource memory");
                return NULL;
        }
        if (!__atomic_compare_exchange_n(phl, &expected, hl, false,
@@ -1146,7 +1154,8 @@ flow_dv_convert_action_copy_mreg(struct rte_eth_dev *dev,
                uint32_t reg_c0 = priv->sh->dv_regc0_mask;
 
                MLX5_ASSERT(reg_c0);
-               MLX5_ASSERT(priv->config.dv_xmeta_en != MLX5_XMETA_MODE_LEGACY);
+               MLX5_ASSERT(priv->sh->config.dv_xmeta_en !=
+                           MLX5_XMETA_MODE_LEGACY);
                if (conf->dst == REG_C_0) {
                        /* Copy to reg_c[0], within mask only. */
                        reg_dst.offset = rte_bsf32(reg_c0);
@@ -1441,6 +1450,9 @@ mlx5_flow_item_field_width(struct rte_eth_dev *dev,
        case RTE_FLOW_FIELD_POINTER:
        case RTE_FLOW_FIELD_VALUE:
                return inherit < 0 ? 0 : inherit;
+       case RTE_FLOW_FIELD_IPV4_ECN:
+       case RTE_FLOW_FIELD_IPV6_ECN:
+               return 2;
        default:
                MLX5_ASSERT(false);
        }
@@ -1451,7 +1463,7 @@ static void
 mlx5_flow_field_id_to_modify_info
                (const struct rte_flow_action_modify_data *data,
                 struct field_modify_info *info, uint32_t *mask,
-                uint32_t width, uint32_t *shift, struct rte_eth_dev *dev,
+                uint32_t width, struct rte_eth_dev *dev,
                 const struct rte_flow_attr *attr, struct rte_flow_error *error)
 {
        struct mlx5_priv *priv = dev->data->dev_private;
@@ -1487,9 +1499,9 @@ mlx5_flow_field_id_to_modify_info
                                                    (32 - width)) << off);
                } else {
                        if (data->offset < 16)
-                               info[idx++] = (struct field_modify_info){2, 4,
+                               info[idx++] = (struct field_modify_info){2, 0,
                                                MLX5_MODI_OUT_DMAC_15_0};
-                       info[idx] = (struct field_modify_info){4, 0,
+                       info[idx] = (struct field_modify_info){4, off,
                                                MLX5_MODI_OUT_DMAC_47_16};
                }
                break;
@@ -1517,9 +1529,9 @@ mlx5_flow_field_id_to_modify_info
                                                    (32 - width)) << off);
                } else {
                        if (data->offset < 16)
-                               info[idx++] = (struct field_modify_info){2, 4,
+                               info[idx++] = (struct field_modify_info){2, 0,
                                                MLX5_MODI_OUT_SMAC_15_0};
-                       info[idx] = (struct field_modify_info){4, 0,
+                       info[idx] = (struct field_modify_info){4, off,
                                                MLX5_MODI_OUT_SMAC_47_16};
                }
                break;
@@ -1631,13 +1643,13 @@ mlx5_flow_field_id_to_modify_info
                        mask[0] = rte_cpu_to_be_32(0xffffffff >> (32 - width));
                } else {
                        if (data->offset < 32)
-                               info[idx++] = (struct field_modify_info){4, 12,
+                               info[idx++] = (struct field_modify_info){4, 0,
                                                MLX5_MODI_OUT_SIPV6_31_0};
                        if (data->offset < 64)
-                               info[idx++] = (struct field_modify_info){4, 8,
+                               info[idx++] = (struct field_modify_info){4, 0,
                                                MLX5_MODI_OUT_SIPV6_63_32};
                        if (data->offset < 96)
-                               info[idx++] = (struct field_modify_info){4, 4,
+                               info[idx++] = (struct field_modify_info){4, 0,
                                                MLX5_MODI_OUT_SIPV6_95_64};
                        if (data->offset < 128)
                                info[idx++] = (struct field_modify_info){4, 0,
@@ -1699,13 +1711,13 @@ mlx5_flow_field_id_to_modify_info
                        mask[0] = rte_cpu_to_be_32(0xffffffff >> (32 - width));
                } else {
                        if (data->offset < 32)
-                               info[idx++] = (struct field_modify_info){4, 12,
+                               info[idx++] = (struct field_modify_info){4, 0,
                                                MLX5_MODI_OUT_DIPV6_31_0};
                        if (data->offset < 64)
-                               info[idx++] = (struct field_modify_info){4, 8,
+                               info[idx++] = (struct field_modify_info){4, 0,
                                                MLX5_MODI_OUT_DIPV6_63_32};
                        if (data->offset < 96)
-                               info[idx++] = (struct field_modify_info){4, 4,
+                               info[idx++] = (struct field_modify_info){4, 0,
                                                MLX5_MODI_OUT_DIPV6_95_64};
                        if (data->offset < 128)
                                info[idx++] = (struct field_modify_info){4, 0,
@@ -1806,16 +1818,11 @@ mlx5_flow_field_id_to_modify_info
                {
                        uint32_t meta_mask = priv->sh->dv_meta_mask;
                        uint32_t meta_count = __builtin_popcount(meta_mask);
-                       uint32_t msk_c0 =
-                               rte_cpu_to_be_32(priv->sh->dv_regc0_mask);
-                       uint32_t shl_c0 = rte_bsf32(msk_c0);
                        int reg = flow_dv_get_metadata_reg(dev, attr, error);
                        if (reg < 0)
                                return;
                        MLX5_ASSERT(reg != REG_NON);
                        MLX5_ASSERT((unsigned int)reg < RTE_DIM(reg_to_field));
-                       if (reg == REG_C_0)
-                               *shift = shl_c0;
                        info[idx] = (struct field_modify_info){4, 0,
                                                reg_to_field[reg]};
                        if (mask)
@@ -1823,6 +1830,13 @@ mlx5_flow_field_id_to_modify_info
                                        (meta_count - width)) & meta_mask);
                }
                break;
+       case RTE_FLOW_FIELD_IPV4_ECN:
+       case RTE_FLOW_FIELD_IPV6_ECN:
+               info[idx] = (struct field_modify_info){1, 0,
+                                       MLX5_MODI_OUT_IP_ECN};
+               if (mask)
+                       mask[idx] = 0x3 >> (2 - width);
+               break;
        case RTE_FLOW_FIELD_POINTER:
        case RTE_FLOW_FIELD_VALUE:
        default:
@@ -1867,29 +1881,33 @@ flow_dv_convert_action_modify_field
        struct field_modify_info dcopy[MLX5_ACT_MAX_MOD_FIELDS] = {
                                                                {0, 0, 0} };
        uint32_t mask[MLX5_ACT_MAX_MOD_FIELDS] = {0, 0, 0, 0, 0};
-       uint32_t type;
-       uint32_t shift = 0;
+       uint32_t type, meta = 0;
 
        if (conf->src.field == RTE_FLOW_FIELD_POINTER ||
            conf->src.field == RTE_FLOW_FIELD_VALUE) {
                type = MLX5_MODIFICATION_TYPE_SET;
                /** For SET fill the destination field (field) first. */
                mlx5_flow_field_id_to_modify_info(&conf->dst, field, mask,
-                                                 conf->width, &shift, dev,
+                                                 conf->width, dev,
                                                  attr, error);
                item.spec = conf->src.field == RTE_FLOW_FIELD_POINTER ?
                                        (void *)(uintptr_t)conf->src.pvalue :
                                        (void *)(uintptr_t)&conf->src.value;
+               if (conf->dst.field == RTE_FLOW_FIELD_META) {
+                       meta = *(const unaligned_uint32_t *)item.spec;
+                       meta = rte_cpu_to_be_32(meta);
+                       item.spec = &meta;
+               }
        } else {
                type = MLX5_MODIFICATION_TYPE_COPY;
                /** For COPY fill the destination field (dcopy) without mask. */
                mlx5_flow_field_id_to_modify_info(&conf->dst, dcopy, NULL,
-                                                 conf->width, &shift, dev,
+                                                 conf->width, dev,
                                                  attr, error);
                /** Then construct the source field (field) with mask. */
                mlx5_flow_field_id_to_modify_info(&conf->src, field, mask,
-                                                 conf->width, &shift,
-                                                 dev, attr, error);
+                                                 conf->width, dev,
+                                                 attr, error);
        }
        item.mask = &mask;
        return flow_dv_convert_modify_action(&item,
@@ -1918,7 +1936,7 @@ flow_dv_validate_item_mark(struct rte_eth_dev *dev,
                           struct rte_flow_error *error)
 {
        struct mlx5_priv *priv = dev->data->dev_private;
-       struct mlx5_dev_config *config = &priv->config;
+       struct mlx5_sh_config *config = &priv->sh->config;
        const struct rte_flow_item_mark *spec = item->spec;
        const struct rte_flow_item_mark *mask = item->mask;
        const struct rte_flow_item_mark nic_mask = {
@@ -1992,7 +2010,7 @@ flow_dv_validate_item_meta(struct rte_eth_dev *dev __rte_unused,
                           struct rte_flow_error *error)
 {
        struct mlx5_priv *priv = dev->data->dev_private;
-       struct mlx5_dev_config *config = &priv->config;
+       struct mlx5_sh_config *config = &priv->sh->config;
        const struct rte_flow_item_meta *spec = item->spec;
        const struct rte_flow_item_meta *mask = item->mask;
        struct rte_flow_item_meta nic_mask = {
@@ -2018,7 +2036,7 @@ flow_dv_validate_item_meta(struct rte_eth_dev *dev __rte_unused,
                if (reg == REG_NON)
                        return rte_flow_error_set(error, ENOTSUP,
                                        RTE_FLOW_ERROR_TYPE_ITEM, item,
-                                       "unavalable extended metadata register");
+                                       "unavailable extended metadata register");
                if (reg == REG_B)
                        return rte_flow_error_set(error, ENOTSUP,
                                          RTE_FLOW_ERROR_TYPE_ITEM, item,
@@ -2202,6 +2220,80 @@ flow_dv_validate_item_port_id(struct rte_eth_dev *dev,
        return 0;
 }
 
+/**
+ * Validate a represented port item; it is accepted only in transfer flows.
+ *
+ * @param[in] dev
+ *   Pointer to the rte_eth_dev structure.
+ * @param[in] item
+ *   Item specification; a NULL mask is treated as a full port_id mask.
+ * @param[in] attr
+ *   Attributes of flow that includes this item, transfer must be set.
+ * @param[in] item_flags
+ *   Bit-field holding the items detected until now.
+ * @param[out] error
+ *   Pointer to error structure.
+ *
+ * @return
+ *   0 on success, a negative errno value otherwise and rte_errno is set.
+ */
+static int
+flow_dv_validate_item_represented_port(struct rte_eth_dev *dev,
+                                      const struct rte_flow_item *item,
+                                      const struct rte_flow_attr *attr,
+                                      uint64_t item_flags,
+                                      struct rte_flow_error *error)
+{
+       const struct rte_flow_item_ethdev *spec = item->spec;
+       const struct rte_flow_item_ethdev *mask = item->mask;
+       const struct rte_flow_item_ethdev switch_mask = {
+                       .port_id = UINT16_MAX,
+       };
+       struct mlx5_priv *esw_priv;
+       struct mlx5_priv *dev_priv;
+       int ret;
+
+       if (!attr->transfer)
+               return rte_flow_error_set(error, EINVAL,
+                                         RTE_FLOW_ERROR_TYPE_ITEM, NULL,
+                                         "match on port id is valid only when transfer flag is enabled");
+       if (item_flags & MLX5_FLOW_ITEM_REPRESENTED_PORT)
+               return rte_flow_error_set(error, ENOTSUP,
+                                         RTE_FLOW_ERROR_TYPE_ITEM, item,
+                                         "multiple source ports are not supported");
+       if (!mask) /* No mask supplied: fall back to the full port_id mask. */
+               mask = &switch_mask;
+       if (mask->port_id != UINT16_MAX)
+               return rte_flow_error_set(error, ENOTSUP,
+                                          RTE_FLOW_ERROR_TYPE_ITEM_MASK, mask,
+                                          "no support for partial mask on \"id\" field");
+       ret = mlx5_flow_item_acceptable
+                               (item, (const uint8_t *)mask,
+                                (const uint8_t *)&rte_flow_item_ethdev_mask,
+                                sizeof(struct rte_flow_item_ethdev),
+                                MLX5_ITEM_RANGE_NOT_ACCEPTED, error);
+       if (ret)
+               return ret;
+       if (!spec || spec->port_id == UINT16_MAX) /* No concrete port to check. */
+               return 0;
+       esw_priv = mlx5_port_to_eswitch_info(spec->port_id, false);
+       if (!esw_priv)
+               return rte_flow_error_set(error, rte_errno,
+                                         RTE_FLOW_ERROR_TYPE_ITEM_SPEC, spec,
+                                         "failed to obtain E-Switch info for port");
+       dev_priv = mlx5_dev_to_eswitch_info(dev);
+       if (!dev_priv)
+               return rte_flow_error_set(error, rte_errno,
+                                         RTE_FLOW_ERROR_TYPE_UNSPECIFIED,
+                                         NULL,
+                                         "failed to obtain E-Switch info");
+       if (esw_priv->domain_id != dev_priv->domain_id) /* Domains must match. */
+               return rte_flow_error_set(error, EINVAL,
+                                         RTE_FLOW_ERROR_TYPE_ITEM_SPEC, spec,
+                                         "cannot match on a port from a different E-Switch");
+       return 0;
+}
+
 /**
  * Validate VLAN item.
  *
@@ -2318,7 +2410,7 @@ flow_dv_validate_item_gtp(struct rte_eth_dev *dev,
                .teid = RTE_BE32(0xffffffff),
        };
 
-       if (!priv->config.hca_attr.tunnel_stateless_gtp)
+       if (!priv->sh->cdev->config.hca_attr.tunnel_stateless_gtp)
                return rte_flow_error_set(error, ENOTSUP,
                                          RTE_FLOW_ERROR_TYPE_ITEM, item,
                                          "GTP support is not enabled");
@@ -2427,6 +2519,7 @@ flow_dv_validate_item_ipv4(struct rte_eth_dev *dev,
 {
        int ret;
        struct mlx5_priv *priv = dev->data->dev_private;
+       struct mlx5_hca_attr *attr = &priv->sh->cdev->config.hca_attr;
        const struct rte_flow_item_ipv4 *spec = item->spec;
        const struct rte_flow_item_ipv4 *last = item->last;
        const struct rte_flow_item_ipv4 *mask = item->mask;
@@ -2445,8 +2538,8 @@ flow_dv_validate_item_ipv4(struct rte_eth_dev *dev,
 
        if (mask && (mask->hdr.version_ihl & RTE_IPV4_HDR_IHL_MASK)) {
                int tunnel = !!(item_flags & MLX5_FLOW_LAYER_TUNNEL);
-               bool ihl_cap = !tunnel ? priv->config.hca_attr.outer_ipv4_ihl :
-                              priv->config.hca_attr.inner_ipv4_ihl;
+               bool ihl_cap = !tunnel ?
+                              attr->outer_ipv4_ihl : attr->inner_ipv4_ihl;
                if (!ihl_cap)
                        return rte_flow_error_set(error, ENOTSUP,
                                                  RTE_FLOW_ERROR_TYPE_ITEM,
@@ -2865,8 +2958,6 @@ flow_dv_validate_action_push_vlan(struct rte_eth_dev *dev,
 {
        const struct rte_flow_action_of_push_vlan *push_vlan = action->conf;
        const struct mlx5_priv *priv = dev->data->dev_private;
-       struct mlx5_dev_ctx_shared *sh = priv->sh;
-       bool direction_error = false;
 
        if (push_vlan->ethertype != RTE_BE16(RTE_ETHER_TYPE_VLAN) &&
            push_vlan->ethertype != RTE_BE16(RTE_ETHER_TYPE_QINQ))
@@ -2878,22 +2969,6 @@ flow_dv_validate_action_push_vlan(struct rte_eth_dev *dev,
                                          RTE_FLOW_ERROR_TYPE_ACTION, action,
                                          "wrong action order, port_id should "
                                          "be after push VLAN");
-       /* Push VLAN is not supported in ingress except for CX6 FDB mode. */
-       if (attr->transfer) {
-               bool fdb_tx = priv->representor_id != UINT16_MAX;
-               bool is_cx5 = sh->steering_format_version ==
-                   MLX5_STEERING_LOGIC_FORMAT_CONNECTX_5;
-
-               if (!fdb_tx && is_cx5)
-                       direction_error = true;
-       } else if (attr->ingress) {
-               direction_error = true;
-       }
-       if (direction_error)
-               return rte_flow_error_set(error, ENOTSUP,
-                                         RTE_FLOW_ERROR_TYPE_ATTR_INGRESS,
-                                         NULL,
-                                         "push vlan action not supported for ingress");
        if (!attr->transfer && priv->representor)
                return rte_flow_error_set(error, ENOTSUP,
                                          RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
@@ -3041,7 +3116,7 @@ flow_dv_validate_action_flag(struct rte_eth_dev *dev,
                             struct rte_flow_error *error)
 {
        struct mlx5_priv *priv = dev->data->dev_private;
-       struct mlx5_dev_config *config = &priv->config;
+       struct mlx5_sh_config *config = &priv->sh->config;
        int ret;
 
        /* Fall back if no extended metadata register support. */
@@ -3100,7 +3175,7 @@ flow_dv_validate_action_mark(struct rte_eth_dev *dev,
                             struct rte_flow_error *error)
 {
        struct mlx5_priv *priv = dev->data->dev_private;
-       struct mlx5_dev_config *config = &priv->config;
+       struct mlx5_sh_config *config = &priv->sh->config;
        const struct rte_flow_action_mark *mark = action->conf;
        int ret;
 
@@ -3174,7 +3249,7 @@ flow_dv_validate_action_set_meta(struct rte_eth_dev *dev,
                                 struct rte_flow_error *error)
 {
        struct mlx5_priv *priv = dev->data->dev_private;
-       struct mlx5_dev_config *config = &priv->config;
+       struct mlx5_sh_config *config = &priv->sh->config;
        const struct rte_flow_action_set_meta *conf;
        uint32_t nic_mask = UINT32_MAX;
        int reg;
@@ -3191,7 +3266,7 @@ flow_dv_validate_action_set_meta(struct rte_eth_dev *dev,
        if (reg == REG_NON)
                return rte_flow_error_set(error, ENOTSUP,
                                          RTE_FLOW_ERROR_TYPE_ACTION, action,
-                                         "unavalable extended metadata register");
+                                         "unavailable extended metadata register");
        if (reg != REG_A && reg != REG_B) {
                struct mlx5_priv *priv = dev->data->dev_private;
 
@@ -3269,6 +3344,25 @@ flow_dv_validate_action_set_tag(struct rte_eth_dev *dev,
        return 0;
 }
 
+/**
+ * Indicates whether ASO aging is supported for a flow with given attributes.
+ *
+ * @param[in] sh
+ *   Pointer to shared device context structure, asserted to be non-NULL.
+ * @param[in] attr
+ *   Attributes of flow that includes AGE action, asserted to be non-NULL.
+ *
+ * @return
+ *   True when flow_hit_aso_en is set and the flow is transfer or group != 0.
+ */
+static inline bool
+flow_hit_aso_supported(const struct mlx5_dev_ctx_shared *sh,
+               const struct rte_flow_attr *attr)
+{
+       MLX5_ASSERT(sh && attr);
+       return (sh->flow_hit_aso_en && (attr->transfer || attr->group));
+}
+
 /**
  * Validate count action.
  *
@@ -3278,6 +3372,8 @@ flow_dv_validate_action_set_tag(struct rte_eth_dev *dev,
  *   Indicator if action is shared.
  * @param[in] action_flags
  *   Holds the actions detected until now.
+ * @param[in] attr
+ *   Attributes of flow that includes this action.
  * @param[out] error
  *   Pointer to error structure.
  *
@@ -3287,21 +3383,22 @@ flow_dv_validate_action_set_tag(struct rte_eth_dev *dev,
 static int
 flow_dv_validate_action_count(struct rte_eth_dev *dev, bool shared,
                              uint64_t action_flags,
+                             const struct rte_flow_attr *attr,
                              struct rte_flow_error *error)
 {
        struct mlx5_priv *priv = dev->data->dev_private;
 
-       if (!priv->sh->devx)
+       if (!priv->sh->cdev->config.devx)
                goto notsup_err;
        if (action_flags & MLX5_FLOW_ACTION_COUNT)
                return rte_flow_error_set(error, EINVAL,
                                          RTE_FLOW_ERROR_TYPE_ACTION, NULL,
                                          "duplicate count actions set");
        if (shared && (action_flags & MLX5_FLOW_ACTION_AGE) &&
-           !priv->sh->flow_hit_aso_en)
+           !flow_hit_aso_supported(priv->sh, attr))
                return rte_flow_error_set(error, EINVAL,
                                          RTE_FLOW_ERROR_TYPE_ACTION, NULL,
-                                         "old age and shared count combination is not supported");
+                                         "old age and indirect count combination is not supported");
 #ifdef HAVE_IBV_FLOW_DEVX_COUNTERS
        return 0;
 #endif
@@ -3385,8 +3482,8 @@ flow_dv_validate_action_decap(struct rte_eth_dev *dev,
 {
        const struct mlx5_priv *priv = dev->data->dev_private;
 
-       if (priv->config.hca_attr.scatter_fcs_w_decap_disable &&
-           !priv->config.decap_en)
+       if (priv->sh->cdev->config.hca_attr.scatter_fcs_w_decap_disable &&
+           !priv->sh->config.decap_en)
                return rte_flow_error_set(error, ENOTSUP,
                                          RTE_FLOW_ERROR_TYPE_ACTION, NULL,
                                          "decap is not enabled");
@@ -3726,7 +3823,8 @@ flow_dv_encap_decap_resource_register
                                flow_dv_encap_decap_match_cb,
                                flow_dv_encap_decap_remove_cb,
                                flow_dv_encap_decap_clone_cb,
-                               flow_dv_encap_decap_clone_free_cb);
+                               flow_dv_encap_decap_clone_free_cb,
+                               error);
        if (unlikely(!encaps_decaps))
                return -rte_errno;
        resource->flags = dev_flow->dv.group ? 0 : 1;
@@ -4025,7 +4123,7 @@ flow_dv_push_vlan_action_resource_register
  * @return
  *   sizeof struct item_type, 0 if void or irrelevant.
  */
-static size_t
+size_t
 flow_dv_get_item_hdr_len(const enum rte_flow_item_type item_type)
 {
        size_t retval;
@@ -4091,7 +4189,7 @@ flow_dv_get_item_hdr_len(const enum rte_flow_item_type item_type)
  * @return
  *   0 on success, a negative errno value otherwise and rte_errno is set.
  */
-static int
+int
 flow_dv_convert_encap_data(const struct rte_flow_item *items, uint8_t *buf,
                           size_t *size, struct rte_flow_error *error)
 {
@@ -4811,7 +4909,8 @@ flow_dv_validate_action_modify_field(struct rte_eth_dev *dev,
 {
        int ret = 0;
        struct mlx5_priv *priv = dev->data->dev_private;
-       struct mlx5_dev_config *config = &priv->config;
+       struct mlx5_sh_config *config = &priv->sh->config;
+       struct mlx5_hca_attr *hca_attr = &priv->sh->cdev->config.hca_attr;
        const struct rte_flow_action_modify_field *action_modify_field =
                action->conf;
        uint32_t dst_width = mlx5_flow_item_field_width(dev,
@@ -4939,6 +5038,15 @@ flow_dv_validate_action_modify_field(struct rte_eth_dev *dev,
                                RTE_FLOW_ERROR_TYPE_ACTION, action,
                                "add and sub operations"
                                " are not supported");
+       if (action_modify_field->dst.field == RTE_FLOW_FIELD_IPV4_ECN ||
+           action_modify_field->src.field == RTE_FLOW_FIELD_IPV4_ECN ||
+           action_modify_field->dst.field == RTE_FLOW_FIELD_IPV6_ECN ||
+           action_modify_field->src.field == RTE_FLOW_FIELD_IPV6_ECN)
+               if (!hca_attr->modify_outer_ip_ecn &&
+                   !attr->transfer && !attr->group)
+                       return rte_flow_error_set(error, ENOTSUP,
+                               RTE_FLOW_ERROR_TYPE_ACTION, action,
+                               "modifications of the ECN for current firmware is not supported");
        return (action_modify_field->width / 32) +
               !!(action_modify_field->width % 32);
 }
@@ -4968,7 +5076,7 @@ flow_dv_validate_action_jump(struct rte_eth_dev *dev,
                             const struct rte_flow_attr *attributes,
                             bool external, struct rte_flow_error *error)
 {
-       uint32_t target_group, table;
+       uint32_t target_group, table = 0;
        int ret = 0;
        struct flow_grp_info grp_info = {
                .external = !!external,
@@ -4999,6 +5107,10 @@ flow_dv_validate_action_jump(struct rte_eth_dev *dev,
                                          RTE_FLOW_ERROR_TYPE_ACTION, NULL,
                                          "target group must be other than"
                                          " the current flow group");
+       if (table == 0)
+               return rte_flow_error_set(error, EINVAL,
+                                         RTE_FLOW_ERROR_TYPE_ACTION_CONF,
+                                         NULL, "root table shouldn't be destination");
        return 0;
 }
 
@@ -5119,6 +5231,8 @@ flow_dv_modify_hdr_action_max(struct rte_eth_dev *dev __rte_unused,
  *   Pointer to rte_eth_dev structure.
  * @param[in] action_flags
  *   Bit-fields that holds the actions detected until now.
+ * @param[in] item_flags
+ *   Holds the items detected.
  * @param[in] action
  *   Pointer to the meter action.
  * @param[in] attr
@@ -5129,11 +5243,11 @@ flow_dv_modify_hdr_action_max(struct rte_eth_dev *dev __rte_unused,
  *   Pointer to error structure.
  *
  * @return
- *   0 on success, a negative errno value otherwise and rte_ernno is set.
+ *   0 on success, a negative errno value otherwise and rte_errno is set.
  */
 static int
 mlx5_flow_validate_action_meter(struct rte_eth_dev *dev,
-                               uint64_t action_flags,
+                               uint64_t action_flags, uint64_t item_flags,
                                const struct rte_flow_action *action,
                                const struct rte_flow_attr *attr,
                                const struct rte_flow_item *port_id_item,
@@ -5237,6 +5351,35 @@ mlx5_flow_validate_action_meter(struct rte_eth_dev *dev,
                                                NULL,
                                                "Flow and meter policy "
                                                "have different src port.");
+               } else if (mtr_policy->is_rss) {
+                       struct mlx5_flow_meter_policy *fp;
+                       struct mlx5_meter_policy_action_container *acg;
+                       struct mlx5_meter_policy_action_container *acy;
+                       const struct rte_flow_action *rss_act;
+                       int ret;
+
+                       fp = mlx5_flow_meter_hierarchy_get_final_policy(dev,
+                                                               mtr_policy);
+                       if (fp == NULL)
+                               return rte_flow_error_set(error, EINVAL,
+                                       RTE_FLOW_ERROR_TYPE_ACTION, NULL,
+                                                 "Unable to get the final "
+                                                 "policy in the hierarchy");
+                       acg = &fp->act_cnt[RTE_COLOR_GREEN];
+                       acy = &fp->act_cnt[RTE_COLOR_YELLOW];
+                       MLX5_ASSERT(acg->fate_action ==
+                                   MLX5_FLOW_FATE_SHARED_RSS ||
+                                   acy->fate_action ==
+                                   MLX5_FLOW_FATE_SHARED_RSS);
+                       if (acg->fate_action == MLX5_FLOW_FATE_SHARED_RSS)
+                               rss_act = acg->rss;
+                       else
+                               rss_act = acy->rss;
+                       ret = mlx5_flow_validate_action_rss(rss_act,
+                                       action_flags, dev, attr,
+                                       item_flags, error);
+                       if (ret)
+                               return ret;
                }
                *def_policy = false;
        }
@@ -5267,8 +5410,8 @@ flow_dv_validate_action_age(uint64_t action_flags,
        struct mlx5_priv *priv = dev->data->dev_private;
        const struct rte_flow_action_age *age = action->conf;
 
-       if (!priv->sh->devx || (priv->sh->cmng.counter_fallback &&
-           !priv->sh->aso_age_mng))
+       if (!priv->sh->cdev->config.devx ||
+           (priv->sh->cmng.counter_fallback && !priv->sh->aso_age_mng))
                return rte_flow_error_set(error, ENOTSUP,
                                          RTE_FLOW_ERROR_TYPE_UNSPECIFIED,
                                          NULL,
@@ -5388,8 +5531,9 @@ flow_dv_modify_ipool_get(struct mlx5_dev_ctx_shared *sh, uint8_t index)
                       .grow_trunk = 3,
                       .grow_shift = 2,
                       .need_lock = 1,
-                      .release_mem_en = !!sh->reclaim_mode,
-                      .per_core_cache = sh->reclaim_mode ? 0 : (1 << 16),
+                      .release_mem_en = !!sh->config.reclaim_mode,
+                      .per_core_cache =
+                                      sh->config.reclaim_mode ? 0 : (1 << 16),
                       .malloc = mlx5_malloc,
                       .free = mlx5_free,
                       .type = "mlx5_modify_action_resource",
@@ -5536,7 +5680,7 @@ flow_dv_validate_action_sample(uint64_t *action_flags,
                               struct rte_flow_error *error)
 {
        struct mlx5_priv *priv = dev->data->dev_private;
-       struct mlx5_dev_config *dev_conf = &priv->config;
+       struct mlx5_sh_config *dev_conf = &priv->sh->config;
        const struct rte_flow_action_sample *sample = action->conf;
        const struct rte_flow_action *act;
        uint64_t sub_action_flags = 0;
@@ -5552,7 +5696,8 @@ flow_dv_validate_action_sample(uint64_t *action_flags,
                return rte_flow_error_set(error, EINVAL,
                                          RTE_FLOW_ERROR_TYPE_ACTION, action,
                                          "ratio value starts from 1");
-       if (!priv->sh->devx || (sample->ratio > 0 && !priv->sampler_en))
+       if (!priv->sh->cdev->config.devx ||
+           (sample->ratio > 0 && !priv->sampler_en))
                return rte_flow_error_set(error, ENOTSUP,
                                          RTE_FLOW_ERROR_TYPE_UNSPECIFIED,
                                          NULL,
@@ -5633,7 +5778,7 @@ flow_dv_validate_action_sample(uint64_t *action_flags,
                case RTE_FLOW_ACTION_TYPE_COUNT:
                        ret = flow_dv_validate_action_count
                                (dev, false, *action_flags | sub_action_flags,
-                                error);
+                                attr, error);
                        if (ret < 0)
                                return ret;
                        *count = act->conf;
@@ -5719,14 +5864,13 @@ flow_dv_validate_action_sample(uint64_t *action_flags,
                                                  NULL,
                                                  "E-Switch must has a dest "
                                                  "port for mirroring");
-               if (!priv->config.hca_attr.reg_c_preserve &&
+               if (!priv->sh->cdev->config.hca_attr.reg_c_preserve &&
                     priv->representor_id != UINT16_MAX)
                        *fdb_mirror_limit = 1;
        }
        /* Continue validation for Xcap actions.*/
        if ((sub_action_flags & MLX5_FLOW_XCAP_ACTIONS) &&
-           (queue_index == 0xFFFF ||
-            mlx5_rxq_get_type(dev, queue_index) != MLX5_RXQ_TYPE_HAIRPIN)) {
+           (queue_index == 0xFFFF || !mlx5_rxq_is_hairpin(dev, queue_index))) {
                if ((sub_action_flags & MLX5_FLOW_XCAP_ACTIONS) ==
                     MLX5_FLOW_XCAP_ACTIONS)
                        return rte_flow_error_set(error, ENOTSUP,
@@ -5787,7 +5931,8 @@ flow_dv_modify_hdr_resource_register
                                flow_dv_modify_match_cb,
                                flow_dv_modify_remove_cb,
                                flow_dv_modify_clone_cb,
-                               flow_dv_modify_clone_free_cb);
+                               flow_dv_modify_clone_free_cb,
+                               error);
        if (unlikely(!modify_cmds))
                return -rte_errno;
        resource->root = !dev_flow->dv.group;
@@ -6140,7 +6285,7 @@ flow_dv_counter_alloc(struct rte_eth_dev *dev, uint32_t age)
                        age ? MLX5_COUNTER_TYPE_AGE : MLX5_COUNTER_TYPE_ORIGIN;
        uint32_t cnt_idx;
 
-       if (!priv->sh->devx) {
+       if (!priv->sh->cdev->config.devx) {
                rte_errno = ENOTSUP;
                return 0;
        }
@@ -6463,7 +6608,7 @@ flow_dv_mtr_alloc(struct rte_eth_dev *dev)
        struct mlx5_aso_mtr_pool *pool;
        uint32_t mtr_idx = 0;
 
-       if (!priv->sh->devx) {
+       if (!priv->sh->cdev->config.devx) {
                rte_errno = ENOTSUP;
                return 0;
        }
@@ -6483,13 +6628,13 @@ flow_dv_mtr_alloc(struct rte_eth_dev *dev)
                        struct mlx5_aso_mtr_pool,
                        mtrs[mtr_free->offset]);
        mtr_idx = MLX5_MAKE_MTR_IDX(pool->index, mtr_free->offset);
-       if (!mtr_free->fm.meter_action) {
+       if (!mtr_free->fm.meter_action_g) {
 #ifdef HAVE_MLX5_DR_CREATE_ACTION_ASO
                struct rte_flow_error error;
                uint8_t reg_id;
 
                reg_id = mlx5_flow_get_reg_id(dev, MLX5_MTR_COLOR, 0, &error);
-               mtr_free->fm.meter_action =
+               mtr_free->fm.meter_action_g =
                        mlx5_glue->dv_create_flow_action_aso
                                                (priv->sh->rx_domain,
                                                 pool->devx_obj->obj,
@@ -6497,7 +6642,7 @@ flow_dv_mtr_alloc(struct rte_eth_dev *dev)
                                                 (1 << MLX5_FLOW_COLOR_GREEN),
                                                 reg_id - REG_C_0);
 #endif /* HAVE_MLX5_DR_CREATE_ACTION_ASO */
-               if (!mtr_free->fm.meter_action) {
+               if (!mtr_free->fm.meter_action_g) {
                        flow_dv_aso_mtr_release_to_pool(dev, mtr_idx);
                        return 0;
                }
@@ -6559,16 +6704,11 @@ flow_dv_validate_attributes(struct rte_eth_dev *dev,
                                          NULL,
                                          "priority out of range");
        if (attributes->transfer) {
-               if (!priv->config.dv_esw_en)
+               if (!priv->sh->config.dv_esw_en)
                        return rte_flow_error_set
                                (error, ENOTSUP,
                                 RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
                                 "E-Switch dr is not supported");
-               if (!(priv->representor || priv->master))
-                       return rte_flow_error_set
-                               (error, EINVAL, RTE_FLOW_ERROR_TYPE_UNSPECIFIED,
-                                NULL, "E-Switch configuration can only be"
-                                " done by a master or a representor device");
                if (attributes->egress)
                        return rte_flow_error_set
                                (error, ENOTSUP,
@@ -6652,7 +6792,7 @@ flow_dv_validate_item_integrity(struct rte_eth_dev *dev,
        const struct rte_flow_item_integrity *spec = (typeof(spec))
                                                     integrity_item->spec;
 
-       if (!priv->config.hca_attr.pkt_integrity_match)
+       if (!priv->sh->cdev->config.hca_attr.pkt_integrity_match)
                return rte_flow_error_set(error, ENOTSUP,
                                          RTE_FLOW_ERROR_TYPE_ITEM,
                                          integrity_item,
@@ -6799,7 +6939,7 @@ flow_dv_validate(struct rte_eth_dev *dev, const struct rte_flow_attr *attr,
                 bool external, int hairpin, struct rte_flow_error *error)
 {
        int ret;
-       uint64_t action_flags = 0;
+       uint64_t aso_mask, action_flags = 0;
        uint64_t item_flags = 0;
        uint64_t last_item = 0;
        uint8_t next_protocol = 0xff;
@@ -6849,7 +6989,7 @@ flow_dv_validate(struct rte_eth_dev *dev, const struct rte_flow_attr *attr,
                },
        };
        struct mlx5_priv *priv = dev->data->dev_private;
-       struct mlx5_dev_config *dev_conf = &priv->config;
+       struct mlx5_sh_config *dev_conf = &priv->sh->config;
        uint16_t queue_index = 0xFFFF;
        const struct rte_flow_item_vlan *vlan_m = NULL;
        uint32_t rw_act_num = 0;
@@ -6866,14 +7006,18 @@ flow_dv_validate(struct rte_eth_dev *dev, const struct rte_flow_attr *attr,
        const struct rte_flow_item *integrity_items[2] = {NULL, NULL};
        const struct rte_flow_item *port_id_item = NULL;
        bool def_policy = false;
+       bool shared_count = false;
        uint16_t udp_dport = 0;
+       uint32_t tag_id = 0;
+       const struct rte_flow_action_age *non_shared_age = NULL;
+       const struct rte_flow_action_count *count = NULL;
 
        if (items == NULL)
                return -1;
        tunnel = is_tunnel_offload_active(dev) ?
                 mlx5_get_tof(items, actions, &tof_rule_type) : NULL;
        if (tunnel) {
-               if (!priv->config.dv_flow_en)
+               if (!dev_conf->dv_flow_en)
                        return rte_flow_error_set
                                (error, ENOTSUP,
                                 RTE_FLOW_ERROR_TYPE_UNSPECIFIED,
@@ -6906,6 +7050,14 @@ flow_dv_validate(struct rte_eth_dev *dev, const struct rte_flow_attr *attr,
                switch (type) {
                case RTE_FLOW_ITEM_TYPE_VOID:
                        break;
+               case RTE_FLOW_ITEM_TYPE_ESP:
+                       ret = mlx5_flow_os_validate_item_esp(items, item_flags,
+                                                         next_protocol,
+                                                         error);
+                       if (ret < 0)
+                               return ret;
+                       last_item = MLX5_FLOW_ITEM_ESP;
+                       break;
                case RTE_FLOW_ITEM_TYPE_PORT_ID:
                        ret = flow_dv_validate_item_port_id
                                        (dev, items, attr, item_flags, error);
@@ -6914,6 +7066,13 @@ flow_dv_validate(struct rte_eth_dev *dev, const struct rte_flow_attr *attr,
                        last_item = MLX5_FLOW_ITEM_PORT_ID;
                        port_id_item = items;
                        break;
+               case RTE_FLOW_ITEM_TYPE_REPRESENTED_PORT:
+                       ret = flow_dv_validate_item_represented_port
+                                       (dev, items, attr, item_flags, error);
+                       if (ret < 0)
+                               return ret;
+                       last_item = MLX5_FLOW_ITEM_REPRESENTED_PORT;
+                       break;
                case RTE_FLOW_ITEM_TYPE_ETH:
                        ret = mlx5_flow_validate_item_eth(items, item_flags,
                                                          true, error);
@@ -7067,6 +7226,13 @@ flow_dv_validate(struct rte_eth_dev *dev, const struct rte_flow_attr *attr,
                        gre_item = items;
                        last_item = MLX5_FLOW_LAYER_GRE;
                        break;
+               case RTE_FLOW_ITEM_TYPE_GRE_OPTION:
+                       ret = mlx5_flow_validate_item_gre_option(dev, items, item_flags,
+                                                         attr, gre_item, error);
+                       if (ret < 0)
+                               return ret;
+                       last_item = MLX5_FLOW_LAYER_GRE;
+                       break;
                case RTE_FLOW_ITEM_TYPE_NVGRE:
                        ret = mlx5_flow_validate_item_nvgre(items, item_flags,
                                                            next_protocol,
@@ -7164,8 +7330,10 @@ flow_dv_validate(struct rte_eth_dev *dev, const struct rte_flow_attr *attr,
                                return ret;
                        last_item = MLX5_FLOW_ITEM_TAG;
                        break;
-               case MLX5_RTE_FLOW_ITEM_TYPE_TAG:
                case MLX5_RTE_FLOW_ITEM_TYPE_TX_QUEUE:
+                       last_item = MLX5_FLOW_ITEM_TX_QUEUE;
+                       break;
+               case MLX5_RTE_FLOW_ITEM_TYPE_TAG:
                        break;
                case RTE_FLOW_ITEM_TYPE_GTP:
                        ret = flow_dv_validate_item_gtp(dev, items, item_flags,
@@ -7236,7 +7404,6 @@ flow_dv_validate(struct rte_eth_dev *dev, const struct rte_flow_attr *attr,
        }
        for (; actions->type != RTE_FLOW_ACTION_TYPE_END; actions++) {
                int type = actions->type;
-               bool shared_count = false;
 
                if (!mlx5_flow_os_action_supported(type))
                        return rte_flow_error_set(error, ENOTSUP,
@@ -7335,6 +7502,8 @@ flow_dv_validate(struct rte_eth_dev *dev, const struct rte_flow_attr *attr,
                                ++actions_n;
                        if (action_flags & MLX5_FLOW_ACTION_SAMPLE)
                                modify_after_mirror = 1;
+                       tag_id = ((const struct rte_flow_action_set_tag *)
+                                 actions->conf)->index;
                        action_flags |= MLX5_FLOW_ACTION_SET_TAG;
                        rw_act_num += MLX5_ACT_NUM_SET_TAG;
                        break;
@@ -7393,9 +7562,10 @@ flow_dv_validate(struct rte_eth_dev *dev, const struct rte_flow_attr *attr,
                case RTE_FLOW_ACTION_TYPE_COUNT:
                        ret = flow_dv_validate_action_count(dev, shared_count,
                                                            action_flags,
-                                                           error);
+                                                           attr, error);
                        if (ret < 0)
                                return ret;
+                       count = actions->conf;
                        action_flags |= MLX5_FLOW_ACTION_COUNT;
                        ++actions_n;
                        break;
@@ -7670,6 +7840,7 @@ flow_dv_validate(struct rte_eth_dev *dev, const struct rte_flow_attr *attr,
                case RTE_FLOW_ACTION_TYPE_METER:
                        ret = mlx5_flow_validate_action_meter(dev,
                                                              action_flags,
+                                                             item_flags,
                                                              actions, attr,
                                                              port_id_item,
                                                              &def_policy,
@@ -7700,6 +7871,7 @@ flow_dv_validate(struct rte_eth_dev *dev, const struct rte_flow_attr *attr,
                        ++actions_n;
                        break;
                case RTE_FLOW_ACTION_TYPE_AGE:
+                       non_shared_age = actions->conf;
                        ret = flow_dv_validate_action_age(action_flags,
                                                          actions, dev,
                                                          error);
@@ -7707,15 +7879,15 @@ flow_dv_validate(struct rte_eth_dev *dev, const struct rte_flow_attr *attr,
                                return ret;
                        /*
                         * Validate the regular AGE action (using counter)
-                        * mutual exclusion with share counter actions.
+                        * mutual exclusion with indirect counter actions.
                         */
-                       if (!priv->sh->flow_hit_aso_en) {
+                       if (!flow_hit_aso_supported(priv->sh, attr)) {
                                if (shared_count)
                                        return rte_flow_error_set
                                                (error, EINVAL,
                                                RTE_FLOW_ERROR_TYPE_ACTION,
                                                NULL,
-                                               "old age and shared count combination is not supported");
+                                               "old age and indirect count combination is not supported");
                                if (sample_count)
                                        return rte_flow_error_set
                                                (error, EINVAL,
@@ -7768,6 +7940,11 @@ flow_dv_validate(struct rte_eth_dev *dev, const struct rte_flow_attr *attr,
                                                             error);
                        if (ret < 0)
                                return ret;
+                       if ((action_flags & MLX5_FLOW_ACTION_SET_TAG) &&
+                           tag_id == 0 && priv->mtr_color_reg == REG_NON)
+                               return rte_flow_error_set(error, EINVAL,
+                                       RTE_FLOW_ERROR_TYPE_ACTION, NULL,
+                                       "sample after tag action causes metadata tag index 0 corruption");
                        action_flags |= MLX5_FLOW_ACTION_SAMPLE;
                        ++actions_n;
                        break;
@@ -7812,7 +7989,7 @@ flow_dv_validate(struct rte_eth_dev *dev, const struct rte_flow_attr *attr,
         * - Explicit decap action is prohibited by the tunnel offload API.
         * - Drop action in tunnel steer rule is prohibited by the API.
         * - Application cannot use MARK action because it's value can mask
-        *   tunnel default miss nitification.
+        *   tunnel default miss notification.
         * - JUMP in tunnel match rule has no support in current PMD
         *   implementation.
         * - TAG & META are reserved for future uses.
@@ -7914,8 +8091,7 @@ flow_dv_validate(struct rte_eth_dev *dev, const struct rte_flow_attr *attr,
         */
        if ((action_flags & (MLX5_FLOW_XCAP_ACTIONS |
                             MLX5_FLOW_VLAN_ACTIONS)) &&
-           (queue_index == 0xFFFF ||
-            mlx5_rxq_get_type(dev, queue_index) != MLX5_RXQ_TYPE_HAIRPIN ||
+           (queue_index == 0xFFFF || !mlx5_rxq_is_hairpin(dev, queue_index) ||
             ((conf = mlx5_rxq_get_hairpin_conf(dev, queue_index)) != NULL &&
             conf->tx_explicit != 0))) {
                if ((action_flags & MLX5_FLOW_XCAP_ACTIONS) ==
@@ -7924,6 +8100,28 @@ flow_dv_validate(struct rte_eth_dev *dev, const struct rte_flow_attr *attr,
                                                  RTE_FLOW_ERROR_TYPE_ACTION,
                                                  NULL, "encap and decap "
                                                  "combination aren't supported");
+               /* Push VLAN is not supported in ingress except for NICs newer than CX5. */
+               if (action_flags & MLX5_FLOW_ACTION_OF_PUSH_VLAN) {
+                       struct mlx5_dev_ctx_shared *sh = priv->sh;
+                       bool direction_error = false;
+
+                       if (attr->transfer) {
+                               bool fdb_tx = priv->representor_id != UINT16_MAX;
+                               bool is_cx5 = sh->steering_format_version ==
+                                   MLX5_STEERING_LOGIC_FORMAT_CONNECTX_5;
+
+                               if (!fdb_tx && is_cx5)
+                                       direction_error = true;
+                       } else if (attr->ingress) {
+                               direction_error = true;
+                       }
+                       if (direction_error)
+                               return rte_flow_error_set(error, ENOTSUP,
+                                                         RTE_FLOW_ERROR_TYPE_ATTR_INGRESS,
+                                                         NULL,
+                                                         "push VLAN action not supported "
+                                                         "for ingress");
+               }
                if (!attr->transfer && attr->ingress) {
                        if (action_flags & MLX5_FLOW_ACTION_ENCAP)
                                return rte_flow_error_set
@@ -7931,12 +8129,6 @@ flow_dv_validate(struct rte_eth_dev *dev, const struct rte_flow_attr *attr,
                                                 RTE_FLOW_ERROR_TYPE_ACTION,
                                                 NULL, "encap is not supported"
                                                 " for ingress traffic");
-                       else if (action_flags & MLX5_FLOW_ACTION_OF_PUSH_VLAN)
-                               return rte_flow_error_set
-                                               (error, ENOTSUP,
-                                                RTE_FLOW_ERROR_TYPE_ACTION,
-                                                NULL, "push VLAN action not "
-                                                "supported for ingress");
                        else if ((action_flags & MLX5_FLOW_VLAN_ACTIONS) ==
                                        MLX5_FLOW_VLAN_ACTIONS)
                                return rte_flow_error_set
@@ -7976,6 +8168,20 @@ flow_dv_validate(struct rte_eth_dev *dev, const struct rte_flow_attr *attr,
                                        "cannot be done before meter action");
                }
        }
+       /*
+        * Only support one ASO action in a single flow rule.
+        * non-shared AGE + counter will fallback to use HW counter, no ASO hit object.
+        * Group 0 uses HW counter for AGE too even if no counter action.
+        */
+       aso_mask = (action_flags & MLX5_FLOW_ACTION_METER && priv->sh->meter_aso_en) << 2 |
+                  (action_flags & MLX5_FLOW_ACTION_CT && priv->sh->ct_aso_en) << 1 |
+                  (action_flags & MLX5_FLOW_ACTION_AGE &&
+                   !(non_shared_age && count) &&
+                   (attr->group || (attr->transfer && priv->fdb_def_rule)) &&
+                   priv->sh->flow_hit_aso_en);
+       if (__builtin_popcountl(aso_mask) > 1)
+               return rte_flow_error_set(error, ENOTSUP, RTE_FLOW_ERROR_TYPE_ACTION,
+                                         NULL, "unsupported combining AGE, METER, CT ASO actions in a single rule");
        /*
         * Hairpin flow will add one more TAG action in TX implicit mode.
         * In TX explicit mode, there will be no hairpin flow ID.
@@ -7999,6 +8205,18 @@ flow_dv_validate(struct rte_eth_dev *dev, const struct rte_flow_attr *attr,
                return rte_flow_error_set(error, EINVAL,
                                RTE_FLOW_ERROR_TYPE_ACTION, NULL,
                                "sample before modify action is not supported");
+       /*
+        * Validate NIC egress flows on a representor: except for the implicit
+        * hairpin default egress flow with a TX_QUEUE item, such flows do not
+        * work due to a metadata regC0 mismatch.
+        */
+       if ((!attr->transfer && attr->egress) && priv->representor &&
+           !(item_flags & MLX5_FLOW_ITEM_TX_QUEUE))
+               return rte_flow_error_set(error, EINVAL,
+                                         RTE_FLOW_ERROR_TYPE_ITEM,
+                                         NULL,
+                                         "NIC egress rules on representors"
+                                         " is not supported");
        return 0;
 }
 
@@ -8621,6 +8839,58 @@ flow_dv_translate_item_tcp(void *matcher, void *key,
                 (tcp_v->hdr.tcp_flags & tcp_m->hdr.tcp_flags));
 }
 
+/**
+ * Translate an ESP item into the matcher mask and the matcher value.
+ *
+ * The IP protocol of the selected (inner or outer) header set is always
+ * pinned to ESP. The SPI is matched only when the item carries a spec; a
+ * missing mask falls back to rte_flow_item_esp_mask. The SPI is copied as
+ * stored in the item, without any byte swapping.
+ *
+ * @param[in, out] matcher
+ *   Flow matcher (mask side).
+ * @param[in, out] key
+ *   Flow matcher value.
+ * @param[in] item
+ *   Flow pattern to translate.
+ * @param[in] inner
+ *   Non-zero when the item is an inner pattern.
+ */
+static void
+flow_dv_translate_item_esp(void *matcher, void *key,
+                          const struct rte_flow_item *item,
+                          int inner)
+{
+       const struct rte_flow_item_esp *esp_v = item->spec;
+       const struct rte_flow_item_esp *esp_m = item->mask;
+       void *hdrs_m = inner ?
+               MLX5_ADDR_OF(fte_match_param, matcher, inner_headers) :
+               MLX5_ADDR_OF(fte_match_param, matcher, outer_headers);
+       void *hdrs_v = inner ?
+               MLX5_ADDR_OF(fte_match_param, key, inner_headers) :
+               MLX5_ADDR_OF(fte_match_param, key, outer_headers);
+       void *misc_m;
+       void *misc_v;
+       char *spi_mask;
+       char *spi_value;
+
+       /* The L4 protocol is matched exactly, with or without a spec. */
+       MLX5_SET(fte_match_set_lyr_2_4, hdrs_m, ip_protocol, 0xff);
+       MLX5_SET(fte_match_set_lyr_2_4, hdrs_v, ip_protocol, IPPROTO_ESP);
+       if (esp_v == NULL)
+               return;
+       if (esp_m == NULL)
+               esp_m = &rte_flow_item_esp_mask;
+       /* The SPI fields live in the misc parameters, not in the headers. */
+       misc_m = MLX5_ADDR_OF(fte_match_param, matcher, misc_parameters);
+       misc_v = MLX5_ADDR_OF(fte_match_param, key, misc_parameters);
+       if (inner) {
+               spi_mask = MLX5_ADDR_OF(fte_match_set_misc, misc_m,
+                                       inner_esp_spi);
+               spi_value = MLX5_ADDR_OF(fte_match_set_misc, misc_v,
+                                        inner_esp_spi);
+       } else {
+               spi_mask = MLX5_ADDR_OF(fte_match_set_misc, misc_m,
+                                       outer_esp_spi);
+               spi_value = MLX5_ADDR_OF(fte_match_set_misc, misc_v,
+                                        outer_esp_spi);
+       }
+       *(uint32_t *)spi_mask = esp_m->hdr.spi;
+       *(uint32_t *)spi_value = esp_m->hdr.spi & esp_v->hdr.spi;
+}
+
 /**
  * Add UDP item to matcher and to the value.
  *
@@ -8716,18 +8986,19 @@ flow_dv_translate_item_gre_key(void *matcher, void *key,
  *   Flow matcher value.
  * @param[in] item
  *   Flow pattern to translate.
- * @param[in] inner
- *   Item is inner pattern.
+ * @param[in] pattern_flags
+ *   Accumulated pattern flags.
  */
 static void
 flow_dv_translate_item_gre(void *matcher, void *key,
                           const struct rte_flow_item *item,
-                          int inner)
+                          uint64_t pattern_flags)
 {
+       static const struct rte_flow_item_gre empty_gre = {0,};
        const struct rte_flow_item_gre *gre_m = item->mask;
        const struct rte_flow_item_gre *gre_v = item->spec;
-       void *headers_m;
-       void *headers_v;
+       void *headers_m = MLX5_ADDR_OF(fte_match_param, matcher, outer_headers);
+       void *headers_v = MLX5_ADDR_OF(fte_match_param, key, outer_headers);
        void *misc_m = MLX5_ADDR_OF(fte_match_param, matcher, misc_parameters);
        void *misc_v = MLX5_ADDR_OF(fte_match_param, key, misc_parameters);
        struct {
@@ -8744,26 +9015,17 @@ flow_dv_translate_item_gre(void *matcher, void *key,
                        uint16_t value;
                };
        } gre_crks_rsvd0_ver_m, gre_crks_rsvd0_ver_v;
+       uint16_t protocol_m, protocol_v;
 
-       if (inner) {
-               headers_m = MLX5_ADDR_OF(fte_match_param, matcher,
-                                        inner_headers);
-               headers_v = MLX5_ADDR_OF(fte_match_param, key, inner_headers);
-       } else {
-               headers_m = MLX5_ADDR_OF(fte_match_param, matcher,
-                                        outer_headers);
-               headers_v = MLX5_ADDR_OF(fte_match_param, key, outer_headers);
-       }
        MLX5_SET(fte_match_set_lyr_2_4, headers_m, ip_protocol, 0xff);
        MLX5_SET(fte_match_set_lyr_2_4, headers_v, ip_protocol, IPPROTO_GRE);
-       if (!gre_v)
-               return;
-       if (!gre_m)
-               gre_m = &rte_flow_item_gre_mask;
-       MLX5_SET(fte_match_set_misc, misc_m, gre_protocol,
-                rte_be_to_cpu_16(gre_m->protocol));
-       MLX5_SET(fte_match_set_misc, misc_v, gre_protocol,
-                rte_be_to_cpu_16(gre_v->protocol & gre_m->protocol));
+       if (!gre_v) {
+               gre_v = &empty_gre;
+               gre_m = &empty_gre;
+       } else {
+               if (!gre_m)
+                       gre_m = &rte_flow_item_gre_mask;
+       }
        gre_crks_rsvd0_ver_m.value = rte_be_to_cpu_16(gre_m->c_rsvd0_ver);
        gre_crks_rsvd0_ver_v.value = rte_be_to_cpu_16(gre_v->c_rsvd0_ver);
        MLX5_SET(fte_match_set_misc, misc_m, gre_c_present,
@@ -8781,6 +9043,121 @@ flow_dv_translate_item_gre(void *matcher, void *key,
        MLX5_SET(fte_match_set_misc, misc_v, gre_s_present,
                 gre_crks_rsvd0_ver_v.s_present &
                 gre_crks_rsvd0_ver_m.s_present);
+       protocol_m = rte_be_to_cpu_16(gre_m->protocol);
+       protocol_v = rte_be_to_cpu_16(gre_v->protocol);
+       if (!protocol_m) {
+               /* Force next protocol to prevent matchers duplication */
+               protocol_v = mlx5_translate_tunnel_etypes(pattern_flags);
+               if (protocol_v)
+                       protocol_m = 0xFFFF;
+       }
+       MLX5_SET(fte_match_set_misc, misc_m, gre_protocol, protocol_m);
+       MLX5_SET(fte_match_set_misc, misc_v, gre_protocol,
+                protocol_m & protocol_v);
+}
+
+/**
+ * Add GRE optional items to matcher and to the value.
+ *
+ * When neither the checksum nor the sequence field is masked, translation
+ * is delegated to the regular GRE and GRE key translators. Otherwise the
+ * first GRE dword (flags/version + protocol) and the optional checksum, key
+ * and sequence fields are written to the misc5 tunnel header dwords.
+ *
+ * @param[in, out] matcher
+ *   Flow matcher.
+ * @param[in, out] key
+ *   Flow matcher value.
+ * @param[in] item
+ *   Flow pattern to translate. Its spec and mask are dereferenced without
+ *   a NULL check; presumably item validation guarantees both are set
+ *   (TODO confirm against the validation routine).
+ * @param[in] gre_item
+ *   Pointer to gre_item.
+ * @param[in] pattern_flags
+ *   Accumulated pattern flags.
+ */
+static void
+flow_dv_translate_item_gre_option(void *matcher, void *key,
+                                 const struct rte_flow_item *item,
+                                 const struct rte_flow_item *gre_item,
+                                 uint64_t pattern_flags)
+{
+       const struct rte_flow_item_gre_opt *option_m = item->mask;
+       const struct rte_flow_item_gre_opt *option_v = item->spec;
+       const struct rte_flow_item_gre *gre_m = gre_item->mask;
+       const struct rte_flow_item_gre *gre_v = gre_item->spec;
+       static const struct rte_flow_item_gre empty_gre = {0};
+       struct rte_flow_item gre_key_item;
+       uint16_t c_rsvd0_ver_m, c_rsvd0_ver_v;
+       uint16_t protocol_m, protocol_v;
+       uint32_t tnl_hdr0_m, tnl_hdr0_v;
+       void *misc5_m;
+       void *misc5_v;
+
+       /*
+        * If only the key field is matched, keep using misc for matching.
+        * If the checksum or the sequence must be matched, use misc5 only;
+        * misc is not needed in that case.
+        */
+       if (!(option_m->sequence.sequence ||
+             option_m->checksum_rsvd.checksum)) {
+               flow_dv_translate_item_gre(matcher, key, gre_item,
+                                          pattern_flags);
+               /*
+                * Only spec and mask are filled in; the remaining members
+                * stay uninitialized. Presumably the key translator reads
+                * nothing else (TODO confirm).
+                */
+               gre_key_item.spec = &option_v->key.key;
+               gre_key_item.mask = &option_m->key.key;
+               flow_dv_translate_item_gre_key(matcher, key, &gre_key_item);
+               return;
+       }
+       if (!gre_v) {
+               gre_v = &empty_gre;
+               gre_m = &empty_gre;
+       } else {
+               if (!gre_m)
+                       gre_m = &rte_flow_item_gre_mask;
+       }
+       /* From here on protocol and flags are kept in big-endian form. */
+       protocol_v = gre_v->protocol;
+       protocol_m = gre_m->protocol;
+       if (!protocol_m) {
+               /* Force next protocol to prevent matchers duplication */
+               uint16_t ether_type =
+                       mlx5_translate_tunnel_etypes(pattern_flags);
+               if (ether_type) {
+                       /*
+                        * NOTE(review): ether_type looks like a CPU-order
+                        * value being converted to big-endian; the 16-bit
+                        * swap is the same operation in both directions.
+                        */
+                       protocol_v = rte_be_to_cpu_16(ether_type);
+                       protocol_m = UINT16_MAX;
+               }
+       }
+       c_rsvd0_ver_v = gre_v->c_rsvd0_ver;
+       c_rsvd0_ver_m = gre_m->c_rsvd0_ver;
+       /* Require the "present" flag of every optional field being matched. */
+       if (option_m->sequence.sequence) {
+               /* S bit: sequence number present. */
+               c_rsvd0_ver_v |= RTE_BE16(0x1000);
+               c_rsvd0_ver_m |= RTE_BE16(0x1000);
+       }
+       if (option_m->key.key) {
+               /* K bit: key present. */
+               c_rsvd0_ver_v |= RTE_BE16(0x2000);
+               c_rsvd0_ver_m |= RTE_BE16(0x2000);
+       }
+       if (option_m->checksum_rsvd.checksum) {
+               /* C bit: checksum present. */
+               c_rsvd0_ver_v |= RTE_BE16(0x8000);
+               c_rsvd0_ver_m |= RTE_BE16(0x8000);
+       }
+       /*
+        * Widen to 32 bits before shifting: a uint16_t operand is promoted
+        * to signed int, and shifting a value with bit 15 set (for instance
+        * the UINT16_MAX mask) left by 16 does not fit in int, which is
+        * undefined behavior.
+        */
+       tnl_hdr0_m = (uint32_t)c_rsvd0_ver_m | ((uint32_t)protocol_m << 16);
+       tnl_hdr0_v = ((uint32_t)c_rsvd0_ver_v | ((uint32_t)protocol_v << 16)) &
+                    tnl_hdr0_m;
+       /*
+        * Hardware parses GRE optional field into the fixed location,
+        * do not need to adjust the tunnel dword indices.
+        */
+       misc5_v = MLX5_ADDR_OF(fte_match_param, key, misc_parameters_5);
+       misc5_m = MLX5_ADDR_OF(fte_match_param, matcher, misc_parameters_5);
+       MLX5_SET(fte_match_set_misc5, misc5_v, tunnel_header_0,
+                rte_be_to_cpu_32(tnl_hdr0_v));
+       MLX5_SET(fte_match_set_misc5, misc5_m, tunnel_header_0,
+                rte_be_to_cpu_32(tnl_hdr0_m));
+       MLX5_SET(fte_match_set_misc5, misc5_v, tunnel_header_1,
+                rte_be_to_cpu_32(option_v->checksum_rsvd.checksum &
+                                 option_m->checksum_rsvd.checksum));
+       MLX5_SET(fte_match_set_misc5, misc5_m, tunnel_header_1,
+                rte_be_to_cpu_32(option_m->checksum_rsvd.checksum));
+       MLX5_SET(fte_match_set_misc5, misc5_v, tunnel_header_2,
+                rte_be_to_cpu_32(option_v->key.key & option_m->key.key));
+       MLX5_SET(fte_match_set_misc5, misc5_m, tunnel_header_2,
+                rte_be_to_cpu_32(option_m->key.key));
+       MLX5_SET(fte_match_set_misc5, misc5_v, tunnel_header_3,
+                rte_be_to_cpu_32(option_v->sequence.sequence &
+                                 option_m->sequence.sequence));
+       MLX5_SET(fte_match_set_misc5, misc5_m, tunnel_header_3,
+                rte_be_to_cpu_32(option_m->sequence.sequence));
 }
 
 /**
@@ -8792,13 +9169,13 @@ flow_dv_translate_item_gre(void *matcher, void *key,
  *   Flow matcher value.
  * @param[in] item
  *   Flow pattern to translate.
- * @param[in] inner
- *   Item is inner pattern.
+ * @param[in] pattern_flags
+ *   Accumulated pattern flags.
  */
 static void
 flow_dv_translate_item_nvgre(void *matcher, void *key,
                             const struct rte_flow_item *item,
-                            int inner)
+                            unsigned long pattern_flags)
 {
        const struct rte_flow_item_nvgre *nvgre_m = item->mask;
        const struct rte_flow_item_nvgre *nvgre_v = item->spec;
@@ -8825,7 +9202,7 @@ flow_dv_translate_item_nvgre(void *matcher, void *key,
                .mask = &gre_mask,
                .last = NULL,
        };
-       flow_dv_translate_item_gre(matcher, key, &gre_item, inner);
+       flow_dv_translate_item_gre(matcher, key, &gre_item, pattern_flags);
        if (!nvgre_v)
                return;
        if (!nvgre_m)
@@ -8962,46 +9339,40 @@ flow_dv_translate_item_vxlan(struct rte_eth_dev *dev,
 
 static void
 flow_dv_translate_item_vxlan_gpe(void *matcher, void *key,
-                                const struct rte_flow_item *item, int inner)
+                                const struct rte_flow_item *item,
+                                const uint64_t pattern_flags)
 {
+       static const struct rte_flow_item_vxlan_gpe dummy_vxlan_gpe_hdr = {0, };
        const struct rte_flow_item_vxlan_gpe *vxlan_m = item->mask;
        const struct rte_flow_item_vxlan_gpe *vxlan_v = item->spec;
-       void *headers_m;
-       void *headers_v;
+       /* The item was validated to be on the outer side */
+       void *headers_m = MLX5_ADDR_OF(fte_match_param, matcher, outer_headers);
+       void *headers_v = MLX5_ADDR_OF(fte_match_param, key, outer_headers);
        void *misc_m =
                MLX5_ADDR_OF(fte_match_param, matcher, misc_parameters_3);
        void *misc_v =
                MLX5_ADDR_OF(fte_match_param, key, misc_parameters_3);
-       char *vni_m;
-       char *vni_v;
-       uint16_t dport;
-       int size;
-       int i;
+       char *vni_m =
+               MLX5_ADDR_OF(fte_match_set_misc3, misc_m, outer_vxlan_gpe_vni);
+       char *vni_v =
+               MLX5_ADDR_OF(fte_match_set_misc3, misc_v, outer_vxlan_gpe_vni);
+       int i, size = sizeof(vxlan_m->vni);
        uint8_t flags_m = 0xff;
        uint8_t flags_v = 0xc;
+       uint8_t m_protocol, v_protocol;
 
-       if (inner) {
-               headers_m = MLX5_ADDR_OF(fte_match_param, matcher,
-                                        inner_headers);
-               headers_v = MLX5_ADDR_OF(fte_match_param, key, inner_headers);
-       } else {
-               headers_m = MLX5_ADDR_OF(fte_match_param, matcher,
-                                        outer_headers);
-               headers_v = MLX5_ADDR_OF(fte_match_param, key, outer_headers);
-       }
-       dport = item->type == RTE_FLOW_ITEM_TYPE_VXLAN ?
-               MLX5_UDP_PORT_VXLAN : MLX5_UDP_PORT_VXLAN_GPE;
        if (!MLX5_GET16(fte_match_set_lyr_2_4, headers_v, udp_dport)) {
                MLX5_SET(fte_match_set_lyr_2_4, headers_m, udp_dport, 0xFFFF);
-               MLX5_SET(fte_match_set_lyr_2_4, headers_v, udp_dport, dport);
+               MLX5_SET(fte_match_set_lyr_2_4, headers_v, udp_dport,
+                        MLX5_UDP_PORT_VXLAN_GPE);
+       }
+       if (!vxlan_v) {
+               vxlan_v = &dummy_vxlan_gpe_hdr;
+               vxlan_m = &dummy_vxlan_gpe_hdr;
+       } else {
+               if (!vxlan_m)
+                       vxlan_m = &rte_flow_item_vxlan_gpe_mask;
        }
-       if (!vxlan_v)
-               return;
-       if (!vxlan_m)
-               vxlan_m = &rte_flow_item_vxlan_gpe_mask;
-       size = sizeof(vxlan_m->vni);
-       vni_m = MLX5_ADDR_OF(fte_match_set_misc3, misc_m, outer_vxlan_gpe_vni);
-       vni_v = MLX5_ADDR_OF(fte_match_set_misc3, misc_v, outer_vxlan_gpe_vni);
        memcpy(vni_m, vxlan_m->vni, size);
        for (i = 0; i < size; ++i)
                vni_v[i] = vni_m[i] & vxlan_v->vni[i];
@@ -9011,10 +9382,23 @@ flow_dv_translate_item_vxlan_gpe(void *matcher, void *key,
        }
        MLX5_SET(fte_match_set_misc3, misc_m, outer_vxlan_gpe_flags, flags_m);
        MLX5_SET(fte_match_set_misc3, misc_v, outer_vxlan_gpe_flags, flags_v);
-       MLX5_SET(fte_match_set_misc3, misc_m, outer_vxlan_gpe_next_protocol,
-                vxlan_m->protocol);
-       MLX5_SET(fte_match_set_misc3, misc_v, outer_vxlan_gpe_next_protocol,
-                vxlan_v->protocol);
+       m_protocol = vxlan_m->protocol;
+       v_protocol = vxlan_v->protocol;
+       if (!m_protocol) {
+               /* Force next protocol to ensure next headers parsing. */
+               if (pattern_flags & MLX5_FLOW_LAYER_INNER_L2)
+                       v_protocol = RTE_VXLAN_GPE_TYPE_ETH;
+               else if (pattern_flags & MLX5_FLOW_LAYER_INNER_L3_IPV4)
+                       v_protocol = RTE_VXLAN_GPE_TYPE_IPV4;
+               else if (pattern_flags & MLX5_FLOW_LAYER_INNER_L3_IPV6)
+                       v_protocol = RTE_VXLAN_GPE_TYPE_IPV6;
+               if (v_protocol)
+                       m_protocol = 0xFF;
+       }
+       MLX5_SET(fte_match_set_misc3, misc_m,
+                outer_vxlan_gpe_next_protocol, m_protocol);
+       MLX5_SET(fte_match_set_misc3, misc_v,
+                outer_vxlan_gpe_next_protocol, m_protocol & v_protocol);
 }
 
 /**
@@ -9032,49 +9416,39 @@ flow_dv_translate_item_vxlan_gpe(void *matcher, void *key,
 
 static void
 flow_dv_translate_item_geneve(void *matcher, void *key,
-                             const struct rte_flow_item *item, int inner)
+                             const struct rte_flow_item *item,
+                             uint64_t pattern_flags)
 {
+       static const struct rte_flow_item_geneve empty_geneve = {0,};
        const struct rte_flow_item_geneve *geneve_m = item->mask;
        const struct rte_flow_item_geneve *geneve_v = item->spec;
-       void *headers_m;
-       void *headers_v;
+       /* GENEVE flow item validation allows single tunnel item */
+       void *headers_m = MLX5_ADDR_OF(fte_match_param, matcher, outer_headers);
+       void *headers_v = MLX5_ADDR_OF(fte_match_param, key, outer_headers);
        void *misc_m = MLX5_ADDR_OF(fte_match_param, matcher, misc_parameters);
        void *misc_v = MLX5_ADDR_OF(fte_match_param, key, misc_parameters);
-       uint16_t dport;
        uint16_t gbhdr_m;
        uint16_t gbhdr_v;
-       char *vni_m;
-       char *vni_v;
-       size_t size, i;
+       char *vni_m = MLX5_ADDR_OF(fte_match_set_misc, misc_m, geneve_vni);
+       char *vni_v = MLX5_ADDR_OF(fte_match_set_misc, misc_v, geneve_vni);
+       size_t size = sizeof(geneve_m->vni), i;
+       uint16_t protocol_m, protocol_v;
 
-       if (inner) {
-               headers_m = MLX5_ADDR_OF(fte_match_param, matcher,
-                                        inner_headers);
-               headers_v = MLX5_ADDR_OF(fte_match_param, key, inner_headers);
-       } else {
-               headers_m = MLX5_ADDR_OF(fte_match_param, matcher,
-                                        outer_headers);
-               headers_v = MLX5_ADDR_OF(fte_match_param, key, outer_headers);
-       }
-       dport = MLX5_UDP_PORT_GENEVE;
        if (!MLX5_GET16(fte_match_set_lyr_2_4, headers_v, udp_dport)) {
                MLX5_SET(fte_match_set_lyr_2_4, headers_m, udp_dport, 0xFFFF);
-               MLX5_SET(fte_match_set_lyr_2_4, headers_v, udp_dport, dport);
+               MLX5_SET(fte_match_set_lyr_2_4, headers_v, udp_dport,
+                        MLX5_UDP_PORT_GENEVE);
+       }
+       if (!geneve_v) {
+               geneve_v = &empty_geneve;
+               geneve_m = &empty_geneve;
+       } else {
+               if (!geneve_m)
+                       geneve_m = &rte_flow_item_geneve_mask;
        }
-       if (!geneve_v)
-               return;
-       if (!geneve_m)
-               geneve_m = &rte_flow_item_geneve_mask;
-       size = sizeof(geneve_m->vni);
-       vni_m = MLX5_ADDR_OF(fte_match_set_misc, misc_m, geneve_vni);
-       vni_v = MLX5_ADDR_OF(fte_match_set_misc, misc_v, geneve_vni);
        memcpy(vni_m, geneve_m->vni, size);
        for (i = 0; i < size; ++i)
                vni_v[i] = vni_m[i] & geneve_v->vni[i];
-       MLX5_SET(fte_match_set_misc, misc_m, geneve_protocol_type,
-                rte_be_to_cpu_16(geneve_m->protocol));
-       MLX5_SET(fte_match_set_misc, misc_v, geneve_protocol_type,
-                rte_be_to_cpu_16(geneve_v->protocol & geneve_m->protocol));
        gbhdr_m = rte_be_to_cpu_16(geneve_m->ver_opt_len_o_c_rsvd0);
        gbhdr_v = rte_be_to_cpu_16(geneve_v->ver_opt_len_o_c_rsvd0);
        MLX5_SET(fte_match_set_misc, misc_m, geneve_oam,
@@ -9086,6 +9460,17 @@ flow_dv_translate_item_geneve(void *matcher, void *key,
        MLX5_SET(fte_match_set_misc, misc_v, geneve_opt_len,
                 MLX5_GENEVE_OPTLEN_VAL(gbhdr_v) &
                 MLX5_GENEVE_OPTLEN_VAL(gbhdr_m));
+       protocol_m = rte_be_to_cpu_16(geneve_m->protocol);
+       protocol_v = rte_be_to_cpu_16(geneve_v->protocol);
+       if (!protocol_m) {
+               /* Force next protocol to prevent matchers duplication */
+               protocol_v = mlx5_translate_tunnel_etypes(pattern_flags);
+               if (protocol_v)
+                       protocol_m = 0xFFFF;
+       }
+       MLX5_SET(fte_match_set_misc, misc_m, geneve_protocol_type, protocol_m);
+       MLX5_SET(fte_match_set_misc, misc_v, geneve_protocol_type,
+                protocol_m & protocol_v);
 }
 
 /**
@@ -9127,7 +9512,7 @@ flow_dev_geneve_tlv_option_resource_register(struct rte_eth_dev *dev,
                        geneve_opt_v->option_type &&
                        geneve_opt_resource->length ==
                        geneve_opt_v->option_len) {
-                       /* We already have GENVE TLV option obj allocated. */
+                       /* We already have GENEVE TLV option obj allocated. */
                        __atomic_fetch_add(&geneve_opt_resource->refcnt, 1,
                                           __ATOMIC_RELAXED);
                } else {
@@ -9282,16 +9667,22 @@ flow_dv_translate_item_mpls(void *matcher, void *key,
 
        switch (prev_layer) {
        case MLX5_FLOW_LAYER_OUTER_L4_UDP:
-               MLX5_SET(fte_match_set_lyr_2_4, headers_m, udp_dport, 0xffff);
-               MLX5_SET(fte_match_set_lyr_2_4, headers_v, udp_dport,
-                        MLX5_UDP_PORT_MPLS);
+               if (!MLX5_GET16(fte_match_set_lyr_2_4, headers_v, udp_dport)) {
+                       MLX5_SET(fte_match_set_lyr_2_4, headers_m, udp_dport,
+                                0xffff);
+                       MLX5_SET(fte_match_set_lyr_2_4, headers_v, udp_dport,
+                                MLX5_UDP_PORT_MPLS);
+               }
                break;
        case MLX5_FLOW_LAYER_GRE:
                /* Fall-through. */
        case MLX5_FLOW_LAYER_GRE_KEY:
-               MLX5_SET(fte_match_set_misc, misc_m, gre_protocol, 0xffff);
-               MLX5_SET(fte_match_set_misc, misc_v, gre_protocol,
-                        RTE_ETHER_TYPE_MPLS);
+               if (!MLX5_GET16(fte_match_set_misc, misc_v, gre_protocol)) {
+                       MLX5_SET(fte_match_set_misc, misc_m, gre_protocol,
+                                0xffff);
+                       MLX5_SET(fte_match_set_misc, misc_v, gre_protocol,
+                                RTE_ETHER_TYPE_MPLS);
+               }
                break;
        default:
                break;
@@ -9689,6 +10080,77 @@ flow_dv_translate_item_port_id(struct rte_eth_dev *dev, void *matcher,
        return 0;
 }
 
+/**
+ * Translate represented port item to eswitch match on port id.
+ *
+ * @param[in] dev
+ *   The device to configure through.
+ * @param[in, out] matcher
+ *   Flow matcher.
+ * @param[in, out] key
+ *   Flow matcher value.
+ * @param[in] item
+ *   Flow pattern to translate.
+ * @param[in] attr
+ *   Flow attributes.
+ *
+ * @return
+ *   0 on success, a negative errno value otherwise.
+ */
+static int
+flow_dv_translate_item_represented_port(struct rte_eth_dev *dev, void *matcher,
+                                       void *key,
+                                       const struct rte_flow_item *item,
+                                       const struct rte_flow_attr *attr)
+{
+       const struct rte_flow_item_ethdev *pid_m = item ? item->mask : NULL;
+       const struct rte_flow_item_ethdev *pid_v = item ? item->spec : NULL;
+       struct mlx5_priv *priv;
+       uint16_t mask, id;
+
+       if (!pid_m && !pid_v)
+               return 0;
+       if (pid_v && pid_v->port_id == UINT16_MAX) {
+               flow_dv_translate_item_source_vport(matcher, key,
+                       flow_dv_get_esw_manager_vport_id(dev), UINT16_MAX);
+               return 0;
+       }
+       mask = pid_m ? pid_m->port_id : UINT16_MAX;
+       id = pid_v ? pid_v->port_id : dev->data->port_id;
+       priv = mlx5_port_to_eswitch_info(id, item == NULL);
+       if (!priv)
+               return -rte_errno;
+       /*
+        * Translate to vport field or to metadata, depending on mode.
+        * Kernel can use either misc.source_port or half of C0 metadata
+        * register.
+        */
+       if (priv->vport_meta_mask) {
+               /*
+                * Provide the hint for SW steering library
+                * to insert the flow into ingress domain and
+                * save the extra vport match.
+                */
+               if (mask == UINT16_MAX && priv->vport_id == UINT16_MAX &&
+                   priv->pf_bond < 0 && attr->transfer)
+                       flow_dv_translate_item_source_vport
+                               (matcher, key, priv->vport_id, mask);
+               /*
+                * We should always set the vport metadata register,
+                * otherwise the SW steering library can drop
+                * the rule if wire vport metadata value is not zero,
+                * it depends on kernel configuration.
+                */
+               flow_dv_translate_item_meta_vport(matcher, key,
+                                                 priv->vport_meta_tag,
+                                                 priv->vport_meta_mask);
+       } else {
+               flow_dv_translate_item_source_vport(matcher, key,
+                                                   priv->vport_id, mask);
+       }
+       return 0;
+}
+
 /**
  * Add ICMP6 item to matcher and to the value.
  *
@@ -10107,7 +10569,7 @@ flow_dv_translate_item_flex(struct rte_eth_dev *dev, void *matcher, void *key,
                /* Don't count both inner and outer flex items in one rule. */
                if (mlx5_flex_acquire_index(dev, spec->handle, true) != index)
                        MLX5_ASSERT(false);
-               dev_flow->handle->flex_item |= RTE_BIT32(index);
+               dev_flow->handle->flex_item |= (uint8_t)RTE_BIT32(index);
        }
        mlx5_flex_flow_translate_item(dev, matcher, key, item, is_inner);
 }
@@ -10163,7 +10625,7 @@ __flow_dv_adjust_buf_size(size_t *size, uint8_t match_criteria)
         * Check flow matching criteria first, subtract misc5/4 length if flow
         * doesn't own misc5/4 parameters. In some old rdma-core releases,
         * misc5/4 are not supported, and matcher creation failure is expected
-        * w/o subtration. If misc5 is provided, misc4 must be counted in since
+        * w/o subtraction. If misc5 is provided, misc4 must be counted in since
         * misc5 is right after misc4.
         */
        if (!(match_criteria & (1 << MLX5_MATCH_CRITERIA_ENABLE_MISC5_BIT))) {
@@ -10451,7 +10913,8 @@ flow_dv_tbl_remove_cb(void *tool_ctx, struct mlx5_list_entry *entry)
                        tbl_data->tunnel->tunnel_id : 0,
                        tbl_data->group_id);
        }
-       mlx5_list_destroy(tbl_data->matchers);
+       if (tbl_data->matchers)
+               mlx5_list_destroy(tbl_data->matchers);
        mlx5_ipool_free(sh->ipool[MLX5_IPOOL_JUMP], tbl_data->idx);
 }
 
@@ -10706,7 +11169,8 @@ flow_dv_tag_resource_register
                                      flow_dv_tag_match_cb,
                                      flow_dv_tag_remove_cb,
                                      flow_dv_tag_clone_cb,
-                                     flow_dv_tag_clone_free_cb);
+                                     flow_dv_tag_clone_free_cb,
+                                     error);
        if (unlikely(!tag_table))
                return -rte_errno;
        entry = mlx5_hlist_register(tag_table, tag_be24, &ctx);
@@ -10887,10 +11351,8 @@ flow_dv_translate_item_tx_queue(struct rte_eth_dev *dev,
 {
        const struct mlx5_rte_flow_item_tx_queue *queue_m;
        const struct mlx5_rte_flow_item_tx_queue *queue_v;
-       void *misc_m =
-               MLX5_ADDR_OF(fte_match_param, matcher, misc_parameters);
-       void *misc_v =
-               MLX5_ADDR_OF(fte_match_param, key, misc_parameters);
+       void *misc_m = MLX5_ADDR_OF(fte_match_param, matcher, misc_parameters);
+       void *misc_v = MLX5_ADDR_OF(fte_match_param, key, misc_parameters);
        struct mlx5_txq_ctrl *txq;
        uint32_t queue, mask;
 
@@ -10901,7 +11363,7 @@ flow_dv_translate_item_tx_queue(struct rte_eth_dev *dev,
        txq = mlx5_txq_get(dev, queue_v->queue);
        if (!txq)
                return;
-       if (txq->type == MLX5_TXQ_TYPE_HAIRPIN)
+       if (txq->is_hairpin)
                queue = txq->obj->sq->id;
        else
                queue = txq->obj->sq_obj.sq->id;
@@ -10914,78 +11376,89 @@ flow_dv_translate_item_tx_queue(struct rte_eth_dev *dev,
 /**
  * Set the hash fields according to the @p flow information.
  *
- * @param[in] dev_flow
- *   Pointer to the mlx5_flow.
+ * @param[in] item_flags
+ *   The match pattern item flags.
  * @param[in] rss_desc
  *   Pointer to the mlx5_flow_rss_desc.
+ * @param[out] hash_fields
+ *   Pointer to the RSS hash fields.
  */
-static void
-flow_dv_hashfields_set(struct mlx5_flow *dev_flow,
-                      struct mlx5_flow_rss_desc *rss_desc)
+void
+flow_dv_hashfields_set(uint64_t item_flags,
+                      struct mlx5_flow_rss_desc *rss_desc,
+                      uint64_t *hash_fields)
 {
-       uint64_t items = dev_flow->handle->layers;
+       uint64_t items = item_flags;
+       uint64_t fields = 0;
        int rss_inner = 0;
        uint64_t rss_types = rte_eth_rss_hf_refine(rss_desc->types);
 
-       dev_flow->hash_fields = 0;
+       *hash_fields = 0;
 #ifdef HAVE_IBV_DEVICE_TUNNEL_SUPPORT
        if (rss_desc->level >= 2)
                rss_inner = 1;
 #endif
        if ((rss_inner && (items & MLX5_FLOW_LAYER_INNER_L3_IPV4)) ||
-           (!rss_inner && (items & MLX5_FLOW_LAYER_OUTER_L3_IPV4))) {
+           (!rss_inner && (items & MLX5_FLOW_LAYER_OUTER_L3_IPV4)) ||
+            !items) {
                if (rss_types & MLX5_IPV4_LAYER_TYPES) {
                        if (rss_types & RTE_ETH_RSS_L3_SRC_ONLY)
-                               dev_flow->hash_fields |= IBV_RX_HASH_SRC_IPV4;
+                               fields |= IBV_RX_HASH_SRC_IPV4;
                        else if (rss_types & RTE_ETH_RSS_L3_DST_ONLY)
-                               dev_flow->hash_fields |= IBV_RX_HASH_DST_IPV4;
+                               fields |= IBV_RX_HASH_DST_IPV4;
                        else
-                               dev_flow->hash_fields |= MLX5_IPV4_IBV_RX_HASH;
+                               fields |= MLX5_IPV4_IBV_RX_HASH;
                }
        } else if ((rss_inner && (items & MLX5_FLOW_LAYER_INNER_L3_IPV6)) ||
-                  (!rss_inner && (items & MLX5_FLOW_LAYER_OUTER_L3_IPV6))) {
+                  (!rss_inner && (items & MLX5_FLOW_LAYER_OUTER_L3_IPV6)) ||
+                  !items) {
                if (rss_types & MLX5_IPV6_LAYER_TYPES) {
                        if (rss_types & RTE_ETH_RSS_L3_SRC_ONLY)
-                               dev_flow->hash_fields |= IBV_RX_HASH_SRC_IPV6;
+                               fields |= IBV_RX_HASH_SRC_IPV6;
                        else if (rss_types & RTE_ETH_RSS_L3_DST_ONLY)
-                               dev_flow->hash_fields |= IBV_RX_HASH_DST_IPV6;
+                               fields |= IBV_RX_HASH_DST_IPV6;
                        else
-                               dev_flow->hash_fields |= MLX5_IPV6_IBV_RX_HASH;
+                               fields |= MLX5_IPV6_IBV_RX_HASH;
                }
        }
-       if (dev_flow->hash_fields == 0)
+       if (items & MLX5_FLOW_ITEM_ESP) {
+               if (rss_types & RTE_ETH_RSS_ESP)
+                       fields |= IBV_RX_HASH_IPSEC_SPI;
+       }
+       if ((fields & ~IBV_RX_HASH_IPSEC_SPI) == 0) {
+               *hash_fields = fields;
                /*
                 * There is no match between the RSS types and the
                 * L3 protocol (IPv4/IPv6) defined in the flow rule.
                 */
                return;
+       }
        if ((rss_inner && (items & MLX5_FLOW_LAYER_INNER_L4_UDP)) ||
-           (!rss_inner && (items & MLX5_FLOW_LAYER_OUTER_L4_UDP))) {
+           (!rss_inner && (items & MLX5_FLOW_LAYER_OUTER_L4_UDP)) ||
+           !items) {
                if (rss_types & RTE_ETH_RSS_UDP) {
                        if (rss_types & RTE_ETH_RSS_L4_SRC_ONLY)
-                               dev_flow->hash_fields |=
-                                               IBV_RX_HASH_SRC_PORT_UDP;
+                               fields |= IBV_RX_HASH_SRC_PORT_UDP;
                        else if (rss_types & RTE_ETH_RSS_L4_DST_ONLY)
-                               dev_flow->hash_fields |=
-                                               IBV_RX_HASH_DST_PORT_UDP;
+                               fields |= IBV_RX_HASH_DST_PORT_UDP;
                        else
-                               dev_flow->hash_fields |= MLX5_UDP_IBV_RX_HASH;
+                               fields |= MLX5_UDP_IBV_RX_HASH;
                }
        } else if ((rss_inner && (items & MLX5_FLOW_LAYER_INNER_L4_TCP)) ||
-                  (!rss_inner && (items & MLX5_FLOW_LAYER_OUTER_L4_TCP))) {
+                  (!rss_inner && (items & MLX5_FLOW_LAYER_OUTER_L4_TCP)) ||
+                  !items) {
                if (rss_types & RTE_ETH_RSS_TCP) {
                        if (rss_types & RTE_ETH_RSS_L4_SRC_ONLY)
-                               dev_flow->hash_fields |=
-                                               IBV_RX_HASH_SRC_PORT_TCP;
+                               fields |= IBV_RX_HASH_SRC_PORT_TCP;
                        else if (rss_types & RTE_ETH_RSS_L4_DST_ONLY)
-                               dev_flow->hash_fields |=
-                                               IBV_RX_HASH_DST_PORT_TCP;
+                               fields |= IBV_RX_HASH_DST_PORT_TCP;
                        else
-                               dev_flow->hash_fields |= MLX5_TCP_IBV_RX_HASH;
+                               fields |= MLX5_TCP_IBV_RX_HASH;
                }
        }
        if (rss_inner)
-               dev_flow->hash_fields |= IBV_RX_HASH_INNER;
+               fields |= IBV_RX_HASH_INNER;
+       *hash_fields = fields;
 }
 
 /**
@@ -11009,8 +11482,8 @@ flow_dv_hrxq_prepare(struct rte_eth_dev *dev,
                     struct mlx5_flow_rss_desc *rss_desc,
                     uint32_t *hrxq_idx)
 {
-       struct mlx5_priv *priv = dev->data->dev_private;
        struct mlx5_flow_handle *dh = dev_flow->handle;
+       uint32_t shared_rss = rss_desc->shared_rss;
        struct mlx5_hrxq *hrxq;
 
        MLX5_ASSERT(rss_desc->queue_num);
@@ -11020,11 +11493,9 @@ flow_dv_hrxq_prepare(struct rte_eth_dev *dev,
        rss_desc->shared_rss = 0;
        if (rss_desc->hash_fields == 0)
                rss_desc->queue_num = 1;
-       *hrxq_idx = mlx5_hrxq_get(dev, rss_desc);
-       if (!*hrxq_idx)
-               return NULL;
-       hrxq = mlx5_ipool_get(priv->sh->ipool[MLX5_IPOOL_HRXQ],
-                             *hrxq_idx);
+       hrxq = mlx5_hrxq_get(dev, rss_desc);
+       *hrxq_idx = hrxq ? hrxq->idx : 0;
+       rss_desc->shared_rss = shared_rss;
        return hrxq;
 }
 
@@ -11362,7 +11833,7 @@ flow_dv_dest_array_create_cb(void *tool_ctx __rte_unused, void *cb_ctx)
                        goto error;
                }
        }
-       /* create a dest array actioin */
+       /* create a dest array action */
        ret = mlx5_os_flow_dr_create_flow_action_dest_array
                                                (domain,
                                                 resource->num_of_dest,
@@ -11570,7 +12041,9 @@ flow_dv_translate_action_sample(struct rte_eth_dev *dev,
                         * rss->level and rss.types should be set in advance
                         * when expanding items for RSS.
                         */
-                       flow_dv_hashfields_set(dev_flow, rss_desc);
+                       flow_dv_hashfields_set(dev_flow->handle->layers,
+                                              rss_desc,
+                                              &dev_flow->hash_fields);
                        hrxq = flow_dv_hrxq_prepare(dev, dev_flow,
                                                    rss_desc, &hrxq_idx);
                        if (!hrxq)
@@ -11597,7 +12070,7 @@ flow_dv_translate_action_sample(struct rte_eth_dev *dev,
                                (((const struct rte_flow_action_mark *)
                                (sub_actions->conf))->id);
 
-                       dev_flow->handle->mark = 1;
+                       wks->mark = 1;
                        pre_rix = dev_flow->handle->dvh.rix_tag;
                        /* Save the mark resource before sample */
                        pre_r = dev_flow->dv.tag_resource;
@@ -12106,34 +12579,24 @@ flow_dv_translate_integrity_l4(const struct rte_flow_item_integrity *mask,
                               void *headers_m, void *headers_v)
 {
        if (mask->l4_ok) {
-               /* application l4_ok filter aggregates all hardware l4 filters
-                * therefore hw l4_checksum_ok must be implicitly added here.
+               /* RTE l4_ok filter aggregates hardware l4_ok and
+                * l4_checksum_ok filters.
+                * Positive RTE l4_ok match requires hardware match on both L4
+                * hardware integrity bits.
+                * For negative match, check hardware l4_checksum_ok bit only,
+                * because hardware sets that bit to 0 for all packets
+                * with bad L4.
                 */
-               struct rte_flow_item_integrity local_item;
-
-               local_item.l4_csum_ok = 1;
-               MLX5_SET(fte_match_set_lyr_2_4, headers_m, l4_checksum_ok,
-                        local_item.l4_csum_ok);
                if (value->l4_ok) {
-                       /* application l4_ok = 1 matches sets both hw flags
-                        * l4_ok and l4_checksum_ok flags to 1.
-                        */
-                       MLX5_SET(fte_match_set_lyr_2_4, headers_v,
-                                l4_checksum_ok, local_item.l4_csum_ok);
-                       MLX5_SET(fte_match_set_lyr_2_4, headers_m, l4_ok,
-                                mask->l4_ok);
-                       MLX5_SET(fte_match_set_lyr_2_4, headers_v, l4_ok,
-                                value->l4_ok);
-               } else {
-                       /* application l4_ok = 0 matches on hw flag
-                        * l4_checksum_ok = 0 only.
-                        */
-                       MLX5_SET(fte_match_set_lyr_2_4, headers_v,
-                                l4_checksum_ok, 0);
+                       MLX5_SET(fte_match_set_lyr_2_4, headers_m, l4_ok, 1);
+                       MLX5_SET(fte_match_set_lyr_2_4, headers_v, l4_ok, 1);
                }
-       } else if (mask->l4_csum_ok) {
-               MLX5_SET(fte_match_set_lyr_2_4, headers_m, l4_checksum_ok,
-                        mask->l4_csum_ok);
+               MLX5_SET(fte_match_set_lyr_2_4, headers_m, l4_checksum_ok, 1);
+               MLX5_SET(fte_match_set_lyr_2_4, headers_v, l4_checksum_ok,
+                        !!value->l4_ok);
+       }
+       if (mask->l4_csum_ok) {
+               MLX5_SET(fte_match_set_lyr_2_4, headers_m, l4_checksum_ok, 1);
                MLX5_SET(fte_match_set_lyr_2_4, headers_v, l4_checksum_ok,
                         value->l4_csum_ok);
        }
@@ -12145,28 +12608,33 @@ flow_dv_translate_integrity_l3(const struct rte_flow_item_integrity *mask,
                               void *headers_m, void *headers_v, bool is_ipv4)
 {
        if (mask->l3_ok) {
-               /* application l3_ok filter aggregates all hardware l3 filters
-                * therefore hw ipv4_checksum_ok must be implicitly added here.
+               /* RTE l3_ok filter aggregates for IPv4 hardware l3_ok and
+                * ipv4_checksum_ok filters.
+                * Positive RTE l3_ok match requires hardware match on both L3
+                * hardware integrity bits.
+                * For negative match, check hardware ipv4_checksum_ok bit
+                * only, because hardware sets that bit to 0 for all packets
+                * with bad L3.
                 */
-               struct rte_flow_item_integrity local_item;
-
-               local_item.ipv4_csum_ok = !!is_ipv4;
-               MLX5_SET(fte_match_set_lyr_2_4, headers_m, ipv4_checksum_ok,
-                        local_item.ipv4_csum_ok);
-               if (value->l3_ok) {
+               if (is_ipv4) {
+                       if (value->l3_ok) {
+                               MLX5_SET(fte_match_set_lyr_2_4, headers_m,
+                                        l3_ok, 1);
+                               MLX5_SET(fte_match_set_lyr_2_4, headers_v,
+                                        l3_ok, 1);
+                       }
+                       MLX5_SET(fte_match_set_lyr_2_4, headers_m,
+                                ipv4_checksum_ok, 1);
                        MLX5_SET(fte_match_set_lyr_2_4, headers_v,
-                                ipv4_checksum_ok, local_item.ipv4_csum_ok);
-                       MLX5_SET(fte_match_set_lyr_2_4, headers_m, l3_ok,
-                                mask->l3_ok);
+                                ipv4_checksum_ok, !!value->l3_ok);
+               } else {
+                       MLX5_SET(fte_match_set_lyr_2_4, headers_m, l3_ok, 1);
                        MLX5_SET(fte_match_set_lyr_2_4, headers_v, l3_ok,
                                 value->l3_ok);
-               } else {
-                       MLX5_SET(fte_match_set_lyr_2_4, headers_v,
-                                ipv4_checksum_ok, 0);
                }
-       } else if (mask->ipv4_csum_ok) {
-               MLX5_SET(fte_match_set_lyr_2_4, headers_m, ipv4_checksum_ok,
-                        mask->ipv4_csum_ok);
+       }
+       if (mask->ipv4_csum_ok) {
+               MLX5_SET(fte_match_set_lyr_2_4, headers_m, ipv4_checksum_ok, 1);
                MLX5_SET(fte_match_set_lyr_2_4, headers_v, ipv4_checksum_ok,
                         value->ipv4_csum_ok);
        }
@@ -12467,7 +12935,7 @@ flow_dv_aso_ct_alloc(struct rte_eth_dev *dev, struct rte_flow_error *error)
        uint32_t ct_idx;
 
        MLX5_ASSERT(mng);
-       if (!priv->sh->devx) {
+       if (!priv->sh->cdev->config.devx) {
                rte_errno = ENOTSUP;
                return 0;
        }
@@ -12596,7 +13064,7 @@ flow_dv_translate(struct rte_eth_dev *dev,
                  struct rte_flow_error *error)
 {
        struct mlx5_priv *priv = dev->data->dev_private;
-       struct mlx5_dev_config *dev_conf = &priv->config;
+       struct mlx5_sh_config *dev_conf = &priv->sh->config;
        struct rte_flow *flow = dev_flow->flow;
        struct mlx5_flow_handle *handle = dev_flow->handle;
        struct mlx5_flow_workspace *wks = mlx5_flow_get_thread_workspace();
@@ -12649,6 +13117,8 @@ flow_dv_translate(struct rte_eth_dev *dev,
                .std_tbl_fix = true,
        };
        const struct rte_flow_item *integrity_items[2] = {NULL, NULL};
+       const struct rte_flow_item *tunnel_item = NULL;
+       const struct rte_flow_item *gre_item = NULL;
 
        if (!wks)
                return rte_flow_error_set(error, ENOMEM,
@@ -12761,7 +13231,7 @@ flow_dv_translate(struct rte_eth_dev *dev,
                        break;
                case RTE_FLOW_ACTION_TYPE_FLAG:
                        action_flags |= MLX5_FLOW_ACTION_FLAG;
-                       dev_flow->handle->mark = 1;
+                       wks->mark = 1;
                        if (dev_conf->dv_xmeta_en != MLX5_XMETA_MODE_LEGACY) {
                                struct rte_flow_action_mark mark = {
                                        .id = MLX5_FLOW_MARK_DEFAULT,
@@ -12790,7 +13260,7 @@ flow_dv_translate(struct rte_eth_dev *dev,
                        break;
                case RTE_FLOW_ACTION_TYPE_MARK:
                        action_flags |= MLX5_FLOW_ACTION_MARK;
-                       dev_flow->handle->mark = 1;
+                       wks->mark = 1;
                        if (dev_conf->dv_xmeta_en != MLX5_XMETA_MODE_LEGACY) {
                                const struct rte_flow_action_mark *mark =
                                        (const struct rte_flow_action_mark *)
@@ -12904,7 +13374,7 @@ flow_dv_translate(struct rte_eth_dev *dev,
                        }
                        break;
                case RTE_FLOW_ACTION_TYPE_COUNT:
-                       if (!priv->sh->devx) {
+                       if (!priv->sh->cdev->config.devx) {
                                return rte_flow_error_set
                                              (error, ENOTSUP,
                                               RTE_FLOW_ERROR_TYPE_UNSPECIFIED,
@@ -13169,7 +13639,7 @@ flow_dv_translate(struct rte_eth_dev *dev,
                                        NULL, "Failed to get meter in flow.");
                        /* Set the meter action. */
                        dev_flow->dv.actions[actions_n++] =
-                               wks->fm->meter_action;
+                               wks->fm->meter_action_g;
                        action_flags |= MLX5_FLOW_ACTION_METER;
                        break;
                case RTE_FLOW_ACTION_TYPE_SET_IPV4_DSCP:
@@ -13247,8 +13717,7 @@ flow_dv_translate(struct rte_eth_dev *dev,
                         */
                        if (action_flags & MLX5_FLOW_ACTION_AGE) {
                                if ((non_shared_age && count) ||
-                                   !(priv->sh->flow_hit_aso_en &&
-                                     (attr->group || attr->transfer))) {
+                                   !flow_hit_aso_supported(priv->sh, attr)) {
                                        /* Creates age by counters. */
                                        cnt_act = flow_dv_prepare_counter
                                                                (dev, dev_flow,
@@ -13308,11 +13777,21 @@ flow_dv_translate(struct rte_eth_dev *dev,
                                                  RTE_FLOW_ERROR_TYPE_ITEM,
                                                  NULL, "item not supported");
                switch (item_type) {
+               case RTE_FLOW_ITEM_TYPE_ESP:
+                       flow_dv_translate_item_esp(match_mask, match_value,
+                                                  items, tunnel);
+                       last_item = MLX5_FLOW_ITEM_ESP;
+                       break;
                case RTE_FLOW_ITEM_TYPE_PORT_ID:
                        flow_dv_translate_item_port_id
                                (dev, match_mask, match_value, items, attr);
                        last_item = MLX5_FLOW_ITEM_PORT_ID;
                        break;
+               case RTE_FLOW_ITEM_TYPE_REPRESENTED_PORT:
+                       flow_dv_translate_item_represented_port
+                               (dev, match_mask, match_value, items, attr);
+                       last_item = MLX5_FLOW_ITEM_REPRESENTED_PORT;
+                       break;
                case RTE_FLOW_ITEM_TYPE_ETH:
                        flow_dv_translate_item_eth(match_mask, match_value,
                                                   items, tunnel,
@@ -13418,21 +13897,25 @@ flow_dv_translate(struct rte_eth_dev *dev,
                                             MLX5_FLOW_LAYER_OUTER_L4_UDP;
                        break;
                case RTE_FLOW_ITEM_TYPE_GRE:
-                       flow_dv_translate_item_gre(match_mask, match_value,
-                                                  items, tunnel);
                        matcher.priority = MLX5_TUNNEL_PRIO_GET(rss_desc);
                        last_item = MLX5_FLOW_LAYER_GRE;
+                       tunnel_item = items;
+                       gre_item = items;
                        break;
                case RTE_FLOW_ITEM_TYPE_GRE_KEY:
                        flow_dv_translate_item_gre_key(match_mask,
                                                       match_value, items);
                        last_item = MLX5_FLOW_LAYER_GRE_KEY;
                        break;
+               case RTE_FLOW_ITEM_TYPE_GRE_OPTION:
+                       matcher.priority = MLX5_TUNNEL_PRIO_GET(rss_desc);
+                       last_item = MLX5_FLOW_LAYER_GRE;
+                       tunnel_item = items;
+                       break;
                case RTE_FLOW_ITEM_TYPE_NVGRE:
-                       flow_dv_translate_item_nvgre(match_mask, match_value,
-                                                    items, tunnel);
                        matcher.priority = MLX5_TUNNEL_PRIO_GET(rss_desc);
                        last_item = MLX5_FLOW_LAYER_GRE;
+                       tunnel_item = items;
                        break;
                case RTE_FLOW_ITEM_TYPE_VXLAN:
                        flow_dv_translate_item_vxlan(dev, attr,
@@ -13442,17 +13925,14 @@ flow_dv_translate(struct rte_eth_dev *dev,
                        last_item = MLX5_FLOW_LAYER_VXLAN;
                        break;
                case RTE_FLOW_ITEM_TYPE_VXLAN_GPE:
-                       flow_dv_translate_item_vxlan_gpe(match_mask,
-                                                        match_value, items,
-                                                        tunnel);
                        matcher.priority = MLX5_TUNNEL_PRIO_GET(rss_desc);
                        last_item = MLX5_FLOW_LAYER_VXLAN_GPE;
+                       tunnel_item = items;
                        break;
                case RTE_FLOW_ITEM_TYPE_GENEVE:
-                       flow_dv_translate_item_geneve(match_mask, match_value,
-                                                     items, tunnel);
                        matcher.priority = MLX5_TUNNEL_PRIO_GET(rss_desc);
                        last_item = MLX5_FLOW_LAYER_GENEVE;
+                       tunnel_item = items;
                        break;
                case RTE_FLOW_ITEM_TYPE_GENEVE_OPT:
                        ret = flow_dv_translate_item_geneve_opt(dev, match_mask,
@@ -13484,11 +13964,13 @@ flow_dv_translate(struct rte_eth_dev *dev,
                case RTE_FLOW_ITEM_TYPE_ICMP:
                        flow_dv_translate_item_icmp(match_mask, match_value,
                                                    items, tunnel);
+                       matcher.priority = MLX5_PRIORITY_MAP_L4;
                        last_item = MLX5_FLOW_LAYER_ICMP;
                        break;
                case RTE_FLOW_ITEM_TYPE_ICMP6:
                        flow_dv_translate_item_icmp6(match_mask, match_value,
                                                      items, tunnel);
+                       matcher.priority = MLX5_PRIORITY_MAP_L4;
                        last_item = MLX5_FLOW_LAYER_ICMP6;
                        break;
                case RTE_FLOW_ITEM_TYPE_TAG:
@@ -13563,12 +14045,14 @@ flow_dv_translate(struct rte_eth_dev *dev,
        /*
         * When E-Switch mode is enabled, we have two cases where we need to
         * set the source port manually.
-        * The first one, is in case of Nic steering rule, and the second is
-        * E-Switch rule where no port_id item was found. In both cases
-        * the source port is set according the current port in use.
+        * The first is the case of a NIC ingress steering rule, and the
+        * second is an E-Switch rule where no port_id item was found.
+        * In both cases the source port is set according to the current
+        * port in use.
         */
        if (!(item_flags & MLX5_FLOW_ITEM_PORT_ID) &&
-           (priv->representor || priv->master)) {
+           !(item_flags & MLX5_FLOW_ITEM_REPRESENTED_PORT) && priv->sh->esw_mode &&
+           !(attr->egress && !attr->transfer)) {
                if (flow_dv_translate_item_port_id(dev, match_mask,
                                                   match_value, NULL, attr))
                        return -rte_errno;
@@ -13578,6 +14062,25 @@ flow_dv_translate(struct rte_eth_dev *dev,
                                                      integrity_items,
                                                      item_flags);
        }
+       if (item_flags & MLX5_FLOW_LAYER_VXLAN_GPE)
+               flow_dv_translate_item_vxlan_gpe(match_mask, match_value,
+                                                tunnel_item, item_flags);
+       else if (item_flags & MLX5_FLOW_LAYER_GENEVE)
+               flow_dv_translate_item_geneve(match_mask, match_value,
+                                             tunnel_item, item_flags);
+       else if (item_flags & MLX5_FLOW_LAYER_GRE) {
+               if (tunnel_item->type == RTE_FLOW_ITEM_TYPE_GRE)
+                       flow_dv_translate_item_gre(match_mask, match_value,
+                                                  tunnel_item, item_flags);
+               else if (tunnel_item->type == RTE_FLOW_ITEM_TYPE_NVGRE)
+                       flow_dv_translate_item_nvgre(match_mask, match_value,
+                                                    tunnel_item, item_flags);
+               else if (tunnel_item->type == RTE_FLOW_ITEM_TYPE_GRE_OPTION)
+                       flow_dv_translate_item_gre_option(match_mask, match_value,
+                                       tunnel_item, gre_item, item_flags);
+               else
+                       MLX5_ASSERT(false);
+       }
 #ifdef RTE_LIBRTE_MLX5_DEBUG
        MLX5_ASSERT(!flow_dv_check_valid_spec(matcher.mask.buf,
                                              dev_flow->dv.value.buf));
@@ -13588,7 +14091,9 @@ flow_dv_translate(struct rte_eth_dev *dev,
         */
        handle->layers |= item_flags;
        if (action_flags & MLX5_FLOW_ACTION_RSS)
-               flow_dv_hashfields_set(dev_flow, rss_desc);
+               flow_dv_hashfields_set(dev_flow->handle->layers,
+                                      rss_desc,
+                                      &dev_flow->hash_fields);
        /* If has RSS action in the sample action, the Sample/Mirror resource
         * should be registered after the hash filed be update.
         */
@@ -13752,6 +14257,15 @@ __flow_dv_action_rss_hrxq_set(struct mlx5_shared_action_rss *action,
        case MLX5_RSS_HASH_NONE:
                hrxqs[6] = hrxq_idx;
                return 0;
+       case MLX5_RSS_HASH_IPV4_ESP:
+               hrxqs[7] = hrxq_idx;
+               return 0;
+       case MLX5_RSS_HASH_IPV6_ESP:
+               hrxqs[8] = hrxq_idx;
+               return 0;
+       case MLX5_RSS_HASH_ESP_SPI:
+               hrxqs[9] = hrxq_idx;
+               return 0;
        default:
                return -1;
        }
@@ -13773,9 +14287,9 @@ __flow_dv_action_rss_hrxq_set(struct mlx5_shared_action_rss *action,
  * @return
  *   Valid hash RX queue index, otherwise 0.
  */
-static uint32_t
-__flow_dv_action_rss_hrxq_lookup(struct rte_eth_dev *dev, uint32_t idx,
-                                const uint64_t hash_fields)
+uint32_t
+flow_dv_action_rss_hrxq_lookup(struct rte_eth_dev *dev, uint32_t idx,
+                              const uint64_t hash_fields)
 {
        struct mlx5_priv *priv = dev->data->dev_private;
        struct mlx5_shared_action_rss *shared_rss =
@@ -13821,6 +14335,12 @@ __flow_dv_action_rss_hrxq_lookup(struct rte_eth_dev *dev, uint32_t idx,
                return hrxqs[5];
        case MLX5_RSS_HASH_NONE:
                return hrxqs[6];
+       case MLX5_RSS_HASH_IPV4_ESP:
+               return hrxqs[7];
+       case MLX5_RSS_HASH_IPV6_ESP:
+               return hrxqs[8];
+       case MLX5_RSS_HASH_ESP_SPI:
+               return hrxqs[9];
        default:
                return 0;
        }
@@ -13903,7 +14423,7 @@ flow_dv_apply(struct rte_eth_dev *dev, struct rte_flow *flow,
                        struct mlx5_hrxq *hrxq = NULL;
                        uint32_t hrxq_idx;
 
-                       hrxq_idx = __flow_dv_action_rss_hrxq_lookup(dev,
+                       hrxq_idx = flow_dv_action_rss_hrxq_lookup(dev,
                                                rss_desc->shared_rss,
                                                dev_flow->hash_fields);
                        if (hrxq_idx)
@@ -13939,7 +14459,7 @@ flow_dv_apply(struct rte_eth_dev *dev, struct rte_flow *flow,
                                (error, errno,
                                RTE_FLOW_ERROR_TYPE_UNSPECIFIED,
                                NULL,
-                               (!priv->config.allow_duplicate_pattern &&
+                               (!priv->sh->config.allow_duplicate_pattern &&
                                errno == EEXIST) ?
                                "duplicating pattern is not allowed" :
                                "hardware refuses to create flow");
@@ -14438,7 +14958,7 @@ flow_dv_destroy(struct rte_eth_dev *dev, struct rte_flow *flow)
                        int index = rte_bsf32(dev_handle->flex_item);
 
                        mlx5_flex_release_index(dev, index);
-                       dev_handle->flex_item &= ~RTE_BIT32(index);
+                       dev_handle->flex_item &= ~(uint8_t)RTE_BIT32(index);
                }
                if (dev_handle->dvh.matcher)
                        flow_dv_matcher_release(dev, dev_handle);
@@ -14537,19 +15057,19 @@ __flow_dv_action_rss_hrxqs_release(struct rte_eth_dev *dev,
  * MLX5_RSS_HASH_IPV4_DST_ONLY are mutually exclusive so they can share
  * same slot in mlx5_rss_hash_fields.
  *
- * @param[in] rss
- *   Pointer to the shared action RSS conf.
+ * @param[in] orig_rss_types
+ *   RSS type as provided in shared RSS action.
  * @param[in, out] hash_field
  *   hash_field variable needed to be adjusted.
  *
  * @return
  *   void
  */
-static void
-__flow_dv_action_rss_l34_hash_adjust(struct mlx5_shared_action_rss *rss,
-                                    uint64_t *hash_field)
+void
+flow_dv_action_rss_l34_hash_adjust(uint64_t orig_rss_types,
+                                  uint64_t *hash_field)
 {
-       uint64_t rss_types = rss->origin.types;
+       uint64_t rss_types = rte_eth_rss_hf_refine(orig_rss_types);
 
        switch (*hash_field & ~IBV_RX_HASH_INNER) {
        case MLX5_RSS_HASH_IPV4:
@@ -14629,15 +15149,20 @@ __flow_dv_action_rss_setup(struct rte_eth_dev *dev,
                           struct mlx5_shared_action_rss *shared_rss,
                           struct rte_flow_error *error)
 {
+       struct mlx5_priv *priv = dev->data->dev_private;
        struct mlx5_flow_rss_desc rss_desc = { 0 };
        size_t i;
        int err;
 
-       if (mlx5_ind_table_obj_setup(dev, shared_rss->ind_tbl)) {
+       shared_rss->ind_tbl = mlx5_ind_table_obj_new
+                             (dev, shared_rss->origin.queue,
+                              shared_rss->origin.queue_num,
+                              true,
+                              !!dev->data->dev_started);
+       if (!shared_rss->ind_tbl)
                return rte_flow_error_set(error, rte_errno,
                                          RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
                                          "cannot setup indirection table");
-       }
        memcpy(rss_desc.key, shared_rss->origin.key, MLX5_RSS_HASH_KEY_LEN);
        rss_desc.key_len = MLX5_RSS_HASH_KEY_LEN;
        rss_desc.const_q = shared_rss->origin.queue;
@@ -14645,20 +15170,23 @@ __flow_dv_action_rss_setup(struct rte_eth_dev *dev,
        /* Set non-zero value to indicate a shared RSS. */
        rss_desc.shared_rss = action_idx;
        rss_desc.ind_tbl = shared_rss->ind_tbl;
+       if (priv->sh->config.dv_flow_en == 2)
+               rss_desc.hws_flags = MLX5DR_ACTION_FLAG_HWS_RX;
        for (i = 0; i < MLX5_RSS_HASH_FIELDS_LEN; i++) {
-               uint32_t hrxq_idx;
+               struct mlx5_hrxq *hrxq;
                uint64_t hash_fields = mlx5_rss_hash_fields[i];
                int tunnel = 0;
 
-               __flow_dv_action_rss_l34_hash_adjust(shared_rss, &hash_fields);
+               flow_dv_action_rss_l34_hash_adjust(shared_rss->origin.types,
+                                                  &hash_fields);
                if (shared_rss->origin.level > 1) {
                        hash_fields |= IBV_RX_HASH_INNER;
                        tunnel = 1;
                }
                rss_desc.tunnel = tunnel;
                rss_desc.hash_fields = hash_fields;
-               hrxq_idx = mlx5_hrxq_get(dev, &rss_desc);
-               if (!hrxq_idx) {
+               hrxq = mlx5_hrxq_get(dev, &rss_desc);
+               if (!hrxq) {
                        rte_flow_error_set
                                (error, rte_errno,
                                 RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
@@ -14666,7 +15194,7 @@ __flow_dv_action_rss_setup(struct rte_eth_dev *dev,
                        goto error_hrxq_new;
                }
                err = __flow_dv_action_rss_hrxq_set
-                       (shared_rss, hash_fields, hrxq_idx);
+                       (shared_rss, hash_fields, hrxq->idx);
                MLX5_ASSERT(!err);
        }
        return 0;
@@ -14704,18 +15232,14 @@ __flow_dv_action_rss_create(struct rte_eth_dev *dev,
 {
        struct mlx5_priv *priv = dev->data->dev_private;
        struct mlx5_shared_action_rss *shared_rss = NULL;
-       void *queue = NULL;
        struct rte_flow_action_rss *origin;
        const uint8_t *rss_key;
-       uint32_t queue_size = rss->queue_num * sizeof(uint16_t);
        uint32_t idx;
 
        RTE_SET_USED(conf);
-       queue = mlx5_malloc(0, RTE_ALIGN_CEIL(queue_size, sizeof(void *)),
-                           0, SOCKET_ID_ANY);
        shared_rss = mlx5_ipool_zmalloc
                         (priv->sh->ipool[MLX5_IPOOL_RSS_SHARED_ACTIONS], &idx);
-       if (!shared_rss || !queue) {
+       if (!shared_rss) {
                rte_flow_error_set(error, ENOMEM,
                                   RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
                                   "cannot allocate resource memory");
@@ -14727,18 +15251,6 @@ __flow_dv_action_rss_create(struct rte_eth_dev *dev,
                                   "rss action number out of range");
                goto error_rss_init;
        }
-       shared_rss->ind_tbl = mlx5_malloc(MLX5_MEM_ZERO,
-                                         sizeof(*shared_rss->ind_tbl),
-                                         0, SOCKET_ID_ANY);
-       if (!shared_rss->ind_tbl) {
-               rte_flow_error_set(error, ENOMEM,
-                                  RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
-                                  "cannot allocate resource memory");
-               goto error_rss_init;
-       }
-       memcpy(queue, rss->queue, queue_size);
-       shared_rss->ind_tbl->queues = queue;
-       shared_rss->ind_tbl->queues_n = rss->queue_num;
        origin = &shared_rss->origin;
        origin->func = rss->func;
        origin->level = rss->level;
@@ -14749,10 +15261,12 @@ __flow_dv_action_rss_create(struct rte_eth_dev *dev,
        memcpy(shared_rss->key, rss_key, MLX5_RSS_HASH_KEY_LEN);
        origin->key = &shared_rss->key[0];
        origin->key_len = MLX5_RSS_HASH_KEY_LEN;
-       origin->queue = queue;
+       origin->queue = rss->queue;
        origin->queue_num = rss->queue_num;
        if (__flow_dv_action_rss_setup(dev, idx, shared_rss, error))
                goto error_rss_init;
+       /* Update queue with indirect table queue memory. */
+       origin->queue = shared_rss->ind_tbl->queues;
        rte_spinlock_init(&shared_rss->action_rss_sl);
        __atomic_add_fetch(&shared_rss->refcnt, 1, __ATOMIC_RELAXED);
        rte_spinlock_lock(&priv->shared_act_sl);
@@ -14763,12 +15277,11 @@ __flow_dv_action_rss_create(struct rte_eth_dev *dev,
 error_rss_init:
        if (shared_rss) {
                if (shared_rss->ind_tbl)
-                       mlx5_free(shared_rss->ind_tbl);
+                       mlx5_ind_table_obj_release(dev, shared_rss->ind_tbl,
+                                                  !!dev->data->dev_started);
                mlx5_ipool_free(priv->sh->ipool[MLX5_IPOOL_RSS_SHARED_ACTIONS],
                                idx);
        }
-       if (queue)
-               mlx5_free(queue);
        return 0;
 }
 
@@ -14796,7 +15309,6 @@ __flow_dv_action_rss_release(struct rte_eth_dev *dev, uint32_t idx,
            mlx5_ipool_get(priv->sh->ipool[MLX5_IPOOL_RSS_SHARED_ACTIONS], idx);
        uint32_t old_refcnt = 1;
        int remaining;
-       uint16_t *queue = NULL;
 
        if (!shared_rss)
                return rte_flow_error_set(error, EINVAL,
@@ -14815,15 +15327,14 @@ __flow_dv_action_rss_release(struct rte_eth_dev *dev, uint32_t idx,
                                          RTE_FLOW_ERROR_TYPE_ACTION,
                                          NULL,
                                          "shared rss hrxq has references");
-       queue = shared_rss->ind_tbl->queues;
-       remaining = mlx5_ind_table_obj_release(dev, shared_rss->ind_tbl, true);
+       remaining = mlx5_ind_table_obj_release(dev, shared_rss->ind_tbl,
+                                              !!dev->data->dev_started);
        if (remaining)
                return rte_flow_error_set(error, EBUSY,
                                          RTE_FLOW_ERROR_TYPE_ACTION,
                                          NULL,
                                          "shared rss indirection table has"
                                          " references");
-       mlx5_free(queue);
        rte_spinlock_lock(&priv->shared_act_sl);
        ILIST_REMOVE(priv->sh->ipool[MLX5_IPOOL_RSS_SHARED_ACTIONS],
                     &priv->rss_shared_actions, idx, shared_rss, next);
@@ -14852,7 +15363,7 @@ __flow_dv_action_rss_release(struct rte_eth_dev *dev, uint32_t idx,
  *   A valid shared action handle in case of success, NULL otherwise and
  *   rte_errno is set.
  */
-static struct rte_flow_action_handle *
+struct rte_flow_action_handle *
 flow_dv_action_create(struct rte_eth_dev *dev,
                      const struct rte_flow_indir_action_conf *conf,
                      const struct rte_flow_action *action,
@@ -14922,7 +15433,7 @@ flow_dv_action_create(struct rte_eth_dev *dev,
  * @return
  *   0 on success, otherwise negative errno value.
  */
-static int
+int
 flow_dv_action_destroy(struct rte_eth_dev *dev,
                       struct rte_flow_action_handle *handle,
                       struct rte_flow_error *error)
@@ -15002,8 +15513,9 @@ __flow_dv_action_rss_update(struct rte_eth_dev *dev, uint32_t idx,
            mlx5_ipool_get(priv->sh->ipool[MLX5_IPOOL_RSS_SHARED_ACTIONS], idx);
        int ret = 0;
        void *queue = NULL;
-       uint16_t *queue_old = NULL;
+       void *queue_i = NULL;
        uint32_t queue_size = action_conf->queue_num * sizeof(uint16_t);
+       bool dev_started = !!dev->data->dev_started;
 
        if (!shared_rss)
                return rte_flow_error_set(error, EINVAL,
@@ -15024,19 +15536,23 @@ __flow_dv_action_rss_update(struct rte_eth_dev *dev, uint32_t idx,
        memcpy(queue, action_conf->queue, queue_size);
        MLX5_ASSERT(shared_rss->ind_tbl);
        rte_spinlock_lock(&shared_rss->action_rss_sl);
-       queue_old = shared_rss->ind_tbl->queues;
+       queue_i = shared_rss->ind_tbl->queues;
        ret = mlx5_ind_table_obj_modify(dev, shared_rss->ind_tbl,
-                                       queue, action_conf->queue_num, true);
+                                       queue, action_conf->queue_num,
+                                       true /* standalone */,
+                                       dev_started /* ref_new_qs */,
+                                       dev_started /* deref_old_qs */);
        if (ret) {
-               mlx5_free(queue);
                ret = rte_flow_error_set(error, rte_errno,
                                          RTE_FLOW_ERROR_TYPE_ACTION, NULL,
                                          "cannot update indirection table");
        } else {
-               mlx5_free(queue_old);
-               shared_rss->origin.queue = queue;
+               /* Restore the queue to indirect table internal queue. */
+               memcpy(queue_i, queue, queue_size);
+               shared_rss->ind_tbl->queues = queue_i;
                shared_rss->origin.queue_num = action_conf->queue_num;
        }
+       mlx5_free(queue);
        rte_spinlock_unlock(&shared_rss->action_rss_sl);
        return ret;
 }
@@ -15127,7 +15643,7 @@ __flow_dv_action_ct_update(struct rte_eth_dev *dev, uint32_t idx,
  * @return
  *   0 on success, otherwise negative errno value.
  */
-static int
+int
 flow_dv_action_update(struct rte_eth_dev *dev,
                        struct rte_flow_action_handle *handle,
                        const void *update,
@@ -15175,7 +15691,7 @@ __flow_dv_destroy_sub_policy_rules(struct rte_eth_dev *dev,
 
        for (i = 0; i < RTE_COLORS; i++) {
                next_fm = NULL;
-               if (i == RTE_COLOR_GREEN && policy &&
+               if (i <= RTE_COLOR_YELLOW && policy &&
                    policy->act_cnt[i].fate_action == MLX5_FLOW_FATE_MTR)
                        next_fm = mlx5_flow_meter_find(priv,
                                        policy->act_cnt[i].next_mtr_id, NULL);
@@ -15299,6 +15815,51 @@ flow_dv_destroy_mtr_policy_acts(struct rte_eth_dev *dev,
                mtr_policy->dr_drop_action[j] = NULL;
 }
 
+/**
+ * Create yellow action for color aware meter.
+ *
+ * When HAVE_MLX5_DR_CREATE_ACTION_ASO is defined, the action is created
+ * through mlx5_glue->dv_create_flow_action_aso() on the shared Rx domain
+ * (priv->sh->rx_domain) and stored in fm->meter_action_y. The ASO meter
+ * object and its pool are recovered from @p fm with container_of(): @p fm
+ * is treated as the "fm" member of a struct mlx5_aso_mtr, which in turn is
+ * treated as element mtrs[aso_mtr->offset] of a struct mlx5_aso_mtr_pool.
+ * The meter color register is looked up with mlx5_flow_get_reg_id() for
+ * MLX5_MTR_COLOR and passed to the glue call relative to REG_C_0.
+ *
+ * When HAVE_MLX5_DR_CREATE_ACTION_ASO is not defined, nothing is created;
+ * the function then succeeds only if fm->meter_action_y is already set.
+ *
+ * NOTE(review): the result of mlx5_flow_get_reg_id() is stored in a
+ * uint8_t and is not checked, and flow_err is never examined afterwards.
+ * Confirm the lookup cannot fail for MLX5_MTR_COLOR on this path.
+ *
+ * @param[in] dev
+ *   Pointer to the Ethernet device structure.
+ * @param[in, out] fm
+ *   Meter information table. Its meter_action_y field is written when ASO
+ *   action creation is compiled in.
+ * @param[out] error
+ *   Perform verbose error reporting if not NULL. Initialized in case of
+ *   error only.
+ *
+ * @return
+ *   0 on success, a negative errno value otherwise and rte_errno is set.
+ *   On failure the error is reported through rte_mtr_error_set() with
+ *   EINVAL and RTE_MTR_ERROR_TYPE_MTR_ID.
+ */
+static int
+__flow_dv_create_mtr_yellow_action(struct rte_eth_dev *dev,
+                                  struct mlx5_flow_meter_info *fm,
+                                  struct rte_mtr_error *error)
+{
+#ifdef HAVE_MLX5_DR_CREATE_ACTION_ASO
+       struct mlx5_priv *priv = dev->data->dev_private;
+       struct rte_flow_error flow_err;
+       struct mlx5_aso_mtr *aso_mtr;
+       struct mlx5_aso_mtr_pool *pool;
+       uint8_t reg_id;
+
+       aso_mtr = container_of(fm, struct mlx5_aso_mtr, fm); /* fm -> enclosing ASO meter */
+       pool = container_of(aso_mtr, struct mlx5_aso_mtr_pool, mtrs[aso_mtr->offset]); /* meter -> owning pool */
+       reg_id = mlx5_flow_get_reg_id(dev, MLX5_MTR_COLOR, 0, &flow_err); /* result not validated here */
+       fm->meter_action_y =
+               mlx5_glue->dv_create_flow_action_aso(priv->sh->rx_domain,
+                                                    pool->devx_obj->obj,
+                                                    aso_mtr->offset,
+                                                    (1 << MLX5_FLOW_COLOR_YELLOW),
+                                                    reg_id - REG_C_0);
+#else
+       RTE_SET_USED(dev); /* dev is only needed by the ASO creation path */
+#endif
+       if (!fm->meter_action_y) { /* creation failed, or not compiled in and never set */
+               return -rte_mtr_error_set(error, EINVAL, RTE_MTR_ERROR_TYPE_MTR_ID, NULL,
+                                         "Fail to create yellow meter action.");
+       }
+       return 0;
+}
+
 /**
  * Create policy action per domain, lock free,
  * (mutex should be acquired by caller).
@@ -15310,6 +15871,8 @@ flow_dv_destroy_mtr_policy_acts(struct rte_eth_dev *dev,
  *   Meter policy struct.
  * @param[in] action
  *   Action specification used to create meter actions.
+ * @param[in] attr
+ *   Pointer to the flow attributes.
  * @param[out] error
  *   Perform verbose error reporting if not NULL. Initialized in case of
  *   error only.
@@ -15321,6 +15884,7 @@ static int
 __flow_dv_create_domain_policy_acts(struct rte_eth_dev *dev,
                        struct mlx5_flow_meter_policy *mtr_policy,
                        const struct rte_flow_action *actions[RTE_COLORS],
+                       struct rte_flow_attr *attr,
                        enum mlx5_meter_domain domain,
                        struct rte_mtr_error *error)
 {
@@ -15379,7 +15943,6 @@ __flow_dv_create_domain_policy_acts(struct rte_eth_dev *dev,
                                          NULL,
                                          "cannot create policy "
                                          "mark action for this color");
-                               dev_flow.handle->mark = 1;
                                if (flow_dv_tag_resource_register(dev, tag_be,
                                                  &dev_flow, &flow_err))
                                        return -rte_mtr_error_set(error,
@@ -15391,6 +15954,7 @@ __flow_dv_create_domain_policy_acts(struct rte_eth_dev *dev,
                                act_cnt->rix_mark =
                                        dev_flow.handle->dvh.rix_tag;
                                action_flags |= MLX5_FLOW_ACTION_MARK;
+                               mtr_policy->mark = 1;
                                break;
                        }
                        case RTE_FLOW_ACTION_TYPE_SET_TAG:
@@ -15617,8 +16181,30 @@ __flow_dv_create_domain_policy_acts(struct rte_eth_dev *dev,
                                action_flags |= MLX5_FLOW_ACTION_JUMP;
                                break;
                        }
+                       case RTE_FLOW_ACTION_TYPE_MODIFY_FIELD:
+                       {
+                               if (i >= MLX5_MTR_RTE_COLORS)
+                                       return -rte_mtr_error_set(error,
+                                         ENOTSUP,
+                                         RTE_MTR_ERROR_TYPE_METER_POLICY,
+                                         NULL,
+                                         "cannot create policy modify field for this color");
+                               if (flow_dv_convert_action_modify_field
+                                       (dev, mhdr_res, act, attr, &flow_err))
+                                       return -rte_mtr_error_set(error,
+                                       ENOTSUP,
+                                       RTE_MTR_ERROR_TYPE_METER_POLICY,
+                                       NULL, "cannot setup policy modify field action");
+                               if (!mhdr_res->actions_num)
+                                       return -rte_mtr_error_set(error,
+                                       ENOTSUP,
+                                       RTE_MTR_ERROR_TYPE_METER_POLICY,
+                                       NULL, "cannot find policy modify field action");
+                               action_flags |= MLX5_FLOW_ACTION_MODIFY_FIELD;
+                               break;
+                       }
                        /*
-                        * No need to check meter hierarchy for Y or R colors
+                        * No need to check meter hierarchy for R colors
                         * here since it is done in the validation stage.
                         */
                        case RTE_FLOW_ACTION_TYPE_METER:
@@ -15669,11 +16255,17 @@ __flow_dv_create_domain_policy_acts(struct rte_eth_dev *dev,
                                        action_flags |=
                                                MLX5_FLOW_ACTION_SET_TAG;
                                }
+                               if (i == RTE_COLOR_YELLOW && next_fm->color_aware &&
+                                   !next_fm->meter_action_y)
+                                       if (__flow_dv_create_mtr_yellow_action(dev, next_fm, error))
+                                               return -rte_errno;
                                act_cnt->fate_action = MLX5_FLOW_FATE_MTR;
                                act_cnt->next_mtr_id = next_fm->meter_id;
                                act_cnt->next_sub_policy = NULL;
                                mtr_policy->is_hierarchy = 1;
                                mtr_policy->dev = next_policy->dev;
+                               if (next_policy->mark)
+                                       mtr_policy->mark = 1;
                                action_flags |=
                                MLX5_FLOW_ACTION_METER_WITH_TERMINATED_POLICY;
                                break;
@@ -15683,7 +16275,8 @@ __flow_dv_create_domain_policy_acts(struct rte_eth_dev *dev,
                                          RTE_MTR_ERROR_TYPE_METER_POLICY,
                                          NULL, "action type not supported");
                        }
-                       if (action_flags & MLX5_FLOW_ACTION_SET_TAG) {
+                       if ((action_flags & MLX5_FLOW_ACTION_SET_TAG) ||
+                           (action_flags & MLX5_FLOW_ACTION_MODIFY_FIELD)) {
                                /* create modify action if needed. */
                                dev_flow.dv.group = 1;
                                if (flow_dv_modify_hdr_resource_register
@@ -15691,8 +16284,7 @@ __flow_dv_create_domain_policy_acts(struct rte_eth_dev *dev,
                                        return -rte_mtr_error_set(error,
                                                ENOTSUP,
                                                RTE_MTR_ERROR_TYPE_METER_POLICY,
-                                               NULL, "cannot register policy "
-                                               "set tag action");
+                                               NULL, "cannot register policy set tag/modify field action");
                                act_cnt->modify_hdr =
                                        dev_flow.handle->dvh.modify_hdr;
                        }
@@ -15712,6 +16304,8 @@ __flow_dv_create_domain_policy_acts(struct rte_eth_dev *dev,
  *   Meter policy struct.
  * @param[in] action
  *   Action specification used to create meter actions.
+ * @param[in] attr
+ *   Pointer to the flow attributes.
  * @param[out] error
  *   Perform verbose error reporting if not NULL. Initialized in case of
  *   error only.
@@ -15723,6 +16317,7 @@ static int
 flow_dv_create_mtr_policy_acts(struct rte_eth_dev *dev,
                      struct mlx5_flow_meter_policy *mtr_policy,
                      const struct rte_flow_action *actions[RTE_COLORS],
+                     struct rte_flow_attr *attr,
                      struct rte_mtr_error *error)
 {
        int ret, i;
@@ -15734,7 +16329,7 @@ flow_dv_create_mtr_policy_acts(struct rte_eth_dev *dev,
                        MLX5_MTR_SUB_POLICY_NUM_MASK;
                if (sub_policy_num) {
                        ret = __flow_dv_create_domain_policy_acts(dev,
-                               mtr_policy, actions,
+                               mtr_policy, actions, attr,
                                (enum mlx5_meter_domain)i, error);
                        /* Cleaning resource is done in the caller level. */
                        if (ret)
@@ -15759,14 +16354,14 @@ flow_dv_create_mtr_policy_acts(struct rte_eth_dev *dev,
  * @return
  *   0 on success, a negative errno value otherwise and rte_errno is set.
  */
-int
+static int
 flow_dv_query_count(struct rte_eth_dev *dev, uint32_t cnt_idx, void *data,
                    struct rte_flow_error *error)
 {
        struct mlx5_priv *priv = dev->data->dev_private;
        struct rte_flow_query_count *qc = data;
 
-       if (!priv->sh->devx)
+       if (!priv->sh->cdev->config.devx)
                return rte_flow_error_set(error, ENOTSUP,
                                          RTE_FLOW_ERROR_TYPE_UNSPECIFIED,
                                          NULL,
@@ -15797,49 +16392,7 @@ flow_dv_query_count(struct rte_eth_dev *dev, uint32_t cnt_idx, void *data,
                                  "counters are not available");
 }
 
-
-/**
- * Query counter's action pointer for a DV flow rule via DevX.
- *
- * @param[in] dev
- *   Pointer to Ethernet device.
- * @param[in] cnt_idx
- *   Index to the flow counter.
- * @param[out] action_ptr
- *   Action pointer for counter.
- * @param[out] error
- *   Perform verbose error reporting if not NULL.
- *
- * @return
- *   0 on success, a negative errno value otherwise and rte_errno is set.
- */
 int
-flow_dv_query_count_ptr(struct rte_eth_dev *dev, uint32_t cnt_idx,
-       void **action_ptr, struct rte_flow_error *error)
-{
-       struct mlx5_priv *priv = dev->data->dev_private;
-
-       if (!priv->sh->devx || !action_ptr)
-               return rte_flow_error_set(error, ENOTSUP,
-                                         RTE_FLOW_ERROR_TYPE_UNSPECIFIED,
-                                         NULL,
-                                         "counters are not supported");
-
-       if (cnt_idx) {
-               struct mlx5_flow_counter *cnt = NULL;
-               cnt = flow_dv_counter_get_by_idx(dev, cnt_idx, NULL);
-               if (cnt) {
-                       *action_ptr = cnt->action;
-                       return 0;
-               }
-       }
-       return rte_flow_error_set(error, EINVAL,
-                                 RTE_FLOW_ERROR_TYPE_UNSPECIFIED,
-                                 NULL,
-                                 "counters are not available");
-}
-
-static int
 flow_dv_action_query(struct rte_eth_dev *dev,
                     const struct rte_flow_action_handle *handle, void *data,
                     struct rte_flow_error *error)
@@ -16001,7 +16554,7 @@ flow_dv_destroy_mtr_tbls(struct rte_eth_dev *dev,
        struct mlx5_priv *priv = dev->data->dev_private;
        int i;
 
-       if (!fm || !priv->config.dv_flow_en)
+       if (!fm || !priv->sh->config.dv_flow_en)
                return;
        for (i = 0; i < MLX5_MTR_DOMAIN_MAX; i++) {
                if (fm->drop_rule[i]) {
@@ -16104,7 +16657,7 @@ __flow_dv_create_policy_flow(struct rte_eth_dev *dev,
        struct mlx5_priv *priv = dev->data->dev_private;
        uint8_t misc_mask;
 
-       if (match_src_port && (priv->representor || priv->master)) {
+       if (match_src_port && priv->sh->esw_mode) {
                if (flow_dv_translate_item_port_id(dev, matcher.buf,
                                                   value.buf, item, attr)) {
                        DRV_LOG(ERR, "Failed to create meter policy%d flow's"
@@ -16156,7 +16709,7 @@ __flow_dv_create_policy_matcher(struct rte_eth_dev *dev,
        struct mlx5_priv *priv = dev->data->dev_private;
        const uint32_t color_mask = (UINT32_C(1) << MLX5_MTR_COLOR_BITS) - 1;
 
-       if (match_src_port && (priv->representor || priv->master)) {
+       if (match_src_port && priv->sh->esw_mode) {
                if (flow_dv_translate_item_port_id(dev, matcher.mask.buf,
                                                   value.buf, item, attr)) {
                        DRV_LOG(ERR, "Failed to register meter policy%d matcher"
@@ -16307,7 +16860,7 @@ __flow_dv_create_policy_acts_rules(struct rte_eth_dev *dev,
        struct mlx5_flow_dv_tag_resource *tag;
        struct mlx5_flow_dv_port_id_action_resource *port_action;
        struct mlx5_hrxq *hrxq;
-       struct mlx5_flow_meter_info *next_fm = NULL;
+       struct mlx5_flow_meter_info *next_fm[RTE_COLORS] = {NULL};
        struct mlx5_flow_meter_policy *next_policy;
        struct mlx5_flow_meter_sub_policy *next_sub_policy;
        struct mlx5_flow_tbl_data_entry *tbl_data;
@@ -16328,30 +16881,31 @@ __flow_dv_create_policy_acts_rules(struct rte_eth_dev *dev,
                        acts[i].actions_n = 1;
                        continue;
                }
-               if (i == RTE_COLOR_GREEN &&
-                   mtr_policy->act_cnt[i].fate_action == MLX5_FLOW_FATE_MTR) {
+               if (mtr_policy->act_cnt[i].fate_action == MLX5_FLOW_FATE_MTR) {
                        struct rte_flow_attr attr = {
                                .transfer = transfer
                        };
 
-                       next_fm = mlx5_flow_meter_find(priv,
+                       next_fm[i] = mlx5_flow_meter_find(priv,
                                        mtr_policy->act_cnt[i].next_mtr_id,
                                        NULL);
-                       if (!next_fm) {
+                       if (!next_fm[i]) {
                                DRV_LOG(ERR,
                                        "Failed to get next hierarchy meter.");
                                goto err_exit;
                        }
-                       if (mlx5_flow_meter_attach(priv, next_fm,
+                       if (mlx5_flow_meter_attach(priv, next_fm[i],
                                                   &attr, &error)) {
                                DRV_LOG(ERR, "%s", error.message);
-                               next_fm = NULL;
+                               next_fm[i] = NULL;
                                goto err_exit;
                        }
                        /* Meter action must be the first for TX. */
                        if (mtr_first) {
                                acts[i].dv_actions[acts[i].actions_n] =
-                                       next_fm->meter_action;
+                                       (next_fm[i]->color_aware && i == RTE_COLOR_YELLOW) ?
+                                               next_fm[i]->meter_action_y :
+                                               next_fm[i]->meter_action_g;
                                acts[i].actions_n++;
                        }
                }
@@ -16409,14 +16963,16 @@ __flow_dv_create_policy_acts_rules(struct rte_eth_dev *dev,
                                acts[i].actions_n++;
                                break;
                        case MLX5_FLOW_FATE_MTR:
-                               if (!next_fm) {
+                               if (!next_fm[i]) {
                                        DRV_LOG(ERR,
                                                "No next hierarchy meter.");
                                        goto err_exit;
                                }
                                if (!mtr_first) {
                                        acts[i].dv_actions[acts[i].actions_n] =
-                                                       next_fm->meter_action;
+                                               (next_fm[i]->color_aware && i == RTE_COLOR_YELLOW) ?
+                                                       next_fm[i]->meter_action_y :
+                                                       next_fm[i]->meter_action_g;
                                        acts[i].actions_n++;
                                }
                                if (mtr_policy->act_cnt[i].next_sub_policy) {
@@ -16425,7 +16981,7 @@ __flow_dv_create_policy_acts_rules(struct rte_eth_dev *dev,
                                } else {
                                        next_policy =
                                                mlx5_flow_meter_policy_find(dev,
-                                               next_fm->policy_id, NULL);
+                                                               next_fm[i]->policy_id, NULL);
                                        MLX5_ASSERT(next_policy);
                                        next_sub_policy =
                                        next_policy->sub_policys[domain][0];
@@ -16452,8 +17008,9 @@ __flow_dv_create_policy_acts_rules(struct rte_eth_dev *dev,
        }
        return 0;
 err_exit:
-       if (next_fm)
-               mlx5_flow_meter_detach(priv, next_fm);
+       for (i = 0; i < RTE_COLORS; i++)
+               if (next_fm[i])
+                       mlx5_flow_meter_detach(priv, next_fm[i]);
        return -1;
 }
 
@@ -16607,7 +17164,8 @@ flow_dv_create_def_policy(struct rte_eth_dev *dev)
 
        /* Non-termination policy table. */
        for (i = 0; i < MLX5_MTR_DOMAIN_MAX; i++) {
-               if (!priv->config.dv_esw_en && i == MLX5_MTR_DOMAIN_TRANSFER)
+               if (!priv->sh->config.dv_esw_en &&
+                   i == MLX5_MTR_DOMAIN_TRANSFER)
                        continue;
                if (__flow_dv_create_domain_def_policy(dev, i)) {
                        DRV_LOG(ERR, "Failed to create default policy");
@@ -16804,16 +17362,19 @@ __flow_dv_meter_get_rss_sub_policy(struct rte_eth_dev *dev,
        struct mlx5_meter_policy_action_container *act_cnt;
        uint32_t domain = MLX5_MTR_DOMAIN_INGRESS;
        uint16_t sub_policy_num;
+       struct mlx5_flow_workspace *wks = mlx5_flow_get_thread_workspace();
 
+       MLX5_ASSERT(wks);
        rte_spinlock_lock(&mtr_policy->sl);
        for (i = 0; i < MLX5_MTR_RTE_COLORS; i++) {
                if (!rss_desc[i])
                        continue;
-               hrxq_idx[i] = mlx5_hrxq_get(dev, rss_desc[i]);
-               if (!hrxq_idx[i]) {
+               hrxq = mlx5_hrxq_get(dev, rss_desc[i]);
+               if (!hrxq) {
                        rte_spinlock_unlock(&mtr_policy->sl);
                        return NULL;
                }
+               hrxq_idx[i] = hrxq->idx;
        }
        sub_policy_num = (mtr_policy->sub_policy_num >>
                        (MLX5_MTR_SUB_POLICY_NUM_SHIFT * domain)) &
@@ -16838,7 +17399,8 @@ __flow_dv_meter_get_rss_sub_policy(struct rte_eth_dev *dev,
                }
        }
        /* Create sub policy. */
-       if (!mtr_policy->sub_policys[domain][0]->rix_hrxq[0]) {
+       if (!mtr_policy->sub_policys[domain][0]->rix_hrxq[RTE_COLOR_GREEN] &&
+           !mtr_policy->sub_policys[domain][0]->rix_hrxq[RTE_COLOR_YELLOW]) {
                /* Reuse the first pre-allocated sub_policy. */
                sub_policy = mtr_policy->sub_policys[domain][0];
                sub_policy_idx = sub_policy->idx;
@@ -16878,7 +17440,7 @@ __flow_dv_meter_get_rss_sub_policy(struct rte_eth_dev *dev,
                        if (act_cnt->rix_mark || act_cnt->modify_hdr) {
                                memset(&dh, 0, sizeof(struct mlx5_flow_handle));
                                if (act_cnt->rix_mark)
-                                       dh.mark = 1;
+                                       wks->mark = 1;
                                dh.fate_action = MLX5_FLOW_FATE_QUEUE;
                                dh.rix_hrxq = hrxq_idx[i];
                                flow_drv_rxq_flags_set(dev, &dh);
@@ -16964,8 +17526,9 @@ flow_dv_meter_sub_policy_rss_prepare(struct rte_eth_dev *dev,
                        DRV_LOG(ERR, "Exceed max meter number in hierarchy.");
                        return NULL;
                }
-               next_fm = mlx5_flow_meter_find(priv,
-                       mtr_policy->act_cnt[RTE_COLOR_GREEN].next_mtr_id, NULL);
+               rte_spinlock_lock(&mtr_policy->sl);
+               next_fm = mlx5_flow_meter_hierarchy_next_meter(priv, mtr_policy, NULL);
+               rte_spinlock_unlock(&mtr_policy->sl);
                if (!next_fm) {
                        DRV_LOG(ERR, "Failed to get next meter in hierarchy.");
                        return NULL;
@@ -17022,6 +17585,68 @@ err_exit:
        return NULL;
 }
 
+/**
+ * Decide whether a hierarchy tag rule has to be created for a meter policy.
+ *
+ * @param[in] priv
+ *   Pointer to mlx5_priv, used to look up the next meter in the hierarchy.
+ * @param[in] mtr_policy
+ *   Pointer to current meter policy; its spinlock is held during the check.
+ * @param[in] src_port
+ *   The src port compared against the policy's existing color rules.
+ * @param[out] next_fm
+ *   Next meter in hierarchy; NULL if the policy is no hierarchy or on error.
+ * @param[out] skip
+ *   True if next meter has no drop_cnt or a rule for src_port is present.
+ * @param[out] error
+ *   Perform verbose error reporting if not NULL.
+ * @return
+ *   0 on success, a negative errno value otherwise and rte_errno is set.
+ */
+static int
+mlx5_meter_hierarchy_skip_tag_rule(struct mlx5_priv *priv,
+                                  struct mlx5_flow_meter_policy *mtr_policy,
+                                  int32_t src_port,
+                                  struct mlx5_flow_meter_info **next_fm,
+                                  bool *skip,
+                                  struct rte_flow_error *error)
+{
+       struct mlx5_flow_meter_sub_policy *sub_policy;
+       struct mlx5_sub_policy_color_rule *color_rule;
+       uint32_t domain = MLX5_MTR_DOMAIN_TRANSFER;
+       int ret = 0;
+       int i;
+
+       *next_fm = NULL;
+       *skip = false;
+       rte_spinlock_lock(&mtr_policy->sl);
+       if (!mtr_policy->is_hierarchy) /* Outputs keep their defaults. */
+               goto exit;
+       *next_fm = mlx5_flow_meter_hierarchy_next_meter(priv, mtr_policy, NULL);
+       if (!*next_fm) {
+               ret = rte_flow_error_set(error, EINVAL, RTE_FLOW_ERROR_TYPE_ACTION,
+                                        NULL, "Failed to find next meter in hierarchy.");
+               goto exit;
+       }
+       if (!(*next_fm)->drop_cnt) {
+               *skip = true;
+               goto exit;
+       }
+       sub_policy = mtr_policy->sub_policys[domain][0];
+       for (i = 0; i < MLX5_MTR_RTE_COLORS; i++) {
+               if (mtr_policy->act_cnt[i].fate_action != MLX5_FLOW_FATE_MTR)
+                       continue; /* Only colors that chain to a meter. */
+               TAILQ_FOREACH(color_rule, &sub_policy->color_rules[i], next_port)
+                       if (color_rule->src_port == src_port) {
+                               *skip = true; /* Rule for this port found. */
+                               goto exit;
+                       }
+       }
+exit: /* Single unlock point for every path above. */
+       rte_spinlock_unlock(&mtr_policy->sl);
+       return ret;
+}
+
 /**
  * Create the sub policy tag rule for all meters in hierarchy.
  *
@@ -17065,111 +17690,129 @@ flow_dv_meter_hierarchy_rule_create(struct rte_eth_dev *dev,
                .reserved = 0,
        };
        uint32_t domain = MLX5_MTR_DOMAIN_TRANSFER;
-       int i;
+       struct {
+               struct mlx5_flow_meter_policy *fm_policy;
+               struct mlx5_flow_meter_info *next_fm;
+               struct mlx5_sub_policy_color_rule *tag_rule[MLX5_MTR_RTE_COLORS];
+       } fm_info[MLX5_MTR_CHAIN_MAX_NUM] = { {0} };
+       uint32_t fm_cnt = 0;
+       uint32_t i, j;
 
-       mtr_policy = mlx5_flow_meter_policy_find(dev, fm->policy_id, NULL);
-       MLX5_ASSERT(mtr_policy);
-       if (!mtr_policy->is_hierarchy)
-               return 0;
-       next_fm = mlx5_flow_meter_find(priv,
-                       mtr_policy->act_cnt[RTE_COLOR_GREEN].next_mtr_id, NULL);
-       if (!next_fm) {
-               return rte_flow_error_set(error, EINVAL,
-                               RTE_FLOW_ERROR_TYPE_ACTION, NULL,
-                               "Failed to find next meter in hierarchy.");
-       }
-       if (!next_fm->drop_cnt)
-               goto exit;
        color_reg_c_idx = mlx5_flow_get_reg_id(dev, MLX5_MTR_COLOR, 0, error);
-       sub_policy = mtr_policy->sub_policys[domain][0];
-       for (i = 0; i < RTE_COLORS; i++) {
-               bool rule_exist = false;
-               struct mlx5_meter_policy_action_container *act_cnt;
+       /* Get all fms who need to create the tag color rule. */
+       do {
+               bool skip = false;
 
-               if (i >= RTE_COLOR_YELLOW)
-                       break;
-               TAILQ_FOREACH(color_rule,
-                             &sub_policy->color_rules[i], next_port)
-                       if (color_rule->src_port == src_port) {
-                               rule_exist = true;
-                               break;
-                       }
-               if (rule_exist)
-                       continue;
-               color_rule = mlx5_malloc(MLX5_MEM_ZERO,
-                               sizeof(struct mlx5_sub_policy_color_rule),
-                               0, SOCKET_ID_ANY);
-               if (!color_rule)
-                       return rte_flow_error_set(error, ENOMEM,
-                               RTE_FLOW_ERROR_TYPE_ACTION,
-                               NULL, "No memory to create tag color rule.");
-               color_rule->src_port = src_port;
-               attr.priority = i;
-               next_policy = mlx5_flow_meter_policy_find(dev,
-                                               next_fm->policy_id, NULL);
-               MLX5_ASSERT(next_policy);
-               next_sub_policy = next_policy->sub_policys[domain][0];
-               tbl_data = container_of(next_sub_policy->tbl_rsc,
-                                       struct mlx5_flow_tbl_data_entry, tbl);
-               act_cnt = &mtr_policy->act_cnt[i];
-               if (mtr_first) {
-                       acts.dv_actions[0] = next_fm->meter_action;
-                       acts.dv_actions[1] = act_cnt->modify_hdr->action;
-               } else {
-                       acts.dv_actions[0] = act_cnt->modify_hdr->action;
-                       acts.dv_actions[1] = next_fm->meter_action;
-               }
-               acts.dv_actions[2] = tbl_data->jump.action;
-               acts.actions_n = 3;
-               if (mlx5_flow_meter_attach(priv, next_fm, &attr, error)) {
-                       next_fm = NULL;
-                       goto err_exit;
-               }
-               if (__flow_dv_create_policy_matcher(dev, color_reg_c_idx,
-                               MLX5_MTR_POLICY_MATCHER_PRIO, sub_policy,
-                               &attr, true, item,
-                               &color_rule->matcher, error)) {
-                       rte_flow_error_set(error, errno,
-                               RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
-                               "Failed to create hierarchy meter matcher.");
+               mtr_policy = mlx5_flow_meter_policy_find(dev, fm->policy_id, NULL);
+               MLX5_ASSERT(mtr_policy);
+               if (mlx5_meter_hierarchy_skip_tag_rule(priv, mtr_policy, src_port,
+                                                      &next_fm, &skip, error))
                        goto err_exit;
+               if (next_fm && !skip) {
+                       fm_info[fm_cnt].fm_policy = mtr_policy;
+                       fm_info[fm_cnt].next_fm = next_fm;
+                       if (++fm_cnt >= MLX5_MTR_CHAIN_MAX_NUM) {
+                               rte_flow_error_set(error, errno,
+                                       RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
+                                       "Exceed max meter number in hierarchy.");
+                               goto err_exit;
+                       }
                }
-               if (__flow_dv_create_policy_flow(dev, color_reg_c_idx,
-                                       (enum rte_color)i,
-                                       color_rule->matcher->matcher_object,
-                                       acts.actions_n, acts.dv_actions,
-                                       true, item,
-                                       &color_rule->rule, &attr)) {
-                       rte_flow_error_set(error, errno,
-                               RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
-                               "Failed to create hierarchy meter rule.");
-                       goto err_exit;
+               fm = next_fm;
+       } while (fm);
+       /* Create tag color rules for all needed fms. */
+       for (i = 0; i < fm_cnt; i++) {
+               void *mtr_action;
+
+               mtr_policy = fm_info[i].fm_policy;
+               rte_spinlock_lock(&mtr_policy->sl);
+               sub_policy = mtr_policy->sub_policys[domain][0];
+               for (j = 0; j < MLX5_MTR_RTE_COLORS; j++) {
+                       if (mtr_policy->act_cnt[j].fate_action != MLX5_FLOW_FATE_MTR)
+                               continue;
+                       color_rule = mlx5_malloc(MLX5_MEM_ZERO,
+                                                sizeof(struct mlx5_sub_policy_color_rule),
+                                                0, SOCKET_ID_ANY);
+                       if (!color_rule) {
+                               rte_spinlock_unlock(&mtr_policy->sl);
+                               rte_flow_error_set(error, ENOMEM,
+                                                  RTE_FLOW_ERROR_TYPE_ACTION, NULL,
+                                                  "No memory to create tag color rule.");
+                               goto err_exit;
+                       }
+                       color_rule->src_port = src_port;
+                       next_fm = fm_info[i].next_fm;
+                       if (mlx5_flow_meter_attach(priv, next_fm, &attr, error)) {
+                               mlx5_free(color_rule);
+                               rte_spinlock_unlock(&mtr_policy->sl);
+                               goto err_exit;
+                       }
+                       fm_info[i].tag_rule[j] = color_rule;
+                       TAILQ_INSERT_TAIL(&sub_policy->color_rules[j], color_rule, next_port);
+                       /* Prepare to create color rule. */
+                       mtr_action = (next_fm->color_aware && j == RTE_COLOR_YELLOW) ?
+                                                               next_fm->meter_action_y :
+                                                               next_fm->meter_action_g;
+                       next_policy = mlx5_flow_meter_policy_find(dev, next_fm->policy_id, NULL);
+                       MLX5_ASSERT(next_policy);
+                       next_sub_policy = next_policy->sub_policys[domain][0];
+                       tbl_data = container_of(next_sub_policy->tbl_rsc,
+                                               struct mlx5_flow_tbl_data_entry, tbl);
+                       if (mtr_first) {
+                               acts.dv_actions[0] = mtr_action;
+                               acts.dv_actions[1] = mtr_policy->act_cnt[j].modify_hdr->action;
+                       } else {
+                               acts.dv_actions[0] = mtr_policy->act_cnt[j].modify_hdr->action;
+                               acts.dv_actions[1] = mtr_action;
+                       }
+                       acts.dv_actions[2] = tbl_data->jump.action;
+                       acts.actions_n = 3;
+                       if (__flow_dv_create_policy_matcher(dev, color_reg_c_idx,
+                                               MLX5_MTR_POLICY_MATCHER_PRIO, sub_policy,
+                                               &attr, true, item, &color_rule->matcher, error)) {
+                               rte_spinlock_unlock(&mtr_policy->sl);
+                               rte_flow_error_set(error, errno,
+                                                  RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
+                                                  "Failed to create hierarchy meter matcher.");
+                               goto err_exit;
+                       }
+                       if (__flow_dv_create_policy_flow(dev, color_reg_c_idx, (enum rte_color)j,
+                                               color_rule->matcher->matcher_object,
+                                               acts.actions_n, acts.dv_actions,
+                                               true, item, &color_rule->rule, &attr)) {
+                               rte_spinlock_unlock(&mtr_policy->sl);
+                               rte_flow_error_set(error, errno,
+                                                  RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
+                                                  "Failed to create hierarchy meter rule.");
+                               goto err_exit;
+                       }
                }
-               TAILQ_INSERT_TAIL(&sub_policy->color_rules[i],
-                                 color_rule, next_port);
+               rte_spinlock_unlock(&mtr_policy->sl);
        }
-exit:
-       /**
-        * Recursive call to iterate all meters in hierarchy and
-        * create needed rules.
-        */
-       return flow_dv_meter_hierarchy_rule_create(dev, next_fm,
-                                               src_port, item, error);
+       return 0;
 err_exit:
-       if (color_rule) {
-               if (color_rule->rule)
-                       mlx5_flow_os_destroy_flow(color_rule->rule);
-               if (color_rule->matcher) {
-                       struct mlx5_flow_tbl_data_entry *tbl =
-                               container_of(color_rule->matcher->tbl,
-                                               typeof(*tbl), tbl);
-                       mlx5_list_unregister(tbl->matchers,
-                                               &color_rule->matcher->entry);
+       for (i = 0; i < fm_cnt; i++) {
+               mtr_policy = fm_info[i].fm_policy;
+               rte_spinlock_lock(&mtr_policy->sl);
+               sub_policy = mtr_policy->sub_policys[domain][0];
+               for (j = 0; j < MLX5_MTR_RTE_COLORS; j++) {
+                       color_rule = fm_info[i].tag_rule[j];
+                       if (!color_rule)
+                               continue;
+                       if (color_rule->rule)
+                               mlx5_flow_os_destroy_flow(color_rule->rule);
+                       if (color_rule->matcher) {
+                               struct mlx5_flow_tbl_data_entry *tbl =
+                                       container_of(color_rule->matcher->tbl, typeof(*tbl), tbl);
+                               mlx5_list_unregister(tbl->matchers, &color_rule->matcher->entry);
+                       }
+                       if (fm_info[i].next_fm)
+                               mlx5_flow_meter_detach(priv, fm_info[i].next_fm);
+                       TAILQ_REMOVE(&sub_policy->color_rules[j], color_rule, next_port);
+                       mlx5_free(color_rule);
                }
-               mlx5_free(color_rule);
+               rte_spinlock_unlock(&mtr_policy->sl);
        }
-       if (next_fm)
-               mlx5_flow_meter_detach(priv, next_fm);
        return -rte_errno;
 }
 
@@ -17414,20 +18057,23 @@ err:
  */
 static int
 flow_dv_counter_query(struct rte_eth_dev *dev, uint32_t counter, bool clear,
-                     uint64_t *pkts, uint64_t *bytes)
+                     uint64_t *pkts, uint64_t *bytes, void **action)
 {
        struct mlx5_priv *priv = dev->data->dev_private;
        struct mlx5_flow_counter *cnt;
        uint64_t inn_pkts, inn_bytes;
        int ret;
 
-       if (!priv->sh->devx)
+       if (!priv->sh->cdev->config.devx)
                return -1;
 
        ret = _flow_dv_query_count(dev, counter, &inn_pkts, &inn_bytes);
        if (ret)
                return -1;
        cnt = flow_dv_counter_get_by_idx(dev, counter, NULL);
+       if (cnt && action)
+               *action = cnt->action;
+
        *pkts = inn_pkts - cnt->hits;
        *bytes = inn_bytes - cnt->bytes;
        if (clear) {
@@ -17525,7 +18171,7 @@ flow_dv_counter_allocate(struct rte_eth_dev *dev)
  * @return
  *   0 on success, otherwise negative errno value.
  */
-static int
+int
 flow_dv_action_validate(struct rte_eth_dev *dev,
                        const struct rte_flow_indir_action_conf *conf,
                        const struct rte_flow_action *action,
@@ -17559,7 +18205,7 @@ flow_dv_action_validate(struct rte_eth_dev *dev,
                                                "Indirect age action not supported");
                return flow_dv_validate_action_age(0, action, dev, err);
        case RTE_FLOW_ACTION_TYPE_COUNT:
-               return flow_dv_validate_action_count(dev, true, 0, err);
+               return flow_dv_validate_action_count(dev, true, 0, NULL, err);
        case RTE_FLOW_ACTION_TYPE_CONNTRACK:
                if (!priv->sh->ct_aso_en)
                        return rte_flow_error_set(err, ENOTSUP,
@@ -17649,8 +18295,8 @@ flow_dv_validate_policy_mtr_hierarchy(struct rte_eth_dev *dev,
                                        NULL,
                                        "Multiple fate actions not supported.");
        *hierarchy_domain = 0;
+       fm = mlx5_flow_meter_find(priv, meter_id, NULL);
        while (true) {
-               fm = mlx5_flow_meter_find(priv, meter_id, NULL);
                if (!fm)
                        return -rte_mtr_error_set(error, EINVAL,
                                                RTE_MTR_ERROR_TYPE_MTR_ID, NULL,
@@ -17659,6 +18305,10 @@ flow_dv_validate_policy_mtr_hierarchy(struct rte_eth_dev *dev,
                        return -rte_mtr_error_set(error, EINVAL,
                                        RTE_MTR_ERROR_TYPE_MTR_ID, NULL,
                        "Non termination meter not supported in hierarchy.");
+               if (!fm->shared)
+                       return -rte_mtr_error_set(error, EINVAL,
+                                       RTE_MTR_ERROR_TYPE_MTR_ID, NULL,
+                                       "Only shared meter supported in hierarchy.");
                policy = mlx5_flow_meter_policy_find(dev, fm->policy_id, NULL);
                MLX5_ASSERT(policy);
                /**
@@ -17680,7 +18330,9 @@ flow_dv_validate_policy_mtr_hierarchy(struct rte_eth_dev *dev,
                        *is_rss = policy->is_rss;
                        break;
                }
-               meter_id = policy->act_cnt[RTE_COLOR_GREEN].next_mtr_id;
+               rte_spinlock_lock(&policy->sl);
+               fm = mlx5_flow_meter_hierarchy_next_meter(priv, policy, NULL);
+               rte_spinlock_unlock(&policy->sl);
                if (++cnt >= MLX5_MTR_CHAIN_MAX_NUM)
                        return -rte_mtr_error_set(error, EINVAL,
                                        RTE_MTR_ERROR_TYPE_METER_POLICY, NULL,
@@ -17716,7 +18368,7 @@ flow_dv_validate_mtr_policy_acts(struct rte_eth_dev *dev,
                        struct rte_mtr_error *error)
 {
        struct mlx5_priv *priv = dev->data->dev_private;
-       struct mlx5_dev_config *dev_conf = &priv->config;
+       struct mlx5_sh_config *dev_conf = &priv->sh->config;
        const struct rte_flow_action *act;
        uint64_t action_flags[RTE_COLORS] = {0};
        int actions_n;
@@ -17726,11 +18378,12 @@ flow_dv_validate_mtr_policy_acts(struct rte_eth_dev *dev,
        uint8_t def_domain = MLX5_MTR_ALL_DOMAIN_BIT;
        uint8_t hierarchy_domain = 0;
        const struct rte_flow_action_meter *mtr;
+       const struct rte_flow_action_meter *next_mtr = NULL;
        bool def_green = false;
        bool def_yellow = false;
        const struct rte_flow_action_rss *rss_color[RTE_COLORS] = {NULL};
 
-       if (!priv->config.dv_esw_en)
+       if (!dev_conf->dv_esw_en)
                def_domain &= ~MLX5_MTR_DOMAIN_TRANSFER_BIT;
        *domain_bitmap = def_domain;
        /* Red color could only support DROP action. */
@@ -17774,7 +18427,7 @@ flow_dv_validate_mtr_policy_acts(struct rte_eth_dev *dev,
                        switch (act->type) {
                        case RTE_FLOW_ACTION_TYPE_PORT_ID:
                        case RTE_FLOW_ACTION_TYPE_REPRESENTED_PORT:
-                               if (!priv->config.dv_esw_en)
+                               if (!dev_conf->dv_esw_en)
                                        return -rte_mtr_error_set(error,
                                        ENOTSUP,
                                        RTE_MTR_ERROR_TYPE_METER_POLICY,
@@ -17909,25 +18562,12 @@ flow_dv_validate_mtr_policy_acts(struct rte_eth_dev *dev,
                                ++actions_n;
                                action_flags[i] |= MLX5_FLOW_ACTION_JUMP;
                                break;
-                       /*
-                        * Only the last meter in the hierarchy will support
-                        * the YELLOW color steering. Then in the meter policy
-                        * actions list, there should be no other meter inside.
-                        */
                        case RTE_FLOW_ACTION_TYPE_METER:
-                               if (i != RTE_COLOR_GREEN)
-                                       return -rte_mtr_error_set(error,
-                                               ENOTSUP,
-                                               RTE_MTR_ERROR_TYPE_METER_POLICY,
-                                               NULL,
-                                               "Meter hierarchy only supports GREEN color.");
-                               if (*policy_mode != MLX5_MTR_POLICY_MODE_OG)
-                                       return -rte_mtr_error_set(error,
-                                               ENOTSUP,
-                                               RTE_MTR_ERROR_TYPE_METER_POLICY,
-                                               NULL,
-                                               "No yellow policy should be provided in meter hierarchy.");
                                mtr = act->conf;
+                               if (next_mtr && next_mtr->mtr_id != mtr->mtr_id)
+                                       return -rte_mtr_error_set(error, ENOTSUP,
+                                               RTE_MTR_ERROR_TYPE_METER_POLICY, NULL,
+                                               "Green and Yellow must use the same meter.");
                                ret = flow_dv_validate_policy_mtr_hierarchy(dev,
                                                        mtr->mtr_id,
                                                        action_flags[i],
@@ -17939,6 +18579,20 @@ flow_dv_validate_mtr_policy_acts(struct rte_eth_dev *dev,
                                ++actions_n;
                                action_flags[i] |=
                                MLX5_FLOW_ACTION_METER_WITH_TERMINATED_POLICY;
+                               next_mtr = mtr;
+                               break;
+                       case RTE_FLOW_ACTION_TYPE_MODIFY_FIELD:
+                               ret = flow_dv_validate_action_modify_field(dev,
+                                       action_flags[i], act, attr, &flow_err);
+                               if (ret < 0)
+                                       return -rte_mtr_error_set(error,
+                                         ENOTSUP,
+                                         RTE_MTR_ERROR_TYPE_METER_POLICY,
+                                         NULL, flow_err.message ?
+                                         flow_err.message :
+                                         "Modify field action validate check fail");
+                               ++actions_n;
+                               action_flags[i] |= MLX5_FLOW_ACTION_MODIFY_FIELD;
                                break;
                        default:
                                return -rte_mtr_error_set(error, ENOTSUP,
@@ -18024,6 +18678,13 @@ flow_dv_validate_mtr_policy_acts(struct rte_eth_dev *dev,
                        }
                }
        }
+       if (next_mtr && *policy_mode == MLX5_MTR_POLICY_MODE_ALL) {
+               if (!(action_flags[RTE_COLOR_GREEN] & action_flags[RTE_COLOR_YELLOW] &
+                     MLX5_FLOW_ACTION_METER_WITH_TERMINATED_POLICY))
+                       return -rte_mtr_error_set(error, EINVAL, RTE_MTR_ERROR_TYPE_METER_POLICY,
+                                                 NULL,
+                                                 "Meter hierarchy supports meter action only.");
+       }
        /* If both colors have RSS, the attributes should be the same. */
        if (flow_dv_mtr_policy_rss_compare(rss_color[RTE_COLOR_GREEN],
                                           rss_color[RTE_COLOR_YELLOW]))
@@ -18215,4 +18876,3 @@ const struct mlx5_flow_driver_ops mlx5_flow_dv_drv_ops = {
 };
 
 #endif /* HAVE_IBV_FLOW_DV_SUPPORT */
-