net/mlx5: add MPLS to Direct Verbs flow engine
[dpdk.git] / drivers / net / mlx5 / mlx5_flow_dv.c
index 156d0d0..b9293bd 100644 (file)
@@ -35,8 +35,6 @@
 
 #ifdef HAVE_IBV_FLOW_DV_SUPPORT
 
-#define MLX5_ENCAP_MAX_LEN 132
-
 /**
  * Validate META item.
  *
@@ -177,6 +175,172 @@ flow_dv_validate_action_l2_decap(uint64_t action_flags,
        return 0;
 }
 
+/**
+ * Validate the raw encap action against the actions detected so far.
+ *
+ * @param[in] action_flags
+ *   Bit mask of the actions detected until now.
+ * @param[in] action
+ *   Pointer to the encap action; its configuration must not be NULL.
+ * @param[in] attr
+ *   Pointer to the flow attributes; ingress requires a preceding raw decap.
+ * @param[out] error
+ *   Pointer to the error structure.
+ *
+ * @return
+ *   0 on success, a negative errno value otherwise and rte_errno is set.
+ */
+static int
+flow_dv_validate_action_raw_encap(uint64_t action_flags,
+                                 const struct rte_flow_action *action,
+                                 const struct rte_flow_attr *attr,
+                                 struct rte_flow_error *error)
+{
+       if (!(action->conf))
+               return rte_flow_error_set(error, EINVAL,
+                                         RTE_FLOW_ERROR_TYPE_ACTION, action,
+                                         "configuration cannot be null");
+       if (action_flags & MLX5_FLOW_ACTION_DROP)
+               return rte_flow_error_set(error, EINVAL,
+                                         RTE_FLOW_ERROR_TYPE_ACTION, NULL,
+                                         "can't drop and encap in same flow");
+       if (action_flags & MLX5_FLOW_ENCAP_ACTIONS)
+               return rte_flow_error_set(error, EINVAL,
+                                         RTE_FLOW_ERROR_TYPE_ACTION, NULL,
+                                         "can only have a single encap"
+                                         " action in a flow");
+       /* Encap without a preceding raw decap is not supported for ingress. */
+       if (attr->ingress && !(action_flags & MLX5_FLOW_ACTION_RAW_DECAP))
+               return rte_flow_error_set(error, ENOTSUP,
+                                         RTE_FLOW_ERROR_TYPE_ATTR_INGRESS,
+                                         NULL,
+                                         "encap action not supported for "
+                                         "ingress");
+       return 0;
+}
+
+/**
+ * Validate the raw decap action against the actions detected so far.
+ *
+ * @param[in] action_flags
+ *   Bit mask of the actions detected until now.
+ * @param[in] action
+ *   Pointer to the decap action inside the END-terminated action list.
+ * @param[in] attr
+ *   Pointer to the flow attributes; egress requires a following raw encap.
+ * @param[out] error
+ *   Pointer to the error structure.
+ *
+ * @return
+ *   0 on success, a negative errno value otherwise and rte_errno is set.
+ */
+static int
+flow_dv_validate_action_raw_decap(uint64_t action_flags,
+                                 const struct rte_flow_action *action,
+                                 const struct rte_flow_attr *attr,
+                                 struct rte_flow_error *error)
+{
+       if (action_flags & MLX5_FLOW_ACTION_DROP)
+               return rte_flow_error_set(error, EINVAL,
+                                         RTE_FLOW_ERROR_TYPE_ACTION, NULL,
+                                         "can't drop and decap in same flow");
+       if (action_flags & MLX5_FLOW_ENCAP_ACTIONS)
+               return rte_flow_error_set(error, EINVAL,
+                                         RTE_FLOW_ERROR_TYPE_ACTION, NULL,
+                                         "can't have encap action before"
+                                         " decap action");
+       if (action_flags & MLX5_FLOW_DECAP_ACTIONS)
+               return rte_flow_error_set(error, EINVAL,
+                                         RTE_FLOW_ERROR_TYPE_ACTION, NULL,
+                                         "can only have a single decap"
+                                         " action in a flow");
+       /* Decap action is valid on egress only if it is followed by encap. */
+       if (attr->egress) {
+               for (; action->type != RTE_FLOW_ACTION_TYPE_END &&
+                      action->type != RTE_FLOW_ACTION_TYPE_RAW_ENCAP;
+                      action++) {
+               }
+               if (action->type != RTE_FLOW_ACTION_TYPE_RAW_ENCAP)
+                       return rte_flow_error_set
+                                       (error, ENOTSUP,
+                                        RTE_FLOW_ERROR_TYPE_ATTR_EGRESS,
+                                        NULL, "decap action not supported"
+                                        " for egress");
+       }
+       return 0;
+}
+
+
+/**
+ * Find existing encap/decap resource or create and register a new one.
+ *
+ * @param[in, out] dev
+ *   Pointer to rte_eth_dev structure; its private data holds the cache list.
+ * @param[in] resource
+ *   Pointer to the encap/decap resource used as lookup key and template.
+ * @param[in, out] dev_flow
+ *   Pointer to the dev_flow; its dv.encap_decap is set to the cached entry.
+ * @param[out] error
+ *   Pointer to the error structure.
+ *
+ * @return
+ *   0 on success, a negative errno value otherwise and rte_errno is set.
+ */
+static int
+flow_dv_encap_decap_resource_register
+                       (struct rte_eth_dev *dev,
+                        struct mlx5_flow_dv_encap_decap_resource *resource,
+                        struct mlx5_flow *dev_flow,
+                        struct rte_flow_error *error)
+{
+       struct priv *priv = dev->data->dev_private;
+       struct mlx5_flow_dv_encap_decap_resource *cache_resource;
+
+       /* Look up a matching resource (type, table, size, data) in the cache. */
+       LIST_FOREACH(cache_resource, &priv->encaps_decaps, next) {
+               if (resource->reformat_type == cache_resource->reformat_type &&
+                   resource->ft_type == cache_resource->ft_type &&
+                   resource->size == cache_resource->size &&
+                   !memcmp((const void *)resource->buf,
+                           (const void *)cache_resource->buf,
+                           resource->size)) {
+                       DRV_LOG(DEBUG, "encap/decap resource %p: refcnt %d++",
+                               (void *)cache_resource,
+                               rte_atomic32_read(&cache_resource->refcnt));
+                       rte_atomic32_inc(&cache_resource->refcnt);
+                       dev_flow->dv.encap_decap = cache_resource;
+                       return 0;
+               }
+       }
+       /* No match: allocate, create the verbs action and register the entry. */
+       cache_resource = rte_calloc(__func__, 1, sizeof(*cache_resource), 0);
+       if (!cache_resource)
+               return rte_flow_error_set(error, ENOMEM,
+                                         RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
+                                         "cannot allocate resource memory");
+       *cache_resource = *resource;
+       cache_resource->verbs_action =
+               mlx5_glue->dv_create_flow_action_packet_reformat
+                       (priv->ctx, cache_resource->size,
+                        (cache_resource->size ? cache_resource->buf : NULL),
+                        cache_resource->reformat_type,
+                        cache_resource->ft_type);
+       if (!cache_resource->verbs_action) {
+               rte_free(cache_resource);
+               return rte_flow_error_set(error, ENOMEM,
+                                         RTE_FLOW_ERROR_TYPE_UNSPECIFIED,
+                                         NULL, "cannot create action");
+       }
+       rte_atomic32_init(&cache_resource->refcnt);
+       rte_atomic32_inc(&cache_resource->refcnt);
+       LIST_INSERT_HEAD(&priv->encaps_decaps, cache_resource, next);
+       dev_flow->dv.encap_decap = cache_resource;
+       DRV_LOG(DEBUG, "new encap/decap resource %p: refcnt %d++",
+               (void *)cache_resource,
+               rte_atomic32_read(&cache_resource->refcnt));
+       return 0;
+}
+
 /**
  * Get the size of specific rte_flow_item_type
  *
@@ -418,42 +582,51 @@ flow_dv_convert_encap_data(const struct rte_flow_item *items, uint8_t *buf,
  *   Pointer to rte_eth_dev structure.
  * @param[in] action
  *   Pointer to action structure.
+ * @param[in, out] dev_flow
+ *   Pointer to the mlx5_flow.
  * @param[out] error
  *   Pointer to the error structure.
  *
  * @return
- *   Pointer to action on success, NULL otherwise and rte_errno is set.
+ *   0 on success, a negative errno value otherwise and rte_errno is set.
  */
-static struct ibv_flow_action *
+static int
 flow_dv_create_action_l2_encap(struct rte_eth_dev *dev,
                               const struct rte_flow_action *action,
+                              struct mlx5_flow *dev_flow,
                               struct rte_flow_error *error)
 {
-       struct ibv_flow_action *verbs_action = NULL;
        const struct rte_flow_item *encap_data;
-       struct priv *priv = dev->data->dev_private;
-       uint8_t buf[MLX5_ENCAP_MAX_LEN];
-       size_t size = 0;
-       int convert_result = 0;
+       const struct rte_flow_action_raw_encap *raw_encap_data;
+       struct mlx5_flow_dv_encap_decap_resource res = {
+               .reformat_type =
+                       MLX5DV_FLOW_ACTION_PACKET_REFORMAT_TYPE_L2_TO_L2_TUNNEL,
+               .ft_type = MLX5DV_FLOW_TABLE_TYPE_NIC_TX,
+       };
 
-       if (action->type == RTE_FLOW_ACTION_TYPE_VXLAN_ENCAP)
-               encap_data = ((const struct rte_flow_action_vxlan_encap *)
+       if (action->type == RTE_FLOW_ACTION_TYPE_RAW_ENCAP) {
+               raw_encap_data =
+                       (const struct rte_flow_action_raw_encap *)action->conf;
+               res.size = raw_encap_data->size;
+               memcpy(res.buf, raw_encap_data->data, res.size);
+       } else {
+               if (action->type == RTE_FLOW_ACTION_TYPE_VXLAN_ENCAP)
+                       encap_data =
+                               ((const struct rte_flow_action_vxlan_encap *)
                                                action->conf)->definition;
-       else
-               encap_data = ((const struct rte_flow_action_nvgre_encap *)
+               else
+                       encap_data =
+                               ((const struct rte_flow_action_nvgre_encap *)
                                                action->conf)->definition;
-       convert_result = flow_dv_convert_encap_data(encap_data, buf,
-                                                   &size, error);
-       if (convert_result)
-               return NULL;
-       verbs_action = mlx5_glue->dv_create_flow_action_packet_reformat
-               (priv->ctx, size, buf,
-                MLX5DV_FLOW_ACTION_PACKET_REFORMAT_TYPE_L2_TO_L2_TUNNEL,
-                MLX5DV_FLOW_TABLE_TYPE_NIC_TX);
-       if (!verbs_action)
-               rte_flow_error_set(error, EINVAL, RTE_FLOW_ERROR_TYPE_ACTION,
-                                  NULL, "cannot create L2 encap action");
-       return verbs_action;
+               if (flow_dv_convert_encap_data(encap_data, res.buf,
+                                              &res.size, error))
+                       return -rte_errno;
+       }
+       if (flow_dv_encap_decap_resource_register(dev, &res, dev_flow, error))
+               return rte_flow_error_set(error, EINVAL,
+                                         RTE_FLOW_ERROR_TYPE_ACTION,
+                                         NULL, "can't create L2 encap action");
+       return 0;
 }
 
 /**
@@ -461,27 +634,73 @@ flow_dv_create_action_l2_encap(struct rte_eth_dev *dev,
  *
  * @param[in] dev
  *   Pointer to rte_eth_dev structure.
+ * @param[in, out] dev_flow
+ *   Pointer to the mlx5_flow; receives the registered decap resource.
  * @param[out] error
  *   Pointer to the error structure.
  *
  * @return
- *   Pointer to action on success, NULL otherwise and rte_errno is set.
+ *   0 on success, a negative errno value otherwise and rte_errno is set.
  */
-static struct ibv_flow_action *
+static int
 flow_dv_create_action_l2_decap(struct rte_eth_dev *dev,
+                              struct mlx5_flow *dev_flow,
                               struct rte_flow_error *error)
 {
-       struct ibv_flow_action *verbs_action = NULL;
-       struct priv *priv = dev->data->dev_private;
+       struct mlx5_flow_dv_encap_decap_resource res = {
+               .size = 0,
+               .reformat_type =
+                       MLX5DV_FLOW_ACTION_PACKET_REFORMAT_TYPE_L2_TUNNEL_TO_L2,
+               .ft_type = MLX5DV_FLOW_TABLE_TYPE_NIC_RX,
+       };
+
+       if (flow_dv_encap_decap_resource_register(dev, &res, dev_flow, error))
+               return rte_flow_error_set(error, EINVAL,
+                                         RTE_FLOW_ERROR_TYPE_ACTION,
+                                         NULL, "can't create L2 decap action");
+       return 0;
+}
 
-       verbs_action = mlx5_glue->dv_create_flow_action_packet_reformat
-               (priv->ctx, 0, NULL,
-                MLX5DV_FLOW_ACTION_PACKET_REFORMAT_TYPE_L2_TUNNEL_TO_L2,
-                MLX5DV_FLOW_TABLE_TYPE_NIC_RX);
-       if (!verbs_action)
-               rte_flow_error_set(error, EINVAL, RTE_FLOW_ERROR_TYPE_ACTION,
-                                  NULL, "cannot create L2 decap action");
-       return verbs_action;
+/**
+ * Convert raw decap/encap (L3 tunnel) action to DV specification.
+ *
+ * @param[in] dev
+ *   Pointer to rte_eth_dev structure.
+ * @param[in] action
+ *   Pointer to the raw encap action; conf data is copied without size check.
+ * @param[in, out] dev_flow
+ *   Pointer to the mlx5_flow; receives the registered encap/decap resource.
+ * @param[in] attr
+ *   Flow attributes; egress selects L2-to-L3 on NIC TX, else L3-to-L2 on RX.
+ * @param[out] error
+ *   Pointer to the error structure.
+ *
+ * @return
+ *   0 on success, a negative errno value otherwise and rte_errno is set.
+ */
+static int
+flow_dv_create_action_raw_encap(struct rte_eth_dev *dev,
+                               const struct rte_flow_action *action,
+                               struct mlx5_flow *dev_flow,
+                               const struct rte_flow_attr *attr,
+                               struct rte_flow_error *error)
+{
+       const struct rte_flow_action_raw_encap *encap_data;
+       struct mlx5_flow_dv_encap_decap_resource res;
+
+       encap_data = (const struct rte_flow_action_raw_encap *)action->conf;
+       res.size = encap_data->size;
+       memcpy(res.buf, encap_data->data, res.size);
+       res.reformat_type = attr->egress ?
+               MLX5DV_FLOW_ACTION_PACKET_REFORMAT_TYPE_L2_TO_L3_TUNNEL :
+               MLX5DV_FLOW_ACTION_PACKET_REFORMAT_TYPE_L3_TUNNEL_TO_L2;
+       res.ft_type = attr->egress ? MLX5DV_FLOW_TABLE_TYPE_NIC_TX :
+                                    MLX5DV_FLOW_TABLE_TYPE_NIC_RX;
+       if (flow_dv_encap_decap_resource_register(dev, &res, dev_flow, error))
+               return rte_flow_error_set(error, EINVAL,
+                                         RTE_FLOW_ERROR_TYPE_ACTION,
+                                         NULL, "can't create encap action");
+       return 0;
 }
 
 /**
@@ -595,10 +814,17 @@ flow_dv_validate(struct rte_eth_dev *dev, const struct rte_flow_attr *attr,
                                               MLX5_FLOW_LAYER_OUTER_L3_IPV4;
                        if (items->mask != NULL &&
                            ((const struct rte_flow_item_ipv4 *)
-                            items->mask)->hdr.next_proto_id)
+                            items->mask)->hdr.next_proto_id) {
                                next_protocol =
                                        ((const struct rte_flow_item_ipv4 *)
                                         (items->spec))->hdr.next_proto_id;
+                               next_protocol &=
+                                       ((const struct rte_flow_item_ipv4 *)
+                                        (items->mask))->hdr.next_proto_id;
+                       } else {
+                               /* Reset for inner layer. */
+                               next_protocol = 0xff;
+                       }
                        break;
                case RTE_FLOW_ITEM_TYPE_IPV6:
                        ret = mlx5_flow_validate_item_ipv6(items, item_flags,
@@ -609,10 +835,17 @@ flow_dv_validate(struct rte_eth_dev *dev, const struct rte_flow_attr *attr,
                                               MLX5_FLOW_LAYER_OUTER_L3_IPV6;
                        if (items->mask != NULL &&
                            ((const struct rte_flow_item_ipv6 *)
-                            items->mask)->hdr.proto)
+                            items->mask)->hdr.proto) {
                                next_protocol =
                                        ((const struct rte_flow_item_ipv6 *)
                                         items->spec)->hdr.proto;
+                               next_protocol &=
+                                       ((const struct rte_flow_item_ipv6 *)
+                                        items->mask)->hdr.proto;
+                       } else {
+                               /* Reset for inner layer. */
+                               next_protocol = 0xff;
+                       }
                        break;
                case RTE_FLOW_ITEM_TYPE_TCP:
                        ret = mlx5_flow_validate_item_tcp
@@ -657,6 +890,14 @@ flow_dv_validate(struct rte_eth_dev *dev, const struct rte_flow_attr *attr,
                                return ret;
                        item_flags |= MLX5_FLOW_LAYER_VXLAN_GPE;
                        break;
+               case RTE_FLOW_ITEM_TYPE_MPLS:
+                       ret = mlx5_flow_validate_item_mpls(items, item_flags,
+                                                          next_protocol,
+                                                          error);
+                       if (ret < 0)
+                               return ret;
+                       item_flags |= MLX5_FLOW_LAYER_MPLS;
+                       break;
                case RTE_FLOW_ITEM_TYPE_META:
                        ret = flow_dv_validate_item_meta(dev, items, attr,
                                                         error);
@@ -739,7 +980,6 @@ flow_dv_validate(struct rte_eth_dev *dev, const struct rte_flow_attr *attr,
                                        RTE_FLOW_ACTION_TYPE_VXLAN_ENCAP ?
                                        MLX5_FLOW_ACTION_VXLAN_ENCAP :
                                        MLX5_FLOW_ACTION_NVGRE_ENCAP;
-
                        ++actions_n;
                        break;
                case RTE_FLOW_ACTION_TYPE_VXLAN_DECAP:
@@ -752,7 +992,24 @@ flow_dv_validate(struct rte_eth_dev *dev, const struct rte_flow_attr *attr,
                                        RTE_FLOW_ACTION_TYPE_VXLAN_DECAP ?
                                        MLX5_FLOW_ACTION_VXLAN_DECAP :
                                        MLX5_FLOW_ACTION_NVGRE_DECAP;
-
+                       ++actions_n;
+                       break;
+               case RTE_FLOW_ACTION_TYPE_RAW_ENCAP:
+                       ret = flow_dv_validate_action_raw_encap(action_flags,
+                                                               actions, attr,
+                                                               error);
+                       if (ret < 0)
+                               return ret;
+                       action_flags |= MLX5_FLOW_ACTION_RAW_ENCAP;
+                       ++actions_n;
+                       break;
+               case RTE_FLOW_ACTION_TYPE_RAW_DECAP:
+                       ret = flow_dv_validate_action_raw_decap(action_flags,
+                                                               actions, attr,
+                                                               error);
+                       if (ret < 0)
+                               return ret;
+                       action_flags |= MLX5_FLOW_ACTION_RAW_DECAP;
                        ++actions_n;
                        break;
                default:
@@ -779,10 +1036,6 @@ flow_dv_validate(struct rte_eth_dev *dev, const struct rte_flow_attr *attr,
  *   Pointer to the list of items.
  * @param[in] actions
  *   Pointer to the list of actions.
- * @param[out] item_flags
- *   Pointer to bit mask of all items detected.
- * @param[out] action_flags
- *   Pointer to bit mask of all actions detected.
  * @param[out] error
  *   Pointer to the error structure.
  *
@@ -794,8 +1047,6 @@ static struct mlx5_flow *
 flow_dv_prepare(const struct rte_flow_attr *attr __rte_unused,
                const struct rte_flow_item items[] __rte_unused,
                const struct rte_flow_action actions[] __rte_unused,
-               uint64_t *item_flags __rte_unused,
-               uint64_t *action_flags __rte_unused,
                struct rte_flow_error *error)
 {
        uint32_t size = sizeof(struct mlx5_flow);
@@ -812,6 +1063,39 @@ flow_dv_prepare(const struct rte_flow_attr *attr __rte_unused,
        return flow;
 }
 
+#ifndef NDEBUG
+/**
+ * Sanity check for match mask and value. Similar to check_valid_spec() in
+ * kernel driver. Fails if the value has any bit set outside of the mask.
+ *
+ * @param match_mask
+ *   Pointer to the match mask buffer.
+ * @param match_value
+ *   Pointer to the match value buffer.
+ *
+ * @return
+ *   0 if valid, -EINVAL otherwise.
+ */
+static int
+flow_dv_check_valid_spec(void *match_mask, void *match_value)
+{
+       uint8_t *m = match_mask;
+       uint8_t *v = match_value;
+       unsigned int i;
+
+       for (i = 0; i < MLX5_ST_SZ_DB(fte_match_param); ++i) {
+               if (v[i] & ~m[i]) {
+                       DRV_LOG(ERR,
+                               "match_value differs from match_criteria"
+                               " %p[%u] != %p[%u]",
+                               match_value, i, match_mask, i);
+                       return -EINVAL;
+               }
+       }
+       return 0;
+}
+#endif
+
 /**
  * Add Ethernet item to matcher and to the value.
  *
@@ -1332,6 +1616,96 @@ flow_dv_translate_item_vxlan(void *matcher, void *key,
                vni_v[i] = vni_m[i] & vxlan_v->vni[i];
 }
 
+/**
+ * Add MPLS item to matcher and to the value.
+ *
+ * @param[in, out] matcher
+ *   Flow matcher.
+ * @param[in, out] key
+ *   Flow matcher value.
+ * @param[in] item
+ *   Flow pattern to translate.
+ * @param[in] prev_layer
+ *   Layer flag of the previous item; selects UDP, GRE or IP protocol match.
+ * @param[in] inner
+ *   Item is inner pattern.
+ */
+static void
+flow_dv_translate_item_mpls(void *matcher, void *key,
+                           const struct rte_flow_item *item,
+                           uint64_t prev_layer,
+                           int inner)
+{
+       const uint32_t *in_mpls_m = item->mask;
+       const uint32_t *in_mpls_v = item->spec;
+       uint32_t *out_mpls_m = 0;
+       uint32_t *out_mpls_v = 0;
+       void *misc_m = MLX5_ADDR_OF(fte_match_param, matcher, misc_parameters);
+       void *misc_v = MLX5_ADDR_OF(fte_match_param, key, misc_parameters);
+       void *misc2_m = MLX5_ADDR_OF(fte_match_param, matcher,
+                                    misc_parameters_2);
+       void *misc2_v = MLX5_ADDR_OF(fte_match_param, key, misc_parameters_2);
+       void *headers_m = MLX5_ADDR_OF(fte_match_param, matcher, outer_headers);
+       void *headers_v = MLX5_ADDR_OF(fte_match_param, key, outer_headers);
+
+       switch (prev_layer) {
+       case MLX5_FLOW_LAYER_OUTER_L4_UDP:
+               MLX5_SET(fte_match_set_lyr_2_4, headers_m, udp_dport, 0xffff);
+               MLX5_SET(fte_match_set_lyr_2_4, headers_v, udp_dport,
+                        MLX5_UDP_PORT_MPLS);
+               break;
+       case MLX5_FLOW_LAYER_GRE:
+               MLX5_SET(fte_match_set_misc, misc_m, gre_protocol, 0xffff);
+               MLX5_SET(fte_match_set_misc, misc_v, gre_protocol,
+                        ETHER_TYPE_MPLS);
+               break;
+       default:
+               MLX5_SET(fte_match_set_lyr_2_4, headers_m, ip_protocol, 0xff);
+               MLX5_SET(fte_match_set_lyr_2_4, headers_v, ip_protocol,
+                        IPPROTO_MPLS);
+               break;
+       }
+       if (!in_mpls_v)
+               return;
+       if (!in_mpls_m)
+               in_mpls_m = (const uint32_t *)&rte_flow_item_mpls_mask;
+       switch (prev_layer) {
+       case MLX5_FLOW_LAYER_OUTER_L4_UDP:
+               out_mpls_m =
+                       (uint32_t *)MLX5_ADDR_OF(fte_match_set_misc2, misc2_m,
+                                                outer_first_mpls_over_udp);
+               out_mpls_v =
+                       (uint32_t *)MLX5_ADDR_OF(fte_match_set_misc2, misc2_v,
+                                                outer_first_mpls_over_udp);
+               break;
+       case MLX5_FLOW_LAYER_GRE:
+               out_mpls_m =
+                       (uint32_t *)MLX5_ADDR_OF(fte_match_set_misc2, misc2_m,
+                                                outer_first_mpls_over_gre);
+               out_mpls_v =
+                       (uint32_t *)MLX5_ADDR_OF(fte_match_set_misc2, misc2_v,
+                                                outer_first_mpls_over_gre);
+               break;
+       default:
+               /* Inner MPLS not over UDP or GRE is not supported. */
+               if (!inner) {
+                       out_mpls_m =
+                               (uint32_t *)MLX5_ADDR_OF(fte_match_set_misc2,
+                                                        misc2_m,
+                                                        outer_first_mpls);
+                       out_mpls_v =
+                               (uint32_t *)MLX5_ADDR_OF(fte_match_set_misc2,
+                                                        misc2_v,
+                                                        outer_first_mpls);
+               }
+               break;
+       }
+       if (out_mpls_m && out_mpls_v) {
+               *out_mpls_m = *in_mpls_m;
+               *out_mpls_v = *in_mpls_v & *in_mpls_m;
+       }
+}
+
 /**
  * Add META item to matcher
  *
@@ -1367,204 +1741,6 @@ flow_dv_translate_item_meta(void *matcher, void *key,
        }
 }
 
-/**
- * Update the matcher and the value based the selected item.
- *
- * @param[in, out] matcher
- *   Flow matcher.
- * @param[in, out] key
- *   Flow matcher value.
- * @param[in] item
- *   Flow pattern to translate.
- * @param[in, out] dev_flow
- *   Pointer to the mlx5_flow.
- * @param[in] inner
- *   Item is inner pattern.
- */
-static void
-flow_dv_create_item(void *matcher, void *key,
-                   const struct rte_flow_item *item,
-                   struct mlx5_flow *dev_flow,
-                   int inner)
-{
-       struct mlx5_flow_dv_matcher *tmatcher = matcher;
-
-       switch (item->type) {
-       case RTE_FLOW_ITEM_TYPE_ETH:
-               flow_dv_translate_item_eth(tmatcher->mask.buf, key, item,
-                                          inner);
-               tmatcher->priority = MLX5_PRIORITY_MAP_L2;
-               break;
-       case RTE_FLOW_ITEM_TYPE_VLAN:
-               flow_dv_translate_item_vlan(tmatcher->mask.buf, key, item,
-                                           inner);
-               break;
-       case RTE_FLOW_ITEM_TYPE_IPV4:
-               flow_dv_translate_item_ipv4(tmatcher->mask.buf, key, item,
-                                           inner);
-               tmatcher->priority = MLX5_PRIORITY_MAP_L3;
-               dev_flow->dv.hash_fields |=
-                       mlx5_flow_hashfields_adjust(dev_flow, inner,
-                                                   MLX5_IPV4_LAYER_TYPES,
-                                                   MLX5_IPV4_IBV_RX_HASH);
-               break;
-       case RTE_FLOW_ITEM_TYPE_IPV6:
-               flow_dv_translate_item_ipv6(tmatcher->mask.buf, key, item,
-                                           inner);
-               tmatcher->priority = MLX5_PRIORITY_MAP_L3;
-               dev_flow->dv.hash_fields |=
-                       mlx5_flow_hashfields_adjust(dev_flow, inner,
-                                                   MLX5_IPV6_LAYER_TYPES,
-                                                   MLX5_IPV6_IBV_RX_HASH);
-               break;
-       case RTE_FLOW_ITEM_TYPE_TCP:
-               flow_dv_translate_item_tcp(tmatcher->mask.buf, key, item,
-                                          inner);
-               tmatcher->priority = MLX5_PRIORITY_MAP_L4;
-               dev_flow->dv.hash_fields |=
-                       mlx5_flow_hashfields_adjust(dev_flow, inner,
-                                                   ETH_RSS_TCP,
-                                                   (IBV_RX_HASH_SRC_PORT_TCP |
-                                                    IBV_RX_HASH_DST_PORT_TCP));
-               break;
-       case RTE_FLOW_ITEM_TYPE_UDP:
-               flow_dv_translate_item_udp(tmatcher->mask.buf, key, item,
-                                          inner);
-               tmatcher->priority = MLX5_PRIORITY_MAP_L4;
-               dev_flow->verbs.hash_fields |=
-                       mlx5_flow_hashfields_adjust(dev_flow, inner,
-                                                   ETH_RSS_UDP,
-                                                   (IBV_RX_HASH_SRC_PORT_UDP |
-                                                    IBV_RX_HASH_DST_PORT_UDP));
-               break;
-       case RTE_FLOW_ITEM_TYPE_GRE:
-               flow_dv_translate_item_gre(tmatcher->mask.buf, key, item,
-                                          inner);
-               break;
-       case RTE_FLOW_ITEM_TYPE_NVGRE:
-               flow_dv_translate_item_nvgre(tmatcher->mask.buf, key, item,
-                                            inner);
-               break;
-       case RTE_FLOW_ITEM_TYPE_VXLAN:
-       case RTE_FLOW_ITEM_TYPE_VXLAN_GPE:
-               flow_dv_translate_item_vxlan(tmatcher->mask.buf, key, item,
-                                            inner);
-               break;
-       case RTE_FLOW_ITEM_TYPE_META:
-               flow_dv_translate_item_meta(tmatcher->mask.buf, key, item);
-               break;
-       default:
-               break;
-       }
-}
-
-/**
- * Store the requested actions in an array.
- *
- * @param[in] dev
- *   Pointer to rte_eth_dev structure.
- * @param[in] action
- *   Flow action to translate.
- * @param[in, out] dev_flow
- *   Pointer to the mlx5_flow.
- * @param[out] error
- *   Pointer to the error structure.
- *
- * @return
- *   0 on success, a negative errno value otherwise and rte_errno is set.
- */
-static int
-flow_dv_create_action(struct rte_eth_dev *dev,
-                     const struct rte_flow_action *action,
-                     struct mlx5_flow *dev_flow,
-                     struct rte_flow_error *error)
-{
-       const struct rte_flow_action_queue *queue;
-       const struct rte_flow_action_rss *rss;
-       int actions_n = dev_flow->dv.actions_n;
-       struct rte_flow *flow = dev_flow->flow;
-
-       switch (action->type) {
-       case RTE_FLOW_ACTION_TYPE_VOID:
-               break;
-       case RTE_FLOW_ACTION_TYPE_FLAG:
-               dev_flow->dv.actions[actions_n].type = MLX5DV_FLOW_ACTION_TAG;
-               dev_flow->dv.actions[actions_n].tag_value =
-                       mlx5_flow_mark_set(MLX5_FLOW_MARK_DEFAULT);
-               actions_n++;
-               flow->actions |= MLX5_FLOW_ACTION_FLAG;
-               break;
-       case RTE_FLOW_ACTION_TYPE_MARK:
-               dev_flow->dv.actions[actions_n].type = MLX5DV_FLOW_ACTION_TAG;
-               dev_flow->dv.actions[actions_n].tag_value =
-                       mlx5_flow_mark_set
-                       (((const struct rte_flow_action_mark *)
-                         (action->conf))->id);
-               flow->actions |= MLX5_FLOW_ACTION_MARK;
-               actions_n++;
-               break;
-       case RTE_FLOW_ACTION_TYPE_DROP:
-               dev_flow->dv.actions[actions_n].type = MLX5DV_FLOW_ACTION_DROP;
-               flow->actions |= MLX5_FLOW_ACTION_DROP;
-               break;
-       case RTE_FLOW_ACTION_TYPE_QUEUE:
-               queue = action->conf;
-               flow->rss.queue_num = 1;
-               (*flow->queue)[0] = queue->index;
-               flow->actions |= MLX5_FLOW_ACTION_QUEUE;
-               break;
-       case RTE_FLOW_ACTION_TYPE_RSS:
-               rss = action->conf;
-               if (flow->queue)
-                       memcpy((*flow->queue), rss->queue,
-                              rss->queue_num * sizeof(uint16_t));
-               flow->rss.queue_num = rss->queue_num;
-               memcpy(flow->key, rss->key, MLX5_RSS_HASH_KEY_LEN);
-               flow->rss.types = rss->types;
-               flow->rss.level = rss->level;
-               /* Added to array only in apply since we need the QP */
-               flow->actions |= MLX5_FLOW_ACTION_RSS;
-               break;
-       case RTE_FLOW_ACTION_TYPE_VXLAN_ENCAP:
-       case RTE_FLOW_ACTION_TYPE_NVGRE_ENCAP:
-               dev_flow->dv.actions[actions_n].type =
-                       MLX5DV_FLOW_ACTION_IBV_FLOW_ACTION;
-               dev_flow->dv.actions[actions_n].action =
-                               flow_dv_create_action_l2_encap(dev, action,
-                                                              error);
-               if (!(dev_flow->dv.actions[actions_n].action))
-                       return -rte_errno;
-               dev_flow->dv.encap_decap_verbs_action =
-                       dev_flow->dv.actions[actions_n].action;
-               flow->actions |= action->type ==
-                                RTE_FLOW_ACTION_TYPE_VXLAN_ENCAP ?
-                                MLX5_FLOW_ACTION_VXLAN_ENCAP :
-                                MLX5_FLOW_ACTION_NVGRE_ENCAP;
-               actions_n++;
-               break;
-       case RTE_FLOW_ACTION_TYPE_VXLAN_DECAP:
-       case RTE_FLOW_ACTION_TYPE_NVGRE_DECAP:
-               dev_flow->dv.actions[actions_n].type =
-                       MLX5DV_FLOW_ACTION_IBV_FLOW_ACTION;
-               dev_flow->dv.actions[actions_n].action =
-                               flow_dv_create_action_l2_decap(dev, error);
-               if (!(dev_flow->dv.actions[actions_n].action))
-                       return -rte_errno;
-               dev_flow->dv.encap_decap_verbs_action =
-                       dev_flow->dv.actions[actions_n].action;
-               flow->actions |= action->type ==
-                                RTE_FLOW_ACTION_TYPE_VXLAN_DECAP ?
-                                MLX5_FLOW_ACTION_VXLAN_DECAP :
-                                MLX5_FLOW_ACTION_NVGRE_DECAP;
-               actions_n++;
-               break;
-       default:
-               break;
-       }
-       dev_flow->dv.actions_n = actions_n;
-       return 0;
-}
-
 static uint32_t matcher_zero[MLX5_ST_SZ_DW(fte_match_param)] = { 0 };
 
 #define HEADER_IS_ZERO(match_criteria, headers)                                     \
@@ -1702,38 +1878,273 @@ flow_dv_translate(struct rte_eth_dev *dev,
                  struct mlx5_flow *dev_flow,
                  const struct rte_flow_attr *attr,
                  const struct rte_flow_item items[],
-                 const struct rte_flow_action actions[] __rte_unused,
+                 const struct rte_flow_action actions[],
                  struct rte_flow_error *error)
 {
        struct priv *priv = dev->data->dev_private;
+       struct rte_flow *flow = dev_flow->flow;
+       uint64_t item_flags = 0;
+       uint64_t last_item = 0;
+       uint64_t action_flags = 0;
        uint64_t priority = attr->priority;
        struct mlx5_flow_dv_matcher matcher = {
                .mask = {
                        .size = sizeof(matcher.mask.buf),
                },
        };
-       void *match_value = dev_flow->dv.value.buf;
-       int tunnel = 0;
+       int actions_n = 0;
 
        if (priority == MLX5_FLOW_PRIO_RSVD)
                priority = priv->config.flow_prio - 1;
+       for (; actions->type != RTE_FLOW_ACTION_TYPE_END; actions++) {
+               const struct rte_flow_action_queue *queue;
+               const struct rte_flow_action_rss *rss;
+               const struct rte_flow_action *action = actions;
+               const uint8_t *rss_key;
+
+               switch (actions->type) {
+               case RTE_FLOW_ACTION_TYPE_VOID:
+                       break;
+               case RTE_FLOW_ACTION_TYPE_FLAG:
+                       dev_flow->dv.actions[actions_n].type =
+                               MLX5DV_FLOW_ACTION_TAG;
+                       dev_flow->dv.actions[actions_n].tag_value =
+                               mlx5_flow_mark_set(MLX5_FLOW_MARK_DEFAULT);
+                       actions_n++;
+                       action_flags |= MLX5_FLOW_ACTION_FLAG;
+                       break;
+               case RTE_FLOW_ACTION_TYPE_MARK:
+                       dev_flow->dv.actions[actions_n].type =
+                               MLX5DV_FLOW_ACTION_TAG;
+                       dev_flow->dv.actions[actions_n].tag_value =
+                               mlx5_flow_mark_set
+                               (((const struct rte_flow_action_mark *)
+                                 (actions->conf))->id);
+                       actions_n++;
+                       action_flags |= MLX5_FLOW_ACTION_MARK;
+                       break;
+               case RTE_FLOW_ACTION_TYPE_DROP:
+                       dev_flow->dv.actions[actions_n].type =
+                               MLX5DV_FLOW_ACTION_DROP;
+                       action_flags |= MLX5_FLOW_ACTION_DROP;
+                       break;
+               case RTE_FLOW_ACTION_TYPE_QUEUE:
+                       queue = actions->conf;
+                       flow->rss.queue_num = 1;
+                       (*flow->queue)[0] = queue->index;
+                       action_flags |= MLX5_FLOW_ACTION_QUEUE;
+                       break;
+               case RTE_FLOW_ACTION_TYPE_RSS:
+                       rss = actions->conf;
+                       if (flow->queue)
+                               memcpy((*flow->queue), rss->queue,
+                                      rss->queue_num * sizeof(uint16_t));
+                       flow->rss.queue_num = rss->queue_num;
+                       /* NULL RSS key indicates default RSS key. */
+                       rss_key = !rss->key ? rss_hash_default_key : rss->key;
+                       memcpy(flow->key, rss_key, MLX5_RSS_HASH_KEY_LEN);
+                       /* RSS type 0 indicates default RSS type ETH_RSS_IP. */
+                       flow->rss.types = !rss->types ? ETH_RSS_IP : rss->types;
+                       flow->rss.level = rss->level;
+                       action_flags |= MLX5_FLOW_ACTION_RSS;
+                       break;
+               case RTE_FLOW_ACTION_TYPE_VXLAN_ENCAP:
+               case RTE_FLOW_ACTION_TYPE_NVGRE_ENCAP:
+                       if (flow_dv_create_action_l2_encap(dev, actions,
+                                                          dev_flow, error))
+                               return -rte_errno;
+                       dev_flow->dv.actions[actions_n].type =
+                               MLX5DV_FLOW_ACTION_IBV_FLOW_ACTION;
+                       dev_flow->dv.actions[actions_n].action =
+                               dev_flow->dv.encap_decap->verbs_action;
+                       actions_n++;
+                       action_flags |= actions->type ==
+                                       RTE_FLOW_ACTION_TYPE_VXLAN_ENCAP ?
+                                       MLX5_FLOW_ACTION_VXLAN_ENCAP :
+                                       MLX5_FLOW_ACTION_NVGRE_ENCAP;
+                       break;
+               case RTE_FLOW_ACTION_TYPE_VXLAN_DECAP:
+               case RTE_FLOW_ACTION_TYPE_NVGRE_DECAP:
+                       if (flow_dv_create_action_l2_decap(dev, dev_flow,
+                                                          error))
+                               return -rte_errno;
+                       dev_flow->dv.actions[actions_n].type =
+                               MLX5DV_FLOW_ACTION_IBV_FLOW_ACTION;
+                       dev_flow->dv.actions[actions_n].action =
+                               dev_flow->dv.encap_decap->verbs_action;
+                       actions_n++;
+                       action_flags |= actions->type ==
+                                       RTE_FLOW_ACTION_TYPE_VXLAN_DECAP ?
+                                       MLX5_FLOW_ACTION_VXLAN_DECAP :
+                                       MLX5_FLOW_ACTION_NVGRE_DECAP;
+                       break;
+               case RTE_FLOW_ACTION_TYPE_RAW_ENCAP:
+                       /* Handle encap with preceding decap. */
+                       if (action_flags & MLX5_FLOW_ACTION_RAW_DECAP) {
+                               if (flow_dv_create_action_raw_encap
+                                       (dev, actions, dev_flow, attr, error))
+                                       return -rte_errno;
+                               dev_flow->dv.actions[actions_n].type =
+                                       MLX5DV_FLOW_ACTION_IBV_FLOW_ACTION;
+                               dev_flow->dv.actions[actions_n].action =
+                                       dev_flow->dv.encap_decap->verbs_action;
+                       } else {
+                               /* Handle encap without preceding decap. */
+                               if (flow_dv_create_action_l2_encap(dev, actions,
+                                                                  dev_flow,
+                                                                  error))
+                                       return -rte_errno;
+                               dev_flow->dv.actions[actions_n].type =
+                                       MLX5DV_FLOW_ACTION_IBV_FLOW_ACTION;
+                               dev_flow->dv.actions[actions_n].action =
+                                       dev_flow->dv.encap_decap->verbs_action;
+                       }
+                       actions_n++;
+                       action_flags |= MLX5_FLOW_ACTION_RAW_ENCAP;
+                       break;
+               case RTE_FLOW_ACTION_TYPE_RAW_DECAP:
+                       /* Check if this decap is followed by encap. */
+                       for (; action->type != RTE_FLOW_ACTION_TYPE_END &&
+                              action->type != RTE_FLOW_ACTION_TYPE_RAW_ENCAP;
+                              action++) {
+                       }
+                       /* Handle decap only if it isn't followed by encap. */
+                       if (action->type != RTE_FLOW_ACTION_TYPE_RAW_ENCAP) {
+                               if (flow_dv_create_action_l2_decap(dev,
+                                                                  dev_flow,
+                                                                  error))
+                                       return -rte_errno;
+                               dev_flow->dv.actions[actions_n].type =
+                                       MLX5DV_FLOW_ACTION_IBV_FLOW_ACTION;
+                               dev_flow->dv.actions[actions_n].action =
+                                       dev_flow->dv.encap_decap->verbs_action;
+                               actions_n++;
+                       }
+                       /* If decap is followed by encap, handle it at encap. */
+                       action_flags |= MLX5_FLOW_ACTION_RAW_DECAP;
+                       break;
+               default:
+                       break;
+               }
+       }
+       dev_flow->dv.actions_n = actions_n;
+       flow->actions = action_flags;
        for (; items->type != RTE_FLOW_ITEM_TYPE_END; items++) {
-               tunnel = !!(dev_flow->layers & MLX5_FLOW_LAYER_TUNNEL);
-               flow_dv_create_item(&matcher, match_value, items, dev_flow,
-                                   tunnel);
+               int tunnel = !!(item_flags & MLX5_FLOW_LAYER_TUNNEL);
+               void *match_mask = matcher.mask.buf;
+               void *match_value = dev_flow->dv.value.buf;
+
+               switch (items->type) {
+               case RTE_FLOW_ITEM_TYPE_ETH:
+                       flow_dv_translate_item_eth(match_mask, match_value,
+                                                  items, tunnel);
+                       matcher.priority = MLX5_PRIORITY_MAP_L2;
+                       last_item = tunnel ? MLX5_FLOW_LAYER_INNER_L2 :
+                                            MLX5_FLOW_LAYER_OUTER_L2;
+                       break;
+               case RTE_FLOW_ITEM_TYPE_VLAN:
+                       flow_dv_translate_item_vlan(match_mask, match_value,
+                                                   items, tunnel);
+                       matcher.priority = MLX5_PRIORITY_MAP_L2;
+                       last_item = tunnel ? (MLX5_FLOW_LAYER_INNER_L2 |
+                                             MLX5_FLOW_LAYER_INNER_VLAN) :
+                                            (MLX5_FLOW_LAYER_OUTER_L2 |
+                                             MLX5_FLOW_LAYER_OUTER_VLAN);
+                       break;
+               case RTE_FLOW_ITEM_TYPE_IPV4:
+                       flow_dv_translate_item_ipv4(match_mask, match_value,
+                                                   items, tunnel);
+                       matcher.priority = MLX5_PRIORITY_MAP_L3;
+                       dev_flow->dv.hash_fields |=
+                               mlx5_flow_hashfields_adjust
+                                       (dev_flow, tunnel,
+                                        MLX5_IPV4_LAYER_TYPES,
+                                        MLX5_IPV4_IBV_RX_HASH);
+                       last_item = tunnel ? MLX5_FLOW_LAYER_INNER_L3_IPV4 :
+                                            MLX5_FLOW_LAYER_OUTER_L3_IPV4;
+                       break;
+               case RTE_FLOW_ITEM_TYPE_IPV6:
+                       flow_dv_translate_item_ipv6(match_mask, match_value,
+                                                   items, tunnel);
+                       matcher.priority = MLX5_PRIORITY_MAP_L3;
+                       dev_flow->dv.hash_fields |=
+                               mlx5_flow_hashfields_adjust
+                                       (dev_flow, tunnel,
+                                        MLX5_IPV6_LAYER_TYPES,
+                                        MLX5_IPV6_IBV_RX_HASH);
+                       last_item = tunnel ? MLX5_FLOW_LAYER_INNER_L3_IPV6 :
+                                            MLX5_FLOW_LAYER_OUTER_L3_IPV6;
+                       break;
+               case RTE_FLOW_ITEM_TYPE_TCP:
+                       flow_dv_translate_item_tcp(match_mask, match_value,
+                                                  items, tunnel);
+                       matcher.priority = MLX5_PRIORITY_MAP_L4;
+                       dev_flow->dv.hash_fields |=
+                               mlx5_flow_hashfields_adjust
+                                       (dev_flow, tunnel, ETH_RSS_TCP,
+                                        IBV_RX_HASH_SRC_PORT_TCP |
+                                        IBV_RX_HASH_DST_PORT_TCP);
+                       last_item = tunnel ? MLX5_FLOW_LAYER_INNER_L4_TCP :
+                                            MLX5_FLOW_LAYER_OUTER_L4_TCP;
+                       break;
+               case RTE_FLOW_ITEM_TYPE_UDP:
+                       flow_dv_translate_item_udp(match_mask, match_value,
+                                                  items, tunnel);
+                       matcher.priority = MLX5_PRIORITY_MAP_L4;
+                       dev_flow->dv.hash_fields |=
+                               mlx5_flow_hashfields_adjust
+                                       (dev_flow, tunnel, ETH_RSS_UDP,
+                                        IBV_RX_HASH_SRC_PORT_UDP |
+                                        IBV_RX_HASH_DST_PORT_UDP);
+                       last_item = tunnel ? MLX5_FLOW_LAYER_INNER_L4_UDP :
+                                            MLX5_FLOW_LAYER_OUTER_L4_UDP;
+                       break;
+               case RTE_FLOW_ITEM_TYPE_GRE:
+                       flow_dv_translate_item_gre(match_mask, match_value,
+                                                  items, tunnel);
+                       last_item = MLX5_FLOW_LAYER_GRE;
+                       break;
+               case RTE_FLOW_ITEM_TYPE_NVGRE:
+                       flow_dv_translate_item_nvgre(match_mask, match_value,
+                                                    items, tunnel);
+                       last_item = MLX5_FLOW_LAYER_GRE;
+                       break;
+               case RTE_FLOW_ITEM_TYPE_VXLAN:
+                       flow_dv_translate_item_vxlan(match_mask, match_value,
+                                                    items, tunnel);
+                       last_item = MLX5_FLOW_LAYER_VXLAN;
+                       break;
+               case RTE_FLOW_ITEM_TYPE_VXLAN_GPE:
+                       flow_dv_translate_item_vxlan(match_mask, match_value,
+                                                    items, tunnel);
+                       last_item = MLX5_FLOW_LAYER_VXLAN_GPE;
+                       break;
+               case RTE_FLOW_ITEM_TYPE_MPLS:
+                       flow_dv_translate_item_mpls(match_mask, match_value,
+                                                   items, last_item, tunnel);
+                       last_item = MLX5_FLOW_LAYER_MPLS;
+                       break;
+               case RTE_FLOW_ITEM_TYPE_META:
+                       flow_dv_translate_item_meta(match_mask, match_value,
+                                                   items);
+                       last_item = MLX5_FLOW_ITEM_METADATA;
+                       break;
+               default:
+                       break;
+               }
+               item_flags |= last_item;
        }
+       assert(!flow_dv_check_valid_spec(matcher.mask.buf,
+                                        dev_flow->dv.value.buf));
+       dev_flow->layers = item_flags;
+       /* Register matcher. */
        matcher.crc = rte_raw_cksum((const void *)matcher.mask.buf,
-                                    matcher.mask.size);
-       if (priority == MLX5_FLOW_PRIO_RSVD)
-               priority = priv->config.flow_prio - 1;
+                                   matcher.mask.size);
        matcher.priority = mlx5_flow_adjust_priority(dev, priority,
                                                     matcher.priority);
        matcher.egress = attr->egress;
        if (flow_dv_matcher_register(dev, &matcher, dev_flow, error))
                return -rte_errno;
-       for (; actions->type != RTE_FLOW_ACTION_TYPE_END; actions++)
-               if (flow_dv_create_action(dev, actions, dev_flow, error))
-                       return -rte_errno;
        return 0;
 }
 
@@ -1777,6 +2188,7 @@ flow_dv_apply(struct rte_eth_dev *dev, struct rte_flow *flow,
                } else if (flow->actions &
                           (MLX5_FLOW_ACTION_QUEUE | MLX5_FLOW_ACTION_RSS)) {
                        struct mlx5_hrxq *hrxq;
+
                        hrxq = mlx5_hrxq_get(dev, flow->key,
                                             MLX5_RSS_HASH_KEY_LEN,
                                             dv->hash_fields,
@@ -1863,6 +2275,37 @@ flow_dv_matcher_release(struct rte_eth_dev *dev,
        return 1;
 }
 
+/**
+ * Drop one reference on the encap/decap resource attached to a flow.
+ *
+ * @param flow
+ *   Pointer to mlx5_flow; its dv.encap_decap must not be NULL.
+ *
+ * @return
+ *   1 while a reference on it exists, 0 when freed.
+ */
+static int
+flow_dv_encap_decap_resource_release(struct mlx5_flow *flow)
+{
+       struct mlx5_flow_dv_encap_decap_resource *cache_resource =
+                                               flow->dv.encap_decap;
+
+       assert(cache_resource->verbs_action);
+       DRV_LOG(DEBUG, "encap/decap resource %p: refcnt %d--",
+               (void *)cache_resource,
+               rte_atomic32_read(&cache_resource->refcnt));
+       if (!rte_atomic32_dec_and_test(&cache_resource->refcnt))
+               return 1;
+       claim_zero(mlx5_glue->destroy_flow_action
+                       (cache_resource->verbs_action));
+       LIST_REMOVE(cache_resource, next);
+       /* Log before rte_free(): the pointer is indeterminate afterwards. */
+       DRV_LOG(DEBUG, "encap/decap resource %p: removed",
+               (void *)cache_resource);
+       rte_free(cache_resource);
+       return 0;
+}
+
 /**
  * Remove the flow from the NIC but keeps it in memory.
  *
@@ -1918,11 +2361,8 @@ flow_dv_destroy(struct rte_eth_dev *dev, struct rte_flow *flow)
                LIST_REMOVE(dev_flow, next);
                if (dev_flow->dv.matcher)
                        flow_dv_matcher_release(dev, dev_flow);
-               if (dev_flow->dv.encap_decap_verbs_action) {
-                       claim_zero(mlx5_glue->destroy_flow_action
-                               (dev_flow->dv.encap_decap_verbs_action));
-                       dev_flow->dv.encap_decap_verbs_action = NULL;
-               }
+               if (dev_flow->dv.encap_decap)
+                       flow_dv_encap_decap_resource_release(dev_flow);
                rte_free(dev_flow);
        }
 }
@@ -1940,8 +2380,10 @@ flow_dv_query(struct rte_eth_dev *dev __rte_unused,
              void *data __rte_unused,
              struct rte_flow_error *error __rte_unused)
 {
-       rte_errno = ENOTSUP;
-       return -rte_errno;
+       return rte_flow_error_set(error, ENOTSUP,
+                                 RTE_FLOW_ERROR_TYPE_UNSPECIFIED,
+                                 NULL,
+                                 "flow query with DV is not supported");
 }