net/mlx5: workaround ASO memory region creation
[dpdk.git] / drivers / net / mlx5 / mlx5_flow.c
index 1afddf7..1923abe 100644 (file)
@@ -1028,7 +1028,7 @@ flow_rxq_tunnel_ptype_update(struct mlx5_rxq_ctrl *rxq_ctrl)
  * @param[in] dev_handle
  *   Pointer to device flow handle structure.
  */
-static void
+void
 flow_drv_rxq_flags_set(struct rte_eth_dev *dev,
                       struct mlx5_flow_handle *dev_handle)
 {
@@ -3343,18 +3343,52 @@ flow_drv_destroy(struct rte_eth_dev *dev, struct rte_flow *flow)
        fops->destroy(dev, flow);
 }
 
+/**
+ * Flow driver find RSS policy tbl API. This abstracts calling driver
+ * specific functions. Parent flow (rte_flow) should have driver
+ * type (drv_type). It will find the RSS policy table that has the rss_desc.
+ *
+ * @param[in] dev
+ *   Pointer to Ethernet device.
+ * @param[in, out] flow
+ *   Pointer to flow structure.
+ * @param[in] policy
+ *   Pointer to meter policy table.
+ * @param[in] rss_desc
+ *   Pointer to rss_desc
+ */
+static struct mlx5_flow_meter_sub_policy *
+flow_drv_meter_sub_policy_rss_prepare(struct rte_eth_dev *dev,
+               struct rte_flow *flow,
+               struct mlx5_flow_meter_policy *policy,
+               struct mlx5_flow_rss_desc *rss_desc[MLX5_MTR_RTE_COLORS])
+{
+       const struct mlx5_flow_driver_ops *fops;
+       enum mlx5_flow_drv_type type = flow->drv_type;
+
+       MLX5_ASSERT(type > MLX5_FLOW_TYPE_MIN && type < MLX5_FLOW_TYPE_MAX);
+       fops = flow_get_drv_ops(type);
+       return fops->meter_sub_policy_rss_prepare(dev, policy, rss_desc);
+}
+
 /**
  * Get RSS action from the action list.
  *
+ * @param[in] dev
+ *   Pointer to Ethernet device.
  * @param[in] actions
  *   Pointer to the list of actions.
+ * @param[in] flow
+ *   Parent flow structure pointer.
  *
  * @return
  *   Pointer to the RSS action if exist, else return NULL.
  */
 static const struct rte_flow_action_rss*
-flow_get_rss_action(const struct rte_flow_action actions[])
+flow_get_rss_action(struct rte_eth_dev *dev,
+                   const struct rte_flow_action actions[])
 {
+       struct mlx5_priv *priv = dev->data->dev_private;
        const struct rte_flow_action_rss *rss = NULL;
 
        for (; actions->type != RTE_FLOW_ACTION_TYPE_END; actions++) {
@@ -3372,6 +3406,23 @@ flow_get_rss_action(const struct rte_flow_action actions[])
                                        rss = act->conf;
                        break;
                }
+               case RTE_FLOW_ACTION_TYPE_METER:
+               {
+                       uint32_t mtr_idx;
+                       struct mlx5_flow_meter_info *fm;
+                       struct mlx5_flow_meter_policy *policy;
+                       const struct rte_flow_action_meter *mtr = actions->conf;
+
+                       fm = mlx5_flow_meter_find(priv, mtr->mtr_id, &mtr_idx);
+                       if (fm) {
+                               policy = mlx5_flow_meter_policy_find(dev,
+                                               fm->policy_id, NULL);
+                               if (policy && policy->is_rss)
+                                       rss =
+                               policy->act_cnt[RTE_COLOR_GREEN].rss->conf;
+                       }
+                       break;
+               }
                default:
                        break;
                }
@@ -3489,6 +3540,12 @@ flow_action_handles_translate(struct rte_eth_dev *dev,
                        translated[handle->index].conf =
                                &shared_rss->origin;
                        break;
+               case MLX5_INDIRECT_ACTION_TYPE_COUNT:
+                       translated[handle->index].type =
+                                               (enum rte_flow_action_type)
+                                               MLX5_RTE_FLOW_ACTION_TYPE_COUNT;
+                       translated[handle->index].conf = (void *)(uintptr_t)idx;
+                       break;
                case MLX5_INDIRECT_ACTION_TYPE_AGE:
                        if (priv->sh->flow_hit_aso_en) {
                                translated[handle->index].type =
@@ -3670,13 +3727,75 @@ flow_parse_metadata_split_actions_info(const struct rte_flow_action actions[],
        return actions_n + 1;
 }
 
+/**
+ * Check if the action will change packet.
+ *
+ * @param dev
+ *   Pointer to Ethernet device.
+ * @param[in] type
+ *   action type.
+ *
+ * @return
+ *   true if action will change packet, false otherwise.
+ */
+static bool flow_check_modify_action_type(struct rte_eth_dev *dev,
+                                         enum rte_flow_action_type type)
+{
+       struct mlx5_priv *priv = dev->data->dev_private;
+
+       switch (type) {
+       case RTE_FLOW_ACTION_TYPE_SET_MAC_SRC:
+       case RTE_FLOW_ACTION_TYPE_SET_MAC_DST:
+       case RTE_FLOW_ACTION_TYPE_SET_IPV4_SRC:
+       case RTE_FLOW_ACTION_TYPE_SET_IPV4_DST:
+       case RTE_FLOW_ACTION_TYPE_SET_IPV6_SRC:
+       case RTE_FLOW_ACTION_TYPE_SET_IPV6_DST:
+       case RTE_FLOW_ACTION_TYPE_SET_TP_SRC:
+       case RTE_FLOW_ACTION_TYPE_SET_TP_DST:
+       case RTE_FLOW_ACTION_TYPE_DEC_TTL:
+       case RTE_FLOW_ACTION_TYPE_SET_TTL:
+       case RTE_FLOW_ACTION_TYPE_INC_TCP_SEQ:
+       case RTE_FLOW_ACTION_TYPE_DEC_TCP_SEQ:
+       case RTE_FLOW_ACTION_TYPE_INC_TCP_ACK:
+       case RTE_FLOW_ACTION_TYPE_DEC_TCP_ACK:
+       case RTE_FLOW_ACTION_TYPE_SET_IPV4_DSCP:
+       case RTE_FLOW_ACTION_TYPE_SET_IPV6_DSCP:
+       case RTE_FLOW_ACTION_TYPE_SET_META:
+       case RTE_FLOW_ACTION_TYPE_SET_TAG:
+       case RTE_FLOW_ACTION_TYPE_OF_POP_VLAN:
+       case RTE_FLOW_ACTION_TYPE_OF_PUSH_VLAN:
+       case RTE_FLOW_ACTION_TYPE_OF_SET_VLAN_VID:
+       case RTE_FLOW_ACTION_TYPE_OF_SET_VLAN_PCP:
+       case RTE_FLOW_ACTION_TYPE_VXLAN_ENCAP:
+       case RTE_FLOW_ACTION_TYPE_VXLAN_DECAP:
+       case RTE_FLOW_ACTION_TYPE_NVGRE_ENCAP:
+       case RTE_FLOW_ACTION_TYPE_NVGRE_DECAP:
+       case RTE_FLOW_ACTION_TYPE_RAW_ENCAP:
+       case RTE_FLOW_ACTION_TYPE_RAW_DECAP:
+       case RTE_FLOW_ACTION_TYPE_MODIFY_FIELD:
+               return true;
+       case RTE_FLOW_ACTION_TYPE_FLAG:
+       case RTE_FLOW_ACTION_TYPE_MARK:
+               if (priv->config.dv_xmeta_en != MLX5_XMETA_MODE_LEGACY)
+                       return true;
+               else
+                       return false;
+       default:
+               return false;
+       }
+}
+
 /**
  * Check meter action from the action list.
  *
+ * @param dev
+ *   Pointer to Ethernet device.
  * @param[in] actions
  *   Pointer to the list of actions.
  * @param[out] has_mtr
  *   Pointer to the meter exist flag.
+ * @param[out] has_modify
+ *   Pointer to the flag showing there's packet change action.
  * @param[out] meter_id
  *   Pointer to the meter id.
  *
@@ -3684,9 +3803,9 @@ flow_parse_metadata_split_actions_info(const struct rte_flow_action actions[],
  *   Total number of actions.
  */
 static int
-flow_check_meter_action(const struct rte_flow_action actions[],
-                       bool *has_mtr,
-                       uint32_t *meter_id)
+flow_check_meter_action(struct rte_eth_dev *dev,
+                       const struct rte_flow_action actions[],
+                       bool *has_mtr, bool *has_modify, uint32_t *meter_id)
 {
        const struct rte_flow_action_meter *mtr = NULL;
        int actions_n = 0;
@@ -3703,6 +3822,9 @@ flow_check_meter_action(const struct rte_flow_action actions[],
                default:
                        break;
                }
+               if (!*has_mtr)
+                       *has_modify |= flow_check_modify_action_type(dev,
+                                                               actions->type);
                actions_n++;
        }
        /* Count RTE_FLOW_ACTION_TYPE_END. */
@@ -4342,9 +4464,114 @@ flow_create_split_inner(struct rte_eth_dev *dev,
                dev_flow->handle->mark = 1;
        if (sub_flow)
                *sub_flow = dev_flow;
+#ifdef HAVE_IBV_FLOW_DV_SUPPORT
+       dev_flow->dv.table_id = flow_split_info->table_id;
+#endif
        return flow_drv_translate(dev, dev_flow, attr, items, actions, error);
 }
 
+/**
+ * Get the sub policy of a meter.
+ *
+ * @param[in] dev
+ *   Pointer to Ethernet device.
+ * @param[in] flow
+ *   Parent flow structure pointer.
+ * @param[in] policy_id;
+ *   Meter Policy id.
+ * @param[in] attr
+ *   Flow rule attributes.
+ * @param[in] items
+ *   Pattern specification (list terminated by the END pattern item).
+ * @param[out] error
+ *   Perform verbose error reporting if not NULL.
+ *
+ * @return
+ *   Pointer to the meter sub policy, NULL otherwise and rte_errno is set.
+ */
+static struct mlx5_flow_meter_sub_policy *
+get_meter_sub_policy(struct rte_eth_dev *dev,
+                    struct rte_flow *flow,
+                    uint32_t policy_id,
+                    const struct rte_flow_attr *attr,
+                    const struct rte_flow_item items[],
+                    struct rte_flow_error *error)
+{
+       struct mlx5_flow_meter_policy *policy;
+       struct mlx5_flow_meter_sub_policy *sub_policy = NULL;
+
+       policy = mlx5_flow_meter_policy_find(dev, policy_id, NULL);
+       if (!policy) {
+               rte_flow_error_set(error, EINVAL,
+                                  RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
+                                  "Failed to find Meter Policy.");
+               goto exit;
+       }
+       if (policy->is_rss) {
+               struct mlx5_flow_workspace *wks =
+                               mlx5_flow_get_thread_workspace();
+               struct mlx5_flow_rss_desc rss_desc_v[MLX5_MTR_RTE_COLORS];
+               struct mlx5_flow_rss_desc *rss_desc[MLX5_MTR_RTE_COLORS] = {0};
+               uint32_t i;
+
+               MLX5_ASSERT(wks);
+               /**
+                * This is a tmp dev_flow,
+                * no need to register any matcher for it in translate.
+                */
+               wks->skip_matcher_reg = 1;
+               for (i = 0; i < MLX5_MTR_RTE_COLORS; i++) {
+                       struct mlx5_flow dev_flow = {0};
+                       struct mlx5_flow_handle dev_handle = { {0} };
+                       const void *rss_act = policy->act_cnt[i].rss->conf;
+                       struct rte_flow_action rss_actions[2] = {
+                               [0] = {
+                                       .type = RTE_FLOW_ACTION_TYPE_RSS,
+                                       .conf = rss_act
+                               },
+                               [1] = {
+                                       .type = RTE_FLOW_ACTION_TYPE_END,
+                                       .conf = NULL
+                               }
+                       };
+
+                       dev_flow.handle = &dev_handle;
+                       dev_flow.ingress = attr->ingress;
+                       dev_flow.flow = flow;
+                       dev_flow.external = 0;
+#ifdef HAVE_IBV_FLOW_DV_SUPPORT
+                       dev_flow.dv.transfer = attr->transfer;
+#endif
+                       /* Translate RSS action to get rss hash fields. */
+                       if (flow_drv_translate(dev, &dev_flow, attr,
+                                               items, rss_actions, error))
+                               goto exit;
+                       rss_desc_v[i] = wks->rss_desc;
+                       rss_desc_v[i].key_len = MLX5_RSS_HASH_KEY_LEN;
+                       rss_desc_v[i].hash_fields = dev_flow.hash_fields;
+                       rss_desc_v[i].queue_num = rss_desc_v[i].hash_fields ?
+                                                 rss_desc_v[i].queue_num : 1;
+                       rss_desc[i] = &rss_desc_v[i];
+               }
+               sub_policy = flow_drv_meter_sub_policy_rss_prepare(dev,
+                                               flow, policy, rss_desc);
+       } else {
+               enum mlx5_meter_domain mtr_domain =
+                       attr->transfer ? MLX5_MTR_DOMAIN_TRANSFER :
+                               attr->egress ? MLX5_MTR_DOMAIN_EGRESS :
+                                       MLX5_MTR_DOMAIN_INGRESS;
+               sub_policy = policy->sub_policys[mtr_domain][0];
+       }
+       if (!sub_policy) {
+               rte_flow_error_set(error, EINVAL,
+                       RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
+                       "Failed to get meter sub-policy.");
+               goto exit;
+       }
+exit:
+       return sub_policy;
+}
+
 /**
  * Split the meter flow.
  *
@@ -4359,8 +4586,12 @@ flow_create_split_inner(struct rte_eth_dev *dev,
  *
  * @param[in] dev
  *   Pointer to Ethernet device.
+ * @param[in] flow
+ *   Parent flow structure pointer.
  * @param[in] fm
  *   Pointer to flow meter structure.
+ * @param[in] attr
+ *   Flow rule attributes.
  * @param[in] items
  *   Pattern specification (list terminated by the END pattern item).
  * @param[out] sfx_items
@@ -4371,24 +4602,25 @@ flow_create_split_inner(struct rte_eth_dev *dev,
  *   Suffix flow actions.
  * @param[out] actions_pre
  *   Prefix flow actions.
- * @param[out] pattern_sfx
- *   The pattern items for the suffix flow.
- * @param[out] tag_sfx
- *   Pointer to suffix flow tag.
+ * @param[out] mtr_flow_id
+ *   Pointer to meter flow id.
  * @param[out] error
  *   Perform verbose error reporting if not NULL.
  *
  * @return
- *   The flow id, 0 otherwise and rte_errno is set.
+ *   0 on success, a negative errno value otherwise and rte_errno is set.
  */
-static uint32_t
+static int
 flow_meter_split_prep(struct rte_eth_dev *dev,
-                     struct mlx5_flow_meter *fm,
+                     struct rte_flow *flow,
+                     struct mlx5_flow_meter_info *fm,
+                     const struct rte_flow_attr *attr,
                      const struct rte_flow_item items[],
                      struct rte_flow_item sfx_items[],
                      const struct rte_flow_action actions[],
                      struct rte_flow_action actions_sfx[],
                      struct rte_flow_action actions_pre[],
+                     uint32_t *mtr_flow_id,
                      struct rte_flow_error *error)
 {
        struct mlx5_priv *priv = dev->data->dev_private;
@@ -4401,6 +4633,11 @@ flow_meter_split_prep(struct rte_eth_dev *dev,
        struct mlx5_rte_flow_item_tag *tag_item_mask;
        uint32_t tag_id = 0;
        bool copy_vlan = false;
+       struct rte_flow_action *hw_mtr_action;
+       struct rte_flow_action *action_pre_head = NULL;
+       bool mtr_first = priv->sh->meter_aso_en &&
+                       (attr->egress ||
+                       (attr->transfer && priv->representor_id != UINT16_MAX));
        uint8_t mtr_id_offset = priv->mtr_reg_share ? MLX5_MTR_COLOR_BITS : 0;
        uint8_t mtr_reg_bits = priv->mtr_reg_share ?
                                MLX5_MTR_IDLE_BITS_IN_COLOR_REG : MLX5_REG_BITS;
@@ -4409,29 +4646,39 @@ flow_meter_split_prep(struct rte_eth_dev *dev,
        uint8_t flow_id_bits = 0;
        int shift;
 
+       /* For ASO meter, meter must be before tag in TX direction. */
+       if (mtr_first) {
+               action_pre_head = actions_pre++;
+               /* Leave space for tag action. */
+               tag_action = actions_pre++;
+       }
        /* Prepare the actions for prefix and suffix flow. */
        for (; actions->type != RTE_FLOW_ACTION_TYPE_END; actions++) {
-               struct rte_flow_action **action_cur = NULL;
+               struct rte_flow_action *action_cur = NULL;
 
                switch (actions->type) {
                case RTE_FLOW_ACTION_TYPE_METER:
-                       /* Add the extra tag action first. */
-                       tag_action = actions_pre++;
-                       action_cur = &actions_pre;
+                       if (mtr_first) {
+                               action_cur = action_pre_head;
+                       } else {
+                               /* Leave space for tag action. */
+                               tag_action = actions_pre++;
+                               action_cur = actions_pre++;
+                       }
                        break;
                case RTE_FLOW_ACTION_TYPE_VXLAN_DECAP:
                case RTE_FLOW_ACTION_TYPE_NVGRE_DECAP:
-                       action_cur = &actions_pre;
+                       action_cur = actions_pre++;
                        break;
                case RTE_FLOW_ACTION_TYPE_RAW_ENCAP:
                        raw_encap = actions->conf;
                        if (raw_encap->size < MLX5_ENCAPSULATION_DECISION_SIZE)
-                               action_cur = &actions_pre;
+                               action_cur = actions_pre++;
                        break;
                case RTE_FLOW_ACTION_TYPE_RAW_DECAP:
                        raw_decap = actions->conf;
                        if (raw_decap->size > MLX5_ENCAPSULATION_DECISION_SIZE)
-                               action_cur = &actions_pre;
+                               action_cur = actions_pre++;
                        break;
                case RTE_FLOW_ACTION_TYPE_OF_PUSH_VLAN:
                case RTE_FLOW_ACTION_TYPE_OF_SET_VLAN_VID:
@@ -4441,30 +4688,72 @@ flow_meter_split_prep(struct rte_eth_dev *dev,
                        break;
                }
                if (!action_cur)
-                       action_cur = &actions_sfx;
-               memcpy(*action_cur, actions, sizeof(struct rte_flow_action));
-               (*action_cur)++;
+                       action_cur = (fm->def_policy) ?
+                                       actions_sfx++ : actions_pre++;
+               memcpy(action_cur, actions, sizeof(struct rte_flow_action));
        }
        /* Add end action to the actions. */
        actions_sfx->type = RTE_FLOW_ACTION_TYPE_END;
+       if (priv->sh->meter_aso_en) {
+               /**
+                * For ASO meter, need to add an extra jump action explicitly,
+                * to jump from meter to policer table.
+                */
+               struct mlx5_flow_meter_sub_policy *sub_policy;
+               struct mlx5_flow_tbl_data_entry *tbl_data;
+
+               if (!fm->def_policy) {
+                       sub_policy = get_meter_sub_policy(dev, flow,
+                                                         fm->policy_id, attr,
+                                                         items, error);
+                       if (!sub_policy)
+                               return -rte_errno;
+               } else {
+                       enum mlx5_meter_domain mtr_domain =
+                       attr->transfer ? MLX5_MTR_DOMAIN_TRANSFER :
+                               attr->egress ? MLX5_MTR_DOMAIN_EGRESS :
+                                       MLX5_MTR_DOMAIN_INGRESS;
+
+                       sub_policy =
+                       &priv->sh->mtrmng->def_policy[mtr_domain]->sub_policy;
+               }
+               tbl_data = container_of(sub_policy->tbl_rsc,
+                                       struct mlx5_flow_tbl_data_entry, tbl);
+               hw_mtr_action = actions_pre++;
+               hw_mtr_action->type = (enum rte_flow_action_type)
+                                     MLX5_RTE_FLOW_ACTION_TYPE_JUMP;
+               hw_mtr_action->conf = tbl_data->jump.action;
+       }
        actions_pre->type = RTE_FLOW_ACTION_TYPE_END;
        actions_pre++;
-       mlx5_ipool_malloc(fm->flow_ipool, &tag_id);
-       if (!tag_id)
+       if (!tag_action)
                return rte_flow_error_set(error, ENOMEM,
-                               RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
-                               "Failed to allocate meter flow id.");
-       flow_id = tag_id - 1;
-       flow_id_bits = MLX5_REG_BITS - __builtin_clz(flow_id);
-       flow_id_bits = flow_id_bits ? flow_id_bits : 1;
-       if ((flow_id_bits + priv->max_mtr_bits) > mtr_reg_bits) {
-               mlx5_ipool_free(fm->flow_ipool, tag_id);
-               return rte_flow_error_set(error, EINVAL,
-                               RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
-                               "Meter flow id exceeds max limit.");
+                                       RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
+                                       "No tag action space.");
+       if (!mtr_flow_id) {
+               tag_action->type = RTE_FLOW_ACTION_TYPE_VOID;
+               goto exit;
+       }
+       /* Only default-policy Meter creates mtr flow id. */
+       if (fm->def_policy) {
+               mlx5_ipool_malloc(fm->flow_ipool, &tag_id);
+               if (!tag_id)
+                       return rte_flow_error_set(error, ENOMEM,
+                                       RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
+                                       "Failed to allocate meter flow id.");
+               flow_id = tag_id - 1;
+               flow_id_bits = MLX5_REG_BITS - __builtin_clz(flow_id);
+               flow_id_bits = flow_id_bits ? flow_id_bits : 1;
+               if ((flow_id_bits + priv->sh->mtrmng->max_mtr_bits) >
+                   mtr_reg_bits) {
+                       mlx5_ipool_free(fm->flow_ipool, tag_id);
+                       return rte_flow_error_set(error, EINVAL,
+                                       RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
+                                       "Meter flow id exceeds max limit.");
+               }
+               if (flow_id_bits > priv->sh->mtrmng->max_mtr_flow_bits)
+                       priv->sh->mtrmng->max_mtr_flow_bits = flow_id_bits;
        }
-       if (flow_id_bits > priv->max_mtr_flow_bits)
-               priv->max_mtr_flow_bits = flow_id_bits;
        /* Prepare the suffix subflow items. */
        tag_item = sfx_items++;
        for (; items->type != RTE_FLOW_ITEM_TYPE_END; items++) {
@@ -4494,7 +4783,6 @@ flow_meter_split_prep(struct rte_eth_dev *dev,
        sfx_items->type = RTE_FLOW_ITEM_TYPE_END;
        sfx_items++;
        /* Build tag actions and items for meter_id/meter flow_id. */
-       assert(tag_action);
        set_tag = (struct mlx5_rte_flow_action_set_tag *)actions_pre;
        tag_item_spec = (struct mlx5_rte_flow_item_tag *)sfx_items;
        tag_item_mask = tag_item_spec + 1;
@@ -4504,7 +4792,7 @@ flow_meter_split_prep(struct rte_eth_dev *dev,
                                                            0, error),
                .offset = mtr_id_offset,
                .length = mtr_reg_bits,
-               .data = fm->idx,
+               .data = flow->meter,
        };
        /*
         * The color Reg bits used by flow_id are growing from
@@ -4512,8 +4800,9 @@ flow_meter_split_prep(struct rte_eth_dev *dev,
         */
        for (shift = 0; shift < flow_id_bits; shift++)
                flow_id_reversed = (flow_id_reversed << 1) |
-                             ((flow_id >> shift) & 0x1);
-       set_tag->data |= flow_id_reversed << (mtr_reg_bits - flow_id_bits);
+                               ((flow_id >> shift) & 0x1);
+       set_tag->data |=
+               flow_id_reversed << (mtr_reg_bits - flow_id_bits);
        tag_item_spec->id = set_tag->id;
        tag_item_spec->data = set_tag->data << mtr_id_offset;
        tag_item_mask->data = UINT32_MAX << mtr_id_offset;
@@ -4525,7 +4814,10 @@ flow_meter_split_prep(struct rte_eth_dev *dev,
        tag_item->spec = tag_item_spec;
        tag_item->last = NULL;
        tag_item->mask = tag_item_mask;
-       return tag_id;
+exit:
+       if (mtr_flow_id)
+               *mtr_flow_id = tag_id;
+       return 0;
 }
 
 /**
@@ -5048,8 +5340,8 @@ flow_create_split_metadata(struct rte_eth_dev *dev,
        if (qrss) {
                /* Check if it is in meter suffix table. */
                mtr_sfx = attr->group == (attr->transfer ?
-                         (MLX5_FLOW_TABLE_LEVEL_SUFFIX - 1) :
-                         MLX5_FLOW_TABLE_LEVEL_SUFFIX);
+                         (MLX5_FLOW_TABLE_LEVEL_METER - 1) :
+                         MLX5_FLOW_TABLE_LEVEL_METER);
                /*
                 * Q/RSS action on NIC Rx should be split in order to pass by
                 * the mreg copy table (RX_CP_TBL) and then it jumps to the
@@ -5197,6 +5489,57 @@ exit:
        return ret;
 }
 
+/**
+ * Create meter internal drop flow with the original pattern.
+ *
+ * @param dev
+ *   Pointer to Ethernet device.
+ * @param[in] flow
+ *   Parent flow structure pointer.
+ * @param[in] attr
+ *   Flow rule attributes.
+ * @param[in] items
+ *   Pattern specification (list terminated by the END pattern item).
+ * @param[in] flow_split_info
+ *   Pointer to flow split info structure.
+ * @param[in] fm
+ *   Pointer to flow meter structure.
+ * @param[out] error
+ *   Perform verbose error reporting if not NULL.
+ * @return
+ *   0 on success, negative value otherwise
+ */
+static uint32_t
+flow_meter_create_drop_flow_with_org_pattern(struct rte_eth_dev *dev,
+                       struct rte_flow *flow,
+                       const struct rte_flow_attr *attr,
+                       const struct rte_flow_item items[],
+                       struct mlx5_flow_split_info *flow_split_info,
+                       struct mlx5_flow_meter_info *fm,
+                       struct rte_flow_error *error)
+{
+       struct mlx5_flow *dev_flow = NULL;
+       struct rte_flow_attr drop_attr = *attr;
+       struct rte_flow_action drop_actions[3];
+       struct mlx5_flow_split_info drop_split_info = *flow_split_info;
+
+       MLX5_ASSERT(fm->drop_cnt);
+       drop_actions[0].type =
+               (enum rte_flow_action_type)MLX5_RTE_FLOW_ACTION_TYPE_COUNT;
+       drop_actions[0].conf = (void *)(uintptr_t)fm->drop_cnt;
+       drop_actions[1].type = RTE_FLOW_ACTION_TYPE_DROP;
+       drop_actions[1].conf = NULL;
+       drop_actions[2].type = RTE_FLOW_ACTION_TYPE_END;
+       drop_actions[2].conf = NULL;
+       drop_split_info.external = false;
+       drop_split_info.skip_scale |= 1 << MLX5_SCALE_FLOW_GROUP_BIT;
+       drop_split_info.table_id = MLX5_MTR_TABLE_ID_DROP;
+       drop_attr.group = MLX5_FLOW_TABLE_LEVEL_METER;
+       return flow_create_split_inner(dev, flow, &dev_flow,
+                               &drop_attr, items, drop_actions,
+                               &drop_split_info, error);
+}
+
 /**
  * The splitting for meter feature.
  *
@@ -5240,28 +5583,31 @@ flow_create_split_meter(struct rte_eth_dev *dev,
        struct rte_flow_item *sfx_items = NULL;
        struct mlx5_flow *dev_flow = NULL;
        struct rte_flow_attr sfx_attr = *attr;
-       struct mlx5_flow_meter *fm = NULL;
+       struct mlx5_flow_meter_info *fm = NULL;
+       uint8_t skip_scale_restore;
        bool has_mtr = false;
-       uint32_t meter_id;
-       uint32_t mtr_tag_id = 0;
+       bool has_modify = false;
+       bool set_mtr_reg = true;
+       uint32_t meter_id = 0;
+       uint32_t mtr_idx = 0;
+       uint32_t mtr_flow_id = 0;
        size_t act_size;
        size_t item_size;
        int actions_n = 0;
        int ret = 0;
 
        if (priv->mtr_en)
-               actions_n = flow_check_meter_action(actions, &has_mtr,
-                                                   &meter_id);
+               actions_n = flow_check_meter_action(dev, actions, &has_mtr,
+                                                   &has_modify, &meter_id);
        if (has_mtr) {
                if (flow->meter) {
-                       fm = mlx5_ipool_get(priv->sh->ipool[MLX5_IPOOL_MTR],
-                                           flow->meter);
+                       fm = flow_dv_meter_find_by_idx(priv, flow->meter);
                        if (!fm)
                                return rte_flow_error_set(error, EINVAL,
                                                RTE_FLOW_ERROR_TYPE_UNSPECIFIED,
                                                NULL, "Meter not found.");
                } else {
-                       fm = mlx5_flow_meter_find(priv, meter_id);
+                       fm = mlx5_flow_meter_find(priv, meter_id, &mtr_idx);
                        if (!fm)
                                return rte_flow_error_set(error, EINVAL,
                                                RTE_FLOW_ERROR_TYPE_UNSPECIFIED,
@@ -5270,13 +5616,23 @@ flow_create_split_meter(struct rte_eth_dev *dev,
                                                     &sfx_attr, error);
                        if (ret)
                                return -rte_errno;
-                       flow->meter = fm->idx;
+                       flow->meter = mtr_idx;
                }
+               MLX5_ASSERT(wks);
                wks->fm = fm;
-               /* The prefix actions: meter, decap, encap, tag, end. */
-               act_size = sizeof(struct rte_flow_action) * (actions_n + 5) +
+               /*
+                * If it isn't default-policy Meter, and
+                * 1. There's no action in flow to change
+                *    packet (modify/encap/decap etc.), OR
+                * 2. No drop count needed for this meter.
+                * no need to use regC to save meter id anymore.
+                */
+               if (!fm->def_policy && (!has_modify || !fm->drop_cnt))
+                       set_mtr_reg = false;
+               /* Prefix actions: meter, decap, encap, tag, jump, end. */
+               act_size = sizeof(struct rte_flow_action) * (actions_n + 6) +
                           sizeof(struct mlx5_rte_flow_action_set_tag);
-               /* The suffix items: tag, vlan, port id, end. */
+               /* Suffix items: tag, vlan, port id, end. */
 #define METER_SUFFIX_ITEM 4
                item_size = sizeof(struct rte_flow_item) * METER_SUFFIX_ITEM +
                            sizeof(struct mlx5_rte_flow_item_tag) * 2;
@@ -5289,33 +5645,56 @@ flow_create_split_meter(struct rte_eth_dev *dev,
                                                  "meter flow");
                sfx_items = (struct rte_flow_item *)((char *)sfx_actions +
                             act_size);
-               pre_actions = sfx_actions + actions_n;
-               mtr_tag_id = flow_meter_split_prep(dev, fm, items, sfx_items,
-                                                  actions, sfx_actions,
-                                                  pre_actions, error);
-               if (!mtr_tag_id) {
+               /* There's no suffix flow for meter of non-default policy. */
+               if (!fm->def_policy)
+                       pre_actions = sfx_actions + 1;
+               else
+                       pre_actions = sfx_actions + actions_n;
+               ret = flow_meter_split_prep(dev, flow, fm, &sfx_attr,
+                                           items, sfx_items, actions,
+                                           sfx_actions, pre_actions,
+                                           (set_mtr_reg ? &mtr_flow_id : NULL),
+                                           error);
+               if (ret) {
                        ret = -rte_errno;
                        goto exit;
                }
                /* Add the prefix subflow. */
                flow_split_info->prefix_mark = 0;
+               skip_scale_restore = flow_split_info->skip_scale;
+               flow_split_info->skip_scale |=
+                       1 << MLX5_SCALE_JUMP_FLOW_GROUP_BIT;
                ret = flow_create_split_inner(dev, flow, &dev_flow,
                                              attr, items, pre_actions,
                                              flow_split_info, error);
+               flow_split_info->skip_scale = skip_scale_restore;
                if (ret) {
-                       mlx5_ipool_free(fm->flow_ipool, mtr_tag_id);
+                       if (mtr_flow_id)
+                               mlx5_ipool_free(fm->flow_ipool, mtr_flow_id);
                        ret = -rte_errno;
                        goto exit;
                }
-               dev_flow->handle->split_flow_id = mtr_tag_id;
-               dev_flow->handle->is_meter_flow_id = 1;
+               if (mtr_flow_id) {
+                       dev_flow->handle->split_flow_id = mtr_flow_id;
+                       dev_flow->handle->is_meter_flow_id = 1;
+               }
+               if (!fm->def_policy) {
+                       if (!set_mtr_reg && fm->drop_cnt)
+                               ret =
+                       flow_meter_create_drop_flow_with_org_pattern(dev, flow,
+                                                       &sfx_attr, items,
+                                                       flow_split_info,
+                                                       fm, error);
+                       goto exit;
+               }
                /* Setting the sfx group atrr. */
                sfx_attr.group = sfx_attr.transfer ?
-                               (MLX5_FLOW_TABLE_LEVEL_SUFFIX - 1) :
-                                MLX5_FLOW_TABLE_LEVEL_SUFFIX;
+                               (MLX5_FLOW_TABLE_LEVEL_METER - 1) :
+                                MLX5_FLOW_TABLE_LEVEL_METER;
                flow_split_info->prefix_layers =
                                flow_get_prefix_layer_flags(dev_flow);
                flow_split_info->prefix_mark = dev_flow->handle->mark;
+               flow_split_info->table_id = MLX5_MTR_TABLE_ID_SUFFIX;
        }
        /* Add the prefix subflow. */
        ret = flow_create_split_metadata(dev, flow,
@@ -5459,8 +5838,7 @@ flow_create_split_sample(struct rte_eth_dev *dev,
                                                struct mlx5_flow_tbl_data_entry,
                                                tbl);
                        sfx_attr.group = sfx_attr.transfer ?
-                                               (sfx_tbl_data->table_id - 1) :
-                                               sfx_tbl_data->table_id;
+                       (sfx_tbl_data->level - 1) : sfx_tbl_data->level;
                } else {
                        MLX5_ASSERT(attr->transfer);
                        sfx_attr.group = jump_table;
@@ -5660,7 +6038,8 @@ flow_list_create(struct rte_eth_dev *dev, uint32_t *list,
                .skip_scale = 0,
                .flow_idx = 0,
                .prefix_mark = 0,
-               .prefix_layers = 0
+               .prefix_layers = 0,
+               .table_id = 0
        };
        int ret;
 
@@ -5703,7 +6082,7 @@ flow_list_create(struct rte_eth_dev *dev, uint32_t *list,
        memset(rss_desc, 0, offsetof(struct mlx5_flow_rss_desc, queue));
        /* RSS Action only works on NIC RX domain */
        if (attr->ingress && !attr->transfer)
-               rss = flow_get_rss_action(p_actions_rx);
+               rss = flow_get_rss_action(dev, p_actions_rx);
        if (rss) {
                if (flow_rss_workspace_adjust(wks, rss_desc, rss->queue_num))
                        return 0;
@@ -6576,21 +6955,42 @@ mlx5_flow_ops_get(struct rte_eth_dev *dev __rte_unused,
 }
 
 /**
- * Create the needed meter and suffix tables.
+ * Validate meter policy actions.
+ * Dispatcher for action type specific validation.
  *
  * @param[in] dev
- *   Pointer to Ethernet device.
+ *   Pointer to the Ethernet device structure.
+ * @param[in] action
+ *   The meter policy action object to validate.
+ * @param[in] attr
+ *   Attributes of flow to determine steering domain.
+ * @param[out] is_rss
+ *   Is RSS or not.
+ * @param[out] domain_bitmap
+ *   Domain bitmap.
+ * @param[out] is_def_policy
+ *   Is default policy or not.
+ * @param[out] error
+ *   Perform verbose error reporting if not NULL. Initialized in case of
+ *   error only.
  *
  * @return
- *   Pointer to table set on success, NULL otherwise.
+ *   0 on success, otherwise negative errno value.
  */
-struct mlx5_meter_domains_infos *
-mlx5_flow_create_mtr_tbls(struct rte_eth_dev *dev)
+int
+mlx5_flow_validate_mtr_acts(struct rte_eth_dev *dev,
+                       const struct rte_flow_action *actions[RTE_COLORS],
+                       struct rte_flow_attr *attr,
+                       bool *is_rss,
+                       uint8_t *domain_bitmap,
+                       bool *is_def_policy,
+                       struct rte_mtr_error *error)
 {
        const struct mlx5_flow_driver_ops *fops;
 
        fops = flow_get_drv_ops(MLX5_FLOW_TYPE_DV);
-       return fops->create_mtr_tbls(dev);
+       return fops->validate_mtr_acts(dev, actions, attr,
+                       is_rss, domain_bitmap, is_def_policy, error);
 }
 
 /**
@@ -6598,66 +6998,215 @@ mlx5_flow_create_mtr_tbls(struct rte_eth_dev *dev)
  *
  * @param[in] dev
  *   Pointer to Ethernet device.
- * @param[in] tbl
- *   Pointer to the meter table set.
+ * @param[in] mtr_policy
+ *   Meter policy struct.
+ */
+void
+mlx5_flow_destroy_mtr_acts(struct rte_eth_dev *dev,
+                     struct mlx5_flow_meter_policy *mtr_policy)
+{
+       const struct mlx5_flow_driver_ops *fops;
+
+       fops = flow_get_drv_ops(MLX5_FLOW_TYPE_DV);
+       fops->destroy_mtr_acts(dev, mtr_policy);
+}
+
+/**
+ * Create policy action, lock free,
+ * (mutex should be acquired by caller).
+ * Dispatcher for action type specific call.
+ *
+ * @param[in] dev
+ *   Pointer to the Ethernet device structure.
+ * @param[in] mtr_policy
+ *   Meter policy struct.
+ * @param[in] action
+ *   Action specification used to create meter actions.
+ * @param[out] error
+ *   Perform verbose error reporting if not NULL. Initialized in case of
+ *   error only.
  *
  * @return
- *   0 on success.
+ *   0 on success, otherwise negative errno value.
  */
 int
-mlx5_flow_destroy_mtr_tbls(struct rte_eth_dev *dev,
-                          struct mlx5_meter_domains_infos *tbls)
+mlx5_flow_create_mtr_acts(struct rte_eth_dev *dev,
+                     struct mlx5_flow_meter_policy *mtr_policy,
+                     const struct rte_flow_action *actions[RTE_COLORS],
+                     struct rte_mtr_error *error)
+{
+       const struct mlx5_flow_driver_ops *fops;
+
+       fops = flow_get_drv_ops(MLX5_FLOW_TYPE_DV);
+       return fops->create_mtr_acts(dev, mtr_policy, actions, error);
+}
+
+/**
+ * Create policy rules, lock free,
+ * (mutex should be acquired by caller).
+ * Dispatcher for action type specific call.
+ *
+ * @param[in] dev
+ *   Pointer to the Ethernet device structure.
+ * @param[in] mtr_policy
+ *   Meter policy struct.
+ *
+ * @return
+ *   0 on success, -1 otherwise.
+ */
+int
+mlx5_flow_create_policy_rules(struct rte_eth_dev *dev,
+                            struct mlx5_flow_meter_policy *mtr_policy)
+{
+       const struct mlx5_flow_driver_ops *fops;
+
+       fops = flow_get_drv_ops(MLX5_FLOW_TYPE_DV);
+       return fops->create_policy_rules(dev, mtr_policy);
+}
+
+/**
+ * Destroy policy rules, lock free,
+ * (mutex should be acquired by caller).
+ * Dispatcher for action type specific call.
+ *
+ * @param[in] dev
+ *   Pointer to the Ethernet device structure.
+ * @param[in] mtr_policy
+ *   Meter policy struct.
+ */
+void
+mlx5_flow_destroy_policy_rules(struct rte_eth_dev *dev,
+                            struct mlx5_flow_meter_policy *mtr_policy)
 {
        const struct mlx5_flow_driver_ops *fops;
 
        fops = flow_get_drv_ops(MLX5_FLOW_TYPE_DV);
-       return fops->destroy_mtr_tbls(dev, tbls);
+       fops->destroy_policy_rules(dev, mtr_policy);
 }
 
 /**
- * Prepare policer rules.
+ * Destroy the default policy table set.
+ *
+ * @param[in] dev
+ *   Pointer to Ethernet device.
+ */
+void
+mlx5_flow_destroy_def_policy(struct rte_eth_dev *dev)
+{
+       const struct mlx5_flow_driver_ops *fops;
+
+       fops = flow_get_drv_ops(MLX5_FLOW_TYPE_DV);
+       fops->destroy_def_policy(dev);
+}
+
+/**
+ * Destroy the default policy table set.
  *
  * @param[in] dev
  *   Pointer to Ethernet device.
- * @param[in] fm
- *   Pointer to flow meter structure.
- * @param[in] attr
- *   Pointer to flow attributes.
  *
  * @return
  *   0 on success, -1 otherwise.
  */
 int
-mlx5_flow_prepare_policer_rules(struct rte_eth_dev *dev,
-                              struct mlx5_flow_meter *fm,
-                              const struct rte_flow_attr *attr)
+mlx5_flow_create_def_policy(struct rte_eth_dev *dev)
 {
        const struct mlx5_flow_driver_ops *fops;
 
        fops = flow_get_drv_ops(MLX5_FLOW_TYPE_DV);
-       return fops->prepare_policer_rules(dev, fm, attr);
+       return fops->create_def_policy(dev);
 }
 
 /**
- * Destroy policer rules.
+ * Create the needed meter and suffix tables.
  *
- * @param[in] fm
- *   Pointer to flow meter structure.
- * @param[in] attr
- *   Pointer to flow attributes.
+ * @param[in] dev
+ *   Pointer to Ethernet device.
  *
  * @return
  *   0 on success, -1 otherwise.
  */
 int
-mlx5_flow_destroy_policer_rules(struct rte_eth_dev *dev,
-                               struct mlx5_flow_meter *fm,
-                               const struct rte_flow_attr *attr)
+mlx5_flow_create_mtr_tbls(struct rte_eth_dev *dev,
+                       struct mlx5_flow_meter_info *fm,
+                       uint32_t mtr_idx,
+                       uint8_t domain_bitmap)
+{
+       const struct mlx5_flow_driver_ops *fops;
+
+       fops = flow_get_drv_ops(MLX5_FLOW_TYPE_DV);
+       return fops->create_mtr_tbls(dev, fm, mtr_idx, domain_bitmap);
+}
+
+/**
+ * Destroy the meter table set.
+ *
+ * @param[in] dev
+ *   Pointer to Ethernet device.
+ * @param[in] tbl
+ *   Pointer to the meter table set.
+ */
+void
+mlx5_flow_destroy_mtr_tbls(struct rte_eth_dev *dev,
+                          struct mlx5_flow_meter_info *fm)
+{
+       const struct mlx5_flow_driver_ops *fops;
+
+       fops = flow_get_drv_ops(MLX5_FLOW_TYPE_DV);
+       fops->destroy_mtr_tbls(dev, fm);
+}
+
+/**
+ * Destroy the global meter drop table.
+ *
+ * @param[in] dev
+ *   Pointer to Ethernet device.
+ */
+void
+mlx5_flow_destroy_mtr_drop_tbls(struct rte_eth_dev *dev)
+{
+       const struct mlx5_flow_driver_ops *fops;
+
+       fops = flow_get_drv_ops(MLX5_FLOW_TYPE_DV);
+       fops->destroy_mtr_drop_tbls(dev);
+}
+
+/**
+ * Allocate the needed aso flow meter id.
+ *
+ * @param[in] dev
+ *   Pointer to Ethernet device.
+ *
+ * @return
+ *   Index to aso flow meter on success, NULL otherwise.
+ */
+uint32_t
+mlx5_flow_mtr_alloc(struct rte_eth_dev *dev)
+{
+       const struct mlx5_flow_driver_ops *fops;
+
+       fops = flow_get_drv_ops(MLX5_FLOW_TYPE_DV);
+       return fops->create_meter(dev);
+}
+
+/**
+ * Free the aso flow meter id.
+ *
+ * @param[in] dev
+ *   Pointer to Ethernet device.
+ * @param[in] mtr_idx
+ *  Index to aso flow meter to be free.
+ *
+ * @return
+ *   0 on success.
+ */
+void
+mlx5_flow_mtr_free(struct rte_eth_dev *dev, uint32_t mtr_idx)
 {
        const struct mlx5_flow_driver_ops *fops;
 
        fops = flow_get_drv_ops(MLX5_FLOW_TYPE_DV);
-       return fops->destroy_policer_rules(dev, fm, attr);
+       fops->free_meter(dev, mtr_idx);
 }
 
 /**
@@ -7708,10 +8257,12 @@ tunnel_mark_decode(struct rte_eth_dev *dev, uint32_t mark)
        union tunnel_offload_mark mbits = { .val = mark };
        union mlx5_flow_tbl_key table_key = {
                {
-                       .table_id = tunnel_id_to_flow_tbl(mbits.table_id),
+                       .level = tunnel_id_to_flow_tbl(mbits.table_id),
+                       .id = 0,
+                       .reserved = 0,
                        .dummy = 0,
-                       .domain = !!mbits.transfer,
-                       .direction = 0,
+                       .is_fdb = !!mbits.transfer,
+                       .is_egress = 0,
                }
        };
        he = mlx5_hlist_lookup(sh->flow_tbls, table_key.v64, NULL);