net/mlx5: enable DevX Tx queue creation
diff --git a/drivers/net/mlx5/mlx5_flow.c b/drivers/net/mlx5/mlx5_flow.c
index 6cf1bb8..1d493f1 100644
@@ -132,6 +132,12 @@ struct mlx5_flow_expand_rss {
 static void
 mlx5_dbg__print_pattern(const struct rte_flow_item *item);
 
+static const struct mlx5_flow_expand_node *
+mlx5_flow_expand_rss_adjust_node(const struct rte_flow_item *pattern,
+               unsigned int item_idx,
+               const struct mlx5_flow_expand_node graph[],
+               const struct mlx5_flow_expand_node *node);
+
 static bool
 mlx5_flow_is_rss_expandable_item(const struct rte_flow_item *item)
 {
@@ -318,7 +324,7 @@ mlx5_flow_expand_rss(struct mlx5_flow_expand_rss *buf, size_t size,
        const int *stack[MLX5_RSS_EXP_ELT_N];
        int stack_pos = 0;
        struct rte_flow_item flow_items[MLX5_RSS_EXP_ELT_N];
-       unsigned int i;
+       unsigned int i, item_idx, last_expand_item_idx = 0;
        size_t lsize;
        size_t user_pattern_size = 0;
        void *addr = NULL;
@@ -326,7 +332,7 @@ mlx5_flow_expand_rss(struct mlx5_flow_expand_rss *buf, size_t size,
        struct rte_flow_item missed_item;
        int missed = 0;
        int elt = 0;
-       const struct rte_flow_item *last_item = NULL;
+       const struct rte_flow_item *last_expand_item = NULL;
 
        memset(&missed_item, 0, sizeof(missed_item));
        lsize = offsetof(struct mlx5_flow_expand_rss, entry) +
@@ -337,12 +343,15 @@ mlx5_flow_expand_rss(struct mlx5_flow_expand_rss *buf, size_t size,
        buf->entry[0].pattern = (void *)&buf->entry[MLX5_RSS_EXP_ELT_N];
        buf->entries = 0;
        addr = buf->entry[0].pattern;
-       for (item = pattern; item->type != RTE_FLOW_ITEM_TYPE_END; item++) {
+       for (item = pattern, item_idx = 0;
+                       item->type != RTE_FLOW_ITEM_TYPE_END;
+                       item++, item_idx++) {
                if (!mlx5_flow_is_rss_expandable_item(item)) {
                        user_pattern_size += sizeof(*item);
                        continue;
                }
-               last_item = item;
+               last_expand_item = item;
+               last_expand_item_idx = item_idx;
                i = 0;
                while (node->next && node->next[i]) {
                        next = &graph[node->next[i]];
@@ -374,7 +383,7 @@ mlx5_flow_expand_rss(struct mlx5_flow_expand_rss *buf, size_t size,
         * Check if the last valid item has spec set, need complete pattern,
         * and the pattern can be used for expansion.
         */
-       missed_item.type = mlx5_flow_expand_rss_item_complete(last_item);
+       missed_item.type = mlx5_flow_expand_rss_item_complete(last_expand_item);
        if (missed_item.type == RTE_FLOW_ITEM_TYPE_END) {
                /* Item type END indicates expansion is not required. */
                return lsize;
@@ -409,6 +418,9 @@ mlx5_flow_expand_rss(struct mlx5_flow_expand_rss *buf, size_t size,
                        addr = (void *)(((uintptr_t)addr) +
                                        elt * sizeof(*item));
                }
+       } else if (last_expand_item != NULL) {
+               node = mlx5_flow_expand_rss_adjust_node(pattern,
+                               last_expand_item_idx, graph, node);
        }
        memset(flow_items, 0, sizeof(flow_items));
        next_node = mlx5_flow_expand_rss_skip_explicit(graph,
@@ -460,12 +472,22 @@ mlx5_flow_expand_rss(struct mlx5_flow_expand_rss *buf, size_t size,
                        /* Follow up with the next possibility. */
                        next_node = mlx5_flow_expand_rss_skip_explicit(graph,
                                        ++next_node);
+               } else if (!stack_pos) {
+                       /*
+                        * The traversal over the different paths is
+                        * complete: advance next_node to the terminator.
+                        */
+                       ++next_node;
                } else {
                        /* Move to the next path. */
-                       if (stack_pos)
+                       while (stack_pos) {
                                next_node = stack[--stack_pos];
+                               next_node++;
+                               if (*next_node)
+                                       break;
+                       }
                        next_node = mlx5_flow_expand_rss_skip_explicit(graph,
-                                       ++next_node);
+                                       next_node);
                        stack[stack_pos] = next_node;
                }
                node = next_node && *next_node ? &graph[*next_node] : NULL;
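
The reworked backtracking above is the heart of this hunk: the old code popped a single stack level and could resume at a list terminator, ending the expansion early, while the new loop keeps popping until some level still has a sibling to visit, and a dedicated branch advances to the terminator once every path has been emitted. A minimal standalone sketch of the same pattern, using a hypothetical struct node graph rather than the driver's expansion types:

#include <stdio.h>

#define STACK_MAX 8

struct node {
	const char *name;
	const int *next; /* zero-terminated child indices, or NULL for a leaf */
};

/*
 * Visit every node reachable from graph[root] in preorder, using an
 * explicit stack and backtracking past exhausted levels the way the
 * fixed loop does.  Depth is assumed to stay below STACK_MAX and child
 * lists, when present, are assumed non-empty.
 */
static void
walk(const struct node graph[], int root)
{
	const int *stack[STACK_MAX];
	int stack_pos = 0;
	const int *cur = graph[root].next;

	while (cur != NULL && *cur) {
		printf("%s\n", graph[*cur].name);
		if (graph[*cur].next != NULL) {
			/* Descend; remember where to resume on this level. */
			stack[stack_pos++] = cur;
			cur = graph[*cur].next;
		} else if (!stack_pos) {
			/* Leaf on the top level: just advance. */
			cur++;
		} else {
			/* Leaf below: pop until a level still has siblings. */
			while (stack_pos) {
				cur = stack[--stack_pos];
				cur++;
				if (*cur)
					break;
			}
		}
	}
}

With a root whose children are nodes 1 and 2, where node 1 has a single child 3, walk() visits 1, 3, 2 and then stops, instead of terminating after the first branch as the single-pop version would.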
@@ -485,6 +507,8 @@ enum mlx5_expansion {
        MLX5_EXPANSION_OUTER_IPV6_UDP,
        MLX5_EXPANSION_OUTER_IPV6_TCP,
        MLX5_EXPANSION_VXLAN,
+       MLX5_EXPANSION_STD_VXLAN,
+       MLX5_EXPANSION_L3_VXLAN,
        MLX5_EXPANSION_VXLAN_GPE,
        MLX5_EXPANSION_GRE,
        MLX5_EXPANSION_NVGRE,
@@ -581,6 +605,15 @@ static const struct mlx5_flow_expand_node mlx5_support_expansion[] = {
                                                  MLX5_EXPANSION_IPV6),
                .type = RTE_FLOW_ITEM_TYPE_VXLAN,
        },
+       [MLX5_EXPANSION_STD_VXLAN] = {
+               .next = MLX5_FLOW_EXPAND_RSS_NEXT(MLX5_EXPANSION_ETH),
+               .type = RTE_FLOW_ITEM_TYPE_VXLAN,
+       },
+       [MLX5_EXPANSION_L3_VXLAN] = {
+               .next = MLX5_FLOW_EXPAND_RSS_NEXT(MLX5_EXPANSION_IPV4,
+                                                 MLX5_EXPANSION_IPV6),
+               .type = RTE_FLOW_ITEM_TYPE_VXLAN,
+       },
        [MLX5_EXPANSION_VXLAN_GPE] = {
                .next = MLX5_FLOW_EXPAND_RSS_NEXT(MLX5_EXPANSION_ETH,
                                                  MLX5_EXPANSION_IPV4,
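
Together with mlx5_flow_expand_rss_adjust_node() at the end of this patch, the two new nodes split the generic VXLAN expansion: MLX5_EXPANSION_STD_VXLAN expands only to an inner Ethernet header, which is what standard VXLAN (UDP port 4789) carries, while MLX5_EXPANSION_L3_VXLAN expands to inner IPv4/IPv6 for VXLAN on a non-standard UDP port. For example, a pattern like eth / ipv4 / udp / vxlan with the UDP destination port unspecified or equal to 4789 keeps the inner-ETH expansion; the same pattern with udp dst is 4790 would take the L3 variant.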
@@ -970,13 +1003,15 @@ mlx5_get_lowest_priority(struct rte_eth_dev *dev,
  *   Pointer to device flow rule attributes.
  * @param[in] subpriority
  *   The priority based on the items.
+ * @param[in] external
+ *   True if the flow was created by the application; false for
+ *   PMD-internal (control) flows.
  * @return
  *   The matcher priority of the flow.
  */
 uint16_t
 mlx5_get_matcher_priority(struct rte_eth_dev *dev,
                          const struct rte_flow_attr *attr,
-                         uint32_t subpriority)
+                         uint32_t subpriority, bool external)
 {
        uint16_t priority = (uint16_t)attr->priority;
        struct mlx5_priv *priv = dev->data->dev_private;
@@ -985,6 +1020,9 @@ mlx5_get_matcher_priority(struct rte_eth_dev *dev,
                if (attr->priority == MLX5_FLOW_LOWEST_PRIO_INDICATOR)
                        priority = priv->config.flow_prio - 1;
                return mlx5_os_flow_adjust_priority(dev, priority, subpriority);
+       } else if (!external && attr->transfer && attr->group == 0 &&
+                  attr->priority == MLX5_FLOW_LOWEST_PRIO_INDICATOR) {
+               return (priv->config.flow_prio - 1) * 3;
        }
        if (attr->priority == MLX5_FLOW_LOWEST_PRIO_INDICATOR)
                priority = MLX5_NON_ROOT_FLOW_MAX_PRIO;
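
The new else-if branch pins PMD-internal transfer rules on the root table to the lowest priority band; multiplying by 3 presumably leaves room for the per-layer sub-priorities the PMD encodes on top (a reading of the surrounding code, not stated in the patch). A hedged sketch of a call site, assuming MLX5_PRIORITY_MAP_L2 as the subpriority:

/* Internal (control) transfer flow, not created by the application. */
uint16_t prio = mlx5_get_matcher_priority(dev, &attr,
					  MLX5_PRIORITY_MAP_L2,
					  false);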
@@ -6558,6 +6596,80 @@ mlx5_flow_create_esw_table_zero_flow(struct rte_eth_dev *dev)
                                                   actions, false, &error);
 }
 
+/**
+ * Create a dedicated flow rule on e-switch table 1 that matches the ESW
+ * manager vport and the SQ number, and directs all packets to the peer
+ * vport.
+ *
+ * @param dev
+ *   Pointer to Ethernet device.
+ * @param txq
+ *   Tx queue index.
+ *
+ * @return
+ *   Flow ID on success, 0 otherwise and rte_errno is set.
+ */
+uint32_t
+mlx5_flow_create_devx_sq_miss_flow(struct rte_eth_dev *dev, uint32_t txq)
+{
+       struct rte_flow_attr attr = {
+               .group = 0,
+               .priority = MLX5_FLOW_LOWEST_PRIO_INDICATOR,
+               .ingress = 1,
+               .egress = 0,
+               .transfer = 1,
+       };
+       struct rte_flow_item_port_id port_spec = {
+               .id = MLX5_PORT_ESW_MGR,
+       };
+       struct mlx5_rte_flow_item_tx_queue txq_spec = {
+               .queue = txq,
+       };
+       struct rte_flow_item pattern[] = {
+               {
+                       .type = RTE_FLOW_ITEM_TYPE_PORT_ID,
+                       .spec = &port_spec,
+               },
+               {
+                       .type = (enum rte_flow_item_type)
+                               MLX5_RTE_FLOW_ITEM_TYPE_TX_QUEUE,
+                       .spec = &txq_spec,
+               },
+               {
+                       .type = RTE_FLOW_ITEM_TYPE_END,
+               },
+       };
+       struct rte_flow_action_jump jump = {
+               .group = 1,
+       };
+       struct rte_flow_action_port_id port = {
+               .id = dev->data->port_id,
+       };
+       struct rte_flow_action actions[] = {
+               {
+                       .type = RTE_FLOW_ACTION_TYPE_JUMP,
+                       .conf = &jump,
+               },
+               {
+                       .type = RTE_FLOW_ACTION_TYPE_END,
+               },
+       };
+       struct rte_flow_error error;
+
+       /*
+        * Create the group 0, highest-priority jump flow.
+        * It matches on the Tx queue, so kernel packets bypass it.
+        */
+       if (flow_list_create(dev, MLX5_FLOW_TYPE_CTL, &attr, pattern, actions,
+                            false, &error) == 0)
+               return 0;
+       /* Create group 1, lowest priority redirect flow for txq. */
+       attr.group = 1;
+       actions[0].conf = &port;
+       actions[0].type = RTE_FLOW_ACTION_TYPE_PORT_ID;
+       return flow_list_create(dev, MLX5_FLOW_TYPE_CTL, &attr, pattern,
+                               actions, false, &error);
+}
+
 /**
  * Validate a flow supported by the NIC.
  *
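
A hedged sketch of the intended call pattern for the function above — one SQ-miss rule per Tx queue when a port starts with E-Switch enabled (the loop shape and error handling are assumed here, not copied from the tree):

uint32_t i;

for (i = 0; i != priv->txqs_n; ++i) {
	if (!mlx5_flow_create_devx_sq_miss_flow(dev, i)) {
		DRV_LOG(ERR, "port %u SQ miss flow for Tx queue %u failed",
			dev->data->port_id, i);
		return -rte_errno;
	}
}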
@@ -7618,7 +7730,7 @@ mlx5_flow_create_counter_stat_mem_mng(struct mlx5_dev_ctx_shared *sh)
        }
        mem_mng = (struct mlx5_counter_stats_mem_mng *)(mem + size) - 1;
        size = sizeof(*raw_data) * MLX5_COUNTERS_PER_POOL * raws_n;
-       mem_mng->umem = mlx5_os_umem_reg(sh->ctx, mem, size,
+       mem_mng->umem = mlx5_os_umem_reg(sh->cdev->ctx, mem, size,
                                                 IBV_ACCESS_LOCAL_WRITE);
        if (!mem_mng->umem) {
                rte_errno = errno;
@@ -7629,10 +7741,10 @@ mlx5_flow_create_counter_stat_mem_mng(struct mlx5_dev_ctx_shared *sh)
        mkey_attr.addr = (uintptr_t)mem;
        mkey_attr.size = size;
        mkey_attr.umem_id = mlx5_os_get_umem_id(mem_mng->umem);
-       mkey_attr.pd = sh->pdn;
+       mkey_attr.pd = sh->cdev->pdn;
        mkey_attr.relaxed_ordering_write = sh->cmng.relaxed_ordering_write;
        mkey_attr.relaxed_ordering_read = sh->cmng.relaxed_ordering_read;
-       mem_mng->dm = mlx5_devx_cmd_mkey_create(sh->ctx, &mkey_attr);
+       mem_mng->dm = mlx5_devx_cmd_mkey_create(sh->cdev->ctx, &mkey_attr);
        if (!mem_mng->dm) {
                mlx5_os_umem_dereg(mem_mng->umem);
                rte_errno = errno;
@@ -9113,6 +9225,9 @@ mlx5_flow_tunnel_validate(struct rte_eth_dev *dev,
                err_msg = "unsupported tunnel type";
                goto out;
        case RTE_FLOW_ITEM_TYPE_VXLAN:
+       case RTE_FLOW_ITEM_TYPE_GRE:
+       case RTE_FLOW_ITEM_TYPE_NVGRE:
+       case RTE_FLOW_ITEM_TYPE_GENEVE:
                break;
        }
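
With this change the tunnel-offload validation accepts GRE, NVGRE, and GENEVE in addition to VXLAN. A hedged sketch of what now passes, using the generic rte_flow tunnel-offload API (port_id is assumed to be in scope; error handling trimmed):

struct rte_flow_tunnel tunnel = {
	.type = RTE_FLOW_ITEM_TYPE_GRE, /* previously rejected */
};
struct rte_flow_action *pmd_actions;
uint32_t num_of_actions;
struct rte_flow_error error;

if (rte_flow_tunnel_decap_set(port_id, &tunnel, &pmd_actions,
			      &num_of_actions, &error))
	return -1;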
 
@@ -9406,3 +9521,41 @@ mlx5_dbg__print_pattern(const struct rte_flow_item *item)
        }
        printf("END\n");
 }
+
+static int
+mlx5_flow_is_std_vxlan_port(const struct rte_flow_item *udp_item)
+{
+       const struct rte_flow_item_udp *spec = udp_item->spec;
+       const struct rte_flow_item_udp *mask = udp_item->mask;
+       uint16_t udp_dport = 0;
+
+       if (spec != NULL) {
+               if (!mask)
+                       mask = &rte_flow_item_udp_mask;
+               udp_dport = rte_be_to_cpu_16(spec->hdr.dst_port &
+                               mask->hdr.dst_port);
+       }
+       return (!udp_dport || udp_dport == MLX5_UDP_PORT_VXLAN);
+}
+
+static const struct mlx5_flow_expand_node *
+mlx5_flow_expand_rss_adjust_node(const struct rte_flow_item *pattern,
+               unsigned int item_idx,
+               const struct mlx5_flow_expand_node graph[],
+               const struct mlx5_flow_expand_node *node)
+{
+       const struct rte_flow_item *item = pattern + item_idx, *prev_item;
+       switch (item->type) {
+       case RTE_FLOW_ITEM_TYPE_VXLAN:
+               MLX5_ASSERT(item_idx > 0);
+               prev_item = pattern + item_idx - 1;
+               MLX5_ASSERT(prev_item->type == RTE_FLOW_ITEM_TYPE_UDP);
+               if (mlx5_flow_is_std_vxlan_port(prev_item))
+                       return &graph[MLX5_EXPANSION_STD_VXLAN];
+               else
+                       return &graph[MLX5_EXPANSION_L3_VXLAN];
+       default:
+               return node;
+       }
+}
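
Tying the two helpers together, here is a hedged example (values assumed) of the UDP item that precedes the VXLAN item and drives the node choice:

struct rte_flow_item_udp udp_spec = {
	.hdr = { .dst_port = RTE_BE16(MLX5_UDP_PORT_VXLAN) }, /* 4789 */
};
struct rte_flow_item udp_item = {
	.type = RTE_FLOW_ITEM_TYPE_UDP,
	.spec = &udp_spec,
	.mask = NULL, /* falls back to rte_flow_item_udp_mask, which
		       * covers dst_port */
};
/*
 * mlx5_flow_is_std_vxlan_port(&udp_item) != 0 here, so the standard
 * inner-ETH expansion node is chosen.  With dst_port = RTE_BE16(4790)
 * it would return 0 and the L3 (inner IPv4/IPv6) node would be used.
 * A UDP item with no spec at all also counts as standard VXLAN.
 */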