1 /* SPDX-License-Identifier: BSD-3-Clause
3 * Copyright (c) 2017-2018 Solarflare Communications Inc.
6 * This software was jointly developed between OKTET Labs (under contract
7 * for Solarflare) and Solarflare Communications, Inc.
10 #include <rte_byteorder.h>
11 #include <rte_tailq.h>
12 #include <rte_common.h>
13 #include <rte_ethdev_driver.h>
14 #include <rte_eth_ctrl.h>
15 #include <rte_ether.h>
17 #include <rte_flow_driver.h>
23 #include "sfc_filter.h"
28 * At now flow API is implemented in such a manner that each
29 * flow rule is converted to one or more hardware filters.
30 * All elements of flow rule (attributes, pattern items, actions)
31 * correspond to one or more fields in the efx_filter_spec_s structure
32 * that is responsible for the hardware filter.
33 * If some required field is unset in the flow rule, then a handful
34 * of filter copies will be created to cover all possible values
38 enum sfc_flow_item_layers {
39 SFC_FLOW_ITEM_ANY_LAYER,
40 SFC_FLOW_ITEM_START_LAYER,
46 typedef int (sfc_flow_item_parse)(const struct rte_flow_item *item,
47 efx_filter_spec_t *spec,
48 struct rte_flow_error *error);
50 struct sfc_flow_item {
51 enum rte_flow_item_type type; /* Type of item */
52 enum sfc_flow_item_layers layer; /* Layer of item */
53 enum sfc_flow_item_layers prev_layer; /* Previous layer of item */
54 sfc_flow_item_parse *parse; /* Parsing function */
57 static sfc_flow_item_parse sfc_flow_parse_void;
58 static sfc_flow_item_parse sfc_flow_parse_eth;
59 static sfc_flow_item_parse sfc_flow_parse_vlan;
60 static sfc_flow_item_parse sfc_flow_parse_ipv4;
61 static sfc_flow_item_parse sfc_flow_parse_ipv6;
62 static sfc_flow_item_parse sfc_flow_parse_tcp;
63 static sfc_flow_item_parse sfc_flow_parse_udp;
64 static sfc_flow_item_parse sfc_flow_parse_vxlan;
65 static sfc_flow_item_parse sfc_flow_parse_geneve;
66 static sfc_flow_item_parse sfc_flow_parse_nvgre;
68 typedef int (sfc_flow_spec_set_vals)(struct sfc_flow_spec *spec,
69 unsigned int filters_count_for_one_val,
70 struct rte_flow_error *error);
72 typedef boolean_t (sfc_flow_spec_check)(efx_filter_match_flags_t match,
73 efx_filter_spec_t *spec,
74 struct sfc_filter *filter);
76 struct sfc_flow_copy_flag {
77 /* EFX filter specification match flag */
78 efx_filter_match_flags_t flag;
79 /* Number of values of corresponding field */
80 unsigned int vals_count;
81 /* Function to set values in specifications */
82 sfc_flow_spec_set_vals *set_vals;
84 * Function to check that the specification is suitable
85 * for adding this match flag
87 sfc_flow_spec_check *spec_check;
90 static sfc_flow_spec_set_vals sfc_flow_set_unknown_dst_flags;
91 static sfc_flow_spec_check sfc_flow_check_unknown_dst_flags;
92 static sfc_flow_spec_set_vals sfc_flow_set_ethertypes;
93 static sfc_flow_spec_set_vals sfc_flow_set_ifrm_unknown_dst_flags;
94 static sfc_flow_spec_check sfc_flow_check_ifrm_unknown_dst_flags;
97 sfc_flow_is_zero(const uint8_t *buf, unsigned int size)
102 for (i = 0; i < size; i++)
105 return (sum == 0) ? B_TRUE : B_FALSE;
109 * Validate item and prepare structures spec and mask for parsing
112 sfc_flow_parse_init(const struct rte_flow_item *item,
113 const void **spec_ptr,
114 const void **mask_ptr,
115 const void *supp_mask,
116 const void *def_mask,
118 struct rte_flow_error *error)
128 rte_flow_error_set(error, EINVAL,
129 RTE_FLOW_ERROR_TYPE_ITEM, NULL,
134 if ((item->last != NULL || item->mask != NULL) && item->spec == NULL) {
135 rte_flow_error_set(error, EINVAL,
136 RTE_FLOW_ERROR_TYPE_ITEM, item,
137 "Mask or last is set without spec");
142 * If "mask" is not set, default mask is used,
143 * but if default mask is NULL, "mask" should be set
145 if (item->mask == NULL) {
146 if (def_mask == NULL) {
147 rte_flow_error_set(error, EINVAL,
148 RTE_FLOW_ERROR_TYPE_ITEM, NULL,
149 "Mask should be specified");
165 * If field values in "last" are either 0 or equal to the corresponding
166 * values in "spec" then they are ignored
169 !sfc_flow_is_zero(last, size) &&
170 memcmp(last, spec, size) != 0) {
171 rte_flow_error_set(error, ENOTSUP,
172 RTE_FLOW_ERROR_TYPE_ITEM, item,
173 "Ranging is not supported");
177 if (supp_mask == NULL) {
178 rte_flow_error_set(error, EINVAL,
179 RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
180 "Supported mask for item should be specified");
184 /* Check that mask and spec not asks for more match than supp_mask */
185 for (i = 0; i < size; i++) {
186 match = spec[i] | mask[i];
187 supp = ((const uint8_t *)supp_mask)[i];
189 if ((match | supp) != supp) {
190 rte_flow_error_set(error, ENOTSUP,
191 RTE_FLOW_ERROR_TYPE_ITEM, item,
192 "Item's field is not supported");
205 * Masking is not supported, so masks in items should be either
206 * full or empty (zeroed) and set only for supported fields which
207 * are specified in the supp_mask.
211 sfc_flow_parse_void(__rte_unused const struct rte_flow_item *item,
212 __rte_unused efx_filter_spec_t *efx_spec,
213 __rte_unused struct rte_flow_error *error)
219 * Convert Ethernet item to EFX filter specification.
222 * Item specification. Outer frame specification may only comprise
223 * source/destination addresses and Ethertype field.
224 * Inner frame specification may contain destination address only.
225 * There is support for individual/group mask as well as for empty and full.
226 * If the mask is NULL, default mask will be used. Ranging is not supported.
227 * @param efx_spec[in, out]
228 * EFX filter specification to update.
230 * Perform verbose error reporting if not NULL.
233 sfc_flow_parse_eth(const struct rte_flow_item *item,
234 efx_filter_spec_t *efx_spec,
235 struct rte_flow_error *error)
238 const struct rte_flow_item_eth *spec = NULL;
239 const struct rte_flow_item_eth *mask = NULL;
240 const struct rte_flow_item_eth supp_mask = {
241 .dst.addr_bytes = { 0xff, 0xff, 0xff, 0xff, 0xff, 0xff },
242 .src.addr_bytes = { 0xff, 0xff, 0xff, 0xff, 0xff, 0xff },
245 const struct rte_flow_item_eth ifrm_supp_mask = {
246 .dst.addr_bytes = { 0xff, 0xff, 0xff, 0xff, 0xff, 0xff },
248 const uint8_t ig_mask[EFX_MAC_ADDR_LEN] = {
249 0x01, 0x00, 0x00, 0x00, 0x00, 0x00
251 const struct rte_flow_item_eth *supp_mask_p;
252 const struct rte_flow_item_eth *def_mask_p;
253 uint8_t *loc_mac = NULL;
254 boolean_t is_ifrm = (efx_spec->efs_encap_type !=
255 EFX_TUNNEL_PROTOCOL_NONE);
258 supp_mask_p = &ifrm_supp_mask;
259 def_mask_p = &ifrm_supp_mask;
260 loc_mac = efx_spec->efs_ifrm_loc_mac;
262 supp_mask_p = &supp_mask;
263 def_mask_p = &rte_flow_item_eth_mask;
264 loc_mac = efx_spec->efs_loc_mac;
267 rc = sfc_flow_parse_init(item,
268 (const void **)&spec,
269 (const void **)&mask,
270 supp_mask_p, def_mask_p,
271 sizeof(struct rte_flow_item_eth),
276 /* If "spec" is not set, could be any Ethernet */
280 if (is_same_ether_addr(&mask->dst, &supp_mask.dst)) {
281 efx_spec->efs_match_flags |= is_ifrm ?
282 EFX_FILTER_MATCH_IFRM_LOC_MAC :
283 EFX_FILTER_MATCH_LOC_MAC;
284 rte_memcpy(loc_mac, spec->dst.addr_bytes,
286 } else if (memcmp(mask->dst.addr_bytes, ig_mask,
287 EFX_MAC_ADDR_LEN) == 0) {
288 if (is_unicast_ether_addr(&spec->dst))
289 efx_spec->efs_match_flags |= is_ifrm ?
290 EFX_FILTER_MATCH_IFRM_UNKNOWN_UCAST_DST :
291 EFX_FILTER_MATCH_UNKNOWN_UCAST_DST;
293 efx_spec->efs_match_flags |= is_ifrm ?
294 EFX_FILTER_MATCH_IFRM_UNKNOWN_MCAST_DST :
295 EFX_FILTER_MATCH_UNKNOWN_MCAST_DST;
296 } else if (!is_zero_ether_addr(&mask->dst)) {
301 * ifrm_supp_mask ensures that the source address and
302 * ethertype masks are equal to zero in inner frame,
303 * so these fields are filled in only for the outer frame
305 if (is_same_ether_addr(&mask->src, &supp_mask.src)) {
306 efx_spec->efs_match_flags |= EFX_FILTER_MATCH_REM_MAC;
307 rte_memcpy(efx_spec->efs_rem_mac, spec->src.addr_bytes,
309 } else if (!is_zero_ether_addr(&mask->src)) {
314 * Ether type is in big-endian byte order in item and
315 * in little-endian in efx_spec, so byte swap is used
317 if (mask->type == supp_mask.type) {
318 efx_spec->efs_match_flags |= EFX_FILTER_MATCH_ETHER_TYPE;
319 efx_spec->efs_ether_type = rte_bswap16(spec->type);
320 } else if (mask->type != 0) {
327 rte_flow_error_set(error, EINVAL,
328 RTE_FLOW_ERROR_TYPE_ITEM, item,
329 "Bad mask in the ETH pattern item");
334 * Convert VLAN item to EFX filter specification.
337 * Item specification. Only VID field is supported.
338 * The mask can not be NULL. Ranging is not supported.
339 * @param efx_spec[in, out]
340 * EFX filter specification to update.
342 * Perform verbose error reporting if not NULL.
345 sfc_flow_parse_vlan(const struct rte_flow_item *item,
346 efx_filter_spec_t *efx_spec,
347 struct rte_flow_error *error)
351 const struct rte_flow_item_vlan *spec = NULL;
352 const struct rte_flow_item_vlan *mask = NULL;
353 const struct rte_flow_item_vlan supp_mask = {
354 .tci = rte_cpu_to_be_16(ETH_VLAN_ID_MAX),
355 .inner_type = RTE_BE16(0xffff),
358 rc = sfc_flow_parse_init(item,
359 (const void **)&spec,
360 (const void **)&mask,
363 sizeof(struct rte_flow_item_vlan),
369 * VID is in big-endian byte order in item and
370 * in little-endian in efx_spec, so byte swap is used.
371 * If two VLAN items are included, the first matches
372 * the outer tag and the next matches the inner tag.
374 if (mask->tci == supp_mask.tci) {
375 vid = rte_bswap16(spec->tci);
377 if (!(efx_spec->efs_match_flags &
378 EFX_FILTER_MATCH_OUTER_VID)) {
379 efx_spec->efs_match_flags |= EFX_FILTER_MATCH_OUTER_VID;
380 efx_spec->efs_outer_vid = vid;
381 } else if (!(efx_spec->efs_match_flags &
382 EFX_FILTER_MATCH_INNER_VID)) {
383 efx_spec->efs_match_flags |= EFX_FILTER_MATCH_INNER_VID;
384 efx_spec->efs_inner_vid = vid;
386 rte_flow_error_set(error, EINVAL,
387 RTE_FLOW_ERROR_TYPE_ITEM, item,
388 "More than two VLAN items");
392 rte_flow_error_set(error, EINVAL,
393 RTE_FLOW_ERROR_TYPE_ITEM, item,
394 "VLAN ID in TCI match is required");
398 if (efx_spec->efs_match_flags & EFX_FILTER_MATCH_ETHER_TYPE) {
399 rte_flow_error_set(error, EINVAL,
400 RTE_FLOW_ERROR_TYPE_ITEM, item,
401 "VLAN TPID matching is not supported");
404 if (mask->inner_type == supp_mask.inner_type) {
405 efx_spec->efs_match_flags |= EFX_FILTER_MATCH_ETHER_TYPE;
406 efx_spec->efs_ether_type = rte_bswap16(spec->inner_type);
407 } else if (mask->inner_type) {
408 rte_flow_error_set(error, EINVAL,
409 RTE_FLOW_ERROR_TYPE_ITEM, item,
410 "Bad mask for VLAN inner_type");
418 * Convert IPv4 item to EFX filter specification.
421 * Item specification. Only source and destination addresses and
422 * protocol fields are supported. If the mask is NULL, default
423 * mask will be used. Ranging is not supported.
424 * @param efx_spec[in, out]
425 * EFX filter specification to update.
427 * Perform verbose error reporting if not NULL.
430 sfc_flow_parse_ipv4(const struct rte_flow_item *item,
431 efx_filter_spec_t *efx_spec,
432 struct rte_flow_error *error)
435 const struct rte_flow_item_ipv4 *spec = NULL;
436 const struct rte_flow_item_ipv4 *mask = NULL;
437 const uint16_t ether_type_ipv4 = rte_cpu_to_le_16(EFX_ETHER_TYPE_IPV4);
438 const struct rte_flow_item_ipv4 supp_mask = {
440 .src_addr = 0xffffffff,
441 .dst_addr = 0xffffffff,
442 .next_proto_id = 0xff,
446 rc = sfc_flow_parse_init(item,
447 (const void **)&spec,
448 (const void **)&mask,
450 &rte_flow_item_ipv4_mask,
451 sizeof(struct rte_flow_item_ipv4),
457 * Filtering by IPv4 source and destination addresses requires
458 * the appropriate ETHER_TYPE in hardware filters
460 if (!(efx_spec->efs_match_flags & EFX_FILTER_MATCH_ETHER_TYPE)) {
461 efx_spec->efs_match_flags |= EFX_FILTER_MATCH_ETHER_TYPE;
462 efx_spec->efs_ether_type = ether_type_ipv4;
463 } else if (efx_spec->efs_ether_type != ether_type_ipv4) {
464 rte_flow_error_set(error, EINVAL,
465 RTE_FLOW_ERROR_TYPE_ITEM, item,
466 "Ethertype in pattern with IPV4 item should be appropriate");
474 * IPv4 addresses are in big-endian byte order in item and in
477 if (mask->hdr.src_addr == supp_mask.hdr.src_addr) {
478 efx_spec->efs_match_flags |= EFX_FILTER_MATCH_REM_HOST;
479 efx_spec->efs_rem_host.eo_u32[0] = spec->hdr.src_addr;
480 } else if (mask->hdr.src_addr != 0) {
484 if (mask->hdr.dst_addr == supp_mask.hdr.dst_addr) {
485 efx_spec->efs_match_flags |= EFX_FILTER_MATCH_LOC_HOST;
486 efx_spec->efs_loc_host.eo_u32[0] = spec->hdr.dst_addr;
487 } else if (mask->hdr.dst_addr != 0) {
491 if (mask->hdr.next_proto_id == supp_mask.hdr.next_proto_id) {
492 efx_spec->efs_match_flags |= EFX_FILTER_MATCH_IP_PROTO;
493 efx_spec->efs_ip_proto = spec->hdr.next_proto_id;
494 } else if (mask->hdr.next_proto_id != 0) {
501 rte_flow_error_set(error, EINVAL,
502 RTE_FLOW_ERROR_TYPE_ITEM, item,
503 "Bad mask in the IPV4 pattern item");
508 * Convert IPv6 item to EFX filter specification.
511 * Item specification. Only source and destination addresses and
512 * next header fields are supported. If the mask is NULL, default
513 * mask will be used. Ranging is not supported.
514 * @param efx_spec[in, out]
515 * EFX filter specification to update.
517 * Perform verbose error reporting if not NULL.
520 sfc_flow_parse_ipv6(const struct rte_flow_item *item,
521 efx_filter_spec_t *efx_spec,
522 struct rte_flow_error *error)
525 const struct rte_flow_item_ipv6 *spec = NULL;
526 const struct rte_flow_item_ipv6 *mask = NULL;
527 const uint16_t ether_type_ipv6 = rte_cpu_to_le_16(EFX_ETHER_TYPE_IPV6);
528 const struct rte_flow_item_ipv6 supp_mask = {
530 .src_addr = { 0xff, 0xff, 0xff, 0xff,
531 0xff, 0xff, 0xff, 0xff,
532 0xff, 0xff, 0xff, 0xff,
533 0xff, 0xff, 0xff, 0xff },
534 .dst_addr = { 0xff, 0xff, 0xff, 0xff,
535 0xff, 0xff, 0xff, 0xff,
536 0xff, 0xff, 0xff, 0xff,
537 0xff, 0xff, 0xff, 0xff },
542 rc = sfc_flow_parse_init(item,
543 (const void **)&spec,
544 (const void **)&mask,
546 &rte_flow_item_ipv6_mask,
547 sizeof(struct rte_flow_item_ipv6),
553 * Filtering by IPv6 source and destination addresses requires
554 * the appropriate ETHER_TYPE in hardware filters
556 if (!(efx_spec->efs_match_flags & EFX_FILTER_MATCH_ETHER_TYPE)) {
557 efx_spec->efs_match_flags |= EFX_FILTER_MATCH_ETHER_TYPE;
558 efx_spec->efs_ether_type = ether_type_ipv6;
559 } else if (efx_spec->efs_ether_type != ether_type_ipv6) {
560 rte_flow_error_set(error, EINVAL,
561 RTE_FLOW_ERROR_TYPE_ITEM, item,
562 "Ethertype in pattern with IPV6 item should be appropriate");
570 * IPv6 addresses are in big-endian byte order in item and in
573 if (memcmp(mask->hdr.src_addr, supp_mask.hdr.src_addr,
574 sizeof(mask->hdr.src_addr)) == 0) {
575 efx_spec->efs_match_flags |= EFX_FILTER_MATCH_REM_HOST;
577 RTE_BUILD_BUG_ON(sizeof(efx_spec->efs_rem_host) !=
578 sizeof(spec->hdr.src_addr));
579 rte_memcpy(&efx_spec->efs_rem_host, spec->hdr.src_addr,
580 sizeof(efx_spec->efs_rem_host));
581 } else if (!sfc_flow_is_zero(mask->hdr.src_addr,
582 sizeof(mask->hdr.src_addr))) {
586 if (memcmp(mask->hdr.dst_addr, supp_mask.hdr.dst_addr,
587 sizeof(mask->hdr.dst_addr)) == 0) {
588 efx_spec->efs_match_flags |= EFX_FILTER_MATCH_LOC_HOST;
590 RTE_BUILD_BUG_ON(sizeof(efx_spec->efs_loc_host) !=
591 sizeof(spec->hdr.dst_addr));
592 rte_memcpy(&efx_spec->efs_loc_host, spec->hdr.dst_addr,
593 sizeof(efx_spec->efs_loc_host));
594 } else if (!sfc_flow_is_zero(mask->hdr.dst_addr,
595 sizeof(mask->hdr.dst_addr))) {
599 if (mask->hdr.proto == supp_mask.hdr.proto) {
600 efx_spec->efs_match_flags |= EFX_FILTER_MATCH_IP_PROTO;
601 efx_spec->efs_ip_proto = spec->hdr.proto;
602 } else if (mask->hdr.proto != 0) {
609 rte_flow_error_set(error, EINVAL,
610 RTE_FLOW_ERROR_TYPE_ITEM, item,
611 "Bad mask in the IPV6 pattern item");
616 * Convert TCP item to EFX filter specification.
619 * Item specification. Only source and destination ports fields
620 * are supported. If the mask is NULL, default mask will be used.
621 * Ranging is not supported.
622 * @param efx_spec[in, out]
623 * EFX filter specification to update.
625 * Perform verbose error reporting if not NULL.
628 sfc_flow_parse_tcp(const struct rte_flow_item *item,
629 efx_filter_spec_t *efx_spec,
630 struct rte_flow_error *error)
633 const struct rte_flow_item_tcp *spec = NULL;
634 const struct rte_flow_item_tcp *mask = NULL;
635 const struct rte_flow_item_tcp supp_mask = {
642 rc = sfc_flow_parse_init(item,
643 (const void **)&spec,
644 (const void **)&mask,
646 &rte_flow_item_tcp_mask,
647 sizeof(struct rte_flow_item_tcp),
653 * Filtering by TCP source and destination ports requires
654 * the appropriate IP_PROTO in hardware filters
656 if (!(efx_spec->efs_match_flags & EFX_FILTER_MATCH_IP_PROTO)) {
657 efx_spec->efs_match_flags |= EFX_FILTER_MATCH_IP_PROTO;
658 efx_spec->efs_ip_proto = EFX_IPPROTO_TCP;
659 } else if (efx_spec->efs_ip_proto != EFX_IPPROTO_TCP) {
660 rte_flow_error_set(error, EINVAL,
661 RTE_FLOW_ERROR_TYPE_ITEM, item,
662 "IP proto in pattern with TCP item should be appropriate");
670 * Source and destination ports are in big-endian byte order in item and
671 * in little-endian in efx_spec, so byte swap is used
673 if (mask->hdr.src_port == supp_mask.hdr.src_port) {
674 efx_spec->efs_match_flags |= EFX_FILTER_MATCH_REM_PORT;
675 efx_spec->efs_rem_port = rte_bswap16(spec->hdr.src_port);
676 } else if (mask->hdr.src_port != 0) {
680 if (mask->hdr.dst_port == supp_mask.hdr.dst_port) {
681 efx_spec->efs_match_flags |= EFX_FILTER_MATCH_LOC_PORT;
682 efx_spec->efs_loc_port = rte_bswap16(spec->hdr.dst_port);
683 } else if (mask->hdr.dst_port != 0) {
690 rte_flow_error_set(error, EINVAL,
691 RTE_FLOW_ERROR_TYPE_ITEM, item,
692 "Bad mask in the TCP pattern item");
697 * Convert UDP item to EFX filter specification.
700 * Item specification. Only source and destination ports fields
701 * are supported. If the mask is NULL, default mask will be used.
702 * Ranging is not supported.
703 * @param efx_spec[in, out]
704 * EFX filter specification to update.
706 * Perform verbose error reporting if not NULL.
709 sfc_flow_parse_udp(const struct rte_flow_item *item,
710 efx_filter_spec_t *efx_spec,
711 struct rte_flow_error *error)
714 const struct rte_flow_item_udp *spec = NULL;
715 const struct rte_flow_item_udp *mask = NULL;
716 const struct rte_flow_item_udp supp_mask = {
723 rc = sfc_flow_parse_init(item,
724 (const void **)&spec,
725 (const void **)&mask,
727 &rte_flow_item_udp_mask,
728 sizeof(struct rte_flow_item_udp),
734 * Filtering by UDP source and destination ports requires
735 * the appropriate IP_PROTO in hardware filters
737 if (!(efx_spec->efs_match_flags & EFX_FILTER_MATCH_IP_PROTO)) {
738 efx_spec->efs_match_flags |= EFX_FILTER_MATCH_IP_PROTO;
739 efx_spec->efs_ip_proto = EFX_IPPROTO_UDP;
740 } else if (efx_spec->efs_ip_proto != EFX_IPPROTO_UDP) {
741 rte_flow_error_set(error, EINVAL,
742 RTE_FLOW_ERROR_TYPE_ITEM, item,
743 "IP proto in pattern with UDP item should be appropriate");
751 * Source and destination ports are in big-endian byte order in item and
752 * in little-endian in efx_spec, so byte swap is used
754 if (mask->hdr.src_port == supp_mask.hdr.src_port) {
755 efx_spec->efs_match_flags |= EFX_FILTER_MATCH_REM_PORT;
756 efx_spec->efs_rem_port = rte_bswap16(spec->hdr.src_port);
757 } else if (mask->hdr.src_port != 0) {
761 if (mask->hdr.dst_port == supp_mask.hdr.dst_port) {
762 efx_spec->efs_match_flags |= EFX_FILTER_MATCH_LOC_PORT;
763 efx_spec->efs_loc_port = rte_bswap16(spec->hdr.dst_port);
764 } else if (mask->hdr.dst_port != 0) {
771 rte_flow_error_set(error, EINVAL,
772 RTE_FLOW_ERROR_TYPE_ITEM, item,
773 "Bad mask in the UDP pattern item");
778 * Filters for encapsulated packets match based on the EtherType and IP
779 * protocol in the outer frame.
782 sfc_flow_set_match_flags_for_encap_pkts(const struct rte_flow_item *item,
783 efx_filter_spec_t *efx_spec,
785 struct rte_flow_error *error)
787 if (!(efx_spec->efs_match_flags & EFX_FILTER_MATCH_IP_PROTO)) {
788 efx_spec->efs_match_flags |= EFX_FILTER_MATCH_IP_PROTO;
789 efx_spec->efs_ip_proto = ip_proto;
790 } else if (efx_spec->efs_ip_proto != ip_proto) {
792 case EFX_IPPROTO_UDP:
793 rte_flow_error_set(error, EINVAL,
794 RTE_FLOW_ERROR_TYPE_ITEM, item,
795 "Outer IP header protocol must be UDP "
796 "in VxLAN/GENEVE pattern");
799 case EFX_IPPROTO_GRE:
800 rte_flow_error_set(error, EINVAL,
801 RTE_FLOW_ERROR_TYPE_ITEM, item,
802 "Outer IP header protocol must be GRE "
807 rte_flow_error_set(error, EINVAL,
808 RTE_FLOW_ERROR_TYPE_ITEM, item,
809 "Only VxLAN/GENEVE/NVGRE tunneling patterns "
815 if (efx_spec->efs_match_flags & EFX_FILTER_MATCH_ETHER_TYPE &&
816 efx_spec->efs_ether_type != EFX_ETHER_TYPE_IPV4 &&
817 efx_spec->efs_ether_type != EFX_ETHER_TYPE_IPV6) {
818 rte_flow_error_set(error, EINVAL,
819 RTE_FLOW_ERROR_TYPE_ITEM, item,
820 "Outer frame EtherType in pattern with tunneling "
821 "must be IPv4 or IPv6");
829 sfc_flow_set_efx_spec_vni_or_vsid(efx_filter_spec_t *efx_spec,
830 const uint8_t *vni_or_vsid_val,
831 const uint8_t *vni_or_vsid_mask,
832 const struct rte_flow_item *item,
833 struct rte_flow_error *error)
835 const uint8_t vni_or_vsid_full_mask[EFX_VNI_OR_VSID_LEN] = {
839 if (memcmp(vni_or_vsid_mask, vni_or_vsid_full_mask,
840 EFX_VNI_OR_VSID_LEN) == 0) {
841 efx_spec->efs_match_flags |= EFX_FILTER_MATCH_VNI_OR_VSID;
842 rte_memcpy(efx_spec->efs_vni_or_vsid, vni_or_vsid_val,
843 EFX_VNI_OR_VSID_LEN);
844 } else if (!sfc_flow_is_zero(vni_or_vsid_mask, EFX_VNI_OR_VSID_LEN)) {
845 rte_flow_error_set(error, EINVAL,
846 RTE_FLOW_ERROR_TYPE_ITEM, item,
847 "Unsupported VNI/VSID mask");
855 * Convert VXLAN item to EFX filter specification.
858 * Item specification. Only VXLAN network identifier field is supported.
859 * If the mask is NULL, default mask will be used.
860 * Ranging is not supported.
861 * @param efx_spec[in, out]
862 * EFX filter specification to update.
864 * Perform verbose error reporting if not NULL.
867 sfc_flow_parse_vxlan(const struct rte_flow_item *item,
868 efx_filter_spec_t *efx_spec,
869 struct rte_flow_error *error)
872 const struct rte_flow_item_vxlan *spec = NULL;
873 const struct rte_flow_item_vxlan *mask = NULL;
874 const struct rte_flow_item_vxlan supp_mask = {
875 .vni = { 0xff, 0xff, 0xff }
878 rc = sfc_flow_parse_init(item,
879 (const void **)&spec,
880 (const void **)&mask,
882 &rte_flow_item_vxlan_mask,
883 sizeof(struct rte_flow_item_vxlan),
888 rc = sfc_flow_set_match_flags_for_encap_pkts(item, efx_spec,
889 EFX_IPPROTO_UDP, error);
893 efx_spec->efs_encap_type = EFX_TUNNEL_PROTOCOL_VXLAN;
894 efx_spec->efs_match_flags |= EFX_FILTER_MATCH_ENCAP_TYPE;
899 rc = sfc_flow_set_efx_spec_vni_or_vsid(efx_spec, spec->vni,
900 mask->vni, item, error);
906 * Convert GENEVE item to EFX filter specification.
909 * Item specification. Only Virtual Network Identifier and protocol type
910 * fields are supported. But protocol type can be only Ethernet (0x6558).
911 * If the mask is NULL, default mask will be used.
912 * Ranging is not supported.
913 * @param efx_spec[in, out]
914 * EFX filter specification to update.
916 * Perform verbose error reporting if not NULL.
919 sfc_flow_parse_geneve(const struct rte_flow_item *item,
920 efx_filter_spec_t *efx_spec,
921 struct rte_flow_error *error)
924 const struct rte_flow_item_geneve *spec = NULL;
925 const struct rte_flow_item_geneve *mask = NULL;
926 const struct rte_flow_item_geneve supp_mask = {
927 .protocol = RTE_BE16(0xffff),
928 .vni = { 0xff, 0xff, 0xff }
931 rc = sfc_flow_parse_init(item,
932 (const void **)&spec,
933 (const void **)&mask,
935 &rte_flow_item_geneve_mask,
936 sizeof(struct rte_flow_item_geneve),
941 rc = sfc_flow_set_match_flags_for_encap_pkts(item, efx_spec,
942 EFX_IPPROTO_UDP, error);
946 efx_spec->efs_encap_type = EFX_TUNNEL_PROTOCOL_GENEVE;
947 efx_spec->efs_match_flags |= EFX_FILTER_MATCH_ENCAP_TYPE;
952 if (mask->protocol == supp_mask.protocol) {
953 if (spec->protocol != rte_cpu_to_be_16(ETHER_TYPE_TEB)) {
954 rte_flow_error_set(error, EINVAL,
955 RTE_FLOW_ERROR_TYPE_ITEM, item,
956 "GENEVE encap. protocol must be Ethernet "
957 "(0x6558) in the GENEVE pattern item");
960 } else if (mask->protocol != 0) {
961 rte_flow_error_set(error, EINVAL,
962 RTE_FLOW_ERROR_TYPE_ITEM, item,
963 "Unsupported mask for GENEVE encap. protocol");
967 rc = sfc_flow_set_efx_spec_vni_or_vsid(efx_spec, spec->vni,
968 mask->vni, item, error);
974 * Convert NVGRE item to EFX filter specification.
977 * Item specification. Only virtual subnet ID field is supported.
978 * If the mask is NULL, default mask will be used.
979 * Ranging is not supported.
980 * @param efx_spec[in, out]
981 * EFX filter specification to update.
983 * Perform verbose error reporting if not NULL.
986 sfc_flow_parse_nvgre(const struct rte_flow_item *item,
987 efx_filter_spec_t *efx_spec,
988 struct rte_flow_error *error)
991 const struct rte_flow_item_nvgre *spec = NULL;
992 const struct rte_flow_item_nvgre *mask = NULL;
993 const struct rte_flow_item_nvgre supp_mask = {
994 .tni = { 0xff, 0xff, 0xff }
997 rc = sfc_flow_parse_init(item,
998 (const void **)&spec,
999 (const void **)&mask,
1001 &rte_flow_item_nvgre_mask,
1002 sizeof(struct rte_flow_item_nvgre),
1007 rc = sfc_flow_set_match_flags_for_encap_pkts(item, efx_spec,
1008 EFX_IPPROTO_GRE, error);
1012 efx_spec->efs_encap_type = EFX_TUNNEL_PROTOCOL_NVGRE;
1013 efx_spec->efs_match_flags |= EFX_FILTER_MATCH_ENCAP_TYPE;
1018 rc = sfc_flow_set_efx_spec_vni_or_vsid(efx_spec, spec->tni,
1019 mask->tni, item, error);
1024 static const struct sfc_flow_item sfc_flow_items[] = {
1026 .type = RTE_FLOW_ITEM_TYPE_VOID,
1027 .prev_layer = SFC_FLOW_ITEM_ANY_LAYER,
1028 .layer = SFC_FLOW_ITEM_ANY_LAYER,
1029 .parse = sfc_flow_parse_void,
1032 .type = RTE_FLOW_ITEM_TYPE_ETH,
1033 .prev_layer = SFC_FLOW_ITEM_START_LAYER,
1034 .layer = SFC_FLOW_ITEM_L2,
1035 .parse = sfc_flow_parse_eth,
1038 .type = RTE_FLOW_ITEM_TYPE_VLAN,
1039 .prev_layer = SFC_FLOW_ITEM_L2,
1040 .layer = SFC_FLOW_ITEM_L2,
1041 .parse = sfc_flow_parse_vlan,
1044 .type = RTE_FLOW_ITEM_TYPE_IPV4,
1045 .prev_layer = SFC_FLOW_ITEM_L2,
1046 .layer = SFC_FLOW_ITEM_L3,
1047 .parse = sfc_flow_parse_ipv4,
1050 .type = RTE_FLOW_ITEM_TYPE_IPV6,
1051 .prev_layer = SFC_FLOW_ITEM_L2,
1052 .layer = SFC_FLOW_ITEM_L3,
1053 .parse = sfc_flow_parse_ipv6,
1056 .type = RTE_FLOW_ITEM_TYPE_TCP,
1057 .prev_layer = SFC_FLOW_ITEM_L3,
1058 .layer = SFC_FLOW_ITEM_L4,
1059 .parse = sfc_flow_parse_tcp,
1062 .type = RTE_FLOW_ITEM_TYPE_UDP,
1063 .prev_layer = SFC_FLOW_ITEM_L3,
1064 .layer = SFC_FLOW_ITEM_L4,
1065 .parse = sfc_flow_parse_udp,
1068 .type = RTE_FLOW_ITEM_TYPE_VXLAN,
1069 .prev_layer = SFC_FLOW_ITEM_L4,
1070 .layer = SFC_FLOW_ITEM_START_LAYER,
1071 .parse = sfc_flow_parse_vxlan,
1074 .type = RTE_FLOW_ITEM_TYPE_GENEVE,
1075 .prev_layer = SFC_FLOW_ITEM_L4,
1076 .layer = SFC_FLOW_ITEM_START_LAYER,
1077 .parse = sfc_flow_parse_geneve,
1080 .type = RTE_FLOW_ITEM_TYPE_NVGRE,
1081 .prev_layer = SFC_FLOW_ITEM_L3,
1082 .layer = SFC_FLOW_ITEM_START_LAYER,
1083 .parse = sfc_flow_parse_nvgre,
1088 * Protocol-independent flow API support
1091 sfc_flow_parse_attr(const struct rte_flow_attr *attr,
1092 struct rte_flow *flow,
1093 struct rte_flow_error *error)
1096 rte_flow_error_set(error, EINVAL,
1097 RTE_FLOW_ERROR_TYPE_ATTR, NULL,
1101 if (attr->group != 0) {
1102 rte_flow_error_set(error, ENOTSUP,
1103 RTE_FLOW_ERROR_TYPE_ATTR_GROUP, attr,
1104 "Groups are not supported");
1107 if (attr->priority != 0) {
1108 rte_flow_error_set(error, ENOTSUP,
1109 RTE_FLOW_ERROR_TYPE_ATTR_PRIORITY, attr,
1110 "Priorities are not supported");
1113 if (attr->egress != 0) {
1114 rte_flow_error_set(error, ENOTSUP,
1115 RTE_FLOW_ERROR_TYPE_ATTR_EGRESS, attr,
1116 "Egress is not supported");
1119 if (attr->transfer != 0) {
1120 rte_flow_error_set(error, ENOTSUP,
1121 RTE_FLOW_ERROR_TYPE_ATTR_TRANSFER, attr,
1122 "Transfer is not supported");
1125 if (attr->ingress == 0) {
1126 rte_flow_error_set(error, ENOTSUP,
1127 RTE_FLOW_ERROR_TYPE_ATTR_INGRESS, attr,
1128 "Only ingress is supported");
1132 flow->spec.template.efs_flags |= EFX_FILTER_FLAG_RX;
1133 flow->spec.template.efs_rss_context = EFX_RSS_CONTEXT_DEFAULT;
1138 /* Get item from array sfc_flow_items */
1139 static const struct sfc_flow_item *
1140 sfc_flow_get_item(enum rte_flow_item_type type)
1144 for (i = 0; i < RTE_DIM(sfc_flow_items); i++)
1145 if (sfc_flow_items[i].type == type)
1146 return &sfc_flow_items[i];
1152 sfc_flow_parse_pattern(const struct rte_flow_item pattern[],
1153 struct rte_flow *flow,
1154 struct rte_flow_error *error)
1157 unsigned int prev_layer = SFC_FLOW_ITEM_ANY_LAYER;
1158 boolean_t is_ifrm = B_FALSE;
1159 const struct sfc_flow_item *item;
1161 if (pattern == NULL) {
1162 rte_flow_error_set(error, EINVAL,
1163 RTE_FLOW_ERROR_TYPE_ITEM_NUM, NULL,
1168 for (; pattern->type != RTE_FLOW_ITEM_TYPE_END; pattern++) {
1169 item = sfc_flow_get_item(pattern->type);
1171 rte_flow_error_set(error, ENOTSUP,
1172 RTE_FLOW_ERROR_TYPE_ITEM, pattern,
1173 "Unsupported pattern item");
1178 * Omitting one or several protocol layers at the beginning
1179 * of pattern is supported
1181 if (item->prev_layer != SFC_FLOW_ITEM_ANY_LAYER &&
1182 prev_layer != SFC_FLOW_ITEM_ANY_LAYER &&
1183 item->prev_layer != prev_layer) {
1184 rte_flow_error_set(error, ENOTSUP,
1185 RTE_FLOW_ERROR_TYPE_ITEM, pattern,
1186 "Unexpected sequence of pattern items");
1191 * Allow only VOID and ETH pattern items in the inner frame.
1192 * Also check that there is only one tunneling protocol.
1194 switch (item->type) {
1195 case RTE_FLOW_ITEM_TYPE_VOID:
1196 case RTE_FLOW_ITEM_TYPE_ETH:
1199 case RTE_FLOW_ITEM_TYPE_VXLAN:
1200 case RTE_FLOW_ITEM_TYPE_GENEVE:
1201 case RTE_FLOW_ITEM_TYPE_NVGRE:
1203 rte_flow_error_set(error, EINVAL,
1204 RTE_FLOW_ERROR_TYPE_ITEM,
1206 "More than one tunneling protocol");
1214 rte_flow_error_set(error, EINVAL,
1215 RTE_FLOW_ERROR_TYPE_ITEM,
1217 "There is an unsupported pattern item "
1218 "in the inner frame");
1224 rc = item->parse(pattern, &flow->spec.template, error);
1228 if (item->layer != SFC_FLOW_ITEM_ANY_LAYER)
1229 prev_layer = item->layer;
1236 sfc_flow_parse_queue(struct sfc_adapter *sa,
1237 const struct rte_flow_action_queue *queue,
1238 struct rte_flow *flow)
1240 struct sfc_rxq *rxq;
1242 if (queue->index >= sa->rxq_count)
1245 rxq = sa->rxq_info[queue->index].rxq;
1246 flow->spec.template.efs_dmaq_id = (uint16_t)rxq->hw_index;
1252 sfc_flow_parse_rss(struct sfc_adapter *sa,
1253 const struct rte_flow_action_rss *rss,
1254 struct rte_flow *flow)
1256 unsigned int rxq_sw_index;
1257 struct sfc_rxq *rxq;
1258 unsigned int rxq_hw_index_min;
1259 unsigned int rxq_hw_index_max;
1260 const uint8_t *rss_key;
1261 struct sfc_flow_rss *sfc_rss_conf = &flow->rss_conf;
1264 if (rss->queue_num == 0)
1267 rxq_sw_index = sa->rxq_count - 1;
1268 rxq = sa->rxq_info[rxq_sw_index].rxq;
1269 rxq_hw_index_min = rxq->hw_index;
1270 rxq_hw_index_max = 0;
1272 for (i = 0; i < rss->queue_num; ++i) {
1273 rxq_sw_index = rss->queue[i];
1275 if (rxq_sw_index >= sa->rxq_count)
1278 rxq = sa->rxq_info[rxq_sw_index].rxq;
1280 if (rxq->hw_index < rxq_hw_index_min)
1281 rxq_hw_index_min = rxq->hw_index;
1283 if (rxq->hw_index > rxq_hw_index_max)
1284 rxq_hw_index_max = rxq->hw_index;
1287 switch (rss->func) {
1288 case RTE_ETH_HASH_FUNCTION_DEFAULT:
1289 case RTE_ETH_HASH_FUNCTION_TOEPLITZ:
1298 if ((rss->types & ~SFC_RSS_OFFLOADS) != 0)
1302 if (rss->key_len != sizeof(sa->rss_key))
1307 rss_key = sa->rss_key;
1312 sfc_rss_conf->rxq_hw_index_min = rxq_hw_index_min;
1313 sfc_rss_conf->rxq_hw_index_max = rxq_hw_index_max;
1314 sfc_rss_conf->rss_hash_types = sfc_rte_to_efx_hash_type(rss->types);
1315 rte_memcpy(sfc_rss_conf->rss_key, rss_key, sizeof(sa->rss_key));
1317 for (i = 0; i < RTE_DIM(sfc_rss_conf->rss_tbl); ++i) {
1318 unsigned int rxq_sw_index = rss->queue[i % rss->queue_num];
1319 struct sfc_rxq *rxq = sa->rxq_info[rxq_sw_index].rxq;
1321 sfc_rss_conf->rss_tbl[i] = rxq->hw_index - rxq_hw_index_min;
1328 sfc_flow_spec_flush(struct sfc_adapter *sa, struct sfc_flow_spec *spec,
1329 unsigned int filters_count)
1334 for (i = 0; i < filters_count; i++) {
1337 rc = efx_filter_remove(sa->nic, &spec->filters[i]);
1338 if (ret == 0 && rc != 0) {
1339 sfc_err(sa, "failed to remove filter specification "
1349 sfc_flow_spec_insert(struct sfc_adapter *sa, struct sfc_flow_spec *spec)
1354 for (i = 0; i < spec->count; i++) {
1355 rc = efx_filter_insert(sa->nic, &spec->filters[i]);
1357 sfc_flow_spec_flush(sa, spec, i);
1366 sfc_flow_spec_remove(struct sfc_adapter *sa, struct sfc_flow_spec *spec)
1368 return sfc_flow_spec_flush(sa, spec, spec->count);
1372 sfc_flow_filter_insert(struct sfc_adapter *sa,
1373 struct rte_flow *flow)
1375 struct sfc_flow_rss *rss = &flow->rss_conf;
1376 uint32_t efs_rss_context = EFX_RSS_CONTEXT_DEFAULT;
1381 unsigned int rss_spread = MIN(rss->rxq_hw_index_max -
1382 rss->rxq_hw_index_min + 1,
1385 rc = efx_rx_scale_context_alloc(sa->nic,
1386 EFX_RX_SCALE_EXCLUSIVE,
1390 goto fail_scale_context_alloc;
1392 rc = efx_rx_scale_mode_set(sa->nic, efs_rss_context,
1393 EFX_RX_HASHALG_TOEPLITZ,
1394 rss->rss_hash_types, B_TRUE);
1396 goto fail_scale_mode_set;
1398 rc = efx_rx_scale_key_set(sa->nic, efs_rss_context,
1400 sizeof(sa->rss_key));
1402 goto fail_scale_key_set;
1405 * At this point, fully elaborated filter specifications
1406 * have been produced from the template. To make sure that
1407 * RSS behaviour is consistent between them, set the same
1408 * RSS context value everywhere.
1410 for (i = 0; i < flow->spec.count; i++) {
1411 efx_filter_spec_t *spec = &flow->spec.filters[i];
1413 spec->efs_rss_context = efs_rss_context;
1414 spec->efs_dmaq_id = rss->rxq_hw_index_min;
1415 spec->efs_flags |= EFX_FILTER_FLAG_RX_RSS;
1419 rc = sfc_flow_spec_insert(sa, &flow->spec);
1421 goto fail_filter_insert;
1425 * Scale table is set after filter insertion because
1426 * the table entries are relative to the base RxQ ID
1427 * and the latter is submitted to the HW by means of
1428 * inserting a filter, so by the time of the request
1429 * the HW knows all the information needed to verify
1430 * the table entries, and the operation will succeed
1432 rc = efx_rx_scale_tbl_set(sa->nic, efs_rss_context,
1433 rss->rss_tbl, RTE_DIM(rss->rss_tbl));
1435 goto fail_scale_tbl_set;
1441 sfc_flow_spec_remove(sa, &flow->spec);
1445 fail_scale_mode_set:
1446 if (efs_rss_context != EFX_RSS_CONTEXT_DEFAULT)
1447 efx_rx_scale_context_free(sa->nic, efs_rss_context);
1449 fail_scale_context_alloc:
1454 sfc_flow_filter_remove(struct sfc_adapter *sa,
1455 struct rte_flow *flow)
1459 rc = sfc_flow_spec_remove(sa, &flow->spec);
1465 * All specifications for a given flow rule have the same RSS
1466 * context, so that RSS context value is taken from the first
1467 * filter specification
1469 efx_filter_spec_t *spec = &flow->spec.filters[0];
1471 rc = efx_rx_scale_context_free(sa->nic, spec->efs_rss_context);
1478 sfc_flow_parse_actions(struct sfc_adapter *sa,
1479 const struct rte_flow_action actions[],
1480 struct rte_flow *flow,
1481 struct rte_flow_error *error)
1484 boolean_t is_specified = B_FALSE;
1486 if (actions == NULL) {
1487 rte_flow_error_set(error, EINVAL,
1488 RTE_FLOW_ERROR_TYPE_ACTION_NUM, NULL,
1493 for (; actions->type != RTE_FLOW_ACTION_TYPE_END; actions++) {
1494 /* This one may appear anywhere multiple times. */
1495 if (actions->type == RTE_FLOW_ACTION_TYPE_VOID)
1497 /* Fate-deciding actions may appear exactly once. */
1500 (error, ENOTSUP, RTE_FLOW_ERROR_TYPE_ACTION,
1502 "Cannot combine several fate-deciding actions,"
1503 "choose between QUEUE, RSS or DROP");
1506 switch (actions->type) {
1507 case RTE_FLOW_ACTION_TYPE_QUEUE:
1508 rc = sfc_flow_parse_queue(sa, actions->conf, flow);
1510 rte_flow_error_set(error, EINVAL,
1511 RTE_FLOW_ERROR_TYPE_ACTION, actions,
1512 "Bad QUEUE action");
1516 is_specified = B_TRUE;
1519 case RTE_FLOW_ACTION_TYPE_RSS:
1520 rc = sfc_flow_parse_rss(sa, actions->conf, flow);
1522 rte_flow_error_set(error, rc,
1523 RTE_FLOW_ERROR_TYPE_ACTION, actions,
1528 is_specified = B_TRUE;
1531 case RTE_FLOW_ACTION_TYPE_DROP:
1532 flow->spec.template.efs_dmaq_id =
1533 EFX_FILTER_SPEC_RX_DMAQ_ID_DROP;
1535 is_specified = B_TRUE;
1539 rte_flow_error_set(error, ENOTSUP,
1540 RTE_FLOW_ERROR_TYPE_ACTION, actions,
1541 "Action is not supported");
1546 /* When fate is unknown, drop traffic. */
1547 if (!is_specified) {
1548 flow->spec.template.efs_dmaq_id =
1549 EFX_FILTER_SPEC_RX_DMAQ_ID_DROP;
1556 * Set the EFX_FILTER_MATCH_UNKNOWN_UCAST_DST
1557 * and EFX_FILTER_MATCH_UNKNOWN_MCAST_DST match flags in the same
1558 * specifications after copying.
1560 * @param spec[in, out]
1561 * SFC flow specification to update.
1562 * @param filters_count_for_one_val[in]
1563 * How many specifications should have the same match flag, what is the
1564 * number of specifications before copying.
1566 * Perform verbose error reporting if not NULL.
1569 sfc_flow_set_unknown_dst_flags(struct sfc_flow_spec *spec,
1570 unsigned int filters_count_for_one_val,
1571 struct rte_flow_error *error)
1574 static const efx_filter_match_flags_t vals[] = {
1575 EFX_FILTER_MATCH_UNKNOWN_UCAST_DST,
1576 EFX_FILTER_MATCH_UNKNOWN_MCAST_DST
1579 if (filters_count_for_one_val * RTE_DIM(vals) != spec->count) {
1580 rte_flow_error_set(error, EINVAL,
1581 RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
1582 "Number of specifications is incorrect while copying "
1583 "by unknown destination flags");
1587 for (i = 0; i < spec->count; i++) {
1588 /* The check above ensures that divisor can't be zero here */
1589 spec->filters[i].efs_match_flags |=
1590 vals[i / filters_count_for_one_val];
1597 * Check that the following conditions are met:
1598 * - the list of supported filters has a filter
1599 * with EFX_FILTER_MATCH_UNKNOWN_MCAST_DST flag instead of
1600 * EFX_FILTER_MATCH_UNKNOWN_UCAST_DST, since this filter will also
1604 * The match flags of filter.
1606 * Specification to be supplemented.
1608 * SFC filter with list of supported filters.
1611 sfc_flow_check_unknown_dst_flags(efx_filter_match_flags_t match,
1612 __rte_unused efx_filter_spec_t *spec,
1613 struct sfc_filter *filter)
1616 efx_filter_match_flags_t match_mcast_dst;
1619 (match & ~EFX_FILTER_MATCH_UNKNOWN_UCAST_DST) |
1620 EFX_FILTER_MATCH_UNKNOWN_MCAST_DST;
1621 for (i = 0; i < filter->supported_match_num; i++) {
1622 if (match_mcast_dst == filter->supported_match[i])
1630 * Set the EFX_FILTER_MATCH_ETHER_TYPE match flag and EFX_ETHER_TYPE_IPV4 and
1631 * EFX_ETHER_TYPE_IPV6 values of the corresponding field in the same
1632 * specifications after copying.
1634 * @param spec[in, out]
1635 * SFC flow specification to update.
1636 * @param filters_count_for_one_val[in]
1637 * How many specifications should have the same EtherType value, what is the
1638 * number of specifications before copying.
1640 * Perform verbose error reporting if not NULL.
1643 sfc_flow_set_ethertypes(struct sfc_flow_spec *spec,
1644 unsigned int filters_count_for_one_val,
1645 struct rte_flow_error *error)
1648 static const uint16_t vals[] = {
1649 EFX_ETHER_TYPE_IPV4, EFX_ETHER_TYPE_IPV6
1652 if (filters_count_for_one_val * RTE_DIM(vals) != spec->count) {
1653 rte_flow_error_set(error, EINVAL,
1654 RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
1655 "Number of specifications is incorrect "
1656 "while copying by Ethertype");
1660 for (i = 0; i < spec->count; i++) {
1661 spec->filters[i].efs_match_flags |=
1662 EFX_FILTER_MATCH_ETHER_TYPE;
1665 * The check above ensures that
1666 * filters_count_for_one_val is not 0
1668 spec->filters[i].efs_ether_type =
1669 vals[i / filters_count_for_one_val];
1676 * Set the EFX_FILTER_MATCH_IFRM_UNKNOWN_UCAST_DST and
1677 * EFX_FILTER_MATCH_IFRM_UNKNOWN_MCAST_DST match flags in the same
1678 * specifications after copying.
1680 * @param spec[in, out]
1681 * SFC flow specification to update.
1682 * @param filters_count_for_one_val[in]
1683 * How many specifications should have the same match flag, what is the
1684 * number of specifications before copying.
1686 * Perform verbose error reporting if not NULL.
1689 sfc_flow_set_ifrm_unknown_dst_flags(struct sfc_flow_spec *spec,
1690 unsigned int filters_count_for_one_val,
1691 struct rte_flow_error *error)
1694 static const efx_filter_match_flags_t vals[] = {
1695 EFX_FILTER_MATCH_IFRM_UNKNOWN_UCAST_DST,
1696 EFX_FILTER_MATCH_IFRM_UNKNOWN_MCAST_DST
1699 if (filters_count_for_one_val * RTE_DIM(vals) != spec->count) {
1700 rte_flow_error_set(error, EINVAL,
1701 RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
1702 "Number of specifications is incorrect while copying "
1703 "by inner frame unknown destination flags");
1707 for (i = 0; i < spec->count; i++) {
1708 /* The check above ensures that divisor can't be zero here */
1709 spec->filters[i].efs_match_flags |=
1710 vals[i / filters_count_for_one_val];
1717 * Check that the following conditions are met:
1718 * - the specification corresponds to a filter for encapsulated traffic
1719 * - the list of supported filters has a filter
1720 * with EFX_FILTER_MATCH_IFRM_UNKNOWN_MCAST_DST flag instead of
1721 * EFX_FILTER_MATCH_IFRM_UNKNOWN_UCAST_DST, since this filter will also
1725 * The match flags of filter.
1727 * Specification to be supplemented.
1729 * SFC filter with list of supported filters.
1732 sfc_flow_check_ifrm_unknown_dst_flags(efx_filter_match_flags_t match,
1733 efx_filter_spec_t *spec,
1734 struct sfc_filter *filter)
1737 efx_tunnel_protocol_t encap_type = spec->efs_encap_type;
1738 efx_filter_match_flags_t match_mcast_dst;
1740 if (encap_type == EFX_TUNNEL_PROTOCOL_NONE)
1744 (match & ~EFX_FILTER_MATCH_IFRM_UNKNOWN_UCAST_DST) |
1745 EFX_FILTER_MATCH_IFRM_UNKNOWN_MCAST_DST;
1746 for (i = 0; i < filter->supported_match_num; i++) {
1747 if (match_mcast_dst == filter->supported_match[i])
1755 * Match flags that can be automatically added to filters.
1756 * Selecting the last minimum when searching for the copy flag ensures that the
1757 * EFX_FILTER_MATCH_UNKNOWN_UCAST_DST flag has a higher priority than
1758 * EFX_FILTER_MATCH_ETHER_TYPE. This is because the filter
1759 * EFX_FILTER_MATCH_UNKNOWN_UCAST_DST is at the end of the list of supported
1762 static const struct sfc_flow_copy_flag sfc_flow_copy_flags[] = {
1764 .flag = EFX_FILTER_MATCH_UNKNOWN_UCAST_DST,
1766 .set_vals = sfc_flow_set_unknown_dst_flags,
1767 .spec_check = sfc_flow_check_unknown_dst_flags,
1770 .flag = EFX_FILTER_MATCH_ETHER_TYPE,
1772 .set_vals = sfc_flow_set_ethertypes,
1776 .flag = EFX_FILTER_MATCH_IFRM_UNKNOWN_UCAST_DST,
1778 .set_vals = sfc_flow_set_ifrm_unknown_dst_flags,
1779 .spec_check = sfc_flow_check_ifrm_unknown_dst_flags,
1783 /* Get item from array sfc_flow_copy_flags */
1784 static const struct sfc_flow_copy_flag *
1785 sfc_flow_get_copy_flag(efx_filter_match_flags_t flag)
1789 for (i = 0; i < RTE_DIM(sfc_flow_copy_flags); i++) {
1790 if (sfc_flow_copy_flags[i].flag == flag)
1791 return &sfc_flow_copy_flags[i];
1798 * Make copies of the specifications, set match flag and values
1799 * of the field that corresponds to it.
1801 * @param spec[in, out]
1802 * SFC flow specification to update.
1804 * The match flag to add.
1806 * Perform verbose error reporting if not NULL.
1809 sfc_flow_spec_add_match_flag(struct sfc_flow_spec *spec,
1810 efx_filter_match_flags_t flag,
1811 struct rte_flow_error *error)
1814 unsigned int new_filters_count;
1815 unsigned int filters_count_for_one_val;
1816 const struct sfc_flow_copy_flag *copy_flag;
1819 copy_flag = sfc_flow_get_copy_flag(flag);
1820 if (copy_flag == NULL) {
1821 rte_flow_error_set(error, ENOTSUP,
1822 RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
1823 "Unsupported spec field for copying");
1827 new_filters_count = spec->count * copy_flag->vals_count;
1828 if (new_filters_count > SF_FLOW_SPEC_NB_FILTERS_MAX) {
1829 rte_flow_error_set(error, EINVAL,
1830 RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
1831 "Too much EFX specifications in the flow rule");
1835 /* Copy filters specifications */
1836 for (i = spec->count; i < new_filters_count; i++)
1837 spec->filters[i] = spec->filters[i - spec->count];
1839 filters_count_for_one_val = spec->count;
1840 spec->count = new_filters_count;
1842 rc = copy_flag->set_vals(spec, filters_count_for_one_val, error);
1850 * Check that the given set of match flags missing in the original filter spec
1851 * could be covered by adding spec copies which specify the corresponding
1852 * flags and packet field values to match.
1854 * @param miss_flags[in]
1855 * Flags that are missing until the supported filter.
1857 * Specification to be supplemented.
1862 * Number of specifications after copy or 0, if the flags can not be added.
1865 sfc_flow_check_missing_flags(efx_filter_match_flags_t miss_flags,
1866 efx_filter_spec_t *spec,
1867 struct sfc_filter *filter)
1870 efx_filter_match_flags_t copy_flags = 0;
1871 efx_filter_match_flags_t flag;
1872 efx_filter_match_flags_t match = spec->efs_match_flags | miss_flags;
1873 sfc_flow_spec_check *check;
1874 unsigned int multiplier = 1;
1876 for (i = 0; i < RTE_DIM(sfc_flow_copy_flags); i++) {
1877 flag = sfc_flow_copy_flags[i].flag;
1878 check = sfc_flow_copy_flags[i].spec_check;
1879 if ((flag & miss_flags) == flag) {
1880 if (check != NULL && (!check(match, spec, filter)))
1884 multiplier *= sfc_flow_copy_flags[i].vals_count;
1888 if (copy_flags == miss_flags)
1895 * Attempt to supplement the specification template to the minimally
1896 * supported set of match flags. To do this, it is necessary to copy
1897 * the specifications, filling them with the values of fields that
1898 * correspond to the missing flags.
1899 * The necessary and sufficient filter is built from the fewest number
1900 * of copies which could be made to cover the minimally required set
1905 * @param spec[in, out]
1906 * SFC flow specification to update.
1908 * Perform verbose error reporting if not NULL.
1911 sfc_flow_spec_filters_complete(struct sfc_adapter *sa,
1912 struct sfc_flow_spec *spec,
1913 struct rte_flow_error *error)
1915 struct sfc_filter *filter = &sa->filter;
1916 efx_filter_match_flags_t miss_flags;
1917 efx_filter_match_flags_t min_miss_flags = 0;
1918 efx_filter_match_flags_t match;
1919 unsigned int min_multiplier = UINT_MAX;
1920 unsigned int multiplier;
1924 match = spec->template.efs_match_flags;
1925 for (i = 0; i < filter->supported_match_num; i++) {
1926 if ((match & filter->supported_match[i]) == match) {
1927 miss_flags = filter->supported_match[i] & (~match);
1928 multiplier = sfc_flow_check_missing_flags(miss_flags,
1929 &spec->template, filter);
1930 if (multiplier > 0) {
1931 if (multiplier <= min_multiplier) {
1932 min_multiplier = multiplier;
1933 min_miss_flags = miss_flags;
1939 if (min_multiplier == UINT_MAX) {
1940 rte_flow_error_set(error, ENOTSUP,
1941 RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
1942 "Flow rule pattern is not supported");
1946 for (i = 0; i < RTE_DIM(sfc_flow_copy_flags); i++) {
1947 efx_filter_match_flags_t flag = sfc_flow_copy_flags[i].flag;
1949 if ((flag & min_miss_flags) == flag) {
1950 rc = sfc_flow_spec_add_match_flag(spec, flag, error);
1960 * Check that set of match flags is referred to by a filter. Filter is
1961 * described by match flags with the ability to add OUTER_VID and INNER_VID
1964 * @param match_flags[in]
1965 * Set of match flags.
1966 * @param flags_pattern[in]
1967 * Pattern of filter match flags.
1970 sfc_flow_is_match_with_vids(efx_filter_match_flags_t match_flags,
1971 efx_filter_match_flags_t flags_pattern)
1973 if ((match_flags & flags_pattern) != flags_pattern)
1976 switch (match_flags & ~flags_pattern) {
1978 case EFX_FILTER_MATCH_OUTER_VID:
1979 case EFX_FILTER_MATCH_OUTER_VID | EFX_FILTER_MATCH_INNER_VID:
1987 * Check whether the spec maps to a hardware filter which is known to be
1988 * ineffective despite being valid.
1991 * SFC flow specification.
1994 sfc_flow_is_match_flags_exception(struct sfc_flow_spec *spec)
1997 uint16_t ether_type;
1999 efx_filter_match_flags_t match_flags;
2001 for (i = 0; i < spec->count; i++) {
2002 match_flags = spec->filters[i].efs_match_flags;
2004 if (sfc_flow_is_match_with_vids(match_flags,
2005 EFX_FILTER_MATCH_ETHER_TYPE) ||
2006 sfc_flow_is_match_with_vids(match_flags,
2007 EFX_FILTER_MATCH_ETHER_TYPE |
2008 EFX_FILTER_MATCH_LOC_MAC)) {
2009 ether_type = spec->filters[i].efs_ether_type;
2010 if (ether_type == EFX_ETHER_TYPE_IPV4 ||
2011 ether_type == EFX_ETHER_TYPE_IPV6)
2013 } else if (sfc_flow_is_match_with_vids(match_flags,
2014 EFX_FILTER_MATCH_ETHER_TYPE |
2015 EFX_FILTER_MATCH_IP_PROTO) ||
2016 sfc_flow_is_match_with_vids(match_flags,
2017 EFX_FILTER_MATCH_ETHER_TYPE |
2018 EFX_FILTER_MATCH_IP_PROTO |
2019 EFX_FILTER_MATCH_LOC_MAC)) {
2020 ip_proto = spec->filters[i].efs_ip_proto;
2021 if (ip_proto == EFX_IPPROTO_TCP ||
2022 ip_proto == EFX_IPPROTO_UDP)
2031 sfc_flow_validate_match_flags(struct sfc_adapter *sa,
2032 struct rte_flow *flow,
2033 struct rte_flow_error *error)
2035 efx_filter_spec_t *spec_tmpl = &flow->spec.template;
2036 efx_filter_match_flags_t match_flags = spec_tmpl->efs_match_flags;
2039 /* Initialize the first filter spec with template */
2040 flow->spec.filters[0] = *spec_tmpl;
2041 flow->spec.count = 1;
2043 if (!sfc_filter_is_match_supported(sa, match_flags)) {
2044 rc = sfc_flow_spec_filters_complete(sa, &flow->spec, error);
2049 if (sfc_flow_is_match_flags_exception(&flow->spec)) {
2050 rte_flow_error_set(error, ENOTSUP,
2051 RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
2052 "The flow rule pattern is unsupported");
2060 sfc_flow_parse(struct rte_eth_dev *dev,
2061 const struct rte_flow_attr *attr,
2062 const struct rte_flow_item pattern[],
2063 const struct rte_flow_action actions[],
2064 struct rte_flow *flow,
2065 struct rte_flow_error *error)
2067 struct sfc_adapter *sa = dev->data->dev_private;
2070 rc = sfc_flow_parse_attr(attr, flow, error);
2072 goto fail_bad_value;
2074 rc = sfc_flow_parse_pattern(pattern, flow, error);
2076 goto fail_bad_value;
2078 rc = sfc_flow_parse_actions(sa, actions, flow, error);
2080 goto fail_bad_value;
2082 rc = sfc_flow_validate_match_flags(sa, flow, error);
2084 goto fail_bad_value;
2093 sfc_flow_validate(struct rte_eth_dev *dev,
2094 const struct rte_flow_attr *attr,
2095 const struct rte_flow_item pattern[],
2096 const struct rte_flow_action actions[],
2097 struct rte_flow_error *error)
2099 struct rte_flow flow;
2101 memset(&flow, 0, sizeof(flow));
2103 return sfc_flow_parse(dev, attr, pattern, actions, &flow, error);
2106 static struct rte_flow *
2107 sfc_flow_create(struct rte_eth_dev *dev,
2108 const struct rte_flow_attr *attr,
2109 const struct rte_flow_item pattern[],
2110 const struct rte_flow_action actions[],
2111 struct rte_flow_error *error)
2113 struct sfc_adapter *sa = dev->data->dev_private;
2114 struct rte_flow *flow = NULL;
2117 flow = rte_zmalloc("sfc_rte_flow", sizeof(*flow), 0);
2119 rte_flow_error_set(error, ENOMEM,
2120 RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
2121 "Failed to allocate memory");
2125 rc = sfc_flow_parse(dev, attr, pattern, actions, flow, error);
2127 goto fail_bad_value;
2129 TAILQ_INSERT_TAIL(&sa->filter.flow_list, flow, entries);
2131 sfc_adapter_lock(sa);
2133 if (sa->state == SFC_ADAPTER_STARTED) {
2134 rc = sfc_flow_filter_insert(sa, flow);
2136 rte_flow_error_set(error, rc,
2137 RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
2138 "Failed to insert filter");
2139 goto fail_filter_insert;
2143 sfc_adapter_unlock(sa);
2148 TAILQ_REMOVE(&sa->filter.flow_list, flow, entries);
2152 sfc_adapter_unlock(sa);
2159 sfc_flow_remove(struct sfc_adapter *sa,
2160 struct rte_flow *flow,
2161 struct rte_flow_error *error)
2165 SFC_ASSERT(sfc_adapter_is_locked(sa));
2167 if (sa->state == SFC_ADAPTER_STARTED) {
2168 rc = sfc_flow_filter_remove(sa, flow);
2170 rte_flow_error_set(error, rc,
2171 RTE_FLOW_ERROR_TYPE_UNSPECIFIED, NULL,
2172 "Failed to destroy flow rule");
2175 TAILQ_REMOVE(&sa->filter.flow_list, flow, entries);
2182 sfc_flow_destroy(struct rte_eth_dev *dev,
2183 struct rte_flow *flow,
2184 struct rte_flow_error *error)
2186 struct sfc_adapter *sa = dev->data->dev_private;
2187 struct rte_flow *flow_ptr;
2190 sfc_adapter_lock(sa);
2192 TAILQ_FOREACH(flow_ptr, &sa->filter.flow_list, entries) {
2193 if (flow_ptr == flow)
2197 rte_flow_error_set(error, rc,
2198 RTE_FLOW_ERROR_TYPE_HANDLE, NULL,
2199 "Failed to find flow rule to destroy");
2200 goto fail_bad_value;
2203 rc = sfc_flow_remove(sa, flow, error);
2206 sfc_adapter_unlock(sa);
2212 sfc_flow_flush(struct rte_eth_dev *dev,
2213 struct rte_flow_error *error)
2215 struct sfc_adapter *sa = dev->data->dev_private;
2216 struct rte_flow *flow;
2220 sfc_adapter_lock(sa);
2222 while ((flow = TAILQ_FIRST(&sa->filter.flow_list)) != NULL) {
2223 rc = sfc_flow_remove(sa, flow, error);
2228 sfc_adapter_unlock(sa);
2234 sfc_flow_isolate(struct rte_eth_dev *dev, int enable,
2235 struct rte_flow_error *error)
2237 struct sfc_adapter *sa = dev->data->dev_private;
2238 struct sfc_port *port = &sa->port;
2241 sfc_adapter_lock(sa);
2242 if (sa->state != SFC_ADAPTER_INITIALIZED) {
2243 rte_flow_error_set(error, EBUSY,
2244 RTE_FLOW_ERROR_TYPE_UNSPECIFIED,
2245 NULL, "please close the port first");
2248 port->isolated = (enable) ? B_TRUE : B_FALSE;
2250 sfc_adapter_unlock(sa);
2255 const struct rte_flow_ops sfc_flow_ops = {
2256 .validate = sfc_flow_validate,
2257 .create = sfc_flow_create,
2258 .destroy = sfc_flow_destroy,
2259 .flush = sfc_flow_flush,
2261 .isolate = sfc_flow_isolate,
2265 sfc_flow_init(struct sfc_adapter *sa)
2267 SFC_ASSERT(sfc_adapter_is_locked(sa));
2269 TAILQ_INIT(&sa->filter.flow_list);
2273 sfc_flow_fini(struct sfc_adapter *sa)
2275 struct rte_flow *flow;
2277 SFC_ASSERT(sfc_adapter_is_locked(sa));
2279 while ((flow = TAILQ_FIRST(&sa->filter.flow_list)) != NULL) {
2280 TAILQ_REMOVE(&sa->filter.flow_list, flow, entries);
2286 sfc_flow_stop(struct sfc_adapter *sa)
2288 struct rte_flow *flow;
2290 SFC_ASSERT(sfc_adapter_is_locked(sa));
2292 TAILQ_FOREACH(flow, &sa->filter.flow_list, entries)
2293 sfc_flow_filter_remove(sa, flow);
2297 sfc_flow_start(struct sfc_adapter *sa)
2299 struct rte_flow *flow;
2302 sfc_log_init(sa, "entry");
2304 SFC_ASSERT(sfc_adapter_is_locked(sa));
2306 TAILQ_FOREACH(flow, &sa->filter.flow_list, entries) {
2307 rc = sfc_flow_filter_insert(sa, flow);
2312 sfc_log_init(sa, "done");