4 * Copyright(c) 2010-2016 Intel Corporation. All rights reserved.
7 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following conditions
11 * * Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 * * Redistributions in binary form must reproduce the above copyright
14 * notice, this list of conditions and the following disclaimer in
15 * the documentation and/or other materials provided with the
17 * * Neither the name of Intel Corporation nor the names of its
18 * contributors may be used to endorse or promote products derived
19 * from this software without specific prior written permission.
21 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
22 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
23 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
24 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
25 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
26 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
27 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
28 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
29 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
30 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
31 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
38 #include <sys/types.h>
40 #include <sys/queue.h>
46 #include <rte_debug.h>
47 #include <rte_ether.h>
48 #include <rte_ethdev.h>
49 #include <rte_mempool.h>
50 #include <rte_cycles.h>
/*
 * One IPv4 route for the LPM table. Entries are initialised positionally as
 * {address, prefix depth, output interface} in ipv4_l3fwd_lpm_route_array and
 * are read back through the members .ip, .depth and .if_out in setup_lpm().
 * NOTE(review): the member declarations are not visible in this excerpt.
 */
60 struct ipv4_l3fwd_lpm_route {
/*
 * One IPv6 route for the LPM6 table. Entries are initialised positionally as
 * {16-element address, prefix depth, output interface} in
 * ipv6_l3fwd_lpm_route_array and are read back through the members .ip,
 * .depth and .if_out in setup_lpm().
 * NOTE(review): the member declarations are not visible in this excerpt.
 */
66 struct ipv6_l3fwd_lpm_route {
/*
 * Built-in IPv4 routes: eight entries IPv4(N, 1, 1, 0) with depth 24 for
 * N = 1..8, each mapped to output interface N - 1.
 * setup_lpm() installs only the entries whose output-interface bit is set in
 * enabled_port_mask.
 */
72 static struct ipv4_l3fwd_lpm_route ipv4_l3fwd_lpm_route_array[] = {
73 {IPv4(1, 1, 1, 0), 24, 0},
74 {IPv4(2, 1, 1, 0), 24, 1},
75 {IPv4(3, 1, 1, 0), 24, 2},
76 {IPv4(4, 1, 1, 0), 24, 3},
77 {IPv4(5, 1, 1, 0), 24, 4},
78 {IPv4(6, 1, 1, 0), 24, 5},
79 {IPv4(7, 1, 1, 0), 24, 6},
80 {IPv4(8, 1, 1, 0), 24, 7},
/*
 * Built-in IPv6 routes: eight entries with depth 48 whose 16-element address
 * has first element N (N = 1..8) and every other element 1, each mapped to
 * output interface N - 1.
 * setup_lpm() installs only the entries whose output-interface bit is set in
 * enabled_port_mask.
 */
83 static struct ipv6_l3fwd_lpm_route ipv6_l3fwd_lpm_route_array[] = {
84 {{1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1}, 48, 0},
85 {{2, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1}, 48, 1},
86 {{3, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1}, 48, 2},
87 {{4, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1}, 48, 3},
88 {{5, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1}, 48, 4},
89 {{6, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1}, 48, 5},
90 {{7, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1}, 48, 6},
91 {{8, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1}, 48, 7},
/*
 * Number of entries in each built-in route table, computed with sizeof so the
 * counts follow the array initialisers. Used as the loop bounds in setup_lpm().
 */
94 #define IPV4_L3FWD_LPM_NUM_ROUTES \
95 (sizeof(ipv4_l3fwd_lpm_route_array) / sizeof(ipv4_l3fwd_lpm_route_array[0]))
96 #define IPV6_L3FWD_LPM_NUM_ROUTES \
97 (sizeof(ipv6_l3fwd_lpm_route_array) / sizeof(ipv6_l3fwd_lpm_route_array[0]))
/*
 * Table sizing that setup_lpm() copies into the max_rules and number_tbl8s
 * fields of the LPM configs: 1024 rules each, with 256 tbl8s for the IPv4
 * table and 65536 tbl8s for the IPv6 table.
 */
99 #define IPV4_L3FWD_LPM_MAX_RULES 1024
100 #define IPV4_L3FWD_LPM_NUMBER_TBL8S (1 << 8)
101 #define IPV6_L3FWD_LPM_MAX_RULES 1024
102 #define IPV6_L3FWD_LPM_NUMBER_TBL8S (1 << 16)
/*
 * LPM and LPM6 table handles, one slot per socket id. setup_lpm() fills slot
 * [socketid]; the lpm_get_ipv4/ipv6_l3fwd_lookup_struct() accessors return it.
 * NB_SOCKETS is defined outside this excerpt.
 */
104 struct rte_lpm *ipv4_l3fwd_lpm_lookup_struct[NB_SOCKETS];
105 struct rte_lpm6 *ipv6_l3fwd_lpm_lookup_struct[NB_SOCKETS];
/*
 * Look up the output port for an IPv4 header.
 *
 * ipv4_hdr is read as a struct ipv4_hdr and lookup_struct as a struct rte_lpm.
 * The destination address is converted from big-endian to CPU byte order
 * before being passed to rte_lpm_lookup().
 * Returns next_hop when the lookup returns 0, otherwise the caller-supplied
 * portid.
 * NOTE(review): the declaration of next_hop is not visible in this excerpt.
 */
107 static inline uint16_t
108 lpm_get_ipv4_dst_port(void *ipv4_hdr, uint8_t portid, void *lookup_struct)
111 struct rte_lpm *ipv4_l3fwd_lookup_struct =
112 (struct rte_lpm *)lookup_struct;
114 return (uint16_t) ((rte_lpm_lookup(ipv4_l3fwd_lookup_struct,
115 rte_be_to_cpu_32(((struct ipv4_hdr *)ipv4_hdr)->dst_addr),
116 &next_hop) == 0) ? next_hop : portid);
/*
 * Look up the output port for an IPv6 header.
 *
 * ipv6_hdr is read as a struct ipv6_hdr and lookup_struct as a struct
 * rte_lpm6. The header's dst_addr is passed to rte_lpm6_lookup() as is, with
 * no byte-order conversion.
 * Returns next_hop when the lookup returns 0, otherwise the caller-supplied
 * portid.
 * NOTE(review): the declaration of next_hop is not visible in this excerpt.
 */
119 static inline uint16_t
120 lpm_get_ipv6_dst_port(void *ipv6_hdr, uint8_t portid, void *lookup_struct)
123 struct rte_lpm6 *ipv6_l3fwd_lookup_struct =
124 (struct rte_lpm6 *)lookup_struct;
126 return (uint16_t) ((rte_lpm6_lookup(ipv6_l3fwd_lookup_struct,
127 ((struct ipv6_hdr *)ipv6_hdr)->dst_addr,
128 &next_hop) == 0) ? next_hop : portid);
/*
 * Pick the output port for a packet according to pkt->packet_type.
 *
 * For an IPv4 packet type the L3 header is taken to start immediately after
 * the Ethernet header (eth_hdr + 1) and is resolved with
 * lpm_get_ipv4_dst_port() against qconf->ipv4_lookup_struct. An IPv6 packet
 * type is handled the same way with lpm_get_ipv6_dst_port() and
 * qconf->ipv6_lookup_struct.
 * NOTE(review): the rest of the parameter list (which supplies portid) and
 * the result for packets that are neither IPv4 nor IPv6 are on lines not
 * visible in this excerpt.
 */
131 static __rte_always_inline uint16_t
132 lpm_get_dst_port(const struct lcore_conf *qconf, struct rte_mbuf *pkt,
135 struct ipv6_hdr *ipv6_hdr;
136 struct ipv4_hdr *ipv4_hdr;
137 struct ether_hdr *eth_hdr;
139 if (RTE_ETH_IS_IPV4_HDR(pkt->packet_type)) {
141 eth_hdr = rte_pktmbuf_mtod(pkt, struct ether_hdr *);
142 ipv4_hdr = (struct ipv4_hdr *)(eth_hdr + 1);
144 return lpm_get_ipv4_dst_port(ipv4_hdr, portid,
145 qconf->ipv4_lookup_struct);
146 } else if (RTE_ETH_IS_IPV6_HDR(pkt->packet_type)) {
148 eth_hdr = rte_pktmbuf_mtod(pkt, struct ether_hdr *);
149 ipv6_hdr = (struct ipv6_hdr *)(eth_hdr + 1);
151 return lpm_get_ipv6_dst_port(ipv6_hdr, portid,
152 qconf->ipv6_lookup_struct);
159 * lpm_get_dst_port optimized routine for packets where dst_ipv4 is already
160 * precalculated. If the packet is IPv6, dst_addr is taken directly from the
161 * packet header and the dst_ipv4 value is not used.
/*
 * Pick the output port for a packet whose IPv4 destination address the caller
 * has already extracted.
 *
 * For an IPv4 packet type, dst_ipv4 is passed straight to rte_lpm_lookup() on
 * qconf->ipv4_lookup_struct without touching the packet data. For an IPv6
 * packet type, the header following the Ethernet header is read and its
 * dst_addr is looked up in qconf->ipv6_lookup_struct; dst_ipv4 is ignored.
 * In both cases the result is next_hop when the lookup returns 0, otherwise
 * portid.
 * NOTE(review): dst_ipv4 is presumably expected in CPU byte order, as
 * lpm_get_ipv4_dst_port() converts with rte_be_to_cpu_32() before the same
 * lookup; confirm against callers. The declaration of next_hop and the result
 * for other packet types are not visible in this excerpt.
 */
163 static __rte_always_inline uint16_t
164 lpm_get_dst_port_with_ipv4(const struct lcore_conf *qconf, struct rte_mbuf *pkt,
165 uint32_t dst_ipv4, uint8_t portid)
168 struct ipv6_hdr *ipv6_hdr;
169 struct ether_hdr *eth_hdr;
171 if (RTE_ETH_IS_IPV4_HDR(pkt->packet_type)) {
172 return (uint16_t) ((rte_lpm_lookup(qconf->ipv4_lookup_struct,
173 dst_ipv4, &next_hop) == 0)
174 ? next_hop : portid);
176 } else if (RTE_ETH_IS_IPV6_HDR(pkt->packet_type)) {
178 eth_hdr = rte_pktmbuf_mtod(pkt, struct ether_hdr *);
179 ipv6_hdr = (struct ipv6_hdr *)(eth_hdr + 1);
181 return (uint16_t) ((rte_lpm6_lookup(qconf->ipv6_lookup_struct,
182 ipv6_hdr->dst_addr, &next_hop) == 0)
183 ? next_hop : portid);
190 #if defined(RTE_ARCH_X86)
191 #include "l3fwd_lpm_sse.h"
192 #elif defined RTE_MACHINE_CPUFLAG_NEON
193 #include "l3fwd_lpm_neon.h"
195 #include "l3fwd_lpm.h"
/*
 * Per-lcore forwarding loop. The dummy argument is unused.
 *
 * Uses the lcore_conf entry of the calling lcore (rte_lcore_id()). If that
 * lcore has no RX queues, it logs "has nothing to do". Otherwise it logs each
 * assigned port/queue pair and then, until force_quit becomes non-zero,
 * repeats two steps:
 *   1. once more than drain_tsc TSC cycles have passed since prev_tsc, walk
 *      the lcore's TX ports and reset the length of every non-empty tx_mbufs
 *      entry;
 *   2. call rte_eth_rx_burst() on every RX queue of the lcore and hand the
 *      burst to l3fwd_lpm_send_packets() when RTE_ARCH_X86 or
 *      RTE_MACHINE_CPUFLAG_NEON is defined, or to
 *      l3fwd_lpm_no_opt_send_packets() otherwise.
 * NOTE(review): many lines of this function are not visible in this excerpt.
 * Missing are the return type, several local declarations, the early exit for
 * an idle lcore, the call that transmits the drained buffers, the update of
 * prev_tsc, and the handling of an empty RX burst.
 */
198 /* main processing loop */
200 lpm_main_loop(__attribute__((unused)) void *dummy)
202 struct rte_mbuf *pkts_burst[MAX_PKT_BURST];
204 uint64_t prev_tsc, diff_tsc, cur_tsc;
206 uint8_t portid, queueid;
207 struct lcore_conf *qconf;
/*
 * Drain interval in TSC cycles: ceil(tsc_hz / US_PER_S) * BURST_TX_DRAIN_US
 * (the division is evaluated before the multiplication).
 */
208 const uint64_t drain_tsc = (rte_get_tsc_hz() + US_PER_S - 1) /
209 US_PER_S * BURST_TX_DRAIN_US;
213 lcore_id = rte_lcore_id();
214 qconf = &lcore_conf[lcore_id];
/* An lcore without RX queues has no work to poll for. */
216 if (qconf->n_rx_queue == 0) {
217 RTE_LOG(INFO, L3FWD, "lcore %u has nothing to do\n", lcore_id);
221 RTE_LOG(INFO, L3FWD, "entering main loop on lcore %u\n", lcore_id);
223 for (i = 0; i < qconf->n_rx_queue; i++) {
225 portid = qconf->rx_queue_list[i].port_id;
226 queueid = qconf->rx_queue_list[i].queue_id;
228 " -- lcoreid=%u portid=%hhu rxqueueid=%hhu\n",
229 lcore_id, portid, queueid);
232 while (!force_quit) {
234 cur_tsc = rte_rdtsc();
237 * TX burst queue drain
239 diff_tsc = cur_tsc - prev_tsc;
240 if (unlikely(diff_tsc > drain_tsc)) {
242 for (i = 0; i < qconf->n_tx_port; ++i) {
243 portid = qconf->tx_port_id[i];
244 if (qconf->tx_mbufs[portid].len == 0)
247 qconf->tx_mbufs[portid].len,
249 qconf->tx_mbufs[portid].len = 0;
256 * Read packet from RX queues
258 for (i = 0; i < qconf->n_rx_queue; ++i) {
259 portid = qconf->rx_queue_list[i].port_id;
260 queueid = qconf->rx_queue_list[i].queue_id;
261 nb_rx = rte_eth_rx_burst(portid, queueid, pkts_burst,
266 #if defined RTE_ARCH_X86 || defined RTE_MACHINE_CPUFLAG_NEON
267 l3fwd_lpm_send_packets(nb_rx, pkts_burst,
270 l3fwd_lpm_no_opt_send_packets(nb_rx, pkts_burst,
/*
 * Create and populate the IPv4 and IPv6 LPM tables for one socket.
 *
 * socketid selects the slot in ipv4_l3fwd_lpm_lookup_struct[] and
 * ipv6_l3fwd_lpm_lookup_struct[]. It is also passed to the create calls and
 * embedded in the table names ("IPV4_L3FWD_LPM_<id>", "IPV6_L3FWD_LPM_<id>").
 *
 * For each address family the function creates the table and calls
 * rte_exit(EXIT_FAILURE, ...) if creation returns NULL. It then walks the
 * built-in route array, skips routes whose output interface is not enabled in
 * enabled_port_mask, adds the rest and prints each added route.
 * NOTE(review): the return type, the declarations of s, i and ret, the
 * "continue" of the skip test, and the condition guarding the add-failure
 * rte_exit() are on lines not visible in this excerpt.
 * NOTE(review): the IPv4 and IPv6 failure messages are worded identically
 * ("l3fwd LPM table"), so the log alone does not tell which table failed.
 */
280 setup_lpm(const int socketid)
282 struct rte_lpm6_config config;
283 struct rte_lpm_config config_ipv4;
288 /* create the LPM table */
289 config_ipv4.max_rules = IPV4_L3FWD_LPM_MAX_RULES;
290 config_ipv4.number_tbl8s = IPV4_L3FWD_LPM_NUMBER_TBL8S;
291 config_ipv4.flags = 0;
292 snprintf(s, sizeof(s), "IPV4_L3FWD_LPM_%d", socketid);
293 ipv4_l3fwd_lpm_lookup_struct[socketid] =
294 rte_lpm_create(s, socketid, &config_ipv4);
295 if (ipv4_l3fwd_lpm_lookup_struct[socketid] == NULL)
296 rte_exit(EXIT_FAILURE,
297 "Unable to create the l3fwd LPM table on socket %d\n",
300 /* populate the LPM table */
301 for (i = 0; i < IPV4_L3FWD_LPM_NUM_ROUTES; i++) {
303 /* skip unused ports: bit if_out of enabled_port_mask is clear ('<<' binds tighter than '&') */
304 if ((1 << ipv4_l3fwd_lpm_route_array[i].if_out &
305 enabled_port_mask) == 0)
/* The route's output interface doubles as the next hop stored in the table. */
308 ret = rte_lpm_add(ipv4_l3fwd_lpm_lookup_struct[socketid],
309 ipv4_l3fwd_lpm_route_array[i].ip,
310 ipv4_l3fwd_lpm_route_array[i].depth,
311 ipv4_l3fwd_lpm_route_array[i].if_out);
314 rte_exit(EXIT_FAILURE,
315 "Unable to add entry %u to the l3fwd LPM table on socket %d\n",
319 printf("LPM: Adding route 0x%08x / %d (%d)\n",
320 (unsigned)ipv4_l3fwd_lpm_route_array[i].ip,
321 ipv4_l3fwd_lpm_route_array[i].depth,
322 ipv4_l3fwd_lpm_route_array[i].if_out);
325 /* create the LPM6 table */
326 snprintf(s, sizeof(s), "IPV6_L3FWD_LPM_%d", socketid);
328 config.max_rules = IPV6_L3FWD_LPM_MAX_RULES;
329 config.number_tbl8s = IPV6_L3FWD_LPM_NUMBER_TBL8S;
331 ipv6_l3fwd_lpm_lookup_struct[socketid] = rte_lpm6_create(s, socketid,
333 if (ipv6_l3fwd_lpm_lookup_struct[socketid] == NULL)
334 rte_exit(EXIT_FAILURE,
335 "Unable to create the l3fwd LPM table on socket %d\n",
338 /* populate the LPM6 table */
339 for (i = 0; i < IPV6_L3FWD_LPM_NUM_ROUTES; i++) {
341 /* skip unused ports: bit if_out of enabled_port_mask is clear ('<<' binds tighter than '&') */
342 if ((1 << ipv6_l3fwd_lpm_route_array[i].if_out &
343 enabled_port_mask) == 0)
346 ret = rte_lpm6_add(ipv6_l3fwd_lpm_lookup_struct[socketid],
347 ipv6_l3fwd_lpm_route_array[i].ip,
348 ipv6_l3fwd_lpm_route_array[i].depth,
349 ipv6_l3fwd_lpm_route_array[i].if_out);
352 rte_exit(EXIT_FAILURE,
353 "Unable to add entry %u to the l3fwd LPM table on socket %d\n",
357 printf("LPM: Adding route %s / %d (%d)\n",
359 ipv6_l3fwd_lpm_route_array[i].depth,
360 ipv6_l3fwd_lpm_route_array[i].if_out);
/*
 * Check whether a port reports both the IPv4 and the IPv6 L3 packet types.
 *
 * Calls rte_eth_dev_get_supported_ptypes() twice with RTE_PTYPE_L3_MASK:
 * first with a NULL buffer to obtain a count, then with a variable-length
 * array of that many entries to fetch the values. Each returned ptype is
 * tested against RTE_PTYPE_L3_IPV4 and RTE_PTYPE_L3_IPV6. A message is
 * printed for each family that ends up with its flag still 0.
 * NOTE(review): the return type, the declarations of ret and i, any check of
 * the first call's result before it sizes ptypes[], the statements that set
 * the two flags, and the return statements are on lines not visible in this
 * excerpt. Confirm that a non-positive count is rejected before the array is
 * declared.
 */
365 lpm_check_ptype(int portid)
368 int ptype_l3_ipv4 = 0, ptype_l3_ipv6 = 0;
369 uint32_t ptype_mask = RTE_PTYPE_L3_MASK;
371 ret = rte_eth_dev_get_supported_ptypes(portid, ptype_mask, NULL, 0);
375 uint32_t ptypes[ret];
377 ret = rte_eth_dev_get_supported_ptypes(portid, ptype_mask, ptypes, ret);
378 for (i = 0; i < ret; ++i) {
379 if (ptypes[i] & RTE_PTYPE_L3_IPV4)
381 if (ptypes[i] & RTE_PTYPE_L3_IPV6)
385 if (ptype_l3_ipv4 == 0)
386 printf("port %d cannot parse RTE_PTYPE_L3_IPV4\n", portid);
388 if (ptype_l3_ipv6 == 0)
389 printf("port %d cannot parse RTE_PTYPE_L3_IPV6\n", portid);
391 if (ptype_l3_ipv4 && ptype_l3_ipv6)
/*
 * Classify a packet in software from its Ethernet type and store the result
 * in m->packet_type.
 *
 * The ether_type field is compared, still in its stored byte order, against
 * ETHER_TYPE_IPv4 and ETHER_TYPE_IPv6 converted with rte_cpu_to_be_16().
 * The packet type becomes RTE_PTYPE_L3_IPV4_EXT_UNKNOWN or
 * RTE_PTYPE_L3_IPV6_EXT_UNKNOWN on a match and stays RTE_PTYPE_UNKNOWN
 * otherwise. Any previous value of m->packet_type is overwritten.
 * NOTE(review): the return type and the declaration of ether_type are not
 * visible in this excerpt.
 */
399 lpm_parse_ptype(struct rte_mbuf *m)
401 struct ether_hdr *eth_hdr;
402 uint32_t packet_type = RTE_PTYPE_UNKNOWN;
405 eth_hdr = rte_pktmbuf_mtod(m, struct ether_hdr *);
406 ether_type = eth_hdr->ether_type;
407 if (ether_type == rte_cpu_to_be_16(ETHER_TYPE_IPv4))
408 packet_type |= RTE_PTYPE_L3_IPV4_EXT_UNKNOWN;
409 else if (ether_type == rte_cpu_to_be_16(ETHER_TYPE_IPv6))
410 packet_type |= RTE_PTYPE_L3_IPV6_EXT_UNKNOWN;
412 m->packet_type = packet_type;
/*
 * Run lpm_parse_ptype() on each of the nb_pkts packets in pkts[].
 * port, queue, max_pkts and user_param are unused.
 * NOTE(review): the parameter list looks like an ethdev RX callback; confirm
 * at the registration site. The return type, the declaration of i and the
 * return statement are not visible in this excerpt.
 */
416 lpm_cb_parse_ptype(uint8_t port __rte_unused, uint16_t queue __rte_unused,
417 struct rte_mbuf *pkts[], uint16_t nb_pkts,
418 uint16_t max_pkts __rte_unused,
419 void *user_param __rte_unused)
423 for (i = 0; i < nb_pkts; ++i)
424 lpm_parse_ptype(pkts[i]);
/*
 * Accessor for the IPv4 LPM table stored in slot socketid of
 * ipv4_l3fwd_lpm_lookup_struct[]. socketid is used as an index without a
 * range check in the visible code.
 * NOTE(review): the return type is on a line not visible in this excerpt.
 */
429 /* Return ipv4/ipv6 lpm fwd lookup struct. */
431 lpm_get_ipv4_l3fwd_lookup_struct(const int socketid)
433 return ipv4_l3fwd_lpm_lookup_struct[socketid];
/*
 * Accessor for the IPv6 LPM table stored in slot socketid of
 * ipv6_l3fwd_lpm_lookup_struct[]. socketid is used as an index without a
 * range check in the visible code.
 * NOTE(review): the return type is on a line not visible in this excerpt.
 */
437 lpm_get_ipv6_l3fwd_lookup_struct(const int socketid)
439 return ipv6_l3fwd_lpm_lookup_struct[socketid];