remove extra parentheses in return statement
[dpdk.git] / examples / l3fwd / main.c
index def9594..c35926d 100644 (file)
@@ -1,7 +1,7 @@
 /*-
  *   BSD LICENSE
  *
- *   Copyright(c) 2010-2014 Intel Corporation. All rights reserved.
+ *   Copyright(c) 2010-2015 Intel Corporation. All rights reserved.
  *   All rights reserved.
  *
  *   Redistribution and use in source and binary forms, with or without
@@ -41,6 +41,8 @@
 #include <stdarg.h>
 #include <errno.h>
 #include <getopt.h>
+#include <signal.h>
+#include <stdbool.h>
 
 #include <rte_common.h>
 #include <rte_vect.h>
@@ -75,6 +77,8 @@
 #include <cmdline_parse.h>
 #include <cmdline_parse_etheraddr.h>
 
+static volatile bool force_quit;
+
 #define APP_LOOKUP_EXACT_MATCH          0
 #define APP_LOOKUP_LPM                  1
 #define DO_RFC_1812_CHECKS
@@ -373,7 +377,7 @@ ipv4_hash_crc(const void *data, __rte_unused uint32_t data_len,
        init_val = rte_jhash_1word(k->ip_dst, init_val);
        init_val = rte_jhash_1word(*p, init_val);
 #endif /* RTE_MACHINE_CPUFLAG_SSE4_2 */
-       return (init_val);
+       return init_val;
 }
 
 static inline uint32_t
@@ -416,7 +420,7 @@ ipv6_hash_crc(const void *data, __rte_unused uint32_t data_len, uint32_t init_va
        init_val = rte_jhash(k->ip_dst, sizeof(uint8_t) * IPV6_ADDR_LEN, init_val);
        init_val = rte_jhash_1word(*p, init_val);
 #endif /* RTE_MACHINE_CPUFLAG_SSE4_2 */
-       return (init_val);
+       return init_val;
 }
 
 #define IPV4_L3FWD_NUM_ROUTES \
@@ -541,6 +545,7 @@ send_single_packet(struct rte_mbuf *m, uint8_t port)
        return 0;
 }
 
+#if (APP_LOOKUP_METHOD == APP_LOOKUP_LPM)
 static inline __attribute__((always_inline)) void
 send_packetsx4(struct lcore_conf *qconf, uint8_t port,
        struct rte_mbuf *m[], uint32_t num)
@@ -618,6 +623,7 @@ send_packetsx4(struct lcore_conf *qconf, uint8_t port,
 
        qconf->tx_mbufs[port].len = len;
 }
+#endif /* APP_LOOKUP_LPM */
 
 #ifdef DO_RFC_1812_CHECKS
 static inline int
@@ -731,26 +737,34 @@ static inline void l3fwd_simple_forward(struct rte_mbuf *m, uint8_t portid,
 #if ((APP_LOOKUP_METHOD == APP_LOOKUP_EXACT_MATCH) && \
        (ENABLE_MULTI_BUFFER_OPTIMIZE == 1))
 
-#define MASK_ALL_PKTS    0xf
-#define EXECLUDE_1ST_PKT 0xe
-#define EXECLUDE_2ND_PKT 0xd
-#define EXECLUDE_3RD_PKT 0xb
-#define EXECLUDE_4TH_PKT 0x7
+#define MASK_ALL_PKTS    0xff
+#define EXCLUDE_1ST_PKT 0xfe
+#define EXCLUDE_2ND_PKT 0xfd
+#define EXCLUDE_3RD_PKT 0xfb
+#define EXCLUDE_4TH_PKT 0xf7
+#define EXCLUDE_5TH_PKT 0xef
+#define EXCLUDE_6TH_PKT 0xdf
+#define EXCLUDE_7TH_PKT 0xbf
+#define EXCLUDE_8TH_PKT 0x7f
 
 static inline void
-simple_ipv4_fwd_4pkts(struct rte_mbuf* m[4], uint8_t portid, struct lcore_conf *qconf)
+simple_ipv4_fwd_8pkts(struct rte_mbuf *m[8], uint8_t portid, struct lcore_conf *qconf)
 {
-       struct ether_hdr *eth_hdr[4];
-       struct ipv4_hdr *ipv4_hdr[4];
-       uint8_t dst_port[4];
-       int32_t ret[4];
-       union ipv4_5tuple_host key[4];
-       __m128i data[4];
+       struct ether_hdr *eth_hdr[8];
+       struct ipv4_hdr *ipv4_hdr[8];
+       uint8_t dst_port[8];
+       int32_t ret[8];
+       union ipv4_5tuple_host key[8];
+       __m128i data[8];
 
        eth_hdr[0] = rte_pktmbuf_mtod(m[0], struct ether_hdr *);
        eth_hdr[1] = rte_pktmbuf_mtod(m[1], struct ether_hdr *);
        eth_hdr[2] = rte_pktmbuf_mtod(m[2], struct ether_hdr *);
        eth_hdr[3] = rte_pktmbuf_mtod(m[3], struct ether_hdr *);
+       eth_hdr[4] = rte_pktmbuf_mtod(m[4], struct ether_hdr *);
+       eth_hdr[5] = rte_pktmbuf_mtod(m[5], struct ether_hdr *);
+       eth_hdr[6] = rte_pktmbuf_mtod(m[6], struct ether_hdr *);
+       eth_hdr[7] = rte_pktmbuf_mtod(m[7], struct ether_hdr *);
 
        /* Handle IPv4 headers.*/
        ipv4_hdr[0] = rte_pktmbuf_mtod_offset(m[0], struct ipv4_hdr *,
@@ -761,32 +775,56 @@ simple_ipv4_fwd_4pkts(struct rte_mbuf* m[4], uint8_t portid, struct lcore_conf *
                                              sizeof(struct ether_hdr));
        ipv4_hdr[3] = rte_pktmbuf_mtod_offset(m[3], struct ipv4_hdr *,
                                              sizeof(struct ether_hdr));
+       ipv4_hdr[4] = rte_pktmbuf_mtod_offset(m[4], struct ipv4_hdr *,
+                                             sizeof(struct ether_hdr));
+       ipv4_hdr[5] = rte_pktmbuf_mtod_offset(m[5], struct ipv4_hdr *,
+                                             sizeof(struct ether_hdr));
+       ipv4_hdr[6] = rte_pktmbuf_mtod_offset(m[6], struct ipv4_hdr *,
+                                             sizeof(struct ether_hdr));
+       ipv4_hdr[7] = rte_pktmbuf_mtod_offset(m[7], struct ipv4_hdr *,
+                                             sizeof(struct ether_hdr));
 
 #ifdef DO_RFC_1812_CHECKS
        /* Check to make sure the packet is valid (RFC1812) */
        uint8_t valid_mask = MASK_ALL_PKTS;
        if (is_valid_ipv4_pkt(ipv4_hdr[0], m[0]->pkt_len) < 0) {
                rte_pktmbuf_free(m[0]);
-               valid_mask &= EXECLUDE_1ST_PKT;
+               valid_mask &= EXCLUDE_1ST_PKT;
        }
        if (is_valid_ipv4_pkt(ipv4_hdr[1], m[1]->pkt_len) < 0) {
                rte_pktmbuf_free(m[1]);
-               valid_mask &= EXECLUDE_2ND_PKT;
+               valid_mask &= EXCLUDE_2ND_PKT;
        }
        if (is_valid_ipv4_pkt(ipv4_hdr[2], m[2]->pkt_len) < 0) {
                rte_pktmbuf_free(m[2]);
-               valid_mask &= EXECLUDE_3RD_PKT;
+               valid_mask &= EXCLUDE_3RD_PKT;
        }
        if (is_valid_ipv4_pkt(ipv4_hdr[3], m[3]->pkt_len) < 0) {
                rte_pktmbuf_free(m[3]);
-               valid_mask &= EXECLUDE_4TH_PKT;
+               valid_mask &= EXCLUDE_4TH_PKT;
+       }
+       if (is_valid_ipv4_pkt(ipv4_hdr[4], m[4]->pkt_len) < 0) {
+               rte_pktmbuf_free(m[4]);
+               valid_mask &= EXCLUDE_5TH_PKT;
+       }
+       if (is_valid_ipv4_pkt(ipv4_hdr[5], m[5]->pkt_len) < 0) {
+               rte_pktmbuf_free(m[5]);
+               valid_mask &= EXCLUDE_6TH_PKT;
+       }
+       if (is_valid_ipv4_pkt(ipv4_hdr[6], m[6]->pkt_len) < 0) {
+               rte_pktmbuf_free(m[6]);
+               valid_mask &= EXCLUDE_7TH_PKT;
+       }
+       if (is_valid_ipv4_pkt(ipv4_hdr[7], m[7]->pkt_len) < 0) {
+               rte_pktmbuf_free(m[7]);
+               valid_mask &= EXCLUDE_8TH_PKT;
        }
        if (unlikely(valid_mask != MASK_ALL_PKTS)) {
                if (valid_mask == 0){
                        return;
                } else {
                        uint8_t i = 0;
-                       for (i = 0; i < 4; i++) {
+                       for (i = 0; i < 8; i++) {
                                if ((0x1 << i) & valid_mask) {
                                        l3fwd_simple_forward(m[i], portid, qconf);
                                }
@@ -796,22 +834,52 @@ simple_ipv4_fwd_4pkts(struct rte_mbuf* m[4], uint8_t portid, struct lcore_conf *
        }
 #endif // End of #ifdef DO_RFC_1812_CHECKS
 
-       data[0] = _mm_loadu_si128(rte_pktmbuf_mtod_offset(m[0], __m128i *, sizeof(struct ether_hdr) + offsetof(struct ipv4_hdr, time_to_live)));
-       data[1] = _mm_loadu_si128(rte_pktmbuf_mtod_offset(m[1], __m128i *, sizeof(struct ether_hdr) + offsetof(struct ipv4_hdr, time_to_live)));
-       data[2] = _mm_loadu_si128(rte_pktmbuf_mtod_offset(m[2], __m128i *, sizeof(struct ether_hdr) + offsetof(struct ipv4_hdr, time_to_live)));
-       data[3] = _mm_loadu_si128(rte_pktmbuf_mtod_offset(m[3], __m128i *, sizeof(struct ether_hdr) + offsetof(struct ipv4_hdr, time_to_live)));
+       data[0] = _mm_loadu_si128(rte_pktmbuf_mtod_offset(m[0], __m128i *,
+                                       sizeof(struct ether_hdr) +
+                                       offsetof(struct ipv4_hdr, time_to_live)));
+       data[1] = _mm_loadu_si128(rte_pktmbuf_mtod_offset(m[1], __m128i *,
+                                       sizeof(struct ether_hdr) +
+                                       offsetof(struct ipv4_hdr, time_to_live)));
+       data[2] = _mm_loadu_si128(rte_pktmbuf_mtod_offset(m[2], __m128i *,
+                                       sizeof(struct ether_hdr) +
+                                       offsetof(struct ipv4_hdr, time_to_live)));
+       data[3] = _mm_loadu_si128(rte_pktmbuf_mtod_offset(m[3], __m128i *,
+                                       sizeof(struct ether_hdr) +
+                                       offsetof(struct ipv4_hdr, time_to_live)));
+       data[4] = _mm_loadu_si128(rte_pktmbuf_mtod_offset(m[4], __m128i *,
+                                       sizeof(struct ether_hdr) +
+                                       offsetof(struct ipv4_hdr, time_to_live)));
+       data[5] = _mm_loadu_si128(rte_pktmbuf_mtod_offset(m[5], __m128i *,
+                                       sizeof(struct ether_hdr) +
+                                       offsetof(struct ipv4_hdr, time_to_live)));
+       data[6] = _mm_loadu_si128(rte_pktmbuf_mtod_offset(m[6], __m128i *,
+                                       sizeof(struct ether_hdr) +
+                                       offsetof(struct ipv4_hdr, time_to_live)));
+       data[7] = _mm_loadu_si128(rte_pktmbuf_mtod_offset(m[7], __m128i *,
+                                       sizeof(struct ether_hdr) +
+                                       offsetof(struct ipv4_hdr, time_to_live)));
 
        key[0].xmm = _mm_and_si128(data[0], mask0);
        key[1].xmm = _mm_and_si128(data[1], mask0);
        key[2].xmm = _mm_and_si128(data[2], mask0);
        key[3].xmm = _mm_and_si128(data[3], mask0);
+       key[4].xmm = _mm_and_si128(data[4], mask0);
+       key[5].xmm = _mm_and_si128(data[5], mask0);
+       key[6].xmm = _mm_and_si128(data[6], mask0);
+       key[7].xmm = _mm_and_si128(data[7], mask0);
+
+       const void *key_array[8] = {&key[0], &key[1], &key[2], &key[3],
+                               &key[4], &key[5], &key[6], &key[7]};
 
-       const void *key_array[4] = {&key[0], &key[1], &key[2],&key[3]};
-       rte_hash_lookup_multi(qconf->ipv4_lookup_struct, &key_array[0], 4, ret);
+       rte_hash_lookup_multi(qconf->ipv4_lookup_struct, &key_array[0], 8, ret);
        dst_port[0] = (uint8_t) ((ret[0] < 0) ? portid : ipv4_l3fwd_out_if[ret[0]]);
        dst_port[1] = (uint8_t) ((ret[1] < 0) ? portid : ipv4_l3fwd_out_if[ret[1]]);
        dst_port[2] = (uint8_t) ((ret[2] < 0) ? portid : ipv4_l3fwd_out_if[ret[2]]);
        dst_port[3] = (uint8_t) ((ret[3] < 0) ? portid : ipv4_l3fwd_out_if[ret[3]]);
+       dst_port[4] = (uint8_t) ((ret[4] < 0) ? portid : ipv4_l3fwd_out_if[ret[4]]);
+       dst_port[5] = (uint8_t) ((ret[5] < 0) ? portid : ipv4_l3fwd_out_if[ret[5]]);
+       dst_port[6] = (uint8_t) ((ret[6] < 0) ? portid : ipv4_l3fwd_out_if[ret[6]]);
+       dst_port[7] = (uint8_t) ((ret[7] < 0) ? portid : ipv4_l3fwd_out_if[ret[7]]);
 
        if (dst_port[0] >= RTE_MAX_ETHPORTS || (enabled_port_mask & 1 << dst_port[0]) == 0)
                dst_port[0] = portid;
@@ -821,6 +889,14 @@ simple_ipv4_fwd_4pkts(struct rte_mbuf* m[4], uint8_t portid, struct lcore_conf *
                dst_port[2] = portid;
        if (dst_port[3] >= RTE_MAX_ETHPORTS || (enabled_port_mask & 1 << dst_port[3]) == 0)
                dst_port[3] = portid;
+       if (dst_port[4] >= RTE_MAX_ETHPORTS || (enabled_port_mask & 1 << dst_port[4]) == 0)
+               dst_port[4] = portid;
+       if (dst_port[5] >= RTE_MAX_ETHPORTS || (enabled_port_mask & 1 << dst_port[5]) == 0)
+               dst_port[5] = portid;
+       if (dst_port[6] >= RTE_MAX_ETHPORTS || (enabled_port_mask & 1 << dst_port[6]) == 0)
+               dst_port[6] = portid;
+       if (dst_port[7] >= RTE_MAX_ETHPORTS || (enabled_port_mask & 1 << dst_port[7]) == 0)
+               dst_port[7] = portid;
 
 #ifdef DO_RFC_1812_CHECKS
        /* Update time to live and header checksum */
@@ -832,6 +908,14 @@ simple_ipv4_fwd_4pkts(struct rte_mbuf* m[4], uint8_t portid, struct lcore_conf *
        ++(ipv4_hdr[1]->hdr_checksum);
        ++(ipv4_hdr[2]->hdr_checksum);
        ++(ipv4_hdr[3]->hdr_checksum);
+       --(ipv4_hdr[4]->time_to_live);
+       --(ipv4_hdr[5]->time_to_live);
+       --(ipv4_hdr[6]->time_to_live);
+       --(ipv4_hdr[7]->time_to_live);
+       ++(ipv4_hdr[4]->hdr_checksum);
+       ++(ipv4_hdr[5]->hdr_checksum);
+       ++(ipv4_hdr[6]->hdr_checksum);
+       ++(ipv4_hdr[7]->hdr_checksum);
 #endif
 
        /* dst addr */
@@ -839,17 +923,29 @@ simple_ipv4_fwd_4pkts(struct rte_mbuf* m[4], uint8_t portid, struct lcore_conf *
        *(uint64_t *)&eth_hdr[1]->d_addr = dest_eth_addr[dst_port[1]];
        *(uint64_t *)&eth_hdr[2]->d_addr = dest_eth_addr[dst_port[2]];
        *(uint64_t *)&eth_hdr[3]->d_addr = dest_eth_addr[dst_port[3]];
+       *(uint64_t *)&eth_hdr[4]->d_addr = dest_eth_addr[dst_port[4]];
+       *(uint64_t *)&eth_hdr[5]->d_addr = dest_eth_addr[dst_port[5]];
+       *(uint64_t *)&eth_hdr[6]->d_addr = dest_eth_addr[dst_port[6]];
+       *(uint64_t *)&eth_hdr[7]->d_addr = dest_eth_addr[dst_port[7]];
 
        /* src addr */
        ether_addr_copy(&ports_eth_addr[dst_port[0]], &eth_hdr[0]->s_addr);
        ether_addr_copy(&ports_eth_addr[dst_port[1]], &eth_hdr[1]->s_addr);
        ether_addr_copy(&ports_eth_addr[dst_port[2]], &eth_hdr[2]->s_addr);
        ether_addr_copy(&ports_eth_addr[dst_port[3]], &eth_hdr[3]->s_addr);
+       ether_addr_copy(&ports_eth_addr[dst_port[4]], &eth_hdr[4]->s_addr);
+       ether_addr_copy(&ports_eth_addr[dst_port[5]], &eth_hdr[5]->s_addr);
+       ether_addr_copy(&ports_eth_addr[dst_port[6]], &eth_hdr[6]->s_addr);
+       ether_addr_copy(&ports_eth_addr[dst_port[7]], &eth_hdr[7]->s_addr);
 
        send_single_packet(m[0], (uint8_t)dst_port[0]);
        send_single_packet(m[1], (uint8_t)dst_port[1]);
        send_single_packet(m[2], (uint8_t)dst_port[2]);
        send_single_packet(m[3], (uint8_t)dst_port[3]);
+       send_single_packet(m[4], (uint8_t)dst_port[4]);
+       send_single_packet(m[5], (uint8_t)dst_port[5]);
+       send_single_packet(m[6], (uint8_t)dst_port[6]);
+       send_single_packet(m[7], (uint8_t)dst_port[7]);
 
 }
 
@@ -866,18 +962,22 @@ static inline void get_ipv6_5tuple(struct rte_mbuf* m0, __m128i mask0, __m128i m
 }
 
 static inline void
-simple_ipv6_fwd_4pkts(struct rte_mbuf* m[4], uint8_t portid, struct lcore_conf *qconf)
+simple_ipv6_fwd_8pkts(struct rte_mbuf *m[8], uint8_t portid, struct lcore_conf *qconf)
 {
-       struct ether_hdr *eth_hdr[4];
-       __attribute__((unused)) struct ipv6_hdr *ipv6_hdr[4];
-       uint8_t dst_port[4];
-       int32_t ret[4];
-       union ipv6_5tuple_host key[4];
+       struct ether_hdr *eth_hdr[8];
+       __attribute__((unused)) struct ipv6_hdr *ipv6_hdr[8];
+       uint8_t dst_port[8];
+       int32_t ret[8];
+       union ipv6_5tuple_host key[8];
 
        eth_hdr[0] = rte_pktmbuf_mtod(m[0], struct ether_hdr *);
        eth_hdr[1] = rte_pktmbuf_mtod(m[1], struct ether_hdr *);
        eth_hdr[2] = rte_pktmbuf_mtod(m[2], struct ether_hdr *);
        eth_hdr[3] = rte_pktmbuf_mtod(m[3], struct ether_hdr *);
+       eth_hdr[4] = rte_pktmbuf_mtod(m[4], struct ether_hdr *);
+       eth_hdr[5] = rte_pktmbuf_mtod(m[5], struct ether_hdr *);
+       eth_hdr[6] = rte_pktmbuf_mtod(m[6], struct ether_hdr *);
+       eth_hdr[7] = rte_pktmbuf_mtod(m[7], struct ether_hdr *);
 
        /* Handle IPv6 headers.*/
        ipv6_hdr[0] = rte_pktmbuf_mtod_offset(m[0], struct ipv6_hdr *,
@@ -888,18 +988,36 @@ simple_ipv6_fwd_4pkts(struct rte_mbuf* m[4], uint8_t portid, struct lcore_conf *
                                              sizeof(struct ether_hdr));
        ipv6_hdr[3] = rte_pktmbuf_mtod_offset(m[3], struct ipv6_hdr *,
                                              sizeof(struct ether_hdr));
+       ipv6_hdr[4] = rte_pktmbuf_mtod_offset(m[4], struct ipv6_hdr *,
+                                             sizeof(struct ether_hdr));
+       ipv6_hdr[5] = rte_pktmbuf_mtod_offset(m[5], struct ipv6_hdr *,
+                                             sizeof(struct ether_hdr));
+       ipv6_hdr[6] = rte_pktmbuf_mtod_offset(m[6], struct ipv6_hdr *,
+                                             sizeof(struct ether_hdr));
+       ipv6_hdr[7] = rte_pktmbuf_mtod_offset(m[7], struct ipv6_hdr *,
+                                             sizeof(struct ether_hdr));
 
        get_ipv6_5tuple(m[0], mask1, mask2, &key[0]);
        get_ipv6_5tuple(m[1], mask1, mask2, &key[1]);
        get_ipv6_5tuple(m[2], mask1, mask2, &key[2]);
        get_ipv6_5tuple(m[3], mask1, mask2, &key[3]);
-
-       const void *key_array[4] = {&key[0], &key[1], &key[2],&key[3]};
-       rte_hash_lookup_multi(qconf->ipv6_lookup_struct, &key_array[0], 4, ret);
-       dst_port[0] = (uint8_t) ((ret[0] < 0)? portid:ipv6_l3fwd_out_if[ret[0]]);
-       dst_port[1] = (uint8_t) ((ret[1] < 0)? portid:ipv6_l3fwd_out_if[ret[1]]);
-       dst_port[2] = (uint8_t) ((ret[2] < 0)? portid:ipv6_l3fwd_out_if[ret[2]]);
-       dst_port[3] = (uint8_t) ((ret[3] < 0)? portid:ipv6_l3fwd_out_if[ret[3]]);
+       get_ipv6_5tuple(m[4], mask1, mask2, &key[4]);
+       get_ipv6_5tuple(m[5], mask1, mask2, &key[5]);
+       get_ipv6_5tuple(m[6], mask1, mask2, &key[6]);
+       get_ipv6_5tuple(m[7], mask1, mask2, &key[7]);
+
+       const void *key_array[8] = {&key[0], &key[1], &key[2], &key[3],
+                               &key[4], &key[5], &key[6], &key[7]};
+
+       rte_hash_lookup_multi(qconf->ipv6_lookup_struct, &key_array[0], 8, ret);
+       dst_port[0] = (uint8_t) ((ret[0] < 0) ? portid:ipv6_l3fwd_out_if[ret[0]]);
+       dst_port[1] = (uint8_t) ((ret[1] < 0) ? portid:ipv6_l3fwd_out_if[ret[1]]);
+       dst_port[2] = (uint8_t) ((ret[2] < 0) ? portid:ipv6_l3fwd_out_if[ret[2]]);
+       dst_port[3] = (uint8_t) ((ret[3] < 0) ? portid:ipv6_l3fwd_out_if[ret[3]]);
+       dst_port[4] = (uint8_t) ((ret[4] < 0) ? portid:ipv6_l3fwd_out_if[ret[4]]);
+       dst_port[5] = (uint8_t) ((ret[5] < 0) ? portid:ipv6_l3fwd_out_if[ret[5]]);
+       dst_port[6] = (uint8_t) ((ret[6] < 0) ? portid:ipv6_l3fwd_out_if[ret[6]]);
+       dst_port[7] = (uint8_t) ((ret[7] < 0) ? portid:ipv6_l3fwd_out_if[ret[7]]);
 
        if (dst_port[0] >= RTE_MAX_ETHPORTS || (enabled_port_mask & 1 << dst_port[0]) == 0)
                dst_port[0] = portid;
@@ -909,23 +1027,43 @@ simple_ipv6_fwd_4pkts(struct rte_mbuf* m[4], uint8_t portid, struct lcore_conf *
                dst_port[2] = portid;
        if (dst_port[3] >= RTE_MAX_ETHPORTS || (enabled_port_mask & 1 << dst_port[3]) == 0)
                dst_port[3] = portid;
+       if (dst_port[4] >= RTE_MAX_ETHPORTS || (enabled_port_mask & 1 << dst_port[4]) == 0)
+               dst_port[4] = portid;
+       if (dst_port[5] >= RTE_MAX_ETHPORTS || (enabled_port_mask & 1 << dst_port[5]) == 0)
+               dst_port[5] = portid;
+       if (dst_port[6] >= RTE_MAX_ETHPORTS || (enabled_port_mask & 1 << dst_port[6]) == 0)
+               dst_port[6] = portid;
+       if (dst_port[7] >= RTE_MAX_ETHPORTS || (enabled_port_mask & 1 << dst_port[7]) == 0)
+               dst_port[7] = portid;
 
        /* dst addr */
        *(uint64_t *)&eth_hdr[0]->d_addr = dest_eth_addr[dst_port[0]];
        *(uint64_t *)&eth_hdr[1]->d_addr = dest_eth_addr[dst_port[1]];
        *(uint64_t *)&eth_hdr[2]->d_addr = dest_eth_addr[dst_port[2]];
        *(uint64_t *)&eth_hdr[3]->d_addr = dest_eth_addr[dst_port[3]];
+       *(uint64_t *)&eth_hdr[4]->d_addr = dest_eth_addr[dst_port[4]];
+       *(uint64_t *)&eth_hdr[5]->d_addr = dest_eth_addr[dst_port[5]];
+       *(uint64_t *)&eth_hdr[6]->d_addr = dest_eth_addr[dst_port[6]];
+       *(uint64_t *)&eth_hdr[7]->d_addr = dest_eth_addr[dst_port[7]];
 
        /* src addr */
        ether_addr_copy(&ports_eth_addr[dst_port[0]], &eth_hdr[0]->s_addr);
        ether_addr_copy(&ports_eth_addr[dst_port[1]], &eth_hdr[1]->s_addr);
        ether_addr_copy(&ports_eth_addr[dst_port[2]], &eth_hdr[2]->s_addr);
        ether_addr_copy(&ports_eth_addr[dst_port[3]], &eth_hdr[3]->s_addr);
+       ether_addr_copy(&ports_eth_addr[dst_port[4]], &eth_hdr[4]->s_addr);
+       ether_addr_copy(&ports_eth_addr[dst_port[5]], &eth_hdr[5]->s_addr);
+       ether_addr_copy(&ports_eth_addr[dst_port[6]], &eth_hdr[6]->s_addr);
+       ether_addr_copy(&ports_eth_addr[dst_port[7]], &eth_hdr[7]->s_addr);
 
        send_single_packet(m[0], (uint8_t)dst_port[0]);
        send_single_packet(m[1], (uint8_t)dst_port[1]);
        send_single_packet(m[2], (uint8_t)dst_port[2]);
        send_single_packet(m[3], (uint8_t)dst_port[3]);
+       send_single_packet(m[4], (uint8_t)dst_port[4]);
+       send_single_packet(m[5], (uint8_t)dst_port[5]);
+       send_single_packet(m[6], (uint8_t)dst_port[6]);
+       send_single_packet(m[7], (uint8_t)dst_port[7]);
 
 }
 #endif /* APP_LOOKUP_METHOD */
@@ -939,7 +1077,7 @@ l3fwd_simple_forward(struct rte_mbuf *m, uint8_t portid, struct lcore_conf *qcon
 
        eth_hdr = rte_pktmbuf_mtod(m, struct ether_hdr *);
 
-       if (m->ol_flags & PKT_RX_IPV4_HDR) {
+       if (RTE_ETH_IS_IPV4_HDR(m->packet_type)) {
                /* Handle IPv4 headers.*/
                ipv4_hdr = rte_pktmbuf_mtod_offset(m, struct ipv4_hdr *,
                                                   sizeof(struct ether_hdr));
@@ -970,8 +1108,7 @@ l3fwd_simple_forward(struct rte_mbuf *m, uint8_t portid, struct lcore_conf *qcon
                ether_addr_copy(&ports_eth_addr[dst_port], &eth_hdr->s_addr);
 
                send_single_packet(m, dst_port);
-
-       } else {
+       } else if (RTE_ETH_IS_IPV6_HDR(m->packet_type)) {
                /* Handle IPv6 headers.*/
                struct ipv6_hdr *ipv6_hdr;
 
@@ -990,10 +1127,13 @@ l3fwd_simple_forward(struct rte_mbuf *m, uint8_t portid, struct lcore_conf *qcon
                ether_addr_copy(&ports_eth_addr[dst_port], &eth_hdr->s_addr);
 
                send_single_packet(m, dst_port);
-       }
-
+       } else
+               /* Free the mbuf that contains non-IPV4/IPV6 packet */
+               rte_pktmbuf_free(m);
 }
 
+#if ((APP_LOOKUP_METHOD == APP_LOOKUP_LPM) && \
+       (ENABLE_MULTI_BUFFER_OPTIMIZE == 1))
 #ifdef DO_RFC_1812_CHECKS
 
 #define        IPV4_MIN_VER_IHL        0x45
@@ -1015,12 +1155,11 @@ l3fwd_simple_forward(struct rte_mbuf *m, uint8_t portid, struct lcore_conf *qcon
  * to BAD_PORT value.
  */
 static inline __attribute__((always_inline)) void
-rfc1812_process(struct ipv4_hdr *ipv4_hdr, uint16_t *dp, uint32_t flags)
+rfc1812_process(struct ipv4_hdr *ipv4_hdr, uint16_t *dp, uint32_t ptype)
 {
        uint8_t ihl;
 
-       if ((flags & PKT_RX_IPV4_HDR) != 0) {
-
+       if (RTE_ETH_IS_IPV4_HDR(ptype)) {
                ihl = ipv4_hdr->version_ihl - IPV4_MIN_VER_IHL;
 
                ipv4_hdr->time_to_live--;
@@ -1037,6 +1176,7 @@ rfc1812_process(struct ipv4_hdr *ipv4_hdr, uint16_t *dp, uint32_t flags)
 #else
 #define        rfc1812_process(mb, dp) do { } while (0)
 #endif /* DO_RFC_1812_CHECKS */
+#endif /* APP_LOOKUP_LPM && ENABLE_MULTI_BUFFER_OPTIMIZE */
 
 
 #if ((APP_LOOKUP_METHOD == APP_LOOKUP_LPM) && \
@@ -1050,11 +1190,11 @@ get_dst_port(const struct lcore_conf *qconf, struct rte_mbuf *pkt,
        struct ipv6_hdr *ipv6_hdr;
        struct ether_hdr *eth_hdr;
 
-       if (pkt->ol_flags & PKT_RX_IPV4_HDR) {
+       if (RTE_ETH_IS_IPV4_HDR(pkt->packet_type)) {
                if (rte_lpm_lookup(qconf->ipv4_lookup_struct, dst_ipv4,
                                &next_hop) != 0)
                        next_hop = portid;
-       } else if (pkt->ol_flags & PKT_RX_IPV6_HDR) {
+       } else if (RTE_ETH_IS_IPV6_HDR(pkt->packet_type)) {
                eth_hdr = rte_pktmbuf_mtod(pkt, struct ether_hdr *);
                ipv6_hdr = (struct ipv6_hdr *)(eth_hdr + 1);
                if (rte_lpm6_lookup(qconf->ipv6_lookup_struct,
@@ -1084,21 +1224,23 @@ process_packet(struct lcore_conf *qconf, struct rte_mbuf *pkt,
        dst_ipv4 = rte_be_to_cpu_32(dst_ipv4);
        dp = get_dst_port(qconf, pkt, dst_ipv4, portid);
 
-       te = _mm_load_si128((__m128i *)eth_hdr);
+       te = _mm_loadu_si128((__m128i *)eth_hdr);
        ve = val_eth[dp];
 
        dst_port[0] = dp;
-       rfc1812_process(ipv4_hdr, dst_port, pkt->ol_flags);
+       rfc1812_process(ipv4_hdr, dst_port, pkt->packet_type);
 
        te =  _mm_blend_epi16(te, ve, MASK_ETH);
-       _mm_store_si128((__m128i *)eth_hdr, te);
+       _mm_storeu_si128((__m128i *)eth_hdr, te);
 }
 
 /*
- * Read ol_flags and destination IPV4 addresses from 4 mbufs.
+ * Read packet_type and destination IPV4 addresses from 4 mbufs.
  */
 static inline void
-processx4_step1(struct rte_mbuf *pkt[FWDSTEP], __m128i *dip, uint32_t *flag)
+processx4_step1(struct rte_mbuf *pkt[FWDSTEP],
+               __m128i *dip,
+               uint32_t *ipv4_flag)
 {
        struct ipv4_hdr *ipv4_hdr;
        struct ether_hdr *eth_hdr;
@@ -1107,22 +1249,22 @@ processx4_step1(struct rte_mbuf *pkt[FWDSTEP], __m128i *dip, uint32_t *flag)
        eth_hdr = rte_pktmbuf_mtod(pkt[0], struct ether_hdr *);
        ipv4_hdr = (struct ipv4_hdr *)(eth_hdr + 1);
        x0 = ipv4_hdr->dst_addr;
-       flag[0] = pkt[0]->ol_flags & PKT_RX_IPV4_HDR;
+       ipv4_flag[0] = pkt[0]->packet_type & RTE_PTYPE_L3_IPV4;
 
        eth_hdr = rte_pktmbuf_mtod(pkt[1], struct ether_hdr *);
        ipv4_hdr = (struct ipv4_hdr *)(eth_hdr + 1);
        x1 = ipv4_hdr->dst_addr;
-       flag[0] &= pkt[1]->ol_flags;
+       ipv4_flag[0] &= pkt[1]->packet_type;
 
        eth_hdr = rte_pktmbuf_mtod(pkt[2], struct ether_hdr *);
        ipv4_hdr = (struct ipv4_hdr *)(eth_hdr + 1);
        x2 = ipv4_hdr->dst_addr;
-       flag[0] &= pkt[2]->ol_flags;
+       ipv4_flag[0] &= pkt[2]->packet_type;
 
        eth_hdr = rte_pktmbuf_mtod(pkt[3], struct ether_hdr *);
        ipv4_hdr = (struct ipv4_hdr *)(eth_hdr + 1);
        x3 = ipv4_hdr->dst_addr;
-       flag[0] &= pkt[3]->ol_flags;
+       ipv4_flag[0] &= pkt[3]->packet_type;
 
        dip[0] = _mm_set_epi32(x3, x2, x1, x0);
 }
@@ -1132,8 +1274,12 @@ processx4_step1(struct rte_mbuf *pkt[FWDSTEP], __m128i *dip, uint32_t *flag)
  * If lookup fails, use incoming port (portid) as destination port.
  */
 static inline void
-processx4_step2(const struct lcore_conf *qconf, __m128i dip, uint32_t flag,
-       uint8_t portid, struct rte_mbuf *pkt[FWDSTEP], uint16_t dprt[FWDSTEP])
+processx4_step2(const struct lcore_conf *qconf,
+               __m128i dip,
+               uint32_t ipv4_flag,
+               uint8_t portid,
+               struct rte_mbuf *pkt[FWDSTEP],
+               uint16_t dprt[FWDSTEP])
 {
        rte_xmm_t dst;
        const  __m128i bswap_mask = _mm_set_epi8(12, 13, 14, 15, 8, 9, 10, 11,
@@ -1143,7 +1289,7 @@ processx4_step2(const struct lcore_conf *qconf, __m128i dip, uint32_t flag,
        dip = _mm_shuffle_epi8(dip, bswap_mask);
 
        /* if all 4 packets are IPV4. */
-       if (likely(flag != 0)) {
+       if (likely(ipv4_flag)) {
                rte_lpm_lookupx4(qconf->ipv4_lookup_struct, dip, dprt, portid);
        } else {
                dst.x = dip;
@@ -1171,16 +1317,16 @@ processx4_step3(struct rte_mbuf *pkt[FWDSTEP], uint16_t dst_port[FWDSTEP])
        p[3] = rte_pktmbuf_mtod(pkt[3], __m128i *);
 
        ve[0] = val_eth[dst_port[0]];
-       te[0] = _mm_load_si128(p[0]);
+       te[0] = _mm_loadu_si128(p[0]);
 
        ve[1] = val_eth[dst_port[1]];
-       te[1] = _mm_load_si128(p[1]);
+       te[1] = _mm_loadu_si128(p[1]);
 
        ve[2] = val_eth[dst_port[2]];
-       te[2] = _mm_load_si128(p[2]);
+       te[2] = _mm_loadu_si128(p[2]);
 
        ve[3] = val_eth[dst_port[3]];
-       te[3] = _mm_load_si128(p[3]);
+       te[3] = _mm_loadu_si128(p[3]);
 
        /* Update first 12 bytes, keep rest bytes intact. */
        te[0] =  _mm_blend_epi16(te[0], ve[0], MASK_ETH);
@@ -1188,19 +1334,19 @@ processx4_step3(struct rte_mbuf *pkt[FWDSTEP], uint16_t dst_port[FWDSTEP])
        te[2] =  _mm_blend_epi16(te[2], ve[2], MASK_ETH);
        te[3] =  _mm_blend_epi16(te[3], ve[3], MASK_ETH);
 
-       _mm_store_si128(p[0], te[0]);
-       _mm_store_si128(p[1], te[1]);
-       _mm_store_si128(p[2], te[2]);
-       _mm_store_si128(p[3], te[3]);
+       _mm_storeu_si128(p[0], te[0]);
+       _mm_storeu_si128(p[1], te[1]);
+       _mm_storeu_si128(p[2], te[2]);
+       _mm_storeu_si128(p[3], te[3]);
 
        rfc1812_process((struct ipv4_hdr *)((struct ether_hdr *)p[0] + 1),
-               &dst_port[0], pkt[0]->ol_flags);
+               &dst_port[0], pkt[0]->packet_type);
        rfc1812_process((struct ipv4_hdr *)((struct ether_hdr *)p[1] + 1),
-               &dst_port[1], pkt[1]->ol_flags);
+               &dst_port[1], pkt[1]->packet_type);
        rfc1812_process((struct ipv4_hdr *)((struct ether_hdr *)p[2] + 1),
-               &dst_port[2], pkt[2]->ol_flags);
+               &dst_port[2], pkt[2]->packet_type);
        rfc1812_process((struct ipv4_hdr *)((struct ether_hdr *)p[3] + 1),
-               &dst_port[3], pkt[3]->ol_flags);
+               &dst_port[3], pkt[3]->packet_type);
 }
 
 /*
@@ -1387,7 +1533,7 @@ main_loop(__attribute__((unused)) void *dummy)
        uint16_t *lp;
        uint16_t dst_port[MAX_PKT_BURST];
        __m128i dip[MAX_PKT_BURST / FWDSTEP];
-       uint32_t flag[MAX_PKT_BURST / FWDSTEP];
+       uint32_t ipv4_flag[MAX_PKT_BURST / FWDSTEP];
        uint16_t pnum[MAX_PKT_BURST + 1];
 #endif
 
@@ -1411,7 +1557,7 @@ main_loop(__attribute__((unused)) void *dummy)
                        portid, queueid);
        }
 
-       while (1) {
+       while (!force_quit) {
 
                cur_tsc = rte_rdtsc();
 
@@ -1452,20 +1598,26 @@ main_loop(__attribute__((unused)) void *dummy)
 #if (APP_LOOKUP_METHOD == APP_LOOKUP_EXACT_MATCH)
                        {
                                /*
-                                * Send nb_rx - nb_rx%4 packets
-                                * in groups of 4.
+                                * Send nb_rx - nb_rx%8 packets
+                                * in groups of 8.
                                 */
-                               int32_t n = RTE_ALIGN_FLOOR(nb_rx, 4);
-                               for (j = 0; j < n ; j+=4) {
-                                       uint32_t ol_flag = pkts_burst[j]->ol_flags
-                                                       & pkts_burst[j+1]->ol_flags
-                                                       & pkts_burst[j+2]->ol_flags
-                                                       & pkts_burst[j+3]->ol_flags;
-                                       if (ol_flag & PKT_RX_IPV4_HDR ) {
-                                               simple_ipv4_fwd_4pkts(&pkts_burst[j],
-                                                                       portid, qconf);
-                                       } else if (ol_flag & PKT_RX_IPV6_HDR) {
-                                               simple_ipv6_fwd_4pkts(&pkts_burst[j],
+                               int32_t n = RTE_ALIGN_FLOOR(nb_rx, 8);
+                               for (j = 0; j < n; j += 8) {
+                                       uint32_t pkt_type =
+                                               pkts_burst[j]->packet_type &
+                                               pkts_burst[j+1]->packet_type &
+                                               pkts_burst[j+2]->packet_type &
+                                               pkts_burst[j+3]->packet_type &
+                                               pkts_burst[j+4]->packet_type &
+                                               pkts_burst[j+5]->packet_type &
+                                               pkts_burst[j+6]->packet_type &
+                                               pkts_burst[j+7]->packet_type;
+                                       if (pkt_type & RTE_PTYPE_L3_IPV4) {
+                                               simple_ipv4_fwd_8pkts(
+                                               &pkts_burst[j], portid, qconf);
+                                       } else if (pkt_type &
+                                               RTE_PTYPE_L3_IPV6) {
+                                               simple_ipv6_fwd_8pkts(&pkts_burst[j],
                                                                        portid, qconf);
                                        } else {
                                                l3fwd_simple_forward(pkts_burst[j],
@@ -1476,6 +1628,14 @@ main_loop(__attribute__((unused)) void *dummy)
                                                                        portid, qconf);
                                                l3fwd_simple_forward(pkts_burst[j+3],
                                                                        portid, qconf);
+                                               l3fwd_simple_forward(pkts_burst[j+4],
+                                                                       portid, qconf);
+                                               l3fwd_simple_forward(pkts_burst[j+5],
+                                                                       portid, qconf);
+                                               l3fwd_simple_forward(pkts_burst[j+6],
+                                                                       portid, qconf);
+                                               l3fwd_simple_forward(pkts_burst[j+7],
+                                                                       portid, qconf);
                                        }
                                }
                                for (; j < nb_rx ; j++) {
@@ -1489,13 +1649,13 @@ main_loop(__attribute__((unused)) void *dummy)
                        for (j = 0; j != k; j += FWDSTEP) {
                                processx4_step1(&pkts_burst[j],
                                        &dip[j / FWDSTEP],
-                                       &flag[j / FWDSTEP]);
+                                       &ipv4_flag[j / FWDSTEP]);
                        }
 
                        k = RTE_ALIGN_FLOOR(nb_rx, FWDSTEP);
                        for (j = 0; j != k; j += FWDSTEP) {
                                processx4_step2(qconf, dip[j / FWDSTEP],
-                                       flag[j / FWDSTEP], portid,
+                                       ipv4_flag[j / FWDSTEP], portid,
                                        &pkts_burst[j], &dst_port[j]);
                        }
 
@@ -1625,6 +1785,8 @@ main_loop(__attribute__((unused)) void *dummy)
 
                }
        }
+
+       return 0;
 }
 
 static int
@@ -1918,7 +2080,7 @@ parse_args(int argc, char **argv)
                        }
 
                        if (!strncmp(lgopts[option_index].name, CMD_LINE_OPT_ETH_DEST,
-                               sizeof(CMD_LINE_OPT_CONFIG))) {
+                               sizeof(CMD_LINE_OPT_ETH_DEST))) {
                                        parse_eth_dest(optarg);
                        }
 
@@ -2360,8 +2522,12 @@ check_all_ports_link_status(uint8_t port_num, uint32_t port_mask)
        printf("\nChecking link status");
        fflush(stdout);
        for (count = 0; count <= MAX_CHECK_TIME; count++) {
+               if (force_quit)
+                       return;
                all_ports_up = 1;
                for (portid = 0; portid < port_num; portid++) {
+                       if (force_quit)
+                               return;
                        if ((port_mask & (1 << portid)) == 0)
                                continue;
                        memset(&link, 0, sizeof(link));
@@ -2403,6 +2569,16 @@ check_all_ports_link_status(uint8_t port_num, uint32_t port_mask)
        }
 }
 
+static void
+signal_handler(int signum)
+{
+       if (signum == SIGINT || signum == SIGTERM) {
+               printf("\n\nSignal %d received, preparing to exit...\n",
+                               signum);
+               force_quit = true;
+       }
+}
+
 int
 main(int argc, char **argv)
 {
@@ -2423,6 +2599,10 @@ main(int argc, char **argv)
        argc -= ret;
        argv += ret;
 
+       force_quit = false;
+       signal(SIGINT, signal_handler);
+       signal(SIGTERM, signal_handler);
+
        /* pre-init dst MACs for all ports to 02:00:00:00:00:xx */
        for (portid = 0; portid < RTE_MAX_ETHPORTS; portid++) {
                dest_eth_addr[portid] = ETHER_LOCAL_ADMIN_ADDR + ((uint64_t)portid << 40);
@@ -2577,12 +2757,26 @@ main(int argc, char **argv)
 
        check_all_ports_link_status((uint8_t)nb_ports, enabled_port_mask);
 
+       ret = 0;
        /* launch per-lcore init on every lcore */
        rte_eal_mp_remote_launch(main_loop, NULL, CALL_MASTER);
        RTE_LCORE_FOREACH_SLAVE(lcore_id) {
-               if (rte_eal_wait_lcore(lcore_id) < 0)
-                       return -1;
+               if (rte_eal_wait_lcore(lcore_id) < 0) {
+                       ret = -1;
+                       break;
+               }
        }
 
-       return 0;
+       /* stop ports */
+       for (portid = 0; portid < nb_ports; portid++) {
+               if ((enabled_port_mask & (1 << portid)) == 0)
+                       continue;
+               printf("Closing port %d...", portid);
+               rte_eth_dev_stop(portid);
+               rte_eth_dev_close(portid);
+               printf(" Done\n");
+       }
+       printf("Bye...\n");
+
+       return ret;
 }