table: add unified params struct and mask-based hash func
[dpdk.git] / lib / librte_table / rte_table_hash_key16.c
index f78db77..7f6651c 100644 (file)
@@ -35,6 +35,7 @@
 
 #include <rte_common.h>
 #include <rte_mbuf.h>
+#include <rte_memory.h>
 #include <rte_malloc.h>
 #include <rte_log.h>
 
 
 #define RTE_BUCKET_ENTRY_VALID                                         0x1LLU
 
+#ifdef RTE_TABLE_STATS_COLLECT
+
+/*
+ * Statistics enabled: each macro adds val to the matching counter in
+ * table->stats. Both arguments and the whole expansion are parenthesized
+ * so that expression arguments (e.g. &tbl, or a - b) bind as the caller
+ * intends.
+ */
+#define RTE_TABLE_HASH_KEY16_STATS_PKTS_IN_ADD(table, val) \
+       ((table)->stats.n_pkts_in += (val))
+#define RTE_TABLE_HASH_KEY16_STATS_PKTS_LOOKUP_MISS(table, val) \
+       ((table)->stats.n_pkts_lookup_miss += (val))
+
+#else
+
+/*
+ * Statistics disabled: the macros expand to nothing, so their arguments
+ * are never evaluated.
+ */
+#define RTE_TABLE_HASH_KEY16_STATS_PKTS_IN_ADD(table, val)
+#define RTE_TABLE_HASH_KEY16_STATS_PKTS_LOOKUP_MISS(table, val)
+
+#endif
+
 struct rte_bucket_4_16 {
        /* Cache line 0 */
        uint64_t signature[4 + 1];
@@ -60,6 +75,8 @@ struct rte_bucket_4_16 {
 };
 
 struct rte_table_hash {
+       struct rte_table_stats stats;
+
        /* Input parameters */
        uint32_t n_buckets;
        uint32_t n_entries_per_bucket;
@@ -68,7 +85,8 @@ struct rte_table_hash {
        uint32_t bucket_size;
        uint32_t signature_offset;
        uint32_t key_offset;
-       rte_table_hash_op_hash f_hash;
+       uint64_t key_mask[2];
+       rte_table_hash_op_hash_nomask f_hash;
        uint64_t seed;
 
        /* Extendible buckets */
@@ -88,18 +106,6 @@ check_params_create_lru(struct rte_table_hash_key16_lru_params *params) {
                return -EINVAL;
        }
 
-       /* signature offset */
-       if ((params->signature_offset & 0x3) != 0) {
-               RTE_LOG(ERR, TABLE, "%s: invalid signature_offset\n", __func__);
-               return -EINVAL;
-       }
-
-       /* key offset */
-       if ((params->key_offset & 0x7) != 0) {
-               RTE_LOG(ERR, TABLE, "%s: invalid key_offset\n", __func__);
-               return -EINVAL;
-       }
-
        /* f_hash */
        if (params->f_hash == NULL) {
                RTE_LOG(ERR, TABLE,
@@ -123,8 +129,8 @@ rte_table_hash_create_key16_lru(void *params,
 
        /* Check input parameters */
        if ((check_params_create_lru(p) != 0) ||
-               ((sizeof(struct rte_table_hash) % CACHE_LINE_SIZE) != 0) ||
-               ((sizeof(struct rte_bucket_4_16) % CACHE_LINE_SIZE) != 0))
+               ((sizeof(struct rte_table_hash) % RTE_CACHE_LINE_SIZE) != 0) ||
+               ((sizeof(struct rte_bucket_4_16) % 64) != 0))
                return NULL;
        n_entries_per_bucket = 4;
        key_size = 16;
@@ -133,11 +139,11 @@ rte_table_hash_create_key16_lru(void *params,
        n_buckets = rte_align32pow2((p->n_entries + n_entries_per_bucket - 1) /
                n_entries_per_bucket);
        bucket_size_cl = (sizeof(struct rte_bucket_4_16) + n_entries_per_bucket
-               * entry_size + CACHE_LINE_SIZE - 1) / CACHE_LINE_SIZE;
+               * entry_size + RTE_CACHE_LINE_SIZE - 1) / RTE_CACHE_LINE_SIZE;
        total_size = sizeof(struct rte_table_hash) + n_buckets *
-               bucket_size_cl * CACHE_LINE_SIZE;
+               bucket_size_cl * RTE_CACHE_LINE_SIZE;
 
-       f = rte_zmalloc_socket("TABLE", total_size, CACHE_LINE_SIZE, socket_id);
+       f = rte_zmalloc_socket("TABLE", total_size, RTE_CACHE_LINE_SIZE, socket_id);
        if (f == NULL) {
                RTE_LOG(ERR, TABLE,
                "%s: Cannot allocate %u bytes for hash table\n",
@@ -153,12 +159,20 @@ rte_table_hash_create_key16_lru(void *params,
        f->n_entries_per_bucket = n_entries_per_bucket;
        f->key_size = key_size;
        f->entry_size = entry_size;
-       f->bucket_size = bucket_size_cl * CACHE_LINE_SIZE;
+       f->bucket_size = bucket_size_cl * RTE_CACHE_LINE_SIZE;
        f->signature_offset = p->signature_offset;
        f->key_offset = p->key_offset;
        f->f_hash = p->f_hash;
        f->seed = p->seed;
 
+       if (p->key_mask != NULL) {
+               f->key_mask[0] = ((uint64_t *)p->key_mask)[0];
+               f->key_mask[1] = ((uint64_t *)p->key_mask)[1];
+       } else {
+               f->key_mask[0] = 0xFFFFFFFFFFFFFFFFLLU;
+               f->key_mask[1] = 0xFFFFFFFFFFFFFFFFLLU;
+       }
+
        for (i = 0; i < n_buckets; i++) {
                struct rte_bucket_4_16 *bucket;
 
@@ -173,7 +187,7 @@ rte_table_hash_create_key16_lru(void *params,
 static int
 rte_table_hash_free_key16_lru(void *table)
 {
-       struct rte_table_hash *f = (struct rte_table_hash *) table;
+       struct rte_table_hash *f = table;
 
        /* Check input parameters */
        if (f == NULL) {
@@ -193,7 +207,7 @@ rte_table_hash_entry_add_key16_lru(
        int *key_found,
        void **entry_ptr)
 {
-       struct rte_table_hash *f = (struct rte_table_hash *) table;
+       struct rte_table_hash *f = table;
        struct rte_bucket_4_16 *bucket;
        uint64_t signature, pos;
        uint32_t bucket_index, i;
@@ -259,7 +273,7 @@ rte_table_hash_entry_delete_key16_lru(
        int *key_found,
        void *entry)
 {
-       struct rte_table_hash *f = (struct rte_table_hash *) table;
+       struct rte_table_hash *f = table;
        struct rte_bucket_4_16 *bucket;
        uint64_t signature;
        uint32_t bucket_index, i;
@@ -306,18 +320,6 @@ check_params_create_ext(struct rte_table_hash_key16_ext_params *params) {
                return -EINVAL;
        }
 
-       /* signature offset */
-       if ((params->signature_offset & 0x3) != 0) {
-               RTE_LOG(ERR, TABLE, "%s: invalid signature offset\n", __func__);
-               return -EINVAL;
-       }
-
-       /* key offset */
-       if ((params->key_offset & 0x7) != 0) {
-               RTE_LOG(ERR, TABLE, "%s: invalid key offset\n", __func__);
-               return -EINVAL;
-       }
-
        /* f_hash */
        if (params->f_hash == NULL) {
                RTE_LOG(ERR, TABLE,
@@ -341,8 +343,8 @@ rte_table_hash_create_key16_ext(void *params,
 
        /* Check input parameters */
        if ((check_params_create_ext(p) != 0) ||
-               ((sizeof(struct rte_table_hash) % CACHE_LINE_SIZE) != 0) ||
-               ((sizeof(struct rte_bucket_4_16) % CACHE_LINE_SIZE) != 0))
+               ((sizeof(struct rte_table_hash) % RTE_CACHE_LINE_SIZE) != 0) ||
+               ((sizeof(struct rte_bucket_4_16) % 64) != 0))
                return NULL;
 
        n_entries_per_bucket = 4;
@@ -354,14 +356,14 @@ rte_table_hash_create_key16_ext(void *params,
        n_buckets_ext = (p->n_entries_ext + n_entries_per_bucket - 1) /
                n_entries_per_bucket;
        bucket_size_cl = (sizeof(struct rte_bucket_4_16) + n_entries_per_bucket
-               * entry_size + CACHE_LINE_SIZE - 1) / CACHE_LINE_SIZE;
-       stack_size_cl = (n_buckets_ext * sizeof(uint32_t) + CACHE_LINE_SIZE - 1)
-               / CACHE_LINE_SIZE;
+               * entry_size + RTE_CACHE_LINE_SIZE - 1) / RTE_CACHE_LINE_SIZE;
+       stack_size_cl = (n_buckets_ext * sizeof(uint32_t) + RTE_CACHE_LINE_SIZE - 1)
+               / RTE_CACHE_LINE_SIZE;
        total_size = sizeof(struct rte_table_hash) +
                ((n_buckets + n_buckets_ext) * bucket_size_cl + stack_size_cl) *
-               CACHE_LINE_SIZE;
+               RTE_CACHE_LINE_SIZE;
 
-       f = rte_zmalloc_socket("TABLE", total_size, CACHE_LINE_SIZE, socket_id);
+       f = rte_zmalloc_socket("TABLE", total_size, RTE_CACHE_LINE_SIZE, socket_id);
        if (f == NULL) {
                RTE_LOG(ERR, TABLE,
                        "%s: Cannot allocate %u bytes for hash table\n",
@@ -377,7 +379,7 @@ rte_table_hash_create_key16_ext(void *params,
        f->n_entries_per_bucket = n_entries_per_bucket;
        f->key_size = key_size;
        f->entry_size = entry_size;
-       f->bucket_size = bucket_size_cl * CACHE_LINE_SIZE;
+       f->bucket_size = bucket_size_cl * RTE_CACHE_LINE_SIZE;
        f->signature_offset = p->signature_offset;
        f->key_offset = p->key_offset;
        f->f_hash = p->f_hash;
@@ -391,13 +393,21 @@ rte_table_hash_create_key16_ext(void *params,
        for (i = 0; i < n_buckets_ext; i++)
                f->stack[i] = i;
 
+       if (p->key_mask != NULL) {
+               f->key_mask[0] = (((uint64_t *)p->key_mask)[0]);
+               f->key_mask[1] = (((uint64_t *)p->key_mask)[1]);
+       } else {
+               f->key_mask[0] = 0xFFFFFFFFFFFFFFFFLLU;
+               f->key_mask[1] = 0xFFFFFFFFFFFFFFFFLLU;
+       }
+
        return f;
 }
 
 static int
 rte_table_hash_free_key16_ext(void *table)
 {
-       struct rte_table_hash *f = (struct rte_table_hash *) table;
+       struct rte_table_hash *f = table;
 
        /* Check input parameters */
        if (f == NULL) {
@@ -417,7 +427,7 @@ rte_table_hash_entry_add_key16_ext(
        int *key_found,
        void **entry_ptr)
 {
-       struct rte_table_hash *f = (struct rte_table_hash *) table;
+       struct rte_table_hash *f = table;
        struct rte_bucket_4_16 *bucket0, *bucket, *bucket_prev;
        uint64_t signature;
        uint32_t bucket_index, i;
@@ -494,7 +504,7 @@ rte_table_hash_entry_delete_key16_ext(
        int *key_found,
        void *entry)
 {
-       struct rte_table_hash *f = (struct rte_table_hash *) table;
+       struct rte_table_hash *f = table;
        struct rte_bucket_4_16 *bucket0, *bucket, *bucket_prev;
        uint64_t signature;
        uint32_t bucket_index, i;
@@ -534,9 +544,8 @@ rte_table_hash_entry_delete_key16_ext(
 
                                        memset(bucket, 0,
                                                sizeof(struct rte_bucket_4_16));
-                                       bucket_index = (bucket -
-                                               ((struct rte_bucket_4_16 *)
-                                               f->memory)) - f->n_buckets;
+                                       bucket_index = (((uint8_t *)bucket -
+                                               (uint8_t *)f->memory)/f->bucket_size) - f->n_buckets;
                                        f->stack[f->stack_pos++] = bucket_index;
                                }
 
@@ -586,29 +595,38 @@ rte_table_hash_entry_delete_key16_ext(
                pos = 3;                                        \
 }
 
-#define lookup1_stage0(pkt0_index, mbuf0, pkts, pkts_mask)     \
+#define lookup1_stage0(pkt0_index, mbuf0, pkts, pkts_mask, f)  /* stage 0: take the lowest set bit of pkts_mask, clear it, load that mbuf and prefetch its key metadata */ \
 {                                                              \
        uint64_t pkt_mask;                                      \
+       uint32_t key_offset = f->key_offset; /* metadata offset of the lookup key, read from table f */ \
                                                                \
        pkt0_index = __builtin_ctzll(pkts_mask);                \
        pkt_mask = 1LLU << pkt0_index;                          \
        pkts_mask &= ~pkt_mask;                                 \
                                                                \
        mbuf0 = pkts[pkt0_index];                               \
-       rte_prefetch0(RTE_MBUF_METADATA_UINT8_PTR(mbuf0, 0));   \
+       rte_prefetch0(RTE_MBUF_METADATA_UINT8_PTR(mbuf0, key_offset)); /* prefetch the mbuf metadata at the key offset */ \
 }
 
 #define lookup1_stage1(mbuf1, bucket1, f)                      \
 {                                                              \
-       uint64_t signature;                                     \
-       uint32_t bucket_index;                                  \
+       uint64_t *key; /* stage 1: hash the masked key of mbuf1 and prefetch the bucket it selects */ \
+       uint64_t signature = 0;                         \
+       uint32_t bucket_index;                          \
+       uint64_t hash_key_buffer[2]; /* masked copy of the two 64-bit key words, used as hash input */ \
+                                                               \
+       key = RTE_MBUF_METADATA_UINT64_PTR(mbuf1, f->key_offset); /* key words live in the mbuf metadata at f->key_offset */ \
+                                                               \
+       hash_key_buffer[0] = key[0] & f->key_mask[0]; /* apply the table's key mask word by word */ \
+       hash_key_buffer[1] = key[1] & f->key_mask[1];   \
+       signature = f->f_hash(hash_key_buffer,                  \
+                       RTE_TABLE_HASH_KEY_SIZE, f->seed); /* signature is computed from the masked key and the table seed */ \
                                                                \
-       signature = RTE_MBUF_METADATA_UINT32(mbuf1, f->signature_offset);\
        bucket_index = signature & (f->n_buckets - 1);          \
        bucket1 = (struct rte_bucket_4_16 *)                    \
                &f->memory[bucket_index * f->bucket_size];      \
        rte_prefetch0(bucket1);                                 \
-       rte_prefetch0((void *)(((uintptr_t) bucket1) + CACHE_LINE_SIZE));\
+       rte_prefetch0((void *)(((uintptr_t) bucket1) + RTE_CACHE_LINE_SIZE)); /* also prefetch one cache line past the bucket start */ \
 }
 
 #define lookup1_stage2_lru(pkt2_index, mbuf2, bucket2,         \
@@ -617,11 +635,14 @@ rte_table_hash_entry_delete_key16_ext(
        void *a;                                                \
        uint64_t pkt_mask;                                      \
        uint64_t *key;                                          \
+       uint64_t hash_key_buffer[2];            \
        uint32_t pos;                                           \
                                                                \
        key = RTE_MBUF_METADATA_UINT64_PTR(mbuf2, f->key_offset);\
+       hash_key_buffer[0] = key[0] & f->key_mask[0];   \
+       hash_key_buffer[1] = key[1] & f->key_mask[1];   \
                                                                \
-       lookup_key16_cmp(key, bucket2, pos);                    \
+       lookup_key16_cmp(hash_key_buffer, bucket2, pos);        \
                                                                \
        pkt_mask = (bucket2->signature[pos] & 1LLU) << pkt2_index;\
        pkts_mask_out |= pkt_mask;                              \
@@ -639,11 +660,14 @@ rte_table_hash_entry_delete_key16_ext(
        void *a;                                                \
        uint64_t pkt_mask, bucket_mask;                         \
        uint64_t *key;                                          \
+       uint64_t hash_key_buffer[2];            \
        uint32_t pos;                                           \
                                                                \
        key = RTE_MBUF_METADATA_UINT64_PTR(mbuf2, f->key_offset);\
+       hash_key_buffer[0] = key[0] & f->key_mask[0];   \
+       hash_key_buffer[1] = key[1] & f->key_mask[1];   \
                                                                \
-       lookup_key16_cmp(key, bucket2, pos);                    \
+       lookup_key16_cmp(hash_key_buffer, bucket2, pos);        \
                                                                \
        pkt_mask = (bucket2->signature[pos] & 1LLU) << pkt2_index;\
        pkts_mask_out |= pkt_mask;                              \
@@ -666,12 +690,15 @@ rte_table_hash_entry_delete_key16_ext(
        void *a;                                                \
        uint64_t pkt_mask, bucket_mask;                         \
        uint64_t *key;                                          \
+       uint64_t hash_key_buffer[2];            \
        uint32_t pos;                                           \
                                                                \
        bucket = buckets[pkt_index];                            \
        key = keys[pkt_index];                                  \
+       hash_key_buffer[0] = key[0] & f->key_mask[0];   \
+       hash_key_buffer[1] = key[1] & f->key_mask[1];   \
                                                                \
-       lookup_key16_cmp(key, bucket, pos);                     \
+       lookup_key16_cmp(hash_key_buffer, bucket, pos); \
                                                                \
        pkt_mask = (bucket->signature[pos] & 1LLU) << pkt_index;\
        pkts_mask_out |= pkt_mask;                              \
@@ -684,42 +711,44 @@ rte_table_hash_entry_delete_key16_ext(
        buckets_mask |= bucket_mask;                            \
        bucket_next = bucket->next;                             \
        rte_prefetch0(bucket_next);                             \
-       rte_prefetch0((void *)(((uintptr_t) bucket_next) + CACHE_LINE_SIZE));\
+       rte_prefetch0((void *)(((uintptr_t) bucket_next) + RTE_CACHE_LINE_SIZE));\
        buckets[pkt_index] = bucket_next;                       \
        keys[pkt_index] = key;                                  \
 }
 
 #define lookup2_stage0(pkt00_index, pkt01_index, mbuf00, mbuf01,\
-               pkts, pkts_mask)                                \
+               pkts, pkts_mask, f) /* stage 0 for two packets: pop the two lowest set bits of pkts_mask, load both mbufs and prefetch their key metadata; there is no empty-mask check before the second __builtin_ctzll - presumably callers guarantee two packets remain (TODO confirm) */ \
 {                                                              \
        uint64_t pkt00_mask, pkt01_mask;                        \
+       uint32_t key_offset = f->key_offset; /* metadata offset of the lookup key, read from table f */ \
                                                                \
        pkt00_index = __builtin_ctzll(pkts_mask);               \
        pkt00_mask = 1LLU << pkt00_index;                       \
        pkts_mask &= ~pkt00_mask;                               \
                                                                \
        mbuf00 = pkts[pkt00_index];                             \
-       rte_prefetch0(RTE_MBUF_METADATA_UINT8_PTR(mbuf00, 0));  \
+       rte_prefetch0(RTE_MBUF_METADATA_UINT8_PTR(mbuf00, key_offset)); /* prefetch first packet's metadata at the key offset */ \
                                                                \
        pkt01_index = __builtin_ctzll(pkts_mask);               \
        pkt01_mask = 1LLU << pkt01_index;                       \
        pkts_mask &= ~pkt01_mask;                               \
                                                                \
        mbuf01 = pkts[pkt01_index];                             \
-       rte_prefetch0(RTE_MBUF_METADATA_UINT8_PTR(mbuf01, 0));  \
+       rte_prefetch0(RTE_MBUF_METADATA_UINT8_PTR(mbuf01, key_offset)); /* prefetch second packet's metadata at the key offset */ \
 }
 
 #define lookup2_stage0_with_odd_support(pkt00_index, pkt01_index,\
-               mbuf00, mbuf01, pkts, pkts_mask)                \
+               mbuf00, mbuf01, pkts, pkts_mask, f)             \
 {                                                              \
        uint64_t pkt00_mask, pkt01_mask;                        \
+       uint32_t key_offset = f->key_offset;            \
                                                                \
        pkt00_index = __builtin_ctzll(pkts_mask);               \
        pkt00_mask = 1LLU << pkt00_index;                       \
        pkts_mask &= ~pkt00_mask;                               \
                                                                \
        mbuf00 = pkts[pkt00_index];                             \
-       rte_prefetch0(RTE_MBUF_METADATA_UINT8_PTR(mbuf00, 0));  \
+       rte_prefetch0(RTE_MBUF_METADATA_UINT8_PTR(mbuf00, key_offset)); \
                                                                \
        pkt01_index = __builtin_ctzll(pkts_mask);               \
        if (pkts_mask == 0)                                     \
@@ -728,27 +757,37 @@ rte_table_hash_entry_delete_key16_ext(
        pkts_mask &= ~pkt01_mask;                               \
                                                                \
        mbuf01 = pkts[pkt01_index];                             \
-       rte_prefetch0(RTE_MBUF_METADATA_UINT8_PTR(mbuf01, 0));  \
+       rte_prefetch0(RTE_MBUF_METADATA_UINT8_PTR(mbuf01, key_offset)); \
 }
 
 #define lookup2_stage1(mbuf10, mbuf11, bucket10, bucket11, f)  \
 {                                                              \
+       uint64_t *key10, *key11; /* stage 1 for two packets: hash each masked key and prefetch the bucket it selects */ \
+       uint64_t hash_offset_buffer[2]; /* scratch for the masked key; reused for both packets */ \
        uint64_t signature10, signature11;                      \
-       uint32_t bucket10_index, bucket11_index;                \
+       uint32_t bucket10_index, bucket11_index;        \
                                                                \
-       signature10 = RTE_MBUF_METADATA_UINT32(mbuf10, f->signature_offset);\
+       key10 = RTE_MBUF_METADATA_UINT64_PTR(mbuf10, f->key_offset); /* key words live in the mbuf metadata at f->key_offset */ \
+       hash_offset_buffer[0] = key10[0] & f->key_mask[0]; /* apply the table's key mask word by word */ \
+       hash_offset_buffer[1] = key10[1] & f->key_mask[1];      \
+       signature10 = f->f_hash(hash_offset_buffer,                     \
+                       RTE_TABLE_HASH_KEY_SIZE, f->seed); /* signature is computed from the masked key and the table seed */ \
        bucket10_index = signature10 & (f->n_buckets - 1);      \
-       bucket10 = (struct rte_bucket_4_16 *)                   \
+       bucket10 = (struct rte_bucket_4_16 *)                           \
                &f->memory[bucket10_index * f->bucket_size];    \
        rte_prefetch0(bucket10);                                \
-       rte_prefetch0((void *)(((uintptr_t) bucket10) + CACHE_LINE_SIZE));\
+       rte_prefetch0((void *)(((uintptr_t) bucket10) + RTE_CACHE_LINE_SIZE)); /* also prefetch one cache line past the bucket start */ \
                                                                \
-       signature11 = RTE_MBUF_METADATA_UINT32(mbuf11, f->signature_offset);\
+       key11 = RTE_MBUF_METADATA_UINT64_PTR(mbuf11, f->key_offset); /* same steps for the second packet */ \
+       hash_offset_buffer[0] = key11[0] & f->key_mask[0];      \
+       hash_offset_buffer[1] = key11[1] & f->key_mask[1];      \
+       signature11 = f->f_hash(hash_offset_buffer,                     \
+                       RTE_TABLE_HASH_KEY_SIZE, f->seed);\
        bucket11_index = signature11 & (f->n_buckets - 1);      \
        bucket11 = (struct rte_bucket_4_16 *)                   \
                &f->memory[bucket11_index * f->bucket_size];    \
        rte_prefetch0(bucket11);                                \
-       rte_prefetch0((void *)(((uintptr_t) bucket11) + CACHE_LINE_SIZE));\
+       rte_prefetch0((void *)(((uintptr_t) bucket11) + RTE_CACHE_LINE_SIZE)); /* also prefetch one cache line past the bucket start */ \
 }
 
 #define lookup2_stage2_lru(pkt20_index, pkt21_index, mbuf20, mbuf21,\
@@ -757,13 +796,19 @@ rte_table_hash_entry_delete_key16_ext(
        void *a20, *a21;                                        \
        uint64_t pkt20_mask, pkt21_mask;                        \
        uint64_t *key20, *key21;                                \
+       uint64_t hash_key_buffer20[2];                  \
+       uint64_t hash_key_buffer21[2];                  \
        uint32_t pos20, pos21;                                  \
                                                                \
        key20 = RTE_MBUF_METADATA_UINT64_PTR(mbuf20, f->key_offset);\
        key21 = RTE_MBUF_METADATA_UINT64_PTR(mbuf21, f->key_offset);\
+       hash_key_buffer20[0] = key20[0] & f->key_mask[0];       \
+       hash_key_buffer20[1] = key20[1] & f->key_mask[1];       \
+       hash_key_buffer21[0] = key21[0] & f->key_mask[0];       \
+       hash_key_buffer21[1] = key21[1] & f->key_mask[1];       \
                                                                \
-       lookup_key16_cmp(key20, bucket20, pos20);               \
-       lookup_key16_cmp(key21, bucket21, pos21);               \
+       lookup_key16_cmp(hash_key_buffer20, bucket20, pos20);   \
+       lookup_key16_cmp(hash_key_buffer21, bucket21, pos21);   \
                                                                \
        pkt20_mask = (bucket20->signature[pos20] & 1LLU) << pkt20_index;\
        pkt21_mask = (bucket21->signature[pos21] & 1LLU) << pkt21_index;\
@@ -786,13 +831,19 @@ rte_table_hash_entry_delete_key16_ext(
        void *a20, *a21;                                        \
        uint64_t pkt20_mask, pkt21_mask, bucket20_mask, bucket21_mask;\
        uint64_t *key20, *key21;                                \
+       uint64_t hash_key_buffer20[2];                  \
+       uint64_t hash_key_buffer21[2];                  \
        uint32_t pos20, pos21;                                  \
                                                                \
        key20 = RTE_MBUF_METADATA_UINT64_PTR(mbuf20, f->key_offset);\
        key21 = RTE_MBUF_METADATA_UINT64_PTR(mbuf21, f->key_offset);\
+       hash_key_buffer20[0] = key20[0] & f->key_mask[0];       \
+       hash_key_buffer20[1] = key20[1] & f->key_mask[1];       \
+       hash_key_buffer21[0] = key21[0] & f->key_mask[0];       \
+       hash_key_buffer21[1] = key21[1] & f->key_mask[1];       \
                                                                \
-       lookup_key16_cmp(key20, bucket20, pos20);               \
-       lookup_key16_cmp(key21, bucket21, pos21);               \
+       lookup_key16_cmp(hash_key_buffer20, bucket20, pos20);   \
+       lookup_key16_cmp(hash_key_buffer21, bucket21, pos21);   \
                                                                \
        pkt20_mask = (bucket20->signature[pos20] & 1LLU) << pkt20_index;\
        pkt21_mask = (bucket21->signature[pos21] & 1LLU) << pkt21_index;\
@@ -831,6 +882,10 @@ rte_table_hash_lookup_key16_lru(
        uint32_t pkt11_index, pkt20_index, pkt21_index;
        uint64_t pkts_mask_out = 0;
 
+       __rte_unused uint32_t n_pkts_in = __builtin_popcountll(pkts_mask);
+
+       RTE_TABLE_HASH_KEY16_STATS_PKTS_IN_ADD(f, n_pkts_in);
+
        /* Cannot run the pipeline with less than 5 packets */
        if (__builtin_popcountll(pkts_mask) < 5) {
                for ( ; pkts_mask; ) {
@@ -838,13 +893,15 @@ rte_table_hash_lookup_key16_lru(
                        struct rte_mbuf *mbuf;
                        uint32_t pkt_index;
 
-                       lookup1_stage0(pkt_index, mbuf, pkts, pkts_mask);
+                       lookup1_stage0(pkt_index, mbuf, pkts, pkts_mask, f);
                        lookup1_stage1(mbuf, bucket, f);
                        lookup1_stage2_lru(pkt_index, mbuf, bucket,
                                pkts_mask_out, entries, f);
                }
 
                *lookup_hit_mask = pkts_mask_out;
+               RTE_TABLE_HASH_KEY16_STATS_PKTS_LOOKUP_MISS(f, n_pkts_in -
+                       __builtin_popcountll(pkts_mask_out));
                return 0;
        }
 
@@ -854,7 +911,7 @@ rte_table_hash_lookup_key16_lru(
         */
        /* Pipeline stage 0 */
        lookup2_stage0(pkt00_index, pkt01_index, mbuf00, mbuf01, pkts,
-               pkts_mask);
+               pkts_mask, f);
 
        /* Pipeline feed */
        mbuf10 = mbuf00;
@@ -864,7 +921,7 @@ rte_table_hash_lookup_key16_lru(
 
        /* Pipeline stage 0 */
        lookup2_stage0(pkt00_index, pkt01_index, mbuf00, mbuf01, pkts,
-               pkts_mask);
+               pkts_mask, f);
 
        /* Pipeline stage 1 */
        lookup2_stage1(mbuf10, mbuf11, bucket10, bucket11, f);
@@ -888,7 +945,7 @@ rte_table_hash_lookup_key16_lru(
 
                /* Pipeline stage 0 */
                lookup2_stage0_with_odd_support(pkt00_index, pkt01_index,
-                       mbuf00, mbuf01, pkts, pkts_mask);
+                       mbuf00, mbuf01, pkts, pkts_mask, f);
 
                /* Pipeline stage 1 */
                lookup2_stage1(mbuf10, mbuf11, bucket10, bucket11, f);
@@ -934,6 +991,8 @@ rte_table_hash_lookup_key16_lru(
                bucket20, bucket21, pkts_mask_out, entries, f);
 
        *lookup_hit_mask = pkts_mask_out;
+       RTE_TABLE_HASH_KEY16_STATS_PKTS_LOOKUP_MISS(f, n_pkts_in -
+               __builtin_popcountll(pkts_mask_out));
        return 0;
 } /* rte_table_hash_lookup_key16_lru() */
 
@@ -954,6 +1013,10 @@ rte_table_hash_lookup_key16_ext(
        struct rte_bucket_4_16 *buckets[RTE_PORT_IN_BURST_SIZE_MAX];
        uint64_t *keys[RTE_PORT_IN_BURST_SIZE_MAX];
 
+       __rte_unused uint32_t n_pkts_in = __builtin_popcountll(pkts_mask);
+
+       RTE_TABLE_HASH_KEY16_STATS_PKTS_IN_ADD(f, n_pkts_in);
+
        /* Cannot run the pipeline with less than 5 packets */
        if (__builtin_popcountll(pkts_mask) < 5) {
                for ( ; pkts_mask; ) {
@@ -961,7 +1024,7 @@ rte_table_hash_lookup_key16_ext(
                        struct rte_mbuf *mbuf;
                        uint32_t pkt_index;
 
-                       lookup1_stage0(pkt_index, mbuf, pkts, pkts_mask);
+                       lookup1_stage0(pkt_index, mbuf, pkts, pkts_mask, f);
                        lookup1_stage1(mbuf, bucket, f);
                        lookup1_stage2_ext(pkt_index, mbuf, bucket,
                                pkts_mask_out, entries, buckets_mask,
@@ -977,7 +1040,7 @@ rte_table_hash_lookup_key16_ext(
         */
        /* Pipeline stage 0 */
        lookup2_stage0(pkt00_index, pkt01_index, mbuf00, mbuf01, pkts,
-               pkts_mask);
+               pkts_mask, f);
 
        /* Pipeline feed */
        mbuf10 = mbuf00;
@@ -987,7 +1050,7 @@ rte_table_hash_lookup_key16_ext(
 
        /* Pipeline stage 0 */
        lookup2_stage0(pkt00_index, pkt01_index, mbuf00, mbuf01, pkts,
-               pkts_mask);
+               pkts_mask, f);
 
        /* Pipeline stage 1 */
        lookup2_stage1(mbuf10, mbuf11, bucket10, bucket11, f);
@@ -1011,7 +1074,7 @@ rte_table_hash_lookup_key16_ext(
 
                /* Pipeline stage 0 */
                lookup2_stage0_with_odd_support(pkt00_index, pkt01_index,
-                       mbuf00, mbuf01, pkts, pkts_mask);
+                       mbuf00, mbuf01, pkts, pkts_mask, f);
 
                /* Pipeline stage 1 */
                lookup2_stage1(mbuf10, mbuf11, bucket10, bucket11, f);
@@ -1080,15 +1143,32 @@ grind_next_buckets:
        }
 
        *lookup_hit_mask = pkts_mask_out;
+       RTE_TABLE_HASH_KEY16_STATS_PKTS_LOOKUP_MISS(f, n_pkts_in -
+               __builtin_popcountll(pkts_mask_out));
        return 0;
 } /* rte_table_hash_lookup_key16_ext() */
 
+/*
+ * Read the statistics counters of a key16 hash table.
+ *
+ * table: the struct rte_table_hash whose counters are read.
+ * stats: destination for a copy of the counters; the copy is skipped
+ *        when this is NULL.
+ * clear: when non-zero, the table's counters are zeroed after the copy.
+ *
+ * Returns 0 on success, -EINVAL when table is NULL.
+ */
+static int
+rte_table_hash_key16_stats_read(void *table, struct rte_table_stats *stats, int clear)
+{
+       struct rte_table_hash *t = table;
+
+       /* Check input parameters */
+       if (t == NULL)
+               return -EINVAL;
+
+       if (stats != NULL)
+               memcpy(stats, &t->stats, sizeof(t->stats));
+
+       /* Clear only after the copy so the caller sees the pre-reset values */
+       if (clear)
+               memset(&t->stats, 0, sizeof(t->stats));
+
+       return 0;
+}
+
 struct rte_table_ops rte_table_hash_key16_lru_ops = {
        .f_create = rte_table_hash_create_key16_lru,
        .f_free = rte_table_hash_free_key16_lru,
        .f_add = rte_table_hash_entry_add_key16_lru,
        .f_delete = rte_table_hash_entry_delete_key16_lru,
        .f_lookup = rte_table_hash_lookup_key16_lru,
+       .f_stats = rte_table_hash_key16_stats_read, /* stats reader; the same function is registered in rte_table_hash_key16_ext_ops */
 };
 
 struct rte_table_ops rte_table_hash_key16_ext_ops = {
@@ -1097,4 +1177,5 @@ struct rte_table_ops rte_table_hash_key16_ext_ops = {
        .f_add = rte_table_hash_entry_add_key16_ext,
        .f_delete = rte_table_hash_entry_delete_key16_ext,
        .f_lookup = rte_table_hash_lookup_key16_ext,
+       .f_stats = rte_table_hash_key16_stats_read,
 };