X-Git-Url: http://git.droids-corp.org/?a=blobdiff_plain;f=lib%2Flibrte_hash%2Frte_hash_crc.h;h=63e74aa4742201b85b8f24c8a553bf18ac55926d;hb=fed622dfd90ffc754808ecb464d7e62e77f0da58;hp=1cd626cb4abe2a47a05ab864163760e7238e0bb4;hpb=42a03256321858a576cef1d2c351b1015b3b4bf4;p=dpdk.git

diff --git a/lib/librte_hash/rte_hash_crc.h b/lib/librte_hash/rte_hash_crc.h
index 1cd626cb4a..63e74aa474 100644
--- a/lib/librte_hash/rte_hash_crc.h
+++ b/lib/librte_hash/rte_hash_crc.h
@@ -327,6 +327,28 @@ static const uint32_t crc32c_tables[8][256] = {{
 	(crc32c_tables[(n)][(crc) & 0xFF] ^ \
 	 crc32c_tables[(n)-1][((crc) >> 8) & 0xFF])
 
+static inline uint32_t
+crc32c_1byte(uint8_t data, uint32_t init_val)
+{
+	uint32_t crc;
+	crc = init_val;
+	crc ^= data;
+
+	return crc32c_tables[0][crc & 0xff] ^ (crc >> 8);
+}
+
+static inline uint32_t
+crc32c_2bytes(uint16_t data, uint32_t init_val)
+{
+	uint32_t crc;
+	crc = init_val;
+	crc ^= data;
+
+	crc = CRC32_UPD(crc, 1) ^ (crc >> 16);
+
+	return crc;
+}
+
 static inline uint32_t
 crc32c_1word(uint32_t data, uint32_t init_val)
 {
@@ -366,6 +388,26 @@ crc32c_2words(uint64_t data, uint32_t init_val)
 }
 
 #if defined(RTE_ARCH_I686) || defined(RTE_ARCH_X86_64)
+static inline uint32_t
+crc32c_sse42_u8(uint8_t data, uint32_t init_val)
+{
+	__asm__ volatile(
+			"crc32b %[data], %[init_val];"
+			: [init_val] "+r" (init_val)
+			: [data] "rm" (data));
+	return init_val;
+}
+
+static inline uint32_t
+crc32c_sse42_u16(uint16_t data, uint32_t init_val)
+{
+	__asm__ volatile(
+			"crc32w %[data], %[init_val];"
+			: [init_val] "+r" (init_val)
+			: [data] "rm" (data));
+	return init_val;
+}
+
 static inline uint32_t
 crc32c_sse42_u32(uint32_t data, uint32_t init_val)
 {
@@ -407,9 +449,14 @@ crc32c_sse42_u64(uint64_t data, uint64_t init_val)
 #define CRC32_SSE42         (1U << 1)
 #define CRC32_x64           (1U << 2)
 #define CRC32_SSE42_x64     (CRC32_x64|CRC32_SSE42)
+#define CRC32_ARM64         (1U << 3)
 
 static uint8_t crc32_alg = CRC32_SW;
 
+#if defined(RTE_ARCH_ARM64)
+#include "rte_crc_arm64.h"
+#else
+
 /**
  * Allow or disallow use of SSE4.2 instrinsics for CRC32 hash
  * calculation.
@@ -425,12 +472,14 @@ static inline void
 rte_hash_crc_set_alg(uint8_t alg)
 {
 	switch (alg) {
+#if defined(RTE_ARCH_I686) || defined(RTE_ARCH_X86_64)
 	case CRC32_SSE42_x64:
 		if (! rte_cpu_get_flag_enabled(RTE_CPUFLAG_EM64T))
 			alg = CRC32_SSE42;
 	case CRC32_SSE42:
 		if (! rte_cpu_get_flag_enabled(RTE_CPUFLAG_SSE4_2))
 			alg = CRC32_SW;
+#endif
 	case CRC32_SW:
 		crc32_alg = alg;
 	default:
@@ -445,6 +494,52 @@ rte_hash_crc_init_alg(void)
 	rte_hash_crc_set_alg(CRC32_SSE42_x64);
 }
 
+/**
+ * Use single crc32 instruction to perform a hash on a byte value.
+ * Fall back to software crc32 implementation in case SSE4.2 is
+ * not supported
+ *
+ * @param data
+ *   Data to perform hash on.
+ * @param init_val
+ *   Value to initialise hash generator.
+ * @return
+ *   32bit calculated hash value.
+ */
+static inline uint32_t
+rte_hash_crc_1byte(uint8_t data, uint32_t init_val)
+{
+#if defined RTE_ARCH_I686 || defined RTE_ARCH_X86_64
+	if (likely(crc32_alg & CRC32_SSE42))
+		return crc32c_sse42_u8(data, init_val);
+#endif
+
+	return crc32c_1byte(data, init_val);
+}
+
+/**
+ * Use single crc32 instruction to perform a hash on a 2 bytes value.
+ * Fall back to software crc32 implementation in case SSE4.2 is
+ * not supported
+ *
+ * @param data
+ *   Data to perform hash on.
+ * @param init_val
+ *   Value to initialise hash generator.
+ * @return
+ *   32bit calculated hash value.
+ */
+static inline uint32_t
+rte_hash_crc_2byte(uint16_t data, uint32_t init_val)
+{
+#if defined RTE_ARCH_I686 || defined RTE_ARCH_X86_64
+	if (likely(crc32_alg & CRC32_SSE42))
+		return crc32c_sse42_u16(data, init_val);
+#endif
+
+	return crc32c_2bytes(data, init_val);
+}
+
 /**
  * Use single crc32 instruction to perform a hash on a 4 byte value.
  * Fall back to software crc32 implementation in case SSE4.2 is
@@ -496,6 +591,8 @@ rte_hash_crc_8byte(uint64_t data, uint32_t init_val)
 	return crc32c_2words(data, init_val);
 }
 
+#endif
+
 /**
  * Calculate CRC32 hash on user-supplied byte array.
  *
@@ -512,42 +609,26 @@ static inline uint32_t
 rte_hash_crc(const void *data, uint32_t data_len, uint32_t init_val)
 {
 	unsigned i;
-	uint64_t temp = 0;
-	const uint64_t *p64 = (const uint64_t *)data;
+	uintptr_t pd = (uintptr_t) data;
 
 	for (i = 0; i < data_len / 8; i++) {
-		init_val = rte_hash_crc_8byte(*p64++, init_val);
+		init_val = rte_hash_crc_8byte(*(const uint64_t *)pd, init_val);
+		pd += 8;
 	}
 
-	switch (7 - (data_len & 0x07)) {
-	case 0:
-		temp |= (uint64_t) *((const uint8_t *)p64 + 6) << 48;
-		/* Fallthrough */
-	case 1:
-		temp |= (uint64_t) *((const uint8_t *)p64 + 5) << 40;
-		/* Fallthrough */
-	case 2:
-		temp |= (uint64_t) *((const uint8_t *)p64 + 4) << 32;
-		temp |= *((const uint32_t *)p64);
-		init_val = rte_hash_crc_8byte(temp, init_val);
-		break;
-	case 3:
-		init_val = rte_hash_crc_4byte(*(const uint32_t *)p64, init_val);
-		break;
-	case 4:
-		temp |= *((const uint8_t *)p64 + 2) << 16;
-		/* Fallthrough */
-	case 5:
-		temp |= *((const uint8_t *)p64 + 1) << 8;
-		/* Fallthrough */
-	case 6:
-		temp |= *((const uint8_t *)p64);
-		init_val = rte_hash_crc_4byte(temp, init_val);
-		/* Fallthrough */
-	default:
-		break;
+	if (data_len & 0x4) {
+		init_val = rte_hash_crc_4byte(*(const uint32_t *)pd, init_val);
+		pd += 4;
 	}
 
+	if (data_len & 0x2) {
+		init_val = rte_hash_crc_2byte(*(const uint16_t *)pd, init_val);
+		pd += 2;
+	}
+
+	if (data_len & 0x1)
+		init_val = rte_hash_crc_1byte(*(const uint8_t *)pd, init_val);
+
 	return init_val;
 }
 