numam-dpdk/lib/librte_hash/rte_cmp_x86.h
Yipeng Wang 606bd11736 hash: fix TSX aborts with newer gcc
gcc 7 and 8 with O3 will generate vzeroupper from rte_memcpy
into TSX region which may abort the TSX transaction.

This fix changes rte_memcpy to memcpy which will not insert
extra vzeroupper into the library.

Fixes: f2e3001b53 ("hash: support read/write concurrency")
Cc: stable@dpdk.org

Signed-off-by: Yipeng Wang <yipeng1.wang@intel.com>
Signed-off-by: Bruce Richardson <bruce.richardson@intel.com>
2018-11-14 01:02:07 +01:00

77 lines
2.2 KiB
C

/* SPDX-License-Identifier: BSD-3-Clause
* Copyright(c) 2015 Intel Corporation
*/
#include <rte_vect.h>
/* Functions to compare multiple of 16 byte keys (up to 128 bytes) */
static int
rte_hash_k16_cmp_eq(const void *key1, const void *key2, size_t key_len __rte_unused)
{
const __m128i k1 = _mm_loadu_si128((const __m128i *) key1);
const __m128i k2 = _mm_loadu_si128((const __m128i *) key2);
const __m128i x = _mm_xor_si128(k1, k2);
return !_mm_test_all_zeros(x, x);
}
static int
rte_hash_k32_cmp_eq(const void *key1, const void *key2, size_t key_len)
{
return rte_hash_k16_cmp_eq(key1, key2, key_len) ||
rte_hash_k16_cmp_eq((const char *) key1 + 16,
(const char *) key2 + 16, key_len);
}
static int
rte_hash_k48_cmp_eq(const void *key1, const void *key2, size_t key_len)
{
return rte_hash_k16_cmp_eq(key1, key2, key_len) ||
rte_hash_k16_cmp_eq((const char *) key1 + 16,
(const char *) key2 + 16, key_len) ||
rte_hash_k16_cmp_eq((const char *) key1 + 32,
(const char *) key2 + 32, key_len);
}
static int
rte_hash_k64_cmp_eq(const void *key1, const void *key2, size_t key_len)
{
return rte_hash_k32_cmp_eq(key1, key2, key_len) ||
rte_hash_k32_cmp_eq((const char *) key1 + 32,
(const char *) key2 + 32, key_len);
}
static int
rte_hash_k80_cmp_eq(const void *key1, const void *key2, size_t key_len)
{
return rte_hash_k64_cmp_eq(key1, key2, key_len) ||
rte_hash_k16_cmp_eq((const char *) key1 + 64,
(const char *) key2 + 64, key_len);
}
static int
rte_hash_k96_cmp_eq(const void *key1, const void *key2, size_t key_len)
{
return rte_hash_k64_cmp_eq(key1, key2, key_len) ||
rte_hash_k32_cmp_eq((const char *) key1 + 64,
(const char *) key2 + 64, key_len);
}
static int
rte_hash_k112_cmp_eq(const void *key1, const void *key2, size_t key_len)
{
return rte_hash_k64_cmp_eq(key1, key2, key_len) ||
rte_hash_k32_cmp_eq((const char *) key1 + 64,
(const char *) key2 + 64, key_len) ||
rte_hash_k16_cmp_eq((const char *) key1 + 96,
(const char *) key2 + 96, key_len);
}
static int
rte_hash_k128_cmp_eq(const void *key1, const void *key2, size_t key_len)
{
return rte_hash_k64_cmp_eq(key1, key2, key_len) ||
rte_hash_k64_cmp_eq((const char *) key1 + 64,
(const char *) key2 + 64, key_len);
}