numam-dpdk/lib/librte_member/rte_member_x86.h
Radu Nicolau 84fb33fec1 build: remove deprecated cpuflag macros
Replace use of RTE_MACHINE_CPUFLAG macros with regular compiler
macros, which are more complete than those provided by DPDK, and as such
it allows new instruction sets to be leveraged without having to do
extra work to set them up in DPDK.

Signed-off-by: Sean Morrissey <sean.morrissey@intel.com>
Signed-off-by: Radu Nicolau <radu.nicolau@intel.com>
Acked-by: David Marchand <david.marchand@redhat.com>
2020-09-25 11:13:57 +02:00

79 lines
1.9 KiB
C

/* SPDX-License-Identifier: BSD-3-Clause
* Copyright(c) 2017 Intel Corporation
*/
#ifndef _RTE_MEMBER_X86_H_
#define _RTE_MEMBER_X86_H_
#ifdef __cplusplus
extern "C" {
#endif
#include <x86intrin.h>
#if defined(__AVX2__)
/*
 * Overwrite the set ID of the first entry in a bucket whose stored
 * signature equals tmp_sig.
 *
 * All signatures of buckets[bucket_id] are fetched with one aligned
 * 256-bit load and compared against tmp_sig as sixteen 16-bit lanes.
 *
 * bucket_id: index of the bucket to inspect within buckets.
 * tmp_sig:   signature to look for.
 * buckets:   bucket array; the sigs field of the selected bucket is read
 *            with _mm256_load_si256, which requires 32-byte alignment.
 * set_id:    value stored into the sets slot of the matching entry.
 *
 * Returns 1 when a matching signature was found (and its set ID
 * replaced), 0 when no signature in the bucket matches.
 */
static inline int
update_entry_search_avx(uint32_t bucket_id, member_sig_t tmp_sig,
		struct member_ht_bucket *buckets,
		member_set_t set_id)
{
	struct member_ht_bucket *bkt = &buckets[bucket_id];
	const __m256i stored = _mm256_load_si256((__m256i const *)bkt->sigs);
	const __m256i wanted = _mm256_set1_epi16(tmp_sig);
	/* movemask yields one bit per byte, i.e. two bits per 16-bit lane. */
	const uint32_t match_bits =
		_mm256_movemask_epi8(_mm256_cmpeq_epi16(stored, wanted));

	if (match_bits == 0)
		return 0;

	/* Lowest set bit -> lowest matching lane; halve to get the entry. */
	const uint32_t entry = __builtin_ctzl(match_bits) >> 1;

	bkt->sets[entry] = set_id;
	return 1;
}
/*
 * Look up tmp_sig in one bucket and report the set ID of the first
 * matching entry whose set ID is not RTE_MEMBER_NO_MATCH.
 *
 * All signatures of buckets[bucket_id] are fetched with one aligned
 * 256-bit load and compared against tmp_sig as sixteen 16-bit lanes.
 * Matching lanes are then visited from the lowest index upwards.
 *
 * bucket_id: index of the bucket to inspect within buckets.
 * tmp_sig:   signature to look for.
 * buckets:   bucket array; the sigs field of the selected bucket is read
 *            with _mm256_load_si256, which requires 32-byte alignment.
 * set_id:    output; written only when a usable match is found.
 *
 * Returns 1 when *set_id was filled in, 0 otherwise.
 */
static inline int
search_bucket_single_avx(uint32_t bucket_id, member_sig_t tmp_sig,
		struct member_ht_bucket *buckets,
		member_set_t *set_id)
{
	struct member_ht_bucket *bkt = &buckets[bucket_id];
	const __m256i stored = _mm256_load_si256((__m256i const *)bkt->sigs);
	const __m256i wanted = _mm256_set1_epi16(tmp_sig);
	/* movemask yields one bit per byte, i.e. two bits per 16-bit lane. */
	uint32_t pending =
		_mm256_movemask_epi8(_mm256_cmpeq_epi16(stored, wanted));

	while (pending != 0) {
		const uint32_t entry = __builtin_ctzl(pending) >> 1;
		const member_set_t candidate = bkt->sets[entry];

		if (candidate == RTE_MEMBER_NO_MATCH) {
			/* Drop both mask bits of this lane and try the next hit. */
			pending &= ~(3U << (entry << 1));
			continue;
		}

		*set_id = candidate;
		return 1;
	}

	return 0;
}
/*
 * Collect the set IDs of every entry in one bucket whose signature equals
 * tmp_sig and whose set ID is not RTE_MEMBER_NO_MATCH.
 *
 * All signatures of buckets[bucket_id] are fetched with one aligned
 * 256-bit load and compared against tmp_sig as sixteen 16-bit lanes.
 * Matching lanes are visited from the lowest index upwards; each usable
 * set ID is appended at set_id[*counter] and *counter is incremented.
 * The scan stops early as soon as *counter reaches match_per_key.
 *
 * bucket_id:     index of the bucket to inspect within buckets.
 * tmp_sig:       signature to look for.
 * buckets:       bucket array; the sigs field of the selected bucket is
 *                read with _mm256_load_si256, which requires 32-byte
 *                alignment.
 * counter:       in/out running number of matches already in set_id.
 * match_per_key: stop once *counter is at least this value.
 * set_id:        output array receiving the matching set IDs.
 *
 * NOTE(review): the store to set_id[*counter] happens before *counter is
 * compared with match_per_key, so this function presumably relies on the
 * caller to ensure *counter < match_per_key on entry -- confirm at the
 * call sites.
 */
static inline void
search_bucket_multi_avx(uint32_t bucket_id, member_sig_t tmp_sig,
		struct member_ht_bucket *buckets,
		uint32_t *counter,
		uint32_t match_per_key,
		member_set_t *set_id)
{
	struct member_ht_bucket *bkt = &buckets[bucket_id];
	const __m256i stored = _mm256_load_si256((__m256i const *)bkt->sigs);
	const __m256i wanted = _mm256_set1_epi16(tmp_sig);
	/* movemask yields one bit per byte, i.e. two bits per 16-bit lane. */
	uint32_t pending =
		_mm256_movemask_epi8(_mm256_cmpeq_epi16(stored, wanted));

	while (pending != 0) {
		const uint32_t entry = __builtin_ctzl(pending) >> 1;
		const member_set_t candidate = bkt->sets[entry];

		if (candidate == RTE_MEMBER_NO_MATCH) {
			/* Drop both mask bits of this lane and try the next hit. */
			pending &= ~(3U << (entry << 1));
			continue;
		}

		set_id[*counter] = candidate;
		(*counter)++;
		if (*counter >= match_per_key)
			return;

		pending &= ~(3U << (entry << 1));
	}
}
#endif
#ifdef __cplusplus
}
#endif
#endif /* _RTE_MEMBER_X86_H_ */