84fb33fec1
Replace use of RTE_MACHINE_CPUFLAG macros with regular compiler macros, which are more complete than those provided by DPDK, and as such it allows new instruction sets to be leveraged without having to do extra work to set them up in DPDK. Signed-off-by: Sean Morrissey <sean.morrissey@intel.com> Signed-off-by: Radu Nicolau <radu.nicolau@intel.com> Acked-by: David Marchand <david.marchand@redhat.com>
79 lines
1.9 KiB
C
79 lines
1.9 KiB
C
/* SPDX-License-Identifier: BSD-3-Clause
|
|
* Copyright(c) 2017 Intel Corporation
|
|
*/
|
|
|
|
#ifndef _RTE_MEMBER_X86_H_
|
|
#define _RTE_MEMBER_X86_H_
|
|
|
|
#ifdef __cplusplus
|
|
extern "C" {
|
|
#endif
|
|
|
|
#include <x86intrin.h>
|
|
|
|
#if defined(__AVX2__)
|
|
|
|
static inline int
|
|
update_entry_search_avx(uint32_t bucket_id, member_sig_t tmp_sig,
|
|
struct member_ht_bucket *buckets,
|
|
member_set_t set_id)
|
|
{
|
|
uint32_t hitmask = _mm256_movemask_epi8((__m256i)_mm256_cmpeq_epi16(
|
|
_mm256_load_si256((__m256i const *)buckets[bucket_id].sigs),
|
|
_mm256_set1_epi16(tmp_sig)));
|
|
if (hitmask) {
|
|
uint32_t hit_idx = __builtin_ctzl(hitmask) >> 1;
|
|
buckets[bucket_id].sets[hit_idx] = set_id;
|
|
return 1;
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
static inline int
|
|
search_bucket_single_avx(uint32_t bucket_id, member_sig_t tmp_sig,
|
|
struct member_ht_bucket *buckets,
|
|
member_set_t *set_id)
|
|
{
|
|
uint32_t hitmask = _mm256_movemask_epi8((__m256i)_mm256_cmpeq_epi16(
|
|
_mm256_load_si256((__m256i const *)buckets[bucket_id].sigs),
|
|
_mm256_set1_epi16(tmp_sig)));
|
|
while (hitmask) {
|
|
uint32_t hit_idx = __builtin_ctzl(hitmask) >> 1;
|
|
if (buckets[bucket_id].sets[hit_idx] != RTE_MEMBER_NO_MATCH) {
|
|
*set_id = buckets[bucket_id].sets[hit_idx];
|
|
return 1;
|
|
}
|
|
hitmask &= ~(3U << ((hit_idx) << 1));
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
static inline void
|
|
search_bucket_multi_avx(uint32_t bucket_id, member_sig_t tmp_sig,
|
|
struct member_ht_bucket *buckets,
|
|
uint32_t *counter,
|
|
uint32_t match_per_key,
|
|
member_set_t *set_id)
|
|
{
|
|
uint32_t hitmask = _mm256_movemask_epi8((__m256i)_mm256_cmpeq_epi16(
|
|
_mm256_load_si256((__m256i const *)buckets[bucket_id].sigs),
|
|
_mm256_set1_epi16(tmp_sig)));
|
|
while (hitmask) {
|
|
uint32_t hit_idx = __builtin_ctzl(hitmask) >> 1;
|
|
if (buckets[bucket_id].sets[hit_idx] != RTE_MEMBER_NO_MATCH) {
|
|
set_id[*counter] = buckets[bucket_id].sets[hit_idx];
|
|
(*counter)++;
|
|
if (*counter >= match_per_key)
|
|
return;
|
|
}
|
|
hitmask &= ~(3U << ((hit_idx) << 1));
|
|
}
|
|
}
|
|
#endif
|
|
|
|
#ifdef __cplusplus
|
|
}
|
|
#endif
|
|
|
|
#endif /* _RTE_MEMBER_X86_H_ */
|