Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
4 changes: 2 additions & 2 deletions rabitqlib/fastscan/fastscan.hpp
Original file line number Diff line number Diff line change
Expand Up @@ -184,7 +184,7 @@ inline void accumulate(

for (size_t i = 0; i < code_length; i += 64) {
c = _mm256_loadu_si256((__m256i*)&codes[i]);
lut = _mm256_loadu_si256((__m256i*)&LUT[i]);
lut = _mm256_loadu_si256((__m256i*)&lut[i]);
lo = _mm256_and_si256(c, low_mask);
hi = _mm256_and_si256(_mm256_srli_epi16(c, 4), low_mask);

Expand All @@ -197,7 +197,7 @@ inline void accumulate(
accu3 = _mm256_add_epi16(accu3, _mm256_srli_epi16(res_hi, 8));

c = _mm256_loadu_si256((__m256i*)&codes[i + 32]);
lut = _mm256_loadu_si256((__m256i*)&LUT[i + 32]);
lut = _mm256_loadu_si256((__m256i*)&lut[i + 32]);
lo = _mm256_and_si256(c, low_mask);
hi = _mm256_and_si256(_mm256_srli_epi16(c, 4), low_mask);

Expand Down
2 changes: 1 addition & 1 deletion rabitqlib/fastscan/highacc_fastscan.hpp
Original file line number Diff line number Diff line change
Expand Up @@ -23,7 +23,7 @@ inline void transfer_lut_hacc(const uint16_t* lut, size_t dim, uint8_t* hc_lut)
#if defined(__AVX512F__)
constexpr size_t kRegBits = 512;
#elif defined(__AVX2__)
constexpr size_t B_regi = 256;
constexpr size_t kRegBits = 256;
#else
static_assert(false, "At least requried AVX2 for using fastscan\n");
exit(1);
Expand Down