Skip to content

Commit 01bca6b

Browse files
authored
Merge pull request #13 from zhangdapao745/main
fix fastscan for AVX2
2 parents 19b64b7 + 0cb1b52 commit 01bca6b

File tree

2 files changed

+3
-3
lines changed

2 files changed

+3
-3
lines changed

rabitqlib/fastscan/fastscan.hpp

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -184,7 +184,7 @@ inline void accumulate(
184184

185185
for (size_t i = 0; i < code_length; i += 64) {
186186
c = _mm256_loadu_si256((__m256i*)&codes[i]);
187-
lut = _mm256_loadu_si256((__m256i*)&LUT[i]);
187+
lut = _mm256_loadu_si256((__m256i*)&lut[i]);
188188
lo = _mm256_and_si256(c, low_mask);
189189
hi = _mm256_and_si256(_mm256_srli_epi16(c, 4), low_mask);
190190

@@ -197,7 +197,7 @@ inline void accumulate(
197197
accu3 = _mm256_add_epi16(accu3, _mm256_srli_epi16(res_hi, 8));
198198

199199
c = _mm256_loadu_si256((__m256i*)&codes[i + 32]);
200-
lut = _mm256_loadu_si256((__m256i*)&LUT[i + 32]);
200+
lut = _mm256_loadu_si256((__m256i*)&lut[i + 32]);
201201
lo = _mm256_and_si256(c, low_mask);
202202
hi = _mm256_and_si256(_mm256_srli_epi16(c, 4), low_mask);
203203

rabitqlib/fastscan/highacc_fastscan.hpp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -23,7 +23,7 @@ inline void transfer_lut_hacc(const uint16_t* lut, size_t dim, uint8_t* hc_lut)
2323
#if defined(__AVX512F__)
2424
constexpr size_t kRegBits = 512;
2525
#elif defined(__AVX2__)
26-
constexpr size_t B_regi = 256;
26+
constexpr size_t kRegBits = 256;
2727
#else
2828
static_assert(false, "At least requried AVX2 for using fastscan\n");
2929
exit(1);

0 commit comments

Comments
 (0)