mirror of
https://github.com/VectorCamp/vectorscan.git
synced 2025-06-28 16:41:01 +03:00
teddy: we only need the upper lane
Just use an extract, no need to shuffle first.
This commit is contained in:
parent
adf820bbba
commit
1b3e795fc9
@ -204,7 +204,7 @@ do { \
|
|||||||
if (unlikely(isnonzero256(var))) { \
|
if (unlikely(isnonzero256(var))) { \
|
||||||
u32 arrCnt = 0; \
|
u32 arrCnt = 0; \
|
||||||
m128 lo = cast256to128(var); \
|
m128 lo = cast256to128(var); \
|
||||||
m128 hi = cast256to128(swap128in256(var)); \
|
m128 hi = movdq_hi(var); \
|
||||||
bit_array_fast_teddy(lo, bitArr, &arrCnt, offset); \
|
bit_array_fast_teddy(lo, bitArr, &arrCnt, offset); \
|
||||||
bit_array_fast_teddy(hi, bitArr, &arrCnt, offset + 2); \
|
bit_array_fast_teddy(hi, bitArr, &arrCnt, offset + 2); \
|
||||||
for (u32 i = 0; i < arrCnt; i++) { \
|
for (u32 i = 0; i < arrCnt; i++) { \
|
||||||
|
Loading…
x
Reference in New Issue
Block a user