This is better

This commit is contained in:
Alexey Milovidov 2024-11-14 00:21:41 +01:00
parent 6ea31c81e1
commit d59087a0f6

View File

@@ -622,8 +622,8 @@ private:
}
}
#else
-/// Process chunks in vectorized manner
-static constexpr size_t VEC_SIZE = 4;
+/// Process chunks in a vectorized manner.
+static constexpr size_t VEC_SIZE = 16;
typename Kernel::template State<ResultType> states[VEC_SIZE];
for (; prev + VEC_SIZE < off; i += VEC_SIZE, prev += VEC_SIZE)
{
@@ -635,7 +635,7 @@ private:
for (const auto & other_state : states)
Kernel::template combine<ResultType>(state, other_state, kernel_params);
#endif
-/// Process the tail
+/// Process the tail.
for (; prev < off; ++i, ++prev)
{
Kernel::template accumulate<ResultType>(