We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 79c080d commit d8da1e3 Copy full SHA for d8da1e3
hwy/contrib/dot/dot-inl.h
@@ -172,8 +172,8 @@ struct Dot {
172
// Won't be able to do a full vector load without padding => scalar loop.
173
if (!kIsAtLeastOneVector && !kIsMultipleOfVector && !kIsPaddedToVector &&
174
HWY_UNLIKELY(num_elements < N)) {
175
- float_t sum0 = 0.0f; // Only 2x unroll to avoid excessive code size for..
176
- float_t sum1 = 0.0f; // this unlikely(?) case.
+ float sum0 = 0.0f; // Only 2x unroll to avoid excessive code size for..
+ float sum1 = 0.0f; // this unlikely(?) case.
177
for (; i + 2 <= num_elements; i += 2) {
178
sum0 += F32FromBF16(pa[i + 0]) * F32FromBF16(pb[i + 0]);
179
sum1 += F32FromBF16(pa[i + 1]) * F32FromBF16(pb[i + 1]);
0 commit comments