diff --git a/dnn/vec_avx.h b/dnn/vec_avx.h index f18c771a..e4ccdb41 100644 --- a/dnn/vec_avx.h +++ b/dnn/vec_avx.h @@ -502,7 +502,40 @@ static inline void sparse_sgemv_accum8x4(float *_out, const qweight *w, int rows colblocks = *idx++; y = &out[i]; vy0 = _mm256_loadu_si256((const __m256i *)&y[0]); - for (j=0;j