From 60d6eab63d70d6892eea86543f2c84227ec3ac9a Mon Sep 17 00:00:00 2001 From: Jean-Marc Valin Date: Tue, 6 Jul 2021 17:33:33 -0400 Subject: [PATCH] Doing a bit of unrolling to speed things up --- dnn/vec_avx.h | 35 ++++++++++++++++++++++++++++++++++- 1 file changed, 34 insertions(+), 1 deletion(-) diff --git a/dnn/vec_avx.h b/dnn/vec_avx.h index f18c771a..e4ccdb41 100644 --- a/dnn/vec_avx.h +++ b/dnn/vec_avx.h @@ -502,7 +502,40 @@ static inline void sparse_sgemv_accum8x4(float *_out, const qweight *w, int rows colblocks = *idx++; y = &out[i]; vy0 = _mm256_loadu_si256((const __m256i *)&y[0]); - for (j=0;j