From 3ab5a37fdf0265feba9b370aeff5bb965ca13c31 Mon Sep 17 00:00:00 2001 From: avcodecs <50400420+avcodecs@users.noreply.github.com> Date: Sat, 15 Jun 2024 11:02:44 +0800 Subject: [PATCH] Update vec_neon.h: optimize sparse_cgemv8x4 to improve performance --- src/vec_neon.h | 78 ++++++++++++++++++++++---------------------------- 1 file changed, 34 insertions(+), 44 deletions(-) diff --git a/src/vec_neon.h b/src/vec_neon.h index 31b736c3..420e24f2 100644 --- a/src/vec_neon.h +++ b/src/vec_neon.h @@ -299,63 +299,53 @@ static inline void sgemv(float *out, const float *weights, int rows, int cols, i } } -/* Temporarily use unoptimized version */ static inline void sparse_sgemv8x4(float *out, const float *w, const int *idx, int rows, const float *x) { int i, j; - RNN_CLEAR(out, rows); for (i=0;i