From a4abf7828efe2bd40321366505b75deb2e200cc7 Mon Sep 17 00:00:00 2001 From: Chip Kerchner Date: Thu, 18 Sep 2025 21:30:22 +0000 Subject: [PATCH] Fix _Float16 casting issue and reduce LMUL for certain vector instruction from m2 to m1. --- kernel/riscv64/shgemm_kernel_16x8_zvl256b.c | 92 +++---- kernel/riscv64/shgemm_kernel_8x8_zvl128b.c | 258 ++++++++++---------- 2 files changed, 175 insertions(+), 175 deletions(-) diff --git a/kernel/riscv64/shgemm_kernel_16x8_zvl256b.c b/kernel/riscv64/shgemm_kernel_16x8_zvl256b.c index fb98f564c3..746e07d55f 100644 --- a/kernel/riscv64/shgemm_kernel_16x8_zvl256b.c +++ b/kernel/riscv64/shgemm_kernel_16x8_zvl256b.c @@ -295,22 +295,22 @@ int CNAME(BLASLONG M, BLASLONG N, BLASLONG K, FLOAT alpha, IFLOAT *A, IFLOAT *B, BLASLONG bi = n_top * K; for(BLASLONG k=0; k