From 729af6406fd9e1c45993629990cd093fb5e3da1e Mon Sep 17 00:00:00 2001 From: lilianhuang Date: Mon, 5 Dec 2022 05:10:18 -0500 Subject: [PATCH] Fix sbgemm_ncopy_8_neoversen2 (m & 3) tail: pack all 8 columns and advance b_offset by 32 --- kernel/arm64/sbgemm_ncopy_8_neoversen2.c | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/kernel/arm64/sbgemm_ncopy_8_neoversen2.c b/kernel/arm64/sbgemm_ncopy_8_neoversen2.c index ff41e487c..1b13c8de9 100644 --- a/kernel/arm64/sbgemm_ncopy_8_neoversen2.c +++ b/kernel/arm64/sbgemm_ncopy_8_neoversen2.c @@ -83,13 +83,13 @@ int CNAME(BLASLONG m, BLASLONG n, IFLOAT *a, BLASLONG lda, IFLOAT *b) { if (m & 3) { BLASLONG rest = m & 3; - for (BLASLONG col = 0; col < 4; col++) { + for (BLASLONG col = 0; col < 8; col++) { b_offset[4 * col] = a_offsetx[col][0]; b_offset[4 * col + 1] = rest == 1 ? 0 : a_offsetx[col][1]; b_offset[4 * col + 2] = rest <= 2 ? 0 : a_offsetx[col][2]; b_offset[4 * col + 3] = rest <= 3 ? 0 : a_offsetx[col][3]; } - b_offset += 16; + b_offset += 32; } }