Browse Source

modify sve zgemmcopy kernels

tags/v0.3.20
Bine Brank 4 years ago
parent
commit
87537b8c55
2 changed files with 1 addition and 4 deletions
  1. +1
    -2
      kernel/arm64/zgemm_ncopy_sve_v1.c
  2. +0
    -2
      kernel/arm64/zgemm_tcopy_sve_v1.c

+ 1
- 2
kernel/arm64/zgemm_ncopy_sve_v1.c View File

@@ -47,7 +47,6 @@ int CNAME(BLASLONG m, BLASLONG n, IFLOAT *a, BLASLONG lda, IFLOAT *b){
IFLOAT *aoffset, *aoffset1, *boffset;

svint64_t lda_vec = svindex_s64(0LL, lda * 2);
-uint64_t sve_size = svcntd();

aoffset = a;
boffset = b;
@@ -67,7 +66,7 @@ int CNAME(BLASLONG m, BLASLONG n, IFLOAT *a, BLASLONG lda, IFLOAT *b){
aoffset1 += 2;
boffset += active * 2;
}
-aoffset += sve_size * lda * 2;
+aoffset += active * lda * 2;

j += svcntd();
pg = svwhilelt_b64(j, n);


+ 0
- 2
kernel/arm64/zgemm_tcopy_sve_v1.c View File

@@ -46,8 +46,6 @@ int CNAME(BLASLONG m, BLASLONG n, IFLOAT *a, BLASLONG lda, IFLOAT *b){
BLASLONG j;
IFLOAT *aoffset, *aoffset1, *boffset;

-uint64_t sve_size = svcntd();

aoffset = a;
boffset = b;



Loading…
Cancel
Save