|
|
|
@@ -48,7 +48,7 @@ static int swap_kernel_sve(BLASLONG n, FLOAT *x, FLOAT *y) |
|
|
|
for (BLASLONG i = 0; i < n; i += sve_width * 2) |
|
|
|
{ |
|
|
|
svbool_t pg_a = SVE_WHILELT((uint64_t)i, (uint64_t)n); |
|
|
|
svbool_t pg_b = SVE_WHILELT((i + sve_width), n); |
|
|
|
svbool_t pg_b = SVE_WHILELT((uint64_t)(i + sve_width), (uint64_t)n); |
|
|
|
SVE_TYPE x_vec_a = svld1(pg_a, &x[i]); |
|
|
|
SVE_TYPE y_vec_a = svld1(pg_a, &y[i]); |
|
|
|
SVE_TYPE x_vec_b = svld1(pg_b, &x[i + sve_width]); |
|
|
|
@@ -59,4 +59,4 @@ static int swap_kernel_sve(BLASLONG n, FLOAT *x, FLOAT *y) |
|
|
|
svst1(pg_b, &y[i + sve_width], x_vec_b); |
|
|
|
} |
|
|
|
return (0); |
|
|
|
} |
|
|
|
} |