|
|
|
@@ -127,9 +127,9 @@ static void dgemv_kernel_4x2(BLASLONG n, FLOAT *ap0, FLOAT *ap1, FLOAT *x, FLOAT |
|
|
|
"movsd %%xmm11,8(%2) \n\t" |
|
|
|
|
|
|
|
: |
|
|
|
: |
|
|
|
"r" (i), // 0 |
|
|
|
"r" (n), // 1 |
|
|
|
"+r" (i), // 0 |
|
|
|
"+r" (n) // 1 |
|
|
|
: |
|
|
|
"r" (y), // 2 |
|
|
|
"r" (ap0), // 3 |
|
|
|
"r" (ap1), // 4 |
|
|
|
@@ -195,9 +195,9 @@ static void dgemv_kernel_4x1(BLASLONG n, FLOAT *ap, FLOAT *x, FLOAT *y) |
|
|
|
"movsd %%xmm10, (%2) \n\t" |
|
|
|
|
|
|
|
: |
|
|
|
: |
|
|
|
"r" (i), // 0 |
|
|
|
"r" (n), // 1 |
|
|
|
"+r" (i), // 0 |
|
|
|
"+r" (n) // 1 |
|
|
|
: |
|
|
|
"r" (y), // 2 |
|
|
|
"r" (ap), // 3 |
|
|
|
"r" (x) // 4 |
|
|
|
@@ -259,9 +259,9 @@ static void add_y(BLASLONG n, FLOAT da , FLOAT *src, FLOAT *dest, BLASLONG inc_d |
|
|
|
"jnz 1b \n\t" |
|
|
|
|
|
|
|
: |
|
|
|
: |
|
|
|
"r" (i), // 0 |
|
|
|
"r" (n), // 1 |
|
|
|
"+r" (i), // 0 |
|
|
|
"+r" (n) // 1 |
|
|
|
: |
|
|
|
"r" (&da), // 2 |
|
|
|
"r" (src), // 3 |
|
|
|
"r" (dest) // 4 |
|
|
|
|