Browse Source

Fix declaration of assembly arguments in SSYMV and DSYMV microkernels

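Arguments 0 and 1 (i and n) are both input and output, so they are now declared as "+r" operands in the output list instead of "r" operands in the input list.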
tags/v0.3.6^2
Martin Kroeker GitHub 7 years ago
parent
commit
b824fa70eb
No known key found for this signature in database GPG Key ID: 4AEE18F83AFDEB23
8 changed files with 24 additions and 24 deletions
  1. +3
    -3
      kernel/x86_64/dsymv_U_microk_bulldozer-2.c
  2. +3
    -3
      kernel/x86_64/dsymv_U_microk_haswell-2.c
  3. +3
    -3
      kernel/x86_64/dsymv_U_microk_nehalem-2.c
  4. +3
    -3
      kernel/x86_64/dsymv_U_microk_sandy-2.c
  5. +3
    -3
      kernel/x86_64/ssymv_U_microk_bulldozer-2.c
  6. +3
    -3
      kernel/x86_64/ssymv_U_microk_haswell-2.c
  7. +3
    -3
      kernel/x86_64/ssymv_U_microk_nehalem-2.c
  8. +3
    -3
      kernel/x86_64/ssymv_U_microk_sandy-2.c

+ 3
- 3
kernel/x86_64/dsymv_U_microk_bulldozer-2.c View File

@@ -106,9 +106,9 @@ static void dsymv_kernel_4x4(BLASLONG n, FLOAT *a0, FLOAT *a1, FLOAT *a2, FLOAT
"vmovsd %%xmm3 ,24(%9) \n\t" // save temp2

:
- :
- "r" (i), // 0
- "r" (n), // 1
+ "+r" (i), // 0
+ "+r" (n) // 1
+ :
"r" (x), // 2
"r" (y), // 3
"r" (a0), // 4


+ 3
- 3
kernel/x86_64/dsymv_U_microk_haswell-2.c View File

@@ -107,9 +107,9 @@ static void dsymv_kernel_4x4(BLASLONG n, FLOAT *a0, FLOAT *a1, FLOAT *a2, FLOAT
"vzeroupper \n\t"

:
- :
- "r" (i), // 0
- "r" (n), // 1
+ "+r" (i), // 0
+ "+r" (n) // 1
+ :
"r" (x), // 2
"r" (y), // 3
"r" (a0), // 4


+ 3
- 3
kernel/x86_64/dsymv_U_microk_nehalem-2.c View File

@@ -101,9 +101,9 @@ static void dsymv_kernel_4x4(BLASLONG n, FLOAT *a0, FLOAT *a1, FLOAT *a2, FLOAT
"movsd %%xmm3 , 24(%9) \n\t" // save temp2

:
- :
- "r" (i), // 0
- "r" (n), // 1
+ "+r" (i), // 0
+ "+r" (n) // 1
+ :
"r" (x), // 2
"r" (y), // 3
"r" (a0), // 4


+ 3
- 3
kernel/x86_64/dsymv_U_microk_sandy-2.c View File

@@ -116,9 +116,9 @@ static void dsymv_kernel_4x4(BLASLONG n, FLOAT *a0, FLOAT *a1, FLOAT *a2, FLOAT
"vzeroupper \n\t"

:
- :
- "r" (i), // 0
- "r" (n), // 1
+ "+r" (i), // 0
+ "+r" (n) // 1
+ :
"r" (x), // 2
"r" (y), // 3
"r" (a0), // 4


+ 3
- 3
kernel/x86_64/ssymv_U_microk_bulldozer-2.c View File

@@ -90,9 +90,9 @@ static void ssymv_kernel_4x4(BLASLONG n, FLOAT *a0, FLOAT *a1, FLOAT *a2, FLOAT
"vmovss %%xmm3 ,12(%9) \n\t" // save temp2

:
- :
- "r" (i), // 0
- "r" (n), // 1
+ "+r" (i), // 0
+ "+r" (n) // 1
+ :
"r" (x), // 2
"r" (y), // 3
"r" (a0), // 4


+ 3
- 3
kernel/x86_64/ssymv_U_microk_haswell-2.c View File

@@ -112,9 +112,9 @@ static void ssymv_kernel_4x4(BLASLONG n, FLOAT *a0, FLOAT *a1, FLOAT *a2, FLOAT
"vzeroupper \n\t"

:
- :
- "r" (i), // 0
- "r" (n), // 1
+ "+r" (i), // 0
+ "+r" (n) // 1
+ :
"r" (x), // 2
"r" (y), // 3
"r" (a0), // 4


+ 3
- 3
kernel/x86_64/ssymv_U_microk_nehalem-2.c View File

@@ -106,9 +106,9 @@ static void ssymv_kernel_4x4(BLASLONG n, FLOAT *a0, FLOAT *a1, FLOAT *a2, FLOAT
"movss %%xmm3 , 12(%9) \n\t" // save temp2

:
- :
- "r" (i), // 0
- "r" (n), // 1
+ "+r" (i), // 0
+ "+r" (n) // 1
+ :
"r" (x), // 2
"r" (y), // 3
"r" (a0), // 4


+ 3
- 3
kernel/x86_64/ssymv_U_microk_sandy-2.c View File

@@ -120,9 +120,9 @@ static void ssymv_kernel_4x4(BLASLONG n, FLOAT *a0, FLOAT *a1, FLOAT *a2, FLOAT
"vzeroupper \n\t"

:
- :
- "r" (i), // 0
- "r" (n), // 1
+ "+r" (i), // 0
+ "+r" (n) // 1
+ :
"r" (x), // 2
"r" (y), // 3
"r" (a0), // 4


Loading…
Cancel
Save