Browse Source

modification for clang compiler

tags/v0.2.12^2
wernsaar 11 years ago
parent
commit
20cd850125
3 changed files with 24 additions and 24 deletions
  1. kernel/x86_64/cgemm_kernel_8x2_haswell.S (+8, -8)
  2. kernel/x86_64/sgemm_kernel_16x4_haswell.S (+10, -10)
  3. kernel/x86_64/zgemm_kernel_4x2_haswell.S (+6, -6)

+ 8
- 8
kernel/x86_64/cgemm_kernel_8x2_haswell.S View File

@@ -227,8 +227,8 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
VFMADDPS_I( %ymm7 ,%ymm3,%ymm1 )


- addq $6*SIZE, BO
- addq $16*SIZE, AO
+ addq $ 6*SIZE, BO
+ addq $ 16*SIZE, AO
decq %rax
.endm

@@ -356,8 +356,8 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
VFMADDPS_R( %ymm4 ,%ymm2,%ymm0 )
VFMADDPS_I( %ymm5 ,%ymm3,%ymm0 )

- addq $6*SIZE, BO
- addq $8*SIZE, AO
+ addq $ 6*SIZE, BO
+ addq $ 8*SIZE, AO
decq %rax
.endm

@@ -447,8 +447,8 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
VFMADDPS_R( %xmm4 ,%xmm2,%xmm0 )
VFMADDPS_I( %xmm5 ,%xmm3,%xmm0 )

- addq $6*SIZE, BO
- addq $4*SIZE, AO
+ addq $ 6*SIZE, BO
+ addq $ 4*SIZE, AO
decq %rax

.endm
@@ -540,8 +540,8 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
VFMADDPS_R( %xmm4 ,%xmm2,%xmm0 )
VFMADDPS_I( %xmm5 ,%xmm3,%xmm0 )

- addq $6*SIZE, BO
- addq $2*SIZE, AO
+ addq $ 6*SIZE, BO
+ addq $ 2*SIZE, AO
decq %rax

.endm


+ 10
- 10
kernel/x86_64/sgemm_kernel_16x4_haswell.S View File

@@ -181,8 +181,8 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
VFMADD231PS_( %ymm14,%ymm3,%ymm0 )
VFMADD231PS_( %ymm15,%ymm3,%ymm1 )
- addq $6*SIZE, BO
- addq $16*SIZE, AO
+ addq $ 6*SIZE, BO
+ addq $ 16*SIZE, AO
decq %rax
.endm
@@ -268,8 +268,8 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
VFMADD231PS_( %ymm12,%ymm2,%ymm0 )
VFMADD231PS_( %ymm14,%ymm3,%ymm0 )
- addq $6*SIZE, BO
- addq $8*SIZE, AO
+ addq $ 6*SIZE, BO
+ addq $ 8*SIZE, AO
decq %rax
.endm
@@ -327,8 +327,8 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
VFMADD231PS_( %xmm12,%xmm2,%xmm0 )
VFMADD231PS_( %xmm14,%xmm3,%xmm0 )
- addq $6*SIZE, BO
- addq $4*SIZE, AO
+ addq $ 6*SIZE, BO
+ addq $ 4*SIZE, AO
decq %rax
.endm
@@ -392,8 +392,8 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
VFMADD231SS_( %xmm14,%xmm3,%xmm0 )
VFMADD231SS_( %xmm15,%xmm3,%xmm1 )
- addq $6*SIZE, BO
- addq $2*SIZE, AO
+ addq $ 6*SIZE, BO
+ addq $ 2*SIZE, AO
decq %rax
.endm
@@ -478,8 +478,8 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
VFMADD231SS_( %xmm12,%xmm2,%xmm0 )
VFMADD231SS_( %xmm14,%xmm3,%xmm0 )
- addq $6*SIZE, BO
- addq $1*SIZE, AO
+ addq $ 6*SIZE, BO
+ addq $ 1*SIZE, AO
decq %rax
.endm


+ 6
- 6
kernel/x86_64/zgemm_kernel_4x2_haswell.S View File

@@ -222,8 +222,8 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
VFMADDPD_I( %ymm5 ,%ymm3,%ymm0 )
VFMADDPD_I( %ymm7 ,%ymm3,%ymm1 )
- addq $6*SIZE, BO
- addq $8*SIZE, AO
+ addq $ 6*SIZE, BO
+ addq $ 8*SIZE, AO
decq %rax
.endm
@@ -362,8 +362,8 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
VFMADDPD_I( %xmm5 ,%xmm3,%xmm0 )
VFMADDPD_I( %xmm7 ,%xmm3,%xmm1 )
- addq $6*SIZE, BO
- addq $4*SIZE, AO
+ addq $ 6*SIZE, BO
+ addq $ 4*SIZE, AO
decq %rax
.endm
@@ -491,8 +491,8 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
VFMADDPD_R( %xmm4 ,%xmm2,%xmm0 )
VFMADDPD_I( %xmm5 ,%xmm3,%xmm0 )
- addq $6*SIZE, BO
- addq $2*SIZE, AO
+ addq $ 6*SIZE, BO
+ addq $ 2*SIZE, AO
decq %rax
.endm


Loading…
Cancel
Save