Browse Source

Refs #154. Fixed gemv_t bug about overflow 16MB buffer on x86.

tags/v0.2.6
Zhang Xianyi 13 years ago
parent
commit
0b08f7479e
2 changed files with 6 additions and 2 deletions
  1. +3
    -1
      kernel/x86/gemv_t_sse.S
  2. +3
    -1
      kernel/x86/gemv_t_sse2.S

+ 3
- 1
kernel/x86/gemv_t_sse.S View File

@@ -142,7 +142,9 @@
.L0t:
xorl J,J
addl $1,J
sall $21,J # J=2^22
sall $22,J # J=2^24*sizeof(float)=buffer size(16MB)
subl $8, J # Don't use last 8 float in the buffer.
# Now, split M by block J
subl J,MMM # MMM=MMM-J
movl J,M
jge .L00t


+ 3
- 1
kernel/x86/gemv_t_sse2.S View File

@@ -128,7 +128,9 @@
.L0t:
xorl J,J
addl $1,J
sall $22,J # J=2^22
sall $21,J # J=2^21*sizeof(double)=buffer size(16MB)
subl $4, J # Don't use last 4 double in the buffer.
# Now, split M by block J
subl J,MMM # MMM=MMM-J
movl J,M
jge .L00t


Loading…
Cancel
Save