Browse Source

Update dgemm_kernel_4x8_haswell.S

tags/v0.3.7
wjc404 GitHub 6 years ago
parent
commit
4801c6d36b
No known key found for this signature in database. GPG Key ID: 4AEE18F83AFDEB23
1 changed file with 4 additions and 4 deletions
  1. +4
    -4
      kernel/x86_64/dgemm_kernel_4x8_haswell.S

+ 4
- 4
kernel/x86_64/dgemm_kernel_4x8_haswell.S View File

@@ -1866,7 +1866,7 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
SAVE4x12
/* here for the prefetch of next b source block */
/* the increment should be proportional to the ratio of GEMM_Q/GEMM_P */
/* the increment should be proportional to GEMM_Q/GEMM_P */
salq $3, K
#ifdef WINDOWS_ABI /* GEMM_P == GEMM_Q * 4 */
@@ -2184,19 +2184,19 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
SAVE4x12
/* here for the prefetch of next b source block */
/* the increment should be proportional to the ratio of GEMM_Q/GEMM_P */
/* the increment should be proportional to GEMM_Q/GEMM_P */
salq $3, K
#ifdef WINDOWS_ABI /* GEMM_P == GEMM_Q * 4 */
prefetcht2 (B)
prefetcht2 (B, K, 8)
addq $64, B
addq $64, B /* increment */
#else /* GEMM_P == GEMM_Q * 2 under linux x86_64 */
prefetcht2 (B)
prefetcht2 (B, K, 8)
prefetcht2 64(B)
prefetcht2 64(B, K, 8)
addq $128, B
addq $128, B /* increment */
#endif
sarq $3, K


Loading…
Cancel
Save