Browse Source

Try to maintain cache-line alignment for odd BLAS Level 1 work splits by rounding each chunk's width up to a multiple of 16

pull/1907/head
Andrew 7 years ago
parent
commit
5f99b61aa7
1 changed files with 2 additions and 2 deletions
  1. +2
    -2
      driver/others/blas_l1_thread.c

+ 2
- 2
driver/others/blas_l1_thread.c View File

@@ -65,7 +65,7 @@ int blas_level1_thread(int mode, BLASLONG m, BLASLONG n, BLASLONG k, void *alpha
/* Adjust Parameters */
width = blas_quickdivide(i + nthreads - num_cpu - 1,
nthreads - num_cpu);
width = MAX(width,((width-1)&~15)+16);
i -= width;
if (i < 0) width = width + i;

@@ -136,7 +136,7 @@ int blas_level1_thread_with_return_value(int mode, BLASLONG m, BLASLONG n, BLASL
/* Adjust Parameters */
width = blas_quickdivide(i + nthreads - num_cpu - 1,
nthreads - num_cpu);
width = MAX(width,((width-1)&~15)+16);
i -= width;
if (i < 0) width = width + i;



Loading…
Cancel
Save