Browse Source

Fixed syrk_thread.c using the fix taken from wernsaar

Stride calculation fix copied from https://github.com/wernsaar/OpenBLAS/commit/88900e1
tags/v0.2.20^2
Martin Kroeker GitHub 8 years ago
parent
commit
49e62c0e77
1 changed file with 2 additions and 2 deletions
  1. +2
    -2
      driver/level3/syrk_thread.c

+ 2
- 2
driver/level3/syrk_thread.c View File

@@ -109,7 +109,7 @@ int CNAME(int mode, blas_arg_t *arg, BLASLONG *range_m, BLASLONG *range_n, int (
if (nthreads - num_cpu > 1) {

di = (double)i;
width = ((BLASLONG)( sqrt(di * di + dnum) - di) + mask) & ~mask;
width = (BLASLONG)(( sqrt(di * di + dnum) - di + mask)/(mask+1)) * (mask+1);

if ((width <= 0) || (width > n_to - i)) width = n_to - i;

@@ -149,7 +149,7 @@ int CNAME(int mode, blas_arg_t *arg, BLASLONG *range_m, BLASLONG *range_n, int (
if (nthreads - num_cpu > 1) {

di = (double)(arg -> n - i);
width = ((BLASLONG)(-sqrt(di * di + dnum) + di) + mask) & ~mask;
width = ((BLASLONG)((-sqrt(di * di + dnum) + di) + mask)/(mask+1)) * (mask+1);

if ((width <= 0) || (width > n_to - i)) width = n_to - i;



Loading…
Cancel
Save