| @@ -71,16 +71,25 @@ int CNAME(int mode, blas_arg_t *arg, BLASLONG *range_m, BLASLONG *range_n, int ( | |||||
| queue[num_cpu].args = arg; | queue[num_cpu].args = arg; | ||||
| queue[num_cpu].range_m = range_m; | queue[num_cpu].range_m = range_m; | ||||
| queue[num_cpu].range_n = &range[num_cpu]; | queue[num_cpu].range_n = &range[num_cpu]; | ||||
| queue[num_cpu].sa = sa + GEMM_OFFSET_A1 * num_cpu; //NULL; | |||||
| queue[num_cpu].sb = queue[num_cpu].sa + GEMM_OFFSET_A1 * 5;//NULL; | |||||
| #if defined(LOONGSON3A) | |||||
| queue[num_cpu].sa = sa + GEMM_OFFSET_A1 * num_cpu; | |||||
| queue[num_cpu].sb = queue[num_cpu].sa + GEMM_OFFSET_A1 * 5; | |||||
| #else | |||||
| queue[num_cpu].sa = NULL; | |||||
| queue[num_cpu].sb = NULL; | |||||
| #endif | |||||
| queue[num_cpu].next = &queue[num_cpu + 1]; | queue[num_cpu].next = &queue[num_cpu + 1]; | ||||
| num_cpu ++; | num_cpu ++; | ||||
| } | } | ||||
| if (num_cpu) { | if (num_cpu) { | ||||
| #if defined(LOONGSON3A) | |||||
| queue[0].sa = sa; | queue[0].sa = sa; | ||||
| queue[0].sb = sa + GEMM_OFFSET_A1 * 5; | queue[0].sb = sa + GEMM_OFFSET_A1 * 5; | ||||
| #else | |||||
| queue[0].sa = sa; | |||||
| queue[0].sb = sb; | |||||
| #endif | |||||
| queue[num_cpu - 1].next = NULL; | queue[num_cpu - 1].next = NULL; | ||||
| exec_blas(num_cpu, | exec_blas(num_cpu, | ||||