| @@ -72,6 +72,11 @@ BLASLONG shgemm_p = DEFAULT_GEMM_P; | |||||
| #else | #else | ||||
| BLASLONG shgemm_p = SHGEMM_P; | BLASLONG shgemm_p = SHGEMM_P; | ||||
| #endif | #endif | ||||
| #if BGEMM_P == bgemm_p /* Chooses the initializer for bgemm_p. Identifiers left over after macro expansion evaluate to 0 inside #if, so this test holds when BGEMM_P expands to the bare name bgemm_p (or to 0). */ | |||||
| BLASLONG bgemm_p = DEFAULT_GEMM_P; /* no usable constant from BGEMM_P: start from the generic default */ | |||||
| #else | |||||
| BLASLONG bgemm_p = BGEMM_P; /* presumably BGEMM_P is a numeric constant on this path -- TODO confirm against its definition */ | |||||
| #endif | |||||
| #if SGEMM_P == sgemm_p | #if SGEMM_P == sgemm_p | ||||
| BLASLONG sgemm_p = DEFAULT_GEMM_P; | BLASLONG sgemm_p = DEFAULT_GEMM_P; | ||||
| #else | #else | ||||
| @@ -103,6 +108,11 @@ BLASLONG shgemm_q = DEFAULT_GEMM_Q; | |||||
| #else | #else | ||||
| BLASLONG shgemm_q = SHGEMM_Q; | BLASLONG shgemm_q = SHGEMM_Q; | ||||
| #endif | #endif | ||||
| #if BGEMM_Q == bgemm_q /* Chooses the initializer for bgemm_q. Identifiers left over after macro expansion evaluate to 0 inside #if, so this test holds when BGEMM_Q expands to the bare name bgemm_q (or to 0). */ | |||||
| BLASLONG bgemm_q = DEFAULT_GEMM_Q; /* no usable constant from BGEMM_Q: start from the generic default */ | |||||
| #else | |||||
| BLASLONG bgemm_q = BGEMM_Q; /* presumably BGEMM_Q is a numeric constant on this path -- TODO confirm against its definition */ | |||||
| #endif | |||||
| #if SGEMM_Q == sgemm_q | #if SGEMM_Q == sgemm_q | ||||
| BLASLONG sgemm_q = DEFAULT_GEMM_Q; | BLASLONG sgemm_q = DEFAULT_GEMM_Q; | ||||
| #else | #else | ||||
| @@ -134,6 +144,11 @@ BLASLONG shgemm_r = DEFAULT_GEMM_R; | |||||
| #else | #else | ||||
| BLASLONG shgemm_r = SHGEMM_R; | BLASLONG shgemm_r = SHGEMM_R; | ||||
| #endif | #endif | ||||
| #if BGEMM_R == bgemm_r /* Chooses the initializer for bgemm_r. Identifiers left over after macro expansion evaluate to 0 inside #if, so this test holds when BGEMM_R expands to the bare name bgemm_r (or to 0). */ | |||||
| BLASLONG bgemm_r = DEFAULT_GEMM_R; /* no usable constant from BGEMM_R: start from the generic default */ | |||||
| #else | |||||
| BLASLONG bgemm_r = BGEMM_R; /* presumably BGEMM_R is a numeric constant on this path -- TODO confirm against its definition */ | |||||
| #endif | |||||
| #if SGEMM_R == sgemm_r | #if SGEMM_R == sgemm_r | ||||
| BLASLONG sgemm_r = DEFAULT_GEMM_R; | BLASLONG sgemm_r = DEFAULT_GEMM_R; | ||||
| #else | #else | ||||
| @@ -541,6 +556,7 @@ void blas_set_parameter(void){ | |||||
| #ifdef BUILD_BFLOAT16 | #ifdef BUILD_BFLOAT16 | ||||
| sbgemm_r = (((BUFFER_SIZE - ((SBGEMM_P * SBGEMM_Q * 4 + GEMM_OFFSET_A + GEMM_ALIGN) & ~GEMM_ALIGN)) / (SBGEMM_Q * 4)) - 15) & ~15; | sbgemm_r = (((BUFFER_SIZE - ((SBGEMM_P * SBGEMM_Q * 4 + GEMM_OFFSET_A + GEMM_ALIGN) & ~GEMM_ALIGN)) / (SBGEMM_Q * 4)) - 15) & ~15; | ||||
| bgemm_r = (((BUFFER_SIZE - ((BGEMM_P * BGEMM_Q * 4 + GEMM_OFFSET_A + GEMM_ALIGN) & ~GEMM_ALIGN)) / (BGEMM_Q * 4)) - 15) & ~15; /* Recompute bgemm_r from BUFFER_SIZE: take BGEMM_P * BGEMM_Q * 4 + GEMM_OFFSET_A, add GEMM_ALIGN and mask with ~GEMM_ALIGN, subtract that from BUFFER_SIZE, divide by BGEMM_Q * 4, then subtract 15 and clear the low four bits so the result is a multiple of 16. NOTE(review): the factor 4 mirrors the sbgemm_r line above; confirm it is the intended element scaling for this type. */ | |||||
| #endif | #endif | ||||
| #ifdef BUILD_HFLOAT16 | #ifdef BUILD_HFLOAT16 | ||||
| shgemm_r = (((BUFFER_SIZE - ((SHGEMM_P * SHGEMM_Q * 4 + GEMM_OFFSET_A + GEMM_ALIGN) & ~GEMM_ALIGN)) / (SHGEMM_Q * 4)) - 15) & ~15; | shgemm_r = (((BUFFER_SIZE - ((SHGEMM_P * SHGEMM_Q * 4 + GEMM_OFFSET_A + GEMM_ALIGN) & ~GEMM_ALIGN)) / (SHGEMM_Q * 4)) - 15) & ~15; | ||||
| @@ -653,6 +669,7 @@ void blas_set_parameter(void){ | |||||
| #ifdef BUILD_BFLOAT16 | #ifdef BUILD_BFLOAT16 | ||||
| sbgemm_r = (((BUFFER_SIZE - ((SBGEMM_P * SBGEMM_Q * 4 + GEMM_OFFSET_A + GEMM_ALIGN) & ~GEMM_ALIGN)) / (SBGEMM_Q * 4)) - 15) & ~15; | sbgemm_r = (((BUFFER_SIZE - ((SBGEMM_P * SBGEMM_Q * 4 + GEMM_OFFSET_A + GEMM_ALIGN) & ~GEMM_ALIGN)) / (SBGEMM_Q * 4)) - 15) & ~15; | ||||
| bgemm_r = (((BUFFER_SIZE - ((BGEMM_P * BGEMM_Q * 4 + GEMM_OFFSET_A + GEMM_ALIGN) & ~GEMM_ALIGN)) / (BGEMM_Q * 4)) - 15) & ~15; /* Recompute bgemm_r from BUFFER_SIZE: take BGEMM_P * BGEMM_Q * 4 + GEMM_OFFSET_A, add GEMM_ALIGN and mask with ~GEMM_ALIGN, subtract that from BUFFER_SIZE, divide by BGEMM_Q * 4, then subtract 15 and clear the low four bits so the result is a multiple of 16. NOTE(review): the factor 4 mirrors the sbgemm_r line above; confirm it is the intended element scaling for this type. */ | |||||
| #endif | #endif | ||||
| #ifdef BUILD_HFLOAT16 | #ifdef BUILD_HFLOAT16 | ||||
| shgemm_r = (((BUFFER_SIZE - ((SHGEMM_P * SHGEMM_Q * 4 + GEMM_OFFSET_A + GEMM_ALIGN) & ~GEMM_ALIGN)) / (SHGEMM_Q * 4)) - 15) & ~15; | shgemm_r = (((BUFFER_SIZE - ((SHGEMM_P * SHGEMM_Q * 4 + GEMM_OFFSET_A + GEMM_ALIGN) & ~GEMM_ALIGN)) / (SHGEMM_Q * 4)) - 15) & ~15; | ||||