Browse Source

improve skylakex paralleled sgemm performance

tags/v0.3.8^2
wjc404 GitHub 6 years ago
parent
commit
1c67567008
No known key found for this signature in database. GPG Key ID: 4AEE18F83AFDEB23
1 changed file with 2 additions and 7 deletions
  1. +2
    -7
      param.h

+ 2
- 7
param.h View File

@@ -1690,18 +1690,13 @@ USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

#else

/*
 * Default P and Q parameters for the four GEMM precisions (S, D, C, Z).
 * NOTE(review): presumably these are the blocking sizes consumed by the
 * GEMM driver -- confirm against the code that reads *GEMM_DEFAULT_P/Q.
 *
 * Each macro must be defined exactly once per configuration: redefining
 * an object-like macro with a different replacement list is a constraint
 * violation in C (compilers warn and silently let the last one win), so
 * only the effective SGEMM values (P = 640, Q = 320) are kept here.
 */
#define SGEMM_DEFAULT_P 640
#define DGEMM_DEFAULT_P 384
#define CGEMM_DEFAULT_P 384
#define ZGEMM_DEFAULT_P 256

#ifdef WINDOWS_ABI
/* NOTE(review): the Windows ABI path still uses the smaller SGEMM Q (192);
 * confirm whether it should follow the 320 used on the other path. */
#define SGEMM_DEFAULT_Q 192
#define DGEMM_DEFAULT_Q 168
#else
#define SGEMM_DEFAULT_Q 320
#define DGEMM_DEFAULT_Q 168
#endif
#define CGEMM_DEFAULT_Q 192
#define ZGEMM_DEFAULT_Q 128



Loading…
Cancel
Save