Browse Source

Tune generic SVE constants closer to other SVE cores

This allows us to use the `ARMV8` and `ARMV8SVE` targets in a minimal build without losing too much performance.
pull/4833/head
Chris Sidebottom 1 year ago
parent
commit
22d8803593
1 changed file with 6 additions and 4 deletions
  1. +6
    -4
      param.h

+ 6
- 4
param.h View File

@@ -3671,8 +3671,10 @@ Until then, just keep it different than DGEMM_DEFAULT_UNROLL_N to keep copy rout


#if defined(XDOUBLE) || defined(DOUBLE) #if defined(XDOUBLE) || defined(DOUBLE)
#define SWITCH_RATIO 8 #define SWITCH_RATIO 8
+#define GEMM_PREFERED_SIZE 4
#else #else
#define SWITCH_RATIO 16 #define SWITCH_RATIO 16
+#define GEMM_PREFERED_SIZE 8
#endif #endif


#define SGEMM_DEFAULT_UNROLL_M 4 // Actually 1VL (8) but kept seperate to keep copies seperate #define SGEMM_DEFAULT_UNROLL_M 4 // Actually 1VL (8) but kept seperate to keep copies seperate
@@ -3689,13 +3691,13 @@ Until then, just keep it different than DGEMM_DEFAULT_UNROLL_N to keep copy rout
#define ZGEMM_DEFAULT_UNROLL_N 4 #define ZGEMM_DEFAULT_UNROLL_N 4
#define ZGEMM_DEFAULT_UNROLL_MN 16 #define ZGEMM_DEFAULT_UNROLL_MN 16


-#define SGEMM_DEFAULT_P 128
-#define DGEMM_DEFAULT_P 160
+#define SGEMM_DEFAULT_P 240
+#define DGEMM_DEFAULT_P 240
#define CGEMM_DEFAULT_P 128 #define CGEMM_DEFAULT_P 128
#define ZGEMM_DEFAULT_P 128 #define ZGEMM_DEFAULT_P 128


-#define SGEMM_DEFAULT_Q 352
-#define DGEMM_DEFAULT_Q 128
+#define SGEMM_DEFAULT_Q 640
+#define DGEMM_DEFAULT_Q 320
#define CGEMM_DEFAULT_Q 224 #define CGEMM_DEFAULT_Q 224
#define ZGEMM_DEFAULT_Q 112 #define ZGEMM_DEFAULT_Q 112




Loading…
Cancel
Save