You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

Makefile.rule 7.7 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216
  1. #
  2. # Beginning of user configuration
  3. #
  4. # This library's version
  5. VERSION = 0.3.3.dev
  6. # If you set the suffix, the library name will be libopenblas_$(LIBNAMESUFFIX).a
  7. # and libopenblas_$(LIBNAMESUFFIX).so. Meanwhile, the soname in shared library
  8. # is libopenblas_$(LIBNAMESUFFIX).so.0.
  9. # LIBNAMESUFFIX = omp
  10. # You can specify the target architecture, otherwise it's
  11. # automatically detected.
  12. # TARGET = PENRYN
  13. # If you want to support multiple architectures in one binary
  14. # DYNAMIC_ARCH = 1
  15. # If you want the full list of x86_64 architectures supported in DYNAMIC_ARCH
  16. # mode (including individual optimized codes for PENRYN, DUNNINGTON, OPTERON,
  17. # OPTERON_SSE3, ATOM and NANO rather than fallbacks to older architectures)
  18. # DYNAMIC_OLDER = 1
  19. # C compiler including binary type(32bit / 64bit). Default is gcc.
  20. # Don't use Intel Compiler or PGI, it won't generate right codes as I expect.
  21. # CC = gcc
  22. # Fortran compiler. Default is g77.
  23. # FC = gfortran
  24. # You can even specify a cross compiler. In that case, please also set HOSTCC.
  25. # cross compiler for Windows
  26. # CC = x86_64-w64-mingw32-gcc
  27. # FC = x86_64-w64-mingw32-gfortran
  28. # cross compiler for 32bit ARM
  29. # CC = arm-linux-gnueabihf-gcc
  30. # FC = arm-linux-gnueabihf-gfortran
  31. # cross compiler for 64bit ARM
  32. # CC = aarch64-linux-gnu-gcc
  33. # FC = aarch64-linux-gnu-gfortran
  34. # If you use the cross compiler, please set this host compiler.
  35. # HOSTCC = gcc
  36. # If you need 32bit binary, define BINARY=32, otherwise define BINARY=64
  37. # BINARY=64
  38. # About threaded BLAS. It will be automatically detected if you don't
  39. # specify it.
  40. # For force setting for single threaded, specify USE_THREAD = 0
  41. # For force setting for multi threaded, specify USE_THREAD = 1
  42. # USE_THREAD = 0
  43. # If you're going to use this library with OpenMP, please comment it in.
  44. # This flag is always set for POWER8. Don't modify the flag
  45. # USE_OPENMP = 1
  46. # The OpenMP scheduler to use - by default this is "static" and you
  47. # will normally not want to change this unless you know that your main
  48. # workload will involve tasks that have highly unbalanced running times
  49. # for individual threads. Changing away from "static" may also adversely
  50. # affect memory access locality in NUMA systems. Setting to "runtime" will
  51. # allow you to select the scheduler from the environment variable OMP_SCHEDULE
  52. # CCOMMON_OPT += -DOMP_SCHED=dynamic
  53. # You can define maximum number of threads. Basically it should be
  54. # less than actual number of cores. If you don't specify one, it's
  55. # automatically detected by the script.
  56. # NUM_THREADS = 24
  57. # If you have enabled USE_OPENMP and your application would call
  58. # OpenBLAS's calculation API from multi threads, please comment it in.
  59. # This flag defines how many instances of OpenBLAS's calculation API can
  60. # actually run in parallel. If more threads call OpenBLAS's calculation API,
  61. # they need to wait for the preceding API calls to finish or risk data corruption.
  62. # NUM_PARALLEL = 2
  63. # if you don't need to install the static library, please comment it in.
  64. # NO_STATIC = 1
  65. # If you don't need to generate the shared library, please comment it in.
  66. # NO_SHARED = 1
  67. # If you don't need CBLAS interface, please comment it in.
  68. # NO_CBLAS = 1
  69. # If you only want CBLAS interface without installing Fortran compiler,
  70. # please comment it in.
  71. # ONLY_CBLAS = 1
  72. # If you don't need LAPACK, please comment it in.
  73. # If you set NO_LAPACK=1, the library automatically sets NO_LAPACKE=1.
  74. # NO_LAPACK = 1
  75. # If you don't need LAPACKE (C Interface to LAPACK), please comment it in.
  76. # NO_LAPACKE = 1
  77. # Build LAPACK Deprecated functions since LAPACK 3.6.0
  78. BUILD_LAPACK_DEPRECATED = 1
  79. # Build RecursiveLAPACK on top of LAPACK
  80. # BUILD_RELAPACK = 1
  81. # If you want to use legacy threaded Level 3 implementation.
  82. # USE_SIMPLE_THREADED_LEVEL3 = 1
  83. # If you want to drive whole 64bit region by BLAS. Not all Fortran
  84. # compilers support this. It's safe to keep it commented out if you
  85. # are not sure (equivalent to "-i8" option).
  86. # INTERFACE64 = 1
  87. # Unfortunately most of kernel won't give us high quality buffer.
  88. # BLAS tries to find the best region before entering main function,
  89. # but it will consume time. If you don't like it, you can disable one.
  90. NO_WARMUP = 1
  91. # If you want to disable CPU/Memory affinity on Linux.
  92. NO_AFFINITY = 1
  93. # if you are compiling for Linux and you have more than 16 numa nodes or more than 256 cpus
  94. # BIGNUMA = 1
  95. # Don't use AVX kernel on Sandy Bridge. It is compatible with old compilers
  96. # and OS. However, the performance is low.
  97. # NO_AVX = 1
  98. # Don't use Haswell optimizations if binutils is too old (e.g. RHEL6)
  99. # NO_AVX2 = 1
  100. # Don't use parallel make.
  101. # NO_PARALLEL_MAKE = 1
  102. # Force number of make jobs. The default is the number of logical CPU of the host.
  103. # This is particularly useful when using distcc.
  104. # A negative value will disable adding a -j flag to make, allowing to use a parent
  105. # make -j value. This is useful to call OpenBLAS make from an other project
  106. # makefile
  107. # MAKE_NB_JOBS = 2
  108. # If you would like to know minute performance report of GotoBLAS.
  109. # FUNCTION_PROFILE = 1
  110. # Support for IEEE quad precision(it's *real* REAL*16)( under testing)
  111. # QUAD_PRECISION = 1
  112. # Threads are still working for a while after finishing BLAS operation
  113. # to reduce thread activate/deactivate overhead. You can determine
  114. # time out to improve performance. This number should be from 4 to 30
  115. # which corresponds to (1 << n) cycles. For example, if you set to 26,
  116. # thread will be running for (1 << 26) cycles(about 25ms on 3.0GHz
  117. # system). Also you can control this number by THREAD_TIMEOUT
  118. # CCOMMON_OPT += -DTHREAD_TIMEOUT=26
  119. # Using special device driver for mapping physically contiguous memory
  120. # to the user space. If bigphysarea is enabled, it will use it.
  121. # DEVICEDRIVER_ALLOCATION = 1
  122. # If you need to synchronize FP CSR between threads (for x86/x86_64 only).
  123. # CONSISTENT_FPCSR = 1
  124. # If any gemm argument m, n or k is less than or equal to this threshold, gemm will be executed
  125. # with single thread. (Actually in recent versions this is a factor proportional to the
  126. # number of floating point operations necessary for the given problem size, no longer
  127. # an individual dimension). You can use this setting to avoid the overhead of multi-
  128. # threading in small matrix sizes. The default value is 4, but values as high as 50 have
  129. # been reported to be optimal for certain workloads (50 is the recommended value for Julia).
  130. # GEMM_MULTITHREAD_THRESHOLD = 4
  131. # If you need sanity check by comparing reference BLAS. It'll be very
  132. # slow (Not implemented yet).
  133. # SANITY_CHECK = 1
  134. # The installation directory.
  135. # PREFIX = /opt/OpenBLAS
  136. # Common Optimization Flag;
  137. # The default -O2 is enough.
  138. # Flags for POWER8 are defined in Makefile.power. Don't modify COMMON_OPT
  139. # COMMON_OPT = -O2
  140. # gfortran option for LAPACK
  141. # enable this flag only on 64bit Linux and if you need a thread safe lapack library
  142. # Flags for POWER8 are defined in Makefile.power. Don't modify FCOMMON_OPT
  143. # FCOMMON_OPT = -frecursive
  144. # Profiling flags
  145. COMMON_PROF = -pg
  146. # Build Debug version
  147. # DEBUG = 1
  148. # Set maximum stack allocation.
  149. # The default value is 2048. 0 disables stack allocation and may reduce GER and GEMV
  150. # performance. For details, https://github.com/xianyi/OpenBLAS/pull/482
  151. #
  152. # MAX_STACK_ALLOC = 0
  153. # Add a prefix or suffix to all exported symbol names in the shared library.
  154. # Avoid conflicts with other BLAS libraries, especially when using
  155. # 64 bit integer interfaces in OpenBLAS.
  156. # For details, https://github.com/xianyi/OpenBLAS/pull/459
  157. #
  158. # The same prefix and suffix are also added to the library name,
  159. # i.e. you get lib$(SYMBOLPREFIX)openblas$(SYMBOLSUFFIX) rather than libopenblas
  160. #
  161. # SYMBOLPREFIX=
  162. # SYMBOLSUFFIX=
  163. #
  164. # End of user configuration
  165. #