You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

Makefile 5.4 kB

7 years ago
5 years ago
7 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192
  1. ifdef TARGET_CORE
  2. TARGET = $(TARGET_CORE)
  3. endif
  4. TOPDIR = ..
  5. include $(TOPDIR)/Makefile.system
  6. ifeq ($(C_COMPILER), GCC)
  7. GCCVERSIONGTEQ9 := $(shell expr `$(CC) -dumpversion | cut -f1 -d.` \>= 9)
  8. GCCVERSIONGTEQ10 := $(shell expr `$(CC) -dumpversion | cut -f1 -d.` \>= 10)
  9. endif
  10. ifeq ($(ARCH), power)
  11. ifeq ($(C_COMPILER), CLANG)
  12. override CFLAGS += -fno-integrated-as
  13. endif
  14. endif
  15. AVX2OPT =
  16. ifeq ($(C_COMPILER), GCC)
  17. # AVX2 support was added in 4.7.0
  18. GCCVERSIONGTEQ4 := $(shell expr `$(CC) -dumpversion | cut -f1 -d.` \>= 4)
  19. GCCMINORVERSIONGTEQ7 := $(shell expr `$(CC) -dumpversion | cut -f2 -d.` \>= 7)
  20. ifeq ($(GCCVERSIONGTEQ4)$(GCCMINORVERSIONGTEQ7), 11)
  21. AVX2OPT = -mavx2
  22. endif
  23. endif
  24. ifeq ($(C_COMPILER), CLANG)
  25. # Any clang posing as gcc 4.2 should be new enough (3.4 or later)
  26. GCCVERSIONGTEQ4 := $(shell expr `$(CC) -dumpversion | cut -f1 -d.` \>= 4)
  27. GCCMINORVERSIONGTEQ2 := $(shell expr `$(CC) -dumpversion | cut -f2 -d.` \>= 2)
  28. ifeq ($(GCCVERSIONGTEQ4)$(GCCMINORVERSIONGTEQ2), 11)
  29. AVX2OPT = -mavx2
  30. endif
  31. endif
  32. ifdef NO_AVX2
  33. AVX2OPT=
  34. endif
  35. ifdef TARGET_CORE
  36. ifeq ($(TARGET_CORE), COOPERLAKE)
  37. override CFLAGS += -DBUILD_KERNEL -DTABLE_NAME=gotoblas_$(TARGET_CORE)
  38. ifeq ($(GCCVERSIONGTEQ10), 1)
  39. override CFLAGS += -march=cooperlake
  40. else
  41. override CFLAGS += -march=skylake-avx512
  42. endif
  43. ifeq ($(OSNAME), CYGWIN_NT)
  44. override CFLAGS += -fno-asynchronous-unwind-tables
  45. endif
  46. ifeq ($(OSNAME), WINNT)
  47. ifeq ($(C_COMPILER), GCC)
  48. override CFLAGS += -fno-asynchronous-unwind-tables
  49. endif
  50. endif
  51. else ifeq ($(TARGET_CORE), SKYLAKEX)
  52. override CFLAGS += -DBUILD_KERNEL -DTABLE_NAME=gotoblas_$(TARGET_CORE) -march=skylake-avx512
  53. ifeq ($(OSNAME), CYGWIN_NT)
  54. override CFLAGS += -fno-asynchronous-unwind-tables
  55. endif
  56. ifeq ($(OSNAME), WINNT)
  57. ifeq ($(C_COMPILER), GCC)
  58. override CFLAGS += -fno-asynchronous-unwind-tables
  59. endif
  60. endif
  61. else ifeq ($(TARGET_CORE), HASWELL)
  62. override CFLAGS += -DBUILD_KERNEL -DTABLE_NAME=gotoblas_$(TARGET_CORE) $(AVX2OPT)
  63. else
  64. override CFLAGS += -DBUILD_KERNEL -DTABLE_NAME=gotoblas_$(TARGET_CORE)
  65. endif
  66. BUILD_KERNEL = 1
  67. KDIR =
  68. TSUFFIX = _$(TARGET_CORE)
  69. else
  70. TARGET_CORE = $(CORE)
  71. KDIR =
  72. TSUFFIX =
  73. endif
  74. -include $(KERNELDIR)/KERNEL.$(TARGET_CORE)
  75. include $(KERNELDIR)/KERNEL
  76. include Makefile.L1
  77. include Makefile.L2
  78. include Makefile.L3
  79. include Makefile.LA
  80. HPLOBJS = \
  81. dgemm_kernel.$(SUFFIX) \
  82. $(DGEMMINCOPYOBJ) $(DGEMMITCOPYOBJ) \
  83. $(DGEMMONCOPYOBJ) $(DGEMMOTCOPYOBJ) \
  84. dtrsm_kernel_LN.$(SUFFIX) dtrsm_kernel_LT.$(SUFFIX) \
  85. dtrsm_kernel_RN.$(SUFFIX) dtrsm_kernel_RT.$(SUFFIX) \
  86. daxpy_k.$(SUFFIX) dcopy_k.$(SUFFIX) ddot_k.$(SUFFIX) \
  87. dger_k.$(SUFFIX) dscal_k.$(SUFFIX) idamax_k.$(SUFFIX) \
  88. dgemv_n.$(SUFFIX) dgemv_t.$(SUFFIX) dgemm_beta.$(SUFFIX) \
  89. dtrsm_iunucopy.$(SUFFIX) dtrsm_iunncopy.$(SUFFIX) \
  90. dtrsm_ilnucopy.$(SUFFIX) dtrsm_ilnncopy.$(SUFFIX) \
  91. dtrsm_iutucopy.$(SUFFIX) dtrsm_iutncopy.$(SUFFIX) \
  92. dtrsm_iltucopy.$(SUFFIX) dtrsm_iltncopy.$(SUFFIX) \
  93. dtrsm_ounucopy.$(SUFFIX) dtrsm_ounncopy.$(SUFFIX) \
  94. dtrsm_olnucopy.$(SUFFIX) dtrsm_olnncopy.$(SUFFIX) \
  95. dtrsm_outucopy.$(SUFFIX) dtrsm_outncopy.$(SUFFIX) \
  96. dtrsm_oltucopy.$(SUFFIX) dtrsm_oltncopy.$(SUFFIX)
  97. COMMONOBJS += lsame.$(SUFFIX) scabs1.$(SUFFIX) dcabs1.$(SUFFIX)
  98. ifeq ($(DYNAMIC_ARCH), 1)
  99. SBLASOBJS += setparam$(TSUFFIX).$(SUFFIX)
  100. CCOMMON_OPT += -DTS=$(TSUFFIX)
  101. endif
  102. KERNEL_INTERFACE = ../common_level1.h ../common_level2.h ../common_level3.h
  103. ifneq ($(NO_LAPACK), 1)
  104. KERNEL_INTERFACE += ../common_lapack.h
  105. endif
  106. ifeq ($(ARCH), x86)
  107. COMMONOBJS += cpuid.$(SUFFIX)
  108. endif
  109. ifdef EXPRECISION
  110. COMMONOBJS += qconjg.$(SUFFIX) qcabs1.$(SUFFIX)
  111. endif
  112. ifdef QUAD_PRECISION
  113. COMMONOBJS += qconjg.$(SUFFIX) qcabs1.$(SUFFIX)
  114. endif
  115. all : libs
  116. scabs1.$(SUFFIX): $(KERNELDIR)/$(SCABS_KERNEL)
  117. $(CC) -c $(CFLAGS) -DCOMPLEX -UDOUBLE -DF_INTERFACE $< -o $(@F)
  118. dcabs1.$(SUFFIX): $(KERNELDIR)/$(DCABS_KERNEL)
  119. $(CC) -c $(CFLAGS) -DCOMPLEX -DDOUBLE -DF_INTERFACE $< -o $(@F)
  120. qcabs1.$(SUFFIX): $(KERNELDIR)/$(QCABS_KERNEL)
  121. $(CC) -c $(CFLAGS) -DCOMPLEX -DXDOUBLE -DF_INTERFACE $< -o $(@F)
  122. qconjg.$(SUFFIX): $(KERNELDIR)/qconjg.S
  123. $(CC) -c $(CFLAGS) -DCOMPLEX -DXDOUBLE -DF_INTERFACE $< -o $(@F)
  124. lsame.$(SUFFIX): $(KERNELDIR)/$(LSAME_KERNEL)
  125. $(CC) -c $(CFLAGS) -DF_INTERFACE $< -o $(@F)
  126. setparam$(TSUFFIX).$(SUFFIX): setparam$(TSUFFIX).c kernel$(TSUFFIX).h
  127. ifeq ($(USE_GEMM3M), 1)
  128. $(CC) -c $(CFLAGS) -DUSE_GEMM3M $< -o $@
  129. else
  130. $(CC) -c $(CFLAGS) $< -o $@
  131. endif
  132. setparam$(TSUFFIX).c : setparam-ref.c
  133. sed 's/TS/$(TSUFFIX)/g' $< > $(@F)
  134. kernel$(TSUFFIX).h : $(KERNEL_INTERFACE)
  135. sed 's/\ *(/$(TSUFFIX)(/g' $^ > $(@F)
  136. cpuid.$(SUFFIX): $(KERNELDIR)/cpuid.S
  137. $(CC) -c $(CFLAGS) $< -o $(@F)
  138. scabs1.$(PSUFFIX): $(KERNELDIR)/$(SCABS_KERNEL)
  139. $(CC) -c $(PFLAGS) -DCOMPLEX -UDOUBLE -DF_INTERFACE $< -o $(@F)
  140. dcabs1.$(PSUFFIX): $(KERNELDIR)/$(DCABS_KERNEL)
  141. $(CC) -c $(PFLAGS) -DCOMPLEX -DDOUBLE -DF_INTERFACE $< -o $(@F)
  142. qcabs1.$(PSUFFIX): $(KERNELDIR)/$(QCABS_KERNEL)
  143. $(CC) -c $(PFLAGS) -DCOMPLEX -DXDOUBLE -DF_INTERFACE $< -o $(@F)
  144. qconjg.$(PSUFFIX): $(KERNELDIR)/qconjg.S
  145. $(CC) -c $(PFLAGS) -DCOMPLEX -DXDOUBLE -DF_INTERFACE $< -o $(@F)
  146. lsame.$(PSUFFIX): $(KERNELDIR)/$(LSAME_KERNEL)
  147. $(CC) -c $(PFLAGS) -DF_INTERFACE $< -o $(@F)
  148. cpuid.$(PSUFFIX): $(KERNELDIR)/cpuid.S
  149. $(CC) -c $(PFLAGS) $< -o $(@F)
  150. #ifdef DYNAMIC_ARCH
  151. clean ::
  152. @rm -f setparam_*.c kernel_*.h setparam.h kernel.h
  153. #endif
  154. include $(TOPDIR)/Makefile.tail