You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number; they can include dashes ('-') and can be up to 35 characters long.

Makefile 4.8 kB

7 years ago
7 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171
  # Location of the top-level makefiles, relative to this directory.
  TOPDIR = ..

  # When a specific core is requested, it also becomes the build TARGET
  # seen by Makefile.system.
  ifdef TARGET_CORE
    TARGET = $(TARGET_CORE)
  endif

  # Pulls in the shared configuration; must come after TARGET is decided.
  include $(TOPDIR)/Makefile.system
  # GCCVERSIONGTEQ9 is 1 when the GCC major version is at least 9, else 0.
  # It is only set for GCC.  Nothing in the visible part of this file reads
  # it; presumably the included kernel makefiles do -- TODO confirm.
  ifeq ($(C_COMPILER), GCC)
    GCCVERSIONGTEQ9 := $(shell expr $$($(CC) -dumpversion | cut -d. -f1) \>= 9)
  endif
  # AVX2OPT holds the compiler switch that enables AVX2 code generation, or is
  # empty when the compiler is too old or the user set NO_AVX2.  It is appended
  # to CFLAGS for HASWELL kernels further down.
  #
  # Version logic: the compiler qualifies when its major version is greater
  # than 4, or when it is exactly 4 and the minor version reaches the stated
  # threshold.  The earlier test required "major >= 4" AND "minor >= N", which
  # wrongly rejected every later major release with a small minor number
  # (for example GCC 5.4 or 8.2).
  #
  # GCCVERSIONGTEQ4, GCCMINORVERSIONGTEQ7 and GCCMINORVERSIONGTEQ2 keep their
  # original names and meaning in case included makefiles read them.
  AVX2OPT =
  ifeq ($(C_COMPILER), GCC)
    # AVX2 support was added in 4.7.0
    GCCVERSIONGT4 := $(shell expr `$(CC) -dumpversion | cut -f1 -d.` \> 4)
    GCCVERSIONGTEQ4 := $(shell expr `$(CC) -dumpversion | cut -f1 -d.` \>= 4)
    GCCMINORVERSIONGTEQ7 := $(shell expr `$(CC) -dumpversion | cut -f2 -d.` \>= 7)
    ifeq ($(GCCVERSIONGT4), 1)
      AVX2OPT = -mavx2
    else ifeq ($(GCCVERSIONGTEQ4)$(GCCMINORVERSIONGTEQ7), 11)
      AVX2OPT = -mavx2
    endif
  endif
  ifeq ($(C_COMPILER), CLANG)
    # Any clang posing as gcc 4.2 should be new enough (3.4 or later).
    # NOTE(review): newer clang releases appear to report their own version
    # from -dumpversion instead of 4.2.x; the "major > 4" branch covers that.
    GCCVERSIONGT4 := $(shell expr `$(CC) -dumpversion | cut -f1 -d.` \> 4)
    GCCVERSIONGTEQ4 := $(shell expr `$(CC) -dumpversion | cut -f1 -d.` \>= 4)
    GCCMINORVERSIONGTEQ2 := $(shell expr `$(CC) -dumpversion | cut -f2 -d.` \>= 2)
    ifeq ($(GCCVERSIONGT4), 1)
      AVX2OPT = -mavx2
    else ifeq ($(GCCVERSIONGTEQ4)$(GCCMINORVERSIONGTEQ2), 11)
      AVX2OPT = -mavx2
    endif
  endif
  # An explicit NO_AVX2 always wins over compiler detection.
  ifdef NO_AVX2
    AVX2OPT =
  endif
  # Per-core build setup.
  #
  # With TARGET_CORE set, every kernel is compiled with BUILD_KERNEL defined
  # and a core-specific dispatch table name, and TSUFFIX carries the
  # "_<core>" tag.  Without it, TARGET_CORE falls back to $(CORE) and the
  # suffix stays empty.
  ifdef TARGET_CORE
    # Flags common to every core.
    override CFLAGS += -DBUILD_KERNEL -DTABLE_NAME=gotoblas_$(TARGET_CORE)

    # Core-specific additions.
    ifeq ($(TARGET_CORE), SKYLAKEX)
      override CFLAGS += -march=skylake-avx512
      # Cygwin always gets the unwind-table switch; native Windows only when
      # building with GCC.
      ifeq ($(OSNAME), CYGWIN_NT)
        override CFLAGS += -fno-asynchronous-unwind-tables
      endif
      ifeq ($(OSNAME)-$(C_COMPILER), WINNT-GCC)
        override CFLAGS += -fno-asynchronous-unwind-tables
      endif
    else ifeq ($(TARGET_CORE), HASWELL)
      override CFLAGS += $(AVX2OPT)
    endif

    BUILD_KERNEL = 1
    TSUFFIX = _$(TARGET_CORE)
  else
    TARGET_CORE = $(CORE)
    TSUFFIX =
  endif
  # KDIR is empty in either configuration.
  KDIR =
  # Core-specific kernel selection is optional (a missing file is ignored);
  # the generic KERNEL file is mandatory and is read after it.
  -include $(KERNELDIR)/KERNEL.$(TARGET_CORE)
  include $(KERNELDIR)/KERNEL

  # Rule sets for the individual kernel groups, read in this order.
  include Makefile.L1 Makefile.L2 Makefile.L3 Makefile.LA
  # HPLOBJS: a fixed list of double-precision kernel objects (GEMM kernel and
  # copy routines, TRSM kernels and copy routines, and a few level-1/level-2
  # kernels).  The list is expanded lazily, so $(SUFFIX) and the DGEMM*OBJ
  # variables are resolved at the point of use.
  HPLOBJS = \
      dgemm_kernel.$(SUFFIX) \
      $(DGEMMINCOPYOBJ) $(DGEMMITCOPYOBJ) $(DGEMMONCOPYOBJ) $(DGEMMOTCOPYOBJ) \
      $(addsuffix .$(SUFFIX), \
          dtrsm_kernel_LN dtrsm_kernel_LT dtrsm_kernel_RN dtrsm_kernel_RT \
          daxpy_k dcopy_k ddot_k dger_k dscal_k idamax_k \
          dgemv_n dgemv_t dgemm_beta \
          dtrsm_iunucopy dtrsm_iunncopy dtrsm_ilnucopy dtrsm_ilnncopy \
          dtrsm_iutucopy dtrsm_iutncopy dtrsm_iltucopy dtrsm_iltncopy \
          dtrsm_ounucopy dtrsm_ounncopy dtrsm_olnucopy dtrsm_olnncopy \
          dtrsm_outucopy dtrsm_outncopy dtrsm_oltucopy dtrsm_oltncopy)
  # Helper objects that are added to COMMONOBJS unconditionally.
  COMMONOBJS += $(addsuffix .$(SUFFIX), lsame scabs1 dcabs1)

  # Dynamic-architecture builds additionally need the per-core setparam
  # object, and pass the core suffix to the compiler as TS.
  ifeq ($(DYNAMIC_ARCH), 1)
    CCOMMON_OPT += -DTS=$(TSUFFIX)
    SBLASOBJS += setparam$(TSUFFIX).$(SUFFIX)
  endif
  # Interface headers from which kernel$(TSUFFIX).h is generated by the sed
  # rule later in this file.  The LAPACK header is included unless
  # NO_LAPACK is exactly 1.
  KERNEL_INTERFACE = $(addprefix ../common_, level1.h level2.h level3.h)
  ifneq ($(NO_LAPACK), 1)
    KERNEL_INTERFACE += ../common_lapack.h
  endif
  # Optional additions to COMMONOBJS.

  # 32-bit x86 builds get the cpuid helper.
  ifeq ($(ARCH), x86)
    COMMONOBJS += $(addsuffix .$(SUFFIX), cpuid)
  endif

  # Each of the two extended-precision switches adds the q* helpers; the
  # switches are tested independently of each other.
  ifdef EXPRECISION
    COMMONOBJS += $(addsuffix .$(SUFFIX), qconjg qcabs1)
  endif
  ifdef QUAD_PRECISION
    COMMONOBJS += $(addsuffix .$(SUFFIX), qconjg qcabs1)
  endif
  # "all" names a command, not a file: declare it phony so that a stray file
  # called "all" in this directory cannot make the build look up to date.
  .PHONY: all
  all : libs
  # Helper objects built with F_INTERFACE defined.  Each rule compiles one
  # kernel source into an object in the current directory; only the
  # precision/complex defines differ between them.

  # Single-precision complex absolute value.
  scabs1.$(SUFFIX): $(KERNELDIR)/$(SCABS_KERNEL)
	$(CC) $(CFLAGS) -c -DCOMPLEX -UDOUBLE -DF_INTERFACE -o $(@F) $<

  # Double-precision complex absolute value.
  dcabs1.$(SUFFIX): $(KERNELDIR)/$(DCABS_KERNEL)
	$(CC) $(CFLAGS) -c -DCOMPLEX -DDOUBLE -DF_INTERFACE -o $(@F) $<

  # Extended-precision (XDOUBLE) complex absolute value.
  qcabs1.$(SUFFIX): $(KERNELDIR)/$(QCABS_KERNEL)
	$(CC) $(CFLAGS) -c -DCOMPLEX -DXDOUBLE -DF_INTERFACE -o $(@F) $<

  # Extended-precision (XDOUBLE) qconjg helper, from assembly source.
  qconjg.$(SUFFIX): $(KERNELDIR)/qconjg.S
	$(CC) $(CFLAGS) -c -DCOMPLEX -DXDOUBLE -DF_INTERFACE -o $(@F) $<

  # lsame helper.
  lsame.$(SUFFIX): $(KERNELDIR)/$(LSAME_KERNEL)
	$(CC) $(CFLAGS) -c -DF_INTERFACE -o $(@F) $<
  # Compile the generated setparam source for this core.  It also depends on
  # the generated kernel header.  USE_GEMM3M=1 adds -DUSE_GEMM3M; any other
  # value compiles without it.
  setparam$(TSUFFIX).$(SUFFIX): setparam$(TSUFFIX).c kernel$(TSUFFIX).h
  ifneq ($(USE_GEMM3M), 1)
	$(CC) -c $(CFLAGS) $< -o $@
  else
	$(CC) -c $(CFLAGS) -DUSE_GEMM3M $< -o $@
  endif
  # Generated sources.
  #
  # Both files are produced by sed into the current directory.  The output is
  # written to a temporary file and renamed only on success, so a failed sed
  # can never leave a truncated file that looks newer than its prerequisites.

  # setparam<TSUFFIX>.c: setparam-ref.c with every "TS" replaced by the core
  # suffix.
  setparam$(TSUFFIX).c : setparam-ref.c
	sed 's/TS/$(TSUFFIX)/g' $< > $(@F).tmp || { rm -f $(@F).tmp; exit 1; }
	mv -f $(@F).tmp $(@F)

  # kernel<TSUFFIX>.h: the concatenated interface headers with the core
  # suffix inserted before each "(" (absorbing any spaces in front of it).
  kernel$(TSUFFIX).h : $(KERNEL_INTERFACE)
	sed 's/\ *(/$(TSUFFIX)(/g' $^ > $(@F).tmp || { rm -f $(@F).tmp; exit 1; }
	mv -f $(@F).tmp $(@F)
  # cpuid helper, assembled from the kernel directory's cpuid.S.
  cpuid.$(SUFFIX): $(KERNELDIR)/cpuid.S
	$(CC) $(CFLAGS) -c -o $(@F) $<
  # $(PSUFFIX) variants of the helper objects: same sources and defines as
  # the $(SUFFIX) rules, compiled with $(PFLAGS) in place of $(CFLAGS).

  scabs1.$(PSUFFIX): $(KERNELDIR)/$(SCABS_KERNEL)
	$(CC) $(PFLAGS) -c -DCOMPLEX -UDOUBLE -DF_INTERFACE -o $(@F) $<

  dcabs1.$(PSUFFIX): $(KERNELDIR)/$(DCABS_KERNEL)
	$(CC) $(PFLAGS) -c -DCOMPLEX -DDOUBLE -DF_INTERFACE -o $(@F) $<

  qcabs1.$(PSUFFIX): $(KERNELDIR)/$(QCABS_KERNEL)
	$(CC) $(PFLAGS) -c -DCOMPLEX -DXDOUBLE -DF_INTERFACE -o $(@F) $<

  qconjg.$(PSUFFIX): $(KERNELDIR)/qconjg.S
	$(CC) $(PFLAGS) -c -DCOMPLEX -DXDOUBLE -DF_INTERFACE -o $(@F) $<

  lsame.$(PSUFFIX): $(KERNELDIR)/$(LSAME_KERNEL)
	$(CC) $(PFLAGS) -c -DF_INTERFACE -o $(@F) $<

  cpuid.$(PSUFFIX): $(KERNELDIR)/cpuid.S
	$(CC) $(PFLAGS) -c -o $(@F) $<
  # Remove the sources and headers generated by the sed rules in this file.
  # This runs for every configuration (it is not restricted to DYNAMIC_ARCH
  # builds).  setparam.c is the generated name when TSUFFIX is empty and was
  # previously left behind.  A double-colon rule lets other makefiles add
  # their own clean steps.
  clean ::
	@rm -f setparam_*.c kernel_*.h setparam.c setparam.h kernel.h
  133. include $(TOPDIR)/Makefile.tail