You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

Makefile 10 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400
  1. TOPDIR = ..
  2. include ../Makefile.system
  3. ifeq ($(F_COMPILER),GFORTRAN)
  4. override FFLAGS = $(filter_out(-O2 -O3,$(FFLAGS)) -O0
  5. override FFLAGS += -fno-tree-vectorize
  6. endif
  7. SUPPORT_GEMM3M = 0
  8. ifeq ($(ARCH), x86)
  9. SUPPORT_GEMM3M = 1
  10. endif
  11. ifeq ($(ARCH), x86_64)
  12. SUPPORT_GEMM3M = 1
  13. endif
  14. ifeq ($(ARCH), ia64)
  15. SUPPORT_GEMM3M = 1
  16. endif
  17. ifeq ($(ARCH), MIPS)
  18. SUPPORT_GEMM3M = 1
  19. endif
  20. ifeq ($(NOFORTRAN),1)
  21. all ::
  22. else
  23. all :: level1 level2 level3
  24. endif
  25. ifeq ($(BUILD_SINGLE),1)
  26. S1=sblat1
  27. endif
  28. ifeq ($(BUILD_DOUBLE),1)
  29. D1=dblat1
  30. endif
  31. ifeq ($(BUILD_COMPLEX),1)
  32. C1=cblat1
  33. endif
  34. ifeq ($(BUILD_COMPLEX16),1)
  35. Z1=zblat1
  36. endif
  37. level1: $(S1) $(D1) $(C1) $(Z1)
  38. ifneq ($(CROSS), 1)
  39. ifeq ($(BUILD_SINGLE),1)
  40. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./sblat1
  41. endif
  42. ifeq ($(BUILD_DOUBLE),1)
  43. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./dblat1
  44. endif
  45. ifeq ($(BUILD_COMPLEX),1)
  46. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./cblat1
  47. endif
  48. ifeq ($(BUILD_COMPLEX16),1)
  49. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./zblat1
  50. endif
  51. ifdef SMP
  52. ifeq ($(USE_OPENMP), 1)
  53. ifeq ($(BUILD_SINGLE),1)
  54. OMP_NUM_THREADS=2 ./sblat1
  55. endif
  56. ifeq ($(BUILD_DOUBLE),1)
  57. OMP_NUM_THREADS=2 ./dblat1
  58. endif
  59. ifeq ($(BUILD_COMPLEX),1)
  60. OMP_NUM_THREADS=2 ./cblat1
  61. endif
  62. ifeq ($(BUILD_COMPLEX16),1)
  63. OMP_NUM_THREADS=2 ./zblat1
  64. endif
  65. else
  66. ifeq ($(BUILD_SINGLE),1)
  67. OPENBLAS_NUM_THREADS=2 ./sblat1
  68. endif
  69. ifeq ($(BUILD_DOUBLE),1)
  70. OPENBLAS_NUM_THREADS=2 ./dblat1
  71. endif
  72. ifeq ($(BUILD_COMPLEX),1)
  73. OPENBLAS_NUM_THREADS=2 ./cblat1
  74. endif
  75. ifeq ($(BUILD_COMPLEX16),1)
  76. OPENBLAS_NUM_THREADS=2 ./zblat1
  77. endif
  78. endif
  79. endif
  80. endif
  81. ifeq ($(BUILD_SINGLE),1)
  82. S2=sblat2
  83. endif
  84. ifeq ($(BUILD_DOUBLE),1)
  85. D2=dblat2
  86. endif
  87. ifeq ($(BUILD_COMPLEX),1)
  88. C2=cblat2
  89. endif
  90. ifeq ($(BUILD_COMPLEX16),1)
  91. Z2=zblat2
  92. endif
  93. level2: $(S2) $(D2) $(C2) $(Z2)
  94. ifneq ($(CROSS), 1)
  95. rm -f ?BLAT2.SUMM
  96. ifeq ($(BUILD_SINGLE),1)
  97. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./sblat2 < ./sblat2.dat
  98. @$(GREP) -q FATAL SBLAT2.SUMM && cat SBLAT2.SUMM || exit 0
  99. endif
  100. ifeq ($(BUILD_DOUBLE),1)
  101. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./dblat2 < ./dblat2.dat
  102. @$(GREP) -q FATAL DBLAT2.SUMM && cat DBLAT2.SUMM || exit 0
  103. endif
  104. ifeq ($(BUILD_COMPLEX),1)
  105. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./cblat2 < ./cblat2.dat
  106. @$(GREP) -q FATAL CBLAT2.SUMM && cat CBLAT2.SUMM || exit 0
  107. endif
  108. ifeq ($(BUILD_COMPLEX16),1)
  109. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./zblat2 < ./zblat2.dat
  110. @$(GREP) -q FATAL ZBLAT2.SUMM && cat ZBLAT2.SUMM || exit 0
  111. endif
  112. ifdef SMP
  113. rm -f ?BLAT2.SUMM
  114. ifeq ($(USE_OPENMP), 1)
  115. ifeq ($(BUILD_SINGLE),1)
  116. OMP_NUM_THREADS=2 ./sblat2 < ./sblat2.dat
  117. @$(GREP) -q FATAL SBLAT2.SUMM && cat SBLAT2.SUMM || exit 0
  118. endif
  119. ifeq ($(BUILD_DOUBLE),1)
  120. OMP_NUM_THREADS=2 ./dblat2 < ./dblat2.dat
  121. @$(GREP) -q FATAL DBLAT2.SUMM && cat DBLAT2.SUMM || exit 0
  122. endif
  123. ifeq ($(BUILD_COMPLEX),1)
  124. OMP_NUM_THREADS=2 ./cblat2 < ./cblat2.dat
  125. @$(GREP) -q FATAL CBLAT2.SUMM && cat CBLAT2.SUMM || exit 0
  126. endif
  127. ifeq ($(BUILD_COMPLEX16),1)
  128. OMP_NUM_THREADS=2 ./zblat2 < ./zblat2.dat
  129. @$(GREP) -q FATAL ZBLAT2.SUMM && cat ZBLAT2.SUMM || exit 0
  130. endif
  131. else
  132. ifeq ($(BUILD_SINGLE),1)
  133. OPENBLAS_NUM_THREADS=2 ./sblat2 < ./sblat2.dat
  134. @$(GREP) -q FATAL SBLAT2.SUMM && cat SBLAT2.SUMM || exit 0
  135. endif
  136. ifeq ($(BUILD_DOUBLE),1)
  137. OPENBLAS_NUM_THREADS=2 ./dblat2 < ./dblat2.dat
  138. @$(GREP) -q FATAL DBLAT2.SUMM && cat DBLAT2.SUMM || exit 0
  139. endif
  140. ifeq ($(BUILD_COMPLEX),1)
  141. OPENBLAS_NUM_THREADS=2 ./cblat2 < ./cblat2.dat
  142. @$(GREP) -q FATAL CBLAT2.SUMM && cat CBLAT2.SUMM || exit 0
  143. endif
  144. ifeq ($(BUILD_COMPLEX16),1)
  145. OPENBLAS_NUM_THREADS=2 ./zblat2 < ./zblat2.dat
  146. @$(GREP) -q FATAL ZBLAT2.SUMM && cat ZBLAT2.SUMM || exit 0
  147. endif
  148. endif
  149. endif
  150. endif
  151. ifeq ($(BUILD_BFLOAT16),1)
  152. B3= test_sbgemm
  153. endif
  154. ifeq ($(BUILD_SINGLE),1)
  155. S3=sblat3
  156. endif
  157. ifeq ($(BUILD_DOUBLE),1)
  158. D3=dblat3
  159. endif
  160. ifeq ($(BUILD_COMPLEX),1)
  161. ifeq ($(SUPPORT_GEMM3M),1)
  162. C3=cblat3 cblat3_3m
  163. else
  164. C3=cblat3
  165. endif
  166. endif
  167. ifeq ($(BUILD_COMPLEX16),1)
  168. ifeq ($(SUPPORT_GEMM3M),1)
  169. Z3=zblat3 zblat3_3m
  170. else
  171. Z3=zblat3
  172. endif
  173. endif
  174. level3: $(B3) $(S3) $(D3) $(C3) $(Z3)
  175. ifneq ($(CROSS), 1)
  176. rm -f ?BLAT3.SUMM
  177. ifeq ($(BUILD_BFLOAT16),1)
  178. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./test_sbgemm > SBBLAT3.SUMM
  179. @$(GREP) -q FATAL SBBLAT3.SUMM && cat SBBLAT3.SUMM || exit 0
  180. endif
  181. ifeq ($(BUILD_SINGLE),1)
  182. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./sblat3 < ./sblat3.dat
  183. @$(GREP) -q FATAL SBLAT3.SUMM && cat SBLAT3.SUMM || exit 0
  184. endif
  185. ifeq ($(BUILD_DOUBLE),1)
  186. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./dblat3 < ./dblat3.dat
  187. @$(GREP) -q FATAL DBLAT3.SUMM && cat DBLAT3.SUMM || exit 0
  188. endif
  189. ifeq ($(BUILD_COMPLEX),1)
  190. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./cblat3 < ./cblat3.dat
  191. @$(GREP) -q FATAL CBLAT3.SUMM && cat CBLAT3.SUMM || exit 0
  192. endif
  193. ifeq ($(BUILD_COMPLEX16),1)
  194. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./zblat3 < ./zblat3.dat
  195. @$(GREP) -q FATAL ZBLAT3.SUMM && cat ZBLAT3.SUMM || exit 0
  196. endif
  197. ifdef SMP
  198. rm -f ?BLAT3.SUMM
  199. ifeq ($(USE_OPENMP), 1)
  200. ifeq ($(BUILD_BFLOAT16),1)
  201. OMP_NUM_THREADS=2 ./test_sbgemm > SBBLAT3.SUMM
  202. @$(GREP) -q FATAL SBBLAT3.SUMM && cat SBBLAT3.SUMM || exit 0
  203. endif
  204. ifeq ($(BUILD_SINGLE),1)
  205. OMP_NUM_THREADS=2 ./sblat3 < ./sblat3.dat
  206. @$(GREP) -q FATAL SBLAT3.SUMM && cat SBLAT3.SUMM || exit 0
  207. endif
  208. ifeq ($(BUILD_DOUBLE),1)
  209. OMP_NUM_THREADS=2 ./dblat3 < ./dblat3.dat
  210. @$(GREP) -q FATAL DBLAT3.SUMM && cat DBLAT3.SUMM || exit 0
  211. endif
  212. ifeq ($(BUILD_COMPLEX),1)
  213. OMP_NUM_THREADS=2 ./cblat3 < ./cblat3.dat
  214. @$(GREP) -q FATAL CBLAT3.SUMM && cat CBLAT3.SUMM || exit 0
  215. endif
  216. ifeq ($(BUILD_COMPLEX16),1)
  217. OMP_NUM_THREADS=2 ./zblat3 < ./zblat3.dat
  218. @$(GREP) -q FATAL ZBLAT3.SUMM && cat ZBLAT3.SUMM || exit 0
  219. endif
  220. else
  221. ifeq ($(BUILD_BFLOAT16),1)
  222. OPENBLAS_NUM_THREADS=2 ./test_sbgemm > SBBLAT3.SUMM
  223. @$(GREP) -q FATAL SBBLAT3.SUMM && cat SBBLAT3.SUMM || exit 0
  224. endif
  225. ifeq ($(BUILD_SINGLE),1)
  226. OPENBLAS_NUM_THREADS=2 ./sblat3 < ./sblat3.dat
  227. @$(GREP) -q FATAL SBLAT3.SUMM && cat SBLAT3.SUMM || exit 0
  228. endif
  229. ifeq ($(BUILD_DOUBLE),1)
  230. OPENBLAS_NUM_THREADS=2 ./dblat3 < ./dblat3.dat
  231. @$(GREP) -q FATAL DBLAT3.SUMM && cat DBLAT3.SUMM || exit 0
  232. endif
  233. ifeq ($(BUILD_COMPLEX),1)
  234. OPENBLAS_NUM_THREADS=2 ./cblat3 < ./cblat3.dat
  235. @$(GREP) -q FATAL CBLAT3.SUMM && cat CBLAT3.SUMM || exit 0
  236. endif
  237. ifeq ($(BUILD_COMPLEX16),1)
  238. OPENBLAS_NUM_THREADS=2 ./zblat3 < ./zblat3.dat
  239. @$(GREP) -q FATAL ZBLAT3.SUMM && cat ZBLAT3.SUMM || exit 0
  240. endif
  241. endif
  242. endif
  243. endif
  244. level3_3m : zblat3_3m cblat3_3m
  245. ifneq ($(CROSS), 1)
  246. rm -f ?BLAT3_3M.SUMM
  247. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./cblat3_3m < ./cblat3_3m.dat
  248. @$(GREP) -q FATAL CBLAT3_3M.SUMM && cat CBLAT3_3M.SUMM || exit 0
  249. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./zblat3_3m < ./zblat3_3m.dat
  250. @$(GREP) -q FATAL ZBLAT3_3M.SUMM && cat ZBLAT3_3M.SUMM || exit 0
  251. ifdef SMP
  252. rm -f ?BLAT3_3M.SUMM
  253. ifeq ($(USE_OPENMP), 1)
  254. OMP_NUM_THREADS=2 ./cblat3_3m < ./cblat3_3m.dat
  255. @$(GREP) -q FATAL CBLAT3_3M.SUMM && cat CBLAT3_3M.SUMM || exit 0
  256. OMP_NUM_THREADS=2 ./zblat3_3m < ./zblat3_3m.dat
  257. @$(GREP) -q FATAL ZBLAT3_3M.SUMM && cat ZBLAT3_3M.SUMM || exit 0
  258. else
  259. OPENBLAS_NUM_THREADS=2 ./cblat3_3m < ./cblat3_3m.dat
  260. @$(GREP) -q FATAL CBLAT3_3M.SUMM && cat CBLAT3_3M.SUMM || exit 0
  261. OPENBLAS_NUM_THREADS=2 ./zblat3_3m < ./zblat3_3m.dat
  262. @$(GREP) -q FATAL ZBLAT3_3M.SUMM && cat ZBLAT3_3M.SUMM || exit 0
  263. endif
  264. endif
  265. endif
  266. FLDFLAGS = $(FFLAGS:-fPIC=) $(LDFLAGS)
  267. CLDFLAGS = $(CFLAGS) $(LDFLAGS)
  268. ifeq ($(USE_OPENMP), 1)
  269. ifeq ($(F_COMPILER), GFORTRAN)
  270. ifeq ($(C_COMPILER), CLANG)
  271. CEXTRALIB += -lomp
  272. endif
  273. endif
  274. ifeq ($(F_COMPILER), NAG)
  275. CEXTRALIB = -lgomp
  276. endif
  277. ifeq ($(F_COMPILER), IBM)
  278. ifeq ($(C_COMPILER), GCC)
  279. CEXTRALIB += -lgomp
  280. endif
  281. ifeq ($(C_COMPILER), CLANG)
  282. CEXTRALIB += -lomp
  283. endif
  284. endif
  285. endif
  286. ifeq ($(BUILD_SINGLE),1)
  287. sblat1 : sblat1.$(SUFFIX) ../$(LIBNAME)
  288. $(FC) $(FLDFLAGS) -o sblat1 sblat1.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  289. sblat2 : sblat2.$(SUFFIX) ../$(LIBNAME)
  290. $(FC) $(FLDFLAGS) -o sblat2 sblat2.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  291. sblat3 : sblat3.$(SUFFIX) ../$(LIBNAME)
  292. $(FC) $(FLDFLAGS) -o sblat3 sblat3.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  293. endif
  294. ifeq ($(BUILD_DOUBLE),1)
  295. dblat1 : dblat1.$(SUFFIX) ../$(LIBNAME)
  296. $(FC) $(FLDFLAGS) -o dblat1 dblat1.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  297. dblat2 : dblat2.$(SUFFIX) ../$(LIBNAME)
  298. $(FC) $(FLDFLAGS) -o dblat2 dblat2.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  299. dblat3 : dblat3.$(SUFFIX) ../$(LIBNAME)
  300. $(FC) $(FLDFLAGS) -o dblat3 dblat3.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  301. else
  302. dblat2:
  303. dblat3:
  304. endif
  305. qblat1 : qblat1.$(SUFFIX) ../$(LIBNAME)
  306. $(FC) $(FLDFLAGS) -o qblat1 qblat1.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  307. ifeq ($(BUILD_COMPLEX),1)
  308. cblat1 : cblat1.$(SUFFIX) ../$(LIBNAME)
  309. $(FC) $(FLDFLAGS) -o cblat1 cblat1.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  310. cblat2 : cblat2.$(SUFFIX) ../$(LIBNAME)
  311. $(FC) $(FLDFLAGS) -o cblat2 cblat2.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  312. cblat3 : cblat3.$(SUFFIX) ../$(LIBNAME)
  313. $(FC) $(FLDFLAGS) -o cblat3 cblat3.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  314. endif
  315. ifeq ($(BUILD_COMPLEX16),1)
  316. zblat1 : zblat1.$(SUFFIX) ../$(LIBNAME)
  317. $(FC) $(FLDFLAGS) -o zblat1 zblat1.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  318. zblat2 : zblat2.$(SUFFIX) ../$(LIBNAME)
  319. $(FC) $(FLDFLAGS) -o zblat2 zblat2.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  320. zblat3 : zblat3.$(SUFFIX) ../$(LIBNAME)
  321. $(FC) $(FLDFLAGS) -o zblat3 zblat3.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  322. endif
  323. ifeq ($(BUILD_BFLOAT16),1)
  324. test_sbgemm : compare_sgemm_sbgemm.c ../$(LIBNAME)
  325. $(CC) $(CLDFLAGS) -o test_sbgemm compare_sgemm_sbgemm.c ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  326. endif
  327. ifeq ($(BUILD_COMPLEX),1)
  328. cblat3_3m : cblat3_3m.$(SUFFIX) ../$(LIBNAME)
  329. $(FC) $(FLDFLAGS) -o cblat3_3m cblat3_3m.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  330. endif
  331. ifeq ($(BUILD_COMPLEX16),1)
  332. zblat3_3m : zblat3_3m.$(SUFFIX) ../$(LIBNAME)
  333. $(FC) $(FLDFLAGS) -o zblat3_3m zblat3_3m.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  334. endif
  335. clean:
  336. @rm -f *.$(SUFFIX) *.$(PSUFFIX) gmon.$(SUFFIX)ut *.SUMM *.cxml *.exe *.pdb *.dwf \
  337. sblat1 dblat1 cblat1 zblat1 \
  338. sblat2 dblat2 cblat2 zblat2 \
  339. test_sbgemm sblat3 dblat3 cblat3 zblat3 \
  340. sblat1p dblat1p cblat1p zblat1p \
  341. sblat2p dblat2p cblat2p zblat2p \
  342. sblat3p dblat3p cblat3p zblat3p \
  343. zblat3_3m zblat3_3mp \
  344. cblat3_3m cblat3_3mp \
  345. *.stackdump *.dll
  346. libs:
  347. prof:
  348. quick :
  349. $(MAKE) -C $(TOPDIR) libs
  350. # include ../Makefile.tail