You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

Makefile 10 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399
  1. TOPDIR = ..
  2. include ../Makefile.system
  3. ifeq ($(F_COMPILER),GFORTRAN)
  4. override FFLAGS += -fno-tree-vectorize
  5. endif
  6. SUPPORT_GEMM3M = 0
  7. ifeq ($(ARCH), x86)
  8. SUPPORT_GEMM3M = 1
  9. endif
  10. ifeq ($(ARCH), x86_64)
  11. SUPPORT_GEMM3M = 1
  12. endif
  13. ifeq ($(ARCH), ia64)
  14. SUPPORT_GEMM3M = 1
  15. endif
  16. ifeq ($(ARCH), MIPS)
  17. SUPPORT_GEMM3M = 1
  18. endif
  19. ifeq ($(NOFORTRAN),1)
  20. all ::
  21. else
  22. all :: level1 level2 level3
  23. endif
  24. ifeq ($(BUILD_SINGLE),1)
  25. S1=sblat1
  26. endif
  27. ifeq ($(BUILD_DOUBLE),1)
  28. D1=dblat1
  29. endif
  30. ifeq ($(BUILD_COMPLEX),1)
  31. C1=cblat1
  32. endif
  33. ifeq ($(BUILD_COMPLEX16),1)
  34. Z1=zblat1
  35. endif
  36. level1: $(S1) $(D1) $(C1) $(Z1)
  37. ifneq ($(CROSS), 1)
  38. ifeq ($(BUILD_SINGLE),1)
  39. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./sblat1
  40. endif
  41. ifeq ($(BUILD_DOUBLE),1)
  42. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./dblat1
  43. endif
  44. ifeq ($(BUILD_COMPLEX),1)
  45. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./cblat1
  46. endif
  47. ifeq ($(BUILD_COMPLEX16),1)
  48. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./zblat1
  49. endif
  50. ifdef SMP
  51. ifeq ($(USE_OPENMP), 1)
  52. ifeq ($(BUILD_SINGLE),1)
  53. OMP_NUM_THREADS=2 ./sblat1
  54. endif
  55. ifeq ($(BUILD_DOUBLE),1)
  56. OMP_NUM_THREADS=2 ./dblat1
  57. endif
  58. ifeq ($(BUILD_COMPLEX),1)
  59. OMP_NUM_THREADS=2 ./cblat1
  60. endif
  61. ifeq ($(BUILD_COMPLEX16),1)
  62. OMP_NUM_THREADS=2 ./zblat1
  63. endif
  64. else
  65. ifeq ($(BUILD_SINGLE),1)
  66. OPENBLAS_NUM_THREADS=2 ./sblat1
  67. endif
  68. ifeq ($(BUILD_DOUBLE),1)
  69. OPENBLAS_NUM_THREADS=2 ./dblat1
  70. endif
  71. ifeq ($(BUILD_COMPLEX),1)
  72. OPENBLAS_NUM_THREADS=2 ./cblat1
  73. endif
  74. ifeq ($(BUILD_COMPLEX16),1)
  75. OPENBLAS_NUM_THREADS=2 ./zblat1
  76. endif
  77. endif
  78. endif
  79. endif
  80. ifeq ($(BUILD_SINGLE),1)
  81. S2=sblat2
  82. endif
  83. ifeq ($(BUILD_DOUBLE),1)
  84. D2=dblat2
  85. endif
  86. ifeq ($(BUILD_COMPLEX),1)
  87. C2=cblat2
  88. endif
  89. ifeq ($(BUILD_COMPLEX16),1)
  90. Z2=zblat2
  91. endif
  92. level2: $(S2) $(D2) $(C2) $(Z2)
  93. ifneq ($(CROSS), 1)
  94. rm -f ?BLAT2.SUMM
  95. ifeq ($(BUILD_SINGLE),1)
  96. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./sblat2 < ./sblat2.dat
  97. @$(GREP) -q FATAL SBLAT2.SUMM && cat SBLAT2.SUMM || exit 0
  98. endif
  99. ifeq ($(BUILD_DOUBLE),1)
  100. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./dblat2 < ./dblat2.dat
  101. @$(GREP) -q FATAL DBLAT2.SUMM && cat DBLAT2.SUMM || exit 0
  102. endif
  103. ifeq ($(BUILD_COMPLEX),1)
  104. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./cblat2 < ./cblat2.dat
  105. @$(GREP) -q FATAL CBLAT2.SUMM && cat CBLAT2.SUMM || exit 0
  106. endif
  107. ifeq ($(BUILD_COMPLEX16),1)
  108. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./zblat2 < ./zblat2.dat
  109. @$(GREP) -q FATAL ZBLAT2.SUMM && cat ZBLAT2.SUMM || exit 0
  110. endif
  111. ifdef SMP
  112. rm -f ?BLAT2.SUMM
  113. ifeq ($(USE_OPENMP), 1)
  114. ifeq ($(BUILD_SINGLE),1)
  115. OMP_NUM_THREADS=2 ./sblat2 < ./sblat2.dat
  116. @$(GREP) -q FATAL SBLAT2.SUMM && cat SBLAT2.SUMM || exit 0
  117. endif
  118. ifeq ($(BUILD_DOUBLE),1)
  119. OMP_NUM_THREADS=2 ./dblat2 < ./dblat2.dat
  120. @$(GREP) -q FATAL DBLAT2.SUMM && cat DBLAT2.SUMM || exit 0
  121. endif
  122. ifeq ($(BUILD_COMPLEX),1)
  123. OMP_NUM_THREADS=2 ./cblat2 < ./cblat2.dat
  124. @$(GREP) -q FATAL CBLAT2.SUMM && cat CBLAT2.SUMM || exit 0
  125. endif
  126. ifeq ($(BUILD_COMPLEX16),1)
  127. OMP_NUM_THREADS=2 ./zblat2 < ./zblat2.dat
  128. @$(GREP) -q FATAL ZBLAT2.SUMM && cat ZBLAT2.SUMM || exit 0
  129. endif
  130. else
  131. ifeq ($(BUILD_SINGLE),1)
  132. OPENBLAS_NUM_THREADS=2 ./sblat2 < ./sblat2.dat
  133. @$(GREP) -q FATAL SBLAT2.SUMM && cat SBLAT2.SUMM || exit 0
  134. endif
  135. ifeq ($(BUILD_DOUBLE),1)
  136. OPENBLAS_NUM_THREADS=2 ./dblat2 < ./dblat2.dat
  137. @$(GREP) -q FATAL DBLAT2.SUMM && cat DBLAT2.SUMM || exit 0
  138. endif
  139. ifeq ($(BUILD_COMPLEX),1)
  140. OPENBLAS_NUM_THREADS=2 ./cblat2 < ./cblat2.dat
  141. @$(GREP) -q FATAL CBLAT2.SUMM && cat CBLAT2.SUMM || exit 0
  142. endif
  143. ifeq ($(BUILD_COMPLEX16),1)
  144. OPENBLAS_NUM_THREADS=2 ./zblat2 < ./zblat2.dat
  145. @$(GREP) -q FATAL ZBLAT2.SUMM && cat ZBLAT2.SUMM || exit 0
  146. endif
  147. endif
  148. endif
  149. endif
  150. ifeq ($(BUILD_BFLOAT16),1)
  151. B3= test_sbgemm
  152. endif
  153. ifeq ($(BUILD_SINGLE),1)
  154. S3=sblat3
  155. endif
  156. ifeq ($(BUILD_DOUBLE),1)
  157. D3=dblat3
  158. endif
  159. ifeq ($(BUILD_COMPLEX),1)
  160. ifeq ($(SUPPORT_GEMM3M),1)
  161. C3=cblat3 cblat3_3m
  162. else
  163. C3=cblat3
  164. endif
  165. endif
  166. ifeq ($(BUILD_COMPLEX16),1)
  167. ifeq ($(SUPPORT_GEMM3M),1)
  168. Z3=zblat3 zblat3_3m
  169. else
  170. Z3=zblat3
  171. endif
  172. endif
  173. level3: $(B3) $(S3) $(D3) $(C3) $(Z3)
  174. ifneq ($(CROSS), 1)
  175. rm -f ?BLAT3.SUMM
  176. ifeq ($(BUILD_BFLOAT16),1)
  177. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./test_sbgemm > SBBLAT3.SUMM
  178. @$(GREP) -q FATAL SBBLAT3.SUMM && cat SBBLAT3.SUMM || exit 0
  179. endif
  180. ifeq ($(BUILD_SINGLE),1)
  181. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./sblat3 < ./sblat3.dat
  182. @$(GREP) -q FATAL SBLAT3.SUMM && cat SBLAT3.SUMM || exit 0
  183. endif
  184. ifeq ($(BUILD_DOUBLE),1)
  185. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./dblat3 < ./dblat3.dat
  186. @$(GREP) -q FATAL DBLAT3.SUMM && cat DBLAT3.SUMM || exit 0
  187. endif
  188. ifeq ($(BUILD_COMPLEX),1)
  189. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./cblat3 < ./cblat3.dat
  190. @$(GREP) -q FATAL CBLAT3.SUMM && cat CBLAT3.SUMM || exit 0
  191. endif
  192. ifeq ($(BUILD_COMPLEX16),1)
  193. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./zblat3 < ./zblat3.dat
  194. @$(GREP) -q FATAL ZBLAT3.SUMM && cat ZBLAT3.SUMM || exit 0
  195. endif
  196. ifdef SMP
  197. rm -f ?BLAT3.SUMM
  198. ifeq ($(USE_OPENMP), 1)
  199. ifeq ($(BUILD_BFLOAT16),1)
  200. OMP_NUM_THREADS=2 ./test_sbgemm > SBBLAT3.SUMM
  201. @$(GREP) -q FATAL SBBLAT3.SUMM && cat SBBLAT3.SUMM || exit 0
  202. endif
  203. ifeq ($(BUILD_SINGLE),1)
  204. OMP_NUM_THREADS=2 ./sblat3 < ./sblat3.dat
  205. @$(GREP) -q FATAL SBLAT3.SUMM && cat SBLAT3.SUMM || exit 0
  206. endif
  207. ifeq ($(BUILD_DOUBLE),1)
  208. OMP_NUM_THREADS=2 ./dblat3 < ./dblat3.dat
  209. @$(GREP) -q FATAL DBLAT3.SUMM && cat DBLAT3.SUMM || exit 0
  210. endif
  211. ifeq ($(BUILD_COMPLEX),1)
  212. OMP_NUM_THREADS=2 ./cblat3 < ./cblat3.dat
  213. @$(GREP) -q FATAL CBLAT3.SUMM && cat CBLAT3.SUMM || exit 0
  214. endif
  215. ifeq ($(BUILD_COMPLEX16),1)
  216. OMP_NUM_THREADS=2 ./zblat3 < ./zblat3.dat
  217. @$(GREP) -q FATAL ZBLAT3.SUMM && cat ZBLAT3.SUMM || exit 0
  218. endif
  219. else
  220. ifeq ($(BUILD_BFLOAT16),1)
  221. OPENBLAS_NUM_THREADS=2 ./test_sbgemm > SBBLAT3.SUMM
  222. @$(GREP) -q FATAL SBBLAT3.SUMM && cat SBBLAT3.SUMM || exit 0
  223. endif
  224. ifeq ($(BUILD_SINGLE),1)
  225. OPENBLAS_NUM_THREADS=2 ./sblat3 < ./sblat3.dat
  226. @$(GREP) -q FATAL SBLAT3.SUMM && cat SBLAT3.SUMM || exit 0
  227. endif
  228. ifeq ($(BUILD_DOUBLE),1)
  229. OPENBLAS_NUM_THREADS=2 ./dblat3 < ./dblat3.dat
  230. @$(GREP) -q FATAL DBLAT3.SUMM && cat DBLAT3.SUMM || exit 0
  231. endif
  232. ifeq ($(BUILD_COMPLEX),1)
  233. OPENBLAS_NUM_THREADS=2 ./cblat3 < ./cblat3.dat
  234. @$(GREP) -q FATAL CBLAT3.SUMM && cat CBLAT3.SUMM || exit 0
  235. endif
  236. ifeq ($(BUILD_COMPLEX16),1)
  237. OPENBLAS_NUM_THREADS=2 ./zblat3 < ./zblat3.dat
  238. @$(GREP) -q FATAL ZBLAT3.SUMM && cat ZBLAT3.SUMM || exit 0
  239. endif
  240. endif
  241. endif
  242. endif
  243. level3_3m : zblat3_3m cblat3_3m
  244. ifneq ($(CROSS), 1)
  245. rm -f ?BLAT3_3M.SUMM
  246. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./cblat3_3m < ./cblat3_3m.dat
  247. @$(GREP) -q FATAL CBLAT3_3M.SUMM && cat CBLAT3_3M.SUMM || exit 0
  248. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./zblat3_3m < ./zblat3_3m.dat
  249. @$(GREP) -q FATAL ZBLAT3_3M.SUMM && cat ZBLAT3_3M.SUMM || exit 0
  250. ifdef SMP
  251. rm -f ?BLAT3_3M.SUMM
  252. ifeq ($(USE_OPENMP), 1)
  253. OMP_NUM_THREADS=2 ./cblat3_3m < ./cblat3_3m.dat
  254. @$(GREP) -q FATAL CBLAT3_3M.SUMM && cat CBLAT3_3M.SUMM || exit 0
  255. OMP_NUM_THREADS=2 ./zblat3_3m < ./zblat3_3m.dat
  256. @$(GREP) -q FATAL ZBLAT3_3M.SUMM && cat ZBLAT3_3M.SUMM || exit 0
  257. else
  258. OPENBLAS_NUM_THREADS=2 ./cblat3_3m < ./cblat3_3m.dat
  259. @$(GREP) -q FATAL CBLAT3_3M.SUMM && cat CBLAT3_3M.SUMM || exit 0
  260. OPENBLAS_NUM_THREADS=2 ./zblat3_3m < ./zblat3_3m.dat
  261. @$(GREP) -q FATAL ZBLAT3_3M.SUMM && cat ZBLAT3_3M.SUMM || exit 0
  262. endif
  263. endif
  264. endif
  265. FLDFLAGS = $(FFLAGS:-fPIC=) $(LDFLAGS)
  266. CLDFLAGS = $(CFLAGS) $(LDFLAGS)
  267. ifeq ($(USE_OPENMP), 1)
  268. ifeq ($(F_COMPILER), GFORTRAN)
  269. ifeq ($(C_COMPILER), CLANG)
  270. CEXTRALIB += -lomp
  271. endif
  272. endif
  273. ifeq ($(F_COMPILER), NAG)
  274. CEXTRALIB = -lgomp
  275. endif
  276. ifeq ($(F_COMPILER), IBM)
  277. ifeq ($(C_COMPILER), GCC)
  278. CEXTRALIB += -lgomp
  279. endif
  280. ifeq ($(C_COMPILER), CLANG)
  281. CEXTRALIB += -lomp
  282. endif
  283. endif
  284. endif
  285. ifeq ($(BUILD_SINGLE),1)
  286. sblat1 : sblat1.$(SUFFIX) ../$(LIBNAME)
  287. $(FC) $(FLDFLAGS) -o sblat1 sblat1.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  288. sblat2 : sblat2.$(SUFFIX) ../$(LIBNAME)
  289. $(FC) $(FLDFLAGS) -o sblat2 sblat2.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  290. sblat3 : sblat3.$(SUFFIX) ../$(LIBNAME)
  291. $(FC) $(FLDFLAGS) -o sblat3 sblat3.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  292. endif
  293. ifeq ($(BUILD_DOUBLE),1)
  294. dblat1 : dblat1.$(SUFFIX) ../$(LIBNAME)
  295. $(FC) $(FLDFLAGS) -o dblat1 dblat1.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  296. dblat2 : dblat2.$(SUFFIX) ../$(LIBNAME)
  297. $(FC) $(FLDFLAGS) -o dblat2 dblat2.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  298. dblat3 : dblat3.$(SUFFIX) ../$(LIBNAME)
  299. $(FC) $(FLDFLAGS) -o dblat3 dblat3.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  300. else
  301. dblat2:
  302. dblat3:
  303. endif
  304. qblat1 : qblat1.$(SUFFIX) ../$(LIBNAME)
  305. $(FC) $(FLDFLAGS) -o qblat1 qblat1.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  306. ifeq ($(BUILD_COMPLEX),1)
  307. cblat1 : cblat1.$(SUFFIX) ../$(LIBNAME)
  308. $(FC) $(FLDFLAGS) -o cblat1 cblat1.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  309. cblat2 : cblat2.$(SUFFIX) ../$(LIBNAME)
  310. $(FC) $(FLDFLAGS) -o cblat2 cblat2.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  311. cblat3 : cblat3.$(SUFFIX) ../$(LIBNAME)
  312. $(FC) $(FLDFLAGS) -o cblat3 cblat3.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  313. endif
  314. ifeq ($(BUILD_COMPLEX16),1)
  315. zblat1 : zblat1.$(SUFFIX) ../$(LIBNAME)
  316. $(FC) $(FLDFLAGS) -o zblat1 zblat1.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  317. zblat2 : zblat2.$(SUFFIX) ../$(LIBNAME)
  318. $(FC) $(FLDFLAGS) -o zblat2 zblat2.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  319. zblat3 : zblat3.$(SUFFIX) ../$(LIBNAME)
  320. $(FC) $(FLDFLAGS) -o zblat3 zblat3.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  321. endif
  322. ifeq ($(BUILD_BFLOAT16),1)
  323. test_sbgemm : compare_sgemm_sbgemm.c ../$(LIBNAME)
  324. $(CC) $(CLDFLAGS) -o test_sbgemm compare_sgemm_sbgemm.c ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  325. endif
  326. ifeq ($(BUILD_COMPLEX),1)
  327. cblat3_3m : cblat3_3m.$(SUFFIX) ../$(LIBNAME)
  328. $(FC) $(FLDFLAGS) -o cblat3_3m cblat3_3m.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  329. endif
  330. ifeq ($(BUILD_COMPLEX16),1)
  331. zblat3_3m : zblat3_3m.$(SUFFIX) ../$(LIBNAME)
  332. $(FC) $(FLDFLAGS) -o zblat3_3m zblat3_3m.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  333. endif
  334. clean:
  335. @rm -f *.$(SUFFIX) *.$(PSUFFIX) gmon.$(SUFFIX)ut *.SUMM *.cxml *.exe *.pdb *.dwf \
  336. sblat1 dblat1 cblat1 zblat1 \
  337. sblat2 dblat2 cblat2 zblat2 \
  338. test_sbgemm sblat3 dblat3 cblat3 zblat3 \
  339. sblat1p dblat1p cblat1p zblat1p \
  340. sblat2p dblat2p cblat2p zblat2p \
  341. sblat3p dblat3p cblat3p zblat3p \
  342. zblat3_3m zblat3_3mp \
  343. cblat3_3m cblat3_3mp \
  344. *.stackdump *.dll
  345. libs:
  346. prof:
  347. quick :
  348. $(MAKE) -C $(TOPDIR) libs
  349. # include ../Makefile.tail