You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

Makefile 10 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402
  1. TOPDIR = ..
  2. include ../Makefile.system
  3. ifeq ($(F_COMPILER),GFORTRAN)
  4. ifneq (, $(filter $(CORE),LOONGSON3R3 LOONGSON3R4))
  5. override FFLAGS = $(filter_out(-O2 -O3,$(FFLAGS)) -O0
  6. endif
  7. override FFLAGS += -fno-tree-vectorize
  8. endif
  9. SUPPORT_GEMM3M = 0
  10. ifeq ($(ARCH), x86)
  11. SUPPORT_GEMM3M = 1
  12. endif
  13. ifeq ($(ARCH), x86_64)
  14. SUPPORT_GEMM3M = 1
  15. endif
  16. ifeq ($(ARCH), ia64)
  17. SUPPORT_GEMM3M = 1
  18. endif
  19. ifeq ($(ARCH), MIPS)
  20. SUPPORT_GEMM3M = 1
  21. endif
  22. ifeq ($(NOFORTRAN),1)
  23. all ::
  24. else
  25. all :: level1 level2 level3
  26. endif
  27. ifeq ($(BUILD_SINGLE),1)
  28. S1=sblat1
  29. endif
  30. ifeq ($(BUILD_DOUBLE),1)
  31. D1=dblat1
  32. endif
  33. ifeq ($(BUILD_COMPLEX),1)
  34. C1=cblat1
  35. endif
  36. ifeq ($(BUILD_COMPLEX16),1)
  37. Z1=zblat1
  38. endif
  39. level1: $(S1) $(D1) $(C1) $(Z1)
  40. ifneq ($(CROSS), 1)
  41. ifeq ($(BUILD_SINGLE),1)
  42. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./sblat1
  43. endif
  44. ifeq ($(BUILD_DOUBLE),1)
  45. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./dblat1
  46. endif
  47. ifeq ($(BUILD_COMPLEX),1)
  48. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./cblat1
  49. endif
  50. ifeq ($(BUILD_COMPLEX16),1)
  51. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./zblat1
  52. endif
  53. ifdef SMP
  54. ifeq ($(USE_OPENMP), 1)
  55. ifeq ($(BUILD_SINGLE),1)
  56. OMP_NUM_THREADS=2 ./sblat1
  57. endif
  58. ifeq ($(BUILD_DOUBLE),1)
  59. OMP_NUM_THREADS=2 ./dblat1
  60. endif
  61. ifeq ($(BUILD_COMPLEX),1)
  62. OMP_NUM_THREADS=2 ./cblat1
  63. endif
  64. ifeq ($(BUILD_COMPLEX16),1)
  65. OMP_NUM_THREADS=2 ./zblat1
  66. endif
  67. else
  68. ifeq ($(BUILD_SINGLE),1)
  69. OPENBLAS_NUM_THREADS=2 ./sblat1
  70. endif
  71. ifeq ($(BUILD_DOUBLE),1)
  72. OPENBLAS_NUM_THREADS=2 ./dblat1
  73. endif
  74. ifeq ($(BUILD_COMPLEX),1)
  75. OPENBLAS_NUM_THREADS=2 ./cblat1
  76. endif
  77. ifeq ($(BUILD_COMPLEX16),1)
  78. OPENBLAS_NUM_THREADS=2 ./zblat1
  79. endif
  80. endif
  81. endif
  82. endif
  83. ifeq ($(BUILD_SINGLE),1)
  84. S2=sblat2
  85. endif
  86. ifeq ($(BUILD_DOUBLE),1)
  87. D2=dblat2
  88. endif
  89. ifeq ($(BUILD_COMPLEX),1)
  90. C2=cblat2
  91. endif
  92. ifeq ($(BUILD_COMPLEX16),1)
  93. Z2=zblat2
  94. endif
  95. level2: $(S2) $(D2) $(C2) $(Z2)
  96. ifneq ($(CROSS), 1)
  97. rm -f ?BLAT2.SUMM
  98. ifeq ($(BUILD_SINGLE),1)
  99. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./sblat2 < ./sblat2.dat
  100. @$(GREP) -q FATAL SBLAT2.SUMM && cat SBLAT2.SUMM || exit 0
  101. endif
  102. ifeq ($(BUILD_DOUBLE),1)
  103. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./dblat2 < ./dblat2.dat
  104. @$(GREP) -q FATAL DBLAT2.SUMM && cat DBLAT2.SUMM || exit 0
  105. endif
  106. ifeq ($(BUILD_COMPLEX),1)
  107. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./cblat2 < ./cblat2.dat
  108. @$(GREP) -q FATAL CBLAT2.SUMM && cat CBLAT2.SUMM || exit 0
  109. endif
  110. ifeq ($(BUILD_COMPLEX16),1)
  111. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./zblat2 < ./zblat2.dat
  112. @$(GREP) -q FATAL ZBLAT2.SUMM && cat ZBLAT2.SUMM || exit 0
  113. endif
  114. ifdef SMP
  115. rm -f ?BLAT2.SUMM
  116. ifeq ($(USE_OPENMP), 1)
  117. ifeq ($(BUILD_SINGLE),1)
  118. OMP_NUM_THREADS=2 ./sblat2 < ./sblat2.dat
  119. @$(GREP) -q FATAL SBLAT2.SUMM && cat SBLAT2.SUMM || exit 0
  120. endif
  121. ifeq ($(BUILD_DOUBLE),1)
  122. OMP_NUM_THREADS=2 ./dblat2 < ./dblat2.dat
  123. @$(GREP) -q FATAL DBLAT2.SUMM && cat DBLAT2.SUMM || exit 0
  124. endif
  125. ifeq ($(BUILD_COMPLEX),1)
  126. OMP_NUM_THREADS=2 ./cblat2 < ./cblat2.dat
  127. @$(GREP) -q FATAL CBLAT2.SUMM && cat CBLAT2.SUMM || exit 0
  128. endif
  129. ifeq ($(BUILD_COMPLEX16),1)
  130. OMP_NUM_THREADS=2 ./zblat2 < ./zblat2.dat
  131. @$(GREP) -q FATAL ZBLAT2.SUMM && cat ZBLAT2.SUMM || exit 0
  132. endif
  133. else
  134. ifeq ($(BUILD_SINGLE),1)
  135. OPENBLAS_NUM_THREADS=2 ./sblat2 < ./sblat2.dat
  136. @$(GREP) -q FATAL SBLAT2.SUMM && cat SBLAT2.SUMM || exit 0
  137. endif
  138. ifeq ($(BUILD_DOUBLE),1)
  139. OPENBLAS_NUM_THREADS=2 ./dblat2 < ./dblat2.dat
  140. @$(GREP) -q FATAL DBLAT2.SUMM && cat DBLAT2.SUMM || exit 0
  141. endif
  142. ifeq ($(BUILD_COMPLEX),1)
  143. OPENBLAS_NUM_THREADS=2 ./cblat2 < ./cblat2.dat
  144. @$(GREP) -q FATAL CBLAT2.SUMM && cat CBLAT2.SUMM || exit 0
  145. endif
  146. ifeq ($(BUILD_COMPLEX16),1)
  147. OPENBLAS_NUM_THREADS=2 ./zblat2 < ./zblat2.dat
  148. @$(GREP) -q FATAL ZBLAT2.SUMM && cat ZBLAT2.SUMM || exit 0
  149. endif
  150. endif
  151. endif
  152. endif
  153. ifeq ($(BUILD_BFLOAT16),1)
  154. B3= test_sbgemm
  155. endif
  156. ifeq ($(BUILD_SINGLE),1)
  157. S3=sblat3
  158. endif
  159. ifeq ($(BUILD_DOUBLE),1)
  160. D3=dblat3
  161. endif
  162. ifeq ($(BUILD_COMPLEX),1)
  163. ifeq ($(SUPPORT_GEMM3M),1)
  164. C3=cblat3 cblat3_3m
  165. else
  166. C3=cblat3
  167. endif
  168. endif
  169. ifeq ($(BUILD_COMPLEX16),1)
  170. ifeq ($(SUPPORT_GEMM3M),1)
  171. Z3=zblat3 zblat3_3m
  172. else
  173. Z3=zblat3
  174. endif
  175. endif
  176. level3: $(B3) $(S3) $(D3) $(C3) $(Z3)
  177. ifneq ($(CROSS), 1)
  178. rm -f ?BLAT3.SUMM
  179. ifeq ($(BUILD_BFLOAT16),1)
  180. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./test_sbgemm > SBBLAT3.SUMM
  181. @$(GREP) -q FATAL SBBLAT3.SUMM && cat SBBLAT3.SUMM || exit 0
  182. endif
  183. ifeq ($(BUILD_SINGLE),1)
  184. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./sblat3 < ./sblat3.dat
  185. @$(GREP) -q FATAL SBLAT3.SUMM && cat SBLAT3.SUMM || exit 0
  186. endif
  187. ifeq ($(BUILD_DOUBLE),1)
  188. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./dblat3 < ./dblat3.dat
  189. @$(GREP) -q FATAL DBLAT3.SUMM && cat DBLAT3.SUMM || exit 0
  190. endif
  191. ifeq ($(BUILD_COMPLEX),1)
  192. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./cblat3 < ./cblat3.dat
  193. @$(GREP) -q FATAL CBLAT3.SUMM && cat CBLAT3.SUMM || exit 0
  194. endif
  195. ifeq ($(BUILD_COMPLEX16),1)
  196. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./zblat3 < ./zblat3.dat
  197. @$(GREP) -q FATAL ZBLAT3.SUMM && cat ZBLAT3.SUMM || exit 0
  198. endif
  199. ifdef SMP
  200. rm -f ?BLAT3.SUMM
  201. ifeq ($(USE_OPENMP), 1)
  202. ifeq ($(BUILD_BFLOAT16),1)
  203. OMP_NUM_THREADS=2 ./test_sbgemm > SBBLAT3.SUMM
  204. @$(GREP) -q FATAL SBBLAT3.SUMM && cat SBBLAT3.SUMM || exit 0
  205. endif
  206. ifeq ($(BUILD_SINGLE),1)
  207. OMP_NUM_THREADS=2 ./sblat3 < ./sblat3.dat
  208. @$(GREP) -q FATAL SBLAT3.SUMM && cat SBLAT3.SUMM || exit 0
  209. endif
  210. ifeq ($(BUILD_DOUBLE),1)
  211. OMP_NUM_THREADS=2 ./dblat3 < ./dblat3.dat
  212. @$(GREP) -q FATAL DBLAT3.SUMM && cat DBLAT3.SUMM || exit 0
  213. endif
  214. ifeq ($(BUILD_COMPLEX),1)
  215. OMP_NUM_THREADS=2 ./cblat3 < ./cblat3.dat
  216. @$(GREP) -q FATAL CBLAT3.SUMM && cat CBLAT3.SUMM || exit 0
  217. endif
  218. ifeq ($(BUILD_COMPLEX16),1)
  219. OMP_NUM_THREADS=2 ./zblat3 < ./zblat3.dat
  220. @$(GREP) -q FATAL ZBLAT3.SUMM && cat ZBLAT3.SUMM || exit 0
  221. endif
  222. else
  223. ifeq ($(BUILD_BFLOAT16),1)
  224. OPENBLAS_NUM_THREADS=2 ./test_sbgemm > SBBLAT3.SUMM
  225. @$(GREP) -q FATAL SBBLAT3.SUMM && cat SBBLAT3.SUMM || exit 0
  226. endif
  227. ifeq ($(BUILD_SINGLE),1)
  228. OPENBLAS_NUM_THREADS=2 ./sblat3 < ./sblat3.dat
  229. @$(GREP) -q FATAL SBLAT3.SUMM && cat SBLAT3.SUMM || exit 0
  230. endif
  231. ifeq ($(BUILD_DOUBLE),1)
  232. OPENBLAS_NUM_THREADS=2 ./dblat3 < ./dblat3.dat
  233. @$(GREP) -q FATAL DBLAT3.SUMM && cat DBLAT3.SUMM || exit 0
  234. endif
  235. ifeq ($(BUILD_COMPLEX),1)
  236. OPENBLAS_NUM_THREADS=2 ./cblat3 < ./cblat3.dat
  237. @$(GREP) -q FATAL CBLAT3.SUMM && cat CBLAT3.SUMM || exit 0
  238. endif
  239. ifeq ($(BUILD_COMPLEX16),1)
  240. OPENBLAS_NUM_THREADS=2 ./zblat3 < ./zblat3.dat
  241. @$(GREP) -q FATAL ZBLAT3.SUMM && cat ZBLAT3.SUMM || exit 0
  242. endif
  243. endif
  244. endif
  245. endif
  246. level3_3m : zblat3_3m cblat3_3m
  247. ifneq ($(CROSS), 1)
  248. rm -f ?BLAT3_3M.SUMM
  249. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./cblat3_3m < ./cblat3_3m.dat
  250. @$(GREP) -q FATAL CBLAT3_3M.SUMM && cat CBLAT3_3M.SUMM || exit 0
  251. OPENBLAS_NUM_THREADS=1 OMP_NUM_THREADS=1 ./zblat3_3m < ./zblat3_3m.dat
  252. @$(GREP) -q FATAL ZBLAT3_3M.SUMM && cat ZBLAT3_3M.SUMM || exit 0
  253. ifdef SMP
  254. rm -f ?BLAT3_3M.SUMM
  255. ifeq ($(USE_OPENMP), 1)
  256. OMP_NUM_THREADS=2 ./cblat3_3m < ./cblat3_3m.dat
  257. @$(GREP) -q FATAL CBLAT3_3M.SUMM && cat CBLAT3_3M.SUMM || exit 0
  258. OMP_NUM_THREADS=2 ./zblat3_3m < ./zblat3_3m.dat
  259. @$(GREP) -q FATAL ZBLAT3_3M.SUMM && cat ZBLAT3_3M.SUMM || exit 0
  260. else
  261. OPENBLAS_NUM_THREADS=2 ./cblat3_3m < ./cblat3_3m.dat
  262. @$(GREP) -q FATAL CBLAT3_3M.SUMM && cat CBLAT3_3M.SUMM || exit 0
  263. OPENBLAS_NUM_THREADS=2 ./zblat3_3m < ./zblat3_3m.dat
  264. @$(GREP) -q FATAL ZBLAT3_3M.SUMM && cat ZBLAT3_3M.SUMM || exit 0
  265. endif
  266. endif
  267. endif
  268. FLDFLAGS = $(FFLAGS:-fPIC=) $(LDFLAGS)
  269. CLDFLAGS = $(CFLAGS) $(LDFLAGS)
  270. ifeq ($(USE_OPENMP), 1)
  271. ifeq ($(F_COMPILER), GFORTRAN)
  272. ifeq ($(C_COMPILER), CLANG)
  273. CEXTRALIB += -lomp
  274. endif
  275. endif
  276. ifeq ($(F_COMPILER), NAG)
  277. CEXTRALIB = -lgomp
  278. endif
  279. ifeq ($(F_COMPILER), IBM)
  280. ifeq ($(C_COMPILER), GCC)
  281. CEXTRALIB += -lgomp
  282. endif
  283. ifeq ($(C_COMPILER), CLANG)
  284. CEXTRALIB += -lomp
  285. endif
  286. endif
  287. endif
  288. ifeq ($(BUILD_SINGLE),1)
  289. sblat1 : sblat1.$(SUFFIX) ../$(LIBNAME)
  290. $(FC) $(FLDFLAGS) -o sblat1 sblat1.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  291. sblat2 : sblat2.$(SUFFIX) ../$(LIBNAME)
  292. $(FC) $(FLDFLAGS) -o sblat2 sblat2.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  293. sblat3 : sblat3.$(SUFFIX) ../$(LIBNAME)
  294. $(FC) $(FLDFLAGS) -o sblat3 sblat3.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  295. endif
  296. ifeq ($(BUILD_DOUBLE),1)
  297. dblat1 : dblat1.$(SUFFIX) ../$(LIBNAME)
  298. $(FC) $(FLDFLAGS) -o dblat1 dblat1.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  299. dblat2 : dblat2.$(SUFFIX) ../$(LIBNAME)
  300. $(FC) $(FLDFLAGS) -o dblat2 dblat2.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  301. dblat3 : dblat3.$(SUFFIX) ../$(LIBNAME)
  302. $(FC) $(FLDFLAGS) -o dblat3 dblat3.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  303. else
  304. dblat2:
  305. dblat3:
  306. endif
  307. qblat1 : qblat1.$(SUFFIX) ../$(LIBNAME)
  308. $(FC) $(FLDFLAGS) -o qblat1 qblat1.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  309. ifeq ($(BUILD_COMPLEX),1)
  310. cblat1 : cblat1.$(SUFFIX) ../$(LIBNAME)
  311. $(FC) $(FLDFLAGS) -o cblat1 cblat1.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  312. cblat2 : cblat2.$(SUFFIX) ../$(LIBNAME)
  313. $(FC) $(FLDFLAGS) -o cblat2 cblat2.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  314. cblat3 : cblat3.$(SUFFIX) ../$(LIBNAME)
  315. $(FC) $(FLDFLAGS) -o cblat3 cblat3.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  316. endif
  317. ifeq ($(BUILD_COMPLEX16),1)
  318. zblat1 : zblat1.$(SUFFIX) ../$(LIBNAME)
  319. $(FC) $(FLDFLAGS) -o zblat1 zblat1.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  320. zblat2 : zblat2.$(SUFFIX) ../$(LIBNAME)
  321. $(FC) $(FLDFLAGS) -o zblat2 zblat2.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  322. zblat3 : zblat3.$(SUFFIX) ../$(LIBNAME)
  323. $(FC) $(FLDFLAGS) -o zblat3 zblat3.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  324. endif
  325. ifeq ($(BUILD_BFLOAT16),1)
  326. test_sbgemm : compare_sgemm_sbgemm.c ../$(LIBNAME)
  327. $(CC) $(CLDFLAGS) -o test_sbgemm compare_sgemm_sbgemm.c ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  328. endif
  329. ifeq ($(BUILD_COMPLEX),1)
  330. cblat3_3m : cblat3_3m.$(SUFFIX) ../$(LIBNAME)
  331. $(FC) $(FLDFLAGS) -o cblat3_3m cblat3_3m.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  332. endif
  333. ifeq ($(BUILD_COMPLEX16),1)
  334. zblat3_3m : zblat3_3m.$(SUFFIX) ../$(LIBNAME)
  335. $(FC) $(FLDFLAGS) -o zblat3_3m zblat3_3m.$(SUFFIX) ../$(LIBNAME) $(EXTRALIB) $(CEXTRALIB)
  336. endif
  337. clean:
  338. @rm -f *.$(SUFFIX) *.$(PSUFFIX) gmon.$(SUFFIX)ut *.SUMM *.cxml *.exe *.pdb *.dwf \
  339. sblat1 dblat1 cblat1 zblat1 \
  340. sblat2 dblat2 cblat2 zblat2 \
  341. test_sbgemm sblat3 dblat3 cblat3 zblat3 \
  342. sblat1p dblat1p cblat1p zblat1p \
  343. sblat2p dblat2p cblat2p zblat2p \
  344. sblat3p dblat3p cblat3p zblat3p \
  345. zblat3_3m zblat3_3mp \
  346. cblat3_3m cblat3_3mp \
  347. *.stackdump *.dll
  348. libs:
  349. prof:
  350. quick :
  351. $(MAKE) -C $(TOPDIR) libs
  352. # include ../Makefile.tail