You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

system.cmake 24 kB

2 years ago
12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813
  1. ##
  2. ## Author: Hank Anderson <hank@statease.com>
  3. ## Description: Ported from OpenBLAS/Makefile.system
  4. ##
  # Location of the bundled netlib LAPACK sources.
  set(NETLIB_LAPACK_DIR "${PROJECT_SOURCE_DIR}/lapack-netlib")

  # System detection, via CMake.
  include("${PROJECT_SOURCE_DIR}/cmake/system_check.cmake")

  # When cross compiling without an explicit TARGET, choose one from the
  # ARM64/ARM switches instead of running getarch; anything else is fatal.
  if(CMAKE_CROSSCOMPILING)
    if(NOT DEFINED TARGET)
      if(ARM64)
        set(TARGET "ARMV8")
      elseif(ARM)
        # TODO: Ask compiler which arch this is
        set(TARGET "ARMV7")
      else()
        message(FATAL_ERROR "When cross compiling, a TARGET is required.")
      endif()
    endif()
  endif()
  # TARGET is the input name; other files read CORE (which later becomes
  # TARGET_CORE for the kernel build). Default CORE to TARGET when only
  # TARGET was provided.
  if(DEFINED TARGET)
    if(NOT DEFINED CORE)
      set(CORE ${TARGET})
    endif()
  endif()

  # TARGET_CORE (used with DYNAMIC_ARCH=1) overrides TARGET.
  if(DEFINED TARGET_CORE)
    set(TARGET ${TARGET_CORE})
  endif()
  # Force fallbacks for 32bit: disable AVX and remap the targets listed below
  # to the fallback target named in each branch.
  #
  # TARGET is quoted in every test so that a defined-but-empty TARGET
  # (e.g. -DTARGET=) simply matches nothing instead of producing a malformed
  # if() expression. The checks stay sequential, as in the original, so each
  # one sees the value written by the previous one.
  if(DEFINED BINARY AND DEFINED TARGET AND BINARY EQUAL 32)
    message(STATUS "Compiling a ${BINARY}-bit binary.")
    set(NO_AVX 1)
    if("${TARGET}" MATCHES "^(HASWELL|SANDYBRIDGE|SKYLAKEX|COOPERLAKE|SAPPHIRERAPIDS)$")
      set(TARGET "NEHALEM")
    endif()
    if("${TARGET}" MATCHES "^(BULLDOZER|PILEDRIVER|ZEN)$")
      set(TARGET "BARCELONA")
    endif()
    if("${TARGET}" MATCHES "^(ARMV8|CORTEXA57|CORTEXA53|CORTEXA55)$")
      set(TARGET "ARMV7")
    endif()
    if("${TARGET}" MATCHES "^(POWER8|POWER9|POWER10)$")
      set(TARGET "POWER6")
    endif()
  endif()
  # Report the selected target and start GETARCH_FLAGS with the matching
  # -DFORCE_<target> define (this overwrites any earlier GETARCH_FLAGS value).
  if(DEFINED TARGET)
    message(STATUS "-- -- -- -- -- -- -- -- -- -- -- -- --")
    message(STATUS "Targeting the ${TARGET} architecture.")
    set(GETARCH_FLAGS "-DFORCE_${TARGET}")
  endif()
  # On x86_64 build getarch with march=native. This is required to detect
  # AVX512 support in getarch. PGI and NVHPC compilers are excluded.
  # The compiler id is quoted so an empty id cannot break the expression.
  if(X86_64 AND NOT ("${CMAKE_C_COMPILER_ID}" STREQUAL "PGI" OR "${CMAKE_C_COMPILER_ID}" STREQUAL "NVHPC"))
    string(APPEND GETARCH_FLAGS " -march=native")
  endif()

  # 32-bit x86 builds get no AVX/AVX2/AVX512: either BINARY=32 was requested
  # or the toolchain's pointer size is 4 bytes.
  # Fix: the pointer-size operand used to be the literal text
  # "$CMAKE_SIZEOF_VOID_P}" (missing "{"), which is never numeric, so that
  # half of the condition could never be true.
  if(X86 OR X86_64)
    if((DEFINED BINARY AND BINARY EQUAL 32) OR ("${CMAKE_SIZEOF_VOID_P}" EQUAL "4"))
      string(APPEND GETARCH_FLAGS " -DNO_AVX -DNO_AVX2 -DNO_AVX512")
    endif()
  endif()
  # INTERFACE64 adds -DUSE64BITINT to the getarch flags.
  if(INTERFACE64)
    message(STATUS "Using 64-bit integers.")
    string(APPEND GETARCH_FLAGS " -DUSE64BITINT")
  endif()

  # GEMM_MULTITHREAD_THRESHOLD defaults to 4 and is always passed to getarch.
  if(NOT DEFINED GEMM_MULTITHREAD_THRESHOLD)
    set(GEMM_MULTITHREAD_THRESHOLD 4)
  endif()
  message(STATUS "GEMM multithread threshold set to ${GEMM_MULTITHREAD_THRESHOLD}.")
  string(APPEND GETARCH_FLAGS " -DGEMM_MULTITHREAD_THRESHOLD=${GEMM_MULTITHREAD_THRESHOLD}")
  # Forward each enabled NO_AVX* switch to getarch as the matching -D define.
  if(NO_AVX)
    message(STATUS "Disabling Advanced Vector Extensions (AVX).")
    string(APPEND GETARCH_FLAGS " -DNO_AVX")
  endif()

  if(NO_AVX2)
    message(STATUS "Disabling Advanced Vector Extensions 2 (AVX2).")
    string(APPEND GETARCH_FLAGS " -DNO_AVX2")
  endif()

  if(NO_AVX512)
    message(STATUS "Disabling Advanced Vector Extensions 512 (AVX512).")
    string(APPEND GETARCH_FLAGS " -DNO_AVX512")
  endif()
  # Debug builds also pass the C debug flags to getarch.
  if(CMAKE_BUILD_TYPE STREQUAL "Debug")
    string(APPEND GETARCH_FLAGS " ${CMAKE_C_FLAGS_DEBUG}")
  endif()

  # NO_PARALLEL_MAKE defaults to 0 and is always forwarded to getarch.
  if(NOT DEFINED NO_PARALLEL_MAKE)
    set(NO_PARALLEL_MAKE 0)
  endif()
  string(APPEND GETARCH_FLAGS " -DNO_PARALLEL_MAKE=${NO_PARALLEL_MAKE}")

  # getarch gets -static when CMAKE_C_COMPILER is exactly "loongcc".
  if(CMAKE_C_COMPILER STREQUAL loongcc)
    string(APPEND GETARCH_FLAGS " -static")
  endif()
  # POWER: disable warmup and tell getarch about the assembler via HAVE_GAS.
  if(POWER)
    set(NO_WARMUP 1)
    # HAVE_GAS is 0 for GNU and Clang assemblers and 1 for everything else.
    # NOTE(review): presumably this mirrors a shell exit status taken from
    # Makefile.system (0 meaning "GNU as found") - confirm before changing.
    if(CMAKE_ASM_COMPILER_ID STREQUAL "GNU")
      set(HAVE_GAS 0)
    elseif(CMAKE_ASM_COMPILER_ID STREQUAL "Clang")
      string(APPEND CCOMMON_OPT " -fno-integrated-as")
      set(HAVE_GAS 0)
    else()
      set(HAVE_GAS 1)
    endif()
    string(APPEND GETARCH_FLAGS " -DHAVE_GAS=${HAVE_GAS}")
  endif()
  # Without Fortran only CBLAS is compiled: ONLY_CBLAS turns LAPACK off,
  # otherwise ONLY_CBLAS is normalised to 0.
  if(NOT ONLY_CBLAS)
    set(ONLY_CBLAS 0)
  else()
    set(NO_LAPACK 1)
  endif()
  # N.B. this is NUM_THREAD in Makefile.system which is probably a bug -hpa
  # Native builds query the processor count unless NUM_CORES was given.
  if(NOT CMAKE_CROSSCOMPILING AND NOT DEFINED NUM_CORES)
    include(ProcessorCount)
    ProcessorCount(NUM_CORES)
  endif()

  if(NOT DEFINED NUM_PARALLEL)
    set(NUM_PARALLEL 1)
  endif()

  # NUM_THREADS defaults to NUM_CORES when that is known and non-zero, else 0.
  if(NOT DEFINED NUM_THREADS)
    set(NUM_THREADS 0)
    if(DEFINED NUM_CORES AND NOT NUM_CORES EQUAL 0)
      # HT?
      set(NUM_THREADS ${NUM_CORES})
    endif()
  endif()
  # Fewer than two threads forces USE_THREAD off; otherwise it defaults to on
  # unless the caller already chose a value.
  if(${NUM_THREADS} LESS 2)
    set(USE_THREAD 0)
  elseif(NOT DEFINED USE_THREAD)
    set(USE_THREAD 1)
  endif()

  # Single-threaded builds may still request locking via USE_LOCKING.
  if(NOT USE_THREAD)
    if(${USE_LOCKING})
      string(APPEND CCOMMON_OPT " -DUSE_LOCKING")
    endif()
  else()
    message(STATUS "Multi-threading enabled with ${NUM_THREADS} threads.")
  endif()

  include("${PROJECT_SOURCE_DIR}/cmake/prebuild.cmake")
  138. if (DEFINED TARGET)
  # COOPERLAKE kernels: use -march=cooperlake when the compiler is new enough,
  # otherwise fall back to -march=skylake-avx512. Skipped when NO_AVX512 is set.
  if("${TARGET}" STREQUAL "COOPERLAKE" AND NOT NO_AVX512)
    if("${CMAKE_C_COMPILER_ID}" STREQUAL "GNU")
      # Kept for its side effect of populating GCC_VERSION; the decision below
      # is based on CMAKE_C_COMPILER_VERSION.
      execute_process(COMMAND ${CMAKE_C_COMPILER} -dumpversion OUTPUT_VARIABLE GCC_VERSION)
      # Fix: version components are compared as integers, so the former
      # "VERSION_GREATER 10.09" meant "> 10.9" and rejected every GCC 10.x.
      # The check is now "at least 10.1".
      if(NOT "${CMAKE_C_COMPILER_VERSION}" VERSION_LESS 10.1)
        string(APPEND KERNEL_DEFINITIONS " -march=cooperlake")
      else()
        string(APPEND KERNEL_DEFINITIONS " -march=skylake-avx512")
      endif()
    elseif("${CMAKE_C_COMPILER_ID}" STREQUAL "Clang" OR "${CMAKE_C_COMPILER_ID}" STREQUAL "AppleClang")
      # "> 8.99" accepts Clang 9.0 and newer.
      if("${CMAKE_C_COMPILER_VERSION}" VERSION_GREATER 8.99)
        string(APPEND KERNEL_DEFINITIONS " -march=cooperlake -exhaustive-register-search")
      else()
        string(APPEND KERNEL_DEFINITIONS " -march=skylake-avx512 -exhaustive-register-search")
      endif()
    endif()
  endif()
  # SAPPHIRERAPIDS kernels: -march=sapphirerapids for GCC above 11.0 or
  # Clang/AppleClang above 12.0, otherwise -march=skylake-avx512. The Clang
  # family additionally gets -exhaustive-register-search.
  if(${TARGET} STREQUAL SAPPHIRERAPIDS AND NOT NO_AVX512)
    if(${CMAKE_C_COMPILER_ID} STREQUAL "GNU")
      execute_process(COMMAND ${CMAKE_C_COMPILER} -dumpversion OUTPUT_VARIABLE GCC_VERSION)
      if(${CMAKE_C_COMPILER_VERSION} VERSION_GREATER 11.0)
        string(APPEND KERNEL_DEFINITIONS " -march=sapphirerapids")
      else()
        string(APPEND KERNEL_DEFINITIONS " -march=skylake-avx512")
      endif()
    elseif(${CMAKE_C_COMPILER_ID} STREQUAL "Clang" OR ${CMAKE_C_COMPILER_ID} STREQUAL "AppleClang")
      if(${CMAKE_C_COMPILER_VERSION} VERSION_GREATER 12.0)
        string(APPEND KERNEL_DEFINITIONS " -march=sapphirerapids -exhaustive-register-search")
      else()
        string(APPEND KERNEL_DEFINITIONS " -march=skylake-avx512 -exhaustive-register-search")
      endif()
    endif()
  endif()
  # SKYLAKEX kernels always get -march=skylake-avx512 (unless NO_AVX512);
  # Clang and AppleClang also get -exhaustive-register-search.
  if(${TARGET} STREQUAL SKYLAKEX AND NOT NO_AVX512)
    string(APPEND KERNEL_DEFINITIONS " -march=skylake-avx512")
    if(${CMAKE_C_COMPILER_ID} STREQUAL "Clang" OR ${CMAKE_C_COMPILER_ID} STREQUAL "AppleClang")
      string(APPEND KERNEL_DEFINITIONS " -exhaustive-register-search")
    endif()
  endif()
  # ZEN with AVX512VL: -march=znver4 for GCC above 12.99 or Clang/AppleClang
  # above 15.99, otherwise -march=skylake-avx512. The Clang family also gets
  # -exhaustive-register-search in both cases.
  if(((${TARGET} STREQUAL ZEN) AND HAVE_AVX512VL) AND NOT NO_AVX512)
    if(${CMAKE_C_COMPILER_ID} STREQUAL "GNU")
      execute_process(COMMAND ${CMAKE_C_COMPILER} -dumpversion OUTPUT_VARIABLE GCC_VERSION)
      if(${CMAKE_C_COMPILER_VERSION} VERSION_GREATER 12.99)
        string(APPEND KERNEL_DEFINITIONS " -march=znver4")
      else()
        string(APPEND KERNEL_DEFINITIONS " -march=skylake-avx512")
      endif()
    elseif(${CMAKE_C_COMPILER_ID} STREQUAL "Clang" OR ${CMAKE_C_COMPILER_ID} STREQUAL "AppleClang")
      if(${CMAKE_C_COMPILER_VERSION} VERSION_GREATER 15.99)
        string(APPEND KERNEL_DEFINITIONS " -march=znver4 -exhaustive-register-search")
      else()
        string(APPEND KERNEL_DEFINITIONS " -march=skylake-avx512 -exhaustive-register-search")
      endif()
    endif()
  endif()
  # HASWELL, and ZEN without AVX512VL, build their kernels with AVX2 unless
  # NO_AVX2 is set.
  if(("${TARGET}" STREQUAL "HASWELL" OR ("${TARGET}" STREQUAL "ZEN" AND NOT HAVE_AVX512VL)) AND NOT NO_AVX2)
    if("${CMAKE_C_COMPILER_ID}" STREQUAL "GNU")
      execute_process(COMMAND ${CMAKE_C_COMPILER} -dumpversion OUTPUT_VARIABLE GCC_VERSION)
      # -mavx2 is only passed to GCC 4.7 or newer. Quoting keeps the test
      # well-formed if -dumpversion produced no output.
      if(NOT "${GCC_VERSION}" VERSION_LESS 4.7)
        string(APPEND KERNEL_DEFINITIONS " -mavx2")
      endif()
    elseif("${CMAKE_C_COMPILER_ID}" STREQUAL "Clang" OR "${CMAKE_C_COMPILER_ID}" STREQUAL "AppleClang")
      # Fix: CMake reports the ids "Clang" / "AppleClang"; the former
      # comparison against all-caps "CLANG" is case-sensitive and could never
      # match, so this branch was dead.
      string(APPEND KERNEL_DEFINITIONS " -mavx2 -mfma")
    endif()
  endif()
  # Add one -m<ext> kernel flag per HAVE_* variable that is defined.
  # AVX and AVX2 additionally honour their NO_* opt-outs.
  if(DEFINED HAVE_AVX AND NOT NO_AVX)
    string(APPEND KERNEL_DEFINITIONS " -mavx")
  endif()

  if(DEFINED HAVE_AVX2 AND NOT NO_AVX2)
    string(APPEND KERNEL_DEFINITIONS " -mavx2")
  endif()

  # if (DEFINED HAVE_FMA3)
  # if (NOT NO_AVX2)
  # set (KERNEL_DEFINITIONS "${KERNEL_DEFINITIONS} -mfma")
  # endif()
  # endif()

  if(DEFINED HAVE_SSE)
    string(APPEND KERNEL_DEFINITIONS " -msse")
  endif()

  if(DEFINED HAVE_SSE2)
    string(APPEND KERNEL_DEFINITIONS " -msse2")
  endif()

  if(DEFINED HAVE_SSE3)
    string(APPEND KERNEL_DEFINITIONS " -msse3")
  endif()

  if(DEFINED HAVE_SSSE3)
    string(APPEND KERNEL_DEFINITIONS " -mssse3")
  endif()

  if(DEFINED HAVE_SSE4_1)
    string(APPEND KERNEL_DEFINITIONS " -msse4.1")
  endif()
  # POWER10 requires a compiler reporting version 10.2 or newer; older ones abort.
  if(${TARGET} STREQUAL POWER10)
    execute_process(COMMAND ${CMAKE_C_COMPILER} -dumpversion OUTPUT_VARIABLE GCC_VERSION)
    if(NOT ${GCC_VERSION} VERSION_LESS 10.2)
      string(APPEND KERNEL_DEFINITIONS " -mcpu=power10 -mtune=power10 -mvsx -fno-fast-math")
    else()
      message(FATAL_ERROR "Compiler GCC.${GCC_VERSION} does not support Power10.")
    endif()
  endif()

  # POWER9 falls back to POWER8 code generation (with a warning) below 5.0.
  if(${TARGET} STREQUAL POWER9)
    execute_process(COMMAND ${CMAKE_C_COMPILER} -dumpversion OUTPUT_VARIABLE GCC_VERSION)
    if(NOT ${GCC_VERSION} VERSION_LESS 5.0)
      string(APPEND KERNEL_DEFINITIONS " -mcpu=power9 -mtune=power9 -mvsx -fno-fast-math")
    else()
      string(APPEND KERNEL_DEFINITIONS " -mcpu=power8 -mtune=power8 -mvsx -fno-fast-math")
      message(WARNING "Compiler GCC.${GCC_VERSION} does not support fully Power9.")
    endif()
  endif()

  if(${TARGET} STREQUAL POWER8)
    string(APPEND KERNEL_DEFINITIONS " -mcpu=power8 -mtune=power8 -mvsx -fno-fast-math")
  endif()
  # NEOVERSEV1: PGI with SVE enabled uses its own intrinsics switch; every
  # other compiler must report version 10.4 or newer, else configuration aborts.
  if(${TARGET} STREQUAL NEOVERSEV1)
    if(NOT (${CMAKE_C_COMPILER_ID} STREQUAL "PGI" AND NOT NO_SVE))
      execute_process(COMMAND ${CMAKE_C_COMPILER} -dumpversion OUTPUT_VARIABLE GCC_VERSION)
      if(NOT ${GCC_VERSION} VERSION_LESS 10.4)
        string(APPEND KERNEL_DEFINITIONS " -march=armv8.4-a+sve -mtune=neoverse-v1")
      else()
        message(FATAL_ERROR "Compiler ${CMAKE_C_COMPILER} ${GCC_VERSION} does not support Neoverse V1.")
      endif()
    else()
      string(APPEND KERNEL_DEFINITIONS " -Msve_intrinsics -march=armv8.4-a+sve -mtune=neoverse-v1")
    endif()
  endif()
  # NEOVERSEN2: PGI with SVE enabled uses its own intrinsics switch; every
  # other compiler must report version 10.4 or newer, else configuration aborts.
  if(${TARGET} STREQUAL NEOVERSEN2)
    if(${CMAKE_C_COMPILER_ID} STREQUAL "PGI" AND NOT NO_SVE)
      string(APPEND KERNEL_DEFINITIONS " -Msve-intrinsics -march=armv8.5-a+sve+sve2+bf16 -mtune=neoverse-n2")
    else()
      execute_process(COMMAND ${CMAKE_C_COMPILER} -dumpversion OUTPUT_VARIABLE GCC_VERSION)
      if(${GCC_VERSION} VERSION_GREATER 10.4 OR ${GCC_VERSION} VERSION_EQUAL 10.4)
        string(APPEND KERNEL_DEFINITIONS " -march=armv8.5-a+sve+sve2+bf16 -mtune=neoverse-n2")
      else()
        # Fix: the message used "$${CMAKE_C_COMPILER} {GCC_VERSION}" (misplaced
        # "$"), so the detected version was never substituted into the text.
        message(FATAL_ERROR "Compiler ${CMAKE_C_COMPILER} ${GCC_VERSION} does not support Neoverse N2.")
      endif()
    endif()
  endif()
  # ARMV8SVE: always -march=armv8.2-a+sve, preceded by -Msve-intrinsics for
  # PGI when SVE is not disabled.
  if(${TARGET} STREQUAL ARMV8SVE)
    if(${CMAKE_C_COMPILER_ID} STREQUAL "PGI" AND NOT NO_SVE)
      string(APPEND KERNEL_DEFINITIONS " -Msve-intrinsics")
    endif()
    string(APPEND KERNEL_DEFINITIONS " -march=armv8.2-a+sve")
  endif()
  285. endif()
  # Report the requested word size, if any.
  if(DEFINED BINARY)
    message(STATUS "Compiling a ${BINARY}-bit binary.")
  endif()

  # Position-independent code is on by default.
  if(NOT DEFINED NEED_PIC)
    set(NEED_PIC 1)
  endif()

  # OS dependent settings
  include("${PROJECT_SOURCE_DIR}/cmake/os.cmake")

  # Architecture dependent settings
  include("${PROJECT_SOURCE_DIR}/cmake/arch.cmake")

  # C Compiler dependent settings
  include("${PROJECT_SOURCE_DIR}/cmake/cc.cmake")

  # Symbol suffixes used when the 64-bit integer interface is enabled.
  if(INTERFACE64)
    set(SUFFIX64 64)
    set(SUFFIX64_UNDERSCORE _64)
  endif()
  # With Fortran available, load the Fortran compiler settings. Without it,
  # switch to the C LAPACK configuration.
  if(NOFORTRAN)
    # NOTE(review): XXXX is not set anywhere in this file, so the else()
    # branch looks unreachable unless a caller defines it - confirm.
    if(NOT XXXX)
      set(C_LAPACK 1)
      if(INTERFACE64)
        string(APPEND CCOMMON_OPT " -DLAPACK_ILP64")
      endif()
      set(TIMER "NONE")
    else()
      set(NO_LAPACK 1)
    endif()
  else()
    # Fortran Compiler dependent settings
    include("${PROJECT_SOURCE_DIR}/cmake/fc.cmake")
  endif()

  # Intentionally empty: the Makefile equivalent is kept only as a comment.
  if(BINARY64)
    if(INTERFACE64)
      # CCOMMON_OPT += -DUSE64BITINT
    endif()
  endif()
  # EMBEDDED builds define OS_EMBEDDED and use fixed Cortex-M4 code generation flags.
  if(EMBEDDED)
    string(APPEND CCOMMON_OPT " -DOS_EMBEDDED")
    string(APPEND CCOMMON_OPT " -mthumb -mcpu=cortex-m4 -mfloat-abi=hard -mfpu=fpv4-sp-d16")
  endif()

  # Position-independent code flags for C and, when Fortran is in use, Fortran.
  if(NEED_PIC)
    if(NOT ${CMAKE_C_COMPILER} STREQUAL "IBM")
      string(APPEND CCOMMON_OPT " -fPIC")
    else()
      string(APPEND CCOMMON_OPT " -qpic=large")
    endif()

    if(NOT NOFORTRAN)
      if(NOT ${F_COMPILER} STREQUAL "SUN")
        string(APPEND FCOMMON_OPT " -fPIC")
      else()
        string(APPEND FCOMMON_OPT " -pic")
      endif()
    endif()
  endif()
  # Small-matrix optimisation is switched on for x86_64 and for the POWER10
  # core; any truthy SMALL_MATRIX_OPT then adds the define.
  if(X86_64 OR ${CORE} STREQUAL POWER10)
    set(SMALL_MATRIX_OPT TRUE)
  endif()

  if(SMALL_MATRIX_OPT)
    string(APPEND CCOMMON_OPT " -DSMALL_MATRIX_OPT")
  endif()
  # DYNAMIC_ARCH is honoured only on X86, X86_64, ARM64 and POWER; elsewhere
  # it is dropped with a status message.
  if(DYNAMIC_ARCH)
    if(NOT (X86 OR X86_64 OR ARM64 OR POWER))
      unset(DYNAMIC_ARCH)
      message(STATUS "DYNAMIC_ARCH is not supported on the target architecture, removing")
    else()
      string(APPEND CCOMMON_OPT " -DDYNAMIC_ARCH")
      if(DYNAMIC_OLDER)
        string(APPEND CCOMMON_OPT " -DDYNAMIC_OLDER")
      endif()
    endif()
  endif()

  # Each entry of DYNAMIC_LIST becomes its own -DDYN_<core> define.
  if(DYNAMIC_LIST)
    string(APPEND CCOMMON_OPT " -DDYNAMIC_LIST")
    foreach(DCORE ${DYNAMIC_LIST})
      string(APPEND CCOMMON_OPT " -DDYN_${DCORE}")
    endforeach()
  endif()
  # Disabling LAPACK also disables the LAPACK C interface (LAPACKE).
  if(NO_LAPACK)
    string(APPEND CCOMMON_OPT " -DNO_LAPACK")
    set(NO_LAPACKE 1)
  endif()

  if(NO_LAPACKE)
    string(APPEND CCOMMON_OPT " -DNO_LAPACKE")
  endif()

  # -DNO_AVX is added for an explicit NO_AVX and, independently, for X86.
  if(NO_AVX)
    string(APPEND CCOMMON_OPT " -DNO_AVX")
  endif()

  if(X86)
    string(APPEND CCOMMON_OPT " -DNO_AVX")
  endif()

  if(NO_AVX2)
    string(APPEND CCOMMON_OPT " -DNO_AVX2")
  endif()

  if(NO_AVX512)
    string(APPEND CCOMMON_OPT " -DNO_AVX512")
  endif()
  # Threaded builds define SMP_SERVER. On MIPS64, every core except LOONGSON3B
  # also uses the simple threaded level-3 implementation.
  if(USE_THREAD)
    # USE_SIMPLE_THREADED_LEVEL3 = 1
    # NO_AFFINITY = 1
    string(APPEND CCOMMON_OPT " -DSMP_SERVER")

    if(MIPS64)
      if(NOT ${CORE} STREQUAL "LOONGSON3B")
        set(USE_SIMPLE_THREADED_LEVEL3 1)
      endif()
    endif()

    if(BIGNUMA)
      string(APPEND CCOMMON_OPT " -DBIGNUMA")
    endif()
  endif()
  # Switches that map one-to-one onto a -D<name> define, in this order.
  foreach(simple_switch NO_WARMUP CONSISTENT_FPCSR USE_TLS)
    if(${simple_switch})
      string(APPEND CCOMMON_OPT " -D${simple_switch}")
    endif()
  endforeach()

  # Only for development
  # set(CCOMMON_OPT "${CCOMMON_OPT} -DPARAMTEST")
  # set(CCOMMON_OPT "${CCOMMON_OPT} -DPREFETCHTEST")
  # set(CCOMMON_OPT "${CCOMMON_OPT} -DNO_SWITCHING")
  # set(USE_PAPI 1)

  # PAPI support needs its define plus two extra link libraries.
  if(USE_PAPI)
    string(APPEND CCOMMON_OPT " -DUSE_PAPI")
    string(APPEND EXTRALIB " -lpapi -lperfctr")
  endif()

  if(DYNAMIC_THREADS)
    string(APPEND CCOMMON_OPT " -DDYNAMIC_THREADS")
  endif()
  # Thread and parallelism limits are always passed to the C sources.
  string(APPEND CCOMMON_OPT " -DMAX_CPU_NUMBER=${NUM_THREADS}")
  string(APPEND CCOMMON_OPT " -DMAX_PARALLEL_NUMBER=${NUM_PARALLEL}")

  if(BUFFERSIZE)
    string(APPEND CCOMMON_OPT " -DBUFFERSIZE=${BUFFERSIZE}")
  endif()

  if(USE_SIMPLE_THREADED_LEVEL3)
    string(APPEND CCOMMON_OPT " -DUSE_SIMPLE_THREADED_LEVEL3")
  endif()
  # Neither define is emitted on Windows.
  if(NOT ${CMAKE_SYSTEM_NAME} STREQUAL "Windows")
    # MAX_STACK_ALLOC: 2048 by default; an explicit 0 suppresses the define.
    if(NOT DEFINED MAX_STACK_ALLOC)
      string(APPEND CCOMMON_OPT " -DMAX_STACK_ALLOC=2048")
    else()
      if(NOT ${MAX_STACK_ALLOC} EQUAL 0)
        string(APPEND CCOMMON_OPT " -DMAX_STACK_ALLOC=${MAX_STACK_ALLOC}")
      endif()
    endif()

    # BLAS3_MEM_ALLOC_THRESHOLD is forwarded only when set to something other than 32.
    if(DEFINED BLAS3_MEM_ALLOC_THRESHOLD)
      if(NOT ${BLAS3_MEM_ALLOC_THRESHOLD} EQUAL 32)
        string(APPEND CCOMMON_OPT " -DBLAS3_MEM_ALLOC_THRESHOLD=${BLAS3_MEM_ALLOC_THRESHOLD}")
      endif()
    endif()
  endif()
  # Base library name: "lib<LIBNAMEPREFIX>openblas", optionally followed by
  # "_<LIBNAMESUFFIX>".
  # Fix: the suffix branch used to rebuild the value from LIBNAMEPREFIX alone
  # ("<LIBNAMEPREFIX>_<LIBNAMESUFFIX>"), which dropped the "lib" and "openblas"
  # parts. The suffix is now appended to the base name.
  set(LIBPREFIX "lib${LIBNAMEPREFIX}openblas")
  if(DEFINED LIBNAMESUFFIX)
    string(APPEND LIBPREFIX "_${LIBNAMESUFFIX}")
  endif()

  # Symbol prefix/suffix default to empty strings.
  if(NOT DEFINED SYMBOLPREFIX)
    set(SYMBOLPREFIX "")
  endif()

  if(NOT DEFINED SYMBOLSUFFIX)
    set(SYMBOLSUFFIX "")
  endif()
  # Kernel sources live in a per-architecture directory.
  set(KERNELDIR "${PROJECT_SOURCE_DIR}/kernel/${ARCH}")

  # TODO: need to convert these Makefiles
  # include ${PROJECT_SOURCE_DIR}/cmake/${ARCH}.cmake

  if(${CORE} STREQUAL "PPC440")
    string(APPEND CCOMMON_OPT " -DALLOC_QALLOC")
  endif()

  if(${CORE} STREQUAL "PPC440FP2")
    set(STATIC_ALLOCATION 1)
  endif()

  # Affinity is disabled off Linux, and on anything that is neither x86/x86_64
  # nor the LOONGSON3B core.
  if(NOT ${CMAKE_SYSTEM_NAME} STREQUAL "Linux")
    set(NO_AFFINITY 1)
  endif()

  if(NOT (X86_64 OR X86 OR ${CORE} STREQUAL "LOONGSON3B"))
    set(NO_AFFINITY 1)
  endif()

  if(NO_AFFINITY)
    string(APPEND CCOMMON_OPT " -DNO_AFFINITY")
  endif()
  # Profiling and memory-allocation strategy switches, each mapped to its define.
  if(FUNCTION_PROFILE)
    string(APPEND CCOMMON_OPT " -DFUNCTION_PROFILE")
  endif()

  if(HUGETLB_ALLOCATION)
    string(APPEND CCOMMON_OPT " -DALLOC_HUGETLB")
  endif()

  # Fix: a stray ")" used to be appended after the value, so the define was
  # emitted as -DHUGETLB_FILE_NAME=<value>).
  if(DEFINED HUGETLBFILE_ALLOCATION)
    string(APPEND CCOMMON_OPT " -DALLOC_HUGETLBFILE -DHUGETLB_FILE_NAME=${HUGETLBFILE_ALLOCATION}")
  endif()

  if(STATIC_ALLOCATION)
    string(APPEND CCOMMON_OPT " -DALLOC_STATIC")
  endif()

  if(DEVICEDRIVER_ALLOCATION)
    string(APPEND CCOMMON_OPT " -DALLOC_DEVICEDRIVER -DDEVICEDRIVER_NAME=\"/dev/mapper\"")
  endif()

  if(MIXED_MEMORY_ALLOCATION)
    string(APPEND CCOMMON_OPT " -DMIXED_MEMORY_ALLOCATION")
  endif()
  # Embed the library version as a quoted string and publish the common
  # options through CMAKE_C_FLAGS.
  string(APPEND CCOMMON_OPT " -DVERSION=\"\\\"${OpenBLAS_VERSION}\\\"\"")
  set(REVISION "-r${OpenBLAS_VERSION}")
  set(MAJOR_VERSION ${OpenBLAS_MAJOR_VERSION})
  string(APPEND CMAKE_C_FLAGS " ${CCOMMON_OPT}")

  # When none of the four standard precisions was requested, build all of them.
  if(NOT (BUILD_SINGLE OR BUILD_DOUBLE OR BUILD_COMPLEX OR BUILD_COMPLEX16))
    set(BUILD_SINGLE ON)
    set(BUILD_DOUBLE ON)
    set(BUILD_COMPLEX ON)
    set(BUILD_COMPLEX16 ON)
  endif()

  # One -DBUILD_<precision> define per enabled precision, in this order.
  foreach(openblas_precision SINGLE DOUBLE COMPLEX COMPLEX16 BFLOAT16)
    if(BUILD_${openblas_precision})
      string(APPEND CMAKE_C_FLAGS " -DBUILD_${openblas_precision}")
    endif()
  endforeach()
  # The common options also go to the assembler, except under MSVC.
  if(NOT MSVC)
    string(APPEND CMAKE_ASM_FLAGS " ${CCOMMON_OPT}")
  endif()

  # TODO: not sure what PFLAGS is -hpa
  string(APPEND PFLAGS " ${CCOMMON_OPT} -I${TOPDIR} -DPROFILE ${COMMON_PROF}")

  string(APPEND CMAKE_Fortran_FLAGS " ${FCOMMON_OPT}")

  # TODO: not sure what FPFLAGS is -hpa
  string(APPEND FPFLAGS " ${FCOMMON_OPT} ${COMMON_PROF}")

  # For LAPACK Fortran codes.
  string(APPEND LAPACK_FFLAGS " ${CMAKE_Fortran_FLAGS}")
  string(APPEND LAPACK_FPFLAGS " ${FPFLAGS}")
  # Disable -fopenmp (and the equivalent spellings listed below) for LAPACK
  # Fortran codes on Windows.
  # The flag strings passed to string(REPLACE) are quoted so that an empty
  # value or one containing ";" is still handled as a single input argument.
  if("${CMAKE_SYSTEM_NAME}" STREQUAL "Windows")
    set(FILTER_FLAGS "-fopenmp;-mp;-openmp;-xopenmp=parallel")
    foreach(FILTER_FLAG ${FILTER_FLAGS})
      string(REPLACE "${FILTER_FLAG}" "" LAPACK_FFLAGS "${LAPACK_FFLAGS}")
      string(REPLACE "${FILTER_FLAG}" "" LAPACK_FPFLAGS "${LAPACK_FPFLAGS}")
    endforeach()
  endif()

  # NAG, CRAY and LLVMFlang Fortran compilers do not get the x86 SIMD flags;
  # LLVMFlang additionally loses -m32/-m64.
  if(CMAKE_Fortran_COMPILER)
    if("${F_COMPILER}" STREQUAL "NAG" OR "${F_COMPILER}" STREQUAL "CRAY" OR CMAKE_Fortran_COMPILER_ID MATCHES "LLVMFlang.*")
      # Fixes:
      #  * the last two entries were joined by "," instead of ";", forming one
      #    item that could never match;
      #  * -mavx2 is now removed before -mavx, because removing "-mavx" first
      #    turned every "-mavx2" into a stray "2".
      set(FILTER_FLAGS "-msse3;-mssse3;-msse4.1;-mavx2;-mavx;-mskylake-avx512")
      if(CMAKE_Fortran_COMPILER_ID MATCHES "LLVMFlang.*")
        message(STATUS "removing fortran flags")
        set(FILTER_FLAGS "${FILTER_FLAGS};-m32;-m64")
      endif()
      foreach(FILTER_FLAG ${FILTER_FLAGS})
        string(REPLACE "${FILTER_FLAG}" "" LAPACK_FFLAGS "${LAPACK_FFLAGS}")
        string(REPLACE "${FILTER_FLAG}" "" LAPACK_FPFLAGS "${LAPACK_FPFLAGS}")
      endforeach()
    endif()
  endif()
  if("${F_COMPILER}" STREQUAL "GFORTRAN")
    # lapack-netlib is rife with uninitialized warnings -hpa
    string(APPEND LAPACK_FFLAGS " -Wno-maybe-uninitialized")
  endif()

  # C flags for the LAPACK C sources.
  # Fix: the base value was read from CMAKE_C_CFLAGS, a misspelling of
  # CMAKE_C_FLAGS that always expanded to nothing.
  # NOTE(review): consumers that also receive CMAKE_C_FLAGS directly will now
  # see those options twice - presumably harmless, confirm.
  set(LAPACK_CFLAGS "${CMAKE_C_FLAGS} -DHAVE_LAPACK_CONFIG_H")

  if(INTERFACE64)
    string(APPEND LAPACK_CFLAGS " -DLAPACK_ILP64")
  endif()

  if(${CMAKE_SYSTEM_NAME} STREQUAL "Windows")
    string(APPEND LAPACK_CFLAGS " -DOPENBLAS_OS_WINDOWS")
  endif()

  if(${CMAKE_C_COMPILER} STREQUAL "LSB" OR ${CMAKE_SYSTEM_NAME} STREQUAL "Windows")
    string(APPEND LAPACK_CFLAGS " -DLAPACK_COMPLEX_STRUCTURE")
  endif()
  # Release builds with FLANG at version 3 or lower disable loop unrolling.
  if("${CMAKE_BUILD_TYPE}" STREQUAL "Release")
    if("${F_COMPILER}" STREQUAL "FLANG")
      if(${CMAKE_Fortran_COMPILER_VERSION} VERSION_LESS_EQUAL 3)
        string(APPEND CMAKE_Fortran_FLAGS_RELEASE " -fno-unroll-loops")
      endif()
    endif()
  endif()

  # Default file suffixes: objects, profiled objects and static libraries.
  if(NOT DEFINED SUFFIX)
    set(SUFFIX o)
  endif()

  if(NOT DEFINED PSUFFIX)
    set(PSUFFIX po)
  endif()

  if(NOT DEFINED LIBSUFFIX)
    set(LIBSUFFIX a)
  endif()
  # Compose LIBNAME / LIBNAME_P as
  #   <LIBPREFIX>[_<LIBCORE>][p]<REVISION>[_p].<LIBSUFFIX>
  # where "_<LIBCORE>" is omitted for DYNAMIC_ARCH builds, "p" marks threaded
  # builds and the trailing "_p" is only part of LIBNAME_P.
  if(DYNAMIC_ARCH)
    set(libname_stem "${LIBPREFIX}")
  else()
    set(libname_stem "${LIBPREFIX}_${LIBCORE}")
  endif()

  if(USE_THREAD)
    string(APPEND libname_stem "p")
  endif()

  set(LIBNAME "${libname_stem}${REVISION}.${LIBSUFFIX}")
  set(LIBNAME_P "${libname_stem}${REVISION}_p.${LIBSUFFIX}")
  unset(libname_stem)
  # FIXED_LIBNAME drops the core/revision decoration from both library names.
  # Fix: the second assignment used to overwrite LIBNAME with the "_p" name
  # and left LIBNAME_P untouched; it now sets LIBNAME_P.
  if(DEFINED FIXED_LIBNAME)
    set(LIBNAME "${LIBPREFIX}.${LIBSUFFIX}")
    set(LIBNAME_P "${LIBPREFIX}_p.${LIBSUFFIX}")
  endif()

  # File names derived from the library name.
  # NOTE(review): these append ".<LIBSUFFIX>.<ext>" to LIBNAME, which already
  # ends in ".<LIBSUFFIX>" - presumably the suffix was meant to be replaced
  # rather than repeated; confirm against Makefile.system.
  set(LIBDLLNAME "${LIBPREFIX}.dll")
  set(LIBSONAME "${LIBNAME}.${LIBSUFFIX}.so")
  set(LIBDYNNAME "${LIBNAME}.${LIBSUFFIX}.dylib")
  set(LIBDEFNAME "${LIBNAME}.${LIBSUFFIX}.def")
  set(LIBEXPNAME "${LIBNAME}.${LIBSUFFIX}.exp")
  set(LIBZIPNAME "${LIBNAME}.${LIBSUFFIX}.zip")

  set(LIBS "${PROJECT_SOURCE_DIR}/${LIBNAME}")
  set(LIBS_P "${PROJECT_SOURCE_DIR}/${LIBNAME_P}")
  # Space-separated list of the components contained in the library.
  set(LIB_COMPONENTS BLAS)

  if(NOT NO_CBLAS)
    string(APPEND LIB_COMPONENTS " CBLAS")
  endif()

  if(NOT NO_LAPACK)
    string(APPEND LIB_COMPONENTS " LAPACK")
    if(NOT NO_LAPACKE)
      string(APPEND LIB_COMPONENTS " LAPACKE")
    endif()
    if(BUILD_RELAPACK)
      string(APPEND LIB_COMPONENTS " ReLAPACK")
    endif()
  endif()

  # ONLY_CBLAS replaces everything collected above.
  if(ONLY_CBLAS)
    set(LIB_COMPONENTS CBLAS)
  endif()
  # For GEMM3M: off by default, on for X86, X86_64, ia64 and MIPS64, and
  # forced off again when CORE is "generic".
  set(USE_GEMM3M 0)

  if(DEFINED ARCH)
    if(X86 OR X86_64 OR ${ARCH} STREQUAL "ia64" OR MIPS64)
      set(USE_GEMM3M 1)
    endif()

    if(${CORE} STREQUAL "generic")
      set(USE_GEMM3M 0)
    endif()
  endif()
  628. #export OSNAME
  629. #export ARCH
  630. #export CORE
  631. #export LIBCORE
  632. #export PGCPATH
  633. #export CONFIG
  634. #export CC
  635. #export FC
  636. #export BU
  637. #export FU
  638. #export NEED2UNDERSCORES
  639. #export USE_THREAD
  640. #export NUM_THREADS
  641. #export NUM_CORES
  642. #export SMP
  643. #export MAKEFILE_RULE
  644. #export NEED_PIC
  645. #export BINARY
  646. #export BINARY32
  647. #export BINARY64
  648. #export F_COMPILER
  649. #export C_COMPILER
  650. #export USE_OPENMP
  651. #export CROSS
  652. #export CROSS_SUFFIX
  653. #export NOFORTRAN
  654. #export NO_FBLAS
  655. #export EXTRALIB
  656. #export CEXTRALIB
  657. #export FEXTRALIB
  658. #export HAVE_SSE
  659. #export HAVE_SSE2
  660. #export HAVE_SSE3
  661. #export HAVE_SSSE3
  662. #export HAVE_SSE4_1
  663. #export HAVE_SSE4_2
  664. #export HAVE_SSE4A
  665. #export HAVE_SSE5
  666. #export HAVE_AVX
  667. #export HAVE_VFP
  668. #export HAVE_VFPV3
  669. #export HAVE_VFPV4
  670. #export HAVE_NEON
  671. #export KERNELDIR
  672. #export FUNCTION_PROFILE
  673. #export TARGET_CORE
  674. #
  675. #export SBGEMM_UNROLL_M
  676. #export SBGEMM_UNROLL_N
  677. #export SGEMM_UNROLL_M
  678. #export SGEMM_UNROLL_N
  679. #export DGEMM_UNROLL_M
  680. #export DGEMM_UNROLL_N
  681. #export QGEMM_UNROLL_M
  682. #export QGEMM_UNROLL_N
  683. #export CGEMM_UNROLL_M
  684. #export CGEMM_UNROLL_N
  685. #export ZGEMM_UNROLL_M
  686. #export ZGEMM_UNROLL_N
  687. #export XGEMM_UNROLL_M
  688. #export XGEMM_UNROLL_N
  689. #export CGEMM3M_UNROLL_M
  690. #export CGEMM3M_UNROLL_N
  691. #export ZGEMM3M_UNROLL_M
  692. #export ZGEMM3M_UNROLL_N
  693. #export XGEMM3M_UNROLL_M
  694. #export XGEMM3M_UNROLL_N
  695. #if (USE_CUDA)
  696. # export CUDADIR
  697. # export CUCC
  698. # export CUFLAGS
  699. # export CULIB
  700. #endif