You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

system.cmake 12 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527
  1. ##
  2. ## Author: Hank Anderson <hank@statease.com>
  3. ## Description: Ported from OpenBLAS/Makefile.system
  4. ##
  5. set(NETLIB_LAPACK_DIR "${CMAKE_SOURCE_DIR}/lapack-netlib")
  6. # TODO: Makefile.system detects Darwin (mac) and switches to clang here -hpa
  7. # http://stackoverflow.com/questions/714100/os-detecting-makefile
  8. # TODO: Makefile.system sets HOSTCC = $(CC) here if not already set -hpa
  9. # TARGET_CORE will override TARGET which is used in DYNAMIC_ARCH=1.
  10. if (DEFINED TARGET_CORE)
  11. set(TARGET ${TARGET_CORE})
  12. endif ()
  13. # Force fallbacks for 32bit
  14. if (DEFINED BINARY AND DEFINED TARGET AND BINARY EQUAL 32)
  15. message(STATUS "Compiling a ${BINARY}-bit binary.")
  16. set(NO_AVX 1)
  17. if (${TARGET} STREQUAL "HASWELL" OR ${TARGET} STREQUAL "SANDYBRIDGE")
  18. set(TARGET "NEHALEM")
  19. endif ()
  20. if (${TARGET} STREQUAL "BULLDOZER" OR ${TARGET} STREQUAL "PILEDRIVER")
  21. set(TARGET "BARCELONA")
  22. endif ()
  23. endif ()
  24. if (DEFINED TARGET)
  25. message(STATUS "Targetting the ${TARGET} architecture.")
  26. set(GETARCH_FLAGS "-DFORCE_${TARGET}")
  27. endif ()
  28. if (INTERFACE64)
  29. message(STATUS "Using 64-bit integers.")
  30. set(GETARCH_FLAGS "${GETARCH_FLAGS} -DUSE64BITINT")
  31. endif ()
  32. if (NOT DEFINED GEMM_MULTITHREAD_THRESHOLD)
  33. set(GEMM_MULTITHREAD_THRESHOLD 4)
  34. endif ()
  35. message(STATUS "GEMM multithread threshold set to ${GEMM_MULTITHREAD_THRESHOLD}.")
  36. set(GETARCH_FLAGS "${GETARCH_FLAGS} -DGEMM_MULTITHREAD_THRESHOLD=${GEMM_MULTITHREAD_THRESHOLD}")
  37. if (NO_AVX)
  38. message(STATUS "Disabling Advanced Vector Extensions (AVX).")
  39. set(GETARCH_FLAGS "${GETARCH_FLAGS} -DNO_AVX")
  40. endif ()
  41. if (NO_AVX2)
  42. message(STATUS "Disabling Advanced Vector Extensions 2 (AVX2).")
  43. set(GETARCH_FLAGS "${GETARCH_FLAGS} -DNO_AVX2")
  44. endif ()
  45. if (CMAKE_BUILD_TYPE STREQUAL Debug)
  46. set(GETARCH_FLAGS "${GETARCH_FLAGS} -g")
  47. endif ()
  48. # TODO: let CMake handle this? -hpa
  49. #if (${QUIET_MAKE})
  50. # set(MAKE "${MAKE} -s")
  51. #endif()
  52. if (NOT DEFINED NO_PARALLEL_MAKE)
  53. set(NO_PARALLEL_MAKE 0)
  54. endif ()
  55. set(GETARCH_FLAGS "${GETARCH_FLAGS} -DNO_PARALLEL_MAKE=${NO_PARALLEL_MAKE}")
  56. if (CMAKE_CXX_COMPILER STREQUAL loongcc)
  57. set(GETARCH_FLAGS "${GETARCH_FLAGS} -static")
  58. endif ()
  59. #if don't use Fortran, it will only compile CBLAS.
  60. if (ONLY_CBLAS)
  61. set(NO_LAPACK 1)
  62. else ()
  63. set(ONLY_CBLAS 0)
  64. endif ()
  65. include("${CMAKE_SOURCE_DIR}/cmake/prebuild.cmake")
  66. if (NOT DEFINED NUM_THREADS)
  67. set(NUM_THREADS ${NUM_CORES})
  68. endif ()
  69. if (${NUM_THREADS} EQUAL 1)
  70. set(USE_THREAD 0)
  71. endif ()
  72. if (DEFINED USE_THREAD)
  73. if (NOT ${USE_THREAD})
  74. unset(SMP)
  75. else ()
  76. set(SMP 1)
  77. endif ()
  78. else ()
  79. # N.B. this is NUM_THREAD in Makefile.system which is probably a bug -hpa
  80. if (${NUM_THREADS} EQUAL 1)
  81. unset(SMP)
  82. else ()
  83. set(SMP 1)
  84. endif ()
  85. endif ()
  86. if (${SMP})
  87. message(STATUS "SMP enabled.")
  88. endif ()
  89. if (NOT DEFINED NEED_PIC)
  90. set(NEED_PIC 1)
  91. endif ()
  92. # TODO: I think CMake should be handling all this stuff -hpa
  93. unset(ARFLAGS)
  94. set(CPP "${COMPILER} -E")
  95. set(AR "${CROSS_SUFFIX}ar")
  96. set(AS "${CROSS_SUFFIX}as")
  97. set(LD "${CROSS_SUFFIX}ld")
  98. set(RANLIB "${CROSS_SUFFIX}ranlib")
  99. set(NM "${CROSS_SUFFIX}nm")
  100. set(DLLWRAP "${CROSS_SUFFIX}dllwrap")
  101. set(OBJCOPY "${CROSS_SUFFIX}objcopy")
  102. set(OBJCONV "${CROSS_SUFFIX}objconv")
  103. # OS dependent settings
  104. include("${CMAKE_SOURCE_DIR}/cmake/os.cmake")
  105. # Architecture dependent settings
  106. include("${CMAKE_SOURCE_DIR}/cmake/arch.cmake")
  107. # C Compiler dependent settings
  108. include("${CMAKE_SOURCE_DIR}/cmake/cc.cmake")
  109. if (NOT NOFORTRAN)
  110. # Fortran Compiler dependent settings
  111. include("${CMAKE_SOURCE_DIR}/cmake/fc.cmake")
  112. endif ()
  113. if (BINARY64)
  114. if (INTERFACE64)
  115. # CCOMMON_OPT += -DUSE64BITINT
  116. endif ()
  117. endif ()
  118. if (NEED_PIC)
  119. if (${CMAKE_C_COMPILER} STREQUAL "IBM")
  120. set(CCOMMON_OPT "${CCOMMON_OPT} -qpic=large")
  121. else ()
  122. set(CCOMMON_OPT "${CCOMMON_OPT} -fPIC")
  123. endif ()
  124. if (${F_COMPILER} STREQUAL "SUN")
  125. set(FCOMMON_OPT "${FCOMMON_OPT} -pic")
  126. else ()
  127. set(FCOMMON_OPT "${FCOMMON_OPT} -fPIC")
  128. endif ()
  129. endif ()
  130. if (DYNAMIC_ARCH)
  131. set(CCOMMON_OPT "${CCOMMON_OPT} -DDYNAMIC_ARCH")
  132. endif ()
  133. if (NO_LAPACK)
  134. set(CCOMMON_OPT "${CCOMMON_OPT} -DNO_LAPACK")
  135. #Disable LAPACK C interface
  136. set(NO_LAPACKE 1)
  137. endif ()
  138. if (NO_LAPACKE)
  139. set(CCOMMON_OPT "${CCOMMON_OPT} -DNO_LAPACKE")
  140. endif ()
  141. if (NO_AVX)
  142. set(CCOMMON_OPT "${CCOMMON_OPT} -DNO_AVX")
  143. endif ()
  144. if (${ARCH} STREQUAL "x86")
  145. set(CCOMMON_OPT "${CCOMMON_OPT} -DNO_AVX")
  146. endif ()
  147. if (NO_AVX2)
  148. set(CCOMMON_OPT "${CCOMMON_OPT} -DNO_AVX2")
  149. endif ()
  150. if (SMP)
  151. set(CCOMMON_OPT "${CCOMMON_OPT} -DSMP_SERVER")
  152. if (${ARCH} STREQUAL "mips64")
  153. if (NOT ${CORE} STREQUAL "LOONGSON3B")
  154. set(USE_SIMPLE_THREADED_LEVEL3 1)
  155. endif ()
  156. endif ()
  157. if (USE_OPENMP)
  158. # USE_SIMPLE_THREADED_LEVEL3 = 1
  159. # NO_AFFINITY = 1
  160. set(CCOMMON_OPT "${CCOMMON_OPT} -DUSE_OPENMP")
  161. endif ()
  162. if (BIGNUMA)
  163. set(CCOMMON_OPT "${CCOMMON_OPT} -DBIGNUMA")
  164. endif ()
  165. endif ()
  166. if (NO_WARMUP)
  167. set(CCOMMON_OPT "${CCOMMON_OPT} -DNO_WARMUP")
  168. endif ()
  169. if (CONSISTENT_FPCSR)
  170. set(CCOMMON_OPT "${CCOMMON_OPT} -DCONSISTENT_FPCSR")
  171. endif ()
  172. # Only for development
  173. # set(CCOMMON_OPT "${CCOMMON_OPT} -DPARAMTEST")
  174. # set(CCOMMON_OPT "${CCOMMON_OPT} -DPREFETCHTEST")
  175. # set(CCOMMON_OPT "${CCOMMON_OPT} -DNO_SWITCHING")
  176. # set(USE_PAPI 1)
  177. if (USE_PAPI)
  178. set(CCOMMON_OPT "${CCOMMON_OPT} -DUSE_PAPI")
  179. set(EXTRALIB "${EXTRALIB} -lpapi -lperfctr")
  180. endif ()
  181. if (DYNAMIC_THREADS)
  182. set(CCOMMON_OPT "${CCOMMON_OPT} -DDYNAMIC_THREADS")
  183. endif ()
  184. set(CCOMMON_OPT "${CCOMMON_OPT} -DMAX_CPU_NUMBER=${NUM_THREADS}")
  185. if (USE_SIMPLE_THREADED_LEVEL3)
  186. set(CCOMMON_OPT "${CCOMMON_OPT} -DUSE_SIMPLE_THREADED_LEVEL3")
  187. endif ()
  188. if (DEFINED LIBNAMESUFFIX)
  189. set(LIBPREFIX "libopenblas_${LIBNAMESUFFIX}")
  190. else ()
  191. set(LIBPREFIX "libopenblas")
  192. endif ()
  193. if (NOT DEFINED SYMBOLPREFIX)
  194. set(SYMBOLPREFIX "")
  195. endif ()
  196. if (NOT DEFINED SYMBOLSUFFIX)
  197. set(SYMBOLSUFFIX "")
  198. endif ()
  199. set(KERNELDIR "${CMAKE_SOURCE_DIR}/kernel/${ARCH}")
  200. # TODO: nead to convert these Makefiles
  201. # include ${CMAKE_SOURCE_DIR}/cmake/${ARCH}.cmake
  202. if (${CORE} STREQUAL "PPC440")
  203. set(CCOMMON_OPT "${CCOMMON_OPT} -DALLOC_QALLOC")
  204. endif ()
  205. if (${CORE} STREQUAL "PPC440FP2")
  206. set(STATIC_ALLOCATION 1)
  207. endif ()
  208. if (NOT ${CMAKE_SYSTEM_NAME} STREQUAL "Linux")
  209. set(NO_AFFINITY 1)
  210. endif ()
  211. if (NOT ${ARCH} STREQUAL "x86_64" AND NOT ${ARCH} STREQUAL "x86" AND NOT ${CORE} STREQUAL "LOONGSON3B")
  212. set(NO_AFFINITY 1)
  213. endif ()
  214. if (NO_AFFINITY)
  215. set(CCOMMON_OPT "${CCOMMON_OPT} -DNO_AFFINITY")
  216. endif ()
  217. if (FUNCTION_PROFILE)
  218. set(CCOMMON_OPT "${CCOMMON_OPT} -DFUNCTION_PROFILE")
  219. endif ()
  220. if (HUGETLB_ALLOCATION)
  221. set(CCOMMON_OPT "${CCOMMON_OPT} -DALLOC_HUGETLB")
  222. endif ()
  223. if (DEFINED HUGETLBFILE_ALLOCATION)
  224. set(CCOMMON_OPT "${CCOMMON_OPT} -DALLOC_HUGETLBFILE -DHUGETLB_FILE_NAME=${HUGETLBFILE_ALLOCATION})")
  225. endif ()
  226. if (STATIC_ALLOCATION)
  227. set(CCOMMON_OPT "${CCOMMON_OPT} -DALLOC_STATIC")
  228. endif ()
  229. if (DEVICEDRIVER_ALLOCATION)
  230. set(CCOMMON_OPT "${CCOMMON_OPT} -DALLOC_DEVICEDRIVER -DDEVICEDRIVER_NAME=\"/dev/mapper\"")
  231. endif ()
  232. if (MIXED_MEMORY_ALLOCATION)
  233. set(CCOMMON_OPT "${CCOMMON_OPT} -DMIXED_MEMORY_ALLOCATION")
  234. endif ()
  235. if (${CMAKE_SYSTEM_NAME} STREQUAL "SunOS")
  236. set(TAR gtar)
  237. set(PATCH gpatch)
  238. set(GREP ggrep)
  239. else ()
  240. set(TAR tar)
  241. set(PATCH patch)
  242. set(GREP grep)
  243. endif ()
  244. if (NOT DEFINED MD5SUM)
  245. set(MD5SUM md5sum)
  246. endif ()
  247. set(AWK awk)
  248. set(REVISION "-r${OpenBLAS_VERSION}")
  249. set(MAJOR_VERSION ${OpenBLAS_MAJOR_VERSION})
  250. if (DEBUG)
  251. set(COMMON_OPT "${COMMON_OPT} -g")
  252. endif ()
  253. if (NOT DEFINED COMMON_OPT)
  254. set(COMMON_OPT "-O2")
  255. endif ()
  256. set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} ${COMMON_OPT} ${CCOMMON_OPT}")
  257. # TODO: not sure what PFLAGS is -hpa
  258. set(PFLAGS "${PFLAGS} ${COMMON_OPT} ${CCOMMON_OPT} -I${TOPDIR} -DPROFILE ${COMMON_PROF}")
  259. set(CMAKE_Fortran_FLAGS "${CMAKE_Fortran_FLAGS} ${COMMON_OPT} ${FCOMMON_OPT}")
  260. # TODO: not sure what FPFLAGS is -hpa
  261. set(FPFLAGS "${FPFLAGS} ${COMMON_OPT} ${FCOMMON_OPT} ${COMMON_PROF}")
  262. #For LAPACK Fortran codes.
  263. set(LAPACK_FFLAGS "${LAPACK_FFLAGS} ${CMAKE_Fortran_FLAGS}")
  264. set(LAPACK_FPFLAGS "${LAPACK_FPFLAGS} ${FPFLAGS}")
  265. #Disable -fopenmp for LAPACK Fortran codes on Windows.
  266. if (${CMAKE_SYSTEM_NAME} STREQUAL "Windows")
  267. set(FILTER_FLAGS "-fopenmp;-mp;-openmp;-xopenmp=parralel")
  268. foreach (FILTER_FLAG ${FILTER_FLAGS})
  269. string(REPLACE ${FILTER_FLAG} "" LAPACK_FFLAGS ${LAPACK_FFLAGS})
  270. string(REPLACE ${FILTER_FLAG} "" LAPACK_FPFLAGS ${LAPACK_FPFLAGS})
  271. endforeach ()
  272. endif ()
  273. if ("${F_COMPILER}" STREQUAL "GFORTRAN")
  274. # lapack-netlib is rife with uninitialized warnings -hpa
  275. set(LAPACK_FFLAGS "${LAPACK_FFLAGS} -Wno-maybe-uninitialized")
  276. endif ()
  277. set(LAPACK_CFLAGS "${CMAKE_C_CFLAGS} -DHAVE_LAPACK_CONFIG_H")
  278. if (INTERFACE64)
  279. set(LAPACK_CFLAGS "${LAPACK_CFLAGS} -DLAPACK_ILP64")
  280. endif ()
  281. if (${CMAKE_SYSTEM_NAME} STREQUAL "Windows")
  282. set(LAPACK_CFLAGS "${LAPACK_CFLAGS} -DOPENBLAS_OS_WINDOWS")
  283. endif ()
  284. if (${CMAKE_C_COMPILER} STREQUAL "LSB" OR ${CMAKE_SYSTEM_NAME} STREQUAL "Windows")
  285. set(LAPACK_CFLAGS "${LAPACK_CFLAGS} -DLAPACK_COMPLEX_STRUCTURE")
  286. endif ()
  287. if (NOT DEFINED SUFFIX)
  288. set(SUFFIX o)
  289. endif ()
  290. if (NOT DEFINED PSUFFIX)
  291. set(PSUFFIX po)
  292. endif ()
  293. if (NOT DEFINED LIBSUFFIX)
  294. set(LIBSUFFIX a)
  295. endif ()
  296. if (DYNAMIC_ARCH)
  297. if (DEFINED SMP)
  298. set(LIBNAME "${LIBPREFIX}p${REVISION}.${LIBSUFFIX}")
  299. set(LIBNAME_P "${LIBPREFIX}p${REVISION}_p.${LIBSUFFIX}")
  300. else ()
  301. set(LIBNAME "${LIBPREFIX}${REVISION}.${LIBSUFFIX}")
  302. set(LIBNAME_P "${LIBPREFIX}${REVISION}_p.${LIBSUFFIX}")
  303. endif ()
  304. else ()
  305. if (DEFINED SMP)
  306. set(LIBNAME "${LIBPREFIX}_${LIBCORE}p${REVISION}.${LIBSUFFIX}")
  307. set(LIBNAME_P "${LIBPREFIX}_${LIBCORE}p${REVISION}_p.${LIBSUFFIX}")
  308. else ()
  309. set(LIBNAME "${LIBPREFIX}_${LIBCORE}${REVISION}.${LIBSUFFIX}")
  310. set(LIBNAME_P "${LIBPREFIX}_${LIBCORE}${REVISION}_p.${LIBSUFFIX}")
  311. endif ()
  312. endif ()
  313. set(LIBDLLNAME "${LIBPREFIX}.dll")
  314. set(LIBSONAME "${LIBNAME}.${LIBSUFFIX}.so")
  315. set(LIBDYNNAME "${LIBNAME}.${LIBSUFFIX}.dylib")
  316. set(LIBDEFNAME "${LIBNAME}.${LIBSUFFIX}.def")
  317. set(LIBEXPNAME "${LIBNAME}.${LIBSUFFIX}.exp")
  318. set(LIBZIPNAME "${LIBNAME}.${LIBSUFFIX}.zip")
  319. set(LIBS "${CMAKE_SOURCE_DIR}/${LIBNAME}")
  320. set(LIBS_P "${CMAKE_SOURCE_DIR}/${LIBNAME_P}")
  321. set(LIB_COMPONENTS BLAS)
  322. if (NOT NO_CBLAS)
  323. set(LIB_COMPONENTS "${LIB_COMPONENTS} CBLAS")
  324. endif ()
  325. if (NOT NO_LAPACK)
  326. set(LIB_COMPONENTS "${LIB_COMPONENTS} LAPACK")
  327. if (NOT NO_LAPACKE)
  328. set(LIB_COMPONENTS "${LIB_COMPONENTS} LAPACKE")
  329. endif ()
  330. endif ()
  331. if (ONLY_CBLAS)
  332. set(LIB_COMPONENTS CBLAS)
  333. endif ()
  334. #export OSNAME
  335. #export ARCH
  336. #export CORE
  337. #export LIBCORE
  338. #export PGCPATH
  339. #export CONFIG
  340. #export CC
  341. #export FC
  342. #export BU
  343. #export FU
  344. #export NEED2UNDERSCORES
  345. #export USE_THREAD
  346. #export NUM_THREADS
  347. #export NUM_CORES
  348. #export SMP
  349. #export MAKEFILE_RULE
  350. #export NEED_PIC
  351. #export BINARY
  352. #export BINARY32
  353. #export BINARY64
  354. #export F_COMPILER
  355. #export C_COMPILER
  356. #export USE_OPENMP
  357. #export CROSS
  358. #export CROSS_SUFFIX
  359. #export NOFORTRAN
  360. #export NO_FBLAS
  361. #export EXTRALIB
  362. #export CEXTRALIB
  363. #export FEXTRALIB
  364. #export HAVE_SSE
  365. #export HAVE_SSE2
  366. #export HAVE_SSE3
  367. #export HAVE_SSSE3
  368. #export HAVE_SSE4_1
  369. #export HAVE_SSE4_2
  370. #export HAVE_SSE4A
  371. #export HAVE_SSE5
  372. #export HAVE_AVX
  373. #export HAVE_VFP
  374. #export HAVE_VFPV3
  375. #export HAVE_VFPV4
  376. #export HAVE_NEON
  377. #export KERNELDIR
  378. #export FUNCTION_PROFILE
  379. #export TARGET_CORE
  380. #
  381. #export SGEMM_UNROLL_M
  382. #export SGEMM_UNROLL_N
  383. #export DGEMM_UNROLL_M
  384. #export DGEMM_UNROLL_N
  385. #export QGEMM_UNROLL_M
  386. #export QGEMM_UNROLL_N
  387. #export CGEMM_UNROLL_M
  388. #export CGEMM_UNROLL_N
  389. #export ZGEMM_UNROLL_M
  390. #export ZGEMM_UNROLL_N
  391. #export XGEMM_UNROLL_M
  392. #export XGEMM_UNROLL_N
  393. #export CGEMM3M_UNROLL_M
  394. #export CGEMM3M_UNROLL_N
  395. #export ZGEMM3M_UNROLL_M
  396. #export ZGEMM3M_UNROLL_N
  397. #export XGEMM3M_UNROLL_M
  398. #export XGEMM3M_UNROLL_N
  399. #if (USE_CUDA)
  400. # export CUDADIR
  401. # export CUCC
  402. # export CUFLAGS
  403. # export CULIB
  404. #endif
  405. #.SUFFIXES: .$(PSUFFIX) .$(SUFFIX) .f
  406. #
  407. #.f.$(SUFFIX):
  408. # $(FC) $(FFLAGS) -c $< -o $(@F)
  409. #
  410. #.f.$(PSUFFIX):
  411. # $(FC) $(FPFLAGS) -pg -c $< -o $(@F)
  412. # these are not cross-platform
  413. #ifdef BINARY64
  414. #PATHSCALEPATH = /opt/pathscale/lib/3.1
  415. #PGIPATH = /opt/pgi/linux86-64/7.1-5/lib
  416. #else
  417. #PATHSCALEPATH = /opt/pathscale/lib/3.1/32
  418. #PGIPATH = /opt/pgi/linux86/7.1-5/lib
  419. #endif
  420. #ACMLPATH = /opt/acml/4.3.0
  421. #ifneq ($(OSNAME), Darwin)
  422. #MKLPATH = /opt/intel/mkl/10.2.2.025/lib
  423. #else
  424. #MKLPATH = /Library/Frameworks/Intel_MKL.framework/Versions/10.0.1.014/lib
  425. #endif
  426. #ATLASPATH = /opt/atlas/3.9.17/opteron
  427. #FLAMEPATH = $(HOME)/flame/lib
  428. #ifneq ($(OSNAME), SunOS)
  429. #SUNPATH = /opt/sunstudio12.1
  430. #else
  431. #SUNPATH = /opt/SUNWspro
  432. #endif