You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

CMakeLists.txt 12 kB

2 months ago
2 months ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288
  1. ###############################################################################
  2. # Copyright (c) 2025, The OpenBLAS Project
  3. # All rights reserved.
  4. # Redistribution and use in source and binary forms, with or without
  5. # modification, are permitted provided that the following conditions are
  6. # met:
  7. # 1. Redistributions of source code must retain the above copyright
  8. # notice, this list of conditions and the following disclaimer.
  9. # 2. Redistributions in binary form must reproduce the above copyright
  10. # notice, this list of conditions and the following disclaimer in
  11. # the documentation and/or other materials provided with the
  12. # distribution.
  13. # 3. Neither the name of the OpenBLAS project nor the names of
  14. # its contributors may be used to endorse or promote products
  15. # derived from this software without specific prior written permission.
  16. # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
  17. # AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  18. # IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  19. # ARE DISCLAIMED. IN NO EVENT SHALL THE OPENBLAS PROJECT OR CONTRIBUTORS BE
  20. # LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
  21. # CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
  22. # SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
  23. # INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
  24. # CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  25. # ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
  26. # POSSIBILITY OF SUCH DAMAGE.
  27. ###############################################################################
  28. include_directories(${PROJECT_SOURCE_DIR})
  29. include_directories(${PROJECT_BINARY_DIR})
  30. set(BLAS1_SOURCES
  31. copy.c
  32. nrm2.c
  33. )
  34. set(BLAS1_REAL_ONLY_SOURCES
  35. rotm.c rotmg.c # N.B. these do not have complex counterparts
  36. rot.c
  37. asum.c
  38. sum.c
  39. )
  40. # these will have 'z' prepended for the complex version
  41. set(BLAS1_MANGLED_SOURCES
  42. axpy.c swap.c
  43. scal.c
  44. dot.c
  45. rotg.c
  46. axpby.c
  47. )
  48. # TODO: USE_NETLIB_GEMV should switch gemv.c to netlib/*gemv.f
  49. # these all have 'z' sources for complex versions
  50. set(BLAS2_SOURCES
  51. gemv.c ger.c
  52. trsv.c trmv.c
  53. syr2.c gbmv.c
  54. sbmv.c spmv.c
  55. spr2.c
  56. tbsv.c tbmv.c
  57. tpsv.c tpmv.c
  58. )
  59. set(BLAS2_REAL_ONLY_SOURCES
  60. symv.c syr.c spr.c
  61. )
  62. set(BLAS2_COMPLEX_LAPACK_SOURCES
  63. symv.c syr.c spr.c
  64. )
  65. set(BLAS2_COMPLEX_ONLY_MANGLED_SOURCES
  66. hemv.c hbmv.c
  67. her.c her2.c
  68. hpmv.c hpr.c
  69. hpr2.c
  70. )
  71. # these do not have separate 'z' sources
  72. set(BLAS3_SOURCES
  73. gemm.c symm.c
  74. trsm.c syrk.c syr2k.c gemmt.c
  75. )
  76. set(BLAS3_MANGLED_SOURCES
  77. omatcopy.c imatcopy.c
  78. geadd.c
  79. )
  80. # generate the BLAS objs once with and once without cblas
  81. set (CBLAS_FLAGS "")
  82. if (NOT DEFINED NO_FBLAS)
  83. list(APPEND CBLAS_FLAGS 0)
  84. endif ()
  85. if (NOT DEFINED NO_CBLAS)
  86. list(APPEND CBLAS_FLAGS 1)
  87. endif ()
  88. foreach (CBLAS_FLAG ${CBLAS_FLAGS})
  89. # TODO: don't compile complex sources with cblas for now, the naming schemes are all different and they will have to be handled separately from SINGLE/DOUBLE
  90. set(DISABLE_COMPLEX 0)
  91. set(MANGLE_COMPLEX 3)
  92. if (CBLAS_FLAG EQUAL 1)
  93. # set(DISABLE_COMPLEX 1)
  94. # set(MANGLE_COMPLEX 1)
  95. endif ()
  96. GenerateNamedObjects("${BLAS1_SOURCES}" "" "" ${CBLAS_FLAG} "" "" false ${DISABLE_COMPLEX})
  97. GenerateNamedObjects("${BLAS1_REAL_ONLY_SOURCES}" "" "" ${CBLAS_FLAG} "" "" false 1)
  98. GenerateNamedObjects("${BLAS1_MANGLED_SOURCES}" "" "" ${CBLAS_FLAG} "" "" false ${MANGLE_COMPLEX})
  99. GenerateNamedObjects("${BLAS2_SOURCES}" "" "" ${CBLAS_FLAG} "" "" false ${MANGLE_COMPLEX})
  100. GenerateNamedObjects("${BLAS2_REAL_ONLY_SOURCES}" "" "" ${CBLAS_FLAG} "" "" false 1)
  101. if (NOT DEFINED NO_LAPACK)
  102. GenerateNamedObjects("${BLAS2_COMPLEX_LAPACK_SOURCES}" "" "" ${CBLAS_FLAG} "" "" false ${MANGLE_COMPLEX})
  103. endif ()
  104. GenerateNamedObjects("${BLAS2_COMPLEX_ONLY_MANGLED_SOURCES}" "" "" ${CBLAS_FLAG} "" "" false 4)
  105. GenerateNamedObjects("${BLAS3_SOURCES}" "" "" ${CBLAS_FLAG} "" "" false ${DISABLE_COMPLEX})
  106. GenerateNamedObjects("${BLAS3_MANGLED_SOURCES}" "" "" ${CBLAS_FLAG} "" "" false ${MANGLE_COMPLEX})
  107. GenerateNamedObjects("xerbla.c" "" "xerbla" ${CBLAS_FLAG} "" "" true)
  108. #sdsdot, dsdot
  109. if (BUILD_SINGLE OR BUILD_DOUBLE)
  110. GenerateNamedObjects("sdsdot.c" "" "sdsdot" ${CBLAS_FLAG} "" "" true "SINGLE")
  111. if(CBLAS_FLAG EQUAL 1)
  112. GenerateNamedObjects("gemm_batch.c" "" "gemm_batch" ${CBLAS_FLAG} "" "" false)
  113. endif ()
  114. endif ()
  115. if (BUILD_DOUBLE)
  116. GenerateNamedObjects("dsdot.c" "" "dsdot" ${CBLAS_FLAG} "" "" true "SINGLE")
  117. endif ()
  118. # trmm is trsm with a compiler flag set
  119. GenerateNamedObjects("trsm.c" "TRMM" "trmm" ${CBLAS_FLAG})
  120. # gemmtr is gemmt under the name adopted by the Reference BLAS
  121. GenerateNamedObjects("gemm.c" "RNAME" "gemmtr" ${CBLAS_FLAG})
  122. # max and imax are compiled 4 times
  123. GenerateNamedObjects("max.c" "" "" ${CBLAS_FLAG})
  124. GenerateNamedObjects("max.c" "USE_ABS" "amax" ${CBLAS_FLAG})
  125. GenerateNamedObjects("max.c" "USE_ABS;USE_MIN" "amin" ${CBLAS_FLAG})
  126. GenerateNamedObjects("max.c" "USE_MIN" "min" ${CBLAS_FLAG})
  127. GenerateNamedObjects("imax.c" "" "i*max" ${CBLAS_FLAG})
  128. GenerateNamedObjects("imax.c" "USE_ABS" "i*amax" ${CBLAS_FLAG})
  129. GenerateNamedObjects("imax.c" "USE_ABS;USE_MIN" "i*amin" ${CBLAS_FLAG})
  130. GenerateNamedObjects("imax.c" "USE_MIN" "i*min" ${CBLAS_FLAG})
  131. if (BUILD_BFLOAT16)
  132. GenerateNamedObjects("bf16dot.c" "" "sbdot" ${CBLAS_FLAG} "" "" true "BFLOAT16")
  133. GenerateNamedObjects("gemm.c" "BGEMM" "bgemm" ${CBLAS_FLAG} "" "" true "BFLOAT16")
  134. GenerateNamedObjects("gemm.c" "" "sbgemm" ${CBLAS_FLAG} "" "" true "BFLOAT16")
  135. GenerateNamedObjects("sbgemmt.c" "" "sbgemmt" ${CBLAS_FLAG} "" "" true "BFLOAT16")
  136. GenerateNamedObjects("sbgemmt.c" "RNAME" "sbgemmtr" ${CBLAS_FLAG} "" "" true "BFLOAT16")
  137. GenerateNamedObjects("sbgemv.c" "" "sbgemv" ${CBLAS_FLAG} "" "" true "BFLOAT16")
  138. GenerateNamedObjects("tobf16.c" "SINGLE_PREC" "sbstobf16" ${CBLAS_FLAG} "" "" true "BFLOAT16")
  139. GenerateNamedObjects("tobf16.c" "DOUBLE_PREC" "sbdtobf16" ${CBLAS_FLAG} "" "" true "BFLOAT16")
  140. GenerateNamedObjects("bf16to.c" "SINGLE_PREC" "sbf16tos" ${CBLAS_FLAG} "" "" true "BFLOAT16")
  141. GenerateNamedObjects("bf16to.c" "DOUBLE_PREC" "dbf16tod" ${CBLAS_FLAG} "" "" true "BFLOAT16")
  142. if(CBLAS_FLAG EQUAL 1)
  143. GenerateNamedObjects("gemm_batch.c" "" "sbgemm_batch" ${CBLAS_FLAG} "" "" true "BFLOAT16")
  144. endif ()
  145. endif ()
  146. if (BUILD_HFLOAT16)
  147. GenerateNamedObjects("gemm.c" "" "shgemm" ${CBLAS_FLAG} "" "" true "HFLOAT16")
  148. endif ()
  149. # complex-specific sources
  150. foreach (float_type ${FLOAT_TYPES})
  151. if (${float_type} STREQUAL "COMPLEX" OR ${float_type} STREQUAL "ZCOMPLEX")
  152. GenerateNamedObjects("zaxpy.c" "CONJ" "axpyc" ${CBLAS_FLAG} "" "" false ${float_type})
  153. GenerateNamedObjects("zger.c" "" "geru" ${CBLAS_FLAG} "" "" false ${float_type})
  154. GenerateNamedObjects("zger.c" "CONJ" "gerc" ${CBLAS_FLAG} "" "" false ${float_type})
  155. GenerateNamedObjects("zdot.c" "CONJ" "dotc" ${CBLAS_FLAG} "" "" false ${float_type})
  156. GenerateNamedObjects("zdot.c" "" "dotu" ${CBLAS_FLAG} "" "" false ${float_type})
  157. GenerateNamedObjects("symm.c" "HEMM" "hemm" ${CBLAS_FLAG} "" "" false ${float_type})
  158. GenerateNamedObjects("syrk.c" "HEMM" "herk" ${CBLAS_FLAG} "" "" false ${float_type})
  159. GenerateNamedObjects("syr2k.c" "HEMM" "her2k" ${CBLAS_FLAG} "" "" false ${float_type})
  160. if (USE_GEMM3M)
  161. GenerateNamedObjects("gemm.c" "GEMM3M" "gemm3m" ${CBLAS_FLAG} "" "" false ${float_type})
  162. endif()
  163. endif ()
  164. if (${float_type} STREQUAL "COMPLEX")
  165. GenerateNamedObjects("zscal.c" "SSCAL" "sscal" ${CBLAS_FLAG} "" "" false "COMPLEX")
  166. GenerateNamedObjects("nrm2.c" "" "scnrm2" ${CBLAS_FLAG} "" "" true "COMPLEX")
  167. GenerateNamedObjects("zrot.c" "" "csrot" ${CBLAS_FLAG} "" "" true "COMPLEX")
  168. GenerateNamedObjects("max.c" "USE_ABS;USE_MIN" "scamin" ${CBLAS_FLAG} "" "" true "COMPLEX")
  169. GenerateNamedObjects("max.c" "USE_ABS" "scamax" ${CBLAS_FLAG} "" "" true "COMPLEX")
  170. GenerateNamedObjects("asum.c" "" "scasum" ${CBLAS_FLAG} "" "" true "COMPLEX")
  171. GenerateNamedObjects("sum.c" "" "scsum" ${CBLAS_FLAG} "" "" true "COMPLEX")
  172. if(CBLAS_FLAG EQUAL 1)
  173. GenerateNamedObjects("gemm_batch.c" "" "cgemm_batch" ${CBLAS_FLAG} "" "" true "COMPLEX")
  174. endif ()
  175. endif ()
  176. if (${float_type} STREQUAL "ZCOMPLEX")
  177. GenerateNamedObjects("zscal.c" "SSCAL" "dscal" ${CBLAS_FLAG} "" "" false "ZCOMPLEX")
  178. GenerateNamedObjects("nrm2.c" "" "dznrm2" ${CBLAS_FLAG} "" "" true "ZCOMPLEX")
  179. GenerateNamedObjects("zrot.c" "" "zdrot" ${CBLAS_FLAG} "" "" true "ZCOMPLEX")
  180. GenerateNamedObjects("max.c" "USE_ABS;USE_MIN" "dzamin" ${CBLAS_FLAG} "" "" true "ZCOMPLEX")
  181. GenerateNamedObjects("max.c" "USE_ABS" "dzamax" ${CBLAS_FLAG} "" "" true "ZCOMPLEX")
  182. GenerateNamedObjects("asum.c" "" "dzasum" ${CBLAS_FLAG} "" "" true "ZCOMPLEX")
  183. GenerateNamedObjects("sum.c" "" "dzsum" ${CBLAS_FLAG} "" "" true "ZCOMPLEX")
  184. if(CBLAS_FLAG EQUAL 1)
  185. GenerateNamedObjects("gemm_batch.c" "" "zgemm_batch" ${CBLAS_FLAG} "" "" true "ZCOMPLEX")
  186. endif ()
  187. endif ()
  188. endforeach ()
  189. endforeach ()
  190. #Special functions for CBLAS
  191. if (NOT DEFINED NO_CBLAS)
  192. foreach (float_type ${FLOAT_TYPES})
  193. if (${float_type} STREQUAL "COMPLEX" OR ${float_type} STREQUAL "ZCOMPLEX")
  194. #cblas_dotc_sub cblas_dotu_sub
  195. GenerateNamedObjects("zdot.c" "FORCE_USE_STACK" "dotu_sub" 1 "" "" false ${float_type})
  196. GenerateNamedObjects("zdot.c" "FORCE_USE_STACK;CONJ" "dotc_sub" 1 "" "" false ${float_type})
  197. endif()
  198. endforeach ()
  199. endif()
  200. if (NOT NO_LAPACK)
  201. set(LAPACK_SOURCES
  202. lapack/gesv.c
  203. )
  204. # prepend z for complex versions
  205. set(LAPACK_MANGLED_SOURCES
  206. lapack/getrf.c lapack/getrs.c lapack/potrf.c lapack/getf2.c
  207. lapack/potf2.c lapack/laswp.c lapack/lauu2.c
  208. lapack/lauum.c lapack/trti2.c lapack/trtri.c
  209. )
  210. GenerateNamedObjects("${LAPACK_SOURCES}")
  211. if (NOT RELAPACK_REPLACE)
  212. GenerateNamedObjects("${LAPACK_MANGLED_SOURCES}" "" "" 0 "" "" 0 3)
  213. else ()
  214. GenerateNamedObjects("lapack/getrs.c" "" "" 0 "" "" 0 3)
  215. GenerateNamedObjects("lapack/getf2.c" "" "" 0 "" "" 0 3)
  216. GenerateNamedObjects("lapack/potf2.c" "" "" 0 "" "" 0 3)
  217. GenerateNamedObjects("lapack/laswp.c" "" "" 0 "" "" 0 3)
  218. GenerateNamedObjects("lapack/lauu2.c" "" "" 0 "" "" 0 3)
  219. GenerateNamedObjects("lapack/trti2.c" "" "" 0 "" "" 0 3)
  220. endif()
  221. GenerateNamedObjects("lapack/laed3.c" "" "" 0 "" "" 0 1)
  222. endif ()
  223. if ( BUILD_COMPLEX AND NOT BUILD_SINGLE)
  224. GenerateNamedObjects("scal.c" "" "scal" 0 "" "" false "SINGLE")
  225. GenerateNamedObjects("copy.c" "" "copy" 0 "" "" false "SINGLE")
  226. GenerateNamedObjects("dot.c" "" "dot" 0 "" "" false "SINGLE")
  227. GenerateNamedObjects("rot.c" "" "rot" 0 "" "" false "SINGLE")
  228. GenerateNamedObjects("nrm2.c" "" "nrm2" 0 "" "" false "SINGLE")
  229. GenerateNamedObjects("gemv.c" "" "gemv" 0 "" "" false "SINGLE")
  230. GenerateNamedObjects("gemm.c" "" "gemm" 0 "" "" false "SINGLE")
  231. GenerateNamedObjects("gemm_batch.c" "" "gemm_batch" 1 "" "" false "SINGLE")
  232. GenerateNamedObjects("asum.c" "" "asum" 0 "" "" false "SINGLE")
  233. GenerateNamedObjects("swap.c" "" "swap" 0 "" "" false "SINGLE")
  234. GenerateNamedObjects("axpy.c" "" "axpy" 0 "" "" false "SINGLE")
  235. GenerateNamedObjects("imax.c" "USE_ABS" "i*amax" 0 "" "" false "SINGLE")
  236. endif ()
  237. if ( BUILD_COMPLEX16 AND NOT BUILD_DOUBLE)
  238. GenerateNamedObjects("scal.c" "" "scal" 0 "" "" false "DOUBLE")
  239. GenerateNamedObjects("copy.c" "" "copy" 0 "" "" false "DOUBLE")
  240. GenerateNamedObjects("dot.c" "" "dot" 0 "" "" false "DOUBLE")
  241. GenerateNamedObjects("rot.c" "" "rot" 0 "" "" false "DOUBLE")
  242. GenerateNamedObjects("nrm2.c" "" "nrm2" 0 "" "" false "DOUBLE")
  243. GenerateNamedObjects("gemv.c" "" "gemv" 0 "" "" false "DOUBLE")
  244. GenerateNamedObjects("gemm.c" "" "gemm" 0 "" "" false "DOUBLE")
  245. GenerateNamedObjects("gemm_batch.c" "" "gemm_batch" 1 "" "" false "DOUBLE")
  246. GenerateNamedObjects("asum.c" "" "asum" 0 "" "" false "DOUBLE")
  247. GenerateNamedObjects("swap.c" "" "swap" 0 "" "" false "DOUBLE")
  248. GenerateNamedObjects("axpy.c" "" "axpy" 0 "" "" false "DOUBLE")
  249. GenerateNamedObjects("imax.c" "USE_ABS" "i*amax" 0 "" "" false "DOUBLE")
  250. endif ()
  251. add_library(interface OBJECT ${OPENBLAS_SRC})
  252. if (USE_OPENMP)
  253. target_link_libraries(interface OpenMP::OpenMP_C)
  254. endif()