You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

CMakeLists.txt 5.9 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166
  1. include_directories(${CMAKE_SOURCE_DIR})
  2. set(BLAS1_SOURCES
  3. copy.c
  4. nrm2.c
  5. )
  6. set(BLAS1_REAL_ONLY_SOURCES
  7. rotm.c rotmg.c # N.B. these do not have complex counterparts
  8. rot.c
  9. asum.c
  10. )
  11. # these will have 'z' prepended for the complex version
  12. set(BLAS1_MANGLED_SOURCES
  13. axpy.c swap.c
  14. scal.c
  15. dot.c
  16. rotg.c
  17. axpby.c
  18. )
  19. # TODO: USE_NETLIB_GEMV shoudl switch gemv.c to netlib/*gemv.f
  20. # these all have 'z' sources for complex versions
  21. set(BLAS2_SOURCES
  22. gemv.c ger.c
  23. trsv.c trmv.c symv.c
  24. syr.c syr2.c gbmv.c
  25. sbmv.c spmv.c
  26. spr.c spr2.c
  27. tbsv.c tbmv.c
  28. tpsv.c tpmv.c
  29. )
  30. set(BLAS2_COMPLEX_ONLY_MANGLED_SOURCES
  31. hemv.c hbmv.c
  32. her.c her2.c
  33. hpmv.c hpr.c
  34. hpr2.c
  35. )
  36. # these do not have separate 'z' sources
  37. set(BLAS3_SOURCES
  38. gemm.c symm.c
  39. trsm.c syrk.c syr2k.c
  40. )
  41. set(BLAS3_MANGLED_SOURCES
  42. omatcopy.c imatcopy.c
  43. geadd.c
  44. )
  45. # generate the BLAS objs once with and once without cblas
  46. set (CBLAS_FLAGS "")
  47. if (NOT DEFINED NO_FBLAS)
  48. list(APPEND CBLAS_FLAGS 0)
  49. endif ()
  50. if (NOT DEFINED NO_CBLAS)
  51. list(APPEND CBLAS_FLAGS 1)
  52. endif ()
  53. foreach (CBLAS_FLAG ${CBLAS_FLAGS})
  54. # TODO: don't compile complex sources with cblas for now, the naming schemes are all different and they will have to be handled separately from SINGLE/DOUBLE
  55. set(DISABLE_COMPLEX 0)
  56. set(MANGLE_COMPLEX 3)
  57. if (CBLAS_FLAG EQUAL 1)
  58. # set(DISABLE_COMPLEX 1)
  59. # set(MANGLE_COMPLEX 1)
  60. endif ()
  61. GenerateNamedObjects("${BLAS1_SOURCES}" "" "" ${CBLAS_FLAG} "" "" false ${DISABLE_COMPLEX})
  62. GenerateNamedObjects("${BLAS1_REAL_ONLY_SOURCES}" "" "" ${CBLAS_FLAG} "" "" false 1)
  63. GenerateNamedObjects("${BLAS1_MANGLED_SOURCES}" "" "" ${CBLAS_FLAG} "" "" false ${MANGLE_COMPLEX})
  64. GenerateNamedObjects("${BLAS2_SOURCES}" "" "" ${CBLAS_FLAG} "" "" false ${MANGLE_COMPLEX})
  65. GenerateNamedObjects("${BLAS2_COMPLEX_ONLY_MANGLED_SOURCES}" "" "" ${CBLAS_FLAG} "" "" false 4)
  66. GenerateNamedObjects("${BLAS3_SOURCES}" "" "" ${CBLAS_FLAG} "" "" false ${DISABLE_COMPLEX})
  67. GenerateNamedObjects("${BLAS3_MANGLED_SOURCES}" "" "" ${CBLAS_FLAG} "" "" false ${MANGLE_COMPLEX})
  68. #sdsdot, dsdot
  69. GenerateNamedObjects("sdsdot.c" "" "sdsdot" ${CBLAS_FLAG} "" "" true "SINGLE")
  70. GenerateNamedObjects("dsdot.c" "" "dsdot" ${CBLAS_FLAG} "" "" true "SINGLE")
  71. # trmm is trsm with a compiler flag set
  72. GenerateNamedObjects("trsm.c" "TRMM" "trmm" ${CBLAS_FLAG})
  73. # max and imax are compiled 4 times
  74. GenerateNamedObjects("max.c" "" "" ${CBLAS_FLAG})
  75. GenerateNamedObjects("max.c" "USE_ABS" "amax" ${CBLAS_FLAG})
  76. GenerateNamedObjects("max.c" "USE_ABS;USE_MIN" "amin" ${CBLAS_FLAG})
  77. GenerateNamedObjects("max.c" "USE_MIN" "min" ${CBLAS_FLAG})
  78. GenerateNamedObjects("imax.c" "" "i*max" ${CBLAS_FLAG})
  79. GenerateNamedObjects("imax.c" "USE_ABS" "i*amax" ${CBLAS_FLAG})
  80. GenerateNamedObjects("imax.c" "USE_ABS;USE_MIN" "i*amin" ${CBLAS_FLAG})
  81. GenerateNamedObjects("imax.c" "USE_MIN" "i*min" ${CBLAS_FLAG})
  82. # complex-specific sources
  83. foreach (float_type ${FLOAT_TYPES})
  84. if (${float_type} STREQUAL "COMPLEX" OR ${float_type} STREQUAL "ZCOMPLEX")
  85. GenerateNamedObjects("zger.c" "" "geru" ${CBLAS_FLAG} "" "" false ${float_type})
  86. GenerateNamedObjects("zger.c" "CONJ" "gerc" ${CBLAS_FLAG} "" "" false ${float_type})
  87. GenerateNamedObjects("zdot.c" "CONJ" "dotc" ${CBLAS_FLAG} "" "" false ${float_type})
  88. GenerateNamedObjects("zdot.c" "" "dotu" ${CBLAS_FLAG} "" "" false ${float_type})
  89. GenerateNamedObjects("symm.c" "HEMM" "hemm" ${CBLAS_FLAG} "" "" false ${float_type})
  90. GenerateNamedObjects("syrk.c" "HEMM" "herk" ${CBLAS_FLAG} "" "" false ${float_type})
  91. GenerateNamedObjects("syr2k.c" "HEMM" "her2k" ${CBLAS_FLAG} "" "" false ${float_type})
  92. if (USE_GEMM3M)
  93. GenerateNamedObjects("gemm.c" "GEMM3M" "gemm3m" false "" "" false ${float_type})
  94. endif()
  95. endif ()
  96. if (${float_type} STREQUAL "COMPLEX")
  97. GenerateNamedObjects("zscal.c" "SSCAL" "sscal" ${CBLAS_FLAG} "" "" false "COMPLEX")
  98. GenerateNamedObjects("nrm2.c" "" "scnrm2" ${CBLAS_FLAG} "" "" true "COMPLEX")
  99. GenerateNamedObjects("zrot.c" "" "csrot" ${CBLAS_FLAG} "" "" true "COMPLEX")
  100. GenerateNamedObjects("max.c" "USE_ABS;USE_MIN" "scamin" ${CBLAS_FLAG} "" "" true "COMPLEX")
  101. GenerateNamedObjects("max.c" "USE_ABS" "scamax" ${CBLAS_FLAG} "" "" true "COMPLEX")
  102. GenerateNamedObjects("asum.c" "" "scasum" ${CBLAS_FLAG} "" "" true "COMPLEX")
  103. endif ()
  104. if (${float_type} STREQUAL "ZCOMPLEX")
  105. GenerateNamedObjects("zscal.c" "SSCAL" "dscal" ${CBLAS_FLAG} "" "" false "ZCOMPLEX")
  106. GenerateNamedObjects("nrm2.c" "" "dznrm2" ${CBLAS_FLAG} "" "" true "ZCOMPLEX")
  107. GenerateNamedObjects("zrot.c" "" "zdrot" ${CBLAS_FLAG} "" "" true "ZCOMPLEX")
  108. GenerateNamedObjects("max.c" "USE_ABS;USE_MIN" "dzamin" ${CBLAS_FLAG} "" "" true "ZCOMPLEX")
  109. GenerateNamedObjects("max.c" "USE_ABS" "dzamax" ${CBLAS_FLAG} "" "" true "ZCOMPLEX")
  110. GenerateNamedObjects("asum.c" "" "dzasum" ${CBLAS_FLAG} "" "" true "ZCOMPLEX")
  111. endif ()
  112. endforeach ()
  113. endforeach ()
  114. #Special functions for CBLAS
  115. if (NOT DEFINED NO_CBLAS)
  116. foreach (float_type ${FLOAT_TYPES})
  117. if (${float_type} STREQUAL "COMPLEX" OR ${float_type} STREQUAL "ZCOMPLEX")
  118. #cblas_dotc_sub cblas_dotu_sub
  119. GenerateNamedObjects("zdot.c" "FORCE_USE_STACK" "dotu_sub" 1 "" "" false ${float_type})
  120. GenerateNamedObjects("zdot.c" "FORCE_USE_STACK;CONJ" "dotc_sub" 1 "" "" false ${float_type})
  121. endif()
  122. endforeach ()
  123. endif()
  124. if (NOT DEFINED NO_LAPACK)
  125. set(LAPACK_SOURCES
  126. lapack/gesv.c
  127. )
  128. # prepend z for complex versions
  129. set(LAPACK_MANGLED_SOURCES
  130. lapack/getrf.c lapack/getrs.c lapack/potrf.c lapack/getf2.c
  131. lapack/potf2.c lapack/laswp.c lapack/lauu2.c
  132. lapack/lauum.c lapack/trti2.c lapack/trtri.c
  133. )
  134. GenerateNamedObjects("${LAPACK_SOURCES}")
  135. GenerateNamedObjects("${LAPACK_MANGLED_SOURCES}" "" "" 0 "" "" 0 3)
  136. endif ()
  137. add_library(interface OBJECT ${OPENBLAS_SRC})