|
- ##
- ## Author: Hank Anderson <hank@statease.com>
- ## Description: Ported from OpenBLAS/Makefile.system
- ##
- set(NETLIB_LAPACK_DIR "${PROJECT_SOURCE_DIR}/lapack-netlib")
-
- # System detection, via CMake.
- include("${PROJECT_SOURCE_DIR}/cmake/system_check.cmake")
-
- if(CMAKE_CROSSCOMPILING AND NOT DEFINED TARGET)
- # Detect target without running getarch
- if (ARM64)
- set(TARGET "ARMV8")
- elseif(ARM)
- set(TARGET "ARMV7") # TODO: Ask compiler which arch this is
- else()
- message(FATAL_ERROR "When cross compiling, a TARGET is required.")
- endif()
- endif()
-
- # Other files expect CORE, which is actually TARGET and will become TARGET_CORE for kernel build. Confused yet?
- # It seems we are meant to use TARGET as input and CORE internally as kernel.
- if(NOT DEFINED CORE AND DEFINED TARGET)
- set(CORE ${TARGET})
- endif()
-
- # TARGET_CORE will override TARGET which is used in DYNAMIC_ARCH=1.
- if (DEFINED TARGET_CORE)
- set(TARGET ${TARGET_CORE})
- endif ()
-
- # Force fallbacks for 32bit
- if (DEFINED BINARY AND DEFINED TARGET AND BINARY EQUAL 32)
- message(STATUS "Compiling a ${BINARY}-bit binary.")
- set(NO_AVX 1)
- if (${TARGET} STREQUAL "HASWELL" OR ${TARGET} STREQUAL "SANDYBRIDGE" OR ${TARGET} STREQUAL "SKYLAKEX" OR ${TARGET} STREQUAL "COOPERLAKE" OR ${TARGET} STREQUAL "SAPPHIRERAPIDS")
- set(TARGET "NEHALEM")
- endif ()
- if (${TARGET} STREQUAL "BULLDOZER" OR ${TARGET} STREQUAL "PILEDRIVER" OR ${TARGET} STREQUAL "ZEN")
- set(TARGET "BARCELONA")
- endif ()
- if (${TARGET} STREQUAL "ARMV8" OR ${TARGET} STREQUAL "CORTEXA57" OR ${TARGET} STREQUAL "CORTEXA53" OR ${TARGET} STREQUAL "CORTEXA55")
- set(TARGET "ARMV7")
- endif ()
- if (${TARGET} STREQUAL "POWER8" OR ${TARGET} STREQUAL "POWER9" OR ${TARGET} STREQUAL "POWER10")
- set(TARGET "POWER6")
- endif ()
- endif ()
-
-
- if (DEFINED TARGET)
- message(STATUS "-- -- -- -- -- -- -- -- -- -- -- -- --")
- message(STATUS "Targeting the ${TARGET} architecture.")
- set(GETARCH_FLAGS "-DFORCE_${TARGET}")
- endif ()
-
- # On x86_64 build getarch with march=native. This is required to detect AVX512 support in getarch.
- if (X86_64 AND NOT ${CMAKE_C_COMPILER_ID} STREQUAL "PGI")
- set(GETARCH_FLAGS "${GETARCH_FLAGS} -march=native")
- endif ()
-
- # On x86 no AVX support is available
- if (X86 OR X86_64)
- if ((DEFINED BINARY AND BINARY EQUAL 32) OR ("$CMAKE_SIZEOF_VOID_P}" EQUAL "4"))
- set(GETARCH_FLAGS "${GETARCH_FLAGS} -DNO_AVX -DNO_AVX2 -DNO_AVX512")
- endif ()
- endif ()
-
- if (INTERFACE64)
- message(STATUS "Using 64-bit integers.")
- set(GETARCH_FLAGS "${GETARCH_FLAGS} -DUSE64BITINT")
- endif ()
-
- if (NOT DEFINED GEMM_MULTITHREAD_THRESHOLD)
- set(GEMM_MULTITHREAD_THRESHOLD 4)
- endif ()
- message(STATUS "GEMM multithread threshold set to ${GEMM_MULTITHREAD_THRESHOLD}.")
- set(GETARCH_FLAGS "${GETARCH_FLAGS} -DGEMM_MULTITHREAD_THRESHOLD=${GEMM_MULTITHREAD_THRESHOLD}")
-
- if (NO_AVX)
- message(STATUS "Disabling Advanced Vector Extensions (AVX).")
- set(GETARCH_FLAGS "${GETARCH_FLAGS} -DNO_AVX")
- endif ()
-
- if (NO_AVX2)
- message(STATUS "Disabling Advanced Vector Extensions 2 (AVX2).")
- set(GETARCH_FLAGS "${GETARCH_FLAGS} -DNO_AVX2")
- endif ()
-
- if (NO_AVX512)
- message(STATUS "Disabling Advanced Vector Extensions 512 (AVX512).")
- set(GETARCH_FLAGS "${GETARCH_FLAGS} -DNO_AVX512")
- endif ()
-
- if (CMAKE_BUILD_TYPE STREQUAL "Debug")
- set(GETARCH_FLAGS "${GETARCH_FLAGS} ${CMAKE_C_FLAGS_DEBUG}")
- endif ()
-
- if (NOT DEFINED NO_PARALLEL_MAKE)
- set(NO_PARALLEL_MAKE 0)
- endif ()
- set(GETARCH_FLAGS "${GETARCH_FLAGS} -DNO_PARALLEL_MAKE=${NO_PARALLEL_MAKE}")
-
- if (CMAKE_C_COMPILER STREQUAL loongcc)
- set(GETARCH_FLAGS "${GETARCH_FLAGS} -static")
- endif ()
-
- if (POWER)
- set(NO_WARMUP 1)
- set(HAVE_GAS 1)
- if (CMAKE_ASM_COMPILER_ID STREQUAL "GNU")
- set(HAVE_GAS 0)
- elseif (CMAKE_ASM_COMPILER_ID STREQUAL "Clang")
- set(CCOMMON_OPT "${CCOMMON_OPT} -fno-integrated-as")
- set(HAVE_GAS 0)
- endif ()
- set(GETARCH_FLAGS "${GETARCH_FLAGS} -DHAVE_GAS=${HAVE_GAS}")
- endif ()
-
- #if don't use Fortran, it will only compile CBLAS.
- if (ONLY_CBLAS)
- set(NO_LAPACK 1)
- else ()
- set(ONLY_CBLAS 0)
- endif ()
-
- # N.B. this is NUM_THREAD in Makefile.system which is probably a bug -hpa
- if (NOT CMAKE_CROSSCOMPILING)
- if (NOT DEFINED NUM_CORES)
- include(ProcessorCount)
- ProcessorCount(NUM_CORES)
- endif()
-
- endif()
-
- if (NOT DEFINED NUM_PARALLEL)
- set(NUM_PARALLEL 1)
- endif()
-
- if (NOT DEFINED NUM_THREADS)
- if (DEFINED NUM_CORES AND NOT NUM_CORES EQUAL 0)
- # HT?
- set(NUM_THREADS ${NUM_CORES})
- else ()
- set(NUM_THREADS 0)
- endif ()
- endif()
-
- if (${NUM_THREADS} LESS 2)
- set(USE_THREAD 0)
- elseif(NOT DEFINED USE_THREAD)
- set(USE_THREAD 1)
- endif ()
-
- if (USE_THREAD)
- message(STATUS "Multi-threading enabled with ${NUM_THREADS} threads.")
- else()
- if (${USE_LOCKING})
- set(CCOMMON_OPT "${CCOMMON_OPT} -DUSE_LOCKING")
- endif ()
- endif ()
-
- include("${PROJECT_SOURCE_DIR}/cmake/prebuild.cmake")
- if (DEFINED TARGET)
- if (${TARGET} STREQUAL COOPERLAKE AND NOT NO_AVX512)
- if (${CMAKE_C_COMPILER_ID} STREQUAL "GNU")
- execute_process(COMMAND ${CMAKE_C_COMPILER} -dumpversion OUTPUT_VARIABLE GCC_VERSION)
- if (${CMAKE_C_COMPILER_VERSION} VERSION_GREATER 10.09)
- set (KERNEL_DEFINITIONS "${KERNEL_DEFINITIONS} -march=cooperlake")
- else()
- set (KERNEL_DEFINITIONS "${KERNEL_DEFINITIONS} -march=skylake-avx512")
- endif()
- elseif (${CMAKE_C_COMPILER_ID} STREQUAL "Clang" OR ${CMAKE_C_COMPILER_ID} STREQUAL "AppleClang")
- if (${CMAKE_C_COMPILER_VERSION} VERSION_GREATER 8.99)
- set (KERNEL_DEFINITIONS "${KERNEL_DEFINITIONS} -march=cooperlake -exhaustive-register-search")
- else()
- set (KERNEL_DEFINITIONS "${KERNEL_DEFINITIONS} -march=skylake-avx512 -exhaustive-register-search")
- endif()
- endif()
- endif()
- if (${TARGET} STREQUAL SAPPHIRERAPIDS AND NOT NO_AVX512)
- if (${CMAKE_C_COMPILER_ID} STREQUAL "GNU")
- execute_process(COMMAND ${CMAKE_C_COMPILER} -dumpversion OUTPUT_VARIABLE GCC_VERSION)
- if (${CMAKE_C_COMPILER_VERSION} VERSION_GREATER 11.0)
- set (KERNEL_DEFINITIONS "${KERNEL_DEFINITIONS} -march=sapphirerapids")
- else()
- set (KERNEL_DEFINITIONS "${KERNEL_DEFINITIONS} -march=skylake-avx512")
- endif()
- elseif (${CMAKE_C_COMPILER_ID} STREQUAL "Clang" OR ${CMAKE_C_COMPILER_ID} STREQUAL "AppleClang")
- if (${CMAKE_C_COMPILER_VERSION} VERSION_GREATER 12.0)
- set (KERNEL_DEFINITIONS "${KERNEL_DEFINITIONS} -march=sapphirerapids -exhaustive-register-search")
- else()
- set (KERNEL_DEFINITIONS "${KERNEL_DEFINITIONS} -march=skylake-avx512 -exhaustive-register-search")
- endif()
- endif()
- endif()
- if (${TARGET} STREQUAL SKYLAKEX AND NOT NO_AVX512)
- set (KERNEL_DEFINITIONS "${KERNEL_DEFINITIONS} -march=skylake-avx512")
- if (${CMAKE_C_COMPILER_ID} STREQUAL "Clang" OR ${CMAKE_C_COMPILER_ID} STREQUAL "AppleClang")
- set (KERNEL_DEFINITIONS "${KERNEL_DEFINITIONS} -exhaustive-register-search")
- endif()
- endif()
-
- if (((${TARGET} STREQUAL ZEN) AND HAVE_AVX512VL) AND NOT NO_AVX512)
- if (${CMAKE_C_COMPILER_ID} STREQUAL "GNU")
- execute_process(COMMAND ${CMAKE_C_COMPILER} -dumpversion OUTPUT_VARIABLE GCC_VERSION)
- if (${CMAKE_C_COMPILER_VERSION} VERSION_GREATER 12.99)
- set (KERNEL_DEFINITIONS "${KERNEL_DEFINITIONS} -march=znver4")
- else()
- set (KERNEL_DEFINITIONS "${KERNEL_DEFINITIONS} -march=skylake-avx512")
- endif()
- elseif (${CMAKE_C_COMPILER_ID} STREQUAL "Clang" OR ${CMAKE_C_COMPILER_ID} STREQUAL "AppleClang")
- if (${CMAKE_C_COMPILER_VERSION} VERSION_GREATER 15.99)
- set (KERNEL_DEFINITIONS "${KERNEL_DEFINITIONS} -march=znver4")
- else()
- set (KERNEL_DEFINITIONS "${KERNEL_DEFINITIONS} -march=skylake-avx512")
- endif()
- set (KERNEL_DEFINITIONS "${KERNEL_DEFINITIONS} -exhaustive-register-search")
- endif()
- endif()
-
- if ((${TARGET} STREQUAL HASWELL OR (${TARGET} STREQUAL ZEN AND NOT HAVE_AVX512VL)) AND NOT NO_AVX2)
- if (${CMAKE_C_COMPILER_ID} STREQUAL "GNU")
- execute_process(COMMAND ${CMAKE_C_COMPILER} -dumpversion OUTPUT_VARIABLE GCC_VERSION)
- if (${GCC_VERSION} VERSION_GREATER 4.7 OR ${GCC_VERSION} VERSION_EQUAL 4.7)
- set (KERNEL_DEFINITIONS "${KERNEL_DEFINITIONS} -mavx2")
- endif()
- elseif (${CMAKE_C_COMPILER_ID} STREQUAL "CLANG")
- set (KERNEL_DEFINITIONS "${KERNEL_DEFINITIONS} -mavx2 -mfma")
- endif()
- endif()
- if (DEFINED HAVE_AVX)
- if (NOT NO_AVX)
- set (KERNEL_DEFINITIONS "${KERNEL_DEFINITIONS} -mavx")
- endif()
- endif()
- if (DEFINED HAVE_AVX2)
- if (NOT NO_AVX2)
- set (KERNEL_DEFINITIONS "${KERNEL_DEFINITIONS} -mavx2")
- endif()
- endif()
- # if (DEFINED HAVE_FMA3)
- # if (NOT NO_AVX2)
- # set (KERNEL_DEFINITIONS "${KERNEL_DEFINITIONS} -mfma")
- # endif()
- # endif()
- if (DEFINED HAVE_SSE)
- set (KERNEL_DEFINITIONS "${KERNEL_DEFINITIONS} -msse")
- endif()
- if (DEFINED HAVE_SSE2)
- set (KERNEL_DEFINITIONS "${KERNEL_DEFINITIONS} -msse2")
- endif()
- if (DEFINED HAVE_SSE3)
- set (KERNEL_DEFINITIONS "${KERNEL_DEFINITIONS} -msse3")
- endif()
- if (DEFINED HAVE_SSSE3)
- set (KERNEL_DEFINITIONS "${KERNEL_DEFINITIONS} -mssse3")
- endif()
- if (DEFINED HAVE_SSE4_1)
- set (KERNEL_DEFINITIONS "${KERNEL_DEFINITIONS} -msse4.1")
- endif()
-
- if (${TARGET} STREQUAL POWER10)
- execute_process(COMMAND ${CMAKE_C_COMPILER} -dumpversion OUTPUT_VARIABLE GCC_VERSION)
- if (${GCC_VERSION} VERSION_GREATER 10.2 OR ${GCC_VERSION} VERSION_EQUAL 10.2)
- set (KERNEL_DEFINITIONS "${KERNEL_DEFINITIONS} -mcpu=power10 -mtune=power10 -mvsx -fno-fast-math")
- else ()
- message(FATAL_ERROR "Compiler GCC.${GCC_VERSION} does not support Power10.")
- endif()
- endif()
- if (${TARGET} STREQUAL POWER9)
- execute_process(COMMAND ${CMAKE_C_COMPILER} -dumpversion OUTPUT_VARIABLE GCC_VERSION)
- if (${GCC_VERSION} VERSION_GREATER 5.0 OR ${GCC_VERSION} VERSION_EQUAL 5.0)
- set (KERNEL_DEFINITIONS "${KERNEL_DEFINITIONS} -mcpu=power9 -mtune=power9 -mvsx -fno-fast-math")
- else ()
- set (KERNEL_DEFINITIONS "${KERNEL_DEFINITIONS} -mcpu=power8 -mtune=power8 -mvsx -fno-fast-math")
- message(WARNING "Compiler GCC.${GCC_VERSION} does not support fully Power9.")
- endif()
- endif()
- if (${TARGET} STREQUAL POWER8)
- set (KERNEL_DEFINITIONS "${KERNEL_DEFINITIONS} -mcpu=power8 -mtune=power8 -mvsx -fno-fast-math")
- endif()
- endif()
- if (DEFINED BINARY)
- message(STATUS "Compiling a ${BINARY}-bit binary.")
- endif ()
- if (NOT DEFINED NEED_PIC)
- set(NEED_PIC 1)
- endif ()
-
- # OS dependent settings
- include("${PROJECT_SOURCE_DIR}/cmake/os.cmake")
-
- # Architecture dependent settings
- include("${PROJECT_SOURCE_DIR}/cmake/arch.cmake")
-
- # C Compiler dependent settings
- include("${PROJECT_SOURCE_DIR}/cmake/cc.cmake")
-
- if (INTERFACE64)
- set(SUFFIX64 64)
- set(SUFFIX64_UNDERSCORE _64)
- endif()
-
- if (NOT NOFORTRAN)
- # Fortran Compiler dependent settings
- include("${PROJECT_SOURCE_DIR}/cmake/fc.cmake")
- else ()
- if (NOT XXXX)
- set(C_LAPACK 1)
- if (INTERFACE64)
- set (CCOMMON_OPT "${CCOMMON_OPT} -DLAPACK_ILP64")
- endif ()
- set(TIMER "NONE")
- else ()
- set (NO_LAPACK 1)
- endif ()
- endif ()
-
- if (BINARY64)
- if (INTERFACE64)
- # CCOMMON_OPT += -DUSE64BITINT
- endif ()
- endif ()
-
- if(EMBEDDED)
- set(CCOMMON_OPT "${CCOMMON_OPT} -DOS_EMBEDDED")
- set(CCOMMON_OPT "${CCOMMON_OPT} -mthumb -mcpu=cortex-m4 -mfloat-abi=hard -mfpu=fpv4-sp-d16")
- endif()
-
- if (NEED_PIC)
- if (${CMAKE_C_COMPILER} STREQUAL "IBM")
- set(CCOMMON_OPT "${CCOMMON_OPT} -qpic=large")
- else ()
- set(CCOMMON_OPT "${CCOMMON_OPT} -fPIC")
- endif ()
-
- if (NOT NOFORTRAN)
- if (${F_COMPILER} STREQUAL "SUN")
- set(FCOMMON_OPT "${FCOMMON_OPT} -pic")
- else ()
- set(FCOMMON_OPT "${FCOMMON_OPT} -fPIC")
- endif ()
- endif()
- endif ()
-
- if (X86_64 OR ${CORE} STREQUAL POWER10)
- set(SMALL_MATRIX_OPT TRUE)
- endif ()
- if (SMALL_MATRIX_OPT)
- set(CCOMMON_OPT "${CCOMMON_OPT} -DSMALL_MATRIX_OPT")
- endif ()
-
- if (DYNAMIC_ARCH)
- if (X86 OR X86_64 OR ARM64 OR POWER)
- set(CCOMMON_OPT "${CCOMMON_OPT} -DDYNAMIC_ARCH")
- if (DYNAMIC_OLDER)
- set(CCOMMON_OPT "${CCOMMON_OPT} -DDYNAMIC_OLDER")
- endif ()
- else ()
- unset (DYNAMIC_ARCH)
- message (STATUS "DYNAMIC_ARCH is not supported on the target architecture, removing")
- endif ()
- endif ()
-
- if (DYNAMIC_LIST)
- set(CCOMMON_OPT "${CCOMMON_OPT} -DDYNAMIC_LIST")
- foreach(DCORE ${DYNAMIC_LIST})
- set(CCOMMON_OPT "${CCOMMON_OPT} -DDYN_${DCORE}")
- endforeach ()
- endif ()
-
- if (NO_LAPACK)
- set(CCOMMON_OPT "${CCOMMON_OPT} -DNO_LAPACK")
- #Disable LAPACK C interface
- set(NO_LAPACKE 1)
- endif ()
-
- if (NO_LAPACKE)
- set(CCOMMON_OPT "${CCOMMON_OPT} -DNO_LAPACKE")
- endif ()
-
- if (NO_AVX)
- set(CCOMMON_OPT "${CCOMMON_OPT} -DNO_AVX")
- endif ()
-
- if (X86)
- set(CCOMMON_OPT "${CCOMMON_OPT} -DNO_AVX")
- endif ()
-
- if (NO_AVX2)
- set(CCOMMON_OPT "${CCOMMON_OPT} -DNO_AVX2")
- endif ()
-
- if (NO_AVX512)
- set(CCOMMON_OPT "${CCOMMON_OPT} -DNO_AVX512")
- endif ()
-
- if (USE_THREAD)
- # USE_SIMPLE_THREADED_LEVEL3 = 1
- # NO_AFFINITY = 1
- set(CCOMMON_OPT "${CCOMMON_OPT} -DSMP_SERVER")
-
- if (MIPS64)
- if (NOT ${CORE} STREQUAL "LOONGSON3B")
- set(USE_SIMPLE_THREADED_LEVEL3 1)
- endif ()
- endif ()
-
- if (BIGNUMA)
- set(CCOMMON_OPT "${CCOMMON_OPT} -DBIGNUMA")
- endif ()
- endif ()
-
- if (NO_WARMUP)
- set(CCOMMON_OPT "${CCOMMON_OPT} -DNO_WARMUP")
- endif ()
-
- if (CONSISTENT_FPCSR)
- set(CCOMMON_OPT "${CCOMMON_OPT} -DCONSISTENT_FPCSR")
- endif ()
-
- if (USE_TLS)
- set(CCOMMON_OPT "${CCOMMON_OPT} -DUSE_TLS")
- endif ()
-
- # Only for development
- # set(CCOMMON_OPT "${CCOMMON_OPT} -DPARAMTEST")
- # set(CCOMMON_OPT "${CCOMMON_OPT} -DPREFETCHTEST")
- # set(CCOMMON_OPT "${CCOMMON_OPT} -DNO_SWITCHING")
- # set(USE_PAPI 1)
-
- if (USE_PAPI)
- set(CCOMMON_OPT "${CCOMMON_OPT} -DUSE_PAPI")
- set(EXTRALIB "${EXTRALIB} -lpapi -lperfctr")
- endif ()
-
- if (DYNAMIC_THREADS)
- set(CCOMMON_OPT "${CCOMMON_OPT} -DDYNAMIC_THREADS")
- endif ()
-
- set(CCOMMON_OPT "${CCOMMON_OPT} -DMAX_CPU_NUMBER=${NUM_THREADS}")
-
- set(CCOMMON_OPT "${CCOMMON_OPT} -DMAX_PARALLEL_NUMBER=${NUM_PARALLEL}")
-
- if (BUFFERSIZE)
- set(CCOMMON_OPT "${CCOMMON_OPT} -DBUFFERSIZE=${BUFFERSIZE}")
- endif ()
-
- if (USE_SIMPLE_THREADED_LEVEL3)
- set(CCOMMON_OPT "${CCOMMON_OPT} -DUSE_SIMPLE_THREADED_LEVEL3")
- endif ()
-
- if (NOT ${CMAKE_SYSTEM_NAME} STREQUAL "Windows")
- if (DEFINED MAX_STACK_ALLOC)
- if (NOT ${MAX_STACK_ALLOC} EQUAL 0)
- set(CCOMMON_OPT "${CCOMMON_OPT} -DMAX_STACK_ALLOC=${MAX_STACK_ALLOC}")
- endif ()
- else ()
- set(CCOMMON_OPT "${CCOMMON_OPT} -DMAX_STACK_ALLOC=2048")
- endif ()
- endif ()
- if (NOT ${CMAKE_SYSTEM_NAME} STREQUAL "Windows")
- if (DEFINED BLAS3_MEM_ALLOC_THRESHOLD)
- if (NOT ${BLAS3_MEM_ALLOC_THRESHOLD} EQUAL 32)
- set(CCOMMON_OPT "${CCOMMON_OPT} -DBLAS3_MEM_ALLOC_THRESHOLD=${BLAS3_MEM_ALLOC_THRESHOLD}")
- endif()
- endif()
- endif()
- if (DEFINED LIBNAMESUFFIX)
- set(LIBPREFIX "libopenblas_${LIBNAMESUFFIX}")
- else ()
- set(LIBPREFIX "libopenblas")
- endif ()
-
- if (NOT DEFINED SYMBOLPREFIX)
- set(SYMBOLPREFIX "")
- endif ()
-
- if (NOT DEFINED SYMBOLSUFFIX)
- set(SYMBOLSUFFIX "")
- endif ()
-
- set(KERNELDIR "${PROJECT_SOURCE_DIR}/kernel/${ARCH}")
-
- # TODO: need to convert these Makefiles
- # include ${PROJECT_SOURCE_DIR}/cmake/${ARCH}.cmake
-
- if (${CORE} STREQUAL "PPC440")
- set(CCOMMON_OPT "${CCOMMON_OPT} -DALLOC_QALLOC")
- endif ()
-
- if (${CORE} STREQUAL "PPC440FP2")
- set(STATIC_ALLOCATION 1)
- endif ()
-
- if (NOT ${CMAKE_SYSTEM_NAME} STREQUAL "Linux")
- set(NO_AFFINITY 1)
- endif ()
-
- if (NOT X86_64 AND NOT X86 AND NOT ${CORE} STREQUAL "LOONGSON3B")
- set(NO_AFFINITY 1)
- endif ()
-
- if (NO_AFFINITY)
- set(CCOMMON_OPT "${CCOMMON_OPT} -DNO_AFFINITY")
- endif ()
-
- if (FUNCTION_PROFILE)
- set(CCOMMON_OPT "${CCOMMON_OPT} -DFUNCTION_PROFILE")
- endif ()
-
- if (HUGETLB_ALLOCATION)
- set(CCOMMON_OPT "${CCOMMON_OPT} -DALLOC_HUGETLB")
- endif ()
-
- if (DEFINED HUGETLBFILE_ALLOCATION)
- set(CCOMMON_OPT "${CCOMMON_OPT} -DALLOC_HUGETLBFILE -DHUGETLB_FILE_NAME=${HUGETLBFILE_ALLOCATION})")
- endif ()
-
- if (STATIC_ALLOCATION)
- set(CCOMMON_OPT "${CCOMMON_OPT} -DALLOC_STATIC")
- endif ()
-
- if (DEVICEDRIVER_ALLOCATION)
- set(CCOMMON_OPT "${CCOMMON_OPT} -DALLOC_DEVICEDRIVER -DDEVICEDRIVER_NAME=\"/dev/mapper\"")
- endif ()
-
- if (MIXED_MEMORY_ALLOCATION)
- set(CCOMMON_OPT "${CCOMMON_OPT} -DMIXED_MEMORY_ALLOCATION")
- endif ()
-
- set(CCOMMON_OPT "${CCOMMON_OPT} -DVERSION=\"\\\"${OpenBLAS_VERSION}\\\"\"")
-
- set(REVISION "-r${OpenBLAS_VERSION}")
- set(MAJOR_VERSION ${OpenBLAS_MAJOR_VERSION})
-
- set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} ${CCOMMON_OPT}")
-
- if (NOT BUILD_SINGLE AND NOT BUILD_DOUBLE AND NOT BUILD_COMPLEX AND NOT BUILD_COMPLEX16)
- set (BUILD_SINGLE ON)
- set (BUILD_DOUBLE ON)
- set (BUILD_COMPLEX ON)
- set (BUILD_COMPLEX16 ON)
- endif()
- if (BUILD_SINGLE)
- set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -DBUILD_SINGLE")
- endif()
- if (BUILD_DOUBLE)
- set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -DBUILD_DOUBLE")
- endif()
- if (BUILD_COMPLEX)
- set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -DBUILD_COMPLEX")
- endif()
- if (BUILD_COMPLEX16)
- set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -DBUILD_COMPLEX16")
- endif()
- if (BUILD_BFLOAT16)
- set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -DBUILD_BFLOAT16")
- endif()
- if(NOT MSVC)
- set(CMAKE_ASM_FLAGS "${CMAKE_ASM_FLAGS} ${CCOMMON_OPT}")
- endif()
- # TODO: not sure what PFLAGS is -hpa
- set(PFLAGS "${PFLAGS} ${CCOMMON_OPT} -I${TOPDIR} -DPROFILE ${COMMON_PROF}")
-
- set(CMAKE_Fortran_FLAGS "${CMAKE_Fortran_FLAGS} ${FCOMMON_OPT}")
- # TODO: not sure what FPFLAGS is -hpa
- set(FPFLAGS "${FPFLAGS} ${FCOMMON_OPT} ${COMMON_PROF}")
-
- #For LAPACK Fortran codes.
- set(LAPACK_FFLAGS "${LAPACK_FFLAGS} ${CMAKE_Fortran_FLAGS}")
- set(LAPACK_FPFLAGS "${LAPACK_FPFLAGS} ${FPFLAGS}")
-
- #Disable -fopenmp for LAPACK Fortran codes on Windows.
- if (${CMAKE_SYSTEM_NAME} STREQUAL "Windows")
- set(FILTER_FLAGS "-fopenmp;-mp;-openmp;-xopenmp=parallel")
- foreach (FILTER_FLAG ${FILTER_FLAGS})
- string(REPLACE ${FILTER_FLAG} "" LAPACK_FFLAGS ${LAPACK_FFLAGS})
- string(REPLACE ${FILTER_FLAG} "" LAPACK_FPFLAGS ${LAPACK_FPFLAGS})
- endforeach ()
- endif ()
-
- if ("${F_COMPILER}" STREQUAL "NAG" OR "${F_COMPILER}" STREQUAL "CRAY")
- set(FILTER_FLAGS "-msse3;-mssse3;-msse4.1;-mavx;-mavx2,-mskylake-avx512")
- foreach (FILTER_FLAG ${FILTER_FLAGS})
- string(REPLACE ${FILTER_FLAG} "" LAPACK_FFLAGS ${LAPACK_FFLAGS})
- string(REPLACE ${FILTER_FLAG} "" LAPACK_FPFLAGS ${LAPACK_FPFLAGS})
- endforeach ()
- endif ()
-
- if ("${F_COMPILER}" STREQUAL "GFORTRAN")
- # lapack-netlib is rife with uninitialized warnings -hpa
- set(LAPACK_FFLAGS "${LAPACK_FFLAGS} -Wno-maybe-uninitialized")
- endif ()
-
- set(LAPACK_CFLAGS "${CMAKE_C_CFLAGS} -DHAVE_LAPACK_CONFIG_H")
- if (INTERFACE64)
- set(LAPACK_CFLAGS "${LAPACK_CFLAGS} -DLAPACK_ILP64")
- endif ()
-
- if (${CMAKE_SYSTEM_NAME} STREQUAL "Windows")
- set(LAPACK_CFLAGS "${LAPACK_CFLAGS} -DOPENBLAS_OS_WINDOWS")
- endif ()
-
- if (${CMAKE_C_COMPILER} STREQUAL "LSB" OR ${CMAKE_SYSTEM_NAME} STREQUAL "Windows")
- set(LAPACK_CFLAGS "${LAPACK_CFLAGS} -DLAPACK_COMPLEX_STRUCTURE")
- endif ()
-
- if ("${CMAKE_BUILD_TYPE}" STREQUAL "Release")
- if ("${F_COMPILER}" STREQUAL "FLANG")
- if (${CMAKE_Fortran_COMPILER_VERSION} VERSION_LESS_EQUAL 3)
- set(CMAKE_Fortran_FLAGS_RELEASE "${CMAKE_Fortran_FLAGS_RELEASE} -fno-unroll-loops")
- endif ()
- endif ()
- endif ()
-
- if (NOT DEFINED SUFFIX)
- set(SUFFIX o)
- endif ()
-
- if (NOT DEFINED PSUFFIX)
- set(PSUFFIX po)
- endif ()
-
- if (NOT DEFINED LIBSUFFIX)
- set(LIBSUFFIX a)
- endif ()
-
- if (DYNAMIC_ARCH)
- if (USE_THREAD)
- set(LIBNAME "${LIBPREFIX}p${REVISION}.${LIBSUFFIX}")
- set(LIBNAME_P "${LIBPREFIX}p${REVISION}_p.${LIBSUFFIX}")
- else ()
- set(LIBNAME "${LIBPREFIX}${REVISION}.${LIBSUFFIX}")
- set(LIBNAME_P "${LIBPREFIX}${REVISION}_p.${LIBSUFFIX}")
- endif ()
- else ()
- if (USE_THREAD)
- set(LIBNAME "${LIBPREFIX}_${LIBCORE}p${REVISION}.${LIBSUFFIX}")
- set(LIBNAME_P "${LIBPREFIX}_${LIBCORE}p${REVISION}_p.${LIBSUFFIX}")
- else ()
- set(LIBNAME "${LIBPREFIX}_${LIBCORE}${REVISION}.${LIBSUFFIX}")
- set(LIBNAME_P "${LIBPREFIX}_${LIBCORE}${REVISION}_p.${LIBSUFFIX}")
- endif ()
- endif ()
-
-
- set(LIBDLLNAME "${LIBPREFIX}.dll")
- set(LIBSONAME "${LIBNAME}.${LIBSUFFIX}.so")
- set(LIBDYNNAME "${LIBNAME}.${LIBSUFFIX}.dylib")
- set(LIBDEFNAME "${LIBNAME}.${LIBSUFFIX}.def")
- set(LIBEXPNAME "${LIBNAME}.${LIBSUFFIX}.exp")
- set(LIBZIPNAME "${LIBNAME}.${LIBSUFFIX}.zip")
-
- set(LIBS "${PROJECT_SOURCE_DIR}/${LIBNAME}")
- set(LIBS_P "${PROJECT_SOURCE_DIR}/${LIBNAME_P}")
-
-
- set(LIB_COMPONENTS BLAS)
- if (NOT NO_CBLAS)
- set(LIB_COMPONENTS "${LIB_COMPONENTS} CBLAS")
- endif ()
-
- if (NOT NO_LAPACK)
- set(LIB_COMPONENTS "${LIB_COMPONENTS} LAPACK")
- if (NOT NO_LAPACKE)
- set(LIB_COMPONENTS "${LIB_COMPONENTS} LAPACKE")
- endif ()
- if (BUILD_RELAPACK)
- set(LIB_COMPONENTS "${LIB_COMPONENTS} ReLAPACK")
- endif ()
- endif ()
-
- if (ONLY_CBLAS)
- set(LIB_COMPONENTS CBLAS)
- endif ()
-
-
- # For GEMM3M
- set(USE_GEMM3M 0)
-
- if (DEFINED ARCH)
- if (X86 OR X86_64 OR ${ARCH} STREQUAL "ia64" OR MIPS64)
- set(USE_GEMM3M 1)
- endif ()
-
- if (${CORE} STREQUAL "generic")
- set(USE_GEMM3M 0)
- endif ()
- endif ()
-
-
- #export OSNAME
- #export ARCH
- #export CORE
- #export LIBCORE
- #export PGCPATH
- #export CONFIG
- #export CC
- #export FC
- #export BU
- #export FU
- #export NEED2UNDERSCORES
- #export USE_THREAD
- #export NUM_THREADS
- #export NUM_CORES
- #export SMP
- #export MAKEFILE_RULE
- #export NEED_PIC
- #export BINARY
- #export BINARY32
- #export BINARY64
- #export F_COMPILER
- #export C_COMPILER
- #export USE_OPENMP
- #export CROSS
- #export CROSS_SUFFIX
- #export NOFORTRAN
- #export NO_FBLAS
- #export EXTRALIB
- #export CEXTRALIB
- #export FEXTRALIB
- #export HAVE_SSE
- #export HAVE_SSE2
- #export HAVE_SSE3
- #export HAVE_SSSE3
- #export HAVE_SSE4_1
- #export HAVE_SSE4_2
- #export HAVE_SSE4A
- #export HAVE_SSE5
- #export HAVE_AVX
- #export HAVE_VFP
- #export HAVE_VFPV3
- #export HAVE_VFPV4
- #export HAVE_NEON
- #export KERNELDIR
- #export FUNCTION_PROFILE
- #export TARGET_CORE
- #
- #export SBGEMM_UNROLL_M
- #export SBGEMM_UNROLL_N
- #export SGEMM_UNROLL_M
- #export SGEMM_UNROLL_N
- #export DGEMM_UNROLL_M
- #export DGEMM_UNROLL_N
- #export QGEMM_UNROLL_M
- #export QGEMM_UNROLL_N
- #export CGEMM_UNROLL_M
- #export CGEMM_UNROLL_N
- #export ZGEMM_UNROLL_M
- #export ZGEMM_UNROLL_N
- #export XGEMM_UNROLL_M
- #export XGEMM_UNROLL_N
- #export CGEMM3M_UNROLL_M
- #export CGEMM3M_UNROLL_N
- #export ZGEMM3M_UNROLL_M
- #export ZGEMM3M_UNROLL_N
- #export XGEMM3M_UNROLL_M
- #export XGEMM3M_UNROLL_N
-
-
- #if (USE_CUDA)
- # export CUDADIR
- # export CUCC
- # export CUFLAGS
- # export CULIB
- #endif
|