123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357 |
# check systems
# Query `uname` for the -s, -p and -m fields and store the raw output in
# UNAME_S, UNAME_P and UNAME_M. A field whose variable already holds a true
# value is not queried again, so the values can be supplied from outside.
foreach(uname_flag IN ITEMS s p m)
    string(TOUPPER "${uname_flag}" uname_key)
    if (NOT UNAME_${uname_key})
        execute_process(
            COMMAND uname -${uname_flag}
            OUTPUT_VARIABLE UNAME_${uname_key}
        )
    endif()
endforeach()
unset(uname_key)
#message(STATUS "UNAME_S: ${UNAME_S} UNAME_P: ${UNAME_P} UNAME_M: ${UNAME_M}")
# Mac OS + Arm can report x86_64
# ref: https://github.com/ggerganov/whisper.cpp/issues/66#issuecomment-1282546789
#
# When uname says Darwin but the processor string does not contain "arm",
# ask sysctl whether the hardware is ARM64 and warn if it is. The detected
# UNAME_* values are intentionally left untouched; only a warning is issued.
if (UNAME_S MATCHES "Darwin")
    if (NOT UNAME_P MATCHES "arm")
        # ERROR_QUIET: the hw.optional.arm64 key may be missing on some
        # machines, in which case sysctl complains on stderr; the empty
        # output then simply fails the check below.
        execute_process(
            COMMAND sysctl -n hw.optional.arm64
            OUTPUT_VARIABLE SYSCTL_M
            ERROR_QUIET
        )
        if (SYSCTL_M MATCHES "1")
            #set(UNAME_P "arm")
            #set(UNAME_M "arm64")
            message(WARNING "Your arch is announced as x86_64, but it seems to actually be ARM64. Not fixing that can lead to bad performance. For more info see: https://github.com/ggerganov/whisper.cpp/issues/66#issuecomment-1282546789")
        endif()
    endif()
endif()
# Choose CPU-specific C compiler flags.
#
# The processor family comes from CMAKE_SYSTEM_PROCESSOR. For the x86
# fallback the available instruction-set extensions are probed on the
# machine that runs CMake (sysctl on Darwin, /proc/cpuinfo on Linux,
# sysinfo on Haiku); MSVC relies on the GGML_AVX* options instead, and any
# other environment gets a fixed FMA/F16C/AVX/AVX2 flag set.
#
# CMAKE_SYSTEM_PROCESSOR is referenced by name (not as ${...}) so that an
# empty value evaluates to "no match" instead of producing a malformed if().
if (CMAKE_SYSTEM_PROCESSOR MATCHES "arm|aarch64")
    message(STATUS "ARM detected")
    #set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mcpu=apple-m1")
elseif (CMAKE_SYSTEM_PROCESSOR MATCHES "ppc64")
    # "ppc64" also matches "ppc64le"
    message(STATUS "PPC64 detected")
    set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mpower9-vector")
else()
    message(STATUS "x86 detected")
    #set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mavx -mavx2 -mfma -mf16c")
    if (UNAME_S MATCHES "Darwin")
        # AVX1.0 and FMA are looked up in machdep.cpu.features,
        # AVX2 in machdep.cpu.leaf7_features.
        execute_process(COMMAND sysctl machdep.cpu.features OUTPUT_VARIABLE AVX1_M)
        if (AVX1_M MATCHES "AVX1.0")
            set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mavx")
        endif()
        execute_process(COMMAND sysctl machdep.cpu.leaf7_features OUTPUT_VARIABLE AVX2_M)
        if (AVX2_M MATCHES "AVX2")
            set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mavx2")
        endif()
        if (AVX1_M MATCHES "FMA")
            set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mfma")
        endif()
        # F16C is enabled without a probe on Darwin
        set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mf16c")
    elseif (UNAME_S MATCHES "Linux")
        message(STATUS "Linux detected")
        # Each grep pattern ends with a space so that e.g. "avx " does not
        # also hit "avx2".
        execute_process(COMMAND grep "avx " /proc/cpuinfo OUTPUT_VARIABLE AVX1_M)
        if (AVX1_M MATCHES "avx")
            set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mavx")
        endif()
        execute_process(COMMAND grep "avx2 " /proc/cpuinfo OUTPUT_VARIABLE AVX2_M)
        if (AVX2_M MATCHES "avx2")
            set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mavx2")
        endif()
        execute_process(COMMAND grep "fma " /proc/cpuinfo OUTPUT_VARIABLE FMA_M)
        if (FMA_M MATCHES "fma")
            set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mfma")
        endif()
        execute_process(COMMAND grep "f16c " /proc/cpuinfo OUTPUT_VARIABLE F16C_M)
        if (F16C_M MATCHES "f16c")
            set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mf16c")
        endif()
        execute_process(COMMAND grep "sse3 " /proc/cpuinfo OUTPUT_VARIABLE SSE3_M)
        if (SSE3_M MATCHES "sse3")
            set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -msse3")
        endif()
    elseif (UNAME_S MATCHES "Haiku")
        message(STATUS "Haiku detected")
        # grep filters the sysinfo output for upper-case feature names, so
        # the MATCHES patterns must be upper-case too (MATCHES is
        # case-sensitive; lower-case patterns would never match).
        execute_process(COMMAND sysinfo -cpu COMMAND grep "AVX " OUTPUT_VARIABLE AVX1_M)
        if (AVX1_M MATCHES "AVX")
            set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mavx")
        endif()
        execute_process(COMMAND sysinfo -cpu COMMAND grep "AVX2 " OUTPUT_VARIABLE AVX2_M)
        if (AVX2_M MATCHES "AVX2")
            set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mavx2")
        endif()
        execute_process(COMMAND sysinfo -cpu COMMAND grep "FMA " OUTPUT_VARIABLE FMA_M)
        if (FMA_M MATCHES "FMA")
            set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mfma")
        endif()
        execute_process(COMMAND sysinfo -cpu COMMAND grep "F16C " OUTPUT_VARIABLE F16C_M)
        if (F16C_M MATCHES "F16C")
            set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mf16c")
        endif()
    elseif (MSVC)
        if (GGML_AVX512)
            set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} /arch:AVX512")
            # MSVC has no compile-time flags that enable specific AVX512
            # extensions, nor does it define the macros corresponding to
            # those extensions, so define them manually.
            if (GGML_AVX512_VBMI)
                add_compile_definitions(__AVX512VBMI__)
            endif()
            if (GGML_AVX512_VNNI)
                add_compile_definitions(__AVX512VNNI__)
            endif()
        elseif (GGML_AVX2)
            set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} /arch:AVX2")
        elseif (GGML_AVX)
            set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} /arch:AVX")
        endif()
    else()
        # Unknown environment: no probing, enable the full flag set
        set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mfma -mf16c -mavx -mavx2")
    endif()
endif()
# Apple platforms: pull in the Accelerate framework unless GGML_NO_ACCELERATE
# is set. On success the framework is added to GGML_EXTRA_LIBS and
# -DGGML_USE_ACCELERATE to GGML_EXTRA_FLAGS; otherwise only a warning is shown.
if (APPLE AND NOT GGML_NO_ACCELERATE)
    find_library(ACCELERATE_FRAMEWORK Accelerate)
    if (NOT ACCELERATE_FRAMEWORK)
        message(WARNING "Accelerate framework not found")
    else()
        message(STATUS "Accelerate framework found")
        set(GGML_EXTRA_LIBS
            ${GGML_EXTRA_LIBS}
            ${ACCELERATE_FRAMEWORK}
        )
        set(GGML_EXTRA_FLAGS
            ${GGML_EXTRA_FLAGS}
            -DGGML_USE_ACCELERATE
        )
    endif()
endif()
# Optional OpenBLAS support (enabled with GGML_OPENBLAS).
# Looks for cblas.h and the openblas library. When the library is found it
# is added to GGML_EXTRA_LIBS and -DGGML_USE_OPENBLAS to GGML_EXTRA_FLAGS;
# the header directory goes into GGML_EXTRA_INCS only if it was located.
if (GGML_OPENBLAS)
    set(OPENBLAS_INCLUDE_SEARCH_PATHS
        /usr/include
        /usr/include/openblas
        /usr/include/openblas-base
        /usr/local/include
        /usr/local/include/openblas
        /usr/local/include/openblas-base
        /opt/OpenBLAS/include
    )
    # Only consult OpenBLAS_HOME when it is set; otherwise the second entry
    # would degrade to the bogus path "/include".
    if (NOT "$ENV{OpenBLAS_HOME}" STREQUAL "")
        set(OPENBLAS_INCLUDE_SEARCH_PATHS
            ${OPENBLAS_INCLUDE_SEARCH_PATHS}
            $ENV{OpenBLAS_HOME}
            $ENV{OpenBLAS_HOME}/include
        )
    endif()
    find_path(OPENBLAS_INC NAMES cblas.h PATHS ${OPENBLAS_INCLUDE_SEARCH_PATHS})
    find_library(OPENBLAS_LIB NAMES openblas libopenblas)
    if (OPENBLAS_LIB)
        message(STATUS "OpenBLAS found")
        set(GGML_EXTRA_LIBS ${GGML_EXTRA_LIBS} ${OPENBLAS_LIB})
        if (OPENBLAS_INC)
            set(GGML_EXTRA_INCS ${GGML_EXTRA_INCS} ${OPENBLAS_INC})
        else()
            # Do not leak "OPENBLAS_INC-NOTFOUND" into the include list
            message(WARNING "OpenBLAS library found, but cblas.h was not found in the search paths")
        endif()
        set(GGML_EXTRA_FLAGS ${GGML_EXTRA_FLAGS} -DGGML_USE_OPENBLAS)
    else()
        message(WARNING "OpenBLAS not found")
    endif()
endif()
# Pass -UNDEBUG to the compiler so that asserts are not disabled in the tests
add_definitions(-UNDEBUG)

#
# test-vec0
#   executable: test-vec0.c linked against ggml (not registered with CTest)
set(TEST_TARGET test-vec0)
add_executable(${TEST_TARGET} "${TEST_TARGET}.c")
target_link_libraries(${TEST_TARGET}
    PRIVATE ggml
)
#
# test-vec1 (x86)
#   executable: test-vec1.c linked against ggml (not registered with CTest)
#   Built only when CMAKE_SYSTEM_PROCESSOR contains "x86". The variable is
#   referenced by name so an empty value means "no match" rather than a
#   malformed if() expression.
if (CMAKE_SYSTEM_PROCESSOR MATCHES "x86")
    set(TEST_TARGET test-vec1)
    add_executable(${TEST_TARGET} ${TEST_TARGET}.c)
    target_link_libraries(${TEST_TARGET} PRIVATE ggml)
endif()
#
# test-vec2 (arm)
#   executable: test-vec2.c linked against ggml (not registered with CTest)
#   Built only when CMAKE_SYSTEM_PROCESSOR contains "arm". The variable is
#   referenced by name so an empty value means "no match" rather than a
#   malformed if() expression.
if (CMAKE_SYSTEM_PROCESSOR MATCHES "arm")
    set(TEST_TARGET test-vec2)
    add_executable(${TEST_TARGET} ${TEST_TARGET}.c)
    target_link_libraries(${TEST_TARGET} PRIVATE ggml)
endif()
#
# test-grad0
#   executable: test-grad0.cpp linked against ggml
#   ctest:      runs the binary with LLVM_PROFILE_FILE=test-grad0.profraw
set(TEST_TARGET test-grad0)
add_executable(${TEST_TARGET} "${TEST_TARGET}.cpp")
target_link_libraries(${TEST_TARGET}
    PRIVATE ggml
)
add_test(
    NAME    ${TEST_TARGET}
    COMMAND $<TARGET_FILE:${TEST_TARGET}>
)
set_tests_properties(${TEST_TARGET} PROPERTIES
    ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw"
)
#
# test-opt
#   executable: test-opt.cpp linked against ggml
#   ctest:      runs the binary with LLVM_PROFILE_FILE=test-opt.profraw
set(TEST_TARGET test-opt)
add_executable(${TEST_TARGET} "${TEST_TARGET}.cpp")
target_link_libraries(${TEST_TARGET}
    PRIVATE ggml
)
add_test(
    NAME    ${TEST_TARGET}
    COMMAND $<TARGET_FILE:${TEST_TARGET}>
)
set_tests_properties(${TEST_TARGET} PROPERTIES
    ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw"
)
#
# test-quantize-fns
#   executable: test-quantize-fns.cpp linked against ggml
#   ctest:      runs the binary with LLVM_PROFILE_FILE=test-quantize-fns.profraw
set(TEST_TARGET test-quantize-fns)
add_executable(${TEST_TARGET} "${TEST_TARGET}.cpp")
target_link_libraries(${TEST_TARGET}
    PRIVATE ggml
)
add_test(
    NAME    ${TEST_TARGET}
    COMMAND $<TARGET_FILE:${TEST_TARGET}>
)
set_tests_properties(${TEST_TARGET} PROPERTIES
    ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw"
)
#
# test-quantize-perf
#   executable: test-quantize-perf.cpp linked against ggml
#   ctest:      runs the binary with LLVM_PROFILE_FILE=test-quantize-perf.profraw
set(TEST_TARGET test-quantize-perf)
add_executable(${TEST_TARGET} "${TEST_TARGET}.cpp")
target_link_libraries(${TEST_TARGET}
    PRIVATE ggml
)
add_test(
    NAME    ${TEST_TARGET}
    COMMAND $<TARGET_FILE:${TEST_TARGET}>
)
set_tests_properties(${TEST_TARGET} PROPERTIES
    ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw"
)
#
# test-mul-mat0
#   executable: test-mul-mat0.c linked against ggml plus GGML_EXTRA_LIBS,
#               compiled with GGML_EXTRA_FLAGS
#   ctest:      runs the binary with LLVM_PROFILE_FILE=test-mul-mat0.profraw
set(TEST_TARGET test-mul-mat0)
add_executable(${TEST_TARGET} "${TEST_TARGET}.c")
target_link_libraries(${TEST_TARGET}
    PRIVATE ggml ${GGML_EXTRA_LIBS}
)
target_compile_options(${TEST_TARGET}
    PRIVATE ${GGML_EXTRA_FLAGS}
)
if (MSVC)
    # MSVC only: linker stack option, 8388608 bytes = 8MB
    target_link_options(${TEST_TARGET} PRIVATE "/STACK: 8388608")
endif()
add_test(
    NAME    ${TEST_TARGET}
    COMMAND $<TARGET_FILE:${TEST_TARGET}>
)
set_tests_properties(${TEST_TARGET} PROPERTIES
    ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw"
)
#
# test-mul-mat1 (arm)
#   executable: test-mul-mat1.c linked against ggml plus GGML_EXTRA_LIBS,
#               compiled with GGML_EXTRA_FLAGS (not registered with CTest)
#   Built only when CMAKE_SYSTEM_PROCESSOR contains "arm" and
#   GGML_NO_ACCELERATE is not set. The processor variable is referenced by
#   name so an empty value means "no match" rather than a malformed if().
if (CMAKE_SYSTEM_PROCESSOR MATCHES "arm" AND NOT GGML_NO_ACCELERATE)
    set(TEST_TARGET test-mul-mat1)
    add_executable(${TEST_TARGET} ${TEST_TARGET}.c)
    target_link_libraries(${TEST_TARGET} PRIVATE ggml ${GGML_EXTRA_LIBS})
    target_compile_options(${TEST_TARGET} PRIVATE ${GGML_EXTRA_FLAGS})
endif()
#
# test-blas0 (arm)
#   executable: test-blas0.c linked against ggml plus GGML_EXTRA_LIBS,
#               compiled with GGML_EXTRA_FLAGS
#   ctest:      runs the binary with the arguments "128 128 128" and
#               LLVM_PROFILE_FILE=test-blas0.profraw
#   Built only when CMAKE_SYSTEM_PROCESSOR contains "arm" and
#   GGML_NO_ACCELERATE is not set. The processor variable is referenced by
#   name so an empty value means "no match" rather than a malformed if().
if (CMAKE_SYSTEM_PROCESSOR MATCHES "arm" AND NOT GGML_NO_ACCELERATE)
    set(TEST_TARGET test-blas0)
    add_executable(${TEST_TARGET} ${TEST_TARGET}.c)
    target_link_libraries(${TEST_TARGET} PRIVATE ggml ${GGML_EXTRA_LIBS})
    target_compile_options(${TEST_TARGET} PRIVATE ${GGML_EXTRA_FLAGS})
    add_test(NAME ${TEST_TARGET} COMMAND $<TARGET_FILE:${TEST_TARGET}> 128 128 128)
    set_property(TEST ${TEST_TARGET} PROPERTY ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw")
endif()
#
# test-mul-mat2
#   executable: test-mul-mat2.c linked against ggml
#   ctest:      runs the binary with LLVM_PROFILE_FILE=test-mul-mat2.profraw
set(TEST_TARGET test-mul-mat2)
add_executable(${TEST_TARGET} "${TEST_TARGET}.c")
target_link_libraries(${TEST_TARGET}
    PRIVATE ggml
)
add_test(
    NAME    ${TEST_TARGET}
    COMMAND $<TARGET_FILE:${TEST_TARGET}>
)
set_tests_properties(${TEST_TARGET} PROPERTIES
    ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw"
)
#
# test0
#   executable: test0.c linked against ggml
#   ctest:      runs the binary with LLVM_PROFILE_FILE=test0.profraw
set(TEST_TARGET test0)
add_executable(${TEST_TARGET} "${TEST_TARGET}.c")
target_link_libraries(${TEST_TARGET}
    PRIVATE ggml
)
add_test(
    NAME    ${TEST_TARGET}
    COMMAND $<TARGET_FILE:${TEST_TARGET}>
)
set_tests_properties(${TEST_TARGET} PROPERTIES
    ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw"
)
#
# test1
#   executable: test1.c linked against ggml
#   ctest:      runs the binary with LLVM_PROFILE_FILE=test1.profraw
set(TEST_TARGET test1)
add_executable(${TEST_TARGET} "${TEST_TARGET}.c")
target_link_libraries(${TEST_TARGET}
    PRIVATE ggml
)
if (MSVC)
    # MSVC only: linker stack option, 8388608 bytes = 8MB
    target_link_options(${TEST_TARGET} PRIVATE "/STACK: 8388608")
endif()
add_test(
    NAME    ${TEST_TARGET}
    COMMAND $<TARGET_FILE:${TEST_TARGET}>
)
set_tests_properties(${TEST_TARGET} PROPERTIES
    ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw"
)
#
# test2
#   executable: test2.c linked against ggml
#   ctest:      runs the binary with LLVM_PROFILE_FILE=test2.profraw
set(TEST_TARGET test2)
add_executable(${TEST_TARGET} "${TEST_TARGET}.c")
target_link_libraries(${TEST_TARGET}
    PRIVATE ggml
)
add_test(
    NAME    ${TEST_TARGET}
    COMMAND $<TARGET_FILE:${TEST_TARGET}>
)
set_tests_properties(${TEST_TARGET} PROPERTIES
    ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw"
)
#
# test3
#   executable: test3.c linked against ggml
#   ctest:      runs the binary with LLVM_PROFILE_FILE=test3.profraw
set(TEST_TARGET test3)
add_executable(${TEST_TARGET} "${TEST_TARGET}.c")
target_link_libraries(${TEST_TARGET}
    PRIVATE ggml
)
add_test(
    NAME    ${TEST_TARGET}
    COMMAND $<TARGET_FILE:${TEST_TARGET}>
)
set_tests_properties(${TEST_TARGET} PROPERTIES
    ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw"
)
#
# test-pool
#   executable: test-pool.c linked against ggml
#   ctest:      runs the binary with LLVM_PROFILE_FILE=test-pool.profraw
set(TEST_TARGET test-pool)
add_executable(${TEST_TARGET} "${TEST_TARGET}.c")
target_link_libraries(${TEST_TARGET}
    PRIVATE ggml
)
if (MSVC)
    # MSVC only: linker stack option, 8388608 bytes = 8MB
    target_link_options(${TEST_TARGET} PRIVATE "/STACK: 8388608")
endif()
add_test(
    NAME    ${TEST_TARGET}
    COMMAND $<TARGET_FILE:${TEST_TARGET}>
)
set_tests_properties(${TEST_TARGET} PROPERTIES
    ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw"
)
#
# test-conv-transpose
#   executable: test-conv-transpose.c linked against ggml
#   ctest:      runs the binary with
#               LLVM_PROFILE_FILE=test-conv-transpose.profraw, matching the
#               per-test profile file used by the other registered tests
set(TEST_TARGET test-conv-transpose)
add_executable(${TEST_TARGET} ${TEST_TARGET}.c)
target_link_libraries(${TEST_TARGET} PRIVATE ggml)
add_test(NAME ${TEST_TARGET} COMMAND $<TARGET_FILE:${TEST_TARGET}>)
set_property(TEST ${TEST_TARGET} PROPERTY ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw")
#
# test-rel-pos
#   executable: test-rel-pos.c linked against ggml
#   ctest:      runs the binary with LLVM_PROFILE_FILE=test-rel-pos.profraw,
#               matching the per-test profile file used by the other
#               registered tests
set(TEST_TARGET test-rel-pos)
add_executable(${TEST_TARGET} ${TEST_TARGET}.c)
target_link_libraries(${TEST_TARGET} PRIVATE ggml)
add_test(NAME ${TEST_TARGET} COMMAND $<TARGET_FILE:${TEST_TARGET}>)
set_property(TEST ${TEST_TARGET} PROPERTY ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw")
#
# test-svd0 (arm/x86)
#   executable: test-svd0.c linked against ggml plus GGML_EXTRA_LIBS,
#               compiled with GGML_EXTRA_FLAGS (not registered with CTest)
#   Built in either of two configurations:
#     - processor contains "arm" and GGML_NO_ACCELERATE is not set
#     - processor contains "x86" and GGML_OPENBLAS is set
#   Both configurations build the target identically, so they share one
#   body. CMAKE_SYSTEM_PROCESSOR is referenced by name so an empty value
#   means "no match" rather than a malformed if().
if ((CMAKE_SYSTEM_PROCESSOR MATCHES "arm" AND NOT GGML_NO_ACCELERATE) OR
    (CMAKE_SYSTEM_PROCESSOR MATCHES "x86" AND GGML_OPENBLAS))
    set(TEST_TARGET test-svd0)
    add_executable(${TEST_TARGET} ${TEST_TARGET}.c)
    target_link_libraries(${TEST_TARGET} PRIVATE ggml ${GGML_EXTRA_LIBS})
    target_compile_options(${TEST_TARGET} PRIVATE ${GGML_EXTRA_FLAGS})
endif()
#
# test-customop
#   executable: test-customop.c linked against ggml
#   ctest:      runs the binary with LLVM_PROFILE_FILE=test-customop.profraw
set(TEST_TARGET test-customop)
add_executable(${TEST_TARGET} "${TEST_TARGET}.c")
target_link_libraries(${TEST_TARGET}
    PRIVATE ggml
)
if (MSVC)
    # MSVC only: linker stack option, 8388608 bytes = 8MB
    target_link_options(${TEST_TARGET} PRIVATE "/STACK: 8388608")
endif()
add_test(
    NAME    ${TEST_TARGET}
    COMMAND $<TARGET_FILE:${TEST_TARGET}>
)
set_tests_properties(${TEST_TARGET} PROPERTIES
    ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw"
)
#
# test-xpos
#   executable: test-xpos.c linked against ggml
#   ctest:      runs the binary with LLVM_PROFILE_FILE=test-xpos.profraw
set(TEST_TARGET test-xpos)
add_executable(${TEST_TARGET} "${TEST_TARGET}.c")
target_link_libraries(${TEST_TARGET}
    PRIVATE ggml
)
add_test(
    NAME    ${TEST_TARGET}
    COMMAND $<TARGET_FILE:${TEST_TARGET}>
)
set_tests_properties(${TEST_TARGET} PROPERTIES
    ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw"
)
|