CMakeLists.txt 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404
  # Optional extra diagnostics, enabled with GGML_ALL_WARNINGS.
  # Only GCC/Clang-style flags are provided; nothing is added for MSVC yet
  # (todo : windows).
  if (GGML_ALL_WARNINGS AND NOT MSVC)
      # warnings applied to every compiled language
      add_compile_options(
          -Wunused
          -Wextra
          -Wcast-qual
          -Wdouble-promotion
      )
      # warnings applied to C sources only
      add_compile_options("$<$<COMPILE_LANGUAGE:C>:-Wshadow;-Wno-unused-function;-Wmissing-prototypes>")
  endif()

  # compiler flags
  # Placeholder for non-MSVC compilers: the relaxed floating-point flags below
  # are currently disabled.
  if (NOT MSVC)
      #set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -fno-math-errno -ffinite-math-only -funsafe-math-optimizations")
  endif()
  message(STATUS "CMAKE_SYSTEM_PROCESSOR: ${CMAKE_SYSTEM_PROCESSOR}")

  # Fill UNAME_S / UNAME_P / UNAME_M from `uname -s|-p|-m` unless the caller
  # already provided a value. The raw command output is stored unmodified;
  # later checks only use MATCHES against it.
  foreach (uname_flag s p m)
      string(TOUPPER "${uname_flag}" uname_suffix)
      if (NOT UNAME_${uname_suffix})
          execute_process(COMMAND uname -${uname_flag} OUTPUT_VARIABLE UNAME_${uname_suffix})
      endif()
  endforeach()
  unset(uname_suffix)

  #message(STATUS "UNAME_S: ${UNAME_S} UNAME_P: ${UNAME_P} UNAME_M: ${UNAME_M}")
  # this version of Apple ld64 is buggy
  #
  # Invoke the C compiler driver with `-Wl,-v` and capture what it prints on
  # stderr. If that text identifies linker build "dyld-1015.7", define
  # HAVE_BUGGY_APPLE_LINKER for everything compiled from this directory.
  execute_process(
      COMMAND ${CMAKE_C_COMPILER} ${CMAKE_EXE_LINKER_FLAGS} -Wl,-v
      ERROR_VARIABLE output
  )

  # The backslash must be doubled: inside a quoted CMake argument "\." is an
  # identity escape that collapses to ".", which the regex engine would then
  # treat as "any character" instead of a literal dot.
  if (output MATCHES "dyld-1015\\.7")
      add_compile_definitions(HAVE_BUGGY_APPLE_LINKER)
  endif()
  # Mac OS + Arm can report x86_64
  # ref: https://github.com/ggerganov/whisper.cpp/issues/66#issuecomment-1282546789
  #
  # When uname reports Darwin with a non-ARM processor, ask sysctl whether the
  # hardware advertises arm64 support. The detected values are NOT overridden
  # (the set() calls are left disabled); the user is only warned.
  if (UNAME_S MATCHES "Darwin")
      if (NOT UNAME_P MATCHES "arm")
          execute_process(COMMAND sysctl -n hw.optional.arm64 OUTPUT_VARIABLE SYSCTL_M)
          if (SYSCTL_M MATCHES "1")
              #set(UNAME_P "arm")
              #set(UNAME_M "arm64")
              # The link matches the reference above (the previous text had a stray '#'
              # inside the fragment, which produced a broken anchor).
              message(WARNING "Your arch is announced as x86_64, but it seems to actually be ARM64. Not fixing that can lead to bad performance. For more info see: https://github.com/ggerganov/whisper.cpp/issues/66#issuecomment-1282546789")
          endif()
      endif()
  endif()
  # Select architecture-specific C compiler flags.
  #
  #   Emscripten : nothing added
  #   ARM        : nothing added
  #   PPC64      : -mpower9-vector
  #   otherwise  : treated as x86; SIMD flags are chosen per host OS:
  #       Darwin : queried through sysctl (-mf16c is always added)
  #       Linux  : queried through /proc/cpuinfo
  #       Haiku  : queried through `sysinfo -cpu`
  #       MSVC   : driven by the GGML_AVX512 / GGML_AVX2 / GGML_AVX options
  #       other  : -mfma -mf16c -mavx -mavx2 are all enabled
  #
  # The variable expansions in the conditions are quoted so that an empty
  # CMAKE_SYSTEM_NAME / CMAKE_SYSTEM_PROCESSOR cannot produce a malformed if().
  if ("${CMAKE_SYSTEM_NAME}" STREQUAL "Emscripten")
      message(STATUS "Emscripten detected")
  elseif ("${CMAKE_SYSTEM_PROCESSOR}" MATCHES "arm" OR "${CMAKE_SYSTEM_PROCESSOR}" MATCHES "aarch64")
      message(STATUS "ARM detected")
      #set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mcpu=apple-m1")
  elseif ("${CMAKE_SYSTEM_PROCESSOR}" MATCHES "ppc64le" OR "${CMAKE_SYSTEM_PROCESSOR}" MATCHES "ppc64")
      message(STATUS "PPC64 detected")
      set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mpower9-vector")
  else()
      message(STATUS "x86 detected")
      #set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mavx -mavx2 -mfma -mf16c")
      if (UNAME_S MATCHES "Darwin")
          # AVX1 and FMA are looked up in machdep.cpu.features
          execute_process(COMMAND sysctl machdep.cpu.features OUTPUT_VARIABLE AVX1_M)
          if (AVX1_M MATCHES "AVX1.0")
              set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mavx")
          endif()
          # AVX2 is looked up in machdep.cpu.leaf7_features
          execute_process(COMMAND sysctl machdep.cpu.leaf7_features OUTPUT_VARIABLE AVX2_M)
          if (AVX2_M MATCHES "AVX2")
              set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mavx2")
          endif()
          if (AVX1_M MATCHES "FMA")
              set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mfma")
          endif()
          # F16C is enabled without probing
          set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mf16c")
      elseif (UNAME_S MATCHES "Linux")
          message(STATUS "Linux detected")
          # Each feature is probed by grepping /proc/cpuinfo for "<name> ".
          execute_process(COMMAND grep "avx " /proc/cpuinfo OUTPUT_VARIABLE AVX1_M)
          if (AVX1_M MATCHES "avx")
              set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mavx")
          endif()
          execute_process(COMMAND grep "avx2 " /proc/cpuinfo OUTPUT_VARIABLE AVX2_M)
          if (AVX2_M MATCHES "avx2")
              set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mavx2")
          endif()
          execute_process(COMMAND grep "fma " /proc/cpuinfo OUTPUT_VARIABLE FMA_M)
          if (FMA_M MATCHES "fma")
              set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mfma")
          endif()
          execute_process(COMMAND grep "f16c " /proc/cpuinfo OUTPUT_VARIABLE F16C_M)
          if (F16C_M MATCHES "f16c")
              set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mf16c")
          endif()
          execute_process(COMMAND grep "sse3 " /proc/cpuinfo OUTPUT_VARIABLE SSE3_M)
          if (SSE3_M MATCHES "sse3")
              set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -msse3")
          endif()
      elseif (UNAME_S MATCHES "Haiku")
          message(STATUS "Haiku detected")
          # `sysinfo -cpu` is piped through grep with UPPERCASE feature names, so
          # the captured text must be matched in uppercase as well. MATCHES is
          # case-sensitive; the former lowercase patterns could not match the
          # grepped text and the flags were never enabled on Haiku.
          execute_process(COMMAND sysinfo -cpu COMMAND grep "AVX " OUTPUT_VARIABLE AVX1_M)
          if (AVX1_M MATCHES "AVX")
              set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mavx")
          endif()
          execute_process(COMMAND sysinfo -cpu COMMAND grep "AVX2 " OUTPUT_VARIABLE AVX2_M)
          if (AVX2_M MATCHES "AVX2")
              set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mavx2")
          endif()
          execute_process(COMMAND sysinfo -cpu COMMAND grep "FMA " OUTPUT_VARIABLE FMA_M)
          if (FMA_M MATCHES "FMA")
              set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mfma")
          endif()
          execute_process(COMMAND sysinfo -cpu COMMAND grep "F16C " OUTPUT_VARIABLE F16C_M)
          if (F16C_M MATCHES "F16C")
              set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mf16c")
          endif()
      elseif (MSVC)
          if (GGML_AVX512)
              set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} /arch:AVX512")
              # MSVC has no compile-time flags enabling specific
              # AVX512 extensions, nor does it define the
              # macros corresponding to the extensions.
              # Do it manually.
              if (GGML_AVX512_VBMI)
                  add_compile_definitions(__AVX512VBMI__)
              endif()
              if (GGML_AVX512_VNNI)
                  add_compile_definitions(__AVX512VNNI__)
              endif()
          elseif (GGML_AVX2)
              set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} /arch:AVX2")
          elseif (GGML_AVX)
              set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} /arch:AVX")
          endif()
      else()
          # unknown host OS: enable the full x86 SIMD set without probing
          set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mfma -mf16c -mavx -mavx2")
      endif()
  endif()
  # ggml

  # Name of the library target configured by the rest of this file.
  set(TARGET ggml)

  # on APPLE - include Accelerate framework
  # (can be opted out of with GGML_NO_ACCELERATE)
  if (APPLE AND NOT GGML_NO_ACCELERATE)
      find_library(ACCELERATE_FRAMEWORK Accelerate)

      if (NOT ACCELERATE_FRAMEWORK)
          message(WARNING "Accelerate framework not found")
      else()
          message(STATUS "Accelerate framework found")

          # link the framework and advertise it to the sources
          list(APPEND GGML_EXTRA_LIBS  ${ACCELERATE_FRAMEWORK})
          list(APPEND GGML_EXTRA_FLAGS -DGGML_USE_ACCELERATE)
      endif()
  endif()
  # Optional OpenBLAS backend (GGML_OPENBLAS).
  #
  # Looks for cblas.h in a set of well-known include directories (plus
  # $OpenBLAS_HOME from the environment) and for the openblas library. On
  # success the library, include directory and -DGGML_USE_OPENBLAS are appended
  # to the GGML_EXTRA_* lists that are attached to the target later in this file.
  if (GGML_OPENBLAS)
      set(OPENBLAS_INCLUDE_SEARCH_PATHS
          /usr/include
          /usr/include/openblas
          /usr/include/openblas-base
          /usr/local/include
          /usr/local/include/openblas
          /usr/local/include/openblas-base
          /opt/OpenBLAS/include
          $ENV{OpenBLAS_HOME}
          $ENV{OpenBLAS_HOME}/include
      )
      find_path(OPENBLAS_INC NAMES cblas.h PATHS ${OPENBLAS_INCLUDE_SEARCH_PATHS})
      find_library(OPENBLAS_LIB NAMES openblas libopenblas)

      # Require the header as well as the library (same policy as the CLBlast
      # check in this file). Otherwise "OPENBLAS_INC-NOTFOUND" would be appended
      # to the include directories when only the library is present.
      if (OPENBLAS_LIB AND OPENBLAS_INC)
          message(STATUS "OpenBLAS found")

          set(GGML_EXTRA_LIBS  ${GGML_EXTRA_LIBS}  ${OPENBLAS_LIB})
          set(GGML_EXTRA_INCS  ${GGML_EXTRA_INCS}  ${OPENBLAS_INC})
          set(GGML_EXTRA_FLAGS ${GGML_EXTRA_FLAGS} -DGGML_USE_OPENBLAS)
      else()
          message(WARNING "OpenBLAS not found")
      endif()
  endif()
  # Optional CLBlast (OpenCL) backend (GGML_CLBLAST).
  # Needs the clblast.h header, the clblast library and the OpenCL library;
  # if any of the three is missing only a warning is printed.
  if (GGML_CLBLAST)
      set(CLBLAST_INCLUDE_SEARCH_PATHS
          /usr/include
          /usr/local/include
          $ENV{CLBLAST_HOME}
          $ENV{CLBLAST_HOME}/include
      )

      find_path(CLBLAST_INC NAMES clblast.h PATHS ${CLBLAST_INCLUDE_SEARCH_PATHS})
      find_library(CLBLAST_LIB NAMES clblast)
      find_library(OPENCL_LIB NAMES OpenCL)

      if (NOT (CLBLAST_LIB AND OPENCL_LIB AND CLBLAST_INC))
          message(WARNING "clBLAST not found")
      else()
          message(STATUS "clBLAST found")

          list(APPEND GGML_EXTRA_INCS  ${CLBLAST_INC})
          list(APPEND GGML_EXTRA_LIBS  ${CLBLAST_LIB} ${OPENCL_LIB})
          list(APPEND GGML_EXTRA_FLAGS -DGGML_USE_CLBLAST)

          # extra sources compiled into the library for this backend
          set(GGML_OPENCL_SOURCES ggml-opencl.cpp ggml-opencl.h)

          # directory-scoped linker option: affects targets created after this point
          link_libraries("-Wl,--copy-dt-needed-entries")
      endif()
  endif()
  # Optional CUDA / cuBLAS backend (GGML_CUBLAS).
  # When the CUDA toolkit is available this enables the CUDA language, adds the
  # CUDA sources to the library and links the cudart/cublas/cublasLt imported
  # targets (static variants when GGML_STATIC is set).
  if (GGML_CUBLAS)
      cmake_minimum_required(VERSION 3.17)

      find_package(CUDAToolkit)

      if (NOT CUDAToolkit_FOUND)
          message(WARNING "cuBLAS not found")
      else()
          message(STATUS "cuBLAS found")

          enable_language(CUDA)

          set(GGML_CUDA_SOURCES ggml-cuda.cu ggml-cuda.h)
          list(APPEND GGML_EXTRA_FLAGS -DGGML_USE_CUBLAS)

          # forward the optional kernel-selection switches as compile definitions
          foreach (cuda_switch GGML_CUDA_FORCE_DMMV GGML_CUDA_FORCE_MMQ)
              if (${cuda_switch})
                  add_compile_definitions(${cuda_switch})
              endif()
          endforeach()

          # required for dynamic parallelism
          # set(CMAKE_CUDA_SEPARABLE_COMPILATION ON)

          if (GGML_STATIC)
              list(APPEND GGML_EXTRA_LIBS CUDA::cudart_static CUDA::cublas_static CUDA::cublasLt_static)
          else()
              list(APPEND GGML_EXTRA_LIBS CUDA::cudart CUDA::cublas CUDA::cublasLt)
          endif()

          # emit line info for CUDA code in Debug builds
          if (CMAKE_BUILD_TYPE MATCHES Debug)
              string(APPEND CMAKE_CUDA_FLAGS " -lineinfo")
          endif()
      endif()
  endif()
  # Optional HIP / hipBLAS (ROCm) backend (GGML_HIPBLAS).
  #
  # Builds ggml-cuda.cu as C++ into a separate OBJECT library "ggml-rocm",
  # links it against the HIP/rocBLAS/hipBLAS imported targets and appends it to
  # GGML_EXTRA_LIBS. Static linking (GGML_STATIC) is rejected for this backend.
  if (GGML_HIPBLAS)
      list(APPEND CMAKE_PREFIX_PATH /opt/rocm)

      # The compiler IDs are quoted so an empty value (e.g. a language that is not
      # enabled) cannot turn the condition into a malformed if().
      if (NOT "${CMAKE_C_COMPILER_ID}" MATCHES "Clang")
          message(WARNING "Only LLVM is supported for HIP, hint: CC=/opt/rocm/llvm/bin/clang")
      endif()
      if (NOT "${CMAKE_CXX_COMPILER_ID}" MATCHES "Clang")
          message(WARNING "Only LLVM is supported for HIP, hint: CXX=/opt/rocm/llvm/bin/clang++")
      endif()

      find_package(hip)
      find_package(hipblas)
      find_package(rocblas)

      # Test the variables by name instead of expanding them: an unset or empty
      # *_FOUND variable then simply evaluates to false.
      if (hipblas_FOUND AND hip_FOUND)
          message(STATUS "HIP and hipBLAS found")

          set(GGML_EXTRA_FLAGS ${GGML_EXTRA_FLAGS} -DGGML_USE_CUBLAS)

          add_library(ggml-rocm OBJECT ggml-cuda.cu ggml-cuda.h)

          if (BUILD_SHARED_LIBS)
              set_target_properties(ggml-rocm PROPERTIES POSITION_INDEPENDENT_CODE ON)
          endif()

          if (GGML_CUDA_FORCE_DMMV)
              target_compile_definitions(ggml-rocm PRIVATE GGML_CUDA_FORCE_DMMV)
          endif()
          if (GGML_CUDA_FORCE_MMQ)
              target_compile_definitions(ggml-rocm PRIVATE GGML_CUDA_FORCE_MMQ)
          endif()

          # kernel tuning parameters; the GGML_CUDA_* values are not set in this
          # part of the file (presumably options declared elsewhere)
          target_compile_definitions(ggml-rocm PRIVATE GGML_CUDA_DMMV_X=${GGML_CUDA_DMMV_X})
          target_compile_definitions(ggml-rocm PRIVATE GGML_CUDA_MMV_Y=${GGML_CUDA_MMV_Y})
          target_compile_definitions(ggml-rocm PRIVATE K_QUANTS_PER_ITERATION=${GGML_CUDA_KQUANTS_ITER})

          # compile the .cu file with the C++ compiler
          set_source_files_properties(ggml-cuda.cu PROPERTIES LANGUAGE CXX)

          target_link_libraries(ggml-rocm PRIVATE hip::device PUBLIC hip::host roc::rocblas roc::hipblas)
          target_include_directories(ggml-rocm PRIVATE . ../include ../include/ggml)

          if (GGML_STATIC)
              message(FATAL_ERROR "Static linking not supported for HIP/ROCm")
          endif()

          set(GGML_EXTRA_LIBS ${GGML_EXTRA_LIBS} ggml-rocm)
      else()
          message(WARNING "hipBLAS or HIP not found. Try setting CMAKE_PREFIX_PATH=/opt/rocm")
      endif()
  endif()
  # Optional Metal backend (GGML_METAL).
  #
  # Requires the Foundation, Metal, MetalKit and MetalPerformanceShaders
  # frameworks, adds the Objective-C backend sources to the library and copies
  # the ggml-metal.metal kernel file next to the built executables.
  if (GGML_METAL)
      find_library(FOUNDATION_LIBRARY         Foundation              REQUIRED)
      find_library(METAL_FRAMEWORK            Metal                   REQUIRED)
      find_library(METALKIT_FRAMEWORK         MetalKit                REQUIRED)
      find_library(METALPERFORMANCE_FRAMEWORK MetalPerformanceShaders REQUIRED)

      set(GGML_METAL_SOURCES ggml-metal.m ggml-metal.h)

      set(GGML_EXTRA_FLAGS ${GGML_EXTRA_FLAGS} -DGGML_USE_METAL)

      #add_compile_definitions(GGML_METAL_NDEBUG)

      # get full path to the file
      #add_compile_definitions(GGML_METAL_DIR_KERNELS="${CMAKE_CURRENT_SOURCE_DIR}/")

      # copy ggml-metal.metal to bin directory
      # If CMAKE_RUNTIME_OUTPUT_DIRECTORY is not set, the destination would
      # collapse to "/ggml-metal.metal" (filesystem root); fall back to the
      # current binary directory in that case.
      if (CMAKE_RUNTIME_OUTPUT_DIRECTORY)
          set(GGML_METAL_KERNEL_OUTPUT_DIR "${CMAKE_RUNTIME_OUTPUT_DIRECTORY}")
      else()
          set(GGML_METAL_KERNEL_OUTPUT_DIR "${CMAKE_CURRENT_BINARY_DIR}")
      endif()
      configure_file(ggml-metal.metal "${GGML_METAL_KERNEL_OUTPUT_DIR}/ggml-metal.metal" COPYONLY)

      set(GGML_EXTRA_LIBS ${GGML_EXTRA_LIBS}
          ${FOUNDATION_LIBRARY}
          ${METAL_FRAMEWORK}
          ${METALKIT_FRAMEWORK}
          ${METALPERFORMANCE_FRAMEWORK}
      )
  endif()
  # GGML_PERF adds the GGML_PERF definition to the library's public definitions.
  if (GGML_PERF)
      list(APPEND GGML_EXTRA_FLAGS -DGGML_PERF)
  endif()

  # The library itself: core sources and headers, plus whichever backend
  # source lists were filled in above (empty lists contribute nothing).
  add_library(${TARGET}
      # core implementation
      ggml.c
      ggml-alloc.c
      ggml-backend.c
      ggml-quants.c
      # private headers
      ggml-impl.h
      ggml-backend-impl.h
      # public headers
      ../include/ggml/ggml.h
      ../include/ggml/ggml-alloc.h
      ../include/ggml/ggml-backend.h
      # optional backends
      ${GGML_CUDA_SOURCES}
      ${GGML_OPENCL_SOURCES}
      ${GGML_METAL_SOURCES}
  )

  # Include directories, visible to the library and to everything linking it.
  target_include_directories(${TARGET}
      PUBLIC
          .
          ../include
          ../include/ggml
          ../examples/
          ${GGML_EXTRA_INCS}
  )
  # Link dependencies. The math library "m" is linked first on every
  # toolchain except MSVC; the remaining libraries are common to all.
  if (NOT MSVC)
      target_link_libraries(${TARGET} PUBLIC m)
  endif()
  target_link_libraries(${TARGET}
      PUBLIC
          ${GGML_EXTRA_LIBS}
          ${CMAKE_THREAD_LIBS_INIT}
          kaldi-native-fbank
  )
  # Extra configuration when building shared libraries.
  if (BUILD_SHARED_LIBS)
      # NOTE(review): CMAKE_WINDOWS_EXPORT_ALL_SYMBOLS initializes the
      # WINDOWS_EXPORT_ALL_SYMBOLS property of targets at the time they are
      # created; ${TARGET} already exists at this point, so this presumably only
      # affects targets defined later - confirm this is the intent.
      set(CMAKE_WINDOWS_EXPORT_ALL_SYMBOLS ON)

      target_link_libraries(${TARGET} PUBLIC ${CMAKE_DL_LIBS})

      # GGML_SHARED is propagated to consumers; GGML_BUILD is only defined
      # while compiling the library itself.
      target_compile_definitions(${TARGET}
          PUBLIC  GGML_SHARED
          PRIVATE GGML_BUILD
      )

      # register the Metal kernel file as a resource of the library
      if (GGML_METAL)
          set_target_properties(${TARGET} PROPERTIES RESOURCE "${CMAKE_CURRENT_SOURCE_DIR}/ggml-metal.metal")
      endif()
  endif()
  # Backend / feature definitions collected above (-DGGML_USE_*, -DGGML_PERF)
  # are published to the library and its consumers.
  target_compile_definitions(${TARGET} PUBLIC ${GGML_EXTRA_FLAGS})

  # MinGW builds link the C++ runtime explicitly.
  if (MINGW)
      target_link_libraries(${TARGET} PUBLIC stdc++)
  endif()
  # CUDA-specific target configuration; only applies when the CUDA sources
  # were added to the library.
  if (GGML_CUDA_SOURCES)
      message(STATUS "GGML CUDA sources found")

      # Only configure ggml's CUDA architectures if they are not set globally
      if (NOT DEFINED CMAKE_CUDA_ARCHITECTURES)
          # Not overridden by the user, so fall back to the defaults
          if (NOT DEFINED GGML_CUDA_ARCHITECTURES)
              set(GGML_CUDA_ARCHITECTURES 52 61 70)
          endif()

          message(STATUS "GGML Configuring CUDA architectures ${GGML_CUDA_ARCHITECTURES}")
          set_property(TARGET ggml PROPERTY CUDA_ARCHITECTURES ${GGML_CUDA_ARCHITECTURES})
      endif()

      set_property(TARGET ggml PROPERTY CUDA_SELECT_NVCC_ARCH_FLAGS "Auto")

      # link the C++ runtime explicitly everywhere except MSVC
      if (NOT MSVC)
          target_link_libraries(ggml PUBLIC stdc++)
      endif()
  endif()
  # Headers that make up the public API; they are installed with the library.
  set(GGML_PUBLIC_HEADERS
      "${CMAKE_CURRENT_SOURCE_DIR}/../include/ggml/ggml.h"
      "${CMAKE_CURRENT_SOURCE_DIR}/../include/ggml/ggml-alloc.h"
      "${CMAKE_CURRENT_SOURCE_DIR}/../include/ggml/ggml-backend.h"
  )
  set_target_properties(${TARGET} PROPERTIES PUBLIC_HEADER "${GGML_PUBLIC_HEADERS}")

  # Install rules: the library goes to lib/, the public headers to include/ggml/.
  install(
      TARGETS ${TARGET}
      LIBRARY       DESTINATION lib
      PUBLIC_HEADER DESTINATION include/ggml
  )