CMakeLists.txt 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358
  1. cmake_minimum_required(VERSION 3.14) # for add_link_options and implicit target directories.
  2. project("ggml" C CXX)
  3. include(CheckIncludeFileCXX)
  4. set(CMAKE_EXPORT_COMPILE_COMMANDS ON)
  5. if (NOT XCODE AND NOT MSVC AND NOT CMAKE_BUILD_TYPE)
  6. set(CMAKE_BUILD_TYPE Release CACHE STRING "Build type" FORCE)
  7. set_property(CACHE CMAKE_BUILD_TYPE PROPERTY STRINGS "Debug" "Release" "MinSizeRel" "RelWithDebInfo")
  8. endif()
  9. if (CMAKE_SOURCE_DIR STREQUAL CMAKE_CURRENT_SOURCE_DIR)
  10. set(GGML_STANDALONE ON)
  11. set(CMAKE_RUNTIME_OUTPUT_DIRECTORY ${CMAKE_BINARY_DIR}/bin)
  12. # configure project version
  13. # TODO
  14. else()
  15. set(GGML_STANDALONE OFF)
  16. endif()
  17. if (EMSCRIPTEN)
  18. set(BUILD_SHARED_LIBS_DEFAULT OFF)
  19. option(GGML_WASM_SINGLE_FILE "ggml: embed WASM inside the generated ggml.js" ON)
  20. else()
  21. if (MINGW)
  22. set(BUILD_SHARED_LIBS_DEFAULT OFF)
  23. else()
  24. set(BUILD_SHARED_LIBS_DEFAULT ON)
  25. endif()
  26. endif()
  27. # remove the lib prefix on win32 mingw
  28. if (WIN32)
  29. set(CMAKE_STATIC_LIBRARY_PREFIX "")
  30. set(CMAKE_SHARED_LIBRARY_PREFIX "")
  31. set(CMAKE_SHARED_MODULE_PREFIX "")
  32. endif()
  33. option(BUILD_SHARED_LIBS "ggml: build shared libraries" ${BUILD_SHARED_LIBS_DEFAULT})
  34. option(GGML_BACKEND_DL "ggml: build backends as dynamic libraries (requires BUILD_SHARED_LIBS)" OFF)
  35. #
  36. # option list
  37. #
  38. # TODO: mark all options as advanced when not GGML_STANDALONE
  39. if (APPLE)
  40. set(GGML_METAL_DEFAULT ON)
  41. set(GGML_BLAS_DEFAULT ON)
  42. set(GGML_BLAS_VENDOR_DEFAULT "Apple")
  43. else()
  44. set(GGML_METAL_DEFAULT OFF)
  45. set(GGML_BLAS_DEFAULT OFF)
  46. set(GGML_BLAS_VENDOR_DEFAULT "Generic")
  47. endif()
  48. if (CMAKE_CROSSCOMPILING OR DEFINED ENV{SOURCE_DATE_EPOCH})
  49. message(STATUS "Setting GGML_NATIVE_DEFAULT to OFF")
  50. set(GGML_NATIVE_DEFAULT OFF)
  51. else()
  52. set(GGML_NATIVE_DEFAULT ON)
  53. endif()
  54. # defaults
  55. if (NOT GGML_LLAMAFILE_DEFAULT)
  56. set(GGML_LLAMAFILE_DEFAULT OFF)
  57. endif()
  58. if (NOT GGML_CUDA_GRAPHS_DEFAULT)
  59. set(GGML_CUDA_GRAPHS_DEFAULT OFF)
  60. endif()
  61. # general
  62. option(GGML_STATIC "ggml: static link libraries" OFF)
  63. option(GGML_NATIVE "ggml: optimize the build for the current system" ${GGML_NATIVE_DEFAULT})
  64. option(GGML_LTO "ggml: enable link time optimization" OFF)
  65. option(GGML_CCACHE "ggml: use ccache if available" ON)
  66. # debug
  67. option(GGML_ALL_WARNINGS "ggml: enable all compiler warnings" ON)
  68. option(GGML_ALL_WARNINGS_3RD_PARTY "ggml: enable all compiler warnings in 3rd party libs" OFF)
  69. option(GGML_GPROF "ggml: enable gprof" OFF)
  70. # build
  71. option(GGML_FATAL_WARNINGS "ggml: enable -Werror flag" OFF)
  72. # sanitizers
  73. option(GGML_SANITIZE_THREAD "ggml: enable thread sanitizer" OFF)
  74. option(GGML_SANITIZE_ADDRESS "ggml: enable address sanitizer" OFF)
  75. option(GGML_SANITIZE_UNDEFINED "ggml: enable undefined sanitizer" OFF)
  76. # instruction set specific
  77. if (GGML_NATIVE OR NOT GGML_NATIVE_DEFAULT)
  78. set(INS_ENB OFF)
  79. else()
  80. set(INS_ENB ON)
  81. endif()
  82. option(GGML_CPU_HBM "ggml: use memkind for CPU HBM" OFF)
  83. option(GGML_CPU_AARCH64 "ggml: use runtime weight conversion of Q4_0 to Q4_X_X" ON)
  84. option(GGML_CPU_KLEIDIAI "ggml: use KleidiAI optimized kernels if applicable" OFF)
  85. option(GGML_AVX "ggml: enable AVX" ${INS_ENB})
  86. option(GGML_AVX_VNNI "ggml: enable AVX-VNNI" OFF)
  87. option(GGML_AVX2 "ggml: enable AVX2" ${INS_ENB})
  88. option(GGML_BMI2 "ggml: enable BMI2" ${INS_ENB})
  89. option(GGML_AVX512 "ggml: enable AVX512F" OFF)
  90. option(GGML_AVX512_VBMI "ggml: enable AVX512-VBMI" OFF)
  91. option(GGML_AVX512_VNNI "ggml: enable AVX512-VNNI" OFF)
  92. option(GGML_AVX512_BF16 "ggml: enable AVX512-BF16" OFF)
  93. if (NOT MSVC)
  94. # in MSVC F16C and FMA is implied with AVX2/AVX512
  95. option(GGML_FMA "ggml: enable FMA" ${INS_ENB})
  96. option(GGML_F16C "ggml: enable F16C" ${INS_ENB})
  97. # MSVC does not seem to support AMX
  98. option(GGML_AMX_TILE "ggml: enable AMX-TILE" OFF)
  99. option(GGML_AMX_INT8 "ggml: enable AMX-INT8" OFF)
  100. option(GGML_AMX_BF16 "ggml: enable AMX-BF16" OFF)
  101. endif()
  102. option(GGML_LASX "ggml: enable lasx" ON)
  103. option(GGML_LSX "ggml: enable lsx" ON)
  104. option(GGML_RVV "ggml: enable rvv" ON)
  105. option(GGML_RV_ZFH "ggml: enable riscv zfh" OFF)
  106. option(GGML_VXE "ggml: enable vxe" ON)
  107. option(GGML_CPU_ALL_VARIANTS "ggml: build all variants of the CPU backend (requires GGML_BACKEND_DL)" OFF)
  108. set(GGML_CPU_ARM_ARCH "" CACHE STRING "ggml: CPU architecture for ARM")
  109. set(GGML_CPU_POWERPC_CPUTYPE "" CACHE STRING "ggml: CPU type for PowerPC")
  110. if (WIN32)
  111. set(GGML_WIN_VER "0x602" CACHE STRING "ggml: Windows version")
  112. endif()
  113. # ggml core
  114. set(GGML_SCHED_MAX_COPIES "4" CACHE STRING "ggml: max input copies for pipeline parallelism")
  115. option(GGML_CPU "ggml: enable CPU backend" ON)
  116. # 3rd party libs / backends
  117. option(GGML_ACCELERATE "ggml: enable Accelerate framework" ON)
  118. option(GGML_BLAS "ggml: use BLAS" ${GGML_BLAS_DEFAULT})
  119. set(GGML_BLAS_VENDOR ${GGML_BLAS_VENDOR_DEFAULT} CACHE STRING
  120. "ggml: BLAS library vendor")
  121. option(GGML_LLAMAFILE "ggml: use LLAMAFILE" ${GGML_LLAMAFILE_DEFAULT})
  122. option(GGML_CUDA "ggml: use CUDA" OFF)
  123. option(GGML_MUSA "ggml: use MUSA" OFF)
  124. option(GGML_CUDA_FORCE_MMQ "ggml: use mmq kernels instead of cuBLAS" OFF)
  125. option(GGML_CUDA_FORCE_CUBLAS "ggml: always use cuBLAS instead of mmq kernels" OFF)
  126. option(GGML_CUDA_F16 "ggml: use 16 bit floats for some calculations" OFF)
  127. set (GGML_CUDA_PEER_MAX_BATCH_SIZE "128" CACHE STRING
  128. "ggml: max. batch size for using peer access")
  129. option(GGML_CUDA_NO_PEER_COPY "ggml: do not use peer to peer copies" OFF)
  130. option(GGML_CUDA_NO_VMM "ggml: do not try to use CUDA VMM" OFF)
  131. option(GGML_CUDA_FA "ggml: compile ggml FlashAttention CUDA kernels" ON)
  132. option(GGML_CUDA_FA_ALL_QUANTS "ggml: compile all quants for FlashAttention" OFF)
  133. option(GGML_CUDA_GRAPHS "ggml: use CUDA graphs (llama.cpp only)" ${GGML_CUDA_GRAPHS_DEFAULT})
  134. set (GGML_CUDA_COMPRESSION_MODE "size" CACHE STRING
  135. "ggml: cuda link binary compression mode; requires cuda 12.8+")
  136. set_property(CACHE GGML_CUDA_COMPRESSION_MODE PROPERTY STRINGS "none;speed;balance;size")
  137. option(GGML_HIP "ggml: use HIP" OFF)
  138. option(GGML_HIP_GRAPHS "ggml: use HIP graph, experimental, slow" OFF)
  139. option(GGML_HIP_NO_VMM "ggml: do not try to use HIP VMM" ON)
  140. option(GGML_HIP_ROCWMMA_FATTN "ggml: enable rocWMMA for FlashAttention" OFF)
  141. option(GGML_HIP_UMA "ggml: use HIP unified memory architecture" OFF)
  142. option(GGML_VULKAN "ggml: use Vulkan" OFF)
  143. option(GGML_VULKAN_CHECK_RESULTS "ggml: run Vulkan op checks" OFF)
  144. option(GGML_VULKAN_DEBUG "ggml: enable Vulkan debug output" OFF)
  145. option(GGML_VULKAN_MEMORY_DEBUG "ggml: enable Vulkan memory debug output" OFF)
  146. option(GGML_VULKAN_SHADER_DEBUG_INFO "ggml: enable Vulkan shader debug info" OFF)
  147. option(GGML_VULKAN_PERF "ggml: enable Vulkan perf output" OFF)
  148. option(GGML_VULKAN_VALIDATE "ggml: enable Vulkan validation" OFF)
  149. option(GGML_VULKAN_RUN_TESTS "ggml: run Vulkan tests" OFF)
  150. option(GGML_KOMPUTE "ggml: use Kompute" OFF)
  151. option(GGML_METAL "ggml: use Metal" ${GGML_METAL_DEFAULT})
  152. option(GGML_METAL_USE_BF16 "ggml: use bfloat if available" OFF)
  153. option(GGML_METAL_NDEBUG "ggml: disable Metal debugging" OFF)
  154. option(GGML_METAL_SHADER_DEBUG "ggml: compile Metal with -fno-fast-math" OFF)
  155. option(GGML_METAL_EMBED_LIBRARY "ggml: embed Metal library" ${GGML_METAL})
  156. set (GGML_METAL_MACOSX_VERSION_MIN "" CACHE STRING
  157. "ggml: metal minimum macOS version")
  158. set (GGML_METAL_STD "" CACHE STRING "ggml: metal standard version (-std flag)")
  159. option(GGML_OPENMP "ggml: use OpenMP" ON)
  160. option(GGML_RPC "ggml: use RPC" OFF)
  161. option(GGML_SYCL "ggml: use SYCL" OFF)
  162. option(GGML_SYCL_F16 "ggml: use 16 bit floats for sycl calculations" OFF)
  163. option(GGML_SYCL_GRAPH "ggml: enable graphs in the SYCL backend" ON)
  164. set (GGML_SYCL_TARGET "INTEL" CACHE STRING
  165. "ggml: sycl target device")
  166. set (GGML_SYCL_DEVICE_ARCH "" CACHE STRING
  167. "ggml: sycl device architecture")
  168. option(GGML_OPENCL "ggml: use OpenCL" OFF)
  169. option(GGML_OPENCL_PROFILING "ggml: use OpenCL profiling (increases overhead)" OFF)
  170. option(GGML_OPENCL_EMBED_KERNELS "ggml: embed kernels" ON)
  171. option(GGML_OPENCL_USE_ADRENO_KERNELS "ggml: use optimized kernels for Adreno" ON)
  172. set (GGML_OPENCL_TARGET_VERSION "300" CACHE STRING
  173. "gmml: OpenCL API version to target")
  174. # toolchain for vulkan-shaders-gen
  175. set (GGML_VULKAN_SHADERS_GEN_TOOLCHAIN "" CACHE FILEPATH "ggml: toolchain file for vulkan-shaders-gen")
  176. # extra artifacts
  177. option(GGML_BUILD_TESTS "ggml: build tests" ${GGML_STANDALONE})
  178. option(GGML_BUILD_EXAMPLES "ggml: build examples" ${GGML_STANDALONE})
  179. #
  180. # dependencies
  181. #
  182. set(CMAKE_C_STANDARD 11)
  183. set(CMAKE_C_STANDARD_REQUIRED true)
  184. set(CMAKE_CXX_STANDARD 17)
  185. set(CMAKE_CXX_STANDARD_REQUIRED true)
  186. set(THREADS_PREFER_PTHREAD_FLAG ON)
  187. find_package(Threads REQUIRED)
  188. include(GNUInstallDirs)
  189. #
  190. # build the library
  191. #
  192. add_subdirectory(src)
  193. #
  194. # tests and examples
  195. #
  196. if (GGML_BUILD_TESTS)
  197. enable_testing()
  198. add_subdirectory(tests)
  199. endif ()
  200. if (GGML_BUILD_EXAMPLES)
  201. add_subdirectory(examples)
  202. endif ()
  203. #
  204. # install
  205. #
  206. include(CMakePackageConfigHelpers)
  207. # all public headers
  208. set(GGML_PUBLIC_HEADERS
  209. include/ggml.h
  210. include/ggml-cpu.h
  211. include/ggml-alloc.h
  212. include/ggml-backend.h
  213. include/ggml-blas.h
  214. include/ggml-cann.h
  215. include/ggml-cpp.h
  216. include/ggml-cuda.h
  217. include/ggml-kompute.h
  218. include/ggml-opt.h
  219. include/ggml-metal.h
  220. include/ggml-rpc.h
  221. include/ggml-sycl.h
  222. include/ggml-vulkan.h
  223. include/gguf.h)
  224. set_target_properties(ggml PROPERTIES PUBLIC_HEADER "${GGML_PUBLIC_HEADERS}")
  225. #if (GGML_METAL)
  226. # set_target_properties(ggml PROPERTIES RESOURCE "${CMAKE_CURRENT_SOURCE_DIR}/src/ggml-metal.metal")
  227. #endif()
  228. install(TARGETS ggml LIBRARY PUBLIC_HEADER)
  229. install(TARGETS ggml-base LIBRARY)
  230. if (GGML_STANDALONE)
  231. configure_file(${CMAKE_CURRENT_SOURCE_DIR}/ggml.pc.in
  232. ${CMAKE_CURRENT_BINARY_DIR}/ggml.pc
  233. @ONLY)
  234. install(FILES ${CMAKE_CURRENT_BINARY_DIR}/ggml.pc
  235. DESTINATION share/pkgconfig)
  236. endif()
  237. #
  238. # Create CMake package
  239. #
  240. # Generate version info based on git commit.
  241. if(NOT DEFINED GGML_BUILD_NUMBER)
  242. find_program(GIT_EXE NAMES git git.exe REQUIRED NO_CMAKE_FIND_ROOT_PATH)
  243. execute_process(COMMAND ${GIT_EXE} rev-list --count HEAD
  244. WORKING_DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR}
  245. OUTPUT_VARIABLE GGML_BUILD_NUMBER
  246. OUTPUT_STRIP_TRAILING_WHITESPACE
  247. )
  248. if(GGML_BUILD_NUMBER EQUAL 1)
  249. message(WARNING "GGML build version fixed at 1 likely due to a shallow clone.")
  250. endif()
  251. execute_process(COMMAND ${GIT_EXE} rev-parse --short HEAD
  252. WORKING_DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR}
  253. OUTPUT_VARIABLE GGML_BUILD_COMMIT
  254. OUTPUT_STRIP_TRAILING_WHITESPACE
  255. )
  256. endif()
  257. # Capture variables prefixed with GGML_.
  258. set(variable_set_statements
  259. "
  260. ####### Expanded from @GGML_VARIABLES_EXPANED@ by configure_package_config_file() #######
  261. ####### Any changes to this file will be overwritten by the next CMake run #######
  262. ")
  263. set(GGML_SHARED_LIB ${BUILD_SHARED_LIBS})
  264. get_cmake_property(all_variables VARIABLES)
  265. foreach(variable_name IN LISTS all_variables)
  266. if(variable_name MATCHES "^GGML_")
  267. string(REPLACE ";" "\\;"
  268. variable_value "${${variable_name}}")
  269. set(variable_set_statements
  270. "${variable_set_statements}set(${variable_name} \"${variable_value}\")\n")
  271. endif()
  272. endforeach()
  273. set(GGML_VARIABLES_EXPANDED ${variable_set_statements})
  274. # Create the CMake package and set install location.
  275. set(GGML_INSTALL_VERSION 0.0.${GGML_BUILD_NUMBER})
  276. set(GGML_INCLUDE_INSTALL_DIR ${CMAKE_INSTALL_INCLUDEDIR} CACHE PATH "Location of header files")
  277. set(GGML_LIB_INSTALL_DIR ${CMAKE_INSTALL_LIBDIR} CACHE PATH "Location of library files")
  278. set(GGML_BIN_INSTALL_DIR ${CMAKE_INSTALL_BINDIR} CACHE PATH "Location of binary files")
  279. configure_package_config_file(
  280. ${CMAKE_CURRENT_SOURCE_DIR}/cmake/ggml-config.cmake.in
  281. ${CMAKE_CURRENT_BINARY_DIR}/ggml-config.cmake
  282. INSTALL_DESTINATION ${CMAKE_INSTALL_LIBDIR}/cmake/ggml
  283. PATH_VARS GGML_INCLUDE_INSTALL_DIR
  284. GGML_LIB_INSTALL_DIR
  285. GGML_BIN_INSTALL_DIR)
  286. write_basic_package_version_file(
  287. ${CMAKE_CURRENT_BINARY_DIR}/ggml-version.cmake
  288. VERSION ${GGML_INSTALL_VERSION}
  289. COMPATIBILITY SameMajorVersion)
  290. install(FILES ${CMAKE_CURRENT_BINARY_DIR}/ggml-config.cmake
  291. ${CMAKE_CURRENT_BINARY_DIR}/ggml-version.cmake
  292. DESTINATION ${CMAKE_INSTALL_LIBDIR}/cmake/ggml)