CMakeLists.txt 9.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264
  1. cmake_minimum_required(VERSION 3.14) # for add_link_options and implicit target directories.
  2. project("ggml" C CXX)
  3. include(CheckIncludeFileCXX)
  4. set(CMAKE_EXPORT_COMPILE_COMMANDS ON)
  5. if (NOT XCODE AND NOT MSVC AND NOT CMAKE_BUILD_TYPE)
  6. set(CMAKE_BUILD_TYPE Release CACHE STRING "Build type" FORCE)
  7. set_property(CACHE CMAKE_BUILD_TYPE PROPERTY STRINGS "Debug" "Release" "MinSizeRel" "RelWithDebInfo")
  8. endif()
  9. if (CMAKE_SOURCE_DIR STREQUAL CMAKE_CURRENT_SOURCE_DIR)
  10. set(GGML_STANDALONE ON)
  11. set(CMAKE_RUNTIME_OUTPUT_DIRECTORY ${CMAKE_BINARY_DIR}/bin)
  12. # configure project version
  13. # TODO
  14. else()
  15. set(GGML_STANDALONE OFF)
  16. endif()
  17. if (EMSCRIPTEN)
  18. set(BUILD_SHARED_LIBS_DEFAULT OFF)
  19. option(GGML_WASM_SINGLE_FILE "ggml: embed WASM inside the generated ggml.js" ON)
  20. else()
  21. if (MINGW)
  22. set(BUILD_SHARED_LIBS_DEFAULT OFF)
  23. else()
  24. set(BUILD_SHARED_LIBS_DEFAULT ON)
  25. endif()
  26. endif()
  27. option(BUILD_SHARED_LIBS "ggml: build shared libraries" ${BUILD_SHARED_LIBS_DEFAULT})
  28. #
  29. # option list
  30. #
  31. # TODO: mark all options as advanced when not GGML_STANDALONE
  32. if (APPLE)
  33. set(GGML_METAL_DEFAULT ON)
  34. set(GGML_BLAS_DEFAULT ON)
  35. set(GGML_BLAS_VENDOR_DEFAULT "Apple")
  36. else()
  37. set(GGML_METAL_DEFAULT OFF)
  38. set(GGML_BLAS_DEFAULT OFF)
  39. set(GGML_BLAS_VENDOR_DEFAULT "Generic")
  40. endif()
  41. if (CMAKE_CROSSCOMPILING)
  42. set(GGML_NATIVE_DEFAULT OFF)
  43. else()
  44. set(GGML_NATIVE_DEFAULT ON)
  45. endif()
  46. # defaults
  47. if (NOT GGML_LLAMAFILE_DEFAULT)
  48. set(GGML_LLAMAFILE_DEFAULT OFF)
  49. endif()
  50. if (NOT GGML_CUDA_GRAPHS_DEFAULT)
  51. set(GGML_CUDA_GRAPHS_DEFAULT OFF)
  52. endif()
  53. # general
  54. option(GGML_STATIC "ggml: static link libraries" OFF)
  55. option(GGML_NATIVE "ggml: enable -march=native flag" ${GGML_NATIVE_DEFAULT})
  56. option(GGML_LTO "ggml: enable link time optimization" OFF)
  57. option(GGML_CCACHE "ggml: use ccache if available" ON)
  58. # debug
  59. option(GGML_ALL_WARNINGS "ggml: enable all compiler warnings" ON)
  60. option(GGML_ALL_WARNINGS_3RD_PARTY "ggml: enable all compiler warnings in 3rd party libs" OFF)
  61. option(GGML_GPROF "ggml: enable gprof" OFF)
  62. # build
  63. option(GGML_FATAL_WARNINGS "ggml: enable -Werror flag" OFF)
  64. # sanitizers
  65. option(GGML_SANITIZE_THREAD "ggml: enable thread sanitizer" OFF)
  66. option(GGML_SANITIZE_ADDRESS "ggml: enable address sanitizer" OFF)
  67. option(GGML_SANITIZE_UNDEFINED "ggml: enable undefined sanitizer" OFF)
  68. # instruction set specific
  69. if (GGML_NATIVE OR NOT GGML_NATIVE_DEFAULT)
  70. set(INS_ENB OFF)
  71. else()
  72. set(INS_ENB ON)
  73. endif()
  74. option(GGML_CPU_HBM "ggml: use memkind for CPU HBM" OFF)
  75. option(GGML_AVX "ggml: enable AVX" ${INS_ENB})
  76. option(GGML_AVX2 "ggml: enable AVX2" ${INS_ENB})
  77. option(GGML_AVX512 "ggml: enable AVX512" OFF)
  78. option(GGML_AVX512_VBMI "ggml: enable AVX512-VBMI" OFF)
  79. option(GGML_AVX512_VNNI "ggml: enable AVX512-VNNI" OFF)
  80. option(GGML_AVX512_BF16 "ggml: enable AVX512-BF16" OFF)
  81. option(GGML_FMA "ggml: enable FMA" ${INS_ENB})
  82. if (NOT MSVC)
  83. option(GGML_F16C "ggml: enable F16C" ${INS_ENB}) # in MSVC F16C is implied with AVX2/AVX512
  84. endif()
  85. option(GGML_LASX "ggml: enable lasx" ON)
  86. option(GGML_LSX "ggml: enable lsx" ON)
  87. option(GGML_SVE "ggml: enable SVE" OFF)
  88. if (WIN32)
  89. set(GGML_WIN_VER "0x602" CACHE STRING "ggml: Windows Version")
  90. endif()
  91. # ggml core
  92. set(GGML_SCHED_MAX_COPIES "4" CACHE STRING "ggml: max input copies for pipeline parallelism")
  93. # 3rd party libs / backends
  94. option(GGML_ACCELERATE "ggml: enable Accelerate framework" ON)
  95. option(GGML_BLAS "ggml: use BLAS" ${GGML_BLAS_DEFAULT})
  96. set(GGML_BLAS_VENDOR ${GGML_BLAS_VENDOR_DEFAULT} CACHE STRING
  97. "ggml: BLAS library vendor")
  98. option(GGML_LLAMAFILE "ggml: use LLAMAFILE" ${GGML_LLAMAFILE_DEFAULT})
  99. option(GGML_CUDA "ggml: use CUDA" OFF)
  100. option(GGML_MUSA "ggml: use MUSA" OFF)
  101. option(GGML_CUDA_FORCE_DMMV "ggml: use dmmv instead of mmvq CUDA kernels" OFF)
  102. option(GGML_CUDA_FORCE_MMQ "ggml: use mmq kernels instead of cuBLAS" OFF)
  103. option(GGML_CUDA_FORCE_CUBLAS "ggml: always use cuBLAS instead of mmq kernels" OFF)
  104. set (GGML_CUDA_DMMV_X "32" CACHE STRING "ggml: x stride for dmmv CUDA kernels")
  105. set (GGML_CUDA_MMV_Y "1" CACHE STRING "ggml: y block size for mmv CUDA kernels")
  106. option(GGML_CUDA_F16 "ggml: use 16 bit floats for some calculations" OFF)
  107. set (GGML_CUDA_KQUANTS_ITER "2" CACHE STRING
  108. "ggml: iters./thread per block for Q2_K/Q6_K")
  109. set (GGML_CUDA_PEER_MAX_BATCH_SIZE "128" CACHE STRING
  110. "ggml: max. batch size for using peer access")
  111. option(GGML_CUDA_NO_PEER_COPY "ggml: do not use peer to peer copies" OFF)
  112. option(GGML_CUDA_NO_VMM "ggml: do not try to use CUDA VMM" OFF)
  113. option(GGML_CUDA_FA_ALL_QUANTS "ggml: compile all quants for FlashAttention" OFF)
  114. option(GGML_CUDA_GRAPHS "ggml: use CUDA graphs (llama.cpp only)" ${GGML_CUDA_GRAPHS_DEFAULT})
  115. option(GGML_HIPBLAS "ggml: use hipBLAS" OFF)
  116. option(GGML_HIP_UMA "ggml: use HIP unified memory architecture" OFF)
  117. option(GGML_VULKAN "ggml: use Vulkan" OFF)
  118. option(GGML_VULKAN_CHECK_RESULTS "ggml: run Vulkan op checks" OFF)
  119. option(GGML_VULKAN_DEBUG "ggml: enable Vulkan debug output" OFF)
  120. option(GGML_VULKAN_MEMORY_DEBUG "ggml: enable Vulkan memory debug output" OFF)
  121. option(GGML_VULKAN_SHADER_DEBUG_INFO "ggml: enable Vulkan shader debug info" OFF)
  122. option(GGML_VULKAN_PERF "ggml: enable Vulkan perf output" OFF)
  123. option(GGML_VULKAN_VALIDATE "ggml: enable Vulkan validation" OFF)
  124. option(GGML_VULKAN_RUN_TESTS "ggml: run Vulkan tests" OFF)
  125. option(GGML_KOMPUTE "ggml: use Kompute" OFF)
  126. option(GGML_METAL "ggml: use Metal" ${GGML_METAL_DEFAULT})
  127. option(GGML_METAL_NDEBUG "ggml: disable Metal debugging" OFF)
  128. option(GGML_METAL_SHADER_DEBUG "ggml: compile Metal with -fno-fast-math" OFF)
  129. option(GGML_METAL_EMBED_LIBRARY "ggml: embed Metal library" ${GGML_METAL})
  130. set (GGML_METAL_MACOSX_VERSION_MIN "" CACHE STRING
  131. "ggml: metal minimum macOS version")
  132. set (GGML_METAL_STD "" CACHE STRING "ggml: metal standard version (-std flag)")
  133. option(GGML_OPENMP "ggml: use OpenMP" ON)
  134. option(GGML_RPC "ggml: use RPC" OFF)
  135. option(GGML_SYCL "ggml: use SYCL" OFF)
  136. option(GGML_SYCL_F16 "ggml: use 16 bit floats for sycl calculations" OFF)
  137. set (GGML_SYCL_TARGET "INTEL" CACHE STRING
  138. "ggml: sycl target device")
  139. # extra artifacts
  140. option(GGML_BUILD_TESTS "ggml: build tests" ${GGML_STANDALONE})
  141. option(GGML_BUILD_EXAMPLES "ggml: build examples" ${GGML_STANDALONE})
  142. #
  143. # dependencies
  144. #
  145. set(CMAKE_C_STANDARD 11)
  146. set(CMAKE_C_STANDARD_REQUIRED true)
  147. if (GGML_SYCL)
  148. set(CMAKE_CXX_STANDARD 17)
  149. else()
  150. set(CMAKE_CXX_STANDARD 11)
  151. endif()
  152. set(CMAKE_CXX_STANDARD_REQUIRED true)
  153. set(THREADS_PREFER_PTHREAD_FLAG ON)
  154. find_package(Threads REQUIRED)
  155. #
  156. # build the library
  157. #
  158. add_subdirectory(src)
  159. #
  160. # tests and examples
  161. #
  162. if (GGML_BUILD_TESTS)
  163. enable_testing()
  164. add_subdirectory(tests)
  165. endif ()
  166. if (GGML_BUILD_EXAMPLES)
  167. add_subdirectory(examples)
  168. endif ()
  169. #
  170. # install
  171. #
  172. include(GNUInstallDirs)
  173. include(CMakePackageConfigHelpers)
  174. # all public headers
  175. set(GGML_PUBLIC_HEADERS
  176. include/ggml.h
  177. include/ggml-alloc.h
  178. include/ggml-backend.h
  179. include/ggml-blas.h
  180. include/ggml-cann.h
  181. include/ggml-cuda.h
  182. include/ggml.h
  183. include/ggml-kompute.h
  184. include/ggml-metal.h
  185. include/ggml-rpc.h
  186. include/ggml-sycl.h
  187. include/ggml-vulkan.h)
  188. set_target_properties(ggml PROPERTIES PUBLIC_HEADER "${GGML_PUBLIC_HEADERS}")
  189. #if (GGML_METAL)
  190. # set_target_properties(ggml PROPERTIES RESOURCE "${CMAKE_CURRENT_SOURCE_DIR}/src/ggml-metal.metal")
  191. #endif()
  192. install(TARGETS ggml PUBLIC_HEADER)
  193. if (BUILD_SHARED_LIBS)
  194. install(TARGETS ggml LIBRARY)
  195. endif()
  196. if (GGML_METAL)
  197. install(
  198. FILES src/ggml-metal.metal
  199. PERMISSIONS
  200. OWNER_READ
  201. OWNER_WRITE
  202. GROUP_READ
  203. WORLD_READ
  204. DESTINATION ${CMAKE_INSTALL_BINDIR})
  205. if (NOT GGML_METAL_EMBED_LIBRARY)
  206. install(
  207. FILES ${CMAKE_RUNTIME_OUTPUT_DIRECTORY}/default.metallib
  208. DESTINATION ${CMAKE_INSTALL_BINDIR}
  209. )
  210. endif()
  211. endif()
  212. if (GGML_STANDALONE)
  213. configure_file(${CMAKE_CURRENT_SOURCE_DIR}/ggml.pc.in
  214. ${CMAKE_CURRENT_BINARY_DIR}/ggml.pc
  215. @ONLY)
  216. install(FILES ${CMAKE_CURRENT_BINARY_DIR}/ggml.pc
  217. DESTINATION share/pkgconfig)
  218. endif()