# Optional extra diagnostics, enabled with -DGGML_ALL_WARNINGS=ON.
# The flags are GCC/Clang spellings, so nothing is added for MSVC yet.
if (GGML_ALL_WARNINGS)
    if (MSVC)
        # todo : windows
    else()
        add_compile_options(
            # applied to every language in this directory scope
            -Wunused
            -Wextra
            -Wcast-qual
            -Wdouble-promotion
            # applied to C sources only
            "$<$<COMPILE_LANGUAGE:C>:-Wshadow;-Wno-unused-function;-Wmissing-prototypes>"
        )
    endif()
endif()
|
|
# compiler flags

# Placeholder for GCC/Clang-only floating-point flags; the only statement in the
# guard is currently commented out, so this block adds nothing to CMAKE_C_FLAGS.
if (NOT MSVC)
    #set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -fno-math-errno -ffinite-math-only -funsafe-math-optimizations")
endif()

# Log the processor name that the architecture checks below are based on.
message(STATUS "CMAKE_SYSTEM_PROCESSOR: ${CMAKE_SYSTEM_PROCESSOR}")
|
|
# Query `uname` for the system name (-s), processor (-p) and machine (-m).
# Each UNAME_<X> variable is only filled in when it does not already hold a
# true value, so values supplied by the caller are left untouched.
foreach (uname_key S P M)
    if (NOT UNAME_${uname_key})
        string(TOLOWER "${uname_key}" uname_opt)
        execute_process(COMMAND uname -${uname_opt} OUTPUT_VARIABLE UNAME_${uname_key})
    endif()
endforeach()
unset(uname_opt)

#message(STATUS "UNAME_S: ${UNAME_S} UNAME_P: ${UNAME_P} UNAME_M: ${UNAME_M}")
|
|
# this version of Apple ld64 is buggy
#
# Ask the linker (through the C compiler driver) to print its version banner.
# The banner is captured from stderr into `output`; stdout is not captured.
execute_process(
    COMMAND ${CMAKE_C_COMPILER} ${CMAKE_EXE_LINKER_FLAGS} -Wl,-v
    ERROR_VARIABLE output
)

# The backslash must be doubled: inside a quoted CMake argument "\." is an
# identity escape that collapses to ".", which the regex engine would then
# treat as "any character" instead of a literal dot.
if (output MATCHES "dyld-1015\\.7")
    add_compile_definitions(HAVE_BUGGY_APPLE_LINKER)
endif()
|
|
# Mac OS + Arm can report x86_64
# ref: https://github.com/ggerganov/whisper.cpp/issues/66#issuecomment-1282546789
#
# When `uname -p` does not mention "arm" on Darwin, ask sysctl whether the
# hardware advertises arm64 support. If it does, only a warning is emitted:
# the overrides of UNAME_P / UNAME_M below are commented out.
if (UNAME_S MATCHES "Darwin")
    if (NOT UNAME_P MATCHES "arm")
        execute_process(COMMAND sysctl -n hw.optional.arm64 OUTPUT_VARIABLE SYSCTL_M)
        if (SYSCTL_M MATCHES "1")
            #set(UNAME_P "arm")
            #set(UNAME_M "arm64")
            message(WARNING "Your arch is announced as x86_64, but it seems to actually be ARM64. Not fixing that can lead to bad performance. For more info see: https://github.com/ggerganov/whisper.cpp/issues/66\#issuecomment-1282546789")
        endif()
    endif()
endif()
|
|
# Select architecture-specific C flags.
#
# The outer chain dispatches on the CMake target system/processor. In the x86
# fallback branch the SIMD flags are chosen per host OS by probing the CPU
# feature list (sysctl on Darwin, /proc/cpuinfo on Linux, sysinfo on Haiku),
# from the GGML_AVX* options on MSVC, or unconditionally otherwise.
#
# The variable expansions are quoted so that an empty CMAKE_SYSTEM_NAME or
# CMAKE_SYSTEM_PROCESSOR yields a false comparison rather than a malformed
# if() expression.
if ("${CMAKE_SYSTEM_NAME}" STREQUAL "Emscripten")
    message(STATUS "Emscripten detected")
elseif ("${CMAKE_SYSTEM_PROCESSOR}" MATCHES "arm" OR "${CMAKE_SYSTEM_PROCESSOR}" MATCHES "aarch64")
    message(STATUS "ARM detected")
    #set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mcpu=apple-m1")
elseif ("${CMAKE_SYSTEM_PROCESSOR}" MATCHES "ppc64le" OR "${CMAKE_SYSTEM_PROCESSOR}" MATCHES "ppc64")
    message(STATUS "PPC64 detected")
    set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mpower9-vector")
else()
    message(STATUS "x86 detected")
    #set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mavx -mavx2 -mfma -mf16c")
    if (UNAME_S MATCHES "Darwin")
        # AVX and FMA are looked up in machdep.cpu.features, AVX2 in leaf7_features
        execute_process(COMMAND sysctl machdep.cpu.features OUTPUT_VARIABLE AVX1_M)
        if (AVX1_M MATCHES "AVX1.0")
            set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mavx")
        endif()
        execute_process(COMMAND sysctl machdep.cpu.leaf7_features OUTPUT_VARIABLE AVX2_M)
        if (AVX2_M MATCHES "AVX2")
            set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mavx2")
        endif()
        if (AVX1_M MATCHES "FMA")
            set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mfma")
        endif()
        # F16C is enabled without probing on Darwin
        set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mf16c")
    elseif (UNAME_S MATCHES "Linux")
        message(STATUS "Linux detected")
        # each feature is enabled when its name (followed by a space) appears in /proc/cpuinfo
        execute_process(COMMAND grep "avx " /proc/cpuinfo OUTPUT_VARIABLE AVX1_M)
        if (AVX1_M MATCHES "avx")
            set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mavx")
        endif()
        execute_process(COMMAND grep "avx2 " /proc/cpuinfo OUTPUT_VARIABLE AVX2_M)
        if (AVX2_M MATCHES "avx2")
            set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mavx2")
        endif()
        execute_process(COMMAND grep "fma " /proc/cpuinfo OUTPUT_VARIABLE FMA_M)
        if (FMA_M MATCHES "fma")
            set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mfma")
        endif()
        execute_process(COMMAND grep "f16c " /proc/cpuinfo OUTPUT_VARIABLE F16C_M)
        if (F16C_M MATCHES "f16c")
            set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mf16c")
        endif()
        execute_process(COMMAND grep "sse3 " /proc/cpuinfo OUTPUT_VARIABLE SSE3_M)
        if (SSE3_M MATCHES "sse3")
            set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -msse3")
        endif()
    elseif (UNAME_S MATCHES "Haiku")
        message(STATUS "Haiku detected")
        # The grep patterns are upper-case, so the captured text is tested with
        # upper-case regexes as well (MATCHES is case-sensitive; the previous
        # lower-case tests could never succeed on grep's output).
        execute_process(COMMAND sysinfo -cpu COMMAND grep "AVX " OUTPUT_VARIABLE AVX1_M)
        if (AVX1_M MATCHES "AVX")
            set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mavx")
        endif()
        execute_process(COMMAND sysinfo -cpu COMMAND grep "AVX2 " OUTPUT_VARIABLE AVX2_M)
        if (AVX2_M MATCHES "AVX2")
            set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mavx2")
        endif()
        execute_process(COMMAND sysinfo -cpu COMMAND grep "FMA " OUTPUT_VARIABLE FMA_M)
        if (FMA_M MATCHES "FMA")
            set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mfma")
        endif()
        execute_process(COMMAND sysinfo -cpu COMMAND grep "F16C " OUTPUT_VARIABLE F16C_M)
        if (F16C_M MATCHES "F16C")
            set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mf16c")
        endif()
    elseif (MSVC)
        # No host probing here: the instruction set is selected by the GGML_AVX* options
        if (GGML_AVX512)
            set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} /arch:AVX512")
            # MSVC has no compile-time flags enabling specific
            # AVX512 extensions, nor does it define the
            # macros corresponding to the extensions.
            # Do it manually.
            if (GGML_AVX512_VBMI)
                add_compile_definitions(__AVX512VBMI__)
            endif()
            if (GGML_AVX512_VNNI)
                add_compile_definitions(__AVX512VNNI__)
            endif()
        elseif (GGML_AVX2)
            set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} /arch:AVX2")
        elseif (GGML_AVX)
            set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} /arch:AVX")
        endif()
    else()
        # unknown host OS: enable the full set without probing
        set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mfma -mf16c -mavx -mavx2")
    endif()
endif()
|
|
# ggml

# Name of the library target that the rest of this file configures.
set(TARGET ggml)

# on APPLE - include Accelerate framework
# (can be opted out of with -DGGML_NO_ACCELERATE=ON)
if (APPLE AND NOT GGML_NO_ACCELERATE)
    find_library(ACCELERATE_FRAMEWORK Accelerate)
    if (NOT ACCELERATE_FRAMEWORK)
        message(WARNING "Accelerate framework not found")
    else()
        message(STATUS "Accelerate framework found")

        list(APPEND GGML_EXTRA_LIBS  ${ACCELERATE_FRAMEWORK})
        list(APPEND GGML_EXTRA_FLAGS -DGGML_USE_ACCELERATE)
    endif()
endif()
|
|
# Optional OpenBLAS backend (-DGGML_OPENBLAS=ON).
#
# The library is located with find_library(); cblas.h is searched for in a
# list of conventional locations plus $OpenBLAS_HOME. The backend is enabled
# whenever the library is found. The include directory is only added when the
# header was actually located, so that an "OPENBLAS_INC-NOTFOUND" value never
# ends up in the target's include directories.
if (GGML_OPENBLAS)
    set(OPENBLAS_INCLUDE_SEARCH_PATHS
        /usr/include
        /usr/include/openblas
        /usr/include/openblas-base
        /usr/local/include
        /usr/local/include/openblas
        /usr/local/include/openblas-base
        /opt/OpenBLAS/include
        $ENV{OpenBLAS_HOME}
        $ENV{OpenBLAS_HOME}/include
    )
    find_path(OPENBLAS_INC NAMES cblas.h PATHS ${OPENBLAS_INCLUDE_SEARCH_PATHS})
    find_library(OPENBLAS_LIB NAMES openblas libopenblas)
    if (OPENBLAS_LIB)
        message(STATUS "OpenBLAS found")

        set(GGML_EXTRA_LIBS ${GGML_EXTRA_LIBS} ${OPENBLAS_LIB})
        if (OPENBLAS_INC)
            set(GGML_EXTRA_INCS ${GGML_EXTRA_INCS} ${OPENBLAS_INC})
        else()
            message(WARNING "OpenBLAS library found, but cblas.h was not located; relying on the compiler's default include paths")
        endif()
        set(GGML_EXTRA_FLAGS ${GGML_EXTRA_FLAGS} -DGGML_USE_OPENBLAS)
    else()
        message(WARNING "OpenBLAS not found")
    endif()
endif()
|
|
# Optional CLBlast/OpenCL backend (-DGGML_CLBLAST=ON).
# Enabled only when the CLBlast library, the OpenCL library and clblast.h are
# all found; otherwise a warning is printed and the build continues without it.
if (GGML_CLBLAST)
    set(CLBLAST_INCLUDE_SEARCH_PATHS
        /usr/include
        /usr/local/include
        $ENV{CLBLAST_HOME}
        $ENV{CLBLAST_HOME}/include
    )

    find_path(CLBLAST_INC NAMES clblast.h PATHS ${CLBLAST_INCLUDE_SEARCH_PATHS})
    find_library(CLBLAST_LIB NAMES clblast)
    find_library(OPENCL_LIB NAMES OpenCL)

    if (NOT (CLBLAST_LIB AND OPENCL_LIB AND CLBLAST_INC))
        message(WARNING "clBLAST not found")
    else()
        message(STATUS "clBLAST found")

        list(APPEND GGML_EXTRA_INCS  ${CLBLAST_INC})
        list(APPEND GGML_EXTRA_LIBS  ${CLBLAST_LIB} ${OPENCL_LIB})
        list(APPEND GGML_EXTRA_FLAGS -DGGML_USE_CLBLAST)

        # extra sources compiled into the ggml target
        set(GGML_OPENCL_SOURCES ggml-opencl.cpp ggml-opencl.h)

        # directory-scoped: added to the link line of every target created after this point
        link_libraries("-Wl,--copy-dt-needed-entries")
    endif()
endif()
|
|
# Optional CUDA/cuBLAS backend (-DGGML_CUBLAS=ON).
# When the CUDA toolkit is found this enables the CUDA language, registers the
# CUDA sources for the ggml target and selects the CUDA libraries to link.
if (GGML_CUBLAS)
    cmake_minimum_required(VERSION 3.17)

    find_package(CUDAToolkit)
    if (NOT CUDAToolkit_FOUND)
        message(WARNING "cuBLAS not found")
    else()
        message(STATUS "cuBLAS found")

        enable_language(CUDA)

        set(GGML_CUDA_SOURCES ggml-cuda.cu ggml-cuda.h)

        list(APPEND GGML_EXTRA_FLAGS -DGGML_USE_CUBLAS)

        # optional kernel-selection overrides, forwarded as preprocessor definitions
        if (GGML_CUDA_FORCE_DMMV)
            add_compile_definitions(GGML_CUDA_FORCE_DMMV)
        endif()
        if (GGML_CUDA_FORCE_MMQ)
            add_compile_definitions(GGML_CUDA_FORCE_MMQ)
        endif()

        # required for dynamic parallelism
        # set(CMAKE_CUDA_SEPARABLE_COMPILATION ON)

        # runtime / cuBLAS flavour: shared by default, static on request
        if (NOT GGML_STATIC)
            list(APPEND GGML_EXTRA_LIBS CUDA::cudart CUDA::cublas CUDA::cublasLt)
        elseif (WIN32)
            # As of 12.3.1 CUDA Toolkit for Windows does not offer a static cublas library
            list(APPEND GGML_EXTRA_LIBS CUDA::cudart_static CUDA::cublas CUDA::cublasLt)
        else()
            list(APPEND GGML_EXTRA_LIBS CUDA::cudart_static CUDA::cublas_static CUDA::cublasLt_static)
        endif()

        list(APPEND GGML_EXTRA_LIBS CUDA::cuda_driver)

        # add -lineinfo to the CUDA flags when CMAKE_BUILD_TYPE matches Debug
        if (CMAKE_BUILD_TYPE MATCHES Debug)
            set(CMAKE_CUDA_FLAGS "${CMAKE_CUDA_FLAGS} -lineinfo")
        endif()
    endif()
endif()
|
|
# Optional HIP/hipBLAS (ROCm) backend (-DGGML_HIPBLAS=ON).
#
# ggml-cuda.cu is built as a separate OBJECT library (ggml-rocm), compiled as
# C++ and linked against the HIP targets; the object library is then appended
# to GGML_EXTRA_LIBS so the ggml target links it.
#
# The if() conditions use quoted expansions / bare variable names so that an
# empty compiler ID or an unset <pkg>_FOUND evaluates to false instead of
# producing a malformed expression.
if (GGML_HIPBLAS)
    list(APPEND CMAKE_PREFIX_PATH /opt/rocm)

    if (NOT "${CMAKE_C_COMPILER_ID}" MATCHES "Clang")
        message(WARNING "Only LLVM is supported for HIP, hint: CC=/opt/rocm/llvm/bin/clang")
    endif()
    if (NOT "${CMAKE_CXX_COMPILER_ID}" MATCHES "Clang")
        message(WARNING "Only LLVM is supported for HIP, hint: CXX=/opt/rocm/llvm/bin/clang++")
    endif()

    find_package(hip)
    find_package(hipblas)
    find_package(rocblas)

    if (hipblas_FOUND AND hip_FOUND)
        message(STATUS "HIP and hipBLAS found")

        # directory-scoped: both macros are defined for every target created below
        add_compile_definitions(GGML_USE_HIPBLAS GGML_USE_CUBLAS)

        add_library(ggml-rocm OBJECT ggml-cuda.cu ggml-cuda.h)
        if (BUILD_SHARED_LIBS)
            set_target_properties(ggml-rocm PROPERTIES POSITION_INDEPENDENT_CODE ON)
        endif()
        if (GGML_CUDA_FORCE_DMMV)
            target_compile_definitions(ggml-rocm PRIVATE GGML_CUDA_FORCE_DMMV)
        endif()
        if (GGML_CUDA_FORCE_MMQ)
            target_compile_definitions(ggml-rocm PRIVATE GGML_CUDA_FORCE_MMQ)
        endif()
        # tuning knobs forwarded from the GGML_CUDA_* variables
        target_compile_definitions(ggml-rocm PRIVATE GGML_CUDA_DMMV_X=${GGML_CUDA_DMMV_X})
        target_compile_definitions(ggml-rocm PRIVATE GGML_CUDA_MMV_Y=${GGML_CUDA_MMV_Y})
        target_compile_definitions(ggml-rocm PRIVATE K_QUANTS_PER_ITERATION=${GGML_CUDA_KQUANTS_ITER})
        # the .cu file is compiled with the C++ compiler rather than as CUDA
        set_source_files_properties(ggml-cuda.cu PROPERTIES LANGUAGE CXX)
        target_link_libraries(ggml-rocm PRIVATE hip::device PUBLIC hip::host roc::rocblas roc::hipblas)
        target_include_directories(ggml-rocm PRIVATE . ../include ../include/ggml)

        if (GGML_STATIC)
            message(FATAL_ERROR "Static linking not supported for HIP/ROCm")
        endif()
        set(GGML_EXTRA_LIBS ${GGML_EXTRA_LIBS} ggml-rocm)
    else()
        message(WARNING "hipBLAS or HIP not found. Try setting CMAKE_PREFIX_PATH=/opt/rocm")
    endif()
endif()
|
|
# Optional Metal backend (-DGGML_METAL=ON).
# All four frameworks are REQUIRED, so configuration stops if any is missing.
if (GGML_METAL)
    find_library(FOUNDATION_LIBRARY         Foundation              REQUIRED)
    find_library(METAL_FRAMEWORK            Metal                   REQUIRED)
    find_library(METALKIT_FRAMEWORK         MetalKit                REQUIRED)
    find_library(METALPERFORMANCE_FRAMEWORK MetalPerformanceShaders REQUIRED)

    # extra sources compiled into the ggml target
    set(GGML_METAL_SOURCES ggml-metal.m ggml-metal.h)

    list(APPEND GGML_EXTRA_FLAGS -DGGML_USE_METAL)

    #add_compile_definitions(GGML_METAL_NDEBUG)

    # get full path to the file
    #add_compile_definitions(GGML_METAL_DIR_KERNELS="${CMAKE_CURRENT_SOURCE_DIR}/")

    # copy ggml-metal.metal to bin directory
    configure_file(ggml-metal.metal ${CMAKE_RUNTIME_OUTPUT_DIRECTORY}/ggml-metal.metal COPYONLY)

    list(APPEND GGML_EXTRA_LIBS
        ${FOUNDATION_LIBRARY}
        ${METAL_FRAMEWORK}
        ${METALKIT_FRAMEWORK}
        ${METALPERFORMANCE_FRAMEWORK}
    )
endif()
|
|
# -DGGML_PERF=ON adds the GGML_PERF preprocessor definition to the ggml target
if (GGML_PERF)
    list(APPEND GGML_EXTRA_FLAGS -DGGML_PERF)
endif()
|
|
# The ggml library itself. Whether it is static or shared follows
# BUILD_SHARED_LIBS, since no explicit library type is given.
add_library(${TARGET}
    # core sources
    ggml.c
    ggml-alloc.c
    ggml-backend.c
    ggml-quants.c
    # private headers
    ggml-impl.h
    ggml-backend-impl.h
    # public headers
    ../include/ggml/ggml.h
    ../include/ggml/ggml-alloc.h
    ../include/ggml/ggml-backend.h
    # backend sources; each variable is empty unless the backend was enabled above
    ${GGML_CUDA_SOURCES}
    ${GGML_OPENCL_SOURCES}
    ${GGML_METAL_SOURCES}
)

# Include paths are PUBLIC, so targets linking ggml inherit them as well.
target_include_directories(${TARGET} PUBLIC . ../include ../include/ggml ${GGML_EXTRA_INCS})
|
|
# Link the math library when a separate one can be found.
find_library(MATH_LIBRARY m)
if (MATH_LIBRARY)
    target_link_libraries(${TARGET} PUBLIC ${MATH_LIBRARY})
endif()

# Backend libraries collected above, plus the thread library.
target_link_libraries(${TARGET} PUBLIC
    ${GGML_EXTRA_LIBS}
    ${CMAKE_THREAD_LIBS_INIT}
)
|
|
# Extra setup when ggml is built as a shared library.
if (BUILD_SHARED_LIBS)
    # NOTE(review): this variable only initialises the WINDOWS_EXPORT_ALL_SYMBOLS
    # property of targets created after this line; the ggml target already
    # exists at this point - confirm whether that is intended.
    set(CMAKE_WINDOWS_EXPORT_ALL_SYMBOLS ON)

    target_link_libraries(${TARGET} PUBLIC ${CMAKE_DL_LIBS})

    # GGML_SHARED is visible to consumers, GGML_BUILD only while compiling ggml itself
    target_compile_definitions(${TARGET}
        PUBLIC  GGML_SHARED
        PRIVATE GGML_BUILD
    )

    # attach the Metal shader source to the target as a RESOURCE file
    if (GGML_METAL)
        set_target_properties(${TARGET} PROPERTIES RESOURCE "${CMAKE_CURRENT_SOURCE_DIR}/ggml-metal.metal")
    endif()
endif()
|
|
# Backend feature macros collected above (the -DGGML_USE_* entries).
target_compile_definitions(${TARGET} PUBLIC ${GGML_EXTRA_FLAGS})

# MinGW builds link the C++ standard library explicitly.
if (MINGW)
    target_link_libraries(${TARGET} PUBLIC stdc++)
endif()
|
|
# CUDA-specific target properties; only applies when the cuBLAS backend
# registered CUDA sources for the ggml target.
if (GGML_CUDA_SOURCES)
    message(STATUS "GGML CUDA sources found")
    if (NOT DEFINED CMAKE_CUDA_ARCHITECTURES)
        # Only configure ggml CUDA architectures if not globally set
        if (NOT DEFINED GGML_CUDA_ARCHITECTURES)
            # Not overridden by user, so set defaults
            set(GGML_CUDA_ARCHITECTURES 52 61 70)
        endif()
        message(STATUS "GGML Configuring CUDA architectures ${GGML_CUDA_ARCHITECTURES}")
        set_property(TARGET ${TARGET} PROPERTY CUDA_ARCHITECTURES ${GGML_CUDA_ARCHITECTURES})
    endif()
    set_property(TARGET ${TARGET} PROPERTY CUDA_SELECT_NVCC_ARCH_FLAGS "Auto")
    # link the C++ standard library explicitly on non-MSVC toolchains
    if (NOT MSVC)
        target_link_libraries(${TARGET} PUBLIC stdc++)
    endif()
endif()
|
|
# Headers installed alongside the library.
set(GGML_PUBLIC_HEADERS
    ${CMAKE_CURRENT_SOURCE_DIR}/../include/ggml/ggml.h
    ${CMAKE_CURRENT_SOURCE_DIR}/../include/ggml/ggml-alloc.h
    ${CMAKE_CURRENT_SOURCE_DIR}/../include/ggml/ggml-backend.h)

# Quoted so the whole list is stored as a single property value.
set_target_properties(${TARGET} PROPERTIES
    PUBLIC_HEADER "${GGML_PUBLIC_HEADERS}")

# Install rules. ARCHIVE (static libraries, Windows import libraries) and
# RUNTIME (Windows DLLs) destinations are spelled out in addition to LIBRARY:
# CMake releases before 3.14 reject an install(TARGETS) call that omits the
# destination for the artifact kind actually produced, and the values used
# here match the defaults newer releases would choose.
install(TARGETS ${TARGET}
    LIBRARY DESTINATION lib
    ARCHIVE DESTINATION lib
    RUNTIME DESTINATION bin
    PUBLIC_HEADER DESTINATION include/ggml
)
|