find_library(MATH_LIBRARY m) # check systems if (NOT UNAME_S) execute_process(COMMAND uname -s OUTPUT_VARIABLE UNAME_S) endif() if (NOT UNAME_P) execute_process(COMMAND uname -p OUTPUT_VARIABLE UNAME_P) endif() if (NOT UNAME_M) execute_process(COMMAND uname -m OUTPUT_VARIABLE UNAME_M) endif() #message(STATUS "UNAME_S: ${UNAME_S} UNAME_P: ${UNAME_P} UNAME_M: ${UNAME_M}") # Mac OS + Arm can report x86_64 # ref: https://github.com/ggerganov/whisper.cpp/issues/66#issuecomment-1282546789 if (UNAME_S MATCHES "Darwin") if (NOT UNAME_P MATCHES "arm") execute_process(COMMAND sysctl -n hw.optional.arm64 OUTPUT_VARIABLE SYSCTL_M) if (SYSCTL_M MATCHES "1") #set(UNAME_P "arm") #set(UNAME_M "arm64") message(WARNING "Your arch is announced as x86_64, but it seems to actually be ARM64. Not fixing that can lea d to bad performance. For more info see: https://github.com/ggerganov/whisper.cpp/issues/66\#issuecomment-#1282546789") endif() endif() endif() if (${CMAKE_SYSTEM_PROCESSOR} MATCHES "^(aarch64|arm.*|ARM64)$") message(STATUS "ARM detected") #set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mcpu=apple-m1") elseif (${CMAKE_SYSTEM_PROCESSOR} MATCHES "ppc64le" OR ${CMAKE_SYSTEM_PROCESSOR} MATCHES "ppc64") message(STATUS "PPC64 detected") set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mpower9-vector") elseif (${CMAKE_SYSTEM_PROCESSOR} MATCHES "loongarch64") message(STATUS "loongarch64 detected") set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mlsx -mlasx") else() message(STATUS "x86 detected") #set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mavx -mavx2 -mfma -mf16c") if (UNAME_S MATCHES "Darwin") execute_process(COMMAND sysctl machdep.cpu.features OUTPUT_VARIABLE AVX1_M) if (AVX1_M MATCHES "AVX1.0") set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mavx") endif() execute_process(COMMAND sysctl machdep.cpu.leaf7_features OUTPUT_VARIABLE AVX2_M) if (AVX2_M MATCHES "AVX2") set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mavx2") endif() if (AVX1_M MATCHES "FMA") set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mfma") endif() set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mf16c") elseif (UNAME_S MATCHES "Linux") message(STATUS "Linux detected") # must have to build on ubuntu22 with gcc11: find_package(Threads) set(GGML_EXTRA_LIBS ${GGML_EXTRA_LIBS} Threads::Threads) execute_process(COMMAND grep "avx " /proc/cpuinfo OUTPUT_VARIABLE AVX1_M) if (AVX1_M MATCHES "avx") set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mavx") endif() execute_process(COMMAND grep "avx2 " /proc/cpuinfo OUTPUT_VARIABLE AVX2_M) if (AVX2_M MATCHES "avx2") set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mavx2") endif() execute_process(COMMAND grep "fma " /proc/cpuinfo OUTPUT_VARIABLE FMA_M) if (FMA_M MATCHES "fma") set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mfma") endif() execute_process(COMMAND grep "f16c " /proc/cpuinfo OUTPUT_VARIABLE F16C_M) if (F16C_M MATCHES "f16c") set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mf16c") endif() execute_process(COMMAND grep "sse3 " /proc/cpuinfo OUTPUT_VARIABLE SSE3_M) if (SSE3_M MATCHES "sse3") set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -msse3") endif() elseif (UNAME_S MATCHES "Haiku") message(STATUS "Haiku detected") execute_process(COMMAND sysinfo -cpu COMMAND grep "AVX " OUTPUT_VARIABLE AVX1_M) if (AVX1_M MATCHES "avx") set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mavx") endif() execute_process(COMMAND sysinfo -cpu COMMAND grep "AVX2 " OUTPUT_VARIABLE AVX2_M) if (AVX2_M MATCHES "avx2") set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mavx2") endif() execute_process(COMMAND sysinfo -cpu COMMAND grep "FMA " OUTPUT_VARIABLE FMA_M) if (FMA_M MATCHES "fma") set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mfma") endif() execute_process(COMMAND sysinfo -cpu COMMAND grep "F16C " OUTPUT_VARIABLE F16C_M) if (F16C_M MATCHES "f16c") set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mf16c") endif() elseif (MSVC) if (GGML_AVX512) set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} /arch:AVX512") # MSVC has no compile-time flags enabling specific # AVX512 extensions, neither it defines the # macros corresponding to the extensions. # Do it manually. if (GGML_AVX512_VBMI) add_compile_definitions(__AVX512VBMI__) endif() if (GGML_AVX512_VNNI) add_compile_definitions(__AVX512VNNI__) endif() elseif (GGML_AVX2) set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} /arch:AVX2") elseif (GGML_AVX) set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} /arch:AVX") endif() else() set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mfma -mf16c -mavx -mavx2") endif() endif() # on APPLE - include Accelerate framework if (APPLE AND NOT GGML_NO_ACCELERATE) find_library(ACCELERATE_FRAMEWORK Accelerate) if (ACCELERATE_FRAMEWORK) message(STATUS "Accelerate framework found") set(GGML_EXTRA_LIBS ${GGML_EXTRA_LIBS} ${ACCELERATE_FRAMEWORK}) set(GGML_EXTRA_FLAGS ${GGML_EXTRA_FLAGS} -DGGML_USE_ACCELERATE) else() message(WARNING "Accelerate framework not found") endif() endif() if (GGML_OPENBLAS) set(OPENBLAS_INCLUDE_SEARCH_PATHS /usr/include /usr/include/openblas /usr/include/openblas-base /usr/local/include /usr/local/include/openblas /usr/local/include/openblas-base /opt/OpenBLAS/include $ENV{OpenBLAS_HOME} $ENV{OpenBLAS_HOME}/include ) find_path(OPENBLAS_INC NAMES cblas.h PATHS ${OPENBLAS_INCLUDE_SEARCH_PATHS}) find_library(OPENBLAS_LIB NAMES openblas libopenblas) if (OPENBLAS_LIB) message(STATUS "OpenBLAS found") set(GGML_EXTRA_LIBS ${GGML_EXTRA_LIBS} ${OPENBLAS_LIB}) set(GGML_EXTRA_INCS ${GGML_EXTRA_INCS} ${OPENBLAS_INC}) set(GGML_EXTRA_FLAGS ${GGML_EXTRA_FLAGS} -DGGML_USE_OPENBLAS) else() message(WARNING "OpenBLAS not found") endif() endif() # undefine NDEBUG so asserts don't get disabled in tests add_definitions(-UNDEBUG) # # test-vec0 set(TEST_TARGET test-vec0) add_executable(${TEST_TARGET} ${TEST_TARGET}.c) target_link_libraries(${TEST_TARGET} PRIVATE ggml) # # test-vec1 (x86) if (${CMAKE_SYSTEM_PROCESSOR} MATCHES "x86" AND "${CMAKE_C_FLAGS}" MATCHES "avx") set(TEST_TARGET test-vec1) add_executable(${TEST_TARGET} ${TEST_TARGET}.c) target_link_libraries(${TEST_TARGET} PRIVATE ggml) endif() # # test-vec2 (arm) if (${CMAKE_SYSTEM_PROCESSOR} MATCHES "arm") set(TEST_TARGET test-vec2) add_executable(${TEST_TARGET} ${TEST_TARGET}.c) target_link_libraries(${TEST_TARGET} PRIVATE ggml) endif() # # test-opt set(TEST_TARGET test-opt) add_executable(${TEST_TARGET} ${TEST_TARGET}.cpp) target_link_libraries(${TEST_TARGET} PRIVATE ggml) add_test(NAME ${TEST_TARGET} COMMAND $) set_property(TEST ${TEST_TARGET} PROPERTY ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw") # # test-quantize-fns set(TEST_TARGET test-quantize-fns) add_executable(${TEST_TARGET} ${TEST_TARGET}.cpp) target_link_libraries(${TEST_TARGET} PRIVATE ggml) add_test(NAME ${TEST_TARGET} COMMAND $) set_property(TEST ${TEST_TARGET} PROPERTY ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw") # # test-quantize-perf set(TEST_TARGET test-quantize-perf) add_executable(${TEST_TARGET} ${TEST_TARGET}.cpp) target_link_libraries(${TEST_TARGET} PRIVATE ggml) add_test(NAME ${TEST_TARGET} COMMAND $) set_property(TEST ${TEST_TARGET} PROPERTY ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw") # # test-mul-mat0 set(TEST_TARGET test-mul-mat0) add_executable(${TEST_TARGET} ${TEST_TARGET}.c) target_link_libraries(${TEST_TARGET} PRIVATE ggml ${GGML_EXTRA_LIBS}) if (MSVC) target_link_options(${TEST_TARGET} PRIVATE "/STACK: 8388608") # 8MB endif() target_compile_options(${TEST_TARGET} PRIVATE ${GGML_EXTRA_FLAGS}) add_test(NAME ${TEST_TARGET} COMMAND $) set_property(TEST ${TEST_TARGET} PROPERTY ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw") # # test-mul-mat1 (arm) if (${CMAKE_SYSTEM_PROCESSOR} MATCHES "arm" AND NOT GGML_NO_ACCELERATE) set(TEST_TARGET test-mul-mat1) add_executable(${TEST_TARGET} ${TEST_TARGET}.c) target_link_libraries(${TEST_TARGET} PRIVATE ggml ${GGML_EXTRA_LIBS}) target_compile_options(${TEST_TARGET} PRIVATE ${GGML_EXTRA_FLAGS}) endif() # # test-blas0 (arm) if (${CMAKE_SYSTEM_PROCESSOR} MATCHES "arm" AND NOT GGML_NO_ACCELERATE) set(TEST_TARGET test-blas0) add_executable(${TEST_TARGET} ${TEST_TARGET}.c) target_link_libraries(${TEST_TARGET} PRIVATE ggml ${GGML_EXTRA_LIBS}) target_compile_options(${TEST_TARGET} PRIVATE ${GGML_EXTRA_FLAGS}) add_test(NAME ${TEST_TARGET} COMMAND $ 128 128 128) set_property(TEST ${TEST_TARGET} PROPERTY ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw") endif() # # test-mul-mat2 set(TEST_TARGET test-mul-mat2) add_executable(${TEST_TARGET} ${TEST_TARGET}.c) target_link_libraries(${TEST_TARGET} PRIVATE ggml) add_test(NAME ${TEST_TARGET} COMMAND $) set_property(TEST ${TEST_TARGET} PROPERTY ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw") if (MATH_LIBRARY) target_link_libraries(test-mul-mat2 PRIVATE ${MATH_LIBRARY}) endif() # # test0 set(TEST_TARGET test0) add_executable(${TEST_TARGET} ${TEST_TARGET}.c) target_link_libraries(${TEST_TARGET} PRIVATE ggml) add_test(NAME ${TEST_TARGET} COMMAND $) set_property(TEST ${TEST_TARGET} PROPERTY ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw") # # test-pool set(TEST_TARGET test-pool) add_executable(${TEST_TARGET} ${TEST_TARGET}.c) target_link_libraries(${TEST_TARGET} PRIVATE ggml) if (MSVC) target_link_options(${TEST_TARGET} PRIVATE "/STACK: 8388608") # 8MB endif() add_test(NAME ${TEST_TARGET} COMMAND $) set_property(TEST ${TEST_TARGET} PROPERTY ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw") # # test-arange set(TEST_TARGET test-arange) add_executable(${TEST_TARGET} ${TEST_TARGET}.cpp) target_link_libraries(${TEST_TARGET} PRIVATE ggml Threads::Threads) if (MSVC) target_link_options(${TEST_TARGET} PRIVATE "/STACK: 8388608") # 8MB endif() add_test(NAME ${TEST_TARGET} COMMAND $) set_property(TEST ${TEST_TARGET} PROPERTY ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw") # # test-timestep_embedding set(TEST_TARGET test-timestep_embedding) add_executable(${TEST_TARGET} ${TEST_TARGET}.cpp) target_link_libraries(${TEST_TARGET} PRIVATE ggml) if (MSVC) target_link_options(${TEST_TARGET} PRIVATE "/STACK: 8388608") # 8MB endif() add_test(NAME ${TEST_TARGET} COMMAND $) set_property(TEST ${TEST_TARGET} PROPERTY ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw") # # test-pad-reflect-1d set(TEST_TARGET test-pad-reflect-1d) add_executable(${TEST_TARGET} ${TEST_TARGET}.cpp) target_link_libraries(${TEST_TARGET} PRIVATE ggml) add_test(NAME ${TEST_TARGET} COMMAND $) # # test-conv-transpose set(TEST_TARGET test-conv-transpose) add_executable(${TEST_TARGET} ${TEST_TARGET}.c) target_link_libraries(${TEST_TARGET} PRIVATE ggml) add_test(NAME ${TEST_TARGET} COMMAND $) # test-conv-transpose-1d set(TEST_TARGET test-conv-transpose-1d) add_executable(${TEST_TARGET} ${TEST_TARGET}.cpp) target_link_libraries(${TEST_TARGET} PRIVATE ggml) add_test(NAME ${TEST_TARGET} COMMAND $) # # test-dup set(TEST_TARGET test-dup) add_executable(${TEST_TARGET} ${TEST_TARGET}.c) target_link_libraries(${TEST_TARGET} PRIVATE ggml) add_test(NAME ${TEST_TARGET} COMMAND $) # # test-rel-pos set(TEST_TARGET test-rel-pos) add_executable(${TEST_TARGET} ${TEST_TARGET}.c) target_link_libraries(${TEST_TARGET} PRIVATE ggml) add_test(NAME ${TEST_TARGET} COMMAND $) # # test-svd0 (x86) if (${CMAKE_SYSTEM_PROCESSOR} MATCHES "x86" AND GGML_OPENBLAS) set(TEST_TARGET test-svd0) add_executable(${TEST_TARGET} ${TEST_TARGET}.c) target_link_libraries(${TEST_TARGET} PRIVATE ggml ${GGML_EXTRA_LIBS}) target_compile_options(${TEST_TARGET} PRIVATE ${GGML_EXTRA_FLAGS}) endif() # # test-customop set(TEST_TARGET test-customop) add_executable(${TEST_TARGET} ${TEST_TARGET}.c) target_link_libraries(${TEST_TARGET} PRIVATE ggml) if (MSVC) target_link_options(${TEST_TARGET} PRIVATE "/STACK: 8388608") # 8MB endif() add_test(NAME ${TEST_TARGET} COMMAND $) set_property(TEST ${TEST_TARGET} PROPERTY ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw") # # test-conv1d set(TEST_TARGET test-conv1d) add_executable(${TEST_TARGET} ${TEST_TARGET}.cpp) target_link_libraries(${TEST_TARGET} PRIVATE ggml) add_test(NAME ${TEST_TARGET} COMMAND $) set_property(TEST ${TEST_TARGET} PROPERTY ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw") # # test-conv2d set(TEST_TARGET test-conv2d) add_executable(${TEST_TARGET} ${TEST_TARGET}.cpp) target_link_libraries(${TEST_TARGET} PRIVATE ggml) add_test(NAME ${TEST_TARGET} COMMAND $) set_property(TEST ${TEST_TARGET} PROPERTY ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw") # # test-mul-mat set(TEST_TARGET test-mul-mat) add_executable(${TEST_TARGET} ${TEST_TARGET}.cpp) target_link_libraries(${TEST_TARGET} PRIVATE ggml) add_test(NAME ${TEST_TARGET} COMMAND $) set_property(TEST ${TEST_TARGET} PROPERTY ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw") # # test-backend-ops set(TEST_TARGET test-backend-ops) add_executable(${TEST_TARGET} ${TEST_TARGET}.cpp) target_link_libraries(${TEST_TARGET} PRIVATE ggml Threads::Threads) add_test(NAME ${TEST_TARGET} COMMAND $) set_property(TEST ${TEST_TARGET} PROPERTY ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw") # # test-cont set(TEST_TARGET test-cont) add_executable(${TEST_TARGET} ${TEST_TARGET}.c) target_link_libraries(${TEST_TARGET} PRIVATE ggml) add_test(NAME ${TEST_TARGET} COMMAND $) set_property(TEST ${TEST_TARGET} PROPERTY ENVIRONMENT "LLVM_PROFILE_FILE=${TEST_TARGET}.profraw")