# User-facing build switches.
# GGML_BLAS is a boolean option whose default is taken from GGML_BLAS_DEFAULT.
option(GGML_BLAS "ggml: use BLAS" ${GGML_BLAS_DEFAULT})
# GGML_BLAS_VENDOR is a cached STRING (not a boolean option); its initial value
# comes from GGML_BLAS_VENDOR_DEFAULT.
set(GGML_BLAS_VENDOR ${GGML_BLAS_VENDOR_DEFAULT} CACHE STRING
"ggml: BLAS library vendor")
# Diff markers: the '-' line is the old declaration, the '+' line replaces it.
# Only the help text changes; the option name and its OFF default are the same.
-option(GGML_LLAMAFILE "ggml: use ggml SGEMM" OFF)
+option(GGML_LLAMAFILE "ggml: use LLAMAFILE" OFF)
# CUDA switches, both OFF by default.
option(GGML_CUDA "ggml: use CUDA" OFF)
option(GGML_CUDA_FORCE_DMMV "ggml: use dmmv instead of mmvq CUDA kernels" OFF)
endif()
# When GGML_LLAMAFILE is enabled: report it at configure time, define
# GGML_USE_LLAMAFILE for compilation, and record the sgemm header/source pair
# in GGML_HEADERS_LLAMAFILE / GGML_SOURCES_LLAMAFILE.
# Lines prefixed '-' are removed by this change; lines prefixed '+' are added.
if (GGML_LLAMAFILE)
# The status text is renamed to match the option's new help string.
- message(STATUS "Using ggml SGEMM")
+ message(STATUS "Using llamafile")
# Directory-scoped definition (not attached to a specific target); the C code
# guards its sgemm include with `#ifdef GGML_USE_LLAMAFILE`.
add_compile_definitions(GGML_USE_LLAMAFILE)
# The sgemm files move from the current directory into a llamafile/ subdirectory.
# NOTE(review): the paths are relative; presumably resolved against the directory
# of the CMake file that consumes these variables -- confirm at the use site.
- set(GGML_HEADERS_LLAMAFILE sgemm.h)
- set(GGML_SOURCES_LLAMAFILE sgemm.cpp)
+ set(GGML_HEADERS_LLAMAFILE llamafile/sgemm.h)
+ set(GGML_SOURCES_LLAMAFILE llamafile/sgemm.cpp)
endif()
if (GGML_CUDA)
#include "ggml.h"
#include "ggml-aarch64.h"
-
#if defined(_MSC_VER) || defined(__MINGW32__)
#include <malloc.h> // using malloc.h with MSC/MINGW
#elif !defined(__FreeBSD__) && !defined(__NetBSD__) && !defined(__OpenBSD__)
#endif
// Optional sgemm header, pulled in only when GGML_USE_LLAMAFILE is defined.
// Lines prefixed '-' are removed by this change; lines prefixed '+' are added.
// The header is project-local, so it uses the quoted include form like the
// other ggml headers ("ggml.h", "ggml-aarch64.h"): the quoted form first looks
// next to the including file and then falls back to the same -I search path
// the angle-bracket form would use.
#ifdef GGML_USE_LLAMAFILE
-#include "sgemm.h"
+#include "llamafile/sgemm.h"
#endif
#if defined(_MSC_VER)