@@ -43,6 +43,18 @@ else()
43
43
set (LLAMA_METAL_DEFAULT OFF )
44
44
endif ()
45
45
46
+ # TODO: fix this for Android CI
47
+ # https://github.com/ggerganov/llama.cpp/pull/6716#issuecomment-2061509191
48
+ #if (CMAKE_SYSTEM_NAME MATCHES "Android")
49
+ # set(LLAMA_LLAMAFILE_DEFAULT OFF)
50
+ #else()
51
+ # set(LLAMA_LLAMAFILE_DEFAULT ON)
52
+ #endif()
53
+
54
+ # TODO: temporarily disabled until MoE is fixed
55
+ # https://github.com/ggerganov/llama.cpp/pull/6716
56
+ set (LLAMA_LLAMAFILE_DEFAULT OFF )
57
+
46
58
# general
47
59
option (BUILD_SHARED_LIBS "build shared libraries" OFF )
48
60
option (LLAMA_STATIC "llama: static link libraries" OFF )
@@ -88,7 +100,7 @@ endif()
88
100
# 3rd party libs
89
101
option (LLAMA_ACCELERATE "llama: enable Accelerate framework" ON )
90
102
option (LLAMA_BLAS "llama: use BLAS" OFF )
91
- option (LLAMA_LLAMAFILE "llama: use llamafile SGEMM" ON )
103
+ option (LLAMA_LLAMAFILE "llama: use llamafile SGEMM" ${LLAMA_LLAMAFILE_DEFAULT} )
92
104
set (LLAMA_BLAS_VENDOR "Generic" CACHE STRING "llama: BLAS library vendor" )
93
105
option (LLAMA_CUDA "llama: use CUDA" OFF )
94
106
option (LLAMA_CUBLAS "llama: use CUDA (deprecated, use LLAMA_CUDA)" OFF )
@@ -372,6 +384,9 @@ endif()
372
384
373
385
if (LLAMA_LLAMAFILE)
374
386
add_compile_definitions (GGML_USE_LLAMAFILE)
387
+
388
+ set (GGML_HEADERS_LLAMAFILE sgemm.h)
389
+ set (GGML_SOURCES_LLAMAFILE sgemm.cpp)
375
390
endif ()
376
391
377
392
if (LLAMA_QKK_64)
@@ -1157,17 +1172,16 @@ add_library(ggml OBJECT
1157
1172
ggml-backend.h
1158
1173
ggml-quants.c
1159
1174
ggml-quants.h
1160
- sgemm.cpp
1161
- sgemm.h
1162
- ${GGML_SOURCES_CUDA} ${GGML_HEADERS_CUDA}
1163
- ${GGML_SOURCES_OPENCL} ${GGML_HEADERS_OPENCL}
1164
- ${GGML_SOURCES_METAL} ${GGML_HEADERS_METAL}
1165
- ${GGML_SOURCES_MPI} ${GGML_HEADERS_MPI}
1166
- ${GGML_SOURCES_EXTRA} ${GGML_HEADERS_EXTRA}
1167
- ${GGML_SOURCES_SYCL} ${GGML_HEADERS_SYCL}
1168
- ${GGML_SOURCES_KOMPUTE} ${GGML_HEADERS_KOMPUTE}
1169
- ${GGML_SOURCES_VULKAN} ${GGML_HEADERS_VULKAN}
1170
- ${GGML_SOURCES_ROCM} ${GGML_HEADERS_ROCM}
1175
+ ${GGML_SOURCES_CUDA} ${GGML_HEADERS_CUDA}
1176
+ ${GGML_SOURCES_OPENCL} ${GGML_HEADERS_OPENCL}
1177
+ ${GGML_SOURCES_METAL} ${GGML_HEADERS_METAL}
1178
+ ${GGML_SOURCES_MPI} ${GGML_HEADERS_MPI}
1179
+ ${GGML_SOURCES_EXTRA} ${GGML_HEADERS_EXTRA}
1180
+ ${GGML_SOURCES_SYCL} ${GGML_HEADERS_SYCL}
1181
+ ${GGML_SOURCES_KOMPUTE} ${GGML_HEADERS_KOMPUTE}
1182
+ ${GGML_SOURCES_VULKAN} ${GGML_HEADERS_VULKAN}
1183
+ ${GGML_SOURCES_ROCM} ${GGML_HEADERS_ROCM}
1184
+ ${GGML_SOURCES_LLAMAFILE} ${GGML_HEADERS_LLAMAFILE}
1171
1185
)
1172
1186
1173
1187
target_include_directories (ggml PUBLIC . ${LLAMA_EXTRA_INCLUDES} )
0 commit comments