Skip to content

Commit 7409fdc

Browse files
authored
Merge pull request #704 from axel7083/fix/cuda-build
fix(model_server): deprecated make arguments for llamacpp server
2 parents e273eae + f60606d commit 7409fdc

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

model_servers/llamacpp_python/cuda/Containerfile

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -4,7 +4,7 @@ RUN dnf install -y gcc-toolset-13-gcc gcc-toolset-13-gcc-c++
4 4
USER 1001
5 5
WORKDIR /locallm
6 6
COPY src .
7-
ENV CMAKE_ARGS="-DLLAMA_CUBLAS=on -DLLAMA_AVX2=OFF -DLLAMA_FMA=OFF -DLLAMA_F16C=OFF"
7+
ENV CMAKE_ARGS="-DGGML_CUDA=on -DLLAMA_AVX2=OFF -DLLAMA_FMA=OFF -DLLAMA_F16C=OFF"
8 8
ENV FORCE_CMAKE=1
9 9
RUN CC="/opt/rh/gcc-toolset-13/root/usr/bin/gcc" CXX="/opt/rh/gcc-toolset-13/root/usr/bin/g++" pip install --no-cache-dir -r ./requirements.txt
10 10
ENTRYPOINT [ "sh", "run.sh" ]

0 commit comments

Comments
 (0)