From 5d8ccdf9d1273bfd83ad8f72565885acc450997e Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Adrien=20Gallou=C3=ABt?= Date: Fri, 26 Jun 2026 15:15:48 +0200 Subject: [PATCH] devops : add llama in all docker images (#25035) MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Signed-off-by: Adrien Gallouët --- .devops/cann.Dockerfile | 4 ++-- .devops/cpu.Dockerfile | 4 ++-- .devops/cuda.Dockerfile | 4 ++-- .devops/intel.Dockerfile | 4 ++-- .devops/musa.Dockerfile | 4 ++-- .devops/openvino.Dockerfile | 4 ++-- .devops/rocm.Dockerfile | 4 ++-- .devops/s390x.Dockerfile | 4 ++-- .devops/vulkan.Dockerfile | 4 ++-- .devops/zendnn.Dockerfile | 4 ++-- 10 files changed, 20 insertions(+), 20 deletions(-) diff --git a/.devops/cann.Dockerfile b/.devops/cann.Dockerfile index dc95e3f38d..36cee7bdb6 100644 --- a/.devops/cann.Dockerfile +++ b/.devops/cann.Dockerfile @@ -145,7 +145,7 @@ ENTRYPOINT ["/app/tools.sh"] # ============================================================================== FROM base AS light -COPY --from=build /app/full/llama-cli /app/full/llama-completion /app +COPY --from=build /app/full/llama /app/full/llama-cli /app/full/llama-completion /app ENTRYPOINT [ "/app/llama-cli" ] @@ -156,7 +156,7 @@ FROM base AS server ENV LLAMA_ARG_HOST=0.0.0.0 -COPY --from=build /app/full/llama-server /app +COPY --from=build /app/full/llama /app/full/llama-server /app HEALTHCHECK --interval=5m CMD [ "curl", "-f", "http://localhost:8080/health" ] diff --git a/.devops/cpu.Dockerfile b/.devops/cpu.Dockerfile index caf727bcdb..cb92343d6c 100644 --- a/.devops/cpu.Dockerfile +++ b/.devops/cpu.Dockerfile @@ -104,7 +104,7 @@ ENTRYPOINT ["/app/tools.sh"] ### Light, CLI only FROM base AS light -COPY --from=build /app/full/llama-cli /app/full/llama-completion /app +COPY --from=build /app/full/llama /app/full/llama-cli /app/full/llama-completion /app WORKDIR /app @@ -115,7 +115,7 @@ FROM base AS server ENV LLAMA_ARG_HOST=0.0.0.0 -COPY --from=build /app/full/llama-server /app +COPY --from=build /app/full/llama /app/full/llama-server /app WORKDIR /app diff --git a/.devops/cuda.Dockerfile b/.devops/cuda.Dockerfile index b16b9a8f1a..c9a498d538 100644 --- a/.devops/cuda.Dockerfile +++ b/.devops/cuda.Dockerfile @@ -113,7 +113,7 @@ ENTRYPOINT ["/app/tools.sh"] ### Light, CLI only FROM base AS light -COPY --from=build /app/full/llama-cli /app/full/llama-completion /app +COPY --from=build /app/full/llama /app/full/llama-cli /app/full/llama-completion /app WORKDIR /app @@ -124,7 +124,7 @@ FROM base AS server ENV LLAMA_ARG_HOST=0.0.0.0 -COPY --from=build /app/full/llama-server /app +COPY --from=build /app/full/llama /app/full/llama-server /app WORKDIR /app diff --git a/.devops/intel.Dockerfile b/.devops/intel.Dockerfile index 3c059eb301..b4bcd94b92 100644 --- a/.devops/intel.Dockerfile +++ b/.devops/intel.Dockerfile @@ -141,7 +141,7 @@ ENTRYPOINT ["/app/tools.sh"] FROM base AS light COPY --from=build /app/lib/ /app -COPY --from=build /app/full/llama-cli /app/full/llama-completion /app +COPY --from=build /app/full/llama /app/full/llama-cli /app/full/llama-completion /app WORKDIR /app @@ -153,7 +153,7 @@ FROM base AS server ENV LLAMA_ARG_HOST=0.0.0.0 COPY --from=build /app/lib/ /app -COPY --from=build /app/full/llama-server /app +COPY --from=build /app/full/llama /app/full/llama-server /app WORKDIR /app diff --git a/.devops/musa.Dockerfile b/.devops/musa.Dockerfile index 0c23cc5547..d30a70bb36 100644 --- a/.devops/musa.Dockerfile +++ b/.devops/musa.Dockerfile @@ -115,7 +115,7 @@ ENTRYPOINT ["/app/tools.sh"] ### Light, CLI only FROM base AS light -COPY --from=build /app/full/llama-cli /app/full/llama-completion /app +COPY --from=build /app/full/llama /app/full/llama-cli /app/full/llama-completion /app WORKDIR /app @@ -126,7 +126,7 @@ FROM base AS server ENV LLAMA_ARG_HOST=0.0.0.0 -COPY --from=build /app/full/llama-server /app +COPY --from=build /app/full/llama /app/full/llama-server /app WORKDIR /app diff --git a/.devops/openvino.Dockerfile b/.devops/openvino.Dockerfile index bcaea16cc3..9b2784b664 100644 --- a/.devops/openvino.Dockerfile +++ b/.devops/openvino.Dockerfile @@ -214,7 +214,7 @@ ENTRYPOINT ["/app/tools.sh"] ### Light, CLI only FROM base AS light -COPY --from=build /app/full/llama-cli /app/full/llama-completion /app/ +COPY --from=build /app/full/llama /app/full/llama-cli /app/full/llama-completion /app/ WORKDIR /app @@ -225,7 +225,7 @@ FROM base AS server ENV LLAMA_ARG_HOST=0.0.0.0 -COPY --from=build /app/full/llama-server /app/ +COPY --from=build /app/full/llama /app/full/llama-server /app/ WORKDIR /app diff --git a/.devops/rocm.Dockerfile b/.devops/rocm.Dockerfile index 7fad0c22e5..a8bc4e1fcd 100644 --- a/.devops/rocm.Dockerfile +++ b/.devops/rocm.Dockerfile @@ -127,7 +127,7 @@ ENTRYPOINT ["/app/tools.sh"] ### Light, CLI only FROM base AS light -COPY --from=build /app/full/llama-cli /app/full/llama-completion /app +COPY --from=build /app/full/llama /app/full/llama-cli /app/full/llama-completion /app WORKDIR /app @@ -138,7 +138,7 @@ FROM base AS server ENV LLAMA_ARG_HOST=0.0.0.0 -COPY --from=build /app/full/llama-server /app +COPY --from=build /app/full/llama /app/full/llama-server /app WORKDIR /app diff --git a/.devops/s390x.Dockerfile b/.devops/s390x.Dockerfile index d88dd2d92d..94a715ff2d 100644 --- a/.devops/s390x.Dockerfile +++ b/.devops/s390x.Dockerfile @@ -124,7 +124,7 @@ WORKDIR /llama.cpp/bin # Copy llama.cpp binaries and libraries COPY --from=collector /llama.cpp/bin/*.so /llama.cpp/bin -COPY --from=collector /llama.cpp/bin/llama-cli /llama.cpp/bin/llama-completion /llama.cpp/bin +COPY --from=collector /llama.cpp/bin/llama /llama.cpp/bin/llama-cli /llama.cpp/bin/llama-completion /llama.cpp/bin ENTRYPOINT [ "/llama.cpp/bin/llama-cli" ] @@ -138,7 +138,7 @@ WORKDIR /llama.cpp/bin # Copy llama.cpp binaries and libraries COPY --from=collector /llama.cpp/bin/*.so /llama.cpp/bin -COPY --from=collector /llama.cpp/bin/llama-server /llama.cpp/bin +COPY --from=collector /llama.cpp/bin/llama /llama.cpp/bin/llama-server /llama.cpp/bin EXPOSE 8080 diff --git a/.devops/vulkan.Dockerfile b/.devops/vulkan.Dockerfile index 26c1902b14..d3599ffb82 100644 --- a/.devops/vulkan.Dockerfile +++ b/.devops/vulkan.Dockerfile @@ -107,7 +107,7 @@ ENTRYPOINT ["/app/tools.sh"] ### Light, CLI only FROM base AS light -COPY --from=build /app/full/llama-cli /app/full/llama-completion /app +COPY --from=build /app/full/llama /app/full/llama-cli /app/full/llama-completion /app WORKDIR /app @@ -118,7 +118,7 @@ FROM base AS server ENV LLAMA_ARG_HOST=0.0.0.0 -COPY --from=build /app/full/llama-server /app +COPY --from=build /app/full/llama /app/full/llama-server /app WORKDIR /app diff --git a/.devops/zendnn.Dockerfile b/.devops/zendnn.Dockerfile index 80daf56710..8a50b3ef6a 100644 --- a/.devops/zendnn.Dockerfile +++ b/.devops/zendnn.Dockerfile @@ -97,7 +97,7 @@ ENTRYPOINT ["/app/tools.sh"] ### Light, CLI only FROM base AS light -COPY --from=build /app/full/llama-cli /app/full/llama-completion /app +COPY --from=build /app/full/llama /app/full/llama-cli /app/full/llama-completion /app WORKDIR /app @@ -108,7 +108,7 @@ FROM base AS server ENV LLAMA_ARG_HOST=0.0.0.0 -COPY --from=build /app/full/llama-server /app +COPY --from=build /app/full/llama /app/full/llama-server /app WORKDIR /app