@@ -57,22 +57,22 @@ RUN apt update -y \
5757# Copy llama.cpp libraries
5858COPY --from=collector /lib/llama.cpp /usr/lib/s390x-linux-gnu
5959
60- # Copy all shared libraries
60+ # Copy all distro libraries
6161COPY --from=collector /lib/distro /lib/s390x-linux-gnu
6262
6363
6464### CLI Only
6565FROM --platform=linux/s390x base AS light
6666
6767# Copy llama.cpp binaries and libraries
68- COPY --from=collector /bin/llama.cpp/llama-cli /
69- COPY --from=collector /bin/llama.cpp/libggml-cpu.so /
70- COPY --from=collector /bin/llama.cpp/libggml-blas.so /
68+ COPY --from=collector /bin/llama.cpp/llama-cli /llama.cpp/bin/
69+ COPY --from=collector /bin/llama.cpp/libggml-cpu.so /llama.cpp/bin/
70+ COPY --from=collector /bin/llama.cpp/libggml-blas.so /llama.cpp/bin/
7171
7272USER root:root
7373WORKDIR /models
7474
75- ENTRYPOINT [ "/llama-cli" ]
75+ ENTRYPOINT [ "/llama.cpp/bin/llama-cli" ]
7676
7777
7878### Hardened Server
@@ -81,18 +81,18 @@ FROM --platform=linux/s390x gcr.io/distroless/cc-debian${DEBIAN_VERSION}:nonroot
8181ENV LLAMA_ARG_HOST=0.0.0.0
8282
8383# Copy llama.cpp binaries and libraries
84- COPY --from=collector /bin/llama.cpp/llama-server /
84+ COPY --from=collector /bin/llama.cpp/llama-server /llama.cpp/bin/
8585COPY --from=collector /lib/llama.cpp /usr/lib/s390x-linux-gnu
8686
8787# Fixes model loading errors
88- COPY --from=collector /bin/llama.cpp/libggml-cpu.so /
89- COPY --from=collector /bin/llama.cpp/libggml-blas.so /
88+ COPY --from=collector /bin/llama.cpp/libggml-cpu.so /llama.cpp/bin/
89+ COPY --from=collector /bin/llama.cpp/libggml-blas.so /llama.cpp/bin/
9090
91- # Copy all shared libraries
91+ # Copy all distro libraries
9292COPY --from=collector /lib/distro /lib/s390x-linux-gnu
9393
9494USER nonroot:nonroot
9595WORKDIR /models
9696EXPOSE 8080
9797
98- ENTRYPOINT [ "/llama-server" ]
98+ ENTRYPOINT [ "/llama.cpp/bin/llama-server" ]
0 commit comments