devops: fix missing ggml shared object

failure to load model

Signed-off-by: Aaron Teo <aaron.teo1@ibm.com>
This commit is contained in:
Aaron Teo
2025-09-09 16:38:05 +08:00
parent b23e72e1d0
commit 944ef7f0bc

View File

@@ -51,11 +51,14 @@ ENV LLAMA_ARG_PORT=8080
COPY --from=collector /bin/llama.cpp /
COPY --from=collector /lib/llama.cpp /usr/lib/s390x-linux-gnu
# Fixes model loading errors
COPY --from=collector /bin/llama.cpp/*.so /
# Copy all shared libraries
COPY --from=collector /lib/distro /lib/s390x-linux-gnu
USER nonroot:nonroot
WORKDIR /models
EXPOSE ${LLAMA_ARG_PORT}
EXPOSE 8080
ENTRYPOINT [ "/llama-server" ]