feat: fix CUDA images and update go-llama to use full GPU offloading (#618)

Signed-off-by: mudler <mudler@localai.io> Co-authored-by: mudler <mudler@localai.io>
2025-06-03 09:24:59 +00:00 · 2023-06-18 08:27:29 +02:00 · 2023-06-18 08:27:29 +02:00 · d3d3187e51
commit d3d3187e51
parent 6c94f3cd67
5 changed files with 11 additions and 47 deletions
--- a/6
+++ b/6
@@ -1,4 +1,4 @@
-ARG GO_VERSION=1.20
+ARG GO_VERSION=1.20-bullseye

 FROM golang:$GO_VERSION as requirements

@@ -9,7 +9,7 @@ ARG CUDA_MINOR_VERSION=7
 ENV BUILD_TYPE=${BUILD_TYPE}

 RUN apt-get update && \
-    apt-get install -y ca-certificates cmake curl
+    apt-get install -y ca-certificates cmake curl patch

 # CuBLAS requirements
 RUN if [ "${BUILD_TYPE}" = "cublas" ]; then \
@@ -67,4 +67,4 @@ HEALTHCHECK --interval=1m --timeout=10m --retries=10 \
  CMD curl -f $HEALTHCHECK_ENDPOINT || exit 1

 EXPOSE 8080
-ENTRYPOINT [ "/build/entrypoint.sh" ]
+ENTRYPOINT [ "/build/entrypoint.sh" ]