mirror of
https://github.com/mudler/LocalAI.git
synced 2025-06-03 09:24:59 +00:00
feat: fix CUDA images and update go-llama to use full GPU offloading (#618)
Signed-off-by: mudler <mudler@localai.io> Co-authored-by: mudler <mudler@localai.io>
This commit is contained in:
parent
6c94f3cd67
commit
d3d3187e51
5 changed files with 11 additions and 47 deletions
|
@ -1,4 +1,4 @@
|
|||
ARG GO_VERSION=1.20
|
||||
ARG GO_VERSION=1.20-bullseye
|
||||
|
||||
FROM golang:$GO_VERSION as requirements
|
||||
|
||||
|
@ -9,7 +9,7 @@ ARG CUDA_MINOR_VERSION=7
|
|||
ENV BUILD_TYPE=${BUILD_TYPE}
|
||||
|
||||
RUN apt-get update && \
|
||||
apt-get install -y ca-certificates cmake curl
|
||||
apt-get install -y ca-certificates cmake curl patch
|
||||
|
||||
# CuBLAS requirements
|
||||
RUN if [ "${BUILD_TYPE}" = "cublas" ]; then \
|
||||
|
@ -67,4 +67,4 @@ HEALTHCHECK --interval=1m --timeout=10m --retries=10 \
|
|||
CMD curl -f $HEALTHCHECK_ENDPOINT || exit 1
|
||||
|
||||
EXPOSE 8080
|
||||
ENTRYPOINT [ "/build/entrypoint.sh" ]
|
||||
ENTRYPOINT [ "/build/entrypoint.sh" ]
|
Loading…
Add table
Add a link
Reference in a new issue