feat: bump llama.cpp, add gguf support (#943)

**Description** This PR syncs the `llama` backend to use `gguf` (https://github.com/go-skynet/go-llama.cpp/pull/180). It also adds `llama-stable` to the targets so we can still load ggml. It adapts the current tests to use the `llama-backend` for ggml and uses a `gguf` model to run tests on the new backend. In order to consume the new version of go-llama.cpp, it also bumps Go to 1.21 (images, pipelines, etc.). --------- Signed-off-by: Ettore Di Giacinto <mudler@localai.io>
2025-05-28 14:35:00 +00:00 · 2023-08-24 01:18:58 +02:00 · 2023-08-24 01:18:58 +02:00 · 1120847f72
commit 1120847f72
parent 704323b805
7 changed files with 89 additions and 16 deletions
--- a/.github/workflows/release.yaml
+++ b/.github/workflows/release.yaml
@@ -22,6 +22,9 @@ jobs:
        uses: actions/checkout@v3
        with:
          submodules: true
+      - uses: actions/setup-go@v4
+        with:
+          go-version: '>=1.21.0'
      - name: Dependencies
        run: |
          sudo apt-get update
@@ -60,6 +63,9 @@ jobs:
        uses: actions/checkout@v3
        with:
          submodules: true
+      - uses: actions/setup-go@v4
+        with:
+          go-version: '>=1.21.0'
      - name: Build
        id: build
        env:
--- a/.github/workflows/test.yml
+++ b/.github/workflows/test.yml
@@ -18,7 +18,7 @@ jobs:
    runs-on: ubuntu-latest
    strategy:
      matrix:
-        go-version: ['1.20.x', 'stable']
+        go-version: ['1.21.x']
    steps:
      - name: Clone
        uses: actions/checkout@v3
@@ -63,7 +63,7 @@ jobs:
    runs-on: macOS-latest
    strategy:
      matrix:
-        go-version: ['1.20.x', 'stable']
+        go-version: ['1.21.x']
    steps:
      - name: Clone
        uses: actions/checkout@v3