From 13bf048cfcc7d0168cc41ecfea5e3b927e36a95a Mon Sep 17 00:00:00 2001
From: Ettore Di Giacinto
Date: Wed, 27 Nov 2024 18:44:53 +0100
Subject: [PATCH 1/4] chore(model): add llama-3.1-tulu-3-70b-dpo model config (#4276)

Signed-off-by: Ettore Di Giacinto
---
 gallery/index.yaml | 15 +++++++++++++++
 1 file changed, 15 insertions(+)

diff --git a/gallery/index.yaml b/gallery/index.yaml
index 57a9ee8c..406989f5 100644
--- a/gallery/index.yaml
+++ b/gallery/index.yaml
@@ -3176,6 +3176,21 @@
     - filename: Tulu-3.1-8B-SuperNova.i1-Q4_K_M.gguf
       sha256: c6cc2e1a4c3d2338973ca0050af1cf4462b3f62838f62b4c8a204f2a74eeb01f
       uri: huggingface://mradermacher/Tulu-3.1-8B-SuperNova-i1-GGUF/Tulu-3.1-8B-SuperNova.i1-Q4_K_M.gguf
+- !!merge <<: *llama31
+  name: "llama-3.1-tulu-3-70b-dpo"
+  icon: "https://huggingface.co/datasets/allenai/blog-images/resolve/main/tulu3/Tulu3-logo.png"
+  urls:
+    - https://huggingface.co/allenai/Llama-3.1-Tulu-3-70B-DPO
+    - https://huggingface.co/bartowski/Llama-3.1-Tulu-3-70B-DPO-GGUF
+  description: |
+    Tülu3 is a leading instruction following model family, offering fully open-source data, code, and recipes designed to serve as a comprehensive guide for modern post-training techniques. Tülu3 is designed for state-of-the-art performance on a diversity of tasks in addition to chat, such as MATH, GSM8K, and IFEval.
+  overrides:
+    parameters:
+      model: Llama-3.1-Tulu-3-70B-DPO-Q4_K_M.gguf
+  files:
+    - filename: Llama-3.1-Tulu-3-70B-DPO-Q4_K_M.gguf
+      sha256: e2d9c59736274f9dd94f30ef3edcee68fec1d6649eb01d6bad7e3e8a6024f77d
+      uri: huggingface://bartowski/Llama-3.1-Tulu-3-70B-DPO-GGUF/Llama-3.1-Tulu-3-70B-DPO-Q4_K_M.gguf
 - &deepseek
   ## Deepseek
   url: "github:mudler/LocalAI/gallery/deepseek.yaml@master"

From fa20628b3a685c1404271aaff49ba3f6f2a46677 Mon Sep 17 00:00:00 2001
From: Ettore Di Giacinto
Date: Wed, 27 Nov 2024 19:01:54 +0100
Subject: [PATCH 2/4] chore(model): add llama-3.1-tulu-3-8b-sft to the gallery (#4277)

Signed-off-by: Ettore Di Giacinto
---
 gallery/index.yaml | 15 +++++++++++++++
 1 file changed, 15 insertions(+)

diff --git a/gallery/index.yaml b/gallery/index.yaml
index 406989f5..2cfd61c8 100644
--- a/gallery/index.yaml
+++ b/gallery/index.yaml
@@ -3191,6 +3191,21 @@
     - filename: Llama-3.1-Tulu-3-70B-DPO-Q4_K_M.gguf
       sha256: e2d9c59736274f9dd94f30ef3edcee68fec1d6649eb01d6bad7e3e8a6024f77d
       uri: huggingface://bartowski/Llama-3.1-Tulu-3-70B-DPO-GGUF/Llama-3.1-Tulu-3-70B-DPO-Q4_K_M.gguf
+- !!merge <<: *llama31
+  name: "llama-3.1-tulu-3-8b-sft"
+  icon: "https://huggingface.co/datasets/allenai/blog-images/resolve/main/tulu3/Tulu3-logo.png"
+  urls:
+    - https://huggingface.co/allenai/Llama-3.1-Tulu-3-8B-SFT
+    - https://huggingface.co/bartowski/Llama-3.1-Tulu-3-8B-SFT-GGUF
+  description: |
+    Tülu3 is a leading instruction following model family, offering fully open-source data, code, and recipes designed to serve as a comprehensive guide for modern post-training techniques. Tülu3 is designed for state-of-the-art performance on a diversity of tasks in addition to chat, such as MATH, GSM8K, and IFEval.
+  overrides:
+    parameters:
+      model: Llama-3.1-Tulu-3-8B-SFT-Q4_K_M.gguf
+  files:
+    - filename: Llama-3.1-Tulu-3-8B-SFT-Q4_K_M.gguf
+      sha256: 3fad2c96aa9b9de19c2cda0f88a381c47ac768ca03a95059d9f6c439791f8592
+      uri: huggingface://bartowski/Llama-3.1-Tulu-3-8B-SFT-GGUF/Llama-3.1-Tulu-3-8B-SFT-Q4_K_M.gguf
 - &deepseek
   ## Deepseek
   url: "github:mudler/LocalAI/gallery/deepseek.yaml@master"

From 5f688d7a8d53f2cc1610b7bb11710ecfe82420e9 Mon Sep 17 00:00:00 2001
From: Ettore Di Giacinto
Date: Wed, 27 Nov 2024 19:02:05 +0100
Subject: [PATCH 3/4] chore(model): add eva-qwen2.5-72b-v0.2 to the gallery (#4278)

Signed-off-by: Ettore Di Giacinto
---
 gallery/index.yaml | 17 +++++++++++++++++
 1 file changed, 17 insertions(+)

diff --git a/gallery/index.yaml b/gallery/index.yaml
index 2cfd61c8..b4b73e4b 100644
--- a/gallery/index.yaml
+++ b/gallery/index.yaml
@@ -1614,6 +1614,23 @@
     - filename: Q2.5-MS-Mistoria-72b-v2-Q4_K_M.gguf
       sha256: 33df8aac5a790d1c286fe0fc4f9d340311f282eca19b78db6f7abb845923425c
       uri: huggingface://bartowski/Q2.5-MS-Mistoria-72b-v2-GGUF/Q2.5-MS-Mistoria-72b-v2-Q4_K_M.gguf
+- !!merge <<: *qwen25
+  name: "eva-qwen2.5-72b-v0.2"
+  urls:
+    - https://huggingface.co/EVA-UNIT-01/EVA-Qwen2.5-72B-v0.2
+    - https://huggingface.co/bartowski/EVA-Qwen2.5-72B-v0.2-GGUF
+  description: |
+    A RP/storywriting specialist model, full-parameter finetune of Qwen2.5-72B on mixture of synthetic and natural data.
+    It uses Celeste 70B 0.1 data mixture, greatly expanding it to improve versatility, creativity and "flavor" of the resulting model.
+
+    Version notes for 0.2: Optimized training hyperparameters and increased sequence length. Better instruction following deeper into context and less repetition.
+  overrides:
+    parameters:
+      model: EVA-Qwen2.5-72B-v0.2-Q4_K_M.gguf
+  files:
+    - filename: EVA-Qwen2.5-72B-v0.2-Q4_K_M.gguf
+      sha256: 03ea0ecac3ee24a332ca43cf925b669c58714b9754be0f4bc232bd996681ef4b
+      uri: huggingface://bartowski/EVA-Qwen2.5-72B-v0.2-GGUF/EVA-Qwen2.5-72B-v0.2-Q4_K_M.gguf
 - &archfunct
   license: apache-2.0
   tags:

From 0597f3b9e9d9ab4d6d6d9e97a017105574bba4de Mon Sep 17 00:00:00 2001
From: "LocalAI [bot]" <139863280+localai-bot@users.noreply.github.com>
Date: Wed, 27 Nov 2024 23:24:47 +0100
Subject: [PATCH 4/4] chore: :arrow_up: Update ggerganov/llama.cpp to `3ad5451f3b75809e3033e4e577b9f60bcaf6676a` (#4280)

:arrow_up: Update ggerganov/llama.cpp

Signed-off-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com>
Co-authored-by: mudler <2420543+mudler@users.noreply.github.com>
---
 Makefile | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/Makefile b/Makefile
index 83ce9661..69ba3539 100644
--- a/Makefile
+++ b/Makefile
@@ -8,7 +8,7 @@ DETECT_LIBS?=true
 # llama.cpp versions
 GOLLAMA_REPO?=https://github.com/go-skynet/go-llama.cpp
 GOLLAMA_VERSION?=2b57a8ae43e4699d3dc5d1496a1ccd42922993be
-CPPLLAMA_VERSION?=30ec39832165627dd6ed98938df63adfc6e6a21a
+CPPLLAMA_VERSION?=3ad5451f3b75809e3033e4e577b9f60bcaf6676a
 
 # whisper.cpp version
 WHISPER_REPO?=https://github.com/ggerganov/whisper.cpp