# Patch for gallery/index.yaml: adds one gallery entry,
# "agentica-org_deepscaler-1.5b-preview", placed after the last `files:` item
# of the preceding entry (huihui-ai ... Q4_K_M.gguf) and before the `&qwen2`
# anchor entry.
#
# The new entry:
#   - merges the `*deepseek-r1` anchor via `!!merge <<:`; that anchor is
#     defined outside this hunk, so the keys it contributes are not visible
#     here.
#   - sets name, icon, urls and a literal-block (`|`) description directly.
#   - sets overrides.parameters.model to the same GGUF filename that appears
#     under files[0].filename.
#   - lists a single file with its sha256 and a huggingface:// uri.
#
# Hunk arithmetic: 3 context lines before + 3 after (6 old lines), plus
# 15 added lines = 21 new lines, matching the `@@ -5909,6 +5909,21 @@` header.
#
# NOTE(review): line breaks and indentation below were reconstructed from a
# whitespace-collapsed copy of this patch, following the YAML nesting implied
# by the keys and the hunk line counts — confirm against the original patch
# before applying.
diff --git a/gallery/index.yaml b/gallery/index.yaml
index bc837f92..0a1fcf36 100644
--- a/gallery/index.yaml
+++ b/gallery/index.yaml
@@ -5909,6 +5909,21 @@
     - filename: huihui-ai_DeepSeek-R1-Distill-Llama-70B-abliterated-Q4_K_M.gguf
       sha256: 2ed91d01c4b7a0f33f578c6389d0dd6a64d071b3f7963c40b4e1e71235dc74d6
       uri: huggingface://bartowski/huihui-ai_DeepSeek-R1-Distill-Llama-70B-abliterated-GGUF/huihui-ai_DeepSeek-R1-Distill-Llama-70B-abliterated-Q4_K_M.gguf
+- !!merge <<: *deepseek-r1
+  name: "agentica-org_deepscaler-1.5b-preview"
+  icon: https://avatars.githubusercontent.com/u/174067447?s=200&v=4
+  urls:
+    - https://huggingface.co/agentica-org/DeepScaleR-1.5B-Preview
+    - https://huggingface.co/bartowski/agentica-org_DeepScaleR-1.5B-Preview-GGUF
+  description: |
+    DeepScaleR-1.5B-Preview is a language model fine-tuned from DeepSeek-R1-Distilled-Qwen-1.5B using distributed reinforcement learning (RL) to scale up to long context lengths. The model achieves 43.1% Pass@1 accuracy on AIME 2024, representing a 15% improvement over the base model (28.8%) and surpassing OpenAI's O1-Preview performance with just 1.5B parameters.
+  overrides:
+    parameters:
+      model: agentica-org_DeepScaleR-1.5B-Preview-Q4_K_M.gguf
+  files:
+    - filename: agentica-org_DeepScaleR-1.5B-Preview-Q4_K_M.gguf
+      sha256: bf51b412360a84792ae9145e2ca322379234c118dbff498ff08e589253b67ded
+      uri: huggingface://bartowski/agentica-org_DeepScaleR-1.5B-Preview-GGUF/agentica-org_DeepScaleR-1.5B-Preview-Q4_K_M.gguf
 - &qwen2
   url: "github:mudler/LocalAI/gallery/chatml.yaml@master" ## Start QWEN2
   name: "qwen2-7b-instruct"