From cf63c1e7d4deee11426a1bfe4dc08468ba8c98cb Mon Sep 17 00:00:00 2001
From: mudler <2420543+mudler@users.noreply.github.com>
Date: Mon, 1 Jun 2026 01:19:59 +0000
Subject: [PATCH] chore(model gallery): :robot: add new models via gallery agent

Signed-off-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com>
---
Reviewer notes (free text in this area is not part of the commit):
Adds one gallery entry, "lfm2.5-8b-a1b", backed by the unsloth UD-Q4_K_M GGUF.
The scraped link labels at the top of the description were removed because
their targets were lost; hunk counts below reflect that removal.
NOTE(review): the trailing hunk context shows an existing entry that is also
named "lfm2.5-8b-a1b"; confirm this is not a duplicate before merging.
NOTE(review): the post-image blob id on the "index" line predates the
description cleanup and was not recomputed.

 gallery/index.yaml | 50 ++++++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 50 insertions(+)

diff --git a/gallery/index.yaml b/gallery/index.yaml
index 97b0d472f67d..475fd6b017de 100644
--- a/gallery/index.yaml
+++ b/gallery/index.yaml
@@ -1,4 +1,54 @@
 ---
+- name: "lfm2.5-8b-a1b"
+  url: "github:mudler/LocalAI/gallery/virtual.yaml@master"
+  urls:
+    - https://huggingface.co/unsloth/LFM2.5-8B-A1B-GGUF
+  description: |
+    # LFM2.5-8B-A1B
+
+    LFM2.5 is a new family of hybrid models designed for on-device deployment. It builds on the LFM2 architecture with extended pre-training and reinforcement learning.
+
+    - **On-device personal assistant**: Designed to power real-life applications, chaining tool calls, and following complex instructions on all devices.
+    - **Compressed performance**: Competitive with much larger dense and MoE models on instruction following and agentic tasks.
+    - **Unmatched throughput**: Fastest in its size class on both CPU and GPU inference, with day-one support for llama.cpp, MLX, vLLM, and SGLang.
+
+    Find more information about LFM2.5-8B-A1B in our blog post.
+
+    **AA-Omniscience Index (higher is better) rewards correct answers and penalizes hallucinations. Scores range from -100 to 100. See more results on Artificial Analysis.*
+
+    ## 🗒️ Model Details
+
+    LFM2.5-8B-A1B is a general-purpose text-only model with the following features:
+
+    ...
+  license: "other"
+  tags:
+    - llm
+    - gguf
+  icon: https://cdn-uploads.huggingface.co/production/uploads/61b8e2ba285851687028d395/qUZVGkns1bg3sZUShBbhv.png
+  overrides:
+    backend: llama-cpp
+    function:
+      automatic_tool_parsing_fallback: true
+      grammar:
+        disable: true
+    known_usecases:
+      - chat
+    options:
+      - use_jinja:true
+    parameters:
+      min_p: 0.15
+      model: llama-cpp/models/LFM2.5-8B-A1B-GGUF/LFM2.5-8B-A1B-UD-Q4_K_M.gguf
+      repeat_penalty: 1.05
+      temperature: 0.1
+      top_k: 50
+      top_p: 0.1
+    template:
+      use_tokenizer_template: true
+  files:
+    - filename: llama-cpp/models/LFM2.5-8B-A1B-GGUF/LFM2.5-8B-A1B-UD-Q4_K_M.gguf
+      sha256: e2c8350d5e6e7c633b2ba4e20805a2c86bc46884cd285e8f3fe36ad917b772c7
+      uri: https://huggingface.co/unsloth/LFM2.5-8B-A1B-GGUF/resolve/main/LFM2.5-8B-A1B-UD-Q4_K_M.gguf
 - name: "lfm2.5-8b-a1b"
   url: "github:mudler/LocalAI/gallery/virtual.yaml@master"
   urls: