diff --git a/gallery/index.yaml b/gallery/index.yaml
index 945b6e8a4..48ce727f9 100644
--- a/gallery/index.yaml
+++ b/gallery/index.yaml
@@ -1,4 +1,59 @@
 ---
+- name: "lfm2.5-8b-a1b"
+  url: "github:mudler/LocalAI/gallery/virtual.yaml@master"
+  urls:
+    - https://huggingface.co/LiquidAI/LFM2.5-8B-A1B-GGUF
+  description: |  # literal block: Markdown kept verbatim; '#' lines below are content
+    Try LFM •
+    Docs •
+    LEAP •
+    Discord
+
+    # LFM2.5-8B-A1B
+
+    LFM2.5 is a new family of hybrid models designed for on-device deployment. It builds on the LFM2 architecture with extended pre-training and reinforcement learning.
+
+    - **On-device personal assistant**: Designed to power real-life applications, chaining tool calls, and following complex instructions on all devices.
+    - **Compressed performance**: Competitive with much larger dense and MoE models on instruction following and agentic tasks.
+    - **Unmatched throughput**: Fastest in its size class on both CPU and GPU inference, with day-one support for llama.cpp, MLX, vLLM, and SGLang.
+
+    Find more information about LFM2.5-8B-A1B in our blog post.
+
+    *\*AA-Omniscience Index (higher is better) rewards correct answers and penalizes hallucinations. Scores range from -100 to 100. See more results on Artificial Analysis.*
+
+    ## 🗒️ Model Details
+
+    LFM2.5-8B-A1B is a general-purpose text-only model with the following features:
+
+    ...
+  license: "other"
+  tags:
+    - llm
+    - gguf
+  icon: https://cdn-uploads.huggingface.co/production/uploads/61b8e2ba285851687028d395/qUZVGkns1bg3sZUShBbhv.png
+  overrides:
+    backend: llama-cpp
+    function:
+      automatic_tool_parsing_fallback: true
+      grammar:
+        disable: true  # NOTE(review): presumably pairs with the parsing fallback above; confirm
+    known_usecases:
+      - chat
+    options:
+      - use_jinja:true  # one string in key:value form (no space after ':', so not a mapping)
+    parameters:
+      min_p: 0.15
+      model: llama-cpp/models/LFM2.5-8B-A1B-GGUF/LFM2.5-8B-A1B-Q4_K_M.gguf  # same path as files[0].filename
+      repeat_penalty: 1.05
+      temperature: 0.1
+      top_k: 50
+      top_p: 0.1
+    template:
+      use_tokenizer_template: true
+  files:
+    - filename: llama-cpp/models/LFM2.5-8B-A1B-GGUF/LFM2.5-8B-A1B-Q4_K_M.gguf
+      sha256: 3ef9879143342a46cdd00b5f6f3919b77ee693945f9d73eea99344eadd6950b6  # presumably checked against uri; confirm
+      uri: https://huggingface.co/LiquidAI/LFM2.5-8B-A1B-GGUF/resolve/main/LFM2.5-8B-A1B-Q4_K_M.gguf
 - name: "qwopus3.5-9b-coder-mtp"
   url: "github:mudler/LocalAI/gallery/virtual.yaml@master"
   urls: