From ad97bcbbddd0b2b3397035ba591115739aff9b77 Mon Sep 17 00:00:00 2001 From: "LocalAI [bot]" <139863280+localai-bot@users.noreply.github.com> Date: Thu, 2 Jul 2026 19:16:09 +0200 Subject: [PATCH] chore(model gallery): :robot: add 1 new models via gallery agent (#10644) chore(model gallery): :robot: add new models via gallery agent Signed-off-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> Co-authored-by: mudler <2420543+mudler@users.noreply.github.com> --- gallery/index.yaml | 57 ++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 57 insertions(+) diff --git a/gallery/index.yaml b/gallery/index.yaml index 143f23c25..61e4cf39e 100644 --- a/gallery/index.yaml +++ b/gallery/index.yaml @@ -1,4 +1,61 @@ --- +- name: "ornith-1.0-9b-mtp" + url: "github:mudler/LocalAI/gallery/virtual.yaml@master" + urls: + - https://huggingface.co/protoLabsAI/Ornith-1.0-9B-MTP-GGUF + description: | + [](https://deep-reinforce.com/ornith.html) + + # Ornith-1.0-9B + + Aloha! 🌺 Today, we are releasing Ornith-1.0, a self-improving family of open-source models for agentic coding. + + Highlights: + + - **State-of-the-Art Coding Agents**: Available in 9B-Dense, 31B-Dense, 35B-MoE, and 397B-MoE (post-trained on top of Gemma 4 and Qwen 3.5), achieving state-of-the-art performance among open-source models of comparable size on coding benchmarks such as Terminal-Bench 2.1, SWE-Bench, NL2Repo and OpenClaw. + - **Self-Improving Training Framework**:  Ornith-1.0 employs RL to learn to generate not only solution rollouts, but also the scaffold that drives those rollouts. By jointly optimizing the scaffold and the resulting solution, the model discovers better search trajectories and generates higher-quality solutions. + - **Licence**: MIT licensed, globally accessible, and free from regional limitations. 
+ + ## Ornith 1.0 9B + + This model card documents **Ornith-1.0-9B**, the most lightweight member of the Ornith family, designed for efficient single-GPU deployment. + + ### Benchmarks + + Ornith-1.0-9B + Qwen3.5-9B + Qwen3.5-35B + Gemma4-12B + Gemma4-31B + + Agentic Coding + + ... + license: "mit" + tags: + - llm + - gguf + overrides: + backend: llama-cpp + function: + automatic_tool_parsing_fallback: true + grammar: + disable: true + known_usecases: + - chat + options: + - use_jinja:true + - spec_type:draft-mtp + - spec_n_max:6 + - spec_p_min:0.75 + parameters: + model: llama-cpp/models/ornith-9b-mtp-kl-Q4_K_M/ornith-9b-mtp-kl-Q4_K_M.gguf + template: + use_tokenizer_template: true + files: + - filename: llama-cpp/models/ornith-9b-mtp-kl-Q4_K_M/ornith-9b-mtp-kl-Q4_K_M.gguf + sha256: 03de14e9849a02258b9ac9ec2830af39dd7ac48f1ca5492b35539d1838707bc8 + uri: https://huggingface.co/protoLabsAI/Ornith-1.0-9B-MTP-GGUF/resolve/main/ornith-9b-mtp-kl-Q4_K_M.gguf - name: "qwen-agentworld-35b-a3b" url: "github:mudler/LocalAI/gallery/virtual.yaml@master" urls: