Add the "qwen3.6-27b" entry at the top of gallery/index.yaml.

The entry uses the llama-cpp backend and downloads two files from
unsloth/Qwen3.6-27B-GGUF: the Q4_K_M model weights and the F32 mmproj.

NOTE(review): the line breaks and YAML indentation in this hunk were
reconstructed from the key structure; confirm the nesting (in particular
`grammar` under `function`) against the upstream file before applying.

diff --git a/gallery/index.yaml b/gallery/index.yaml
index 892485eda..41b163edd 100644
--- a/gallery/index.yaml
+++ b/gallery/index.yaml
@@ -1,4 +1,66 @@
 ---
+- name: "qwen3.6-27b"
+  url: "github:mudler/LocalAI/gallery/virtual.yaml@master"
+  urls:
+    - https://huggingface.co/unsloth/Qwen3.6-27B-GGUF
+  description: |
+    # Qwen3.6-27B
+
+    [](https://chat.qwen.ai)
+
+    > [!Note]
+    > This repository contains model weights and configuration files for the post-trained model in the Hugging Face Transformers format.
+    >
+    > These artifacts are compatible with Hugging Face Transformers, vLLM, SGLang, KTransformers, etc.
+
+    Following the February release of the Qwen3.5 series, we're pleased to share the first open-weight variant of Qwen3.6. Built on direct feedback from the community, Qwen3.6 prioritizes stability and real-world utility, offering developers a more intuitive, responsive, and genuinely productive coding experience.
+
+    ## Qwen3.6 Highlights
+
+    This release delivers substantial upgrades, particularly in
+
+    - **Agentic Coding:** the model now handles frontend workflows and repository-level reasoning with greater fluency and precision.
+    - **Thinking Preservation:** we've introduced a new option to retain reasoning context from historical messages, streamlining iterative development and reducing overhead.
+
+    For more details, please refer to our blog post Qwen3.6-27B.
+
+    ## Model Overview
+
+    ...
+  license: "apache-2.0"
+  tags:
+    - llm
+    - gguf
+    - qwen
+  icon: https://qianwen-res.oss-cn-beijing.aliyuncs.com/Qwen3.6/Figures/qwen3.6_27b_score.png
+  overrides:
+    backend: llama-cpp
+    function:
+      automatic_tool_parsing_fallback: true
+      grammar:
+        disable: true
+    known_usecases:
+      - chat
+    mmproj: llama-cpp/mmproj/Qwen3.6-27B-GGUF/mmproj-F32.gguf
+    options:
+      - use_jinja:true
+    parameters:
+      min_p: 0
+      model: llama-cpp/models/Qwen3.6-27B-GGUF/Qwen3.6-27B-Q4_K_M.gguf
+      presence_penalty: 1.5
+      repeat_penalty: 1
+      temperature: 0.7
+      top_k: 20
+      top_p: 0.8
+    template:
+      use_tokenizer_template: true
+  files:
+    - filename: llama-cpp/models/Qwen3.6-27B-GGUF/Qwen3.6-27B-Q4_K_M.gguf
+      sha256: 5ed60d0af4650a854b1755bd392f9aef4872643dc25a254bc68043fa638392a0
+      uri: https://huggingface.co/unsloth/Qwen3.6-27B-GGUF/resolve/main/Qwen3.6-27B-Q4_K_M.gguf
+    - filename: llama-cpp/mmproj/Qwen3.6-27B-GGUF/mmproj-F32.gguf
+      sha256: fdc443e974cad1f61c45af1cfd5580855855ddce0d6c14cc500a5714c486ac1d
+      uri: https://huggingface.co/unsloth/Qwen3.6-27B-GGUF/resolve/main/mmproj-F32.gguf
 - name: "qwen3.6-35b-a3b-claude-4.6-opus-reasoning-distilled"
   url: "github:mudler/LocalAI/gallery/virtual.yaml@master"
   urls: