From 36c7036be59bac6de6c97f3f6d5cf17bb2b27181 Mon Sep 17 00:00:00 2001 From: mudler <2420543+mudler@users.noreply.github.com> Date: Sat, 16 May 2026 01:01:30 +0000 Subject: [PATCH] chore(model gallery): :robot: add new models via gallery agent Signed-off-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> --- gallery/index.yaml | 62 ++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 62 insertions(+) diff --git a/gallery/index.yaml b/gallery/index.yaml index f00dfd6283de..0a078c2574f1 100644 --- a/gallery/index.yaml +++ b/gallery/index.yaml @@ -1,4 +1,66 @@ --- +- name: "qwen3.6-35b-a3b-mtp" + url: "github:mudler/LocalAI/gallery/virtual.yaml@master" + urls: + - https://huggingface.co/unsloth/Qwen3.6-35B-A3B-MTP-GGUF + description: | + # Qwen3.6-35B-A3B + + [](https://chat.qwen.ai) + + > [!Note] + > This repository contains model weights and configuration files for the post-trained model in the Hugging Face Transformers format. + > + > These artifacts are compatible with Hugging Face Transformers, vLLM, SGLang, KTransformers, etc. + + Following the February release of the Qwen3.5 series, we're pleased to share the first open-weight variant of Qwen3.6. Built on direct feedback from the community, Qwen3.6 prioritizes stability and real-world utility, offering developers a more intuitive, responsive, and genuinely productive coding experience. + + ## Qwen3.6 Highlights + + This release delivers substantial upgrades, particularly in + + - **Agentic Coding:** the model now handles frontend workflows and repository-level reasoning with greater fluency and precision. + - **Thinking Preservation:** we've introduced a new option to retain reasoning context from historical messages, streamlining iterative development and reducing overhead. + + For more details, please refer to our blog post Qwen3.6-35B-A3B. + + ## Model Overview + + ... + license: "apache-2.0" + tags: + - llm + - gguf + - qwen + icon: https://qianwen-res.oss-cn-beijing.aliyuncs.com/Qwen3.6/Figures/qwen3.6_35b_a3b_score.png + overrides: + backend: llama-cpp + function: + automatic_tool_parsing_fallback: true + grammar: + disable: true + known_usecases: + - chat + mmproj: llama-cpp/mmproj/Qwen3.6-35B-A3B-MTP-GGUF/mmproj-F32.gguf + options: + - use_jinja:true + parameters: + min_p: 0 + model: llama-cpp/models/Qwen3.6-35B-A3B-MTP-GGUF/Qwen3.6-35B-A3B-UD-Q4_K_M.gguf + presence_penalty: 1.5 + repeat_penalty: 1 + temperature: 0.7 + top_k: 20 + top_p: 0.8 + template: + use_tokenizer_template: true + files: + - filename: llama-cpp/models/Qwen3.6-35B-A3B-MTP-GGUF/Qwen3.6-35B-A3B-UD-Q4_K_M.gguf + sha256: 0b21525e972670ed59e1812e170b27c26355381f0656ecc4e25617ece7dac58b + uri: https://huggingface.co/unsloth/Qwen3.6-35B-A3B-MTP-GGUF/resolve/main/Qwen3.6-35B-A3B-UD-Q4_K_M.gguf + - filename: llama-cpp/mmproj/Qwen3.6-35B-A3B-MTP-GGUF/mmproj-F32.gguf + sha256: 2c52a4ccbc8f0fdb716fb526bfee9506ed0092b2e6dc5d593759f7d200146663 + uri: https://huggingface.co/unsloth/Qwen3.6-35B-A3B-MTP-GGUF/resolve/main/mmproj-F32.gguf - name: "qwen3.6-40b-claude-4.6-opus-deckard-heretic-uncensored-thinking-neo-code-di-imatrix-max" url: "github:mudler/LocalAI/gallery/virtual.yaml@master" urls: