# Patch notes (text before the first "diff --git" header is not part of the patch):
# - Adds one gallery entry, "qwopus3.5-9b-coder", directly after the document
#   start marker and before the existing "qwen3.6-40b-..." entry.
# - The entry selects the llama-cpp backend and lists two downloads under
#   `files` (the Q4_K_M model and an mmproj file), each with sha256 and uri.
# - `use_jinja:true` has no space after the colon, so YAML reads it as one
#   plain string rather than a mapping; presumably that is the option format
#   the backend expects - confirm.
# - NOTE(review): the description heading names "Qwopus3.5-9B-v3.5" while the
#   entry name and files refer to "Qwopus3.5-9B-Coder" - confirm the text
#   matches this model.
# - NOTE(review): the description ends with a literal "..." line, which looks
#   like truncated text - confirm it is intended.
diff --git a/gallery/index.yaml b/gallery/index.yaml
index a37764bed722..1ff1a21ed82c 100644
--- a/gallery/index.yaml
+++ b/gallery/index.yaml
@@ -1,4 +1,65 @@
 ---
+- name: "qwopus3.5-9b-coder"
+  url: "github:mudler/LocalAI/gallery/virtual.yaml@master"
+  urls:
+    - https://huggingface.co/Jackrong/Qwopus3.5-9B-Coder-GGUF
+  description: |
+    # 🌟 Qwopus3.5-9B-v3.5
+
+    ## 💡 Model Overview & v3.5 Design
+
+    Qwopus3.5-9B-v3.5 is a **data-scaled continuation** of the Qwopus3.5-9B-v3 model.
+
+    The training data in v3.5 is expanded to cover a broader range of domains, including mathematics, programming, puzzle-solving, multilingual dialogue, instruction-following, multi-turn interactions, and STEM-related tasks.
+
+    Qwopus3.5-9B-v3.5 is a reasoning-enhanced model based on **Qwen3.5-9B**, designed for:
+
+    - 🧩 Structured reasoning
+    - 🔧 Tool-augmented workflows
+    - 🔁 Multi-step agentic tasks
+    - ⚡ Token-efficient inference
+
+    Compared with Qwopus3.5-9B-v3, **3.5 version does not introduce a new architecture, RL stage, or template redesign**.
+
+    This version is trained with approximately **2× more SFT data**.
+
+    ## 🎯 Motivation & Generalization Insight
+
+    The motivation behind v3.5 comes from a simple observation:
+
+    > This work is motivated by the hypothesis that scaling high-quality SFT data may further enhance the generalization ability of large language models.
+
+    In earlier Qwopus3.5 experiments, structured reasoning was observed to improve both **accuracy and efficiency**:
+
+    ...
+  license: "apache-2.0"
+  tags:
+    - llm
+    - gguf
+    - reasoning
+  icon: https://cdn-uploads.huggingface.co/production/uploads/66309bd090589b7c65950665/9EnS13MSxNU3snpAgEiLq.jpeg
+  overrides:
+    backend: llama-cpp
+    function:
+      automatic_tool_parsing_fallback: true
+      grammar:
+        disable: true
+    known_usecases:
+      - chat
+    mmproj: llama-cpp/mmproj/Qwopus3.5-9B-Coder-GGUF/mmproj.gguf
+    options:
+      - use_jinja:true
+    parameters:
+      model: llama-cpp/models/Qwopus3.5-9B-Coder-GGUF/Qwopus3.5-9B-coder-Exp-Q4_K_M.gguf
+    template:
+      use_tokenizer_template: true
+  files:
+    - filename: llama-cpp/models/Qwopus3.5-9B-Coder-GGUF/Qwopus3.5-9B-coder-Exp-Q4_K_M.gguf
+      sha256: 4e8f836c4afe01e9bf2a9931434ddd15e2a243cd8ec82a0aa3bc6573d4564051
+      uri: https://huggingface.co/Jackrong/Qwopus3.5-9B-Coder-GGUF/resolve/main/Qwopus3.5-9B-coder-Exp-Q4_K_M.gguf
+    - filename: llama-cpp/mmproj/Qwopus3.5-9B-Coder-GGUF/mmproj.gguf
+      sha256: 5c769161b31697b6a2d83d8a806f37ee8ee7104bca15313c608dc53359fa0ef2
+      uri: https://huggingface.co/Jackrong/Qwopus3.5-9B-Coder-GGUF/resolve/main/mmproj.gguf
 - name: "qwen3.6-40b-claude-4.6-opus-deckard-heretic-uncensored-thinking-neo-code-di-imatrix-max"
   url: "github:mudler/LocalAI/gallery/virtual.yaml@master"
   urls: