|
1 | 1 | --- |
| 2 | +- name: "qwopus-glm-18b-merged" |
| 3 | + url: "github:mudler/LocalAI/gallery/virtual.yaml@master" |
| 4 | + urls: |
| 5 | + - https://huggingface.co/Jackrong/Qwopus-GLM-18B-Merged-GGUF |
| 6 | + description: | |
| 7 | + # 🪐 Qwen3.5-9B-GLM5.1-Distill-v1 |
| 8 | + |
| 9 | + ## 📌 Model Overview |
| 10 | + |
| 11 | + **Model Name:** `Jackrong/Qwen3.5-9B-GLM5.1-Distill-v1` |
| 12 | + **Base Model:** Qwen3.5-9B |
| 13 | + **Training Type:** Supervised Fine-Tuning (SFT, Distillation) |
| 14 | + **Parameter Scale:** 9B |
| 15 | + **Training Framework:** Unsloth |
| 16 | + |
| 17 | + This model is a distilled variant of **Qwen3.5-9B**, trained on high-quality reasoning data derived from **GLM-5.1**. |
| 18 | + |
| 19 | + The primary goals are to: |
| 20 | + |
| 21 | + - Improve **structured reasoning ability** |
| 22 | + - Enhance **instruction-following consistency** |
| 23 | + - Activate **latent knowledge via better reasoning structure** |
| 24 | + |
| 25 | + ## 📊 Training Data |
| 26 | + |
| 27 | + ### Main Dataset |
| 28 | + |
| 29 | + - `Jackrong/GLM-5.1-Reasoning-1M-Cleaned` |
| 30 | + - Cleaned from the original `Kassadin88/GLM-5.1-1000000x` dataset. |
| 31 | + - Generated from a **GLM-5.1 teacher model** |
| 32 | + - Approximately **700x** the scale of `Qwen3.5-reasoning-700x` |
| 33 | + - Training used a **filtered subset**, not the full source dataset. |
| 34 | + |
| 35 | + ### Auxiliary Dataset |
| 36 | + |
| 37 | + - `Jackrong/Qwen3.5-reasoning-700x` |
| 38 | + |
| 39 | + ... |
| 40 | + license: "apache-2.0" |
| 41 | + tags: |
| 42 | + - llm |
| 43 | + - gguf |
| 44 | + - reasoning |
| 45 | + icon: https://cdn-uploads.huggingface.co/production/uploads/66309bd090589b7c65950665/BnSg_x99v9bG9T5-8sKa1.png |
| 46 | + overrides: |
| 47 | + backend: llama-cpp |
| 48 | + function: |
| 49 | + automatic_tool_parsing_fallback: true |
| 50 | + grammar: |
| 51 | + disable: true |
| 52 | + known_usecases: |
| 53 | + - chat |
| 54 | + options: |
| 55 | + - use_jinja:true |
| 56 | + parameters: |
| 57 | + model: llama-cpp/models/Qwopus-GLM-18B-Merged-GGUF/Qwopus-GLM-18B-Healed-Q4_K_M.gguf |
| 58 | + template: |
| 59 | + use_tokenizer_template: true |
| 60 | + files: |
| 61 | + - filename: llama-cpp/models/Qwopus-GLM-18B-Merged-GGUF/Qwopus-GLM-18B-Healed-Q4_K_M.gguf |
| 62 | + sha256: 13bd039f95c9ea46ef1d75905faa7be6ca4e47a5af9d4cf62e298a738a5b195f |
| 63 | + uri: https://huggingface.co/Jackrong/Qwopus-GLM-18B-Merged-GGUF/resolve/main/Qwopus-GLM-18B-Healed-Q4_K_M.gguf |
2 | 64 | - name: "qwen3.6-35b-a3b-apex" |
3 | 65 | url: "github:mudler/LocalAI/gallery/virtual.yaml@master" |
4 | 66 | urls: |
|
0 commit comments