From b807863aef58acbbea272caf9bda3603552d120a Mon Sep 17 00:00:00 2001
From: mudler <2420543+mudler@users.noreply.github.com>
Date: Wed, 24 Dec 2025 00:01:47 +0000
Subject: [PATCH] chore(model gallery): :robot: add new models via gallery agent

Signed-off-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com>
---
Notes (ignored by `git am`, not part of the commit):
  * Adds a single gallery entry for the i1 Q4_K_M GGUF quantization of
    Qwen3-Coder-30B-A3B-Instruct-RTPurbo, configured for the llama-cpp
    backend with the tokenizer's own chat template.
  * "A3B" in the model name refers to roughly 3B activated parameters of a
    Mixture-of-Experts model; the description was corrected accordingly.
  * The post-image hash on the `index` line predates that description fix;
    regenerate the patch if an exact blob hash is required (e.g. for
    `git am --3way`).

 gallery/index.yaml | 31 +++++++++++++++++++++++++++++++
 1 file changed, 31 insertions(+)

diff --git a/gallery/index.yaml b/gallery/index.yaml
index a8bdba1d6a3f..80c4bd2c4f9d 100644
--- a/gallery/index.yaml
+++ b/gallery/index.yaml
@@ -1,4 +1,35 @@
 ---
+- name: "qwen3-coder-30b-a3b-instruct-rtpurbo-i1"
+  urls:
+    - https://huggingface.co/mradermacher/Qwen3-Coder-30B-A3B-Instruct-RTPurbo-i1-GGUF
+  description: |
+    The model in question is a quantized version of the original **Qwen3-Coder** large language model, specifically tailored for code generation. The base model, **RTP-LLM/Qwen3-Coder-30B-A3B-Instruct-RTPurbo**, is a 30B-parameter variant optimized for instruction-following and code-related tasks. It uses a **Mixture-of-Experts (MoE)** architecture (the "A3B" suffix denotes roughly 3B parameters activated per token) and is trained on diverse data to excel in programming and logical reasoning. The current repository provides a quantized (compressed) version of this model, which is suitable for deployment on hardware with limited memory but loses some precision compared to the original. For a high-fidelity version, the unquantized base model is recommended.
+  tags:
+    - llm
+    - code
+    - instruction-tuned
+    - text-to-text
+    - gguf
+    - qwen3
+  overrides:
+    parameters:
+      model: llama-cpp/models/Qwen3-Coder-30B-A3B-Instruct-RTPurbo.i1-Q4_K_M.gguf
+    name: Qwen3-Coder-30B-A3B-Instruct-RTPurbo-i1-GGUF
+    backend: llama-cpp
+    template:
+      use_tokenizer_template: true
+    known_usecases:
+      - chat
+    function:
+      grammar:
+        disable: true
+    description: Imported from https://huggingface.co/mradermacher/Qwen3-Coder-30B-A3B-Instruct-RTPurbo-i1-GGUF
+    options:
+      - use_jinja:true
+  files:
+    - filename: llama-cpp/models/Qwen3-Coder-30B-A3B-Instruct-RTPurbo.i1-Q4_K_M.gguf
+      sha256: a25f1817a557da703ab685e6b98550cd7ed87e4a74573b5057e6e2f26b21140e
+      uri: https://huggingface.co/mradermacher/Qwen3-Coder-30B-A3B-Instruct-RTPurbo-i1-GGUF/resolve/main/Qwen3-Coder-30B-A3B-Instruct-RTPurbo.i1-Q4_K_M.gguf
 - name: "glm-4.5v-i1"
   urls:
     - https://huggingface.co/mradermacher/GLM-4.5V-i1-GGUF