From acc3a66a9ef2d5891b96952295a9482f9b014495 Mon Sep 17 00:00:00 2001 From: mudler <2420543+mudler@users.noreply.github.com> Date: Fri, 2 Jan 2026 12:33:40 +0000 Subject: [PATCH] chore(model gallery): :robot: add new models via gallery agent Signed-off-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> --- gallery/index.yaml | 37 +++++++++++++++++++++++++++++++++++++ 1 file changed, 37 insertions(+) diff --git a/gallery/index.yaml b/gallery/index.yaml index acd91884749a..138433264344 100644 --- a/gallery/index.yaml +++ b/gallery/index.yaml @@ -1,4 +1,41 @@ --- +- name: "iquest-coder-v1-40b-instruct-i1" + url: "github:mudler/LocalAI/gallery/virtual.yaml@master" + urls: + - https://huggingface.co/mradermacher/IQuest-Coder-V1-40B-Instruct-i1-GGUF + description: | + The **IQuest-Coder-V1-40B-Instruct-i1-GGUF** is a quantized version of the original **IQuestLab/IQuest-Coder-V1-40B-Instruct** model, designed for efficient deployment. It is an **instruction-following large language model** with 40 billion parameters, optimized for tasks like code generation and reasoning. + + **Key Features:** + - **Size:** 40B parameters (quantized for efficiency). + - **Purpose:** Instruction-based coding and reasoning. + - **Format:** GGUF (supports multi-part files). + - **Quantization:** Uses advanced techniques (e.g., IQ3_M, Q4_K_M) to balance performance and quality. + + **Available Quantizations:** + - Optimized for speed and size: **i1-Q4_K_M** (recommended). + - Smaller, lower-quality options are also available, trading quality for size. + + **Note:** This is a **quantized version** of the original model; the base model (IQuestLab/IQuest-Coder-V1-40B-Instruct) remains the official source. For full functionality, use the unquantized version or verify compatibility with your deployment tools. 
+ overrides: + parameters: + model: llama-cpp/models/IQuest-Coder-V1-40B-Instruct.i1-Q4_K_M.gguf + name: IQuest-Coder-V1-40B-Instruct-i1-GGUF + backend: llama-cpp + template: + use_tokenizer_template: true + known_usecases: + - chat + function: + grammar: + disable: true + description: Imported from https://huggingface.co/mradermacher/IQuest-Coder-V1-40B-Instruct-i1-GGUF + options: + - use_jinja:true + files: + - filename: llama-cpp/models/IQuest-Coder-V1-40B-Instruct.i1-Q4_K_M.gguf + sha256: 0090b84ea8e5a862352cbb44498bd6b4cd38564834182813c35ed84209050b51 + uri: https://huggingface.co/mradermacher/IQuest-Coder-V1-40B-Instruct-i1-GGUF/resolve/main/IQuest-Coder-V1-40B-Instruct.i1-Q4_K_M.gguf - name: "onerec-8b" url: "github:mudler/LocalAI/gallery/virtual.yaml@master" urls: