From dda2653d6bbd68eb827f36cefb79cc128bdc4e00 Mon Sep 17 00:00:00 2001 From: rampa3 <68955305+rampa3@users.noreply.github.com> Date: Tue, 27 Jan 2026 14:11:52 +0100 Subject: [PATCH 1/2] chore(model gallery): Add entry for Mistral Small 3.1 with mmproj Signed-off-by: rampa3 <68955305+rampa3@users.noreply.github.com> --- gallery/index.yaml | 31 +++++++++++++++++++++++++++++++ 1 file changed, 31 insertions(+) diff --git a/gallery/index.yaml b/gallery/index.yaml index 941f041c67f0..5b2261b36df7 100644 --- a/gallery/index.yaml +++ b/gallery/index.yaml @@ -11344,6 +11344,37 @@ - filename: mistralai_Mistral-Small-3.1-24B-Instruct-2503-Q4_K_M.gguf sha256: c5743c1bf39db0ae8a5ade5df0374b8e9e492754a199cfdad7ef393c1590f7c0 uri: huggingface://bartowski/mistralai_Mistral-Small-3.1-24B-Instruct-2503-GGUF/mistralai_Mistral-Small-3.1-24B-Instruct-2503-Q4_K_M.gguf +- !!merge <<: *mistral03 + name: "mistralai_mistral-small-3.1-24b-instruct-2503-multimodal" + urls: + - https://huggingface.co/mistralai/Mistral-Small-3.1-24B-Instruct-2503 + - https://huggingface.co/bartowski/mistralai_Mistral-Small-3.1-24B-Instruct-2503-GGUF + description: | + Building upon Mistral Small 3 (2501), Mistral Small 3.1 (2503) adds state-of-the-art vision understanding and enhances long context capabilities up to 128k tokens without compromising text performance. With 24 billion parameters, this model achieves top-tier capabilities in both text and vision tasks. + This model is an instruction-finetuned version of: Mistral-Small-3.1-24B-Base-2503. + + Mistral Small 3.1 can be deployed locally and is exceptionally "knowledge-dense," fitting within a single RTX 4090 or a 32GB RAM MacBook once quantized. + + This gallery entry includes mmproj for multimodality. + tags: + - llm + - gguf + - gpu + - mistral + - cpu + - function-calling + - multimodal + overrides: + parameters: + model: mistralai_Mistral-Small-3.1-24B-Instruct-2503-Q4_K_M.gguf + mmproj: mmproj-mistralai_Mistral-Small-3.1-24B-Instruct-2503-f16.gguf + files: + - filename: mistralai_Mistral-Small-3.1-24B-Instruct-2503-Q4_K_M.gguf + sha256: c5743c1bf39db0ae8a5ade5df0374b8e9e492754a199cfdad7ef393c1590f7c0 + uri: huggingface://bartowski/mistralai_Mistral-Small-3.1-24B-Instruct-2503-GGUF/mistralai_Mistral-Small-3.1-24B-Instruct-2503-Q4_K_M.gguf + - filename: mmproj-mistralai_Mistral-Small-3.1-24B-Instruct-2503-f16.gguf + sha256: f5add93ad360ef6ccba571bba15e8b4bd4471f3577440a8b18785f8707d987ed + uri: huggingface://bartowski/mistralai_Mistral-Small-3.1-24B-Instruct-2503-GGUF/mmproj-mistralai_Mistral-Small-3.1-24B-Instruct-2503-f16.gguf - !!merge <<: *mistral03 url: "github:mudler/LocalAI/gallery/chatml.yaml@master" name: "gryphe_pantheon-rp-1.8-24b-small-3.1" From faeaecba9124b4c241e5c43c22b96d1411cf5fea Mon Sep 17 00:00:00 2001 From: rampa3 <68955305+rampa3@users.noreply.github.com> Date: Tue, 27 Jan 2026 14:23:56 +0100 Subject: [PATCH 2/2] Use llama-cpp subfolder structure akin to Qwen 3 VL Signed-off-by: rampa3 <68955305+rampa3@users.noreply.github.com> --- gallery/index.yaml | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/gallery/index.yaml b/gallery/index.yaml index 5b2261b36df7..c3fa5cf5fa3a 100644 --- a/gallery/index.yaml +++ b/gallery/index.yaml @@ -11366,13 +11366,13 @@ - multimodal overrides: parameters: - model: mistralai_Mistral-Small-3.1-24B-Instruct-2503-Q4_K_M.gguf - mmproj: mmproj-mistralai_Mistral-Small-3.1-24B-Instruct-2503-f16.gguf + model: llama-cpp/models/mistralai_Mistral-Small-3.1-24B-Instruct-2503-Q4_K_M.gguf + mmproj: llama-cpp/mmproj/mmproj-mistralai_Mistral-Small-3.1-24B-Instruct-2503-f16.gguf files: - - filename: mistralai_Mistral-Small-3.1-24B-Instruct-2503-Q4_K_M.gguf + - filename: llama-cpp/models/mistralai_Mistral-Small-3.1-24B-Instruct-2503-Q4_K_M.gguf sha256: c5743c1bf39db0ae8a5ade5df0374b8e9e492754a199cfdad7ef393c1590f7c0 uri: huggingface://bartowski/mistralai_Mistral-Small-3.1-24B-Instruct-2503-GGUF/mistralai_Mistral-Small-3.1-24B-Instruct-2503-Q4_K_M.gguf - - filename: mmproj-mistralai_Mistral-Small-3.1-24B-Instruct-2503-f16.gguf + - filename: llama-cpp/mmproj/mmproj-mistralai_Mistral-Small-3.1-24B-Instruct-2503-f16.gguf sha256: f5add93ad360ef6ccba571bba15e8b4bd4471f3577440a8b18785f8707d987ed uri: huggingface://bartowski/mistralai_Mistral-Small-3.1-24B-Instruct-2503-GGUF/mmproj-mistralai_Mistral-Small-3.1-24B-Instruct-2503-f16.gguf - !!merge <<: *mistral03