Skip to content

Commit ec21b58

Browse files
authored
chore(model gallery): add smolvlm-256m-instruct (#5412)
Signed-off-by: Ettore Di Giacinto <[email protected]>
1 parent 996259b commit ec21b58

File tree

2 files changed

+49
-0
lines changed

2 files changed

+49
-0
lines changed

gallery/index.yaml

Lines changed: 30 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,34 @@
11
---
2+
- &smolvlm
3+
url: "github:mudler/LocalAI/gallery/smolvlm.yaml@master"
4+
name: "smolvlm-256m-instruct"
5+
icon: https://huggingface.co/datasets/huggingface/documentation-images/resolve/main/SmolVLM_256_banner.png
6+
urls:
7+
- https://huggingface.co/HuggingFaceTB/SmolVLM-256M-Instruct
8+
- https://huggingface.co/ggml-org/SmolVLM-256M-Instruct-GGUF
9+
license: apache-2.0
10+
description: |
11+
SmolVLM-256M is the smallest multimodal model in the world. It accepts arbitrary sequences of image and text inputs to produce text outputs. It's designed for efficiency. SmolVLM can answer questions about images, describe visual content, or transcribe text. Its lightweight architecture makes it suitable for on-device applications while maintaining strong performance on multimodal tasks. It can run inference on one image with under 1GB of GPU RAM.
12+
tags:
13+
- llm
14+
- gguf
15+
- gpu
16+
- cpu
17+
- vision
18+
- multimodal
19+
- smolvlm
20+
- image-to-text
21+
overrides:
22+
parameters:
23+
model: SmolVLM-256M-Instruct-Q8_0.gguf
24+
mmproj: mmproj-SmolVLM-256M-Instruct-Q8_0.gguf
25+
files:
26+
- filename: mmproj-SmolVLM-256M-Instruct-Q8_0.gguf
27+
sha256: 7e943f7c53f0382a6fc41b6ee0c2def63ba4fded9ab8ed039cc9e2ab905e0edd
28+
uri: huggingface://ggml-org/SmolVLM-256M-Instruct-GGUF/mmproj-SmolVLM-256M-Instruct-Q8_0.gguf
29+
- filename: SmolVLM-256M-Instruct-Q8_0.gguf
30+
sha256: 2a31195d3769c0b0fd0a4906201666108834848db768af11de1d2cef7cd35e65
31+
uri: huggingface://ggml-org/SmolVLM-256M-Instruct-GGUF/SmolVLM-256M-Instruct-Q8_0.gguf
232
- &qwen3
333
url: "github:mudler/LocalAI/gallery/qwen3.yaml@master"
434
name: "qwen3-30b-a3b"

gallery/smolvlm.yaml

Lines changed: 19 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,19 @@
1+
---
2+
name: smolvlm
3+
# yamllint disable-line rule:trailing-spaces
4+
config_file: |
5+
mmap: true
6+
template:
7+
chat_message: |
8+
{{if eq .RoleName "assistant"}}Assistant{{else if eq .RoleName "system"}}System{{else if eq .RoleName "user"}}User{{end}}: {{.Content }}<end_of_utterance>
9+
chat: "<|im_start|>\n{{.Input -}}\nAssistant: "
10+
completion: |
11+
{{- .Input}}
12+
f16: true
13+
stopwords:
14+
- '<|im_end|>'
15+
- '<dummy32000>'
16+
- '</s>'
17+
- '<|'
18+
- '<end_of_utterance>'
19+
- '<|endoftext|>'

0 commit comments

Comments
 (0)