# Base image: the `full` variant of the llama.cpp container image.
# NOTE(review): `full` is a moving tag, so rebuilds may pick up a different
# llama.cpp version; consider pinning a release tag or digest.
# NOTE(review): the CMD at the end of this file starts with "--server", so it
# presumably relies on the base image's ENTRYPOINT to dispatch on that flag;
# confirm against the base image.
FROM ghcr.io/ggerganov/llama.cpp:full

# Install wget, which the download steps below use to fetch the model files.
# - apt-get is used instead of apt: the apt front end is meant for interactive
#   use and does not promise a stable scripting interface.
# - ca-certificates is listed explicitly because it is only a recommended
#   package of wget, --no-install-recommends skips it, and the downloads
#   below are over HTTPS.
# - The package index is deleted in the same layer so it does not stay in the
#   image.
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        ca-certificates \
        wget \
    && rm -rf /var/lib/apt/lists/*
# Download the GGUF model file (Q8_0) from ggml-org/SmolVLM2-2.2B-Instruct-GGUF
# Fetched while the image is built, so the file is stored in the image at
# /smoll.gguf.
# NOTE(review): the URL resolves against `main`, so the downloaded bytes are
# not pinned to a revision; consider a commit hash or checksum.
RUN wget --output-document=/smoll.gguf \
    "https://huggingface.co/ggml-org/SmolVLM2-2.2B-Instruct-GGUF/resolve/main/SmolVLM2-2.2B-Instruct-Q8_0.gguf"
# Download the mmproj file (Q8_0) from ggml-org/SmolVLM2-2.2B-Instruct-GGUF
# Fetched while the image is built, so the file is stored in the image at
# /mmproj.gguf.
# NOTE(review): the URL resolves against `main`, so the downloaded bytes are
# not pinned to a revision; consider a commit hash or checksum.
RUN wget --output-document=/mmproj.gguf \
    "https://huggingface.co/ggml-org/SmolVLM2-2.2B-Instruct-GGUF/resolve/main/mmproj-SmolVLM2-2.2B-Instruct-Q8_0.gguf"

# Declare the port the server is told to listen on (see "--port" below).
# EXPOSE is documentation only and does not publish the port.
EXPOSE 7860

# Default arguments, in exec form so they are passed without a shell:
#   --server            presumably selects server mode in the base image's
#                       entrypoint; confirm against the base image
#   -m /smoll.gguf      model file downloaded during the build
#   --mmproj /mmproj.gguf  mmproj file downloaded during the build
#   --port 7860 --host 0.0.0.0  listen on port 7860 on all interfaces
#   -n 512              NOTE(review): looks like a cap on tokens generated
#                       per request; confirm against llama.cpp's options
CMD ["--server", "-m", "/smoll.gguf", "--mmproj", "/mmproj.gguf", "--port", "7860", "--host", "0.0.0.0", "-n", "512"]