Gguf-size-test / Dockerfile
Boning c
Update Dockerfile
a80269e verified
raw
history blame contribute delete
413 Bytes
# Image that bundles one quantized GGUF model with the llama.cpp "full" image
# and starts it in server mode.
# NOTE(review): the `full` tag is mutable; pin it by digest once a known-good
# build has been identified so rebuilds are reproducible.
FROM ghcr.io/ggml-org/llama.cpp:full

# wget is needed for the model download below. ca-certificates is listed
# explicitly because --no-install-recommends would otherwise skip it and the
# HTTPS download could fail. The apt lists are removed in the same layer so
# they do not add to the image size.
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        ca-certificates \
        wget \
    && rm -rf /var/lib/apt/lists/*

# Bake the model file into the image at a fixed path in the filesystem root.
# --progress=dot:giga keeps the build log short for a very large download.
RUN wget --progress=dot:giga \
        -O /aquif-3-moe-17b-a2.8b-thinking.i1-Q4_K_M.gguf \
        "https://huggingface.co/mradermacher/aquif-3-moe-17b-a2.8b-thinking-i1-GGUF/resolve/main/aquif-3-moe-17b-a2.8b-thinking.i1-Q4_K_M.gguf"

# Documents the port passed to the server via --port below.
EXPOSE 7860

# No executable is named here, so these are arguments for the ENTRYPOINT
# inherited from the base image (presumably its tool dispatcher - confirm
# against the base image). Listens on all interfaces on port 7860, loads the
# model downloaded above, and passes -n 512 and --no-warmup through unchanged.
CMD ["--server", "-m", "/aquif-3-moe-17b-a2.8b-thinking.i1-Q4_K_M.gguf", "--port", "7860", "--host", "0.0.0.0", "-n", "512", "--no-warmup"]