# Image that bundles the Qwen3-0.6B (Q8_0 GGUF) model and starts llama.cpp in
# server mode on port 7860, listening on all interfaces.
# NOTE(review): ":full" is a moving tag; pin a version tag or digest for
# reproducible builds.
FROM ghcr.io/ggerganov/llama.cpp:full

# wget is needed to download the model below. ca-certificates is listed
# explicitly because --no-install-recommends may otherwise leave it out and the
# download is over HTTPS. The apt lists are removed in the same layer so they
# do not end up in the image.
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        ca-certificates \
        wget \
    && rm -rf /var/lib/apt/lists/*

# Bake the model weights into the image at /qwen.gguf (the path passed to -m).
RUN wget "https://huggingface.co/unsloth/Qwen3-0.6B-GGUF/resolve/main/Qwen3-0.6B-Q8_0.gguf" -O /qwen.gguf

# Documentation only: this is the port given to --port in CMD.
EXPOSE 7860

# No ENTRYPOINT is declared here, so these are passed as arguments to whatever
# entrypoint the base image defines (presumably its tool dispatcher, which
# handles "--server" — confirm against the base image).
# "-n 512" presumably caps the number of generated tokens — TODO confirm.
CMD ["--server", "-m", "/qwen.gguf", "--port", "7860", "--host", "0.0.0.0", "-n", "512"]