Gguf-size-test / Dockerfile
Boning c
Update Dockerfile
59fff27 verified
raw
history blame contribute delete
314 Bytes
# Image that bundles the gpt-oss-20b Q2_K GGUF weights with llama.cpp and
# starts its server on port 7860.

# NOTE(review): ":full" is a moving tag, so rebuilds can silently pick up a
# different llama.cpp; pin a release tag or digest for reproducible builds.
FROM ghcr.io/ggml-org/llama.cpp:full

# Install the downloader. update + install + list cleanup share one layer so
# the package index is never stale and never persists in the image.
# ca-certificates is listed explicitly because --no-install-recommends would
# otherwise skip it, and the download below is over HTTPS.
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        ca-certificates \
        wget \
    && rm -rf /var/lib/apt/lists/*

# Fetch the model weights at build time so the container needs no network
# access to start. dot:giga keeps the build log short for this large file.
RUN wget --progress=dot:giga \
        "https://huggingface.co/unsloth/gpt-oss-20b-GGUF/resolve/main/gpt-oss-20b-Q2_K.gguf" \
        -O /gpt-oss-20b-Q2_K.gguf

# Documents the port passed to --port below; EXPOSE does not publish it.
EXPOSE 7860

# No executable is named here, so these are arguments handed to the ENTRYPOINT
# inherited from the base image. The -m path must match the wget -O path
# above; binding to 0.0.0.0 makes the server reachable from outside the
# container.
CMD ["--server", "-m", "/gpt-oss-20b-Q2_K.gguf", "--port", "7860", "--host", "0.0.0.0", "-n", "512", "--no-warmup"]