rahul7star's picture
Update Dockerfile
0b69cac verified
raw
history blame
499 Bytes
# Base image: the `full` tag of the ggml-org llama.cpp image hosted on GHCR.
# NOTE(review): the tag is not pinned to a digest, so a rebuild may pull a
# different image than the one this file was last tested against.
FROM ghcr.io/ggml-org/llama.cpp:full
# OS packages: wget downloads the model at container start, python3/pip run
# the app, and ca-certificates lets wget verify the HTTPS download (it is only
# a "recommended" package, so it must be listed once recommends are disabled).
# `apt-get` is used instead of `apt` because `apt` has no stable scripting
# interface. update + install stay in one layer so the index is never stale,
# and the package lists are removed in the same layer to keep the image small.
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        ca-certificates \
        python3 \
        python3-pip \
        wget \
    && rm -rf /var/lib/apt/lists/*

# Python packages for the app; --no-cache-dir keeps pip's download cache out
# of the image layer.
# NOTE(review): versions are unpinned, so builds are not reproducible — pin
# them once known-good versions are established.
RUN pip install --no-cache-dir gradio requests
# Make /app the working directory for everything that follows, then add the
# application script from the build context at /app/app.py.
WORKDIR /app
COPY ["app.py", "/app/app.py"]
# The llama.cpp `full` image ships with ENTRYPOINT set to its /app/tools.sh
# dispatcher. Left in place, the CMD array below would be handed to tools.sh
# as arguments instead of being run as a bash script, so clear it here.
ENTRYPOINT []

# Container start-up, run as a single bash script:
#   1. `set -e` aborts start-up if the model download fails.
#   2. If the model file is absent, download it to a `.part` file and rename
#      it only after wget succeeds, so an interrupted download is never
#      mistaken for a complete model on the next start.
#   3. Start the llama.cpp HTTP server in the background through the image's
#      tools.sh dispatcher (`--server` runs llama-server), listening on
#      0.0.0.0:7860 with -n 512.
#   4. `exec` the Python app in the foreground so it replaces the shell and
#      receives container stop signals directly.
# NOTE(review): gradio's default port is also 7860; confirm app.py binds a
# different port, otherwise it will collide with the server started here.
# NOTE(review): confirm the model filename in the URL matches the file name
# published in the upstream repository.
CMD ["bash", "-c", "\
    set -e; \
    if [ ! -f /gpt-oss-20b_Q4_0.gguf ]; then \
        echo 'Downloading model...'; \
        wget -q 'https://huggingface.co/unsloth/gpt-oss-20b-GGUF/resolve/main/gpt-oss-20b_Q4_0.gguf' -O /gpt-oss-20b_Q4_0.gguf.part; \
        mv /gpt-oss-20b_Q4_0.gguf.part /gpt-oss-20b_Q4_0.gguf; \
    fi; \
    /app/tools.sh --server -m /gpt-oss-20b_Q4_0.gguf --port 7860 --host 0.0.0.0 -n 512 & \
    exec python3 /app/app.py"]