Priya / Dockerfile
AparnaHerself's picture
Update Dockerfile
5f236f1 verified
raw
history blame contribute delete
407 Bytes
# Base image: the llama.cpp server image published on GHCR.
# NOTE(review): the `server` tag carries no version, so a rebuild may pick up a
# different upstream build; consider pinning a versioned tag or an @sha256 digest.
FROM ghcr.io/ggml-org/llama.cpp:server
# Relative paths in the instructions below (e.g. model.gguf) resolve against /app.
WORKDIR /app
# Fetch the Llama 3.2 3B Instruct (Q4_K_M) GGUF weights and store them as
# model.gguf in the working directory.
#   * --no-install-recommends, plus removing /var/lib/apt/lists in this same
#     layer, keeps apt residue out of the image.
#   * ca-certificates is listed explicitly so the HTTPS download can still be
#     verified now that recommended packages are no longer pulled in.
#   * --progress=dot:giga stops wget from flooding the build log while it
#     downloads a large file.
# NOTE(review): the URL tracks the `main` revision and the file is not
# checksum-verified; pin a commit revision and check a sha256 if reproducible
# builds matter.
RUN apt-get update && \
    apt-get install -y --no-install-recommends \
        ca-certificates \
        wget && \
    rm -rf /var/lib/apt/lists/* && \
    wget --progress=dot:giga \
        https://huggingface.co/bartowski/Llama-3.2-3B-Instruct-GGUF/resolve/main/Llama-3.2-3B-Instruct-Q4_K_M.gguf \
        -O model.gguf
# Default arguments for the server; this file defines no ENTRYPOINT, so they are
# presumably appended to the one inherited from the base image (verify upstream).
#   -m model.gguf    model file downloaded above (relative to WORKDIR /app)
#   --host 0.0.0.0   listen on all interfaces so the port is reachable from
#                    outside the container
#   --port 7860      listening port
#   -c 32768         context window of 32,768 tokens
# NOTE(review): a larger context window increases memory use and does not by
# itself make inference faster; lower -c if the host is memory-constrained.
CMD ["-m", "model.gguf", "--host", "0.0.0.0", "--port", "7860", "-c", "32768"]