Spaces:
Sleeping
Sleeping
File size: 1,836 Bytes
4e16e37 d0b0680 4e16e37 c6b9370 4e16e37 c6b9370 4e16e37 d0b0680 4e16e37 d0b0680 4e16e37 d0b0680 4e16e37 d0b0680 4e16e37 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 | # βββ Stage: Base ββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ
# Hugging Face Spaces uses port 7860 by default.
# We install Ollama (llama.cpp under the hood) for fast CPU inference.
FROM python:3.11-slim
# System dependencies for Ollama install script + curl
RUN apt-get update && apt-get install -y \
curl \
ca-certificates \
bash \
zstd \
&& rm -rf /var/lib/apt/lists/*
# βββ Install Ollama βββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ
RUN curl -fsSL https://ollama.com/install.sh | bash
WORKDIR /app
# βββ Python dependencies ββββββββββββββββββββββββββββββββββββββββββββββββββββββ
COPY requirements.txt .
RUN pip install --no-cache-dir -r requirements.txt
# βββ Copy source code βββββββββββββββββββββββββββββββββββββββββββββββββββββββββ
COPY app/ ./app/
COPY tests/ ./tests/
COPY startup.sh .
RUN chmod +x startup.sh
# βββ Environment ββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ
# Set MOCK_LLM=false to use Ollama. Override at runtime if needed for testing.
ENV MOCK_LLM=false
ENV MODEL_NAME=qwen2.5:0.5b
ENV OLLAMA_HOST=http://localhost:11434
EXPOSE 7860
# startup.sh: boots Ollama, pulls model, starts FastAPI
CMD ["./startup.sh"] |