# Image that serves the ASGI application `app:app` with uvicorn on port 7860.
FROM python:3.10-slim

# Build-time only: keeps apt-get non-interactive while the image is built
# without persisting DEBIAN_FRONTEND into the environment of running containers.
ARG DEBIAN_FRONTEND=noninteractive

# Python runtime behaviour: unbuffered stdout/stderr and no .pyc files.
ENV PYTHONUNBUFFERED=1 \
    PYTHONDONTWRITEBYTECODE=1

WORKDIR /code

# System dependencies (sorted alphabetically for easier diffs). The apt package
# index is removed in the same layer so it does not add to the image size.
RUN apt-get update && apt-get install -y --no-install-recommends \
        build-essential \
        curl \
        git \
        libomp-dev \
        libopenblas-dev \
    && rm -rf /var/lib/apt/lists/*

# Copy only the requirements file first so the dependency layer stays cached
# until requirements.txt itself changes.
COPY requirements.txt .
RUN pip install --no-cache-dir -r requirements.txt

# Hugging Face dependencies.
# NOTE(review): these two packages are unpinned; consider pinning them (or
# moving them into requirements.txt) for reproducible builds.
RUN pip install --no-cache-dir huggingface-hub sentencepiece

# Hugging Face cache locations plus application defaults.
# API_PORT carries the same value as the port hard-coded in EXPOSE/CMD below;
# exec-form CMD performs no variable expansion, so keep the three in sync.
ENV HF_HOME=/data/huggingface \
    HUGGINGFACE_HUB_CACHE=/data/huggingface \
    HF_HUB_CACHE=/data/huggingface \
    MODEL_ID=google/gemma-3-4b-it \
    API_PORT=7860

# Create the cache directory and make /data world-writable.
# NOTE(review): presumably this is so the cache is writable whatever UID the
# container runs as; no USER is set in this file, so the default user applies.
# If the runtime user is known, prefer a dedicated user with a targeted chown.
RUN mkdir -p /data/huggingface && chmod -R 777 /data

# Copy project files.
COPY . .

# The token is declared only after every RUN/COPY step: no build step uses it,
# so it stays out of their environment and a token change no longer
# invalidates the dependency layers above.
# NOTE(security): a value passed with --build-arg HF_TOKEN is still written
# into the image configuration by the ENV below and is readable by anyone who
# can pull or inspect the image. Prefer supplying HF_TOKEN when the container
# starts (e.g. `docker run -e HF_TOKEN=...` or the platform's secret store)
# and building without the build argument.
ARG HF_TOKEN
ENV HF_TOKEN=${HF_TOKEN}

EXPOSE 7860

CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]