# Base image: the slim variant of the official Python 3.10 image.
FROM python:3.10-slim

# Build-time only: keeps apt/debconf from prompting during `docker build`.
# Declared as ARG rather than ENV so it is visible to the RUN steps that
# follow in this stage but is not left in the running container's environment.
ARG DEBIAN_FRONTEND=noninteractive

# Python behaviour for the service process:
#   PYTHONUNBUFFERED=1         - stdout/stderr are not buffered, so log lines
#                                appear immediately in the container logs.
#   PYTHONDONTWRITEBYTECODE=1  - Python does not write .pyc files.
ENV PYTHONUNBUFFERED=1 \
    PYTHONDONTWRITEBYTECODE=1

# SECURITY: HF_TOKEN is intentionally NOT accepted as a build ARG and NOT
# persisted with ENV. Values passed through ARG/ENV are stored in the image
# metadata (readable via `docker history` / `docker inspect`), which would
# leak the Hugging Face token to anyone who can pull the image.
# Provide the token when the container starts instead, e.g.
#   docker run -e HF_TOKEN=... <image>
# or through the hosting platform's secret mechanism. If a build step ever
# needs the token, use a BuildKit secret mount:
#   RUN --mount=type=secret,id=HF_TOKEN ...

# Relative paths in the COPY/RUN/CMD instructions that follow resolve
# against /code.
WORKDIR /code

# System packages, one per line in alphabetical order. The apt package lists
# are deleted in the same layer so they never end up in the image.
# NOTE(review): the toolchain and BLAS/OpenMP headers are presumably needed to
# build native Python dependencies from requirements.txt - confirm.
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        build-essential \
        curl \
        git \
        libomp-dev \
        libopenblas-dev \
    && rm -rf /var/lib/apt/lists/*

# Install the Python dependencies before the application source is copied,
# so this layer is rebuilt only when requirements.txt itself changes.
COPY requirements.txt ./
RUN pip install --no-cache-dir --requirement requirements.txt

# Additional packages installed on top of requirements.txt.
# NOTE(review): these are unpinned, so a rebuild may pull different versions;
# consider pinning them (or moving them into requirements.txt).
RUN pip install --no-cache-dir \
        huggingface-hub \
        sentencepiece

# Runtime configuration baked into the image (overridable at `docker run`).
#   API_PORT               - same value as the port used by EXPOSE and CMD.
#                            NOTE(review): CMD hard-codes 7860 and does not
#                            read this variable; presumably the app does.
#   MODEL_ID               - model identifier; presumably read by the app
#                            (not visible in this file).
#   HF_HOME, HF_HUB_CACHE,
#   HUGGINGFACE_HUB_CACHE  - all three point at the same directory,
#                            /data/huggingface.
ENV API_PORT=7860 \
    MODEL_ID=google/gemma-3-4b-it \
    HF_HOME=/data/huggingface \
    HF_HUB_CACHE=/data/huggingface \
    HUGGINGFACE_HUB_CACHE=/data/huggingface

# Run the service as an unprivileged account instead of root, and give that
# account ownership of the directories it needs rather than making /data
# world-writable (chmod -R 777).
#   - /data/huggingface is created here and owned by the runtime user.
#   - /code is handed to the runtime user as well so the app can write next to
#     its sources if it needs to.
# NOTE(review): UID 1000 is chosen because port 7860 suggests a Hugging Face
# Docker Space, which runs containers as UID 1000 - confirm for your platform.
# A volume mounted over /data at run time must be writable by this UID.
RUN useradd --create-home --uid 1000 appuser \
    && mkdir -p /data/huggingface \
    && chown -R appuser:appuser /code /data

# Application source, copied last so code changes do not invalidate the
# dependency layers; files are owned by the runtime user.
COPY --chown=appuser:appuser . .

# Everything from here on (including the container's main process) runs
# without root privileges.
USER appuser

# Documents the port the server listens on; it does not publish the port.
EXPOSE 7860

# Exec form: uvicorn runs without a wrapping shell and serves the `app`
# object from the `app` module on all interfaces, port 7860.
CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]