Spaces:
Sleeping
Sleeping
# ============================================================
# Dockerfile -- Qwen CPU-only inference API for Hugging Face Spaces
# No GPU required. Port 7860.
#
# NOTE(review): the original header named "Qwen3.5-0.8B", but the build
# step below downloads Qwen/Qwen2.5-0.5B-Instruct. Confirm which model
# app.py actually loads and override MODEL_ID (--build-arg) if it differs.
# ============================================================
FROM python:3.11-slim

# -- System deps --
# update + install + list cleanup stay in one layer so the apt index is
# never stale and never shipped in the image.
# NOTE(review): nothing in this file uses git; drop it if app.py and the
# Python deps do not need it.
RUN apt-get update \
    && apt-get install -y --no-install-recommends git \
    && rm -rf /var/lib/apt/lists/*

# -- Python deps --
# torch is installed on its own from the CPU wheel index so the CUDA
# build is not pulled in.
# NOTE(review): all packages are unpinned; pin versions (or use a
# requirements.txt with pins) for reproducible builds.
RUN pip install --no-cache-dir \
        torch --index-url https://download.pytorch.org/whl/cpu
RUN pip install --no-cache-dir \
        accelerate \
        fastapi \
        huggingface_hub \
        pydantic \
        transformers \
        uvicorn

# -- Unprivileged runtime user --
# Hugging Face Spaces runs Docker containers as UID 1000, so the user is
# created with that UID and owns /app.
RUN useradd --create-home --uid 1000 user \
    && mkdir -p /app \
    && chown user:user /app
ENV HOME=/home/user

# -- Hugging Face cache location --
# HF_HOME alone would make the default hub cache $HF_HOME/hub, which is
# NOT where the download below writes (cache_dir=/tmp/hf_cache).
# HF_HUB_CACHE points default lookups at the same directory, so the
# pre-downloaded weights are found whether or not app.py passes cache_dir.
ENV HF_HOME=/tmp/hf_cache \
    HF_HUB_CACHE=/tmp/hf_cache

# -- Pre-download model at build time (weights are baked into the image) --
# Runs as the runtime user so the cache is owned by, and writable for,
# UID 1000 without a separate chown layer duplicating the weights.
# ARG values are exposed to RUN as environment variables.
ARG MODEL_ID=Qwen/Qwen2.5-0.5B-Instruct
USER user
RUN python3 -c "import os; from huggingface_hub import snapshot_download; snapshot_download(os.environ['MODEL_ID'], cache_dir='/tmp/hf_cache')"

# -- Copy app --
WORKDIR /app
COPY --chown=user:user app.py .

# EXPOSE is documentation only; app.py is expected to bind this port.
EXPOSE 7860
CMD ["python3", "app.py"]