# Ollama server for a Hugging Face Space: serves the Ollama API on port 7860
# and pulls the Qwen3 8B model at container start.

# Base image tag. Defaults to "latest" (the original behaviour); pass
# --build-arg OLLAMA_VERSION=<release> to pin a release for reproducible builds.
ARG OLLAMA_VERSION=latest
FROM ollama/ollama:${OLLAMA_VERSION}

# HF Spaces (free CPU) expects port 7860, so bind the server there on all
# interfaces. Only one model is kept loaded at a time.
ENV OLLAMA_HOST=0.0.0.0:7860 \
    OLLAMA_MAX_LOADED_MODELS=1

# Documentation only; the port the server binds is set by OLLAMA_HOST above.
EXPOSE 7860

# NOTE(review): HF Spaces reportedly runs containers as UID 1000. Confirm the
# Ollama model directory is writable for that user (or point OLLAMA_MODELS at
# a writable path) -- not changed here.

# Clear the base image's entrypoint so CMD can run an arbitrary shell script.
ENTRYPOINT []

# Startup sequence (exec form, so the script is passed to sh verbatim):
#   1. Start the Ollama server in the background and remember its PID.
#   2. Forward TERM/INT to the server so a container stop shuts it down.
#   3. Poll `ollama list` until the server answers instead of sleeping a fixed
#      time; give up if the server process has already died.
#   4. Pull Qwen3 8B (quantized for CPU); exit non-zero if the pull fails.
#   5. Block on the server process, so the container exits when the server
#      exits rather than being kept alive artificially.
CMD ["/bin/sh", "-c", "\
ollama serve & \
server_pid=$!; \
trap 'kill $server_pid' TERM INT; \
until ollama list >/dev/null 2>&1; do \
  kill -0 $server_pid 2>/dev/null || exit 1; \
  sleep 1; \
done; \
ollama pull qwen3:8b-q4_K_M || exit 1; \
echo '✅ Qwen3 8B ready!'; \
wait $server_pid"]