# Container entrypoint: start the Ollama server, wait for it to accept
# requests, warm up the model, then stay attached to the server process.

# 1. Start the Ollama server in the background. Keep its PID so an early
#    crash can be detected and so the final `wait` targets this process.
echo "Starting Ollama server..."
ollama serve &
ollama_pid=$!

# 2. Wait until the server answers HTTP requests (running a model before the
#    server is up fails). The loop is bounded and checks that the server is
#    still alive, so a failed start makes the container exit with an error
#    instead of polling forever.
# NOTE(review): this polls port 7860, whereas Ollama listens on 11434 unless
# OLLAMA_HOST overrides it -- confirm the image sets OLLAMA_HOST accordingly.
max_attempts=${OLLAMA_START_MAX_ATTEMPTS:-60}
attempt=0
until curl -s localhost:7860 > /dev/null; do
  if ! kill -0 "$ollama_pid" 2> /dev/null; then
    echo "Ollama server exited before becoming ready." >&2
    exit 1
  fi
  attempt=$((attempt + 1))
  if [ "$attempt" -ge "$max_attempts" ]; then
    echo "Timed out waiting for Ollama to start." >&2
    kill "$ollama_pid" 2> /dev/null
    exit 1
  fi
  echo "Waiting for Ollama to start..."
  sleep 2
done

# 3. Pre-download the model by sending it a one-shot prompt; without this the
#    first API call would be very slow. A failure here is reported but is not
#    fatal: the server keeps running, only the warm-up was skipped.
echo "Downloading model: hf.co/apothic/bonsai-8B-1bit-turboquant..."
if ollama run hf.co/apothic/bonsai-8B-1bit-turboquant "hello"; then
  echo "Model ready! Space is running on port 7860."
else
  echo "Warning: model preload failed; the server is still running." >&2
fi

# 4. Block on the server so the Docker container does not exit, and
#    propagate the server's exit status when it eventually stops.
wait "$ollama_pid"