---
# Docker Compose definition for the qwen3-api service.
#
# NOTE: the top-level `version` key is obsolete under the Compose
# Specification (Compose v2 ignores it with a warning); it is kept here so
# older docker-compose releases still accept the file.
version: "3.9"

services:
  qwen3-api:
    # Build the image from the Dockerfile in this directory and tag it.
    build: .
    image: qwen3-api:latest
    container_name: qwen3-api

    # host:container — quoted so YAML never re-types the mapping.
    ports:
      - "8000:8000"

    volumes:
      # /data is the HF Spaces persistent storage bucket — model lives here
      - /data:/data

    environment:
      # Location of the GGUF file inside the mounted /data volume.
      - MODEL_PATH=/data/qwen3-14b-q4_k_m.gguf
      # Presumably the download source used when MODEL_PATH is missing —
      # TODO confirm against the application code.
      - MODEL_URL=https://huggingface.co/bartowski/Qwen_Qwen3-14B-GGUF/resolve/main/Qwen_Qwen3-14B-Q4_K_M.gguf
      - MODEL_ID=qwen3-14b
      # Inference tuning knobs (names suggest context size, CPU threads and
      # batch size) — verify semantics against the consuming application.
      - N_CTX=4096
      - N_THREADS=8
      - N_BATCH=512
      - VERBOSE=false
      # No value given: Compose passes HF_TOKEN through from the host
      # environment, keeping the secret out of this file.
      - HF_TOKEN

    restart: unless-stopped