---
# Docker Compose definition for the policy-analysis service.
#
# `version` is kept for older docker-compose releases that still read it;
# the current Compose Specification treats it as informational only.
version: '3.8'

services:
  policy-analysis:
    # Build the image from the Dockerfile in this directory.
    build:
      context: .
      dockerfile: Dockerfile

    # Publish container port 7860 on host port 7860 (quoted so the
    # HOST:CONTAINER pair is always read as a string).
    ports:
      - "7860:7860"

    environment:
      # Models are already cached in the image
      - PRELOAD_MODELS=false

    volumes:
      # Optional: persist model cache
      # NOTE(review): a pre-existing named volume hides whatever the image
      # ships at this path, so the cache may be stale after an image
      # rebuild — confirm this is intended.
      - model_cache:/root/.cache/huggingface

    restart: unless-stopped

    # Probe the HTTP health endpoint from inside the container.
    # NOTE(review): assumes `curl` is installed in the image — confirm.
    healthcheck:
      test: ["CMD", "curl", "-f", "http://localhost:7860/health"]
      interval: 30s
      timeout: 10s
      retries: 3
      start_period: 40s

volumes:
  # Named volume with default driver settings, mounted by policy-analysis.
  model_cache: {}