| # fly.toml - Fly.io deployment configuration | |
| # Deploy with: fly launch | |
| app = "cascade-llm-router" | |
| primary_region = "sjc" | |
| [build] | |
| dockerfile = "Dockerfile" | |
| [env] | |
| PORT = "8080" | |
| PYTHONPATH = "/app/src" | |
| [http_service] | |
| internal_port = 8080 | |
| force_https = true | |
| auto_stop_machines = true | |
| auto_start_machines = true | |
| min_machines_running = 0 | |
| processes = ["app"] | |
| [[http_service.checks]] | |
| grace_period = "10s" | |
| interval = "30s" | |
| method = "GET" | |
| timeout = "5s" | |
| path = "/health" | |
| [[vm]] | |
| cpu_kind = "shared" | |
| cpus = 1 | |
| memory_mb = 512 | |