scorevision: push artifact
Browse files- chute_config.yml +34 -0
chute_config.yml
ADDED
|
@@ -0,0 +1,34 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Container image definition: the base image and the commands layered on it.
# NOTE(review): nesting reconstructed from a flattened diff view — confirm
# against the committed chute_config.yml.
Image:
  from_base: parachutes/python:3.12
  run_command:
    # Upgrade packaging tooling before installing the runtime dependencies.
    - pip install --upgrade setuptools wheel
    # Folded scalar (>-): the lines below are joined with single spaces into
    # one `pip install ...` command string, identical to the one-line form.
    - >-
      pip install
      'numpy>=1.23'
      'onnxruntime-gpu>=1.16'
      'nvidia-cudnn-cu12>=9.0'
      'nvidia-cublas-cu12>=12.8'
      'nvidia-cuda-runtime-cu12>=12.8'
      'opencv-python>=4.7'
      'pillow>=9.5'
      'huggingface_hub>=0.19.4'
      'pydantic>=2.0'
      'pyyaml>=6.0'
      'aiohttp>=3.9'
      'torch>=2.8'
|
| 6 |
+
|
| 7 |
+
# Hardware constraints for the nodes this chute may be scheduled on.
# NOTE(review): nesting reconstructed from a flattened diff view — confirm
# against the committed chute_config.yml.
NodeSelector:
  gpu_count: 1
  min_vram_gb_per_gpu: 16
  # max_hourly_price_per_gpu belongs in NodeSelector, not Chute.
  # pro_6000 lists at $1.80/hr on api.chutes.ai/pricing; 2.00 leaves headroom.
  max_hourly_price_per_gpu: 2.00
  # TEE mandate for new SN44 chutes: include=['pro_6000'] + Chute.tee=true.
  include:
    - "pro_6000"
  # Chutes caps exclude at 5 entries. Pattern taken from the production
  # person/vehicle chute. Quoted so "5090" stays a string, not an integer.
  exclude:
    - "5090"
    - "b200"
    - "h200"
    - "mi300x"
|
| 22 |
+
|
| 23 |
+
# Runtime/scaling parameters passed to the Chute constructor.
# NOTE(review): nesting reconstructed from a flattened diff view — confirm
# against the committed chute_config.yml.
Chute:
  # Chute.__init__ only accepts these params; anything else is silently
  # dropped by safe_instantiate() in the template. Two previously-used keys
  # were dropped this way: `shutdown_after` (the real name is
  # `shutdown_after_seconds`) and `timeout_seconds` (not a Chute param).
  # With the idle setting never applied, chutes auto-deprovisioned after
  # 5 min of idle.
  concurrency: 4
  max_instances: 5
  scaling_threshold: 0.5
  shutdown_after_seconds: 288000  # 288000 s = 80 h idle tolerance
  # SDK source has Chute(tee: bool = False) — required for new SN44 chutes.
  tee: true
|