meaculpitt committed on
Commit
466f5b7
·
verified ·
1 Parent(s): a8c4f6c

scorevision: push artifact

Browse files
Files changed (1) hide show
  1. chute_config.yml +34 -0
chute_config.yml ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Image:
2
+ from_base: parachutes/python:3.12
3
+ run_command:
4
+ - pip install --upgrade setuptools wheel
5
+ - pip install 'numpy>=1.23' 'onnxruntime-gpu>=1.16' 'nvidia-cudnn-cu12>=9.0' 'nvidia-cublas-cu12>=12.8' 'nvidia-cuda-runtime-cu12>=12.8' 'opencv-python>=4.7' 'pillow>=9.5' 'huggingface_hub>=0.19.4' 'pydantic>=2.0' 'pyyaml>=6.0' 'aiohttp>=3.9' 'torch>=2.8'
6
+
7
+ NodeSelector:
8
+ gpu_count: 1
9
+ min_vram_gb_per_gpu: 16
10
+ # max_hourly_price_per_gpu belongs in NodeSelector, not Chute.
11
+ # pro_6000 is listed at $1.80/hr on api.chutes.ai/pricing; a cap of 2.00 leaves headroom.
12
+ max_hourly_price_per_gpu: 2.00
13
+ # New SN44 chutes must run in a TEE: this needs include=['pro_6000'] here plus Chute.tee=true.
14
+ include:
15
+ - "pro_6000"
16
+ # Chutes caps the exclude list at 5 entries. This list follows the pattern used by the production person/vehicle chute.
17
+ exclude:
18
+ - "5090"
19
+ - "b200"
20
+ - "h200"
21
+ - "mi300x"
22
+
23
+ Chute:
24
+ # Chute.__init__ only accepts these params; anything else is silently
25
+ # dropped by safe_instantiate() in the template. Two keys used previously
26
+ # were dropped this way: `shutdown_after` (the real name is
27
+ # `shutdown_after_seconds`) and `timeout_seconds` (not a Chute param).
28
+ # As a result, chutes auto-deprovisioned after 5 min of idle.
29
+ concurrency: 4
30
+ max_instances: 5
31
+ scaling_threshold: 0.5
32
+ shutdown_after_seconds: 288000 # 80h idle tolerance
33
+ # The SDK defaults to Chute(tee: bool = False); new SN44 chutes require tee=true, so set it explicitly.
34
+ tee: true