chute_config: GPU restricted to 4090/3090, max_hourly_price 0.50
Browse files- chute_config.yml +42 -0
chute_config.yml
CHANGED
|
@@ -7,6 +7,47 @@ Image:
|
|
| 7 |
NodeSelector:
|
| 8 |
gpu_count: 1
|
| 9 |
min_vram_gb_per_gpu: 16
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10 |
|
| 11 |
Chute:
|
| 12 |
timeout_seconds: 300
|
|
@@ -14,3 +55,4 @@ Chute:
|
|
| 14 |
max_instances: 5
|
| 15 |
scaling_threshold: 0.5
|
| 16 |
shutdown_after: 288000
|
|
|
|
|
|
| 7 |
NodeSelector:
|
| 8 |
gpu_count: 1
|
| 9 |
min_vram_gb_per_gpu: 16
|
| 10 |
+
# Restrict to 4090 / 3090 only. Chutes rejects an include-list that names only
|
| 11 |
+
# consumer GPUs (see incident M32 in MISTAKES.md), so exclude everything else instead.
|
| 12 |
+
exclude:
|
| 13 |
+
# Blackwell
|
| 14 |
+
- 5090
|
| 15 |
+
- 5080
|
| 16 |
+
- b200
|
| 17 |
+
- b100
|
| 18 |
+
# Hopper
|
| 19 |
+
- h100
|
| 20 |
+
- h100_sxm
|
| 21 |
+
- h100_nvl
|
| 22 |
+
- h200
|
| 23 |
+
# Ampere data center / workstation
|
| 24 |
+
- a100
|
| 25 |
+
- a100_40gb
|
| 26 |
+
- a100_80gb
|
| 27 |
+
- a6000
|
| 28 |
+
- a40
|
| 29 |
+
- a10
|
| 30 |
+
- a10g
|
| 31 |
+
# Lovelace data center
|
| 32 |
+
- l4
|
| 33 |
+
- l40
|
| 34 |
+
- l40s
|
| 35 |
+
# RTX PRO workstation (Blackwell generation)
|
| 36 |
+
- pro_6000
|
| 37 |
+
- rtx_pro_6000
|
| 38 |
+
- rtx_pro_4000
|
| 39 |
+
- rtx_pro_4500
|
| 40 |
+
- rtx_pro_5000
|
| 41 |
+
# AMD
|
| 42 |
+
- mi300x
|
| 43 |
+
- mi300a
|
| 44 |
+
- mi250x
|
| 45 |
+
- mi210
|
| 46 |
+
# Older data center
|
| 47 |
+
- v100
|
| 48 |
+
- t4
|
| 49 |
+
- p100
|
| 50 |
+
- k80
|
| 51 |
|
| 52 |
Chute:
|
| 53 |
timeout_seconds: 300
|
|
|
|
| 55 |
max_instances: 5
|
| 56 |
scaling_threshold: 0.5
|
| 57 |
shutdown_after: 288000
|
| 58 |
+
max_hourly_price: 0.50
|