Update app.py
Browse files
app.py
CHANGED
|
@@ -46,7 +46,7 @@ GPUS = {
|
|
| 46 |
"RTX 5090": {"FP32":201.00, "FP16": 402.00, "INT4":1676.0},
|
| 47 |
|
| 48 |
# Data center / Tesla / A-series
|
| 49 |
-
"Tesla T4": {"FP32": 8.10, "FP16":
|
| 50 |
"Tesla V100": {"FP32": 15.70, "FP16": 31.40, "INT4": 0.0},
|
| 51 |
"NVIDIA A10": {"FP32": 31.20, "FP16": 62.40, "INT4": 0.0},
|
| 52 |
"A100": {"FP32": 19.50, "FP16": 39.00, "INT4": 624.0},
|
|
@@ -78,6 +78,22 @@ GPUS = {
|
|
| 78 |
"MI100": {"FP32": 23.10, "FP16": 46.20, "INT4": 0.0},
|
| 79 |
"MI200": {"FP32":300.0, "FP16": 600.0, "INT4":3000.0},
|
| 80 |
"MI300": {"FP32":400.0, "FP16": 800.0, "INT4":4000.0},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 81 |
}
|
| 82 |
|
| 83 |
# ------------------------
|
|
|
|
| 46 |
"RTX 5090": {"FP32":201.00, "FP16": 402.00, "INT4":1676.0},
|
| 47 |
|
| 48 |
# Data center / Tesla / A-series
|
| 49 |
+
"Tesla T4": {"FP32": 8.10, "FP16": 65.13, "INT4": 0.0},
|
| 50 |
"Tesla V100": {"FP32": 15.70, "FP16": 31.40, "INT4": 0.0},
|
| 51 |
"NVIDIA A10": {"FP32": 31.20, "FP16": 62.40, "INT4": 0.0},
|
| 52 |
"A100": {"FP32": 19.50, "FP16": 39.00, "INT4": 624.0},
|
|
|
|
| 78 |
"MI100": {"FP32": 23.10, "FP16": 46.20, "INT4": 0.0},
|
| 79 |
"MI200": {"FP32":300.0, "FP16": 600.0, "INT4":3000.0},
|
| 80 |
"MI300": {"FP32":400.0, "FP16": 800.0, "INT4":4000.0},
|
| 81 |
+
# Hopper / Grace Hopper / Grace Blackwell parts
|
| 82 |
+
"H200": {"FP32": 350.0, "FP16": 700.0, "INT4": 3500.0},
|
| 83 |
+
"GH200": {"FP32": 300.0, "FP16": 600.0, "INT4": 3000.0}, # H100-class GPU + Grace CPU
|
| 84 |
+
"GB10": {"FP32": 400.0, "FP16": 800.0, "INT4": 4000.0}, # dev module, Blackwell-class
|
| 85 |
+
|
| 86 |
+
# Datacenter inference GPUs (Ada Lovelace: L20; Ampere: A40, A2)
|
| 87 |
+
"L20": {"FP32": 44.0, "FP16": 88.0, "INT4": 700.0},
|
| 88 |
+
"A40": {"FP32": 37.4, "FP16": 74.8, "INT4": 600.0},
|
| 89 |
+
"A2": {"FP32": 4.5, "FP16": 9.0, "INT4": 160.0},
|
| 90 |
+
|
| 91 |
+
# RTX workstation GPUs (Ampere A-series, plus the Ada-generation flagship)
|
| 92 |
+
"RTX A2000": {"FP32": 8.0, "FP16": 16.0, "INT4": 0.0},
|
| 93 |
+
"RTX A4000": {"FP32": 19.2, "FP16": 38.4, "INT4": 0.0},
|
| 94 |
+
"RTX A4500": {"FP32": 23.7, "FP16": 47.4, "INT4": 0.0},
|
| 95 |
+
"RTX A5000": {"FP32": 27.8, "FP16": 55.6, "INT4": 0.0},
|
| 96 |
+
"RTX A6000 Ada": {"FP32": 91.1, "FP16": 182.2, "INT4": 1450.0},
|
| 97 |
}
|
| 98 |
|
| 99 |
# ------------------------
|