Spaces:
Sleeping
Sleeping
deploy
Browse files
app.py
CHANGED
|
@@ -106,6 +106,7 @@ def _predict_generic(context, TP, DP, concurrency, gpu_type, coeffs):
|
|
| 106 |
|
| 107 |
def predict_latency(model, context, TP, DP, concurrency, gpu_type):
|
| 108 |
if TP * DP > 8:
|
|
|
|
| 109 |
msg = "⚠️ Invalid configuration: TP × DP must not exceed 8 GPUs."
|
| 110 |
return (msg, msg)
|
| 111 |
if gpu_type not in ["8× H100", "8× H200"]:
|
|
|
|
| 106 |
|
| 107 |
def predict_latency(model, context, TP, DP, concurrency, gpu_type):
|
| 108 |
if TP * DP > 8:
|
| 109 |
+
print("")
|
| 110 |
msg = "⚠️ Invalid configuration: TP × DP must not exceed 8 GPUs."
|
| 111 |
return (msg, msg)
|
| 112 |
if gpu_type not in ["8× H100", "8× H200"]:
|