Spaces:
Sleeping
Sleeping
Update Deployment_UI_BE.py
Browse files: Deployment_UI_BE.py (+5 -8)
Deployment_UI_BE.py
CHANGED
|
@@ -751,12 +751,9 @@ async def api_infer(req: Request):
|
|
| 751 |
# ---------------------------------------------------------------------
|
| 752 |
@router.post("/api/middleware/infer")
|
| 753 |
async def api_middleware_infer(req: Request):
|
| 754 |
-
|
| 755 |
-
|
| 756 |
-
|
| 757 |
-
{"error": "predictRoute unresolved; check ROUTE_PROBE logs and HEALTH results."},
|
| 758 |
-
status_code=428
|
| 759 |
-
)
|
| 760 |
|
| 761 |
payload = await req.json()
|
| 762 |
prompt = payload.get("prompt")
|
|
@@ -786,8 +783,9 @@ async def api_middleware_infer(req: Request):
|
|
| 786 |
proxy_base = f"http://{ip}:{port}"
|
| 787 |
_log_status(f"PROMPT_BASE direct={proxy_base}")
|
| 788 |
|
|
|
|
| 789 |
if not proxy_base:
|
| 790 |
-
return JSONResponse({"error": "
|
| 791 |
|
| 792 |
url = f"{proxy_base}{route}"
|
| 793 |
_log_status(f"PROMPT_ENDPOINT {url}")
|
|
@@ -834,7 +832,6 @@ async def api_middleware_infer(req: Request):
|
|
| 834 |
except Exception as e:
|
| 835 |
_job_log("compute", f"[MW] ERROR infer: {e}")
|
| 836 |
return JSONResponse({"error": f"middleware infer failed: {e}"}, status_code=502)
|
| 837 |
-
|
| 838 |
# ---------------------------------------------------------------------
|
| 839 |
# Job progress + callback routes
|
| 840 |
# ---------------------------------------------------------------------
|
|
|
|
| 751 |
# ---------------------------------------------------------------------
|
| 752 |
@router.post("/api/middleware/infer")
|
| 753 |
async def api_middleware_infer(req: Request):
|
| 754 |
+
# Always ensure predictRoute exists
|
| 755 |
+
route = _INST.get("predictRoute") or "/predict"
|
| 756 |
+
_INST["predictRoute"] = route
|
|
|
|
|
|
|
|
|
|
| 757 |
|
| 758 |
payload = await req.json()
|
| 759 |
prompt = payload.get("prompt")
|
|
|
|
| 783 |
proxy_base = f"http://{ip}:{port}"
|
| 784 |
_log_status(f"PROMPT_BASE direct={proxy_base}")
|
| 785 |
|
| 786 |
+
# If neither path is available, do not gate—return clear error
|
| 787 |
if not proxy_base:
|
| 788 |
+
return JSONResponse({"error": "no reachable base yet (no proxy or ip/port)"}, status_code=503)
|
| 789 |
|
| 790 |
url = f"{proxy_base}{route}"
|
| 791 |
_log_status(f"PROMPT_ENDPOINT {url}")
|
|
|
|
| 832 |
except Exception as e:
|
| 833 |
_job_log("compute", f"[MW] ERROR infer: {e}")
|
| 834 |
return JSONResponse({"error": f"middleware infer failed: {e}"}, status_code=502)
|
|
|
|
| 835 |
# ---------------------------------------------------------------------
|
| 836 |
# Job progress + callback routes
|
| 837 |
# ---------------------------------------------------------------------
|