Theflame47 committed on
Commit
deb1e79
·
verified ·
1 Parent(s): 4996b19

Update Deployment_UI_BE.py

Browse files
Files changed (1) hide show
  1. Deployment_UI_BE.py +5 -8
Deployment_UI_BE.py CHANGED
@@ -751,12 +751,9 @@ async def api_infer(req: Request):
751
  # ---------------------------------------------------------------------
752
  @router.post("/api/middleware/infer")
753
  async def api_middleware_infer(req: Request):
754
- route = _INST.get("predictRoute")
755
- if not route:
756
- return JSONResponse(
757
- {"error": "predictRoute unresolved; check ROUTE_PROBE logs and HEALTH results."},
758
- status_code=428
759
- )
760
 
761
  payload = await req.json()
762
  prompt = payload.get("prompt")
@@ -786,8 +783,9 @@ async def api_middleware_infer(req: Request):
786
  proxy_base = f"http://{ip}:{port}"
787
  _log_status(f"PROMPT_BASE direct={proxy_base}")
788
 
 
789
  if not proxy_base:
790
- return JSONResponse({"error": "instance not ready (no base URL)"}, status_code=409)
791
 
792
  url = f"{proxy_base}{route}"
793
  _log_status(f"PROMPT_ENDPOINT {url}")
@@ -834,7 +832,6 @@ async def api_middleware_infer(req: Request):
834
  except Exception as e:
835
  _job_log("compute", f"[MW] ERROR infer: {e}")
836
  return JSONResponse({"error": f"middleware infer failed: {e}"}, status_code=502)
837
-
838
  # ---------------------------------------------------------------------
839
  # Job progress + callback routes
840
  # ---------------------------------------------------------------------
 
751
  # ---------------------------------------------------------------------
752
  @router.post("/api/middleware/infer")
753
  async def api_middleware_infer(req: Request):
754
+ # Always ensure predictRoute exists
755
+ route = _INST.get("predictRoute") or "/predict"
756
+ _INST["predictRoute"] = route
 
 
 
757
 
758
  payload = await req.json()
759
  prompt = payload.get("prompt")
 
783
  proxy_base = f"http://{ip}:{port}"
784
  _log_status(f"PROMPT_BASE direct={proxy_base}")
785
 
786
+ # If neither path is available, do not gate—return clear error
787
  if not proxy_base:
788
+ return JSONResponse({"error": "no reachable base yet (no proxy or ip/port)"}, status_code=503)
789
 
790
  url = f"{proxy_base}{route}"
791
  _log_status(f"PROMPT_ENDPOINT {url}")
 
832
  except Exception as e:
833
  _job_log("compute", f"[MW] ERROR infer: {e}")
834
  return JSONResponse({"error": f"middleware infer failed: {e}"}, status_code=502)
 
835
  # ---------------------------------------------------------------------
836
  # Job progress + callback routes
837
  # ---------------------------------------------------------------------