Spaces:
Sleeping
Sleeping
Update Deployment_UI_BE.py
Browse files- Deployment_UI_BE.py +37 -19
Deployment_UI_BE.py
CHANGED
|
@@ -111,35 +111,53 @@ def _as_json(r):
|
|
| 111 |
# ---------------------------------------------------------------------
|
| 112 |
# Probes and route discovery (new)
|
| 113 |
# ---------------------------------------------------------------------
|
| 114 |
-
def _probe(method: str, url: str, timeout=5):
    """Fire one HTTP request and report (status_code, latency_ms, body_snippet).

    Any failure (connection refused, timeout, decode error, ...) is folded
    into a best-effort result: status code -1 and the exception text in
    place of the body snippet.
    """
    started = time.time()
    try:
        response = requests.request(method, url, timeout=timeout)
        elapsed_ms = int((time.time() - started) * 1000)
        snippet = response.text[:200] if response.text else ""
        return response.status_code, elapsed_ms, snippet
    except Exception as exc:  # deliberate catch-all: probes must never raise
        return -1, int((time.time() - started) * 1000), str(exc)
|
| 122 |
|
| 123 |
-
|
| 124 |
-
_POSSIBLE_ROUTES = [
|
| 125 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 126 |
|
| 127 |
def _infer_routes_from_image(image_uri: str):
|
|
|
|
|
|
|
|
|
|
| 128 |
iu = (image_uri or "").lower()
|
|
|
|
|
|
|
| 129 |
if "vllm-serve" in iu:
|
| 130 |
return ("/generate", "/ping")
|
|
|
|
|
|
|
|
|
|
| 131 |
if "hf-inference-toolkit" in iu or "huggingface-pytorch-inference" in iu:
|
| 132 |
-
return ("/
|
|
|
|
|
|
|
| 133 |
return (None, None)
|
| 134 |
|
| 135 |
-
def
|
| 136 |
-
|
| 137 |
-
|
| 138 |
-
|
| 139 |
-
|
| 140 |
-
|
| 141 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 142 |
|
|
|
|
| 143 |
# ---------------------------------------------------------------------
|
| 144 |
# Blob ingest via Model Blob page JSON (with blob_url override)
|
| 145 |
# ---------------------------------------------------------------------
|
|
|
|
| 111 |
# ---------------------------------------------------------------------
|
| 112 |
# Probes and route discovery (new)
|
| 113 |
# ---------------------------------------------------------------------
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 114 |
|
| 115 |
+
# Expanded set: will try these against https://pod:port/<route>
|
| 116 |
+
_POSSIBLE_ROUTES = [
|
| 117 |
+
"/invocations", # <— added and placed first
|
| 118 |
+
"/generate",
|
| 119 |
+
"/predict",
|
| 120 |
+
"/predictions",
|
| 121 |
+
"/v1/chat/completions",
|
| 122 |
+
"/v1/models/model:predict",
|
| 123 |
+
]
|
| 124 |
|
| 125 |
def _infer_routes_from_image(image_uri: str):
|
| 126 |
+
"""
|
| 127 |
+
Infer (predict_route, health_route) from known image patterns.
|
| 128 |
+
"""
|
| 129 |
iu = (image_uri or "").lower()
|
| 130 |
+
|
| 131 |
+
# vLLM images
|
| 132 |
if "vllm-serve" in iu:
|
| 133 |
return ("/generate", "/ping")
|
| 134 |
+
|
| 135 |
+
# HuggingFace / Vertex HF Inference Toolkit
|
| 136 |
+
# changed from "/predict" → "/invocations"
|
| 137 |
if "hf-inference-toolkit" in iu or "huggingface-pytorch-inference" in iu:
|
| 138 |
+
return ("/invocations", "/ping")
|
| 139 |
+
|
| 140 |
+
# Unknown image → allow route scanning fallback
|
| 141 |
return (None, None)
|
| 142 |
|
| 143 |
+
async def _probe_all_routes(base: str, port: str, session):
    """Scan _POSSIBLE_ROUTES on ``base:port`` until one responds 200/OK-ish.

    Returns (predict_route, health_route or None); (None, None) when no
    candidate answers with a status below 500.

    NOTE(review): no entry in _POSSIBLE_ROUTES contains "/ping", so the
    health-route element is always None here — confirm intent.
    NOTE(review): assumes the response object exposes ``.status_code``
    (requests-style); aiohttp responses use ``.status`` — verify the
    session type passed by callers.
    """
    from urllib.parse import urljoin

    root = f"{base}:{port}/"
    for candidate in _POSSIBLE_ROUTES:
        target = urljoin(root, candidate.lstrip("/"))
        try:
            reply = await session.get(target, timeout=3)
        except Exception:  # unreachable / timed out — try the next candidate
            continue
        if reply.status_code < 500:
            return candidate, ("/ping" if "/ping" in candidate else None)

    return None, None
|
| 161 |
# ---------------------------------------------------------------------
|
| 162 |
# Blob ingest via Model Blob page JSON (with blob_url override)
|
| 163 |
# ---------------------------------------------------------------------
|