Spaces:

build-small-hackathon
/

elysium

Running on Zero

App Files Files Community

Update backend/server.py

by pmrinal2005 - opened 19 days ago

base: refs/heads/main

←

from: refs/pr/7

Discussion Files changed

+214

-68

Files changed (1) hide show

backend/server.py +214 -68

backend/server.py CHANGED Viewed

@@ -1,20 +1,25 @@
 """FastAPI routes attached to gr.Server.
-Key changes vs previous build:
-  • /api/turn now accepts up to 2 attachments (images or PDFs) via repeated
-    'attachments' multipart fields.
-  • Hypergraph maintains per-node spawn parent so frontend can draw correct
-    mycelium threads.
-  • Returns a `metrics` block with civilization-meaningful values
-    (mycelium_density, council_activity, knowledge_growth, civilization_age)
-    instead of fake compliance/laws numbers.
-  • Audio drama segments are returned per-agent so the frontend can sync
-    play/pause + speaking highlight to each utterance.
-  • Removes the raw-JSON dump from the canvas: the frontend never displays
-    raw JSON; it consumes it for nodes / edges / council / TTS only.
 """
 import io
 import json
 import time
 import traceback
 from typing import List, Optional
@@ -42,6 +47,11 @@ HG: Hypergraph = persistence.load()
 GRAMMAR = load_grammar()
 CIVILIZATION_START_TS = time.time()
 # ─── GPU-bound inference ────────────────────────────────────────────────────
 @spaces.GPU(duration=120)
@@ -56,51 +66,193 @@ def _gpu_infer(messages: list, max_tokens: int = 4096) -> str:
     return out["choices"][0]["message"]["content"]
 def _fallback_envelope(user_text: str, err: str) -> dict:
     meta = new_session_meta()
     resp = ElysiumResponse(
         session_id=meta["session_id"],
         timestamp_utc=meta["timestamp_utc"],
         interaction_type="SIMPLE_REPLY",
-        direct_answer=f"(fallback) {err}",
     )
-    return {"user_msg": user_text, "elysium_response": resp.model_dump()}
-def _civilization_metrics(resp: ElysiumResponse) -> dict:
-    """Real, meaningful metrics derived from the hypergraph state."""
     nodes = HG.node_count()
     edges = HG.edge_count()
-    # Mycelium density = edges per node, normalized to 0-100%
-    density = 0.0
-    if nodes > 0:
-        density = min(1.0, edges / max(1, nodes * 1.4))
-    # Council activity = number of active agents (capped at 5)
     council_active = len(resp.council_deliberation.agent_outputs or [])
-    # Knowledge growth (this turn) = nodes added
     knowledge_growth = len(resp.hypergraph_delta.nodes_added or [])
-    # Coherence = inverse of cognitive strain
     coherence = 1.0 - float(resp.strain_metadata.cognitive_strain or 0.3)
-    age_seconds = time.time() - CIVILIZATION_START_TS
-    age_minutes = int(age_seconds / 60)
     return {
         "mycelium_density_pct": round(density * 100),
         "council_active":       council_active,
         "knowledge_growth":     knowledge_growth,
         "coherence_pct":        round(max(0.0, min(1.0, coherence)) * 100),
-        "civilization_age_min": age_minutes,
         "nodes":                nodes,
         "edges":                edges,
         "alert_level":          resp.ui_directives.alert_level or "CALM",
     }
 async def _load_attachment(uf: UploadFile) -> Optional[dict]:
     if uf is None or not uf.filename:
         return None
@@ -112,7 +264,6 @@ async def _load_attachment(uf: UploadFile) -> Optional[dict]:
                 "error": f"file too large ({len(raw)} > {MAX_UPLOAD_BYTES} bytes)"}
     mime = (uf.content_type or "").lower()
     if mime not in ALLOWED_MIME_TYPES:
-        # also accept by extension as last resort
         low = uf.filename.lower()
         if low.endswith(".pdf"):
             mime = "application/pdf"
@@ -123,7 +274,6 @@ async def _load_attachment(uf: UploadFile) -> Optional[dict]:
     if mime == "application/pdf":
         return {"kind": "pdf", "bytes": raw, "name": uf.filename}
-    # image
     try:
         img = Image.open(io.BytesIO(raw))
         img.load()
@@ -172,9 +322,12 @@ def attach(app):
             "node_count": HG.node_count(), "edge_count": HG.edge_count(),
         }
     @app.get("/api/node/{node_id}")
     async def node_detail(node_id: str):
-        """Detail view for one node: payload, connections, related agents."""
         if node_id not in HG._idx:
             raise HTTPException(404, "node not found")
         idx = HG._idx[node_id]
@@ -225,40 +378,34 @@ def attach(app):
             # 2. Build messages with hypergraph context
             messages = build_messages(user_text, valid, HG.context_summary())
-            # 3. GPU inference (returns strict JSON)
             raw = _gpu_infer(messages)
-            # 4. Parse
-            try:
-                envelope = ElysiumEnvelope.model_validate_json(raw)
-            except Exception as parse_err:
-                try:
-                    blob = json.loads(raw)
-                    if "elysium_response" not in blob:
-                        meta = new_session_meta()
-                        envelope = ElysiumEnvelope(
-                            user_msg=user_text,
-                            elysium_response=ElysiumResponse(
-                                session_id=meta["session_id"],
-                                timestamp_utc=meta["timestamp_utc"],
-                                interaction_type="SIMPLE_REPLY",
-                                direct_answer=str(blob)[:600]))
-                    else:
-                        envelope = ElysiumEnvelope.model_validate(blob)
-                except Exception:
-                    return JSONResponse(
-                        _fallback_envelope(user_text, f"parse_error: {parse_err}"))
             resp = envelope.elysium_response
             # 5. Apply hypergraph delta
-            HG.apply_delta(resp.hypergraph_delta)
-            persistence.save(HG)
-            # 6. Execute tools
-            tool_results = execute_all(resp.tool_calls) if resp.tool_calls else []
-            # 7. Build audio drama if needed (combined + per-agent)
             audio_url = None
             per_agent_audio = []
             if resp.council_deliberation.debate_mode in ("AUDIO_DRAMA", "SILENT") \
@@ -274,14 +421,13 @@ def attach(app):
             payload = envelope.model_dump()
             payload["_runtime"] = {
-                "tool_results":    tool_results,
-                "audio_url":       audio_url,
-                "per_agent_audio": per_agent_audio,
-                "metrics":         _civilization_metrics(resp),
-                "attachment_errors": [{"name": e["name"], "error": e["error"]} for e in errors],
-                "attachments_processed": [
-                    {"kind": a["kind"], "name": a["name"]} for a in valid
-                ],
             }
             return JSONResponse(payload)

 """FastAPI routes attached to gr.Server.
+CRITICAL FIXES vs previous build:
+  • Strips <think>...</think> blocks (and other prefixes) from raw model output
+    BEFORE JSON parsing. The fine-tuned MiniCPM-V emits a `<think>\n\n</think>`
+    preamble — that was breaking parse and triggering the
+    "raw JSON toast on top" + repeated `Inference failed` errors.
+  • Accepts BOTH formats:
+        (A) bare ElysiumResponse        — what the model actually emits
+        (B) {user_msg, elysium_response} envelope — historical schema
+    Auto-wraps (A) into (B) so downstream code is unchanged.
+  • Fallback never dumps raw JSON into `direct_answer`; instead returns a
+    short, human-readable error string so the UI cannot accidentally toast
+    a 2 KB blob of JSON.
+  • Always attaches a complete `_runtime` block (metrics, audio, tool_results,
+    per_agent_audio, civilization_map) so the frontend never hits null/undefined.
+  • Adds /api/civilization_map endpoint returning a compact graph snapshot
+    for the minimap (node_id, label, type per node; typed, weighted edges).
 """
 import io
 import json
+import re
 import time
 import traceback
 from typing import List, Optional
 GRAMMAR = load_grammar()
 CIVILIZATION_START_TS = time.time()
+# Pre-compiled regex to strip <think>...</think> blocks (including newlines)
+_THINK_RE = re.compile(r"<think\b[^>]*>.*?</think\s*>", re.DOTALL | re.IGNORECASE)
+# Greedy match from the first "{" to the LAST "}" in arbitrary text (not brace-balanced)
+_JSON_OBJECT_RE = re.compile(r"\{.*\}", re.DOTALL)
 # ─── GPU-bound inference ────────────────────────────────────────────────────
 @spaces.GPU(duration=120)
     return out["choices"][0]["message"]["content"]
+# ────────────────────────────────────────────────────────────────────────────
+# Robust raw-output → ElysiumEnvelope parser
+# ────────────────────────────────────────────────────────────────────────────
def _clean_raw_model_output(raw: str) -> str:
    """Return the model output with reasoning blocks and code fences removed.

    Processing order:
      1. Falsy input (None or empty string) yields "".
      2. Outer whitespace is trimmed.
      3. Every <think>...</think> span matched by ``_THINK_RE`` is deleted.
      4. If what remains starts with a ``` fence, the opening fence (plus an
         optional alphabetic language tag) and a trailing closing fence are
         removed.

    Text that merely surrounds a JSON object is left in place.
    """
    if not raw:
        return ""

    text = _THINK_RE.sub("", raw.strip()).strip()

    # Guard clause: nothing more to do unless the payload is fenced.
    if not text.startswith("```"):
        return text

    without_opening = re.sub(r"^```[a-zA-Z]*\s*", "", text)
    without_closing = re.sub(r"\s*```\s*$", "", without_opening)
    return without_closing.strip()
+def _extract_json_blob(cleaned: str) -> Optional[dict]:
+    """Try direct json.loads, then fall back to first-balanced-object extract."""
+    if not cleaned:
+        return None
+    try:
+        return json.loads(cleaned)
+    except Exception:
+        pass
+    m = _JSON_OBJECT_RE.search(cleaned)
+    if not m:
+        return None
+    try:
+        return json.loads(m.group(0))
+    except Exception:
+        # Try a more aggressive cleanup: collapse stray newlines INSIDE strings
+        # (the model sometimes wraps long string values across lines)
+        candidate = m.group(0)
+        # Replace literal newlines inside likely string contexts. This is a
+        # best-effort: only safe for the model's typical output shape.
+        try:
+            candidate2 = re.sub(r'(?<!\\)\n', ' ', candidate)
+            return json.loads(candidate2)
+        except Exception:
+            return None
def _coerce_to_envelope(raw: str, user_text: str) -> Optional[ElysiumEnvelope]:
    """Parse arbitrary model output into a validated ElysiumEnvelope.

    Two payload shapes are accepted:
      (A) a bare ElysiumResponse, recognised by the presence of
          ``schema_version``, ``interaction_type`` or ``hypergraph_delta``,
          which is wrapped together with ``user_text``;
      (B) a full ``{user_msg, elysium_response}`` envelope.

    If both validations fail, a minimal SIMPLE_REPLY envelope is synthesised.
    It keeps at most 300 characters of any ``direct_answer`` in the payload.

    Args:
        raw: Unprocessed text returned by the model.
        user_text: The user's message, used as ``user_msg`` when wrapping.

    Returns:
        An envelope, or None only when nothing JSON-shaped can be extracted.
    """
    blob = _extract_json_blob(_clean_raw_model_output(raw))
    if blob is None:
        return None

    # Membership tests below are only meaningful on a mapping; an `in` test
    # against a JSON number would raise TypeError.
    is_mapping = isinstance(blob, dict)

    # Case A: bare ElysiumResponse -> wrap it
    looks_bare = (
        is_mapping
        and "elysium_response" not in blob
        and any(
            key in blob
            for key in ("schema_version", "interaction_type", "hypergraph_delta")
        )
    )
    if looks_bare:
        try:
            resp = ElysiumResponse.model_validate(blob)
            return ElysiumEnvelope(user_msg=user_text, elysium_response=resp)
        except Exception as e:
            print(f"[parse] bare-response validate failed: {e}")
            # Fall through to envelope attempt

    # Case B: full envelope
    try:
        return ElysiumEnvelope.model_validate(blob)
    except Exception as e:
        print(f"[parse] envelope validate failed: {e}")

    # Last resort: synthesize a minimal envelope, keeping any direct_answer
    meta = new_session_meta()
    direct = ""
    if is_mapping:
        direct = str(blob.get("direct_answer", "") or "")[:300]
    return ElysiumEnvelope(
        user_msg=user_text,
        elysium_response=ElysiumResponse(
            session_id=meta["session_id"],
            timestamp_utc=meta["timestamp_utc"],
            interaction_type="SIMPLE_REPLY",
            direct_answer=direct or "(model response could not be fully parsed)",
        ),
    )
 def _fallback_envelope(user_text: str, err: str) -> dict:
     """Build the error payload returned when a turn cannot be processed.

     Only the first line of ``err``, cut to 200 characters, is embedded in a
     fixed human-readable sentence. A falsy ``err`` becomes "unknown error".
     The payload carries the same three top-level keys as a successful turn:
     ``user_msg``, ``elysium_response`` and ``_runtime``.
     """
     meta = new_session_meta()

     # Keep the reason short so raw model output is never echoed to the UI.
     first_line = (err or "unknown error").splitlines()[0]
     safe_err = first_line[:200]

     message = f"The civilization could not process that turn ({safe_err}). Try again."
     resp = ElysiumResponse(
         session_id=meta["session_id"],
         timestamp_utc=meta["timestamp_utc"],
         interaction_type="SIMPLE_REPLY",
         direct_answer=message,
     )

     payload = {"user_msg": user_text}
     payload["elysium_response"] = resp.model_dump()
     payload["_runtime"] = _empty_runtime()
     return payload
def _empty_runtime() -> dict:
    """Return a ``_runtime`` block with every expected key present.

    List-valued fields default to empty lists and ``audio_url`` to None.
    ``metrics`` and ``civilization_map`` are computed from the current
    hypergraph state through the sibling helpers.
    """
    runtime = {
        "tool_results": [],
        "audio_url": None,
        "per_agent_audio": [],
    }
    runtime["metrics"] = _baseline_metrics()
    runtime["attachment_errors"] = []
    runtime["attachments_processed"] = []
    runtime["civilization_map"] = _civilization_map_snapshot()
    return runtime
def _baseline_metrics() -> dict:
    """Return metrics derived from the hypergraph alone, with no model response.

    Response-dependent fields use fixed placeholders: zero council activity
    and knowledge growth, 70 percent coherence and a "CALM" alert level.
    """
    node_total = HG.node_count()
    edge_total = HG.edge_count()

    # Density is edges per (1.4 * nodes), capped at 1.0; an empty graph is 0.
    if node_total == 0:
        density = 0.0
    else:
        density = min(1.0, edge_total / max(1, node_total * 1.4))

    elapsed_seconds = time.time() - CIVILIZATION_START_TS

    return {
        "mycelium_density_pct": round(density * 100),
        "council_active":       0,
        "knowledge_growth":     0,
        "coherence_pct":        70,
        "civilization_age_min": int(elapsed_seconds / 60),
        "nodes":                node_total,
        "edges":                edge_total,
        "alert_level":          "CALM",
    }
def _civilization_metrics(resp: ElysiumResponse) -> dict:
    """Return metrics combining hypergraph state with one model response.

    Args:
        resp: The response for the current turn. Its council outputs, added
            nodes, cognitive strain and alert level feed the result.

    Returns:
        A dict with the same keys as the baseline metrics block.
    """
    node_total = HG.node_count()
    edge_total = HG.edge_count()

    # Density is edges per (1.4 * nodes), capped at 1.0; an empty graph is 0.
    if node_total == 0:
        density = 0.0
    else:
        density = min(1.0, edge_total / max(1, node_total * 1.4))

    active_agents = len(resp.council_deliberation.agent_outputs or [])
    nodes_added = len(resp.hypergraph_delta.nodes_added or [])

    # Coherence is the complement of cognitive strain. Any falsy strain
    # (None or exactly 0) is replaced by 0.3 before the subtraction.
    strain = float(resp.strain_metadata.cognitive_strain or 0.3)
    coherence = 1.0 - strain
    clamped = max(0.0, min(1.0, coherence))

    elapsed_seconds = time.time() - CIVILIZATION_START_TS

    return {
        "mycelium_density_pct": round(density * 100),
        "council_active":       active_agents,
        "knowledge_growth":     nodes_added,
        "coherence_pct":        round(clamped * 100),
        "civilization_age_min": int(elapsed_seconds / 60),
        "nodes":                node_total,
        "edges":                edge_total,
        "alert_level":          resp.ui_directives.alert_level or "CALM",
    }
def _civilization_map_snapshot() -> dict:
    """Return a compact summary of the hypergraph's nodes and edges.

    Each node contributes ``node_id``, ``label`` (defaulting to the node id)
    and ``type`` (defaulting to "DOMAIN"). Each edge contributes ``edge_id``
    (defaulting to ``e_<source index>_<target index>``), the endpoint node
    ids, ``type`` (defaulting to "GENERIC") and ``weight`` (defaulting to
    0.5). Total node and edge counts are included alongside the lists.
    """
    graph = HG.g

    def _node_entry(index):
        # Node payloads are read as mappings that carry at least "node_id".
        data = graph[index]
        return {
            "node_id":  data["node_id"],
            "label":    data.get("label", data["node_id"]),
            "type":     data.get("node_type", "DOMAIN"),
        }

    def _edge_entry(src, dst):
        # NOTE(review): assumes get_edge_data returns a mapping for every
        # listed edge; confirm against the graph library in use.
        data = graph.get_edge_data(src, dst)
        return {
            "edge_id":  data.get("edge_id", f"e_{src}_{dst}"),
            "source":   graph[src]["node_id"],
            "target":   graph[dst]["node_id"],
            "type":     data.get("edge_type", "GENERIC"),
            "weight":   data.get("weight", 0.5),
        }

    node_entries = [_node_entry(index) for index in graph.node_indexes()]
    edge_entries = [_edge_entry(src, dst) for src, dst in graph.edge_list()]

    return {
        "nodes": node_entries,
        "edges": edge_entries,
        "node_count": HG.node_count(),
        "edge_count": HG.edge_count(),
    }
 async def _load_attachment(uf: UploadFile) -> Optional[dict]:
     if uf is None or not uf.filename:
         return None
                 "error": f"file too large ({len(raw)} > {MAX_UPLOAD_BYTES} bytes)"}
     mime = (uf.content_type or "").lower()
     if mime not in ALLOWED_MIME_TYPES:
         low = uf.filename.lower()
         if low.endswith(".pdf"):
             mime = "application/pdf"
     if mime == "application/pdf":
         return {"kind": "pdf", "bytes": raw, "name": uf.filename}
     try:
         img = Image.open(io.BytesIO(raw))
         img.load()
             "node_count": HG.node_count(), "edge_count": HG.edge_count(),
         }
+    @app.get("/api/civilization_map")
+    async def civilization_map():
+        return _civilization_map_snapshot()
     @app.get("/api/node/{node_id}")
     async def node_detail(node_id: str):
         if node_id not in HG._idx:
             raise HTTPException(404, "node not found")
         idx = HG._idx[node_id]
             # 2. Build messages with hypergraph context
             messages = build_messages(user_text, valid, HG.context_summary())
+            # 3. GPU inference (returns strict JSON, possibly wrapped in <think>)
             raw = _gpu_infer(messages)
+            if not raw:
+                return JSONResponse(_fallback_envelope(user_text, "empty model output"))
+            # 4. Robust parse: strips <think>, extracts JSON, accepts bare ElysiumResponse
+            envelope = _coerce_to_envelope(raw, user_text)
+            if envelope is None:
+                return JSONResponse(_fallback_envelope(user_text, "no JSON in model output"))
             resp = envelope.elysium_response
             # 5. Apply hypergraph delta
+            try:
+                HG.apply_delta(resp.hypergraph_delta)
+                persistence.save(HG)
+            except Exception as e:
+                print(f"[hypergraph] apply_delta failed: {e}")
+                traceback.print_exc()
+            # 6. Execute tools (best-effort)
+            tool_results = []
+            try:
+                tool_results = execute_all(resp.tool_calls) if resp.tool_calls else []
+            except Exception as e:
+                print(f"[tools] execute_all failed: {e}")
+            # 7. Audio drama (combined + per-agent), best-effort
             audio_url = None
             per_agent_audio = []
             if resp.council_deliberation.debate_mode in ("AUDIO_DRAMA", "SILENT") \
             payload = envelope.model_dump()
             payload["_runtime"] = {
+                "tool_results":          tool_results,
+                "audio_url":             audio_url,
+                "per_agent_audio":       per_agent_audio,
+                "metrics":               _civilization_metrics(resp),
+                "attachment_errors":     [{"name": e["name"], "error": e["error"]} for e in errors],
+                "attachments_processed": [{"kind": a["kind"], "name": a["name"]} for a in valid],
+                "civilization_map":      _civilization_map_snapshot(),
             }
             return JSONResponse(payload)