Spaces:

smolagents
/

ml-agent

Running

akseljoonas HF Staff Claude Opus 4.6 committed on Mar 11

Commit

a017896

1 Parent(s): b94b18b

fix: handle interrupt during streaming tool calls without corrupting context

When the user clicks interrupt while the LLM is streaming a tool call,
the accumulated deltas can have empty IDs and truncated arguments.
Previously these corrupted tool calls were added to the context and caused litellm API errors
on the next call.

- Add cancellation check inside the streaming loop so we stop early
- Drop tool_calls with empty IDs when building from stream deltas
- recover_malformed_tool_calls() now strips empty-ID tool_calls from
assistant messages as a safety net

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

Files changed (2) hide show

agent/context_manager/manager.py +24 -7
agent/core/agent_loop.py +13 -1

agent/context_manager/manager.py CHANGED Viewed

@@ -167,11 +167,11 @@ class ContextManager:
     def recover_malformed_tool_calls(self) -> set[str]:
         """Sanitize malformed tool_call arguments and inject error results.
-        For every tool_call whose arguments are not valid JSON:
-        1. Replaces the arguments with ``"{}"`` so the context stays
-           valid for the LLM API.
-        2. Injects a ``tool`` result message explaining the error and
-           asking the agent to retry with smaller content.
         This method is idempotent — safe to call from both the agent loop
         (before tool execution) and from :meth:`get_messages` (safety net).
@@ -183,7 +183,6 @@ class ContextManager:
         malformed_ids: set[str] = set()
-        # 1. Find and sanitize malformed arguments
         for msg in self.items:
             if getattr(msg, "role", None) != "assistant":
                 continue
@@ -191,6 +190,24 @@ class ContextManager:
             if not tool_calls:
                 continue
             self._normalize_tool_calls(msg)
             for tc in msg.tool_calls:
                 try:
                     json.loads(tc.function.arguments)
@@ -205,7 +222,7 @@ class ContextManager:
         if not malformed_ids:
             return malformed_ids
-        # 2. Inject error results for malformed calls that don't have one yet
         answered_ids = {
             getattr(m, "tool_call_id", None)
             for m in self.items

     def recover_malformed_tool_calls(self) -> set[str]:
         """Sanitize malformed tool_call arguments and inject error results.
+        Handles two classes of corruption:
+        - **Empty/missing IDs**: Stripped from the assistant message entirely
+          (common when streaming is interrupted mid-tool-call).
+        - **Malformed JSON arguments**: Replaced with ``"{}"`` and an error
+          tool-result is injected asking the agent to retry.
         This method is idempotent — safe to call from both the agent loop
         (before tool execution) and from :meth:`get_messages` (safety net).
         malformed_ids: set[str] = set()
         for msg in self.items:
             if getattr(msg, "role", None) != "assistant":
                 continue
             if not tool_calls:
                 continue
             self._normalize_tool_calls(msg)
+            # 1. Strip tool_calls with empty/missing IDs (cannot be repaired)
+            valid_tcs = []
+            for tc in msg.tool_calls:
+                if not getattr(tc, "id", None):
+                    logger.warning(
+                        "Stripping tool_call with empty ID (name=%s) — likely interrupted stream",
+                        getattr(tc.function, "name", "?"),
+                    )
+                    continue
+                valid_tcs.append(tc)
+            if len(valid_tcs) != len(msg.tool_calls):
+                msg.tool_calls = valid_tcs or None
+            if not msg.tool_calls:
+                continue
+            # 2. Fix malformed JSON arguments
             for tc in msg.tool_calls:
                 try:
                     json.loads(tc.function.arguments)
         if not malformed_ids:
             return malformed_ids
+        # 3. Inject error results for malformed calls that don't have one yet
         answered_ids = {
             getattr(m, "tool_call_id", None)
             for m in self.items

agent/core/agent_loop.py CHANGED Viewed

@@ -261,6 +261,11 @@ class Handlers:
                 token_count = 0
                 async for chunk in response:
                     choice = chunk.choices[0] if chunk.choices else None
                     if not choice:
                         # Last chunk may carry only usage info
@@ -309,10 +314,17 @@ class Handlers:
                 # ── Stream finished — reconstruct full message ───────
                 content = full_content or None
-                # Build tool_calls list from accumulated deltas
                 tool_calls: list[ToolCall] = []
                 for idx in sorted(tool_calls_acc.keys()):
                     tc_data = tool_calls_acc[idx]
                     tool_calls.append(
                         ToolCall(
                             id=tc_data["id"],

                 token_count = 0
                 async for chunk in response:
+                    # ── Check cancellation during streaming ──
+                    if session.is_cancelled:
+                        tool_calls_acc.clear()
+                        break
                     choice = chunk.choices[0] if chunk.choices else None
                     if not choice:
                         # Last chunk may carry only usage info
                 # ── Stream finished — reconstruct full message ───────
                 content = full_content or None
+                # Build tool_calls list from accumulated deltas,
+                # dropping any with empty IDs (from interrupted streams)
                 tool_calls: list[ToolCall] = []
                 for idx in sorted(tool_calls_acc.keys()):
                     tc_data = tool_calls_acc[idx]
+                    if not tc_data["id"]:
+                        logger.warning(
+                            "Dropping tool_call with empty ID (name=%s) — likely interrupted stream",
+                            tc_data["function"]["name"],
+                        )
+                        continue
                     tool_calls.append(
                         ToolCall(
                             id=tc_data["id"],