z2api

Sleeping

App Files Files Community

ZyphrZero committed on Sep 15, 2025

Commit

d264039

1 Parent(s): e985dd1

✨ feat(app/utils): 优化SSE工具处理逻辑，支持增量解析和状态管理

Browse files

Files changed (1) hide show

app/utils/sse_tool_handler.py +374 -160

app/utils/sse_tool_handler.py CHANGED Viewed

@@ -3,11 +3,13 @@
 """
 SSE Tool Handler - 处理工具调用的SSE流
 """
 import json
 import time
-from typing import Dict, Any, Optional, Generator
 from app.utils.logger import get_logger
@@ -20,125 +22,367 @@ class SSEToolHandler:
         self.chat_id = chat_id
         self.model = model
         self.has_tool_call = False
-        self.tool_args = ""  # 当前工具的参数累积
-        self.tool_id = ""  # 当前工具ID
-        self.tool_name = ""  # 当前工具名称
         self.tool_call_usage = None  # 工具调用的usage信息
         self.content_index = 0
         self.has_thinking = False
     def process_tool_call_phase(self, data: Dict[str, Any], is_stream: bool = True) -> Generator[str, None, None]:
         """
-        处理tool_call阶段
-        参考JS的forEach逻辑，每个块独立处理
         """
         if not self.has_tool_call:
             self.has_tool_call = True
             logger.debug("🔧 进入工具调用阶段")
         edit_content = data.get("edit_content", "")
         if not edit_content:
             return
-        logger.debug(f"📦 解析数据块: {edit_content}")
-        # 分割glm_block块
-        blocks = edit_content.split("<glm_block >")
-        for index, block in enumerate(blocks):
-            if not block:
-                continue
-            logger.debug(f"  📦 处理块 {index}: {block[:200]}...")
-            if "</glm_block>" not in block:
-                # 这个块不完整，可能是参数片段
-                if index == 0:
-                    # 第一个块的参数片段
-                    self.tool_args += block
-                    logger.debug(f"  📦 累积参数片段: {block}")
-                continue
-            if index == 0:
-                # 第一个块：提取参数片段（到"result"之前）
-                # 提取到 '"result"' 之前的内容
-                if '"result"' in edit_content:
-                    result_index = edit_content.index('"result"')
-                    args_fragment = edit_content[:result_index - 3]
-                    self.tool_args += args_fragment
-                    logger.debug(f"📦 从第一个块提取参数片段: {args_fragment}")
-            else:
-                # 后续块：新的工具调用
-                # 如果当前有工具正在处理，先完成它
-                if self.tool_id:
-                    logger.debug(f"  🎯 完成当前工具: {self.tool_name}")
-                    yield from self._finish_current_tool(is_stream)
-                # 解析新工具信息
-                try:
-                    block_content = block[:block.index("</glm_block>")]
-                    content = json.loads(block_content)
-                    metadata = content.get("data", {}).get("metadata", {})
-                    # 开始新工具
-                    self.tool_id = metadata.get("id", "")
-                    self.tool_name = metadata.get("name", "")
-                    arguments = metadata.get("arguments", {})
-                    # 累积参数（去掉最后的}以便后续累积）
-                    self.tool_args = json.dumps(arguments, ensure_ascii=False)[:-1]
-                    logger.debug(f"🎯 新工具调用: {self.tool_name}(id={self.tool_id})")
-                    logger.debug(f"  📦 初始参数: {self.tool_args}")
-                    if is_stream:
-                        yield self._create_tool_start_chunk()
-                    self.content_index += 1
-                except (json.JSONDecodeError, KeyError) as e:
-                    logger.error(f"❌ 解析工具块失败: {e}")
-                    logger.error(f"  📦 块内容: {block[:500]}")
-    def _finish_current_tool(self, is_stream: bool) -> Generator[str, None, None]:
-        if not self.tool_id:
-            return
         try:
-            test_args = self.tool_args + '"'
-            logger.debug(f"✅ 工具参数解析成功: {self.tool_name}")
-            logger.debug(f"  📦 最终参数字符串: {test_args}")
-            # 解析参数
-            params = json.loads(test_args)
-            logger.debug(f"✅ 完成工具调用: {self.tool_name} with params: {params}")
-            if is_stream:
-                yield self._create_tool_arguments_chunk(params)
         except json.JSONDecodeError as e:
-            logger.error(f"❌ 工具参数解析失败: {e}")
-            logger.error(f"  📦 原始参数: {self.tool_args[:200]}")
-            logger.error(f"  📦 测试参数: {test_args[:200] if 'test_args' in locals() else 'N/A'}")
-            # 解析失败时使用空参数
-            params = {}
             if is_stream:
-                yield self._create_tool_arguments_chunk(params)
-        finally:
-            # 清理当前工具状态
-            self.tool_args = ""
-            self.tool_id = ""
-            self.tool_name = ""
     def process_other_phase(self, data: Dict[str, Any], is_stream: bool = True) -> Generator[str, None, None]:
         """
-        处理other阶段
-        主要检测工具调用结束
         """
         edit_content = data.get("edit_content", "")
         usage = data.get("usage")
         # 保存usage信息
@@ -146,93 +390,63 @@ class SSEToolHandler:
             self.tool_call_usage = usage
             logger.debug(f"💾 保存工具调用usage: {usage}")
-        # 检测工具调用结束标记 "null,"
-        if self.has_tool_call and edit_content and edit_content.startswith("null,"):
-            logger.debug("🏁 检测到工具调用结束标记: null,")
-            # 补充引号并完成最后一个工具调用
-            self.tool_args += '"'
             self.has_tool_call = False
-            try:
-                # 解析最终参数
-                params = json.loads(self.tool_args)
-                logger.debug(f"✅ 最终工具参数解析成功: {params}")
-                if is_stream:
-                    # 创建工具参数块
-                    tool_call_delta = {
-                        "id": self.tool_id,
-                        "type": "function",
-                        "function": {
-                            "name": None,
-                            "arguments": json.dumps(params, ensure_ascii=False),
-                        },
-                    }
-                    delta_res = {
-                        "choices": [
-                            {
-                                "delta": {
-                                    "role": "assistant",
-                                    "content": None,
-                                    "tool_calls": [tool_call_delta],
-                                },
-                                "finish_reason": None,
-                                "index": 0,
-                                "logprobs": None,
-                            }
-                        ],
-                        "created": int(time.time()),
-                        "id": self.chat_id,
-                        "model": self.model,
-                        "object": "chat.completion.chunk",
-                        "system_fingerprint": "fp_zai_001",
-                    }
-                    yield f"data: {json.dumps(delta_res, ensure_ascii=False)}\n\n"
-                    # 发送工具完成信号
-                    finish_res = {
-                        "choices": [
-                            {
-                                "delta": {
-                                    "role": "assistant",
-                                    "content": None,
-                                    "tool_calls": [],
-                                },
-                                "finish_reason": "tool_calls",
-                                "index": 0,
-                                "logprobs": None,
-                            }
-                        ],
-                        "created": int(time.time()),
-                        "id": self.chat_id,
-                        "usage": self.tool_call_usage or None,
-                        "model": self.model,
-                        "object": "chat.completion.chunk",
-                        "system_fingerprint": "fp_zai_001",
-                    }
-                    logger.info("🏁 发送工具调用完成信号")
-                    yield f"data: {json.dumps(finish_res, ensure_ascii=False)}\n\n"
-                    yield "data: [DONE]\n\n"
-            except json.JSONDecodeError as e:
-                logger.error(f"❌ 最终参数解析失败: {e}")
-                logger.error(f"  📦 参数内容: {self.tool_args}")
-            # 重置所有状态
-            self._reset_all_state()
     def _reset_all_state(self):
         """重置所有状态"""
         self.has_tool_call = False
-        self.tool_args = ""
-        self.tool_id = ""
-        self.tool_name = ""
         self.tool_call_usage = None
         self.content_index = 0
-    def _create_tool_start_chunk(self) -> str:
         """创建工具调用开始的chunk"""
         chunk = {
             "choices": [
@@ -242,9 +456,9 @@ class SSEToolHandler:
                         "content": None,
                         "tool_calls": [
                             {
-                                "id": self.tool_id,
                                 "type": "function",
-                                "function": {"name": self.tool_name, "arguments": ""},
                             }
                         ],
                     },
@@ -261,7 +475,7 @@ class SSEToolHandler:
         }
         return f"data: {json.dumps(chunk, ensure_ascii=False)}\n\n"
-    def _create_tool_arguments_chunk(self, arguments: Dict) -> str:
         """创建工具参数的chunk"""
         chunk = {
             "choices": [
@@ -271,14 +485,14 @@ class SSEToolHandler:
                         "content": None,
                         "tool_calls": [
                             {
-                                "id": self.tool_id,
                                 "type": "function",
                                 "function": {"name": None, "arguments": json.dumps(arguments, ensure_ascii=False)},
                             }
                         ],
                     },
                     "finish_reason": None,
-                    "index": self.content_index,  # 使用正确的索引
                     "logprobs": None,
                 }
             ],

 """
 SSE Tool Handler - 处理工具调用的SSE流
+基于 Z.AI 原生的 edit_index 和 edit_content 机制，更原生地处理工具调用
 """
 import json
+import re
 import time
+from typing import Dict, Any, Optional, Generator, List
 from app.utils.logger import get_logger
         self.chat_id = chat_id
         self.model = model
+        # 工具调用状态
         self.has_tool_call = False
         self.tool_call_usage = None  # 工具调用的usage信息
         self.content_index = 0
         self.has_thinking = False
+        # 原生内容重建机制 - 基于 Z.AI 的 edit_index 机制
+        self.content_buffer = bytearray()  # 使用字节数组提高性能
+        self.last_edit_index = 0  # 上次编辑的位置
+        # 工具调用解析状态
+        self.active_tools = {}  # 活跃的工具调用 {tool_id: tool_info}
+        self.completed_tools = []  # 已完成的工具调用
+        self.tool_blocks_cache = {}  # 缓存解析的工具块
     def process_tool_call_phase(self, data: Dict[str, Any], is_stream: bool = True) -> Generator[str, None, None]:
         """
+        Handle one event of the tool_call phase using the edit_index mechanism.
+        Flags the handler as being inside a tool call, writes the event's
+        ``edit_content`` into the content buffer at ``edit_index`` (default 0)
+        and re-parses the buffer, yielding whatever SSE strings that produces.
+        Events without ``edit_content`` yield nothing.
         """
         if not self.has_tool_call:
             self.has_tool_call = True
             logger.debug("🔧 进入工具调用阶段")
         edit_content = data.get("edit_content", "")
+        edit_index = data.get("edit_index", 0)
         if not edit_content:
             return
+        # logger.debug(f"📦 接收内容片段 [index={edit_index}]: {edit_content[:1000]}...")
+        # Apply the edit to the content buffer at edit_index.
+        self._apply_edit_to_buffer(edit_index, edit_content)
+        # Re-scan the whole buffer for tool calls.
+        yield from self._process_tool_calls_from_buffer(is_stream)
+    def _apply_edit_to_buffer(self, edit_index: int, edit_content: str):
+        """
+        Overwrite the content buffer with ``edit_content`` starting at ``edit_index``.
+        The text is UTF-8 encoded and written over the bytes already at that
+        position (replace, not insert); the buffer is first grown with NUL
+        bytes when it is too short.
+        NOTE(review): ``edit_index`` is applied as a byte offset into the
+        UTF-8 buffer. If the upstream index counts characters, non-ASCII
+        content would land at the wrong position -- confirm against the API.
+        """
+        edit_bytes = edit_content.encode('utf-8')
+        required_length = edit_index + len(edit_bytes)
+        # Grow the buffer up to edit_index when the edit starts past its end.
+        if len(self.content_buffer) < edit_index:
+            # The gap is filled with NUL bytes.
+            self.content_buffer.extend(b'\x00' * (edit_index - len(self.content_buffer)))
+        # Grow the buffer so the whole edit fits.
+        if len(self.content_buffer) < required_length:
+            self.content_buffer.extend(b'\x00' * (required_length - len(self.content_buffer)))
+        # Overwrite in place; the slice and the replacement have equal length.
+        end_index = edit_index + len(edit_bytes)
+        self.content_buffer[edit_index:end_index] = edit_bytes
+        # logger.debug(f"📝 缓冲区更新 [index={edit_index}, 长度={len(self.content_buffer)}]")
+    def _process_tool_calls_from_buffer(self, is_stream: bool) -> Generator[str, None, None]:
+        """
+        Decode the content buffer and process the tool calls found in it.
+        Any exception raised while decoding or processing is logged at debug
+        level and suppressed, so a failure simply ends this pass.
+        """
+        try:
+            # Decode leniently (undecodable bytes are dropped) and strip the
+            # NUL padding bytes.
+            content_str = self.content_buffer.decode('utf-8', errors='ignore').replace('\x00', '')
+            yield from self._extract_and_process_tools(content_str, is_stream)
+        except Exception as e:
+            logger.debug(f"📦 内容解析暂时失败，等待更多数据: {e}")
+            # Deliberately not re-raised: the next event triggers another pass.
+    def _extract_and_process_tools(self, content_str: str, is_stream: bool) -> Generator[str, None, None]:
+        """
+        Find every ``<glm_block>`` in ``content_str`` and process each one.
+        Yields the SSE strings produced for the individual blocks.
+        """
+        # Capture the text after each opening tag up to its closing tag or,
+        # for a block that is not closed yet, up to the end of the content.
+        pattern = r'<glm_block\s*>(.*?)(?:</glm_block>|$)'
+        matches = re.findall(pattern, content_str, re.DOTALL)
+        for block_content in matches:
+            # Each block is handled independently.
+            yield from self._process_single_tool_block(block_content, is_stream)
+    def _process_single_tool_block(self, block_content: str, is_stream: bool) -> Generator[str, None, None]:
+        """
+        Process the content of one glm_block, complete or still partial.
+        A block that parses as JSON has its id, name and arguments read from
+        ``data.metadata`` and is passed to ``_handle_tool_update``; blocks
+        without an id or a name are ignored. A block that does not parse is
+        passed to ``_handle_partial_tool_block``. Any other exception is
+        logged at debug level and suppressed.
+        """
         try:
+            # Repair the brace balance, then parse the block as JSON.
+            fixed_content = self._fix_json_structure(block_content)
+            tool_data = json.loads(fixed_content)
+            metadata = tool_data.get("data", {}).get("metadata", {})
+            tool_id = metadata.get("id", "")
+            tool_name = metadata.get("name", "")
+            arguments_raw = metadata.get("arguments", "{}")
+            if not tool_id or not tool_name:
+                return
+            logger.debug(f"🎯 解析完整工具块: {tool_name}(id={tool_id}), 参数: {arguments_raw}")
+            # Register the tool or refresh its arguments.
+            yield from self._handle_tool_update(tool_id, tool_name, arguments_raw, is_stream)
         except json.JSONDecodeError as e:
+            logger.debug(f"📦 JSON解析失败: {e}, 尝试部分解析")
+            # Incomplete JSON: fall back to regex-based partial extraction.
+            yield from self._handle_partial_tool_block(block_content, is_stream)
+        except Exception as e:
+            logger.debug(f"📦 工具块处理失败: {e}")
+    def _fix_json_structure(self, content: str) -> str:
+        """
+        Drop surplus closing braces from ``content``.
+        When the text holds more ``}`` than ``{`` characters, the right-most
+        ``}`` is removed once per surplus brace; otherwise the text is
+        returned unchanged. Braces are counted over the raw text, so braces
+        inside string values are counted as well.
+        """
+        if not content:
+            return content
+        # Raw character counts, not a structural parse.
+        open_braces = content.count('{')
+        close_braces = content.count('}')
+        # Only a surplus of closing braces is repaired.
+        if close_braces > open_braces:
+            excess = close_braces - open_braces
+            fixed_content = content
+            for _ in range(excess):
+                # Cut out the last remaining closing brace.
+                last_brace_pos = fixed_content.rfind('}')
+                if last_brace_pos != -1:
+                    fixed_content = fixed_content[:last_brace_pos] + fixed_content[last_brace_pos + 1:]
+            return fixed_content
+        return content
+    def _handle_tool_update(self, tool_id: str, tool_name: str, arguments_raw: str, is_stream: bool) -> Generator[str, None, None]:
+        """
+        处理工具的创建或更新
+        """
+        # 解析参数
+        try:
+            if isinstance(arguments_raw, str):
+                # 先处理转义和清理
+                cleaned_args = self._clean_arguments_string(arguments_raw)
+                arguments = json.loads(cleaned_args) if cleaned_args.strip() else {}
+            else:
+                arguments = arguments_raw
+        except json.JSONDecodeError:
+            logger.debug(f"📦 参数解析失败，使用部分参数: {arguments_raw[:100]}")
+            arguments = self._parse_partial_arguments(arguments_raw)
+        # 检查是否是新工具
+        if tool_id not in self.active_tools:
+            logger.debug(f"🎯 发现新工具: {tool_name}(id={tool_id})")
+            self.active_tools[tool_id] = {
+                "id": tool_id,
+                "name": tool_name,
+                "arguments": arguments,
+                "status": "active",
+                "sent_start": False,
+                "sent_args": False
+            }
             if is_stream:
+                # 发送工具开始信号
+                yield self._create_tool_start_chunk(tool_id, tool_name)
+                self.active_tools[tool_id]["sent_start"] = True
+        # 更新参数（如果有变化）
+        current_tool = self.active_tools[tool_id]
+        if current_tool["arguments"] != arguments:
+            current_tool["arguments"] = arguments
+            if is_stream and current_tool["sent_start"] and not current_tool["sent_args"]:
+                # 发送工具参数
+                yield self._create_tool_arguments_chunk(tool_id, arguments)
+                current_tool["sent_args"] = True
+    def _handle_partial_tool_block(self, block_content: str, is_stream: bool) -> Generator[str, None, None]:
+        """
+        Extract what is available from a block that is not valid JSON yet.
+        The tool id and name are pulled out with regular expressions; nothing
+        happens unless both are found. A tool seen for the first time is
+        recorded with status "partial" and, when streaming, announced with a
+        start chunk. For a known tool only ``partial_args`` is refreshed.
+        Exceptions are logged at debug level and suppressed.
+        """
+        try:
+            # First "id" and "name" string fields found in the raw text.
+            id_match = re.search(r'"id":\s*"([^"]+)"', block_content)
+            name_match = re.search(r'"name":\s*"([^"]+)"', block_content)
+            if id_match and name_match:
+                tool_id = id_match.group(1)
+                tool_name = name_match.group(1)
+                # Captures the arguments text up to the next double quote, so
+                # the capture also stops at an escaped quote.
+                args_match = re.search(r'"arguments":\s*"([^"]*)', block_content)
+                partial_args = args_match.group(1) if args_match else ""
+                logger.debug(f"📦 部分工具块: {tool_name}(id={tool_id}), 部分参数: {partial_args[:50]}")
+                # First sighting: create the record with empty arguments.
+                if tool_id not in self.active_tools:
+                    self.active_tools[tool_id] = {
+                        "id": tool_id,
+                        "name": tool_name,
+                        "arguments": {},
+                        "status": "partial",
+                        "sent_start": False,
+                        "sent_args": False,
+                        "partial_args": partial_args
+                    }
+                    if is_stream:
+                        yield self._create_tool_start_chunk(tool_id, tool_name)
+                        self.active_tools[tool_id]["sent_start"] = True
+                else:
+                    # Known tool: keep only the latest partial arguments text.
+                    # NOTE(review): nothing in the visible code reads this value.
+                    self.active_tools[tool_id]["partial_args"] = partial_args
+        except Exception as e:
+            logger.debug(f"📦 部分块解析失败: {e}")
+    def _clean_arguments_string(self, arguments_raw: str) -> str:
+        """
+        清理和标准化参数字符串
+        """
+        if not arguments_raw:
+            return "{}"
+        # 移除首尾空白
+        cleaned = arguments_raw.strip()
+        # 处理特殊值
+        if cleaned.lower() == "null":
+            return "{}"
+        # 处理转义的JSON字符串
+        if cleaned.startswith('{\\"') and cleaned.endswith('\\"}'):
+            # 这是一个转义的JSON字符串，需要反转义
+            cleaned = cleaned.replace('\\"', '"')
+        elif cleaned.startswith('"{\\"') and cleaned.endswith('\\"}'):
+            # 双重转义的情况
+            cleaned = cleaned[1:-1].replace('\\"', '"')
+        # 标准化空格（移除JSON中的多余空格，但保留字符串值中的空格）
+        try:
+            # 先尝试解析，然后重新序列化以标准化格式
+            parsed = json.loads(cleaned)
+            if parsed is None:
+                return "{}"
+            cleaned = json.dumps(parsed, ensure_ascii=False, separators=(',', ':'))
+        except json.JSONDecodeError:
+            # 如果解析失败，只做基本的空格清理
+            pass
+        return cleaned
+    def _parse_partial_arguments(self, arguments_raw: str) -> Dict[str, Any]:
+        """
+        Best-effort parse of an incomplete arguments string.
+        Tries, in order: (1) clean and parse the string as JSON, accepting the
+        result only when it is a dict; (2) unescape quotes, add a missing
+        leading ``{``, close an unbalanced quote and add a missing trailing
+        ``}``, then parse again; (3) regex extraction of flat key/value pairs.
+        Empty, blank or ``null`` input, and any unexpected error in step 2,
+        give an empty dict.
+        """
+        if not arguments_raw or arguments_raw.strip() == "" or arguments_raw.strip().lower() == "null":
+            return {}
+        try:
+            # Step 1: normalise, then parse.
+            cleaned = self._clean_arguments_string(arguments_raw)
+            result = json.loads(cleaned)
+            # Non-dict JSON values are replaced by an empty dict.
+            return result if isinstance(result, dict) else {}
+        except json.JSONDecodeError:
+            pass
+        try:
+            # Step 2: patch up common truncation damage.
+            fixed_args = arguments_raw.strip()
+            # Unescape quotes.
+            if '\\' in fixed_args:
+                fixed_args = fixed_args.replace('\\"', '"')
+            # Add the opening brace when it is missing.
+            if not fixed_args.startswith('{'):
+                fixed_args = '{' + fixed_args
+            # Add the closing brace when it is missing.
+            if not fixed_args.endswith('}'):
+                # An odd number of unescaped quotes means a string was cut off.
+                quote_count = fixed_args.count('"') - fixed_args.count('\\"')
+                if quote_count % 2 != 0:
+                    fixed_args += '"'
+                fixed_args += '}'
+            return json.loads(fixed_args)
+        except json.JSONDecodeError:
+            # Step 3: regex extraction of key/value pairs.
+            return self._extract_key_value_pairs(arguments_raw)
+        except Exception:
+            # Everything failed: return no arguments.
+            return {}
+    def _extract_key_value_pairs(self, text: str) -> Dict[str, Any]:
+        """
+        从文本中提取键值对，作为最后的解析尝试
+        """
+        result = {}
+        try:
+            # 使用正则表达式提取简单的键值对
+            import re
+            # 匹配 "key": "value" 或 "key": value 格式
+            pattern = r'"([^"]+)":\s*"([^"]*)"'
+            matches = re.findall(pattern, text)
+            for key, value in matches:
+                result[key] = value
+            # 匹配数字值
+            pattern = r'"([^"]+)":\s*(\d+)'
+            matches = re.findall(pattern, text)
+            for key, value in matches:
+                try:
+                    result[key] = int(value)
+                except ValueError:
+                    result[key] = value
+            # 匹配布尔值
+            pattern = r'"([^"]+)":\s*(true|false)'
+            matches = re.findall(pattern, text)
+            for key, value in matches:
+                result[key] = value.lower() == 'true'
+        except Exception:
+            pass
+        return result
+    def _complete_active_tools(self, is_stream: bool) -> Generator[str, None, None]:
+        """
+        Mark every active tool call as completed.
+        Each active tool gets status "completed" and is appended to
+        ``completed_tools``; ``active_tools`` is then emptied. When streaming
+        and ``completed_tools`` is non-empty (it also holds tools completed by
+        earlier calls), one finish chunk is yielded.
+        """
+        for tool_id, tool in self.active_tools.items():
+            tool["status"] = "completed"
+            self.completed_tools.append(tool)
+            logger.debug(f"✅ 完成工具调用: {tool['name']}(id={tool_id})")
+        self.active_tools.clear()
+        if is_stream and self.completed_tools:
+            # Signal the end of the tool calls.
+            # NOTE(review): _create_tool_finish_chunk is defined outside the visible diff.
+            yield self._create_tool_finish_chunk()
     def process_other_phase(self, data: Dict[str, Any], is_stream: bool = True) -> Generator[str, None, None]:
         """
+        处理other阶段 - 检测工具调用结束和状态更新
         """
         edit_content = data.get("edit_content", "")
+        edit_index = data.get("edit_index", 0)
         usage = data.get("usage")
         # 保存usage信息
             self.tool_call_usage = usage
             logger.debug(f"💾 保存工具调用usage: {usage}")
+        # 如果有edit_content，继续更新内容缓冲区
+        if edit_content:
+            self._apply_edit_to_buffer(edit_index, edit_content)
+            # 继续处理可能的工具调用更新
+            yield from self._process_tool_calls_from_buffer(is_stream)
+        # 检测工具调用结束的多种标记
+        if self.has_tool_call and self._is_tool_call_finished(edit_content):
+            logger.debug("🏁 检测到工具调用结束")
+            # 完成所有活跃的工具
+            yield from self._complete_active_tools(is_stream)
+            if is_stream:
+                logger.info("🏁 发送工具调用完成信号")
+                yield "data: [DONE]\n\n"
+            # 重置工具调用状态
             self.has_tool_call = False
+    def _is_tool_call_finished(self, edit_content: str) -> bool:
+        """
+        检测工具调用是否结束的多种标记
+        """
+        if not edit_content:
+            return False
+        # 检测各种结束标记
+        end_markers = [
+            "null,",  # 原有的结束标记
+            '"status": "completed"',  # 状态完成标记
+            '"is_error": false',  # 错误状态标记
+        ]
+        for marker in end_markers:
+            if marker in edit_content:
+                logger.debug(f"🔍 检测到结束标记: {marker}")
+                return True
+        # 检查是否所有工具都有完整的结构
+        if self.active_tools and '"status": "completed"' in self.content_buffer:
+            return True
+        return False
     def _reset_all_state(self):
         """Reset the tool-call tracking state; ``has_thinking`` is left untouched."""
         self.has_tool_call = False
         self.tool_call_usage = None
         self.content_index = 0
+        # Start again with an empty content buffer and no tracked tools.
+        self.content_buffer = bytearray()
+        self.last_edit_index = 0
+        self.active_tools.clear()
+        self.completed_tools.clear()
+        self.tool_blocks_cache.clear()
+    def _create_tool_start_chunk(self, tool_id: str, tool_name: str) -> str:
         """创建工具调用开始的chunk"""
         chunk = {
             "choices": [
                         "content": None,
                         "tool_calls": [
                             {
+                                "id": tool_id,
                                 "type": "function",
+                                "function": {"name": tool_name, "arguments": "{}"},
                             }
                         ],
                     },
         }
         return f"data: {json.dumps(chunk, ensure_ascii=False)}\n\n"
+    def _create_tool_arguments_chunk(self, tool_id: str, arguments: Dict) -> str:
         """创建工具参数的chunk"""
         chunk = {
             "choices": [
                         "content": None,
                         "tool_calls": [
                             {
+                                "id": tool_id,
                                 "type": "function",
                                 "function": {"name": None, "arguments": json.dumps(arguments, ensure_ascii=False)},
                             }
                         ],
                     },
                     "finish_reason": None,
+                    "index": self.content_index,
                     "logprobs": None,
                 }
             ],