File size: 49,591 Bytes

5374a2d

from typing import Dict, Any, List, Optional, Tuple
import random
import json
import os
from pydantic import Field

from ...workflow.action_graph import ActionGraph
from ...models.model_configs import LLMConfig, OpenAILLMConfig
from ...models.base_model import LLMOutputParser
from ...workflow.operators import QAScEnsemble
from .utils import (
    format_transcript,
    collect_last_round_candidates,
    collect_round_candidates,
)
from ...prompts.workflow.multi_agent_debate import (
    DEBATER_AGENT_PROMPT,
    JUDGE_AGENT_PROMPT,
    build_agent_prompt,
    build_judge_prompt,
    get_default_personas,
)
from .pruning import PruningPipeline
from ...agents.customize_agent import CustomizeAgent


class DebateAgentOutput(LLMOutputParser):
    """Output structure for individual debater in a round."""

    thought: str = Field(default="", description="Thinking process")
    argument: str = Field(default="", description="Argument or rebuttal for this round")
    answer: Optional[str] = Field(default=None, description="Current answer for this round (optional)")


class DebateJudgeOutput(LLMOutputParser):
    """Final judgment from judge after debate."""

    rationale: str = Field(default="", description="Judging rationale")
    winning_agent_id: int = Field(default=0, description="Winning debater ID (starting from 0)")
    final_answer: str = Field(default="", description="Final answer")


class MultiAgentDebateActionGraph(ActionGraph):
    """Multi-Agent Debate ActionGraph implementation (Google MAD style)."""

    name: str = "MultiAgentDebate"
    description: str = "Multi-agent debate workflow framework"
    # Unified LLM configuration: default configuration for all agents
    llm_config: LLMConfig = Field(default_factory=lambda: OpenAILLMConfig(
        model="gpt-4o-mini",
        openai_key=os.getenv("OPENAI_API_KEY")
    ), description="Default LLM configuration for all agents")
    # Unified agent configuration: all debaters use the same agent configuration
    debater_agents: Optional[List[CustomizeAgent]] = Field(default=None, description="Optional: multiple debater CustomizeAgents, randomly selected during execution")
    judge_agent: Optional[CustomizeAgent] = Field(default=None, description="Optional: judge CustomizeAgent, used for judging phase if provided")
    # Optional model pool: for random selection of different models
    llm_config_pool: Optional[List[LLMConfig]] = Field(default=None, description="Optional: LLM configuration pool for random selection, provides choices for agents without specified models")
    # Group workflow mode (each position occupied by an independent workflow graph instead of agent)
    group_graphs_enabled: bool = Field(default=False, description="Enable group graph mode: replace individual debaters with workflow graphs")
    group_graphs: Optional[List[ActionGraph]] = Field(default=None, description="When group graph mode is enabled, provide workflow graph list (length >= 1)")

    # Runtime attributes
    _sc_ensemble: Optional[QAScEnsemble] = None

    def init_module(self):
        """Initialize module (create LLM, construct reusable operators)."""
        super().init_module()
        
        # Configuration conflict and integrity validation
        if self.group_graphs_enabled and self.debater_agents:
            raise ValueError(
                "Configuration conflict: cannot configure debater_agents when group_graphs_enabled is enabled."
            )
        if self.group_graphs_enabled and (not self.group_graphs or len(self.group_graphs) == 0):
            raise ValueError(
                "Configuration error: must provide non-empty group_graphs list when group graph mode is enabled."
            )
        if (not self.group_graphs_enabled) and self.group_graphs:
            raise ValueError(
                "Configuration error: provided group_graphs but did not enable group_graphs_enabled. Please enable both or remove group_graphs."
            )
        
        self._sc_ensemble = QAScEnsemble(self._llm)
           
    def _create_default_debater_agent(self) -> CustomizeAgent:
        """Create default debater CustomizeAgent (XML parsing thought/argument/answer)."""
        llm_config = random.choice(self.llm_config_pool) if self.llm_config_pool else self.llm_config
        
        return CustomizeAgent(
            name="DebaterAgent",
            description="Generate argument/rebuttal and optional answer per debate round.",
            prompt=DEBATER_AGENT_PROMPT,
            llm_config=llm_config,
            inputs=[
                {"name": "problem", "type": "str", "description": "Problem statement"},
                {"name": "transcript_text", "type": "str", "description": "Formatted debate transcript so far"},
                {"name": "role", "type": "str", "description": "Debater role/persona"},
                {"name": "agent_id", "type": "str", "description": "Debater id (string)"},
                {"name": "round_index", "type": "str", "description": "1-based round index"},
                {"name": "total_rounds", "type": "str", "description": "Total rounds"},
            ],
            outputs=[
                {"name": "thought", "type": "str", "description": "Brief reasoning", "required": True},
                {"name": "argument", "type": "str", "description": "Argument or rebuttal", "required": True},
                {"name": "answer", "type": "str", "description": "Optional current answer", "required": False},
            ],
            parse_mode="xml",
        )

    def _create_default_judge_agent(self) -> CustomizeAgent:
        """Create default judge CustomizeAgent (XML parsing rationale/winning_agent_id/final_answer)."""
        llm_config = random.choice(self.llm_config_pool) if self.llm_config_pool else self.llm_config
        
        return CustomizeAgent(
            name="JudgeAgent",
            description="Deliver final decision and answer based on debate transcript.",
            prompt=JUDGE_AGENT_PROMPT,
            llm_config=llm_config,
            inputs=[
                {"name": "problem", "type": "str", "description": "Problem statement"},
                {"name": "transcript_text", "type": "str", "description": "Formatted debate transcript"},
                {"name": "roles_text", "type": "str", "description": "Roles listing text"},
            ],
            outputs=[
                {"name": "rationale", "type": "str", "description": "Judging rationale", "required": True},
                {"name": "winning_agent_id", "type": "str", "description": "Winning agent id (integer as string)", "required": True},
                {"name": "final_answer", "type": "str", "description": "Final answer", "required": True},
            ],
            parse_mode="xml",
        )

    def execute(
        self,
        problem: str,
        num_agents: int = 3,
        num_rounds: int = 3,
        judge_mode: str = "llm_judge",  # options: ["llm_judge", "self_consistency"]
        personas: Optional[List[str]] = None,
        return_transcript: bool = True,
        agent_llm_configs: Optional[List[LLMConfig]] = None,
        enable_pruning: bool = False,
        pruning_qp_threshold: float = 0.15,
        pruning_dp_similarity_threshold: float = 0.92,
        pruning_enable_mr: bool = False,
        pruning_mr_llm_config: Optional[LLMConfig] = None,
        pruning_snapshot_mode: bool = False,
        transcript_mode: str = "prev",  # options: ["prev", "all"]
        **kwargs,
    ) -> dict:
        """Execute debate workflow (synchronous)."""
        state = self._setup_debate(problem, num_agents, num_rounds, personas, agent_llm_configs)
        transcript = self._run_debate_rounds(problem, state, transcript_mode)
        # Pruning (before consensus, filter and optionally correct last round candidates)
        pruning_info = None
        pruning_debug = None
        pruning_rounds_debug: Optional[List[Dict[str, Any]]] = None
        if enable_pruning:
            # Set minimum retention based on participants (default ratio 0.3, at least 1)
            min_keep = max(1, int(round(state["num_agents"] * 0.3)))
            pipeline = PruningPipeline(
                enable_qp=True,
                enable_dp=True,
                enable_mr=pruning_enable_mr,
                qp_threshold=pruning_qp_threshold,
                dp_similarity_threshold=pruning_dp_similarity_threshold,
                mr_llm_config=pruning_mr_llm_config,
                min_keep_count=min_keep,
            )
            if pruning_snapshot_mode:
                # Generate snapshot for each round (doesn't change main flow, only for display)
                pruning_rounds_debug = []
                for r in range(state["num_rounds"]):
                    rcands = collect_round_candidates(
                        transcript=transcript, num_agents=state["num_agents"], round_index=r
                    )
                    info_r = pipeline.apply(problem=problem, candidates=rcands)
                    pruning_rounds_debug.append(
                        {
                            "round": r,
                            "before_candidates": rcands,
                            "after_candidates": info_r.get("candidates", []),
                            "mr_suggested": info_r.get("mr_suggested"),
                        }
                    )
            candidates = collect_last_round_candidates(
                transcript=transcript, num_agents=state["num_agents"], last_round_index=state["num_rounds"] - 1
            )
            pruning_info = pipeline.apply(problem=problem, candidates=candidates)
            try:
                pruning_debug = {
                    "before_candidates": candidates,
                    "after_candidates": pruning_info.get("candidates", []),
                    "mr_suggested": pruning_info.get("mr_suggested"),
                }
            except Exception:
                pruning_debug = None
        consensus = self._generate_consensus(problem, state, transcript, judge_mode, pruning_info)
        result: Dict[str, Any] = {
            "final_answer": consensus["final_answer"],
            "winner": consensus.get("winner"),
            "rationale": consensus.get("rationale"),
        }
        if return_transcript:
            result["transcript"] = transcript
        if enable_pruning and pruning_debug is not None:
            result["pruning"] = pruning_debug
        if enable_pruning and pruning_snapshot_mode and pruning_rounds_debug is not None:
            result["pruning_rounds"] = pruning_rounds_debug
        return result

    async def async_execute(
        self,
        problem: str,
        num_agents: int = 3,
        num_rounds: int = 3,
        judge_mode: str = "llm_judge",
        personas: Optional[List[str]] = None,
        return_transcript: bool = True,
        agent_llm_configs: Optional[List[LLMConfig]] = None,
        enable_pruning: bool = False,
        pruning_qp_threshold: float = 0.15,
        pruning_dp_similarity_threshold: float = 0.92,
        pruning_enable_mr: bool = False,
        pruning_mr_llm_config: Optional[LLMConfig] = None,
        pruning_snapshot_mode: bool = False,
        transcript_mode: str = "prev",  # options: ["prev", "all"]
        **kwargs,
    ) -> dict:
        """Execute debate workflow (asynchronous)."""
        state = self._setup_debate(problem, num_agents, num_rounds, personas, agent_llm_configs)
        transcript = await self._run_debate_rounds_async(problem, state, transcript_mode)
        pruning_info = None
        pruning_debug = None
        pruning_rounds_debug: Optional[List[Dict[str, Any]]] = None
        if enable_pruning:
            min_keep = max(1, int(round(state["num_agents"] * 0.3)))
            pipeline = PruningPipeline(
                enable_qp=True,
                enable_dp=True,
                enable_mr=pruning_enable_mr,
                qp_threshold=pruning_qp_threshold,
                dp_similarity_threshold=pruning_dp_similarity_threshold,
                mr_llm_config=pruning_mr_llm_config,
                min_keep_count=min_keep,
            )
            if pruning_snapshot_mode:
                pruning_rounds_debug = []
                for r in range(state["num_rounds"]):
                    rcands = collect_round_candidates(
                        transcript=transcript, num_agents=state["num_agents"], round_index=r
                    )
                    info_r = pipeline.apply(problem=problem, candidates=rcands)
                    pruning_rounds_debug.append(
                        {
                            "round": r,
                            "before_candidates": rcands,
                            "after_candidates": info_r.get("candidates", []),
                            "mr_suggested": info_r.get("mr_suggested"),
                        }
                    )
            candidates = collect_last_round_candidates(
                transcript=transcript, num_agents=state["num_agents"], last_round_index=state["num_rounds"] - 1
            )
            pruning_info = pipeline.apply(problem=problem, candidates=candidates)
            try:
                pruning_debug = {
                    "before_candidates": candidates,
                    "after_candidates": pruning_info.get("candidates", []),
                    "mr_suggested": pruning_info.get("mr_suggested"),
                }
            except Exception:
                pruning_debug = None
        consensus = await self._generate_consensus_async(problem, state, transcript, judge_mode, pruning_info)
        result: Dict[str, Any] = {
            "final_answer": consensus["final_answer"],
            "winner": consensus.get("winner"),
        }
        if return_transcript:
            result["transcript"] = transcript
        if enable_pruning and pruning_debug is not None:
            result["pruning"] = pruning_debug
        if enable_pruning and pruning_snapshot_mode and pruning_rounds_debug is not None:
            result["pruning_rounds"] = pruning_rounds_debug
        return result

    def _setup_debate(
        self,
        problem: str,
        num_agents: int,
        num_rounds: int,
        personas: Optional[List[str]],
        agent_llm_configs: Optional[List[LLMConfig]] = None,
    ) -> dict:
        """Setup debate environment."""
        if num_agents <= 1:
            raise ValueError("num_agents must be greater than 1")
        if num_rounds <= 0:
            raise ValueError("num_rounds must be positive")

        roles: List[str] = personas or get_default_personas(num_agents)
        # Based on user input or model pool, prepare each agent object (fixed for entire battle cycle, not randomly changed per round)
        agents_for_ids: List[CustomizeAgent] = self._prepare_runtime_debaters(num_agents, agent_llm_configs)
        state: Dict[str, Any] = {
            "problem": problem,
            "num_agents": num_agents,
            "num_rounds": num_rounds,
            "roles": roles,
            "agents": agents_for_ids,
        }
        return state

    def _prepare_runtime_debaters(self, num_agents: int, agent_llm_configs: Optional[List[LLMConfig]]) -> List[CustomizeAgent]:
        """Select CustomizeAgent for each agent_id that remains unchanged throughout the debate.
        Priority:
        1) User explicitly passes debater_agents → cycle/truncate by length and assign to each position
        2) Pass agent_llm_configs → create default debater for each position
        3) Use llm_config_pool random selection → create default debater for each position (prioritized over default llm_config)
        4) Fallback to default llm_config
        """
        # If group graph mode is enabled, don't generate internal agents (driven by group_graphs instead)
        if self.group_graphs_enabled:
            return []
        
        # 1) Explicit multiple agents
        if self.debater_agents:
            agents: List[CustomizeAgent] = []
            for i in range(num_agents):
                agents.append(self.debater_agents[i % len(self.debater_agents)])
            return agents
        
        # 2) Create based on passed agent_llm_configs
        if agent_llm_configs and len(agent_llm_configs) > 0:
            return [
                self._create_debater_agent_with_llm(agent_llm_configs[i % len(agent_llm_configs)])
                for i in range(num_agents)
            ]
        
        # 3) Use llm_config_pool random selection
        if self.llm_config_pool and len(self.llm_config_pool) > 0:
            return [self._create_debater_agent_with_llm(random.choice(self.llm_config_pool)) for _ in range(num_agents)]
        
        # 4) Default: use llm_config
        default_agent = self._create_default_debater_agent()
        return [default_agent for _ in range(num_agents)]

    def _create_debater_agent_with_llm(self, llm_cfg: LLMConfig) -> CustomizeAgent:
        """Create a debater agent with given LLM configuration that is consistent with default structure."""
        return CustomizeAgent(
            name="DebaterAgent",
            description="Generate argument/rebuttal and optional answer per debate round.",
            prompt=DEBATER_AGENT_PROMPT,
            llm_config=llm_cfg,
            inputs=[
                {"name": "problem", "type": "str", "description": "Problem statement"},
                {"name": "transcript_text", "type": "str", "description": "Formatted debate transcript so far"},
                {"name": "role", "type": "str", "description": "Debater role/persona"},
                {"name": "agent_id", "type": "str", "description": "Debater id (string)"},
                {"name": "round_index", "type": "str", "description": "1-based round index"},
                {"name": "total_rounds", "type": "str", "description": "Total rounds"},
            ],
            outputs=[
                {"name": "thought", "type": "str", "description": "Brief reasoning", "required": True},
                {"name": "argument", "type": "str", "description": "Argument or rebuttal", "required": True},
                {"name": "answer", "type": "str", "description": "Optional current answer", "required": False},
            ],
            parse_mode="xml",
        )

    def _run_debate_rounds(self, problem: str, state: dict, transcript_mode: str = "prev") -> List[dict]:
        """Run debate rounds (synchronous). Return transcript.
        
        Args:
            transcript_mode: Control transcript range accessible to agents
                - "prev": Can only see n-1 round speeches (default)
                - "all": Can see all previous round speeches
        """
        transcript: List[dict] = []
        num_agents: int = state["num_agents"]
        num_rounds: int = state["num_rounds"]
        roles: List[str] = state["roles"]

        for round_index in range(num_rounds):
            for agent_id in range(num_agents):
                # Group graph mode: call corresponding graph.execute()
                if self.group_graphs_enabled and self.group_graphs:
                    graph = self.group_graphs[agent_id % len(self.group_graphs)]
                    # Get corresponding transcript based on access mode
                    transcript_text = self._get_transcript_for_agent(
                        transcript, round_index, agent_id, transcript_mode, num_agents
                    )
                    g_inputs = {
                        "problem": problem,
                        "transcript_text": transcript_text,
                        "role": roles[agent_id],
                        "agent_id": str(agent_id),
                        "round_index": str(round_index + 1),
                        "total_rounds": str(num_rounds),
                    }
                    g_out = graph.execute(**g_inputs)
                    structured = {
                        "argument": g_out.get("argument", g_out.get("output", "")),
                        "answer": g_out.get("answer"),
                        "thought": g_out.get("thought", ""),
                    }
                else:
                    # If _setup_debate has determined agent for each position, use directly
                    selected_agent: Optional[CustomizeAgent] = None
                    agents_for_ids: Optional[List[CustomizeAgent]] = state.get("agents")
                    if agents_for_ids:
                        selected_agent = agents_for_ids[agent_id]
                    elif self.debater_agents:
                        selected_agent = random.choice(self.debater_agents)

                    if selected_agent is not None:
                        try:
                            # Get corresponding transcript based on access mode
                            transcript_text = self._get_transcript_for_agent(
                                transcript, round_index, agent_id, transcript_mode, num_agents
                            )
                            inputs = {
                                "problem": problem,
                                "transcript_text": transcript_text,
                                "role": roles[agent_id],
                                "agent_id": str(agent_id),
                                "round_index": str(round_index + 1),
                                "total_rounds": str(num_rounds),
                            }
                            msg = selected_agent(inputs=inputs)
                            structured = msg.content.get_structured_data()
                        except Exception as e:
                            print(f"Agent execution error: {e}")
                            structured = {"argument": "", "answer": "", "thought": ""}
                    else:
                        # Get corresponding transcript based on access mode
                        transcript_text = self._get_transcript_for_agent(
                            transcript, round_index, agent_id, transcript_mode, num_agents
                        )
                        prompt = build_agent_prompt(
                            problem=problem,
                            transcript_text=transcript_text,
                            role=roles[agent_id],
                            agent_id=agent_id,
                            round_index=round_index,
                            total_rounds=num_rounds,
                        )
                        response = self._llm.generate(
                            prompt=prompt,
                            parser=DebateAgentOutput,
                            parse_mode="xml",
                        )
                        structured = response.get_structured_data()
                transcript.append(
                    {
                        "agent_id": agent_id,
                        "round": round_index,
                        "role": roles[agent_id],
                        "argument": structured.get("argument", ""),
                        "answer": structured.get("answer"),
                        "thought": structured.get("thought", ""),
                    }
                )
                # Print each agent's output immediately (synchronous, complete content)
                try:
                    arg_full = str(structured.get("argument", "")).strip()
                    ans_full = str(structured.get("answer") or "").strip()
                    print(
                        f"[Round {round_index + 1}] Agent#{agent_id} ({roles[agent_id]})\n"
                        f"Argument: {arg_full}\n"
                        f"Answer: {ans_full}\n"
                    )
                except Exception:
                    pass
        return transcript

    def _get_transcript_for_agent(self, transcript: List[dict], round_index: int, agent_id: int, 
                                 transcript_mode: str, num_agents: int) -> str:
        """根据访问模式获取agent可以访问的transcript。
        
        Args:
            transcript: 完整的transcript
            round_index: 当前轮次索引
            agent_id: 当前agent的ID
            transcript_mode: 访问模式
                - "prev": 只能看到n-1轮次的发言（默认）
                - "all": 可以看到之前所有轮次的发言
            num_agents: agent总数
            
        Returns:
            str: 格式化后的transcript文本
        """
        if transcript_mode == "prev":
            # 只包含当前轮次之前的transcript（n-1轮次）
            filtered_transcript = [t for t in transcript if t["round"] < round_index]
        elif transcript_mode == "all":
            # 包含当前轮次之前的所有transcript + 当前轮次中当前agent之前的发言
            filtered_transcript = []
            for t in transcript:
                if t["round"] < round_index:
                    # 之前轮次的所有发言
                    filtered_transcript.append(t)
                elif t["round"] == round_index and t["agent_id"] < agent_id:
                    # 当前轮次中，当前agent之前的发言
                    filtered_transcript.append(t)
        else:
            # 默认使用prev
            filtered_transcript = [t for t in transcript if t["round"] < round_index]
        
        return format_transcript(filtered_transcript)

    async def _run_debate_rounds_async(self, problem: str, state: dict, transcript_mode: str = "prev") -> List[dict]:
        """运行辩论轮次（异步）。返回 transcript。
        
        Args:
            transcript_mode: 控制agent可以访问的transcript范围
                - "prev": 只能看到n-1轮次的发言（默认）
                - "all": 可以看到之前所有轮次的发言
        """
        transcript: List[dict] = []
        num_agents: int = state["num_agents"]
        num_rounds: int = state["num_rounds"]
        roles: List[str] = state["roles"]

        for round_index in range(num_rounds):
            # 每个回合内可并行生成
            # 注意：在异步版本中，我们需要为每个agent单独计算transcript
            # 若分组图模式：逐个调用 graph.execute()（并发复杂性留待后续）
            if self.group_graphs_enabled and self.group_graphs:
                for agent_id in range(num_agents):
                    graph = self.group_graphs[agent_id % len(self.group_graphs)]
                    # 根据访问模式获取相应的transcript
                    transcript_text = self._get_transcript_for_agent(
                        transcript, round_index, agent_id, transcript_mode, num_agents
                    )
                    g_inputs = {
                        "problem": problem,
                        "transcript_text": transcript_text,
                        "role": roles[agent_id],
                        "agent_id": str(agent_id),
                        "round_index": str(round_index + 1),
                        "total_rounds": str(num_rounds),
                    }
                    g_out = graph.execute(**g_inputs)
                    structured = {
                        "argument": g_out.get("argument", g_out.get("output", "")),
                        "answer": g_out.get("answer"),
                        "thought": g_out.get("thought", ""),
                    }
                    transcript.append(
                        {
                            "agent_id": agent_id,
                            "round": round_index,
                            "role": roles[agent_id],
                            "argument": structured.get("argument", ""),
                            "answer": structured.get("answer"),
                            "thought": structured.get("thought", ""),
                        }
                    )
                    # 打印
                    try:
                        print(
                            f"[Round {round_index + 1}] Agent#{agent_id} ({roles[agent_id]})\n"
                            f"Argument: {str(structured.get('argument','')).strip()}\n"
                            f"Answer: {str(structured.get('answer') or '').strip()}\n"
                        )
                    except Exception:
                        pass
            # 若有外部注入的Agent，则并发调用Agent；否则走LLM批量生成
            elif state.get("agents") or self.debater_agents or self.debater_agent is not None:
                import asyncio
                tasks = []
                id_list: List[int] = []
                for agent_id in range(num_agents):
                    agents_for_ids: Optional[List[CustomizeAgent]] = state.get("agents")
                    if agents_for_ids:
                        selected_agent = agents_for_ids[agent_id]
                    elif self.debater_agents:
                        selected_agent = random.choice(self.debater_agents)
                    else:
                        selected_agent = None
                    # 根据访问模式获取相应的transcript
                    transcript_text = self._get_transcript_for_agent(
                        transcript, round_index, agent_id, transcript_mode, num_agents
                    )
                    inputs = {
                        "problem": problem,
                        "transcript_text": transcript_text,
                        "role": roles[agent_id],
                        "agent_id": str(agent_id),
                        "round_index": str(round_index + 1),
                        "total_rounds": str(num_rounds),
                    }
                    tasks.append(selected_agent(inputs=inputs))
                    id_list.append(agent_id)
                messages = await asyncio.gather(*tasks)
                for agent_id, msg in zip(id_list, messages):
                    structured = msg.content.get_structured_data()
                    transcript.append(
                        {
                            "agent_id": agent_id,
                            "round": round_index,
                            "role": roles[agent_id],
                            "argument": structured.get("argument", ""),
                            "answer": structured.get("answer"),
                            "thought": structured.get("thought", ""),
                        }
                    )
                # 即时打印本轮所有 agent 的产出（异步并发完成后逐个打印，完整内容）
                try:
                    for agent_id, msg in zip(id_list, messages):
                        st = msg.content.get_structured_data()
                        arg_full = str(st.get("argument", "")).strip()
                        ans_full = str(st.get("answer") or "").strip()
                        print(
                            f"[Round {round_index + 1}] Agent#{agent_id} ({roles[agent_id]})\n"
                            f"Argument: {arg_full}\n"
                            f"Answer: {ans_full}\n"
                        )
                except Exception:
                    pass
            else:
                prompts: List[Tuple[int, str]] = []
                for agent_id in range(num_agents):
                    # 根据访问模式获取相应的transcript
                    transcript_text = self._get_transcript_for_agent(
                        transcript, round_index, agent_id, transcript_mode, num_agents
                    )
                    prompt = build_agent_prompt(
                        problem=problem,
                        transcript_text=transcript_text,
                        role=roles[agent_id],
                        agent_id=agent_id,
                        round_index=round_index,
                        total_rounds=num_rounds,
                    )
                    prompts.append((agent_id, prompt))

                results = await self._llm.batch_generate_async(
                    batch_messages=[[{"role": "user", "content": p}] for _, p in prompts]
                )
                parsed_list = self._llm.parse_generated_texts(
                    texts=results, parser=DebateAgentOutput, parse_mode="xml"
                )
                for (agent_id, _), parsed in zip(prompts, parsed_list):
                    structured = parsed.get_structured_data()
                    transcript.append(
                        {
                            "agent_id": agent_id,
                            "round": round_index,
                            "role": roles[agent_id],
                            "argument": structured.get("argument", ""),
                            "answer": structured.get("answer"),
                            "thought": structured.get("thought", ""),
                        }
                    )
        return transcript

    def _generate_consensus(
        self, problem: str, state: dict, transcript: List[dict], judge_mode: str, pruning_info: Optional[Dict[str, Any]] = None
    ) -> dict:
        """根据 judge 模式生成最终共识（同步）。"""
        if judge_mode == "self_consistency":
            # 使用 QAScEnsemble 对各辩手最终答案做投票
            agent_final_answers = self._collect_agent_final_answers(state, transcript)
            if len(agent_final_answers) == 0:
                # 无人给出显式答案，则合并最后一轮的论据
                agent_final_answers = [t["argument"] for t in transcript if t.get("argument")]
            sc = self._sc_ensemble.execute(solutions=agent_final_answers)
            return {
                "final_answer": sc["response"],
                "winner": None,
            }

        # 默认 LLM 裁判；若外部注入 judge_agent，则优先使用
        if self.judge_agent is not None:
            roles_text = "\n".join([f"#{i}: {r}" for i, r in enumerate(state["roles"])])
            inputs = {
                "problem": problem,
                "transcript_text": format_transcript(transcript),
                "roles_text": roles_text,
            }
            # 将剪枝摘要附加给裁判（若存在 MR 建议，可以在裁判 prompt 中强调）
            if pruning_info and pruning_info.get("mr_suggested"):
                suggested = pruning_info["mr_suggested"].get("corrected", "")
                if suggested:
                    inputs["problem"] = problem + "\n\n(Consider corrected consolidation, if helpful.)"
            msg = self.judge_agent(inputs=inputs)
            jd = msg.content.get_structured_data()
        else:
            judge_prompt = build_judge_prompt(
                problem=problem,
                transcript_text=format_transcript(transcript),
                roles=state["roles"],
            )
            judge_resp = self._llm.generate(
                prompt=judge_prompt, parser=DebateJudgeOutput, parse_mode="xml"
            )
            jd = judge_resp.get_structured_data()
        
        winner_id = int(jd.get("winning_agent_id", 0))
        final_answer = jd.get("final_answer", "")
        
        # 获取获胜者的答案
        winner_answer = self._get_winner_answer(transcript, winner_id, state["num_rounds"])
        
        return {
            "final_answer": final_answer,
            "winner": winner_id,
            "winner_answer": winner_answer,
            "rationale": jd.get("rationale", ""),
        }

    async def _generate_consensus_async(
        self, problem: str, state: dict, transcript: List[dict], judge_mode: str, pruning_info: Optional[Dict[str, Any]] = None
    ) -> dict:
        """根据 judge 模式生成最终共识（异步）。"""
        if judge_mode == "self_consistency":
            agent_final_answers = self._collect_agent_final_answers(state, transcript)
            if len(agent_final_answers) == 0:
                agent_final_answers = [t["argument"] for t in transcript if t.get("argument")]
            sc = await self._sc_ensemble.async_execute(solutions=agent_final_answers)
            return {
                "final_answer": sc["response"],
                "winner": None,
            }

        if self.judge_agent is not None:
            roles_text = "\n".join([f"#{i}: {r}" for i, r in enumerate(state["roles"])])
            inputs = {
                "problem": problem,
                "transcript_text": format_transcript(transcript),
                "roles_text": roles_text,
            }
            if pruning_info and pruning_info.get("mr_suggested"):
                suggested = pruning_info["mr_suggested"].get("corrected", "")
                if suggested:
                    inputs["problem"] = problem + "\n\n(Consider corrected consolidation, if helpful.)"
            msg = await self.judge_agent(inputs=inputs)
            jd = msg.content.get_structured_data()
        else:
            judge_prompt = build_judge_prompt(
                problem=problem,
                transcript_text=format_transcript(transcript),
                roles=state["roles"],
            )
            judge_resp = await self._llm.async_generate(
                prompt=judge_prompt, parser=DebateJudgeOutput, parse_mode="xml"
            )
            jd = judge_resp.get_structured_data()
        
        winner_id = int(jd.get("winning_agent_id", 0))
        final_answer = jd.get("final_answer", "")
        
        # 获取获胜者的答案
        winner_answer = self._get_winner_answer(transcript, winner_id, state["num_rounds"])
        
        return {
            "final_answer": final_answer,
            "winner": winner_id,
            "winner_answer": winner_answer,
            "rationale": jd.get("rationale", ""),
        }

    def _collect_agent_final_answers(self, state: dict, transcript: List[dict]) -> List[str]:
        """收集每位辩手的最终答案（若有）。"""
        num_agents = state["num_agents"]
        num_rounds = state["num_rounds"]
        final_answers: List[str] = []
        for agent_id in range(num_agents):
            # 查找该辩手在最后一轮的记录
            records = [t for t in transcript if t["agent_id"] == agent_id and t["round"] == num_rounds - 1]
            if len(records) == 0:
                continue
            ans = records[-1].get("answer")
            if ans and isinstance(ans, str) and len(ans.strip()) > 0:
                final_answers.append(ans)
        return final_answers

    def _get_winner_answer(self, transcript: List[dict], winner_id: int, num_rounds: int) -> Optional[str]:
        """获取获胜者在最后一轮的答案。"""
        # 查找获胜者在最后一轮的记录
        records = [t for t in transcript if t["agent_id"] == winner_id and t["round"] == num_rounds - 1]
        if len(records) == 0:
            return None
        
        answer = records[-1].get("answer")
        if answer and isinstance(answer, str) and len(answer.strip()) > 0:
            return answer.strip()
        
        # 如果没有明确的答案，返回最后一轮的论据
        argument = records[-1].get("argument", "")
        return argument.strip() if argument else None

    def save_module(self, path: str, ignore: List[str] = [], **kwargs) -> str:
        """保存模块配置（直接保存agents，不保存llm_config_pool）"""
        # 确保目录存在
        os.makedirs(os.path.dirname(path) if os.path.dirname(path) else ".", exist_ok=True)
        
        # 保存debater agents
        agent_pool_path = path.replace('.json', '_agents.json')
        if self.debater_agents:
            agent_data = []
            for i, agent in enumerate(self.debater_agents):
                # 为每个agent创建单独的保存路径
                agent_path = agent_pool_path.replace('.json', f'_{i}.json')
                agent.save_module(agent_path)
                agent_data.append({
                    "name": agent.name,
                    "description": agent.description,
                    "file_path": agent_path
                })
            
            with open(agent_pool_path, 'w', encoding='utf-8') as f:
                json.dump(agent_data, f, ensure_ascii=False, indent=2)
        
        # 保存judge agent
        judge_agent_path = path.replace('.json', '_judge.json')
        if self.judge_agent:
            self.judge_agent.save_module(judge_agent_path)
        
        # 保存debate配置（只保存基本配置，不保存llm_config_pool）
        config = {
            "llm_config": self._serialize_llm_config(self.llm_config),
            "name": self.name,
            "description": self.description,
            "agent_pool_file": agent_pool_path if self.debater_agents else None,
            "judge_agent_file": judge_agent_path if self.judge_agent else None
        }
        
        with open(path, 'w', encoding='utf-8') as f:
            json.dump(config, f, ensure_ascii=False, indent=2)
        
        print(f"模块配置已保存到: {path}")
        return path
    
    def get_config(self) -> dict:
        """获取当前模块的配置字典（不包含llm_config_pool）"""
        config = {
            "llm_config": self._serialize_llm_config(self.llm_config),
            "name": self.name,
            "description": self.description,
        }
        
        # 序列化agent pool
        if self.debater_agents:
            agent_data = []
            for agent in self.debater_agents:
                agent_info = {
                    "name": agent.name,
                    "description": agent.description,
                    "config": agent.get_config()
                }
                agent_data.append(agent_info)
            config["debater_agents"] = agent_data
        
        # 序列化judge agent
        if self.judge_agent:
            config["judge_agent"] = {
                "name": self.judge_agent.name,
                "description": self.judge_agent.description,
                "config": self.judge_agent.get_config()
            }
        
        return config
    
    @classmethod
    def from_dict(cls, data: Dict[str, Any], **kwargs) -> 'MultiAgentDebateActionGraph':
        """从配置字典创建MultiAgentDebateActionGraph实例（不重建llm_config_pool）"""
        # 创建实例
        instance = cls()
        
        # 重建llm_config
        if data.get("llm_config"):
            instance.llm_config = instance._deserialize_llm_config(data["llm_config"])
        
        # 设置其他属性
        if data.get("name"):
            instance.name = data["name"]
        
        if data.get("description"):
            instance.description = data["description"]
        
        # 重建agent pool
        if data.get("debater_agents"):
            agents = []
            for agent_info in data["debater_agents"]:
                try:
                    agent_config = agent_info.get("config", {})
                    llm_config = instance._deserialize_llm_config(agent_config.get("llm_config"))
                    
                    # 从agent_config中移除可能重复的字段
                    agent_config_clean = {k: v for k, v in agent_config.items() 
                                        if k not in ['name', 'description', 'llm_config']}
                    
                    agent = CustomizeAgent(
                        name=agent_info["name"],
                        description=agent_info["description"],
                        llm_config=llm_config,
                        **agent_config_clean
                    )
                    agents.append(agent)
                except Exception as e:
                    print(f"警告: 重建agent {agent_info.get('name', 'unknown')}失败: {e}")
                    continue
            
            instance.debater_agents = agents
        
        # 重建judge agent
        if data.get("judge_agent"):
            try:
                judge_info = data["judge_agent"]
                judge_config = judge_info.get("config", {})
                llm_config = instance._deserialize_llm_config(judge_config.get("llm_config"))
                
                # 从judge_config中移除可能重复的字段
                judge_config_clean = {k: v for k, v in judge_config.items() 
                                    if k not in ['name', 'description', 'llm_config']}
                
                instance.judge_agent = CustomizeAgent(
                    name=judge_info["name"],
                    description=judge_info["description"],
                    llm_config=llm_config,
                    **judge_config_clean
                )
            except Exception as e:
                print(f"警告: 重建judge agent失败: {e}")
        
        return instance
    
    @classmethod
    def load_module(cls, path: str, llm_config: LLMConfig = None, **kwargs) -> 'MultiAgentDebateActionGraph':
        """从文件加载MultiAgentDebateActionGraph实例（类方法，不重建llm_config_pool）"""
        if not os.path.exists(path):
            raise FileNotFoundError(f"模块配置文件不存在: {path}")
        
        try:
            with open(path, 'r', encoding='utf-8') as f:
                config = json.load(f)
        except json.JSONDecodeError as e:
            raise ValueError(f"配置文件格式错误: {e}")
        except Exception as e:
            raise RuntimeError(f"读取配置文件失败: {e}")
        
        # 创建实例
        instance = cls()
        
        # 重建llm_config
        if config.get("llm_config"):
            try:
                instance.llm_config = instance._deserialize_llm_config(config["llm_config"])
            except Exception as e:
                print(f"警告: 重建llm_config失败: {e}")
        
        # 设置其他属性
        if config.get("name"):
            instance.name = config["name"]
        
        if config.get("description"):
            instance.description = config["description"]
        
        # 加载agent pool
        agent_pool_file = config.get("agent_pool_file")
        if agent_pool_file and os.path.exists(agent_pool_file):
            try:
                with open(agent_pool_file, 'r', encoding='utf-8') as f:
                    agent_data = json.load(f)
                
                agents = []
                for agent_info in agent_data:
                    try:
                        agent_path = agent_info.get("file_path")
                        if agent_path and os.path.exists(agent_path):
                            # 使用agent的load_module方法
                            agent = CustomizeAgent.from_file(
                                path=agent_path,
                                llm_config=instance.llm_config or llm_config
                            )
                            agents.append(agent)
                        else:
                            print(f"警告: agent文件不存在: {agent_path}")
                    except Exception as e:
                        print(f"警告: 加载agent {agent_info.get('name', 'unknown')}失败: {e}")
                        continue
                
                instance.debater_agents = agents
                print(f"从 {agent_pool_file} 加载了 {len(agents)} 个agents")
            except Exception as e:
                print(f"警告: 加载agent pool失败: {e}")
        
        # 加载judge agent
        judge_agent_file = config.get("judge_agent_file")
        if judge_agent_file and os.path.exists(judge_agent_file):
            try:
                # 使用agent的from_file方法
                instance.judge_agent = CustomizeAgent.from_file(
                    path=judge_agent_file,
                    llm_config=instance.llm_config or llm_config
                )
                print(f"从 {judge_agent_file} 加载了judge agent")
            except Exception as e:
                print(f"警告: 加载judge agent失败: {e}")
        
        print(f"从 {path} 加载了模块配置")
        return instance
    

    
    def _serialize_llm_config(self, llm_config) -> Optional[Dict[str, Any]]:
        """序列化LLM配置（只保存模型名称和基本参数）"""
        if not llm_config:
            return None
        
        config_info = {
            "model": llm_config.model if hasattr(llm_config, 'model') else None,
            "temperature": llm_config.temperature if hasattr(llm_config, 'temperature') else None,
            "config_type": type(llm_config).__name__
        }
        
        return config_info
    
    def _deserialize_llm_config(self, config_info: Optional[Dict[str, Any]]) -> Optional[LLMConfig]:
        """反序列化LLM配置（从环境变量重建）"""
        if not config_info:
            return None
        
        config_type = config_info.get("config_type", "OpenAILLMConfig")
        
        if config_type == "OpenAILLMConfig":
            from ...models.model_configs import OpenAILLMConfig
            return OpenAILLMConfig(
                model=config_info.get("model", "gpt-4o-mini"),
                openai_key=os.getenv("OPENAI_API_KEY")
            )
        elif config_type == "OpenRouterConfig":
            from ...models.model_configs import OpenRouterConfig
            return OpenRouterConfig(
                model=config_info.get("model", "meta-llama/llama-3.1-70b-instruct"),
                openrouter_key=os.getenv("OPENROUTER_API_KEY")
            )
        
        return None