Spaces:

Cheng-1
/

CodeAgent-MCP

Running

File size: 7,013 Bytes

5b9f9a3

import json
import logging
import re
from dataclasses import dataclass, field

logger = logging.getLogger(__name__)


@dataclass
class ExecutionResult:
    plan: list[dict]
    results: list[dict]
    execution_log: list[dict]
    total_tokens: int = 0


class Orchestrator:
    def __init__(self, planner, coder, reviewer, config: dict):
        self.planner = planner
        self.coder = coder
        self.reviewer = reviewer
        self.max_review_rounds = config.get("max_review_rounds", 3)
        self.review_threshold = config.get("review_threshold", 7.0)
        self.execution_log: list[dict] = []

    async def run(self, user_requirement: str) -> ExecutionResult:
        self.execution_log = []

        plan_output = await self.planner.run(user_requirement)
        tasks = self._parse_plan(plan_output)
        self._log("plan", {"raw_output": plan_output, "parsed_tasks": tasks})

        logger.info(f"[Orchestrator] Plan: {len(tasks)} tasks")

        results = []
        for i, task in enumerate(tasks):
            logger.info(f"[Orchestrator] Executing task {i+1}/{len(tasks)}: {task['description'][:60]}")
            task_result = await self._execute_task(task)
            results.append(task_result)

        total_tokens = (
            self.planner.total_tokens_used
            + self.coder.total_tokens_used
            + self.reviewer.total_tokens_used
        )

        return ExecutionResult(
            plan=tasks,
            results=results,
            execution_log=self.execution_log,
            total_tokens=total_tokens,
        )

    async def _execute_task(self, task: dict) -> dict:
        code_output = None
        review = None

        for attempt in range(self.max_review_rounds):
            await self._sync_workspace_files()

            if attempt == 0:
                coder_input = self.coder.format_input(task)
            else:
                coder_input = self.coder.format_input(task)
                coder_input += (
                    f"\n\n--- Reviewer 反馈 (得分: {review['score']}/10) ---\n"
                    f"问题: {json.dumps(review['issues'], ensure_ascii=False)}\n"
                    f"建议: {json.dumps(review['suggestions'], ensure_ascii=False)}\n"
                    f"请根据反馈修改代码。如果 workspace 已有文件，用 file_read 读取后修改再 file_write 写回。"
                )

            code_output = await self.coder.run(coder_input)
            self._log("coder", {"task_id": task.get("task_id"), "attempt": attempt, "output_preview": code_output[:500]})

            reviewer_input = self.reviewer.format_input({
                "task": task,
                "code": code_output,
            })
            review_raw = await self.reviewer.run(reviewer_input)
            review = self._parse_review(review_raw)
            self._log("reviewer", {"task_id": task.get("task_id"), "attempt": attempt, "review": review})

            logger.info(f"  [Review] Attempt {attempt+1}: score={review['score']}, passed={review['passed']}")

            if review["passed"]:
                return {
                    "task": task,
                    "code": code_output,
                    "review": review,
                    "attempts": attempt + 1,
                    "status": "completed",
                }

        return {
            "task": task,
            "code": code_output,
            "review": review,
            "attempts": self.max_review_rounds,
            "status": "max_attempts_reached",
        }

    def _parse_plan(self, plan_text: str) -> list[dict]:
        parsed = self._extract_json(plan_text)
        if parsed and "tasks" in parsed:
            return parsed["tasks"]

        tasks = []
        lines = plan_text.strip().split("\n")
        for i, line in enumerate(lines):
            line = line.strip()
            if re.match(r'^[\d]+[.)\-]', line):
                desc = re.sub(r'^[\d]+[.)\-]\s*', '', line)
                tasks.append({"task_id": f"T{i+1}", "description": desc, "dependencies": []})

        if not tasks:
            tasks = [{"task_id": "T1", "description": plan_text, "dependencies": []}]

        return tasks

    def _parse_review(self, review_text: str) -> dict:
        parsed = self._extract_json(review_text)
        if parsed and "score" in parsed:
            parsed.setdefault("passed", parsed["score"] >= self.review_threshold)
            parsed.setdefault("issues", [])
            parsed.setdefault("suggestions", [])
            parsed.setdefault("summary", "")
            return parsed

        score_match = re.search(r'(\d+\.?\d*)\s*/\s*10', review_text)
        score = float(score_match.group(1)) if score_match else 5.0

        return {
            "score": score,
            "passed": score >= self.review_threshold,
            "issues": [],
            "suggestions": [],
            "summary": review_text[:200],
        }

    def _extract_json(self, text: str) -> dict | None:
        if "```json" in text:
            match = re.search(r'```json\s*(.*?)```', text, re.DOTALL)
            if match:
                try:
                    return json.loads(match.group(1).strip())
                except json.JSONDecodeError:
                    pass
        if "```" in text:
            match = re.search(r'```\s*(.*?)```', text, re.DOTALL)
            if match:
                try:
                    return json.loads(match.group(1).strip())
                except json.JSONDecodeError:
                    pass
        try:
            return json.loads(text)
        except json.JSONDecodeError:
            pass
        match = re.search(r'\{[^{}]*(?:\{[^{}]*\}[^{}]*)*\}', text, re.DOTALL)
        if match:
            try:
                return json.loads(match.group())
            except json.JSONDecodeError:
                pass
        return None

    async def _sync_workspace_files(self):
        if not hasattr(self.coder, 'set_workspace_files'):
            return
        if not self.coder.mcp:
            return
        try:
            result = await self.coder.mcp.call_tool("file_list", {"directory": "."})
            text = str(result)
            if text == "(empty directory)" or text.startswith("Error"):
                self.coder.set_workspace_files([])
                return
            files = []
            for line in text.split('\n'):
                line = line.strip()
                if not line or line.endswith('/'):
                    continue
                name = re.sub(r'\s*\(\d+B\)\s*$', '', line)
                if name:
                    files.append(name)
            self.coder.set_workspace_files(files)
            logger.info(f"[Orchestrator] Workspace files: {files}")
        except Exception as e:
            logger.debug(f"[Orchestrator] Could not list workspace: {e}")
            self.coder.set_workspace_files([])

    def _log(self, stage: str, data: dict):
        self.execution_log.append({"stage": stage, **data})