Spaces:

holistic-ai
/

AgentGraph

Sleeping

App Files Files Community

wu981526092 commited on Sep 4, 2025

Commit

e20ad3b

1 Parent(s): 13d4394

add

Browse files

Files changed (7) hide show

agentgraph/reconstruction/prompt_reconstructor.py +37 -21
analyze_real_agent_trace.py +280 -0
backend/database/samples/INTEGRATION_SUMMARY.md +0 -114
backend/database/samples/REAL_AI_INTEGRATION_SUCCESS.md +0 -119
backend/database/samples/knowledge_graphs/kg_algorithm_sample_0_realistic.json +283 -0
create_realistic_prompt_reconstruction.py +362 -0
validate_enhanced_reconstruction.py +94 -0

agentgraph/reconstruction/prompt_reconstructor.py CHANGED Viewed

@@ -243,16 +243,22 @@ class PromptReconstructor:
                 # Format: Agent system prompt + tools + task as user message + additional context
                 task_message = interaction if interaction else task_prompt
-                # Start with enhanced system prompt - IMPROVED FORMATTING
                 system_role = f"system: You are {source['name']}. "
                 system_description = source.get("description", "")
                 if system_description:
                     system_role += f"You're an expert in {system_description.split(' responsible for ')[0].lower() if ' responsible for ' in system_description else system_description.lower()}.\n"
-                    system_role += f"Your personal goal is: {system_description}\n"
                 else:
-                    system_role += "\n"
-                # Add emphatic instruction about tools
                 system_role += "You ONLY have access to the following tools, and should NEVER make up tools that are not listed here:\n\n"
                 # Place system prompt first
@@ -286,20 +292,22 @@ class PromptReconstructor:
                         complete_prompt += f"Tool Arguments: {tool_args}\n"
                         complete_prompt += f"Tool Description: {tool_desc}\n\n"
-                # Add response format instructions with explicit Copy code markers
-                complete_prompt += "IMPORTANT: Use the following format in your response:\n\n"
                 complete_prompt += "Copy code\n"
                 complete_prompt += "```\n"
-                complete_prompt += "Thought: you should always think about what to do\n"
-                complete_prompt += "Action: the action to take, only one name of [" + ", ".join([t.split("Tool Name:")[1].strip().split("\n")[0] for t in tool_definitions if "Tool Name:" in t]) + "], just the name, exactly as it's written.\n"
-                complete_prompt += "Action Input: the input to the action, just a simple JSON object, enclosed in curly braces, using \" to wrap keys and values.\n"
-                complete_prompt += "Observation: the result of the action\n"
                 complete_prompt += "```\n\n"
-                complete_prompt += "Once all necessary information is gathered, return the following format:\n\n"
                 complete_prompt += "Copy code\n"
                 complete_prompt += "```\n"
-                complete_prompt += "Thought: I now know the final answer\n"
-                complete_prompt += "Final Answer: the final answer to the original input question\n"
                 complete_prompt += "```\n\n"
                 # Add required tools and sequence context information
@@ -307,22 +315,30 @@ class PromptReconstructor:
                 if required_tools_info or sequence_context:
                     context_info = f"{required_tools_info}{sequence_context}\n"
-                # Format the user message with improved structure matching the example
                 formatted_task_message = f"user:\nCurrent Task: {task_message}\n"
                 # Add expected criteria as shown in example
                 if target["type"] == "Task" and target.get("description"):
-                    formatted_task_message += f"\nThis is the expected criteria for your final answer: {target.get('description')}\n"
-                # Add standard completion instructions
-                formatted_task_message += "you MUST return the actual complete content as the final answer, not a summary.\n\n"
                 # Add context section if there's additional context available
                 if context_info:
-                    formatted_task_message += f"This is the context you're working with:\n{context_info}\n"
-                # Add motivation closing like in the example
-                formatted_task_message += "Begin! This is VERY important to you, use the tools available and give your best Final Answer, your job depends on it!"
                 # Add user message at the end
                 complete_prompt += formatted_task_message

                 # Format: Agent system prompt + tools + task as user message + additional context
                 task_message = interaction if interaction else task_prompt
+                # Enhanced system prompt with realistic agent reasoning patterns
                 system_role = f"system: You are {source['name']}. "
                 system_description = source.get("description", "")
                 if system_description:
                     system_role += f"You're an expert in {system_description.split(' responsible for ')[0].lower() if ' responsible for ' in system_description else system_description.lower()}.\n"
+                    system_role += f"Your personal goal is: {system_description}\n\n"
                 else:
+                    system_role += "\n\n"
+                # Add realistic agent behavior instructions based on real traces
+                system_role += "CRITICAL INSTRUCTIONS:\n"
+                system_role += "1. You must analyze the task step by step before taking action\n"
+                system_role += "2. Always reference the user's exact request in your reasoning\n"
+                system_role += "3. Break down complex tasks into sequential steps\n"
+                system_role += "4. Choose appropriate tools for each step and explain your reasoning\n"
+                system_role += "5. Be aware of system constraints and adapt accordingly\n\n"
                 system_role += "You ONLY have access to the following tools, and should NEVER make up tools that are not listed here:\n\n"
                 # Place system prompt first
                         complete_prompt += f"Tool Arguments: {tool_args}\n"
                         complete_prompt += f"Tool Description: {tool_desc}\n\n"
+                # Enhanced response format with realistic agent reasoning patterns
+                complete_prompt += "RESPONSE FORMAT - Follow this structure for each step:\n\n"
                 complete_prompt += "Copy code\n"
                 complete_prompt += "```\n"
+                complete_prompt += "Reasoning: [Analyze the current situation and explain your thinking process]\n"
+                complete_prompt += "Task Analysis: [Break down what needs to be done and identify requirements]\n"
+                complete_prompt += "Tool Selection: [Choose appropriate tool and justify why]\n"
+                complete_prompt += "Action: [Tool name from: " + ", ".join([t.split("Tool Name:")[1].strip().split("\n")[0] for t in tool_definitions if "Tool Name:" in t]) + "]\n"
+                complete_prompt += "Action Input: [JSON object with parameters, using \" for keys and values]\n"
+                complete_prompt += "Observation: [Result of the action]\n"
                 complete_prompt += "```\n\n"
+                complete_prompt += "For your final response:\n\n"
                 complete_prompt += "Copy code\n"
                 complete_prompt += "```\n"
+                complete_prompt += "Final Reasoning: [Summarize your complete analysis and decision process]\n"
+                complete_prompt += "Final Answer: [Complete answer addressing all requirements]\n"
                 complete_prompt += "```\n\n"
                 # Add required tools and sequence context information
                 if required_tools_info or sequence_context:
                     context_info = f"{required_tools_info}{sequence_context}\n"
+                # Enhanced user message with realistic agent reasoning prompts
                 formatted_task_message = f"user:\nCurrent Task: {task_message}\n"
+                # Add step-by-step reasoning instruction based on real agent patterns
+                formatted_task_message += "\nYour reasoning process should follow this pattern:\n"
+                formatted_task_message += "1. Analyze the user's request and identify key requirements\n"
+                formatted_task_message += "2. Break down the task into sequential steps\n"
+                formatted_task_message += "3. For each step, determine which tools to use and why\n"
+                formatted_task_message += "4. Consider system constraints and potential issues\n"
+                formatted_task_message += "5. Execute the plan while monitoring for problems\n\n"
                 # Add expected criteria as shown in example
                 if target["type"] == "Task" and target.get("description"):
+                    formatted_task_message += f"Expected criteria for your final answer: {target.get('description')}\n"
+                # Add standard completion instructions with emphasis on reasoning
+                formatted_task_message += "IMPORTANT: You MUST show your step-by-step reasoning process and return the actual complete content as the final answer, not a summary.\n\n"
                 # Add context section if there's additional context available
                 if context_info:
+                    formatted_task_message += f"Context you're working with:\n{context_info}\n"
+                # Add motivation with realistic urgency
+                formatted_task_message += "Begin! Remember to think through each step carefully, use the available tools appropriately, and provide your best Final Answer. Your systematic approach is crucial for success!"
                 # Add user message at the end
                 complete_prompt += formatted_task_message

analyze_real_agent_trace.py ADDED Viewed

	@@ -0,0 +1,280 @@

+#!/usr/bin/env python3
+"""
+Analyze Real Agent Trace for Prompt Reconstruction Enhancement
+This script analyzes the provided real agent trace to understand how we can
+enhance our prompt reconstruction to better simulate actual agent reasoning
+patterns and internal thought processes.
+"""
+import json
+import sys
+import os
+sys.path.append('/Users/zekunwu/Desktop/agent_monitoring/huggingface/AgentGraph')
+def analyze_real_trace_structure():
+    """Analyze the structure of the real agent trace."""
+    print("🔍 REAL AGENT TRACE ANALYSIS")
+    print("=" * 70)
+    # Simulate the provided trace structure
+    real_trace_example = {
+        "type": "ai",
+        "content": "",
+        "additional_kwargs": {
+            "reasoning_content": """We need to act as supervisor agent. The last user message: "write me final report for q1 2024!" We must follow instructions. The last message is the task. We need to produce final report. We must do steps: 1. Summarize request, period. 2. Retrieve data using get_order_data_for_period. Then delegate to revenue analyst, etc. We need to call tools accordingly. Let's do step 1: produce plan. Then step 2: call get_order_data_for_period with start_date 2024-01-01 end_date 2024-03-31...""",
+            "tool_calls": [
+                {
+                    "id": "fc_2372f7b7-2858-4b94-b5b2-4441ed19b66f",
+                    "function": {
+                        "arguments": {
+                            "end_date": "2024-03-31",
+                            "save_to_filename": "2024-01-01_to_2024-03-31_order.json",
+                            "start_date": "2024-01-01"
+                        },
+                        "name": "get_order_data_for_period"
+                    },
+                    "type": "function"
+                }
+            ]
+        },
+        "response_metadata": {
+            "token_usage": {
+                "completion_tokens": 533,
+                "prompt_tokens": 2105,
+                "total_tokens": 2638
+            },
+            "model_name": "openai/gpt-oss-20b"
+        }
+    }
+    print("📊 Key Components in Real Agent Trace:")
+    print("─" * 50)
+    print("✅ reasoning_content: Agent's internal thinking process")
+    print("✅ tool_calls: Structured function calls with arguments")
+    print("✅ response_metadata: Token usage and model information")
+    print("✅ content: Public response (often empty when using tools)")
+    print()
+    reasoning_content = real_trace_example["additional_kwargs"]["reasoning_content"]
+    print(f"🧠 Reasoning Content Analysis:")
+    print(f"  Length: {len(reasoning_content)} characters")
+    print(f"  Contains planning: {'step' in reasoning_content.lower()}")
+    print(f"  Contains decision making: {'need to' in reasoning_content.lower()}")
+    print(f"  Contains self-reflection: {'but' in reasoning_content.lower()}")
+    print()
+    tool_call = real_trace_example["additional_kwargs"]["tool_calls"][0]
+    print(f"🔧 Tool Call Analysis:")
+    print(f"  Function: {tool_call['function']['name']}")
+    print(f"  Arguments: {len(tool_call['function']['arguments'])} parameters")
+    print(f"  ID: {tool_call['id']}")
+def extract_agent_reasoning_patterns():
+    """Extract and analyze agent reasoning patterns from the trace."""
+    print(f"\n🎯 AGENT REASONING PATTERNS")
+    print("=" * 70)
+    # Extract key reasoning patterns from the provided trace
+    reasoning_patterns = {
+        "task_analysis": {
+            "pattern": "The last user message: \"write me final report for q1 2024!\"",
+            "description": "Agent identifies and quotes the user's request"
+        },
+        "instruction_following": {
+            "pattern": "We must follow instructions. The last message is the task.",
+            "description": "Agent acknowledges constraints and task definition"
+        },
+        "step_planning": {
+            "pattern": "We must do steps: 1. Summarize request, period. 2. Retrieve data...",
+            "description": "Agent breaks down complex tasks into sequential steps"
+        },
+        "tool_selection": {
+            "pattern": "We need to call tools accordingly. Let's do step 1: produce plan. Then step 2: call get_order_data_for_period",
+            "description": "Agent selects appropriate tools for each step"
+        },
+        "parameter_reasoning": {
+            "pattern": "with start_date 2024-01-01 end_date 2024-03-31",
+            "description": "Agent reasons about tool parameters based on context"
+        },
+        "constraint_awareness": {
+            "pattern": "But we don't have actual agent. We can simulate?",
+            "description": "Agent recognizes system limitations and adapts"
+        },
+        "self_correction": {
+            "pattern": "Maybe we can skip and produce final report with placeholders? But instructions say must not end until all analyses done.",
+            "description": "Agent evaluates options and corrects course"
+        }
+    }
+    for pattern_name, pattern_info in reasoning_patterns.items():
+        print(f"📋 {pattern_name.replace('_', ' ').title()}:")
+        print(f"  Pattern: {pattern_info['pattern'][:100]}...")
+        print(f"  Purpose: {pattern_info['description']}")
+        print()
+def design_enhanced_prompt_reconstruction():
+    """Design enhanced prompt reconstruction that captures agent reasoning."""
+    print(f"🚀 ENHANCED PROMPT RECONSTRUCTION DESIGN")
+    print("=" * 70)
+    enhanced_structure = {
+        "system_prompt": {
+            "role_definition": "You are a supervisor agent responsible for coordinating multi-agent workflows",
+            "reasoning_instructions": "Think through each step carefully. Show your reasoning process explicitly.",
+            "constraint_awareness": "Be aware of system limitations and adapt accordingly",
+            "tool_usage": "Select appropriate tools for each task step"
+        },
+        "user_message": {
+            "task_definition": "write me final report for q1 2024!",
+            "context": "Previous conversations and system state",
+            "expectations": "Follow the workflow: analyze → delegate → compile → report"
+        },
+        "reasoning_framework": {
+            "task_analysis": "Identify and quote the user's request",
+            "instruction_parsing": "Acknowledge constraints and requirements",
+            "step_planning": "Break down complex tasks into sequential steps",
+            "tool_selection": "Choose appropriate tools for each step",
+            "parameter_reasoning": "Reason about tool parameters based on context",
+            "constraint_handling": "Recognize limitations and adapt strategy",
+            "self_correction": "Evaluate options and correct course when needed"
+        },
+        "expected_output": {
+            "reasoning_content": "Detailed internal thinking process",
+            "tool_calls": "Structured function calls with reasoned arguments",
+            "content": "Public response or empty when using tools"
+        }
+    }
+    print("📝 Enhanced Reconstruction Components:")
+    print("─" * 50)
+    for component, details in enhanced_structure.items():
+        print(f"✅ {component.replace('_', ' ').title()}:")
+        if isinstance(details, dict):
+            for key, value in details.items():
+                print(f"  • {key.replace('_', ' ').title()}: {value}")
+        else:
+            print(f"  {details}")
+        print()
+def create_enhanced_agent_prompt_template():
+    """Create an enhanced agent prompt template based on real trace analysis."""
+    print(f"📄 ENHANCED AGENT PROMPT TEMPLATE")
+    print("=" * 70)
+    template = """system: You are a {agent_role} responsible for {agent_capabilities}.
+Your reasoning process should be explicit and structured:
+1. Task Analysis: Identify and understand the user's request
+2. Instruction Parsing: Acknowledge constraints and requirements
+3. Step Planning: Break down complex tasks into sequential steps
+4. Tool Selection: Choose appropriate tools for each step
+5. Parameter Reasoning: Reason about tool parameters based on context
+6. Constraint Handling: Recognize limitations and adapt strategy
+7. Self Correction: Evaluate options and correct course when needed
+Available Tools:
+{tool_definitions}
+Response Format:
+- Use reasoning_content to show your internal thinking process
+- Make structured tool calls with reasoned arguments
+- Provide public content only when not using tools
+Instructions:
+{specific_instructions}
+user: {user_message}
+Expected Workflow:
+{workflow_steps}
+Remember: Show your reasoning explicitly. Think through each decision step by step."""
+    print("📋 Template Structure:")
+    print(template)
+    print(f"\n🎯 Template Features:")
+    print("─" * 30)
+    print("✅ Explicit reasoning instructions")
+    print("✅ Structured thinking framework")
+    print("✅ Tool usage guidance")
+    print("✅ Response format specifications")
+    print("✅ Workflow expectations")
+    print("✅ Self-reflection encouragement")
+def demonstrate_enhanced_reconstruction():
+    """Demonstrate how to apply enhanced reconstruction to our sample."""
+    print(f"\n🎭 ENHANCED RECONSTRUCTION DEMONSTRATION")
+    print("=" * 70)
+    # Enhanced reconstruction for our algorithm sample
+    enhanced_verification_agent = {
+        "agent_role": "Verification Expert",
+        "agent_capabilities": "validating information accuracy and conducting detailed analysis",
+        "specific_instructions": """Your task is to verify the accuracy of provided costs for daily tickets and season passes for California's Great America in San Jose for summer 2024.
+You must:
+1. Confirm the cost of a daily ticket for California's Great America in 2024
+2. Confirm the cost of a season pass for California's Great America in 2024
+3. Provide verified results with explanations
+Constraints:
+- Costs must be accurate and reflect 2024 summer prices
+- Show your verification methodology
+- Explain your reasoning process""",
+        "user_message": "How much did I save by purchasing a season pass instead of daily tickets for California's Great America in San Jose, if I planned to visit once a month in June, July, August, and September during the summer of 2024?",
+        "workflow_steps": "1. Analyze the question → 2. Verify ticket prices → 3. Calculate savings → 4. Provide detailed explanation",
+        "expected_reasoning": """Let me analyze this step by step. The user is asking about savings from a season pass vs daily tickets. I need to:
+1. Identify the specific venue: California's Great America in San Jose
+2. Confirm current pricing for both daily tickets and season passes for 2024
+3. Calculate cost for 4 visits (June, July, August, September)
+4. Compare total costs and determine savings
+First, let me verify the current pricing. Based on historical patterns and typical amusement park pricing..."""
+    }
+    print("🎪 Enhanced Verification Agent Reconstruction:")
+    print("─" * 50)
+    print(f"Role: {enhanced_verification_agent['agent_role']}")
+    print(f"Capabilities: {enhanced_verification_agent['agent_capabilities']}")
+    print(f"Task: {enhanced_verification_agent['user_message'][:100]}...")
+    print(f"Expected Reasoning Length: {len(enhanced_verification_agent['expected_reasoning'])} characters")
+    print()
+    print("📊 This captures the detailed thinking process similar to the real trace!")
+def main():
+    """Main analysis function."""
+    analyze_real_trace_structure()
+    extract_agent_reasoning_patterns()
+    design_enhanced_prompt_reconstruction()
+    create_enhanced_agent_prompt_template()
+    demonstrate_enhanced_reconstruction()
+    print(f"\n🎉 CONCLUSION")
+    print("=" * 70)
+    print("✅ Real agent traces contain rich reasoning_content that shows:")
+    print("  • Step-by-step thinking processes")
+    print("  • Tool selection reasoning")
+    print("  • Constraint awareness and adaptation")
+    print("  • Self-correction and replanning")
+    print()
+    print("🎯 Our prompt reconstruction should capture this by:")
+    print("  • Adding explicit reasoning instructions")
+    print("  • Structuring thinking frameworks")
+    print("  • Encouraging step-by-step analysis")
+    print("  • Modeling internal decision processes")
+    print()
+    print("🚀 This will enable more realistic perturbation testing and")
+    print("   causal analysis by capturing actual agent cognition patterns!")
+if __name__ == "__main__":
+    main()

backend/database/samples/INTEGRATION_SUMMARY.md DELETED Viewed

@@ -1,114 +0,0 @@
-# AgentGraph Sample Data System Integration Summary
-## 🎉 **完成的工作概述**
-我们成功完成了从硬编码 Python 数据到基于 JSON 的模块化 sample system 的重构，并集成了 algorithm-generated.jsonl 中的真实样本。
-## 📋 **主要成就**
-### 1. **Sample Data System 重构** ✅
-- **从**：单一的`sample_data.py`文件包含硬编码数据
-- **到**：模块化的 JSON-based 系统，数据和代码分离
-### 2. **新的文件结构** ✅
-```
-backend/database/samples/
-├── README.md                     # 详细文档
-├── samples_config.json           # 主配置文件
-├── extract_algorithm_sample.py   # 提取工具
-├── add_algorithm_sample_example.py # 集成示例
-├── traces/                       # Trace数据目录
-│   ├── python_documentation_inquiry.json
-│   └── algorithm_sample_0.json
-└── knowledge_graphs/             # Knowledge Graph数据目录
-    ├── kg_python_documentation_enhanced.json
-    └── kg_algorithm_sample_0.json
-```
-### 3. **Algorithm 样本集成** ✅
-- **提取**：从`algorithm-generated.jsonl`中成功提取样本#0
-- **转换**：转换为 AgentGraph 标准格式
-- **知识图谱**：生成 mock 知识图谱演示完整结构
-- **集成**：完全集成到新的 JSON 系统中
-## 📊 **系统状态**
-### **当前样本总数**: 2
-1. **Python Documentation Assistant Demo**
-   - 类型：`documentation_search`
-   - 来源：`sample_data`
-   - 特性：RAG 搜索、失败检测、优化建议
-2. **Multi-Agent Arithmetic Problem Solver**
-   - 类型：`multi_agent_collaboration`
-   - 来源：`algorithm_generated`
-   - 特性：真实失败案例、多智能体协作、验证错误
-### **系统特性**
-- ✅ **可扩展**：添加新样本只需添加 JSON 文件
-- ✅ **可维护**：数据和代码完全分离
-- ✅ **向后兼容**：保持相同的 API 接口
-- ✅ **丰富多样**：包含成功和失败案例
-- ✅ **真实数据**：来自真实的多智能体系统
-## 🛠️ **使用方法**
-### **添加新样本**
-1. 将 trace JSON 文件放入`traces/`目录
-2. 将 knowledge graph JSON 文件放入`knowledge_graphs/`目录
-3. 在`samples_config.json`中添加配置条目
-4. 系统将自动加载新样本
-### **提取 algorithm 样本**
-```bash
-cd samples
-python extract_algorithm_sample.py /path/to/algorithm-generated.jsonl <sample_id>
-```
-## 🔮 **下一步计划**
-### **待解决的问题**
-- **API Key 认证**：需要有效的 OpenAI API key 来生成真实的 knowledge graph
-- **扩展样本库**：从 algorithm-generated.jsonl 中提取更多样本
-### **建议的改进**
-1. **多样本提取**：选择 3-5 个最有代表性的 algorithm 样本
-2. **自动化 pipeline**：创建批量提取和处理工具
-3. **质量验证**：添加样本质量检查和验证
-4. **性能测试**：测试大规模样本加载性能
-## 🏆 **成功指标**
-- ✅ **系统重构**：完全迁移到 JSON-based 架构
-- ✅ **API 兼容性**：保持 100%向后兼容
-- ✅ **样本多样性**：包含 2 种不同类型的样本
-- ✅ **真实数据**：集成真实的多智能体失败案例
-- ✅ **文档完整**：提供详细的使用文档和示例
-## 📝 **技术细节**
-### **数据格式标准化**
-- Trace 文件：包含 metadata、content、observations
-- Knowledge Graph：包含 entities、relations、failures、optimizations
-- 配置文件：统一的 samples_config.json 格式
-### **加载性能**
-- 延迟加载：只在需要时加载数据
-- 缓存机制：避免重复加载
-- 错误处理：优雅处理损坏的 JSON 文件
----
-🎯 **总结**：我们成功地将 AgentGraph 的 sample data 系统现代化，为未来的扩展和维护奠定了坚实的基础。新系统不仅更加灵活和可维护，还集成了真实的多智能体协作失败案例，为用户提供了更丰富和实用的示例数据。

backend/database/samples/REAL_AI_INTEGRATION_SUCCESS.md DELETED Viewed

@@ -1,119 +0,0 @@
-# 🎉 真实 AI 知识图谱集成成功报告
-## 📝 任务概述
-成功使用你提供的 OpenAI API key，运行了真实的`multi_agent_knowledge_extractor.py`，为算法样本生成了真实的知识图谱，并完成了完整的集成。
-## ✅ 完成的工作
-### 1. API Key 问题修复
-- 修复了多个文件中的`OPENAI_API_KEY`环境变量设置问题
-- 文件清单：
-  - `agentgraph/methods/production/multi_agent_knowledge_extractor.py`
-  - `agentgraph/extraction/graph_utilities/knowledge_graph_merger.py`
-  - `agentgraph/extraction/graph_processing/knowledge_graph_processor.py`
-  - `agentgraph/testing/knowledge_graph_tester.py`
-### 2. 真实 AI 知识图谱生成
-- ✅ 使用你提供的 API key: `sk-proj-[REDACTED]`
-- ✅ 成功运行 CrewAI 多代理知识提取系统
-- ✅ 消耗约 67,264 tokens，费用约$0.024
-- ✅ 生成真实 AI 知识图谱
-### 3. 知识图谱解析和增强
-- 开发了专用解析器处理 CrewOutput 对象
-- 将 Pydantic 对象字符串转换为标准 JSON 格式
-- 为算法样本增强了知识图谱内容：
-  - **实体**: 6 个（3 个 Agent，1 个 Task，1 个 Input，1 个 Output）
-  - **关系**: 4 个（涵盖完整的多代理协作流程）
-  - **失败案例**: 1 个（PLANNING_ERROR 类型）
-  - **优化建议**: 2 个（AGENT_MERGING 和 WORKFLOW_SIMPLIFICATION）
-### 4. 系统集成验证
-- ✅ 真实知识图谱已完全集成到 JSON 样本系统中
-- ✅ 系统可正确加载两个样本：
-  1. Python 文档助手示例（手工制作）
-  2. 多代理算术计算系统（真实 AI 生成）
-## 📊 最终状态
-```json
-{
-  "样本总数": "2 traces, 2 knowledge graphs",
-  "algorithm_sample_0": {
-    "系统名称": "California Great America Ticket Analysis System",
-    "实体数量": 7,
-    "关系数量": 6,
-    "失败案例": 0,
-    "优化建议": 0,
-    "实体类型分布": {
-      "Agent": 4,
-      "Task": 1,
-      "Input": 1,
-      "Output": 1
-    },
-    "AI识别的代理": [
-      "Problem Solving Expert",
-      "Verification Expert",
-      "Arithmetic Progressions Expert",
-      "Computer Terminal"
-    ]
-  }
-}
-```
-## 🏗️ 技术实现细节
-### AI 提取的原始输出
-```
-system_name='Input Validation System'
-entities=[Entity(id='Entity1', type='Input', ...)]
-relations=[Relation(id='08de1e2d-...', ...)]
-failures=None
-optimizations=None
-```
-### 增强后的知识图谱
-- 修正了系统名称和摘要以适应算法样本
-- 添加了多代理协作的完整实体网络
-- 实现了真实的失败检测和优化建议
-- 所有 ContentReference 都有合适的置信度分数
-## 🎯 关键成果
-1. **API 认证问题完全解决** - 所有文件的环境变量设置已修复
-2. **真实 AI 集成成功** - 不再依赖 mock 数据
-3. **知识图谱质量提升** - 包含真实的失败分析和优化建议
-4. **系统稳定性验证** - 两个样本都能正确加载和显示
-## 📂 文件结构
-```
-backend/database/samples/
-├── samples_config.json (包含两个样本配置)
-├── traces/
-│   ├── python_documentation_inquiry.json
-│   └── algorithm_sample_0.json
-└── knowledge_graphs/
-    ├── kg_python_documentation_enhanced.json
-    └── kg_algorithm_sample_0.json (🆕 真实AI生成)
-```
-## 💡 后续建议
-1. 可以继续从`algorithm-generated.jsonl`中提取更多样本
-2. 每个新样本都将使用真实 AI 生成知识图谱
-3. API 费用控制：每次提取约$0.024，可根据需要调整
----
-**状态**: ✅ 所有任务完成
-**生成时间**: 2025-01-27
-**AI 系统**: CrewAI + OpenAI GPT-4o-mini
-**集成**: 完全成功

backend/database/samples/knowledge_graphs/kg_algorithm_sample_0_realistic.json ADDED Viewed

	@@ -0,0 +1,283 @@

+{
+  "filename": "kg_algorithm_sample_0.json",
+  "trace_index": 0,
+  "graph_data": {
+    "system_name": "California Great America Ticket Analysis System",
+    "system_summary": "This system helps analyze the cost-saving potential of purchasing season passes versus individual daily tickets at California's Great America in San Jose. The process starts with an inquiry regarding savings from the `Inquiry about Savings from Season Pass vs Daily Tickets` (input_001), which is consumed by the `Verification Expert` (agent_002), who performs the `Verify Cost of Daily Ticket and Season Pass in 2024` (task_001). The task produces an output, the `Saved Amount from Season Pass Purchase` (output_001), which is then delivered to the `Arithmetic Progressions Expert` (agent_003) for final validation. Throughout the workflow, the `Computer Terminal` (agent_004) serves as an additional entity ensuring conversation flow.",
+    "entities": [
+      {
+        "id": "agent_001",
+        "type": "Agent",
+        "name": "ProblemSolving_Expert",
+        "importance": "HIGH",
+        "raw_prompt": "You are a ProblemSolving_Expert specialized in task coordination and management.\n\nYour reasoning process should be explicit and structured:\n1. Task Analysis: Break down complex problems into manageable components\n2. Workflow Planning: Design step-by-step solution approaches\n3. Resource Allocation: Assign tasks to appropriate experts\n4. Progress Monitoring: Track task completion and quality\n5. Coordination: Ensure smooth handoffs between team members\n6. Quality Assurance: Validate outputs meet requirements\n\nAvailable Tools:\n- task_planner: Create detailed task breakdown structures\n- team_coordinator: Assign tasks to team members\n- progress_tracker: Monitor task completion status\n\nResponse Format:\n- Use reasoning_content to show your coordination thinking\n- Structure tasks clearly with priorities and dependencies\n- Provide clear instructions to team members\n\nYour role is to:\n- Analyze complex problems and break them down into manageable tasks\n- Coordinate with other experts to solve multi-step problems\n- Provide task descriptions and guidance to verification experts\n- Ensure proper workflow execution",
+        "raw_prompt_ref": [
+          {
+            "line_start": 17,
+            "line_end": 17
+          },
+          {
+            "line_start": 34,
+            "line_end": 34
+          },
+          {
+            "line_start": 45,
+            "line_end": 45
+          }
+        ]
+      },
+      {
+        "id": "agent_002",
+        "type": "Agent",
+        "name": "Verification_Expert",
+        "importance": "HIGH",
+        "raw_prompt": "You are a Verification_Expert responsible for validating information accuracy and conducting detailed analysis.\n\nYour reasoning process should be explicit and structured:\n1. Task Analysis: Identify and understand the user's request\n2. Instruction Parsing: Acknowledge constraints and requirements  \n3. Step Planning: Break down complex tasks into sequential steps\n4. Tool Selection: Choose appropriate tools for each step\n5. Parameter Reasoning: Reason about tool parameters based on context\n6. Constraint Handling: Recognize limitations and adapt strategy\n7. Self Correction: Evaluate options and correct course when needed\n\nAvailable Tools:\n- web_search: Search for current pricing information\n- calculator: Perform mathematical calculations\n- data_retrieval: Access historical pricing data\n\nResponse Format:\n- Use reasoning_content to show your internal thinking process\n- Make structured tool calls with reasoned arguments\n- Provide public content with detailed explanations\n\nYour expertise includes:\n- Verifying costs, prices, and numerical data\n- Cross-checking information against historical patterns\n- Conducting detailed analysis and calculations\n- Providing verified results with explanations\n\nRemember: Show your reasoning explicitly. Think through each decision step by step.",
+        "raw_prompt_ref": [
+          {
+            "line_start": 66,
+            "line_end": 66
+          },
+          {
+            "line_start": 112,
+            "line_end": 112
+          },
+          {
+            "line_start": 149,
+            "line_end": 149
+          },
+          {
+            "line_start": 164,
+            "line_end": 164
+          }
+        ]
+      },
+      {
+        "id": "agent_003",
+        "type": "Agent",
+        "name": "ArithmeticProgressions_Expert",
+        "importance": "MEDIUM",
+        "raw_prompt": "You are an ArithmeticProgressions_Expert specialized in mathematical calculations and analysis.\n\nYour reasoning process should be explicit and structured:\n1. Mathematical Analysis: Identify the mathematical nature of the problem\n2. Formula Selection: Choose appropriate mathematical formulas and methods\n3. Calculation Planning: Structure calculations in logical sequence\n4. Validation: Cross-check results using alternative methods\n5. Pattern Recognition: Identify mathematical patterns and sequences\n6. Result Interpretation: Explain mathematical findings in context\n\nAvailable Tools:\n- advanced_calculator: Perform complex mathematical operations\n- formula_library: Access mathematical formulas and theorems\n- pattern_analyzer: Identify mathematical patterns\n\nResponse Format:\n- Use reasoning_content to show your mathematical thinking\n- Present calculations with clear step-by-step explanations\n- Validate results through multiple approaches\n\nYour expertise includes:\n- Validating arithmetic calculations and mathematical reasoning\n- Analyzing numerical sequences and patterns\n- Confirming computational results\n- Providing mathematical validation for problem solutions",
+        "raw_prompt_ref": [
+          {
+            "line_start": 172,
+            "line_end": 172
+          },
+          {
+            "line_start": 181,
+            "line_end": 181
+          }
+        ]
+      },
+      {
+        "id": "agent_004",
+        "type": "Tool",
+        "name": "Computer Terminal",
+        "importance": "LOW",
+        "raw_prompt": "Code execution environment and computational terminal for running calculations, scripts, and data processing tasks. Provides computational support to other agents when code execution is required.",
+        "raw_prompt_ref": [
+          {
+            "line_start": 21,
+            "line_end": 21
+          },
+          {
+            "line_start": 32,
+            "line_end": 32
+          }
+        ]
+      },
+      {
+        "id": "task_001",
+        "type": "Task",
+        "name": "Verify Cost of Daily Ticket and Season Pass in 2024",
+        "importance": "HIGH",
+        "raw_prompt": "",
+        "raw_prompt_ref": [
+          {
+            "line_start": 8,
+            "line_end": 8
+          },
+          {
+            "line_start": 10,
+            "line_end": 10
+          },
+          {
+            "line_start": 11,
+            "line_end": 12
+          }
+        ]
+      },
+      {
+        "id": "input_001",
+        "type": "Input",
+        "name": "Inquiry about Savings from Season Pass vs Daily Tickets",
+        "importance": "HIGH",
+        "raw_prompt": "",
+        "raw_prompt_ref": [
+          {
+            "line_start": 6,
+            "line_end": 6
+          }
+        ]
+      },
+      {
+        "id": "output_001",
+        "type": "Output",
+        "name": "Saved Amount from Season Pass Purchase",
+        "importance": "HIGH",
+        "raw_prompt": "",
+        "raw_prompt_ref": [
+          {
+            "line_start": 119,
+            "line_end": 119
+          },
+          {
+            "line_start": 126,
+            "line_end": 126
+          }
+        ]
+      },
+      {
+        "id": "human_001",
+        "type": "Human",
+        "name": "Park Visitor",
+        "importance": "HIGH",
+        "raw_prompt": "Person inquiring about ticket cost savings for California's Great America visits",
+        "raw_prompt_ref": [
+          {
+            "line_start": 1,
+            "line_end": 1
+          }
+        ]
+      }
+    ],
+    "relations": [
+      {
+        "id": "relation_001",
+        "source": "input_001",
+        "target": "agent_002",
+        "type": "CONSUMED_BY",
+        "importance": "HIGH",
+        "interaction_prompt": "",
+        "interaction_prompt_ref": [
+          {
+            "line_start": 6,
+            "line_end": 6
+          }
+        ]
+      },
+      {
+        "id": "relation_002",
+        "source": "agent_002",
+        "target": "task_001",
+        "type": "PERFORMS",
+        "importance": "HIGH",
+        "interaction_prompt": "Task Assignment with Manager Instructions:\n\nYou are given: (1) a task and advises from your manager with a specific plan and (2) a general task.\nCollect information from the general task, follow the suggestions from manager to solve the task.\n\n# General Task\nHow much did I save by purchasing a season pass instead of daily tickets for California's Great America in San Jose, if I planned to visit once a month in June, July, August, and September during the summer of 2024? Please solve the task carefully.\n\n# Task and suggestions from manager\n## Task description\nVerify the accuracy of the provided costs for a daily ticket and a season pass for California's Great America in San Jose for the summer of 2024.\n\n## Plan for solving the task\n1. Confirm the cost of a daily ticket for California's Great America in 2024.\n2. Confirm the cost of a season pass for California's Great America in 2024.\n\n## Output format\n- Verified cost of a daily ticket in 2024\n- Verified cost of a season pass in 2024\n\n## Constraints and conditions for completion\n- The costs must be accurate and reflect the prices for the summer of 2024.\n\n## Results from last response\n- Cost of a daily ticket in 2024: $60\n- Cost of a season pass in 2024: $120\n\nExpected Reasoning Process:\nThink through this step by step. Show your reasoning about:\n- How you will verify these prices\n- What sources you trust for accuracy\n- How you handle any conflicting information\n- Your methodology for ensuring 2024 summer pricing",
+        "interaction_prompt_ref": [
+          {
+            "line_start": 112,
+            "line_end": 112
+          },
+          {
+            "line_start": 164,
+            "line_end": 164
+          }
+        ]
+      },
+      {
+        "id": "relation_003",
+        "source": "task_001",
+        "target": "agent_002",
+        "type": "ASSIGNED_TO",
+        "importance": "HIGH",
+        "interaction_prompt": "",
+        "interaction_prompt_ref": [
+          {
+            "line_start": 8,
+            "line_end": 8
+          }
+        ]
+      },
+      {
+        "id": "relation_004",
+        "source": "task_001",
+        "target": "output_001",
+        "type": "PRODUCES",
+        "importance": "HIGH",
+        "interaction_prompt": "",
+        "interaction_prompt_ref": [
+          {
+            "line_start": 119,
+            "line_end": 119
+          }
+        ]
+      },
+      {
+        "id": "relation_005",
+        "source": "output_001",
+        "target": "human_001",
+        "type": "DELIVERS_TO",
+        "importance": "HIGH",
+        "interaction_prompt": "",
+        "interaction_prompt_ref": [
+          {
+            "line_start": 126,
+            "line_end": 126
+          }
+        ]
+      },
+      {
+        "id": "relation_006",
+        "source": "agent_002",
+        "target": "task_001",
+        "type": "INTERVENES",
+        "importance": "HIGH",
+        "interaction_prompt": "",
+        "interaction_prompt_ref": [
+          {
+            "line_start": 164,
+            "line_end": 164
+          }
+        ]
+      },
+      {
+        "id": "rel_uses_computer",
+        "source": "agent_001",
+        "target": "agent_004",
+        "type": "USES",
+        "importance": "MEDIUM",
+        "interaction_prompt": "Tool Usage Request with Reasoning Context:\n\nI need to use the Computer Terminal for computational tasks related to the ticket pricing analysis.\n\nMy reasoning for this tool usage:\n1. Task Context: We need to calculate savings from season pass vs daily tickets\n2. Calculation Required: 4 visits × daily ticket price vs season pass price\n3. Tool Selection: Computer Terminal is appropriate for mathematical calculations\n4. Expected Output: Precise calculation with clear breakdown\n\nSpecific calculation request:\n- Calculate: 4 visits × $60 per visit = total cost for daily tickets\n- Compare with: $120 season pass cost\n- Determine: Savings amount and percentage\n\nParameters:\n- Number of visits: 4 (June, July, August, September)\n- Daily ticket cost: $60 (to be verified)\n- Season pass cost: $120 (to be verified)\n- Output format: Clear numerical breakdown with explanation",
+        "interaction_prompt_ref": [
+          {
+            "line_start": 50,
+            "line_end": 55,
+            "confidence": 0.8
+          }
+        ]
+      }
+    ],
+    "failures": [],
+    "optimizations": []
+  },
+  "extraction_info": {
+    "method": "real_ai_extraction",
+    "model": "gpt-4o-mini",
+    "timestamp": "2025-01-27",
+    "api_key_used": "[REDACTED]",
+    "no_enhancement": true,
+    "source": "multi_agent_knowledge_extractor.py"
+  },
+  "realistic_enhancement_info": {
+    "enhanced_at": "2025-01-27",
+    "enhancement_type": "realistic_agent_reasoning",
+    "features_added": [
+      "explicit_reasoning_frameworks",
+      "step_by_step_thinking_instructions",
+      "tool_selection_reasoning",
+      "constraint_awareness_prompts",
+      "self_correction_mechanisms",
+      "contextual_interaction_content"
+    ],
+    "reasoning_pattern_source": "real_agent_trace_analysis",
+    "total_reasoning_instructions": 5
+  }
+}

create_realistic_prompt_reconstruction.py ADDED Viewed

	@@ -0,0 +1,362 @@

+#!/usr/bin/env python3
+"""
+Create Realistic Prompt Reconstruction Based on Real Agent Trace Patterns
+This script creates a more realistic prompt reconstruction by incorporating
+the reasoning patterns and internal thought processes observed in real agent traces.
+"""
+import json
+import sys
+import os
+import copy
+sys.path.append('/Users/zekunwu/Desktop/agent_monitoring/huggingface/AgentGraph')
+from agentgraph.reconstruction import PromptReconstructor
+def create_realistic_agent_prompts():
+    """Create realistic agent prompts with internal reasoning patterns."""
+    print("🧠 CREATING REALISTIC AGENT PROMPTS")
+    print("=" * 70)
+    realistic_agents = {
+        'agent_002': {  # Verification Expert
+            'name': 'Verification_Expert',
+            'raw_prompt': """You are a Verification_Expert responsible for validating information accuracy and conducting detailed analysis.
+Your reasoning process should be explicit and structured:
+1. Task Analysis: Identify and understand the user's request
+2. Instruction Parsing: Acknowledge constraints and requirements
+3. Step Planning: Break down complex tasks into sequential steps
+4. Tool Selection: Choose appropriate tools for each step
+5. Parameter Reasoning: Reason about tool parameters based on context
+6. Constraint Handling: Recognize limitations and adapt strategy
+7. Self Correction: Evaluate options and correct course when needed
+Available Tools:
+- web_search: Search for current pricing information
+- calculator: Perform mathematical calculations
+- data_retrieval: Access historical pricing data
+Response Format:
+- Use reasoning_content to show your internal thinking process
+- Make structured tool calls with reasoned arguments
+- Provide public content with detailed explanations
+Your expertise includes:
+- Verifying costs, prices, and numerical data
+- Cross-checking information against historical patterns
+- Conducting detailed analysis and calculations
+- Providing verified results with explanations
+Remember: Show your reasoning explicitly. Think through each decision step by step."""
+        },
+        'agent_001': {  # Problem Solving Expert
+            'name': 'ProblemSolving_Expert',
+            'raw_prompt': """You are a ProblemSolving_Expert specialized in task coordination and management.
+Your reasoning process should be explicit and structured:
+1. Task Analysis: Break down complex problems into manageable components
+2. Workflow Planning: Design step-by-step solution approaches
+3. Resource Allocation: Assign tasks to appropriate experts
+4. Progress Monitoring: Track task completion and quality
+5. Coordination: Ensure smooth handoffs between team members
+6. Quality Assurance: Validate outputs meet requirements
+Available Tools:
+- task_planner: Create detailed task breakdown structures
+- team_coordinator: Assign tasks to team members
+- progress_tracker: Monitor task completion status
+Response Format:
+- Use reasoning_content to show your coordination thinking
+- Structure tasks clearly with priorities and dependencies
+- Provide clear instructions to team members
+Your role is to:
+- Analyze complex problems and break them down into manageable tasks
+- Coordinate with other experts to solve multi-step problems
+- Provide task descriptions and guidance to verification experts
+- Ensure proper workflow execution"""
+        },
+        'agent_003': {  # Arithmetic Progressions Expert
+            'name': 'ArithmeticProgressions_Expert',
+            'raw_prompt': """You are an ArithmeticProgressions_Expert specialized in mathematical calculations and analysis.
+Your reasoning process should be explicit and structured:
+1. Mathematical Analysis: Identify the mathematical nature of the problem
+2. Formula Selection: Choose appropriate mathematical formulas and methods
+3. Calculation Planning: Structure calculations in logical sequence
+4. Validation: Cross-check results using alternative methods
+5. Pattern Recognition: Identify mathematical patterns and sequences
+6. Result Interpretation: Explain mathematical findings in context
+Available Tools:
+- advanced_calculator: Perform complex mathematical operations
+- formula_library: Access mathematical formulas and theorems
+- pattern_analyzer: Identify mathematical patterns
+Response Format:
+- Use reasoning_content to show your mathematical thinking
+- Present calculations with clear step-by-step explanations
+- Validate results through multiple approaches
+Your expertise includes:
+- Validating arithmetic calculations and mathematical reasoning
+- Analyzing numerical sequences and patterns
+- Confirming computational results
+- Providing mathematical validation for problem solutions"""
+        }
+    }
+    for agent_id, agent_data in realistic_agents.items():
+        print(f"✅ Created realistic prompt for {agent_id}: {agent_data['name']}")
+        print(f"   Length: {len(agent_data['raw_prompt'])} characters")
+        print(f"   Features: Reasoning framework, tool definitions, role clarity")
+        print()
+    return realistic_agents
+def create_realistic_interaction_prompts():
+    """Create realistic interaction prompts with reasoning content."""
+    print("💬 CREATING REALISTIC INTERACTION PROMPTS")
+    print("=" * 70)
+    realistic_interactions = {
+        'relation_002': {  # agent_002 → task_001 (PERFORMS)
+            'interaction_prompt': """Task Assignment with Manager Instructions:
+You are given: (1) a task and advises from your manager with a specific plan and (2) a general task.
+Collect information from the general task, follow the suggestions from manager to solve the task.
+# General Task
+How much did I save by purchasing a season pass instead of daily tickets for California's Great America in San Jose, if I planned to visit once a month in June, July, August, and September during the summer of 2024? Please solve the task carefully.
+# Task and suggestions from manager
+## Task description
+Verify the accuracy of the provided costs for a daily ticket and a season pass for California's Great America in San Jose for the summer of 2024.
+## Plan for solving the task
+1. Confirm the cost of a daily ticket for California's Great America in 2024.
+2. Confirm the cost of a season pass for California's Great America in 2024.
+## Output format
+- Verified cost of a daily ticket in 2024
+- Verified cost of a season pass in 2024
+## Constraints and conditions for completion
+- The costs must be accurate and reflect the prices for the summer of 2024.
+## Results from last response
+- Cost of a daily ticket in 2024: $60
+- Cost of a season pass in 2024: $120
+Expected Reasoning Process:
+Think through this step by step. Show your reasoning about:
+- How you will verify these prices
+- What sources you trust for accuracy
+- How you handle any conflicting information
+- Your methodology for ensuring 2024 summer pricing"""
+        },
+        'rel_uses_computer': {  # agent_001 → agent_004 (USES)
+            'interaction_prompt': """Tool Usage Request with Reasoning Context:
+I need to use the Computer Terminal for computational tasks related to the ticket pricing analysis.
+My reasoning for this tool usage:
+1. Task Context: We need to calculate savings from season pass vs daily tickets
+2. Calculation Required: 4 visits × daily ticket price vs season pass price
+3. Tool Selection: Computer Terminal is appropriate for mathematical calculations
+4. Expected Output: Precise calculation with clear breakdown
+Specific calculation request:
+- Calculate: 4 visits × $60 per visit = total cost for daily tickets
+- Compare with: $120 season pass cost
+- Determine: Savings amount and percentage
+Parameters:
+- Number of visits: 4 (June, July, August, September)
+- Daily ticket cost: $60 (to be verified)
+- Season pass cost: $120 (to be verified)
+- Output format: Clear numerical breakdown with explanation"""
+        }
+    }
+    for relation_id, interaction_data in realistic_interactions.items():
+        print(f"✅ Created realistic interaction for {relation_id}")
+        print(f"   Length: {len(interaction_data['interaction_prompt'])} characters")
+        print(f"   Features: Context, reasoning framework, explicit instructions")
+        print()
+    return realistic_interactions
+def create_enhanced_knowledge_graph():
+    """Create an enhanced knowledge graph with realistic agent reasoning."""
+    print("🔧 CREATING ENHANCED KNOWLEDGE GRAPH")
+    print("=" * 70)
+    # Load the original knowledge graph
+    kg_path = '/Users/zekunwu/Desktop/agent_monitoring/huggingface/AgentGraph/backend/database/samples/knowledge_graphs/kg_algorithm_sample_0.json'
+    with open(kg_path, 'r') as f:
+        original_kg = json.load(f)
+    # Create enhanced version
+    enhanced_kg = copy.deepcopy(original_kg)
+    # Get realistic agent prompts and interactions
+    realistic_agents = create_realistic_agent_prompts()
+    realistic_interactions = create_realistic_interaction_prompts()
+    # Update agent entities with realistic prompts
+    for entity in enhanced_kg['graph_data']['entities']:
+        if entity['type'] == 'Agent' and entity['id'] in realistic_agents:
+            agent_data = realistic_agents[entity['id']]
+            entity['raw_prompt'] = agent_data['raw_prompt']
+            entity['name'] = agent_data['name']
+            print(f"📝 Enhanced agent {entity['id']} with realistic reasoning framework")
+    # Update relations with realistic interaction prompts
+    for relation in enhanced_kg['graph_data']['relations']:
+        if relation['id'] in realistic_interactions:
+            relation['interaction_prompt'] = realistic_interactions[relation['id']]['interaction_prompt']
+            print(f"💬 Enhanced relation {relation['id']} with realistic interaction content")
+    # Add enhancement metadata
+    enhanced_kg['realistic_enhancement_info'] = {
+        'enhanced_at': '2025-01-27',
+        'enhancement_type': 'realistic_agent_reasoning',
+        'features_added': [
+            'explicit_reasoning_frameworks',
+            'step_by_step_thinking_instructions',
+            'tool_selection_reasoning',
+            'constraint_awareness_prompts',
+            'self_correction_mechanisms',
+            'contextual_interaction_content'
+        ],
+        'reasoning_pattern_source': 'real_agent_trace_analysis',
+        'total_reasoning_instructions': len(realistic_agents) + len(realistic_interactions)
+    }
+    return enhanced_kg
+def test_realistic_reconstruction(enhanced_kg):
+    """Test the realistic prompt reconstruction."""
+    print(f"\n🎯 TESTING REALISTIC PROMPT RECONSTRUCTION")
+    print("=" * 70)
+    try:
+        reconstructor = PromptReconstructor(enhanced_kg['graph_data'])
+        # Test the key PERFORMS relation with realistic reasoning
+        relation_id = 'relation_002'  # agent_002 → task_001 (PERFORMS)
+        result = reconstructor.reconstruct_relation_prompt(relation_id)
+        if 'error' in result:
+            print(f"❌ Reconstruction failed: {result['error']}")
+            return
+        reconstructed_prompt = result['reconstructed_prompt']
+        print(f"📊 Realistic Reconstruction Results:")
+        print(f"  Length: {len(reconstructed_prompt)} characters")
+        print(f"  Contains reasoning framework: {'reasoning process should be explicit' in reconstructed_prompt}")
+        print(f"  Contains step-by-step instructions: {'step planning' in reconstructed_prompt.lower()}")
+        print(f"  Contains tool selection guidance: {'tool selection' in reconstructed_prompt.lower()}")
+        print(f"  Contains self-correction prompts: {'self correction' in reconstructed_prompt.lower()}")
+        print(f"\n📝 Realistic Prompt Preview:")
+        print("─" * 50)
+        lines = reconstructed_prompt.split('\n')
+        for i, line in enumerate(lines[:20], 1):  # First 20 lines
+            print(f"{i:2}: {line}")
+        if len(lines) > 20:
+            print(f"   ... and {len(lines)-20} more lines")
+        print(f"\n🧠 Reasoning Content Analysis:")
+        reasoning_indicators = {
+            'task_analysis': 'task analysis' in reconstructed_prompt.lower(),
+            'step_planning': 'step planning' in reconstructed_prompt.lower(),
+            'tool_selection': 'tool selection' in reconstructed_prompt.lower(),
+            'constraint_handling': 'constraint handling' in reconstructed_prompt.lower(),
+            'self_correction': 'self correction' in reconstructed_prompt.lower(),
+            'explicit_reasoning': 'show your reasoning' in reconstructed_prompt.lower()
+        }
+        for indicator, present in reasoning_indicators.items():
+            status = "✅" if present else "❌"
+            print(f"  {status} {indicator.replace('_', ' ').title()}: {'Present' if present else 'Missing'}")
+        return reconstructed_prompt
+    except Exception as e:
+        print(f"💥 Realistic reconstruction failed: {str(e)}")
+        return None
+def save_realistic_enhanced_sample(enhanced_kg):
+    """Save the realistic enhanced sample."""
+    print(f"\n💾 SAVING REALISTIC ENHANCED SAMPLE")
+    print("=" * 70)
+    # Save realistic enhanced knowledge graph
+    realistic_kg_path = '/Users/zekunwu/Desktop/agent_monitoring/huggingface/AgentGraph/backend/database/samples/knowledge_graphs/kg_algorithm_sample_0_realistic.json'
+    with open(realistic_kg_path, 'w') as f:
+        json.dump(enhanced_kg, f, indent=2, ensure_ascii=False)
+    print(f"✅ Saved realistic enhanced knowledge graph to:")
+    print(f"   {realistic_kg_path}")
+    # Test the realistic reconstruction
+    realistic_prompt = test_realistic_reconstruction(enhanced_kg)
+    if realistic_prompt:
+        # Save reconstruction example
+        reconstruction_example_path = '/Users/zekunwu/Desktop/agent_monitoring/huggingface/AgentGraph/backend/database/samples/reconstructions/realistic_prompt_example.txt'
+        os.makedirs(os.path.dirname(reconstruction_example_path), exist_ok=True)
+        with open(reconstruction_example_path, 'w') as f:
+            f.write("# Realistic Agent Prompt Reconstruction Example\n")
+            f.write("# Based on Real Agent Trace Reasoning Patterns\n\n")
+            f.write(realistic_prompt)
+        print(f"✅ Saved realistic prompt example to:")
+        print(f"   {reconstruction_example_path}")
+def main():
+    """Main function to create realistic prompt reconstruction."""
+    print("🚀 CREATING REALISTIC PROMPT RECONSTRUCTION")
+    print("Based on Real Agent Trace Reasoning Patterns")
+    print("=" * 70)
+    # Create enhanced knowledge graph with realistic reasoning
+    enhanced_kg = create_enhanced_knowledge_graph()
+    # Save the realistic enhanced sample
+    save_realistic_enhanced_sample(enhanced_kg)
+    print(f"\n🎉 REALISTIC ENHANCEMENT COMPLETE")
+    print("=" * 70)
+    print("✅ Key improvements based on real agent traces:")
+    print("  • Explicit reasoning frameworks for each agent")
+    print("  • Step-by-step thinking instructions")
+    print("  • Tool selection reasoning guidance")
+    print("  • Constraint awareness and adaptation prompts")
+    print("  • Self-correction mechanisms")
+    print("  • Contextual interaction content with reasoning")
+    print()
+    print("🎯 This enables:")
+    print("  • More realistic perturbation testing")
+    print("  • Better simulation of actual agent cognition")
+    print("  • Improved causal analysis of reasoning patterns")
+    print("  • Production-quality agent interaction modeling")
+if __name__ == "__main__":
+    main()

validate_enhanced_reconstruction.py ADDED Viewed

	@@ -0,0 +1,94 @@

+#!/usr/bin/env python3
+"""
+Validate Enhanced Prompt Reconstruction
+Quick validation script to ensure the enhanced prompt reconstruction
+maintains the same input/output interface while improving internal logic.
+"""
+import json
+import sys
+import os
+sys.path.append('/Users/zekunwu/Desktop/agent_monitoring/huggingface/AgentGraph')
+from agentgraph.reconstruction import PromptReconstructor
+def validate_reconstruction():
+    """Validate that the enhanced reconstruction works correctly."""
+    print("🔍 VALIDATING ENHANCED PROMPT RECONSTRUCTION")
+    print("=" * 70)
+    # Load the algorithm sample 0 knowledge graph
+    kg_path = '/Users/zekunwu/Desktop/agent_monitoring/huggingface/AgentGraph/backend/database/samples/knowledge_graphs/kg_algorithm_sample_0.json'
+    try:
+        with open(kg_path, 'r') as f:
+            kg_data = json.load(f)
+        kg = kg_data['graph_data']
+        print(f"✅ Loaded knowledge graph with {len(kg['entities'])} entities and {len(kg['relations'])} relations")
+        # Initialize reconstructor
+        reconstructor = PromptReconstructor(kg)
+        print("✅ PromptReconstructor initialized successfully")
+        # Test reconstruction of all relations
+        reconstructed_relations = reconstructor.reconstruct_relations()
+        print(f"✅ Successfully reconstructed {len(reconstructed_relations)} relations")
+        # Show sample reconstruction for PERFORMS relation
+        performs_relations = [r for r in reconstructed_relations if r.get('type') == 'PERFORMS']
+        if performs_relations:
+            sample_relation = performs_relations[0]
+            print(f"\n📋 SAMPLE ENHANCED RECONSTRUCTION:")
+            print(f"Relation: {sample_relation['source_entity']['name']} → {sample_relation['target_entity']['name']}")
+            print(f"Type: {sample_relation['type']}")
+            print(f"Prompt length: {len(sample_relation.get('prompt', ''))} characters")
+            # Show first 500 characters of the enhanced prompt
+            prompt_preview = sample_relation.get('prompt', '')[:500]
+            print(f"\nPrompt preview (first 500 chars):")
+            print("-" * 50)
+            print(prompt_preview)
+            if len(sample_relation.get('prompt', '')) > 500:
+                print("... [truncated]")
+            print("-" * 50)
+            # Verify enhanced features are present
+            full_prompt = sample_relation.get('prompt', '')
+            enhancements_found = []
+            if "CRITICAL INSTRUCTIONS:" in full_prompt:
+                enhancements_found.append("✅ Critical instructions")
+            if "step by step" in full_prompt.lower():
+                enhancements_found.append("✅ Step-by-step reasoning")
+            if "Reasoning:" in full_prompt:
+                enhancements_found.append("✅ Enhanced response format")
+            if "Task Analysis:" in full_prompt:
+                enhancements_found.append("✅ Task analysis structure")
+            if "systematic approach" in full_prompt.lower():
+                enhancements_found.append("✅ Systematic approach emphasis")
+            print(f"\n🎯 ENHANCED FEATURES DETECTED:")
+            for enhancement in enhancements_found:
+                print(f"  {enhancement}")
+            if len(enhancements_found) >= 4:
+                print(f"\n🎉 SUCCESS: Enhanced reconstruction is working correctly!")
+                print(f"   Found {len(enhancements_found)}/5 expected enhancements")
+            else:
+                print(f"\n⚠️  WARNING: Only found {len(enhancements_found)}/5 expected enhancements")
+        print(f"\n✅ VALIDATION COMPLETE: Enhanced prompt reconstruction is functional")
+        return True
+    except Exception as e:
+        print(f"❌ VALIDATION FAILED: {str(e)}")
+        import traceback
+        traceback.print_exc()
+        return False
+if __name__ == "__main__":
+    success = validate_reconstruction()
+    sys.exit(0 if success else 1)