agentbee

Sleeping

App Files Community

mangubee committed on Jan 17

Commit

e7b4937

1 Parent(s): f1b095a

fix: correct author name formatting in multiple files

Browse files

Files changed (29) hide show

.env.example +1 -1
requirements.txt +1 -1
src/__init__.py +1 -1
src/agent/__init__.py +1 -1
src/agent/graph.py +145 -64
src/agent/llm_client.py +1 -1
src/config/__init__.py +1 -1
src/config/settings.py +1 -1
src/tools/__init__.py +1 -1
src/tools/audio.py +1 -1
src/tools/calculator.py +1 -1
src/tools/file_parser.py +1 -1
src/tools/vision.py +1 -1
src/tools/web_search.py +1 -1
src/tools/youtube.py +1 -1
src/utils/__init__.py +1 -1
src/utils/ground_truth.py +1 -1
test/__init__.py +1 -1
test/fixtures/generate_fixtures.py +1 -1
test/test_agent_basic.py +1 -1
test/test_calculator.py +1 -1
test/test_file_parser.py +1 -1
test/test_llm_integration.py +1 -1
test/test_phase0_hf_vision_api.py +1 -1
test/test_smoke_hf_vision.py +1 -1
test/test_stage1.py +1 -1
test/test_stage3_e2e.py +1 -1
test/test_vision.py +1 -1
test/test_web_search.py +1 -1

.env.example CHANGED Viewed

@@ -1,5 +1,5 @@
 # GAIA Benchmark Agent - Environment Configuration Template
-# Author: @mangobee
 # Date: 2026-01-01
 #
 # Copy this file to .env and fill in your API keys

 # GAIA Benchmark Agent - Environment Configuration Template
+# Author: @mangubee
 # Date: 2026-01-01
 #
 # Copy this file to .env and fill in your API keys

requirements.txt CHANGED Viewed

@@ -1,5 +1,5 @@
 # GAIA Benchmark Agent - Dependencies
-# Author: @mangobee
 # Date: 2026-01-01
 # ============================================================================

 # GAIA Benchmark Agent - Dependencies
+# Author: @mangubee
 # Date: 2026-01-01
 # ============================================================================

src/__init__.py CHANGED Viewed

@@ -1,6 +1,6 @@
 """
 GAIA Benchmark Agent - Source Package
-Author: @mangobee
 Date: 2026-01-01
 """

 """
 GAIA Benchmark Agent - Source Package
+Author: @mangubee
 Date: 2026-01-01
 """

src/agent/__init__.py CHANGED Viewed

@@ -1,6 +1,6 @@
 """
 LangGraph agent core package
-Author: @mangobee
 """
 from .graph import GAIAAgent

 """
 LangGraph agent core package
+Author: @mangubee
 """
 from .graph import GAIAAgent

src/agent/graph.py CHANGED Viewed

@@ -1,6 +1,6 @@
 """
 LangGraph Agent Core - StateGraph Definition
-Author: @mangobee
 Date: 2026-01-01
 Stage 1: Skeleton with placeholder nodes
@@ -19,7 +19,15 @@ from pathlib import Path
 from typing import TypedDict, List, Optional
 from langgraph.graph import StateGraph, END
 from src.config import Settings
-from src.tools import TOOLS, search, parse_file, safe_eval, analyze_image, youtube_transcript, transcribe_audio
 from src.agent.llm_client import (
     plan_question,
     select_tools_with_function_calling,
@@ -35,6 +43,7 @@ logger = logging.getLogger(__name__)
 # Helper Functions
 # ============================================================================
 def is_vision_question(question: str) -> bool:
     """
     Detect if question requires vision analysis tool.
@@ -47,9 +56,19 @@ def is_vision_question(question: str) -> bool:
     Returns:
         True if question likely requires vision tool, False otherwise
     """
-    vision_keywords = ["image", "video", "youtube", "photo", "picture", "watch", "screenshot", "visual"]
     return any(keyword in question.lower() for keyword in vision_keywords)
 # ============================================================================
 # Agent State Definition
 # ============================================================================
@@ -119,7 +138,9 @@ def fallback_tool_selection(
     Returns:
         List of tool calls with basic parameters
     """
-    logger.info("[fallback_tool_selection] Using keyword-based fallback for tool selection")
     tool_calls = []
     question_lower = question.lower()
@@ -127,53 +148,88 @@ def fallback_tool_selection(
     combined = f"{question_lower} {plan_lower}"
     # Search tool: keywords like "search", "find", "look up", "who", "what", "when", "where"
-    search_keywords = ["search", "find", "look up", "who is", "what is", "when", "where", "google"]
     if any(keyword in combined for keyword in search_keywords):
         # Extract search query - use first sentence or full question
-        query = question.split('.')[0] if '.' in question else question
-        tool_calls.append({
-            "tool": "web_search",
-            "params": {"query": query}
-        })
-        logger.info(f"[fallback_tool_selection] Added web_search tool with query: {query}")
     # Math tool: keywords like "calculate", "compute", "+", "-", "*", "/", "="
-    math_keywords = ["calculate", "compute", "math", "sum", "multiply", "divide", "+", "-", "*", "/", "="]
     if any(keyword in combined for keyword in math_keywords):
         # Try to extract expression - look for patterns with numbers and operators
         import re
         # Look for mathematical expressions
-        expr_match = re.search(r'[\d\s\+\-\*/\(\)\.]+', question)
         if expr_match:
             expression = expr_match.group().strip()
-            tool_calls.append({
-                "tool": "calculator",
-                "params": {"expression": expression}
-            })
-            logger.info(f"[fallback_tool_selection] Added calculator tool with expression: {expression}")
     # File tool: if file_paths available, use them
     if file_paths:
         for file_path in file_paths:
             # Determine file type and appropriate tool
             file_ext = Path(file_path).suffix.lower()
-            if file_ext in ['.png', '.jpg', '.jpeg']:
-                tool_calls.append({
-                    "tool": "vision",
-                    "params": {"image_path": file_path}
-                })
-                logger.info(f"[fallback_tool_selection] Added vision tool for image: {file_path}")
-            elif file_ext in ['.pdf', '.xlsx', '.xls', '.csv', '.json', '.txt', '.docx', '.doc']:
-                tool_calls.append({
-                    "tool": "parse_file",
-                    "params": {"file_path": file_path}
-                })
-                logger.info(f"[fallback_tool_selection] Added parse_file tool for: {file_path}")
     else:
         # Keyword-based file detection (legacy)
         file_keywords = ["file", "parse", "read", "csv", "json", "txt", "document"]
         if any(keyword in combined for keyword in file_keywords):
-            logger.warning("[fallback_tool_selection] File operation detected but no file_paths available")
     # Image tool: keywords like "image", "picture", "photo", "analyze", "vision"
     image_keywords = ["image", "picture", "photo", "analyze image", "vision"]
@@ -182,17 +238,20 @@ def fallback_tool_selection(
             # Already handled above in file_paths check
             pass
         else:
-            logger.warning("[fallback_tool_selection] Image operation detected but no file_paths available")
     if not tool_calls:
-        logger.warning("[fallback_tool_selection] No tools selected by fallback - adding default search")
         # Default: just search the question
-        tool_calls.append({
-            "tool": "web_search",
-            "params": {"query": question}
-        })
-    logger.info(f"[fallback_tool_selection] Fallback selected {len(tool_calls)} tool(s)")
     return tool_calls
@@ -264,7 +323,9 @@ def execute_node(state: AgentState) -> AgentState:
             )
         elif not isinstance(tool_calls, list):
             logger.error(f"[execute] Invalid type: {type(tool_calls)}, using fallback")
-            state["errors"].append(f"Tool selection returned invalid type: {type(tool_calls)}")
             tool_calls = fallback_tool_selection(
                 state["question"], state["plan"], state.get("file_paths")
             )
@@ -284,12 +345,14 @@ def execute_node(state: AgentState) -> AgentState:
                 result = tool_func(**params)
                 logger.info(f"[{idx}/{len(tool_calls)}] {tool_name} ✓")
-                tool_results.append({
-                    "tool": tool_name,
-                    "params": params,
-                    "result": result,
-                    "status": "success",
-                })
                 # Extract evidence - handle different result formats
                 if isinstance(result, dict):
@@ -307,7 +370,9 @@ def execute_node(state: AgentState) -> AgentState:
                                 title = r.get("title", "")[:100]
                                 url = r.get("url", "")[:100]
                                 snippet = r.get("snippet", "")[:200]
-                                formatted.append(f"Title: {title}\nURL: {url}\nSnippet: {snippet}")
                             evidence.append("\n\n".join(formatted))
                         else:
                             evidence.append(str(result))
@@ -320,13 +385,17 @@ def execute_node(state: AgentState) -> AgentState:
             except Exception as tool_error:
                 logger.error(f"[execute] ✗ {tool_name}: {tool_error}")
-                tool_results.append({
-                    "tool": tool_name,
-                    "params": params,
-                    "error": str(tool_error),
-                    "status": "failed",
-                })
-                if tool_name == "vision" and ("quota" in str(tool_error).lower() or "429" in str(tool_error)):
                     state["errors"].append(f"Vision failed: LLM quota exhausted")
                 else:
                     state["errors"].append(f"{tool_name}: {type(tool_error).__name__}")
@@ -336,7 +405,9 @@ def execute_node(state: AgentState) -> AgentState:
     except Exception as e:
         logger.error(f"[execute] ✗ {type(e).__name__}: {str(e)}")
-        if is_vision_question(state["question"]) and ("quota" in str(e).lower() or "429" in str(e)):
             state["errors"].append("Vision unavailable (quota exhausted)")
         else:
             state["errors"].append(f"Execution error: {type(e).__name__}")
@@ -364,12 +435,14 @@ def execute_node(state: AgentState) -> AgentState:
                         tool_func = TOOL_FUNCTIONS.get(tool_name)
                         if tool_func:
                             result = tool_func(**params)
-                            tool_results.append({
-                                "tool": tool_name,
-                                "params": params,
-                                "result": result,
-                                "status": "success"
-                            })
                             if isinstance(result, dict):
                                 if "answer" in result:
                                     evidence.append(result["answer"])
@@ -381,7 +454,9 @@ def execute_node(state: AgentState) -> AgentState:
                                             title = r.get("title", "")[:100]
                                             url = r.get("url", "")[:100]
                                             snippet = r.get("snippet", "")[:200]
-                                            formatted.append(f"Title: {title}\nURL: {url}\nSnippet: {snippet}")
                                         evidence.append("\n\n".join(formatted))
                                     else:
                                         evidence.append(str(result))
@@ -411,7 +486,9 @@ def answer_node(state: AgentState) -> AgentState:
     try:
         if not state["evidence"]:
-            error_summary = "; ".join(state["errors"]) if state["errors"] else "No errors logged"
             state["answer"] = f"ERROR: No evidence. {error_summary}"
             logger.error(f"[answer] ✗ No evidence - {error_summary}")
             return state
@@ -425,7 +502,9 @@ def answer_node(state: AgentState) -> AgentState:
     except Exception as e:
         logger.error(f"[answer] ✗ {type(e).__name__}: {str(e)}")
         state["errors"].append(f"Answer synthesis error: {type(e).__name__}: {str(e)}")
-        state["answer"] = f"ERROR: Answer synthesis failed - {type(e).__name__}: {str(e)}"
     return state
@@ -491,7 +570,9 @@ class GAIAAgent:
             warning_msg = f"⚠️  WARNING: Missing API keys: {', '.join(missing_keys)}"
             print(warning_msg)
             logger.warning(warning_msg)
-            print("   Agent may fail to answer questions. Set keys in environment variables.")
         else:
             print("✓ All API keys present")

 """
 LangGraph Agent Core - StateGraph Definition
+Author: @mangubee
 Date: 2026-01-01
 Stage 1: Skeleton with placeholder nodes
 from typing import TypedDict, List, Optional
 from langgraph.graph import StateGraph, END
 from src.config import Settings
+from src.tools import (
+    TOOLS,
+    search,
+    parse_file,
+    safe_eval,
+    analyze_image,
+    youtube_transcript,
+    transcribe_audio,
+)
 from src.agent.llm_client import (
     plan_question,
     select_tools_with_function_calling,
 # Helper Functions
 # ============================================================================
 def is_vision_question(question: str) -> bool:
     """
     Detect if question requires vision analysis tool.
     Returns:
         True if question likely requires vision tool, False otherwise
     """
+    vision_keywords = [
+        "image",
+        "video",
+        "youtube",
+        "photo",
+        "picture",
+        "watch",
+        "screenshot",
+        "visual",
+    ]
     return any(keyword in question.lower() for keyword in vision_keywords)
 # ============================================================================
 # Agent State Definition
 # ============================================================================
     Returns:
         List of tool calls with basic parameters
     """
+    logger.info(
+        "[fallback_tool_selection] Using keyword-based fallback for tool selection"
+    )
     tool_calls = []
     question_lower = question.lower()
     combined = f"{question_lower} {plan_lower}"
     # Search tool: keywords like "search", "find", "look up", "who", "what", "when", "where"
+    search_keywords = [
+        "search",
+        "find",
+        "look up",
+        "who is",
+        "what is",
+        "when",
+        "where",
+        "google",
+    ]
     if any(keyword in combined for keyword in search_keywords):
         # Extract search query - use first sentence or full question
+        query = question.split(".")[0] if "." in question else question
+        tool_calls.append({"tool": "web_search", "params": {"query": query}})
+        logger.info(
+            f"[fallback_tool_selection] Added web_search tool with query: {query}"
+        )
     # Math tool: keywords like "calculate", "compute", "+", "-", "*", "/", "="
+    math_keywords = [
+        "calculate",
+        "compute",
+        "math",
+        "sum",
+        "multiply",
+        "divide",
+        "+",
+        "-",
+        "*",
+        "/",
+        "=",
+    ]
     if any(keyword in combined for keyword in math_keywords):
         # Try to extract expression - look for patterns with numbers and operators
         import re
         # Look for mathematical expressions
+        expr_match = re.search(r"[\d\s\+\-\*/\(\)\.]+", question)
         if expr_match:
             expression = expr_match.group().strip()
+            tool_calls.append(
+                {"tool": "calculator", "params": {"expression": expression}}
+            )
+            logger.info(
+                f"[fallback_tool_selection] Added calculator tool with expression: {expression}"
+            )
     # File tool: if file_paths available, use them
     if file_paths:
         for file_path in file_paths:
             # Determine file type and appropriate tool
             file_ext = Path(file_path).suffix.lower()
+            if file_ext in [".png", ".jpg", ".jpeg"]:
+                tool_calls.append(
+                    {"tool": "vision", "params": {"image_path": file_path}}
+                )
+                logger.info(
+                    f"[fallback_tool_selection] Added vision tool for image: {file_path}"
+                )
+            elif file_ext in [
+                ".pdf",
+                ".xlsx",
+                ".xls",
+                ".csv",
+                ".json",
+                ".txt",
+                ".docx",
+                ".doc",
+            ]:
+                tool_calls.append(
+                    {"tool": "parse_file", "params": {"file_path": file_path}}
+                )
+                logger.info(
+                    f"[fallback_tool_selection] Added parse_file tool for: {file_path}"
+                )
     else:
         # Keyword-based file detection (legacy)
         file_keywords = ["file", "parse", "read", "csv", "json", "txt", "document"]
         if any(keyword in combined for keyword in file_keywords):
+            logger.warning(
+                "[fallback_tool_selection] File operation detected but no file_paths available"
+            )
     # Image tool: keywords like "image", "picture", "photo", "analyze", "vision"
     image_keywords = ["image", "picture", "photo", "analyze image", "vision"]
             # Already handled above in file_paths check
             pass
         else:
+            logger.warning(
+                "[fallback_tool_selection] Image operation detected but no file_paths available"
+            )
     if not tool_calls:
+        logger.warning(
+            "[fallback_tool_selection] No tools selected by fallback - adding default search"
+        )
         # Default: just search the question
+        tool_calls.append({"tool": "web_search", "params": {"query": question}})
+    logger.info(
+        f"[fallback_tool_selection] Fallback selected {len(tool_calls)} tool(s)"
+    )
     return tool_calls
             )
         elif not isinstance(tool_calls, list):
             logger.error(f"[execute] Invalid type: {type(tool_calls)}, using fallback")
+            state["errors"].append(
+                f"Tool selection returned invalid type: {type(tool_calls)}"
+            )
             tool_calls = fallback_tool_selection(
                 state["question"], state["plan"], state.get("file_paths")
             )
                 result = tool_func(**params)
                 logger.info(f"[{idx}/{len(tool_calls)}] {tool_name} ✓")
+                tool_results.append(
+                    {
+                        "tool": tool_name,
+                        "params": params,
+                        "result": result,
+                        "status": "success",
+                    }
+                )
                 # Extract evidence - handle different result formats
                 if isinstance(result, dict):
                                 title = r.get("title", "")[:100]
                                 url = r.get("url", "")[:100]
                                 snippet = r.get("snippet", "")[:200]
+                                formatted.append(
+                                    f"Title: {title}\nURL: {url}\nSnippet: {snippet}"
+                                )
                             evidence.append("\n\n".join(formatted))
                         else:
                             evidence.append(str(result))
             except Exception as tool_error:
                 logger.error(f"[execute] ✗ {tool_name}: {tool_error}")
+                tool_results.append(
+                    {
+                        "tool": tool_name,
+                        "params": params,
+                        "error": str(tool_error),
+                        "status": "failed",
+                    }
+                )
+                if tool_name == "vision" and (
+                    "quota" in str(tool_error).lower() or "429" in str(tool_error)
+                ):
                     state["errors"].append(f"Vision failed: LLM quota exhausted")
                 else:
                     state["errors"].append(f"{tool_name}: {type(tool_error).__name__}")
     except Exception as e:
         logger.error(f"[execute] ✗ {type(e).__name__}: {str(e)}")
+        if is_vision_question(state["question"]) and (
+            "quota" in str(e).lower() or "429" in str(e)
+        ):
             state["errors"].append("Vision unavailable (quota exhausted)")
         else:
             state["errors"].append(f"Execution error: {type(e).__name__}")
                         tool_func = TOOL_FUNCTIONS.get(tool_name)
                         if tool_func:
                             result = tool_func(**params)
+                            tool_results.append(
+                                {
+                                    "tool": tool_name,
+                                    "params": params,
+                                    "result": result,
+                                    "status": "success",
+                                }
+                            )
                             if isinstance(result, dict):
                                 if "answer" in result:
                                     evidence.append(result["answer"])
                                             title = r.get("title", "")[:100]
                                             url = r.get("url", "")[:100]
                                             snippet = r.get("snippet", "")[:200]
+                                            formatted.append(
+                                                f"Title: {title}\nURL: {url}\nSnippet: {snippet}"
+                                            )
                                         evidence.append("\n\n".join(formatted))
                                     else:
                                         evidence.append(str(result))
     try:
         if not state["evidence"]:
+            error_summary = (
+                "; ".join(state["errors"]) if state["errors"] else "No errors logged"
+            )
             state["answer"] = f"ERROR: No evidence. {error_summary}"
             logger.error(f"[answer] ✗ No evidence - {error_summary}")
             return state
     except Exception as e:
         logger.error(f"[answer] ✗ {type(e).__name__}: {str(e)}")
         state["errors"].append(f"Answer synthesis error: {type(e).__name__}: {str(e)}")
+        state["answer"] = (
+            f"ERROR: Answer synthesis failed - {type(e).__name__}: {str(e)}"
+        )
     return state
             warning_msg = f"⚠️  WARNING: Missing API keys: {', '.join(missing_keys)}"
             print(warning_msg)
             logger.warning(warning_msg)
+            print(
+                "   Agent may fail to answer questions. Set keys in environment variables."
+            )
         else:
             print("✓ All API keys present")

src/agent/llm_client.py CHANGED Viewed

@@ -1,6 +1,6 @@
 """
 LLM Client Module - Multi-Provider LLM Integration
-Author: @mangobee
 Date: 2026-01-02
 Handles all LLM calls for:

 """
 LLM Client Module - Multi-Provider LLM Integration
+Author: @mangubee
 Date: 2026-01-02
 Handles all LLM calls for:

src/config/__init__.py CHANGED Viewed

@@ -1,6 +1,6 @@
 """
 Configuration management package
-Author: @mangobee
 """
 from .settings import Settings

 """
 Configuration management package
+Author: @mangubee
 """
 from .settings import Settings

src/config/settings.py CHANGED Viewed

@@ -1,6 +1,6 @@
 """
 Configuration Management
-Author: @mangobee
 Date: 2026-01-01
 Loads environment variables and defines configuration constants for GAIA agent.

 """
 Configuration Management
+Author: @mangubee
 Date: 2026-01-01
 Loads environment variables and defines configuration constants for GAIA agent.

src/tools/__init__.py CHANGED Viewed

@@ -1,6 +1,6 @@
 """
 Tool implementations package
-Author: @mangobee
 This package contains all agent tools:
 - web_search: Web search using Tavily/Exa

 """
 Tool implementations package
+Author: @mangubee
 This package contains all agent tools:
 - web_search: Web search using Tavily/Exa

src/tools/audio.py CHANGED Viewed

@@ -1,6 +1,6 @@
 """
 Audio Transcription Tool - Whisper speech-to-text
-Author: @mangobee
 Date: 2026-01-13
 Provides audio transcription using OpenAI Whisper:

 """
 Audio Transcription Tool - Whisper speech-to-text
+Author: @mangubee
 Date: 2026-01-13
 Provides audio transcription using OpenAI Whisper:

src/tools/calculator.py CHANGED Viewed

@@ -1,6 +1,6 @@
 """
 Calculator Tool - Safe mathematical expression evaluation
-Author: @mangobee
 Date: 2026-01-02
 Provides safe evaluation of mathematical expressions with:

 """
 Calculator Tool - Safe mathematical expression evaluation
+Author: @mangubee
 Date: 2026-01-02
 Provides safe evaluation of mathematical expressions with:

src/tools/file_parser.py CHANGED Viewed

@@ -1,6 +1,6 @@
 """
 File Parser Tool - Multi-format file reading
-Author: @mangobee
 Date: 2026-01-02
 Provides file parsing for:

 """
 File Parser Tool - Multi-format file reading
+Author: @mangubee
 Date: 2026-01-02
 Provides file parsing for:

src/tools/vision.py CHANGED Viewed

@@ -1,6 +1,6 @@
 """
 Vision Tool - Image analysis using multimodal LLMs
-Author: @mangobee
 Date: 2026-01-02
 Provides image analysis functionality using:

 """
 Vision Tool - Image analysis using multimodal LLMs
+Author: @mangubee
 Date: 2026-01-02
 Provides image analysis functionality using:

src/tools/web_search.py CHANGED Viewed

@@ -1,6 +1,6 @@
 """
 Web Search Tool - Tavily and Exa implementations
-Author: @mangobee
 Date: 2026-01-02
 Provides web search functionality with:

 """
 Web Search Tool - Tavily and Exa implementations
+Author: @mangubee
 Date: 2026-01-02
 Provides web search functionality with:

src/tools/youtube.py CHANGED Viewed

@@ -1,6 +1,6 @@
 """
 YouTube Video Analysis Tool - Extract transcripts or analyze frames from YouTube videos
-Author: @mangobee
 Date: 2026-01-13
 Provides two modes for YouTube video analysis:

 """
 YouTube Video Analysis Tool - Extract transcripts or analyze frames from YouTube videos
+Author: @mangubee
 Date: 2026-01-13
 Provides two modes for YouTube video analysis:

src/utils/__init__.py CHANGED Viewed

@@ -1,6 +1,6 @@
 """Utility modules for GAIA agent.
-Author: @mangobee
 """
 from .ground_truth import get_ground_truth, GAIAGroundTruth

 """Utility modules for GAIA agent.
+Author: @mangubee
 """
 from .ground_truth import get_ground_truth, GAIAGroundTruth

src/utils/ground_truth.py CHANGED Viewed

@@ -1,6 +1,6 @@
 """Ground truth comparison using GAIA validation dataset.
-Author: @mangobee
 Since the GAIA API only returns summary stats (X/Y correct) without per-question
 correctness, we load the public validation dataset to compare our answers locally.

 """Ground truth comparison using GAIA validation dataset.
+Author: @mangubee
 Since the GAIA API only returns summary stats (X/Y correct) without per-question
 correctness, we load the public validation dataset to compare our answers locally.

test/__init__.py CHANGED Viewed

@@ -1,6 +1,6 @@
 """
 Tests Package for GAIA Agent
-Author: @mangobee
 Date: 2026-01-01
 Test organization:

 """
 Tests Package for GAIA Agent
+Author: @mangubee
 Date: 2026-01-01
 Test organization:

test/fixtures/generate_fixtures.py CHANGED Viewed

@@ -1,6 +1,6 @@
 """
 Generate test fixtures for file parser tests
-Author: @mangobee
 """
 from pathlib import Path

 """
 Generate test fixtures for file parser tests
+Author: @mangubee
 """
 from pathlib import Path

test/test_agent_basic.py CHANGED Viewed

@@ -1,6 +1,6 @@
 """
 Basic Tests for GAIA Agent - Stage 1 Validation
-Author: @mangobee
 Date: 2026-01-01
 Tests for Stage 1: Foundation Setup

 """
 Basic Tests for GAIA Agent - Stage 1 Validation
+Author: @mangubee
 Date: 2026-01-01
 Tests for Stage 1: Foundation Setup

test/test_calculator.py CHANGED Viewed

@@ -1,6 +1,6 @@
 """
 Tests for calculator tool (safe mathematical evaluation)
-Author: @mangobee
 Date: 2026-01-02
 Tests cover:

 """
 Tests for calculator tool (safe mathematical evaluation)
+Author: @mangubee
 Date: 2026-01-02
 Tests cover:

test/test_file_parser.py CHANGED Viewed

@@ -1,6 +1,6 @@
 """
 Tests for file parser tool
-Author: @mangobee
 Date: 2026-01-02
 Tests cover:

 """
 Tests for file parser tool
+Author: @mangubee
 Date: 2026-01-02
 Tests cover:

test/test_llm_integration.py CHANGED Viewed

@@ -1,6 +1,6 @@
 """
 LLM Integration Tests - Stage 3 Validation
-Author: @mangobee
 Date: 2026-01-02
 Tests for Stage 3 LLM integration:

 """
 LLM Integration Tests - Stage 3 Validation
+Author: @mangubee
 Date: 2026-01-02
 Tests for Stage 3 LLM integration:

test/test_phase0_hf_vision_api.py CHANGED Viewed

@@ -1,7 +1,7 @@
 #!/usr/bin/env python3
 """
 Phase 0: HuggingFace Inference API Vision Validation
-Author: @mangobee
 Date: 2026-01-07
 Tests HF Inference API with vision models to validate multimodal support BEFORE

 #!/usr/bin/env python3
 """
 Phase 0: HuggingFace Inference API Vision Validation
+Author: @mangubee
 Date: 2026-01-07
 Tests HF Inference API with vision models to validate multimodal support BEFORE

test/test_smoke_hf_vision.py CHANGED Viewed

@@ -1,7 +1,7 @@
 #!/usr/bin/env python3
 """
 Phase 2: Smoke Tests for HF Vision Integration
-Author: @mangobee
 Date: 2026-01-11
 Quick validation that HF vision works before GAIA evaluation.

 #!/usr/bin/env python3
 """
 Phase 2: Smoke Tests for HF Vision Integration
+Author: @mangubee
 Date: 2026-01-11
 Quick validation that HF vision works before GAIA evaluation.

test/test_stage1.py CHANGED Viewed

@@ -1,6 +1,6 @@
 """
 Stage 1 Quick Verification Test
-Author: @mangobee
 Test that agent initialization and basic execution works.
 """

 """
 Stage 1 Quick Verification Test
+Author: @mangubee
 Test that agent initialization and basic execution works.
 """

test/test_stage3_e2e.py CHANGED Viewed

@@ -1,6 +1,6 @@
 """
 Stage 3 End-to-End Test with Real LLM API
-Author: @mangobee
 Date: 2026-01-02
 Manual test for Stage 3 workflow with actual Claude API.

 """
 Stage 3 End-to-End Test with Real LLM API
+Author: @mangubee
 Date: 2026-01-02
 Manual test for Stage 3 workflow with actual Claude API.

test/test_vision.py CHANGED Viewed

@@ -1,6 +1,6 @@
 """
 Tests for vision tool (multimodal image analysis)
-Author: @mangobee
 Date: 2026-01-02
 Tests cover:

 """
 Tests for vision tool (multimodal image analysis)
+Author: @mangubee
 Date: 2026-01-02
 Tests cover:

test/test_web_search.py CHANGED Viewed

@@ -1,6 +1,6 @@
 """
 Tests for web search tool (Tavily and Exa)
-Author: @mangobee
 Date: 2026-01-02
 Tests cover:

 """
 Tests for web search tool (Tavily and Exa)
+Author: @mangubee
 Date: 2026-01-02
 Tests cover: