Spaces:

promptAId
/

operations

Runtime error

jbbove commited on Sep 7, 2025

Commit

bcda1ac

1 Parent(s): a34989b

Phase 4: Implement LLM-based summarization node

🚀 Major Features:
- New llm_summarization_node() in agent/nodes.py for intelligent data analysis
- Enhanced LLMClient with generate_insights() method for data summarization
- Complete Phase 4 architecture: task-specific formatting → LLM insights → response generation

🧪 Comprehensive Testing:
- 5/5 unit tests for LLM summarization node with mock LLM clients
- End-to-end integration tests for temperature and precipitation workflows
- Enhanced test visibility showing complete workflow phases
- Mock testing framework for API-free validation

📊 OMIRL Improvements:
- Removed task-agnostic summarization (replaced with task-specific formatting)
- Enhanced precipitation data parsing and formatting
- Improved station data formatting with scenario-based output
- Updated adapter to use direct task formatting (no LLM dependency)

🔧 Architecture Enhancements:
- Clean separation: LLM summarization adds insights, response generation handles formatting
- Graceful LLM failure handling - workflow continues without insights
- Enhanced response generation to display LLM insights in user-friendly format
- Maintained backward compatibility with existing workflow

✅ Validation:
- Phase 4 working end-to-end with detailed workflow visibility
- Both temperature and precipitation query testing
- Complete test coverage with fast mock tests and integration tests
- Performance analysis and browser management improvements

🗑️ Cleanup:
- Removed unused legacy test files and discovery artifacts
- Cleaned up old task-agnostic summarization service
- Reorganized test structure with proper agent/ subdirectory

Files changed (22) hide show

agent/llm_client.py +79 -0
agent/nodes.py +122 -0
services/text/task_agnostic_summarization.py +0 -633
tests/agent/test_llm_summarization_node.py +308 -0
tests/agent/test_llm_sumnode_integration.py +339 -0
tests/debug_node.py +0 -0
tests/debug_state.py +0 -0
tests/omirl/performance_analysis.py +86 -0
tests/{test_adapter_integration.py → omirl/test_adapter_integration.py} +81 -7
tests/omirl/test_adapter_with_precipitation.py +0 -178
tests/omirl/test_fast.py +252 -0
tests/omirl/test_massimi_precipitazione.py +301 -53
tests/omirl/test_validation.py +390 -0
tests/omirl/test_valori_stazioni.py +296 -0
tests/test_llm_summarization_node.py +0 -0
tests/test_omirl_implementation.py +0 -1
tests/test_phase4_workflow.py +0 -0
tests/test_valori_stazioni.py +0 -155
tools/omirl/adapter.py +8 -11
tools/omirl/tables/__init__.py +2 -3
tools/omirl/tables/massimi_precipitazione.py +129 -72
tools/omirl/tables/valori_stazioni.py +103 -47

agent/llm_client.py CHANGED Viewed

@@ -365,6 +365,85 @@ class LLMClient:
         except Exception as e:
             raise ValueError(f"Failed to parse LLM response: {e}")
     def _create_fallback_proposal(self, user_query: str, error: str) -> ToolProposal:
         """
         Create fallback proposal when LLM routing fails

         except Exception as e:
             raise ValueError(f"Failed to parse LLM response: {e}")
+    async def generate_insights(self, data_prompt: str) -> str:
+        """
+        Generate intelligent insights from OMIRL data using LLM
+        This method takes formatted data from task-specific tools and generates
+        higher-level insights, trends analysis, and operational recommendations.
+        Args:
+            data_prompt: Formatted prompt with OMIRL data to analyze
+        Returns:
+            String with LLM-generated insights and recommendations
+        """
+        try:
+            if self.client == "mock_client":
+                # Return mock insights for testing
+                return ("• **Temperatura**: Valori nella norma per la stagione\n"
+                       "• **Precipitazioni**: Leggera attività nelle zone montane\n"
+                       "• **Raccomandazione**: Monitoraggio ordinario, nessuna criticità rilevata")
+            if self.provider == "gemini":
+                # Use Gemini for insight generation
+                response = await self.client.generate_content_async(
+                    data_prompt,
+                    generation_config=genai.types.GenerationConfig(
+                        temperature=self.temperature,
+                        max_output_tokens=self.max_tokens,
+                        candidate_count=1
+                    )
+                )
+                if response and response.text:
+                    return response.text.strip()
+                else:
+                    raise ValueError("Empty response from Gemini")
+            elif self.provider == "openai":
+                # Use OpenAI for insight generation
+                response = await self.client.chat.completions.create(
+                    model=self.model,
+                    messages=[
+                        {
+                            "role": "system",
+                            "content": "Sei un analista meteorologico esperto che genera insights operativi dai dati OMIRL."
+                        },
+                        {"role": "user", "content": data_prompt}
+                    ],
+                    temperature=self.temperature,
+                    max_tokens=self.max_tokens,
+                    timeout=self.timeout
+                )
+                if response.choices and response.choices[0].message.content:
+                    return response.choices[0].message.content.strip()
+                else:
+                    raise ValueError("Empty response from OpenAI")
+            else:
+                raise ValueError(f"Insight generation not implemented for provider: {self.provider}")
+        except Exception as e:
+            logging.error(f"LLM insight generation failed: {e}")
+            # Try fallback provider if available
+            if hasattr(self, 'fallback_provider') and self.fallback_provider != self.provider:
+                try:
+                    # Quick fallback attempt with simpler prompt
+                    fallback_client = LLMClient(
+                        provider=self.fallback_provider,
+                        model=self.fallback_model,
+                        temperature=self.temperature,
+                        max_tokens=300  # Shorter fallback
+                    )
+                    return await fallback_client.generate_insights(data_prompt)
+                except Exception as fallback_error:
+                    logging.error(f"Fallback insight generation failed: {fallback_error}")
+            # Return empty string on failure - don't break the workflow
+            return ""
     def _create_fallback_proposal(self, user_query: str, error: str) -> ToolProposal:
         """
         Create fallback proposal when LLM routing fails

agent/nodes.py CHANGED Viewed

@@ -31,6 +31,7 @@ from datetime import datetime
 from .state import AgentState, ToolCall, ToolResult, update_processing_status, add_tool_result, add_error
 from .registry import get_tool_registry, get_tool_by_name, validate_tool_parameters
 from .llm_router_node import llm_router_node
 async def llm_routing_node(state: AgentState) -> AgentState:
@@ -192,6 +193,121 @@ async def tool_execution_node(state: AgentState) -> AgentState:
     return state
 async def response_generation_node(state: AgentState) -> AgentState:
     """
     Generate final response based on tool results and LLM router status
@@ -231,6 +347,12 @@ async def response_generation_node(state: AgentState) -> AgentState:
         for result in successful_results:
             response_parts.append(result.summary_text)
             # Add artifact information
             if result.artifacts:
                 response_parts.append(f"\n📄 **File generati:** {len(result.artifacts)}")

 from .state import AgentState, ToolCall, ToolResult, update_processing_status, add_tool_result, add_error
 from .registry import get_tool_registry, get_tool_by_name, validate_tool_parameters
 from .llm_router_node import llm_router_node
+from .llm_client import LLMClient
 async def llm_routing_node(state: AgentState) -> AgentState:
     return state
+async def llm_summarization_node(state: AgentState) -> AgentState:
+    """
+    Generate intelligent insights from tool results using LLM
+    This node takes the raw task-specific formatted data and generates
+    higher-level insights, trends, and cross-task analysis using an LLM.
+    This is Phase 4 of the architecture: LLM-based intelligent summarization.
+    Args:
+        state: Current agent state with tool results
+    Returns:
+        Updated state with LLM-generated insights added to metadata
+    """
+    print(f"🧠 Generating LLM-based insights...")
+    state = update_processing_status(state, "llm_summarization", "Analyzing data with LLM")
+    tool_results = state["tool_results"]
+    # Only process successful results that have substantive data
+    successful_results = [r for r in tool_results if r.success and r.summary_text]
+    if not successful_results:
+        print(f"ℹ️  No successful results to analyze")
+        return state
+    try:
+        # Initialize LLM client for summarization
+        llm_client = LLMClient(
+            provider="gemini",
+            temperature=0.3,  # Slightly higher for more creative insights
+            max_tokens=800,   # Allow for richer analysis
+            timeout=15
+        )
+        # Build summarization prompt
+        prompt_parts = [
+            "Analizza i seguenti dati meteorologici OMIRL e genera insights intelligenti.",
+            "Concentrati su: tendenze, valori anomali, confronti geografici, raccomandazioni operative.",
+            "Rispondi in italiano con bullet points chiari e concisi.\n",
+            "DATI DA ANALIZZARE:"
+        ]
+        # Add each tool result's data
+        for i, result in enumerate(successful_results, 1):
+            prompt_parts.append(f"\n{i}. {result.tool_name.upper()}:")
+            prompt_parts.append(f"   {result.summary_text}")
+            # Add key metadata for context
+            if result.metadata:
+                relevant_metadata = {
+                    k: v for k, v in result.metadata.items()
+                    if k in ['sensor_type', 'filters_applied', 'total_after_filtering', 'zona_allerta_records', 'province_records']
+                }
+                if relevant_metadata:
+                    prompt_parts.append(f"   Dettagli: {relevant_metadata}")
+        prompt_parts.append("\nGENERA INSIGHTS OPERATIVI:")
+        full_prompt = "\n".join(prompt_parts)
+        # Get LLM insights (with fallback)
+        try:
+            insights = await llm_client.generate_insights(full_prompt)
+            if insights and len(insights.strip()) > 20:  # Valid response
+                # Add insights to the first successful result's metadata
+                if successful_results:
+                    # Find existing metadata or create new
+                    original_result = successful_results[0]
+                    enhanced_metadata = original_result.metadata.copy()
+                    enhanced_metadata["llm_insights"] = insights
+                    enhanced_metadata["insights_generated_at"] = datetime.now().isoformat()
+                    # Create new enhanced result
+                    enhanced_result = ToolResult(
+                        tool_name=original_result.tool_name,
+                        success=original_result.success,
+                        summary_text=original_result.summary_text,
+                        artifacts=original_result.artifacts,
+                        sources=original_result.sources,
+                        metadata=enhanced_metadata,
+                        warnings=original_result.warnings
+                    )
+                    # Update the state with enhanced result using state functions
+                    # Remove the original result first
+                    new_results = [r for r in state["tool_results"] if r != original_result]
+                    # Add the enhanced result
+                    new_results.insert(0, enhanced_result)
+                    # Update state
+                    updated_state = dict(state)
+                    updated_state["tool_results"] = new_results
+                    state = updated_state
+                print(f"✅ LLM insights generated ({len(insights)} chars)")
+            else:
+                print(f"⚠️  LLM generated empty insights, skipping")
+        except Exception as llm_error:
+            print(f"⚠️  LLM summarization failed: {llm_error}")
+            # Don't fail the whole workflow - just skip insights
+    except Exception as e:
+        print(f"⚠️  Summarization node error: {e}")
+        # Don't break the workflow - summarization is optional enhancement
+    print(f"✅ LLM summarization complete")
+    return state
 async def response_generation_node(state: AgentState) -> AgentState:
     """
     Generate final response based on tool results and LLM router status
         for result in successful_results:
             response_parts.append(result.summary_text)
+            # Add LLM insights if available (Phase 4 enhancement)
+            llm_insights = result.metadata.get("llm_insights")
+            if llm_insights and len(llm_insights.strip()) > 20:
+                response_parts.append(f"\n🧠 **Analisi Intelligente:**")
+                response_parts.append(llm_insights)
             # Add artifact information
             if result.artifacts:
                 response_parts.append(f"\n📄 **File generati:** {len(result.artifacts)}")

services/text/task_agnostic_summarization.py DELETED Viewed

@@ -1,633 +0,0 @@
-# services/text/task_agnostic_summarization.py
-"""
-Task-Agnostic Multi-Task Summarization Service
-This module provides intelligent summarization that works across all OMIRL tasks
-using standardized data formats. It analyzes multiple task results together and
-generates comprehensive summaries with trend analysis.
-Key Features:
-- Task-agnostic: Works with any OMIRL task (valori_stazioni, massimi_precipitazione, etc.)
-- Multi-task: Combines results from multiple tasks in a single summary
-- Efficient: One LLM call for all tasks combined
-- Trend-focused: Emphasizes temporal patterns and geographical insights
-- Lightweight: Uses structured data format that works with smaller LLMs
-Architecture:
-1. Each task provides standardized TaskSummary format
-2. MultiTaskSummarizer collects all TaskSummary objects
-3. Single LLM call generates comprehensive operational summary
-Usage:
-    # From individual tasks
-    task_summary = TaskSummary(
-        task_type="massimi_precipitazione",
-        geographic_scope="Provincia Genova",
-        temporal_scope="All periods (5'-24h)",
-        data_insights=DataInsights(...)
-    )
-    # Multi-task summarization
-    summarizer = MultiTaskSummarizer()
-    summarizer.add_task_result(task_summary)
-    final_summary = await summarizer.generate_final_summary()
-"""
-import asyncio
-from typing import Dict, Any, List, Optional, Union
-import logging
-from datetime import datetime
-from dataclasses import dataclass, asdict
-import json
-import google.generativeai as genai
-from agent.config.env_config import get_api_key
-# Configure logging
-logger = logging.getLogger(__name__)
-@dataclass
-class DataInsights:
-    """Standardized data insights that work across all task types"""
-    total_records: int
-    records_with_data: int
-    # Numeric analysis (for any numeric data)
-    min_value: Optional[float] = None
-    max_value: Optional[float] = None
-    avg_value: Optional[float] = None
-    unit: Optional[str] = None
-    # Trend analysis (for temporal data)
-    trend_direction: Optional[str] = None  # "increasing", "decreasing", "stable", "peaked"
-    trend_confidence: Optional[str] = None  # "high", "medium", "low"
-    peak_period: Optional[str] = None  # "1h", "24h", etc.
-    # Geographic distribution
-    geographic_pattern: Optional[str] = None  # "concentrated", "distributed", "coastal", "inland"
-    notable_locations: List[Dict[str, Any]] = None
-    # Data quality
-    coverage_quality: str = "complete"  # "complete", "partial", "sparse"
-    def __post_init__(self):
-        if self.notable_locations is None:
-            self.notable_locations = []
-@dataclass
-class TaskSummary:
-    """Standardized summary format for any OMIRL task"""
-    task_type: str  # "valori_stazioni", "massimi_precipitazione", etc.
-    geographic_scope: str  # "Provincia Genova", "Zona A", "Liguria", etc.
-    temporal_scope: str  # "Current values", "All periods (5'-24h)", "Period 1h", etc.
-    data_insights: DataInsights
-    filters_applied: Dict[str, Any] = None
-    extraction_timestamp: str = None
-    def __post_init__(self):
-        if self.filters_applied is None:
-            self.filters_applied = {}
-        if self.extraction_timestamp is None:
-            self.extraction_timestamp = datetime.now().isoformat()
-class MultiTaskSummarizer:
-    """
-    Multi-task summarization coordinator
-    Collects results from multiple OMIRL tasks and generates
-    a single comprehensive operational summary.
-    """
-    def __init__(self):
-        """Initialize the multi-task summarizer"""
-        self.task_results: List[TaskSummary] = []
-        self.api_key = get_api_key('GEMINI_API_KEY')
-        if self.api_key:
-            genai.configure(api_key=self.api_key)
-            self.model = genai.GenerativeModel('gemini-1.5-flash')
-            logger.info("✅ Multi-task summarizer initialized with Gemini API")
-        else:
-            self.model = None
-            logger.warning("⚠️ No Gemini API key found - will use structured fallback summaries")
-    def add_task_result(self, task_summary: TaskSummary) -> None:
-        """Add a task result to be included in final summary"""
-        self.task_results.append(task_summary)
-        logger.info(f"📋 Added {task_summary.task_type} result to multi-task summary queue")
-    def clear_results(self) -> None:
-        """Clear all collected task results"""
-        self.task_results.clear()
-        logger.info("🗑️ Cleared multi-task summary queue")
-    async def generate_final_summary(self, query_context: str = "") -> str:
-        """
-        Generate comprehensive summary from all collected task results
-        Args:
-            query_context: Original user query for context
-        Returns:
-            Comprehensive operational summary in Italian
-        """
-        if not self.task_results:
-            return "📋 Nessun dato OMIRL estratto"
-        try:
-            # Generate summary based on available API
-            if self.model and self.api_key:
-                return await self._generate_llm_multi_task_summary(query_context)
-            else:
-                return self._generate_structured_fallback_summary()
-        except Exception as e:
-            logger.error(f"❌ Error in multi-task summarization: {e}")
-            return self._generate_basic_fallback_summary()
-    async def _generate_llm_multi_task_summary(self, query_context: str) -> str:
-        """Generate intelligent multi-task summary using Gemini API"""
-        # Convert task results to LLM-friendly format
-        summary_data = {
-            "query_context": query_context,
-            "num_tasks": len(self.task_results),
-            "tasks": []
-        }
-        for task in self.task_results:
-            task_data = {
-                "type": task.task_type,
-                "geographic_scope": task.geographic_scope,
-                "temporal_scope": task.temporal_scope,
-                "data": asdict(task.data_insights),
-                "filters": task.filters_applied
-            }
-            summary_data["tasks"].append(task_data)
-        # Build LLM prompt
-        prompt = self._build_multi_task_prompt(summary_data)
-        try:
-            response = self.model.generate_content(prompt)
-            summary = response.text.strip()
-            logger.info(f"✅ Generated multi-task LLM summary ({len(summary)} chars) for {len(self.task_results)} tasks")
-            return summary
-        except Exception as e:
-            logger.error(f"❌ LLM multi-task summarization failed: {e}")
-            return self._generate_structured_fallback_summary()
-    def _build_multi_task_prompt(self, summary_data: Dict[str, Any]) -> str:
-        """Build LLM prompt for multi-task summarization"""
-        prompt = f"""
-Sei un esperto meteorologo che analizza dati OMIRL della Liguria. Hai estratto dati da {summary_data['num_tasks']} operazioni diverse.
-CONTESTO RICHIESTA: "{summary_data['query_context']}"
-DATI ESTRATTI:
-{json.dumps(summary_data, indent=2, ensure_ascii=False)}
-COMPITO:
-Genera un riassunto operativo completo in italiano (max 6 righe) che:
-1. **Riassuma i dati principali** di tutti i task con emoji appropriate
-2. **Identifichi trend temporali** se presenti (es. "trend crescente nelle ultime 24h")
-3. **Evidenzi pattern geografici** se rilevanti (es. "valori più alti nell'entroterra")
-4. **Fornisca insight operativi** utili per decisioni meteorologiche
-5. **Colleghi informazioni** tra diversi task se pertinenti
-FORMATO:
-- Linguaggio naturale e professionale
-- Valori numerici precisi con unità di misura
-- Massimo 6 righe
-- Una riga per task principale + righe per trend/pattern
-ESEMPIO MULTI-TASK:
-🌡️ **Temperatura Liguria**: 15-28°C in 184 stazioni, media 22.1°C con trend stabile.
-🌧️ **Precipitazioni massime**: 0.2-6.2mm, picco 24h a Statale (6.2mm), trend crescente.
-📊 **Pattern regionale**: temperature più alte entroterra, precipitazioni concentrate costa orientale.
-RISPOSTA (solo il riassunto, senza introduzioni):"""
-        return prompt
-    def _generate_structured_fallback_summary(self) -> str:
-        """Generate structured summary without LLM"""
-        lines = []
-        # Group tasks by type for better organization
-        task_groups = {}
-        for task in self.task_results:
-            if task.task_type not in task_groups:
-                task_groups[task.task_type] = []
-            task_groups[task.task_type].append(task)
-        # Generate summary for each task type
-        for task_type, tasks in task_groups.items():
-            emoji = self._get_task_emoji(task_type)
-            if task_type == "valori_stazioni":
-                summary_line = self._summarize_valori_stazioni(tasks, emoji)
-            elif task_type == "massimi_precipitazione":
-                summary_line = self._summarize_massimi_precipitazione(tasks, emoji)
-            else:
-                summary_line = self._summarize_generic_task(tasks, emoji, task_type)
-            if summary_line:
-                lines.append(summary_line)
-        # Add cross-task insights if multiple tasks
-        if len(task_groups) > 1:
-            cross_insights = self._generate_cross_task_insights()
-            if cross_insights:
-                lines.append(cross_insights)
-        return "\n".join(lines) if lines else "📋 Dati OMIRL estratti senza pattern significativi"
-    def _summarize_valori_stazioni(self, tasks: List[TaskSummary], emoji: str) -> str:
-        """Summarize valori_stazioni tasks"""
-        total_records = sum(task.data_insights.total_records for task in tasks)
-        total_with_data = sum(task.data_insights.records_with_data for task in tasks)
-        # Combine geographic scopes
-        scopes = [task.geographic_scope for task in tasks]
-        geographic_summary = ", ".join(set(scopes))
-        # Get value ranges if available
-        values_summary = ""
-        all_mins = [task.data_insights.min_value for task in tasks if task.data_insights.min_value is not None]
-        all_maxs = [task.data_insights.max_value for task in tasks if task.data_insights.max_value is not None]
-        units = [task.data_insights.unit for task in tasks if task.data_insights.unit]
-        if all_mins and all_maxs and units:
-            min_val = min(all_mins)
-            max_val = max(all_maxs)
-            unit = units[0]
-            values_summary = f": {min_val}{unit}-{max_val}{unit}"
-        return f"{emoji} **Stazioni meteo**{values_summary} in {total_with_data}/{total_records} stazioni ({geographic_summary})"
-    def _summarize_massimi_precipitazione(self, tasks: List[TaskSummary], emoji: str) -> str:
-        """Summarize massimi_precipitazione tasks with trend analysis"""
-        total_records = sum(task.data_insights.total_records for task in tasks)
-        # Analyze temporal scope for trend insights
-        temporal_scopes = [task.temporal_scope for task in tasks]
-        has_full_temporal = any("All periods" in scope for scope in temporal_scopes)
-        # Get value ranges
-        all_mins = [task.data_insights.min_value for task in tasks if task.data_insights.min_value is not None]
-        all_maxs = [task.data_insights.max_value for task in tasks if task.data_insights.max_value is not None]
-        if all_mins and all_maxs:
-            min_val = min(all_mins)
-            max_val = max(all_maxs)
-            # Trend analysis for full temporal data
-            trend_text = ""
-            if has_full_temporal:
-                # Look for trend indicators
-                trend_tasks = [task for task in tasks if "All periods" in task.temporal_scope]
-                if trend_tasks and trend_tasks[0].data_insights.trend_direction:
-                    trend = trend_tasks[0].data_insights.trend_direction
-                    peak = trend_tasks[0].data_insights.peak_period
-                    if peak:
-                        trend_text = f", picco {peak}"
-                    elif trend != "stable":
-                        trend_text = f", trend {trend}"
-            return f"{emoji} **Precipitazioni massime**: {min_val}-{max_val}mm in {total_records} aree{trend_text}"
-        return f"{emoji} **Precipitazioni massime**: {total_records} aree analizzate"
-    def _summarize_generic_task(self, tasks: List[TaskSummary], emoji: str, task_type: str) -> str:
-        """Summarize any other task type"""
-        total_records = sum(task.data_insights.total_records for task in tasks)
-        return f"{emoji} **{task_type.replace('_', ' ').title()}**: {total_records} record estratti"
-    def _generate_cross_task_insights(self) -> str:
-        """Generate insights that span multiple tasks"""
-        # Look for geographical patterns across tasks
-        geographic_scopes = [task.geographic_scope for task in self.task_results]
-        unique_scopes = set(geographic_scopes)
-        if len(unique_scopes) > 1:
-            return f"📊 **Copertura geografica**: {', '.join(unique_scopes)}"
-        return ""
-    def _generate_basic_fallback_summary(self) -> str:
-        """Generate very basic summary when all else fails"""
-        task_counts = {}
-        for task in self.task_results:
-            task_counts[task.task_type] = task_counts.get(task.task_type, 0) + 1
-        parts = []
-        for task_type, count in task_counts.items():
-            emoji = self._get_task_emoji(task_type)
-            parts.append(f"{emoji} {task_type}: {count} operazioni")
-        return "📋 " + ", ".join(parts)
-    def _get_task_emoji(self, task_type: str) -> str:
-        """Get appropriate emoji for task type"""
-        emoji_map = {
-            'valori_stazioni': '🌡️',
-            'massimi_precipitazione': '🌧️',
-            'livelli_idrometrici': '🌊',
-            'stazioni': '📍',
-            'mappe': '🗺️',
-            'radar': '📡',
-            'satellite': '🛰️'
-        }
-        return emoji_map.get(task_type, '📊')
-# Convenience functions for task result creation
-def create_valori_stazioni_summary(
-    geographic_scope: str,
-    data_insights: DataInsights,
-    filters_applied: Dict[str, Any] = None
-) -> TaskSummary:
-    """Create standardized summary for valori_stazioni task"""
-    return TaskSummary(
-        task_type="valori_stazioni",
-        geographic_scope=geographic_scope,
-        temporal_scope="Current values",
-        data_insights=data_insights,
-        filters_applied=filters_applied or {}
-    )
-def create_massimi_precipitazione_summary(
-    geographic_scope: str,
-    temporal_scope: str,
-    data_insights: DataInsights,
-    filters_applied: Dict[str, Any] = None
-) -> TaskSummary:
-    """Create standardized summary for massimi_precipitazione task"""
-    return TaskSummary(
-        task_type="massimi_precipitazione",
-        geographic_scope=geographic_scope,
-        temporal_scope=temporal_scope,
-        data_insights=data_insights,
-        filters_applied=filters_applied or {}
-    )
-def analyze_station_data(station_data: List[Dict[str, Any]], sensor_type: str) -> DataInsights:
-    """
-    Analyze station data for trends and patterns
-    Args:
-        station_data: List of station dictionaries with sensor values
-        sensor_type: Type of sensor (Temperatura, Precipitazione, etc.)
-    Returns:
-        DataInsights with station analysis
-    """
-    if not station_data:
-        return DataInsights(
-            total_records=0,
-            records_with_data=0,
-            coverage_quality="no_data"
-        )
-    # Extract current values from stations
-    values = []
-    stations_with_values = []
-    notable_stations = []
-    for station in station_data:
-        try:
-            # Extract current value ("ultimo" field)
-            current_value = station.get("ultimo")
-            if current_value is not None:
-                value = float(current_value)
-                values.append(value)
-                station_info = {
-                    "name": station.get("Nome", "Unknown"),
-                    "code": station.get("Codice", ""),
-                    "comune": station.get("Comune", ""),
-                    "provincia": station.get("Provincia", ""),
-                    "value": value,
-                    "max": float(station.get("Max", value)) if station.get("Max") else value,
-                    "min": float(station.get("Min", value)) if station.get("Min") else value
-                }
-                stations_with_values.append(station_info)
-                # Notable stations (extreme values)
-                if sensor_type.lower() == "temperatura":
-                    if value > 25.0 or value < 5.0:  # Hot or cold thresholds
-                        notable_stations.append(station_info)
-                elif sensor_type.lower() == "precipitazione":
-                    if value > 1.0:  # Any significant precipitation
-                        notable_stations.append(station_info)
-                elif sensor_type.lower() == "vento":
-                    if value > 10.0:  # Strong wind threshold
-                        notable_stations.append(station_info)
-        except (ValueError, TypeError):
-            # Skip stations with invalid data
-            continue
-    if not values:
-        return DataInsights(
-            total_records=len(station_data),
-            records_with_data=0,
-            coverage_quality="sparse"
-        )
-    # Calculate statistics
-    min_value = min(values)
-    max_value = max(values)
-    avg_value = sum(values) / len(values)
-    value_range = max_value - min_value
-    # Determine trend direction based on spatial distribution
-    trend_direction = "stable"  # Stations don't have temporal trends like precipitation
-    confidence_level = "high" if len(values) > 10 else "medium"
-    # Determine coverage quality
-    coverage_ratio = len(values) / len(station_data)
-    if coverage_ratio > 0.8:
-        coverage_quality = "good"
-    elif coverage_ratio > 0.5:
-        coverage_quality = "partial"
-    else:
-        coverage_quality = "sparse"
-    return DataInsights(
-        total_records=len(station_data),
-        records_with_data=len(values),
-        min_value=min_value,
-        max_value=max_value,
-        avg_value=avg_value,
-        unit=_get_sensor_unit(sensor_type),
-        coverage_quality=coverage_quality,
-        trend_direction=trend_direction,
-        trend_confidence=confidence_level,
-        notable_locations=[{
-            "name": s["name"],
-            "value": s["value"],
-            "location": f"{s['comune']}, {s['provincia']}" if s['comune'] else s['provincia']
-        } for s in notable_stations],
-        geographic_pattern="distributed"  # Default for station data
-    )
-def _get_sensor_unit(sensor_type: str) -> str:
-    """Get unit for sensor type"""
-    unit_map = {
-        "temperatura": "°C",
-        "precipitazione": "mm",
-        "vento": "m/s",
-        "umidità": "%",
-        "pressione": "hPa"
-    }
-    for key, unit in unit_map.items():
-        if key.lower() in sensor_type.lower():
-            return unit
-    return ""
-def analyze_precipitation_trends(precipitation_data: Dict[str, Any]) -> DataInsights:
-    """
-    Analyze precipitation data for trends and patterns
-    Args:
-        precipitation_data: Raw precipitation data with time periods
-    Returns:
-        DataInsights with trend analysis
-    """
-    # Time periods in order
-    time_periods = ["5'", "15'", "30'", "1h", "3h", "6h", "12h", "24h"]
-    # Extract values for trend analysis
-    values_by_period = {}
-    notable_locations = []
-    # Analyze both zona_allerta and province data
-    for table_type in ["zona_allerta", "province"]:
-        for record in precipitation_data.get(table_type, []):
-            area_name = record.get("Max (mm)", "")
-            # Extract values for each time period
-            period_values = []
-            for period in time_periods:
-                if period in record and record[period]:
-                    # Parse value from format "0.2 [05:55] Station"
-                    try:
-                        value_str = record[period].split()[0]
-                        value = float(value_str)
-                        period_values.append(value)
-                        # Track notable high values
-                        if value > 1.0:  # Notable threshold
-                            notable_locations.append({
-                                "location": area_name,
-                                "value": value,
-                                "period": period,
-                                "details": record[period]
-                            })
-                    except (ValueError, IndexError):
-                        period_values.append(0.0)
-                else:
-                    period_values.append(0.0)
-            if period_values:
-                values_by_period[area_name] = period_values
-    # Analyze trends
-    all_values = []
-    for values in values_by_period.values():
-        all_values.extend([v for v in values if v > 0])
-    if not all_values:
-        return DataInsights(
-            total_records=len(values_by_period),
-            records_with_data=0,
-            coverage_quality="sparse"
-        )
-    # Calculate trend direction
-    trend_direction = "stable"
-    trend_confidence = "low"
-    peak_period = None
-    # Analyze temporal patterns
-    for area_name, values in values_by_period.items():
-        if len(values) >= 4:  # Need enough data points
-            # Correct trend analysis: compare recent vs older periods
-            # values[0] = 5' ago (most recent), values[-1] = 24h ago (oldest)
-            recent_periods = values[:len(values)//2]  # 5', 15', 30', 1h
-            older_periods = values[len(values)//2:]   # 3h, 6h, 12h, 24h
-            recent_avg = sum(recent_periods) / len(recent_periods) if recent_periods else 0
-            older_avg = sum(older_periods) / len(older_periods) if older_periods else 0
-            # If recent values are higher than older ones, trend is increasing
-            # If older values are higher than recent ones, trend is decreasing
-            if recent_avg > older_avg * 1.5:
-                trend_direction = "increasing"
-                trend_confidence = "medium"
-            elif older_avg > recent_avg * 1.5:
-                trend_direction = "decreasing"
-                trend_confidence = "medium"
-            # Find peak period
-            max_value = max(values)
-            if max_value > 0:
-                max_index = values.index(max_value)
-                peak_period = time_periods[max_index]
-                break
-    return DataInsights(
-        total_records=len(values_by_period),
-        records_with_data=len([v for v in values_by_period.values() if any(val > 0 for val in v)]),
-        min_value=min(all_values) if all_values else None,
-        max_value=max(all_values) if all_values else None,
-        avg_value=sum(all_values) / len(all_values) if all_values else None,
-        unit="mm",
-        trend_direction=trend_direction,
-        trend_confidence=trend_confidence,
-        peak_period=peak_period,
-        notable_locations=notable_locations[:5],  # Limit to top 5
-        coverage_quality="complete" if len(all_values) > 10 else "partial"
-    )
-# Global instance for easy access
-_multi_task_summarizer = None
-def get_multi_task_summarizer() -> MultiTaskSummarizer:
-    """Get global multi-task summarizer instance"""
-    global _multi_task_summarizer
-    if _multi_task_summarizer is None:
-        _multi_task_summarizer = MultiTaskSummarizer()
-    return _multi_task_summarizer

tests/agent/test_llm_summarization_node.py ADDED Viewed

	@@ -0,0 +1,308 @@

+#!/usr/bin/env python3
+"""
+Test for LLM Summarization Node (Phase 4)
+Tests the new LLM-based summarization functionality that generates
+intelligent insights from task-specific formatted data.
+Purpose:
+- Validate LLM summarization node functionality
+- Test integration with existing tool results
+- Verify graceful handling of LLM failures
+- Ensure backward compatibility with existing workflow
+Created: September 7, 2025
+Branch: omirl_refactor
+Phase: 4 - Higher-level LLM summarization
+"""
+import asyncio
+import sys
+from pathlib import Path
+from unittest.mock import patch, AsyncMock
+# Add project root to path
+sys.path.insert(0, str(Path(__file__).parent.parent.parent))
+from agent.nodes import llm_summarization_node
+from agent.state import AgentState, ToolResult
+def create_test_state_with_tool_results():
+    """Create a test state with sample tool results"""
+    # Sample OMIRL tool result
+    omirl_result = ToolResult(
+        tool_name="omirl_tool",
+        success=True,
+        summary_text="🌡️ **Dati Temperatura Liguria**\n• 184 stazioni attive\n• Temperatura media: 21.5°C\n• Range: 16.8°C - 28.7°C",
+        artifacts=["stazioni_temperatura_20250907.json"],
+        sources=["https://omirl.regione.liguria.it/#/sensorstable"],
+        metadata={
+            "sensor_type": "Temperatura",
+            "total_after_filtering": 184,
+            "filters_applied": {"tipo_sensore": "Temperatura"},
+            "subtask": "valori_stazioni"
+        },
+        warnings=[]
+    )
+    state = AgentState(
+        user_message="Mostra temperature in Liguria",
+        routing_result={},
+        conversation_history=[],
+        tool_results=[omirl_result],
+        planned_tools=[],
+        errors=[],
+        processing_status="executing_tools",
+        agent_response="",
+        current_operation=None,
+        omirl_data=None,
+        metadata={}
+    )
+    return state
+def create_test_state_with_multiple_results():
+    """Create test state with multiple tool results for cross-analysis"""
+    temp_result = ToolResult(
+        tool_name="omirl_tool",
+        success=True,
+        summary_text="🌡️ Temperatura: 184 stazioni, media 21.5°C",
+        metadata={"sensor_type": "Temperatura", "total_after_filtering": 184},
+        artifacts=[], sources=[], warnings=[]
+    )
+    precip_result = ToolResult(
+        tool_name="omirl_tool",
+        success=True,
+        summary_text="🌧️ Precipitazioni: Zona A: 0.2mm, Genova: 0.4mm",
+        metadata={"subtask": "massimi_precipitazione", "province_records": 1},
+        artifacts=[], sources=[], warnings=[]
+    )
+    state = AgentState(
+        user_message="Analizza meteo completo Liguria",
+        routing_result={},
+        conversation_history=[],
+        tool_results=[temp_result, precip_result],
+        planned_tools=[],
+        errors=[],
+        processing_status="executing_tools",
+        agent_response="",
+        current_operation=None,
+        omirl_data=None,
+        metadata={}
+    )
+    return state
+async def test_summarization_node_basic():
+    """Test basic LLM summarization functionality"""
+    print("🧪 Testing basic LLM summarization...")
+    state = create_test_state_with_tool_results()
+    # Test with mock LLM client to avoid API calls
+    with patch('agent.nodes.LLMClient') as mock_llm_class:
+        mock_client = AsyncMock()
+        mock_client.generate_insights.return_value = (
+            "• **Temperatura**: Valori nella norma stagionale\n"
+            "• **Distribuzione**: Buona copertura territoriale con 184 stazioni\n"
+            "• **Trend**: Temperature stabili, nessuna anomalia rilevata\n"
+            "• **Raccomandazione**: Monitoraggio di routine sufficiente"
+        )
+        mock_llm_class.return_value = mock_client
+        # Execute summarization node
+        result_state = await llm_summarization_node(state)
+        # Verify insights were added
+        assert len(result_state["tool_results"]) == 1
+        enhanced_result = result_state["tool_results"][0]
+        assert "llm_insights" in enhanced_result.metadata
+        assert "Temperatura" in enhanced_result.metadata["llm_insights"]
+        assert "insights_generated_at" in enhanced_result.metadata
+        print("✅ Basic summarization test passed")
+        return True
+async def test_summarization_node_multiple_results():
+    """Test LLM summarization with multiple tool results"""
+    print("🧪 Testing multi-result summarization...")
+    state = create_test_state_with_multiple_results()
+    with patch('agent.nodes.LLMClient') as mock_llm_class:
+        mock_client = AsyncMock()
+        mock_client.generate_insights.return_value = (
+            "• **Situazione Generale**: Condizioni meteo stabili in Liguria\n"
+            "• **Temperatura**: 184 stazioni operative, valori nella norma\n"
+            "• **Precipitazioni**: Attività minima, accumuli trascurabili\n"
+            "• **Correlazione**: Tempo stabile confermato da entrambi i parametri\n"
+            "• **Outlook Operativo**: Nessuna criticità, condizioni favorevoli"
+        )
+        mock_llm_class.return_value = mock_client
+        result_state = await llm_summarization_node(state)
+        # Verify multi-source analysis
+        enhanced_result = result_state["tool_results"][0]
+        insights = enhanced_result.metadata["llm_insights"]
+        assert "Temperatura" in insights
+        assert "Precipitazioni" in insights
+        assert "Correlazione" in insights
+        print("✅ Multi-result summarization test passed")
+        return True
+async def test_summarization_node_llm_failure():
+    """Test graceful handling of LLM failures"""
+    print("🧪 Testing LLM failure handling...")
+    state = create_test_state_with_tool_results()
+    with patch('agent.nodes.LLMClient') as mock_llm_class:
+        mock_client = AsyncMock()
+        mock_client.generate_insights.side_effect = Exception("LLM API error")
+        mock_llm_class.return_value = mock_client
+        # Execute summarization node
+        result_state = await llm_summarization_node(state)
+        # Verify workflow continues without insights
+        assert len(result_state["tool_results"]) == 1
+        original_result = result_state["tool_results"][0]
+        # Should not have insights due to LLM failure
+        assert "llm_insights" not in original_result.metadata
+        # But should still have original data
+        assert original_result.success == True
+        assert "Temperatura" in original_result.summary_text
+        print("✅ LLM failure handling test passed")
+        return True
+async def test_summarization_node_no_results():
+    """Test summarization with no successful results"""
+    print("🧪 Testing with no successful results...")
+    # Create state with failed tool result
+    failed_result = ToolResult(
+        tool_name="omirl_tool",
+        success=False,
+        summary_text="⚠️ Error: Could not fetch data",
+        metadata={"error": "network_timeout"},
+        artifacts=[], sources=[], warnings=[]
+    )
+    state = AgentState(
+        user_message="Test failed request",
+        routing_result={},
+        conversation_history=[],
+        tool_results=[failed_result],
+        planned_tools=[],
+        errors=[],
+        processing_status="executing_tools",
+        agent_response="",
+        current_operation=None,
+        omirl_data=None,
+        metadata={}
+    )
+    result_state = await llm_summarization_node(state)
+    # Verify no LLM call was made and state unchanged
+    assert len(result_state["tool_results"]) == 1
+    assert result_state["tool_results"][0].success == False
+    assert "llm_insights" not in result_state["tool_results"][0].metadata
+    print("✅ No results test passed")
+    return True
+async def test_summarization_integration():
+    """Integration test to verify it works with real workflow steps"""
+    print("🧪 Testing summarization integration...")
+    # This test verifies that the node can be inserted in the workflow
+    # without breaking existing functionality
+    state = create_test_state_with_tool_results()
+    # Mock LLM but test the full node integration
+    with patch('agent.nodes.LLMClient') as mock_llm_class:
+        mock_client = AsyncMock()
+        mock_client.generate_insights.return_value = (
+            "• **Status**: Monitoraggio attivo su 184 stazioni\n"
+            "• **Qualità Dati**: Copertura completa del territorio ligure"
+        )
+        mock_llm_class.return_value = mock_client
+        # Test that processing status is properly updated
+        result_state = await llm_summarization_node(state)
+        # Verify state updates
+        assert result_state["processing_status"] == "llm_summarization"  # Should be updated by node
+        assert len(result_state["tool_results"]) == 1
+        # Verify insights were properly integrated
+        enhanced_result = result_state["tool_results"][0]
+        assert enhanced_result.tool_name == "omirl_tool"
+        assert enhanced_result.success == True
+        assert "llm_insights" in enhanced_result.metadata
+        print("✅ Integration test passed")
+        return True
+async def run_all_tests():
+    """Run comprehensive test suite for LLM summarization node"""
+    print("🚀 Starting LLM Summarization Node Tests")
+    print("=" * 50)
+    tests = [
+        ("Basic Functionality", test_summarization_node_basic),
+        ("Multiple Results", test_summarization_node_multiple_results),
+        ("LLM Failure Handling", test_summarization_node_llm_failure),
+        ("No Results Handling", test_summarization_node_no_results),
+        ("Integration Test", test_summarization_integration),
+    ]
+    results = []
+    for test_name, test_func in tests:
+        print(f"\n📋 Running: {test_name}")
+        try:
+            result = await test_func()
+            results.append(result)
+            print(f"   Result: {'✅ PASS' if result else '❌ FAIL'}")
+        except Exception as e:
+            print(f"   ❌ Test failed with exception: {e}")
+            results.append(False)
+    # Summary
+    passed = sum(results)
+    total = len(results)
+    print(f"\n📊 Test Results: {passed}/{total} tests passed")
+    if passed == total:
+        print("✨ All LLM summarization tests passed!")
+        return True
+    else:
+        print(f"⚠️ {total - passed} tests failed")
+        return False
+if __name__ == "__main__":
+    success = asyncio.run(run_all_tests())
+    sys.exit(0 if success else 1)

tests/agent/test_llm_sumnode_integration.py ADDED Viewed

	@@ -0,0 +1,339 @@

+#!/usr/bin/env python3
+"""
+End-to-end test of Phase 4 summarization workflow
+"""
+import sys
+import asyncio
+from pathlib import Path
+from unittest.mock import patch, AsyncMock
+# Add project root to path
+sys.path.insert(0, str(Path(__file__).parent.parent.parent))
+from agent.state import AgentState, ToolResult
+from agent.nodes import llm_summarization_node, response_generation_node
+async def test_full_workflow():
+    """Test complete workflow from tool results through summarization to response"""
+    print("🧪 Testing complete Phase 4 workflow...")
+    # Create realistic OMIRL tool result
+    omirl_result = ToolResult(
+        tool_name="omirl_tool",
+        success=True,
+        summary_text="🌡️ **Dati Temperatura Liguria**\n• 184 stazioni attive\n• Temperatura media: 21.5°C\n• Range: 16.8°C - 28.7°C\n• Province coperte: Genova, Savona, Imperia, La Spezia",
+        artifacts=["stazioni_temperatura_20250907.json"],
+        sources=["https://omirl.regione.liguria.it/#/sensorstable"],
+        metadata={
+            "sensor_type": "Temperatura",
+            "total_after_filtering": 184,
+            "filters_applied": {"tipo_sensore": "Temperatura"},
+            "subtask": "valori_stazioni"
+        },
+        warnings=[]
+    )
+    # Create initial state
+    state = AgentState(
+        user_message="Mostra temperature in Liguria",
+        routing_result={},
+        conversation_history=[],
+        tool_results=[omirl_result],
+        planned_tools=[],
+        errors=[],
+        processing_status="executing_tools",
+        agent_response="",
+        current_operation=None,
+        omirl_data=None,
+        metadata={}
+    )
+    print(f"   Initial tool results: {len(state['tool_results'])}")
+    # Display Phase 1: Original task output
+    print("\n" + "="*60)
+    print("📋 PHASE 1: TASK-SPECIFIC OUTPUT")
+    print("="*60)
+    original_result = state["tool_results"][0]
+    print(f"🔧 Tool: {original_result.tool_name}")
+    print(f"📊 Success: {original_result.success}")
+    print(f"🎯 Filters Applied: {original_result.metadata.get('filters_applied', 'None')}")
+    print(f"📈 Total Records: {original_result.metadata.get('total_after_filtering', 'Unknown')}")
+    print(f"🏷️  Subtask: {original_result.metadata.get('subtask', 'Unknown')}")
+    print(f"\n📄 Task Output Summary:")
+    print("-" * 40)
+    print(original_result.summary_text)
+    if original_result.artifacts:
+        print(f"\n📁 Artifacts: {original_result.artifacts}")
+    if original_result.sources:
+        print(f"🔗 Sources: {original_result.sources}")
+    # Step 1: Run LLM summarization
+    print("\n" + "="*60)
+    print("🧠 PHASE 2: LLM SUMMARIZATION")
+    print("="*60)
+    with patch('agent.nodes.LLMClient') as mock_llm_class:
+        mock_client = AsyncMock()
+        llm_insights = (
+            "• **Copertura Territoriale**: Eccellente con 184 stazioni operative\n"
+            "• **Temperature Attuali**: Valori stagionali nella norma (21.5°C media)\n"
+            "• **Distribuzione Geografica**: Buona rappresentanza di tutte le province liguri\n"
+            "• **Qualità Monitoraggio**: Sistema di rilevamento pienamente operativo\n"
+            "• **Raccomandazioni**: Condizioni stabili, monitoraggio di routine sufficiente"
+        )
+        mock_client.generate_insights.return_value = llm_insights
+        mock_llm_class.return_value = mock_client
+        print("🤖 LLM Client: Initialized (mocked)")
+        print("💭 Generating insights from task data...")
+        # Execute summarization
+        summarized_state = await llm_summarization_node(state)
+        print(f"✅ LLM processing complete")
+        print(f"📊 Results after summarization: {len(summarized_state['tool_results'])}")
+        # Verify insights were added
+        enhanced_result = summarized_state["tool_results"][0]
+        assert "llm_insights" in enhanced_result.metadata
+        print(f"\n🧠 LLM Generated Insights:")
+        print("-" * 40)
+        print(enhanced_result.metadata['llm_insights'])
+        print(f"\n⏰ Insights timestamp: {enhanced_result.metadata.get('insights_generated_at', 'Unknown')}")
+    # Step 2: Run response generation
+    print("\n" + "="*60)
+    print("📝 PHASE 3: RESPONSE GENERATION")
+    print("="*60)
+    print("🔄 Combining task output + LLM insights...")
+    final_state = await response_generation_node(summarized_state)
+    print(f"✅ Response generation complete")
+    print(f"📏 Final response length: {len(final_state['agent_response'])} characters")
+    # Verify response contains both original data and insights
+    response = final_state["agent_response"]
+    assert "🌊 **Estrazione Dati OMIRL Completata**" in response
+    assert "🧠 **Analisi Intelligente:**" in response
+    assert "Copertura Territoriale" in response
+    assert "Temperature Attuali" in response
+    assert "🔗 **Fonti dati:**" in response
+    print("   ✅ Response contains original task data")
+    print("   ✅ Response contains LLM insights section")
+    print("   ✅ Response contains data sources")
+    # Display final combined output
+    print("\n" + "="*60)
+    print("🎯 FINAL COMBINED RESPONSE")
+    print("="*60)
+    print(response)
+    # Summary statistics
+    print("\n" + "="*60)
+    print("� WORKFLOW SUMMARY")
+    print("="*60)
+    print(f"🎯 User Query: '{state['user_message']}'")
+    print(f"🔧 Tool Executed: {original_result.tool_name}")
+    print(f"🎛️ Mode: tables")
+    print(f"📋 Subtask: {original_result.metadata.get('subtask', 'Unknown')}")
+    print(f"🎯 Filters Applied: {original_result.metadata.get('filters_applied')}")
+    print(f"📊 Data Records: {original_result.metadata.get('total_after_filtering')}")
+    print(f"📝 Task Output: {len(original_result.summary_text)} chars")
+    print(f"🧠 LLM Insights: {len(enhanced_result.metadata.get('llm_insights', ''))} chars")
+    print(f"📄 Final Response: {len(response)} chars")
+    print(f"⚡ Processing Status: {final_state['processing_status']}")
+    return True
+async def test_precipitation_workflow():
+    """Test Phase 4 workflow with ambiguous precipitation query"""
+    print("\n" + "="*80)
+    print("🌧️ TESTING PRECIPITATION QUERY: 'mostra le precipitazioni a Genova'")
+    print("="*80)
+    # Create realistic precipitation tool result
+    precip_result = ToolResult(
+        tool_name="omirl_tool",
+        success=True,
+        summary_text="🌧️ **Precipitazioni Massime - Provincia Genova**\n• Zona d'allerta: A (0.0-0.2mm)\n• Provincia Genova: 0.2-0.4mm nelle ultime 24h\n• Picco registrato: 0.4mm alle 11:25 al Passo del Turchino\n• Trend: Attività precipitativa minima",
+        artifacts=["precipitazioni_genova_20250907.json"],
+        sources=["https://omirl.regione.liguria.it/#/maxtable"],
+        metadata={
+            "filters_applied": {"provincia": "GENOVA"},
+            "provincia": "GE",
+            "zona_allerta_records": 7,
+            "province_records": 1,
+            "extraction_method": "dual_table",
+            "subtask": "massimi_precipitazione"
+        },
+        warnings=[]
+    )
+    # Create state for precipitation query
+    precip_state = AgentState(
+        user_message="mostra le precipitazioni a Genova",
+        routing_result={},
+        conversation_history=[],
+        tool_results=[precip_result],
+        planned_tools=[],
+        errors=[],
+        processing_status="executing_tools",
+        agent_response="",
+        current_operation=None,
+        omirl_data=None,
+        metadata={}
+    )
+    print(f"   Initial tool results: {len(precip_state['tool_results'])}")
+    # Display Phase 1: Original task output
+    print("\n" + "="*60)
+    print("📋 PHASE 1: TASK-SPECIFIC OUTPUT")
+    print("="*60)
+    original_result = precip_state["tool_results"][0]
+    print(f"🔧 Tool: {original_result.tool_name}")
+    print(f"🎛️ Mode: tables")
+    print(f"📋 Subtask: {original_result.metadata.get('subtask', 'Unknown')}")
+    print(f"📊 Success: {original_result.success}")
+    print(f"🎯 Filters Applied: {original_result.metadata.get('filters_applied', 'None')}")
+    print(f"📈 Zona d'Allerta Records: {original_result.metadata.get('zona_allerta_records', 'Unknown')}")
+    print(f"📊 Province Records: {original_result.metadata.get('province_records', 'Unknown')}")
+    print(f"🔧 Extraction Method: {original_result.metadata.get('extraction_method', 'Unknown')}")
+    print(f"\n📄 Task Output Summary:")
+    print("-" * 40)
+    print(original_result.summary_text)
+    if original_result.artifacts:
+        print(f"\n📁 Artifacts: {original_result.artifacts}")
+    if original_result.sources:
+        print(f"🔗 Sources: {original_result.sources}")
+    # Step 1: Run LLM summarization for precipitation data
+    print("\n" + "="*60)
+    print("🧠 PHASE 2: LLM SUMMARIZATION")
+    print("="*60)
+    with patch('agent.nodes.LLMClient') as mock_llm_class:
+        mock_client = AsyncMock()
+        llm_insights = (
+            "• **Situazione Precipitazioni**: Attività molto limitata nella provincia di Genova\n"
+            "• **Distribuzione Temporale**: Accumuli minimi (0.2-0.4mm) concentrati nelle ultime 24h\n"
+            "• **Località Principale**: Passo del Turchino con il valore massimo registrato (0.4mm)\n"
+            "• **Trend Meteo**: Condizioni prevalentemente asciutte con episodi sporadici\n"
+            "• **Valutazione Operativa**: Nessuna criticità idrica, situazione nella norma per il periodo\n"
+            "• **Previsioni Immediate**: Stabilità delle condizioni, monitoraggio di routine"
+        )
+        mock_client.generate_insights.return_value = llm_insights
+        mock_llm_class.return_value = mock_client
+        print("🤖 LLM Client: Initialized (mocked)")
+        print("💭 Generating precipitation-specific insights...")
+        # Execute summarization
+        summarized_state = await llm_summarization_node(precip_state)
+        print(f"✅ LLM processing complete")
+        print(f"📊 Results after summarization: {len(summarized_state['tool_results'])}")
+        # Verify insights were added
+        enhanced_result = summarized_state["tool_results"][0]
+        assert "llm_insights" in enhanced_result.metadata
+        print(f"\n🧠 LLM Generated Insights:")
+        print("-" * 40)
+        print(enhanced_result.metadata['llm_insights'])
+        print(f"\n⏰ Insights timestamp: {enhanced_result.metadata.get('insights_generated_at', 'Unknown')}")
+    # Step 2: Run response generation
+    print("\n" + "="*60)
+    print("📝 PHASE 3: RESPONSE GENERATION")
+    print("="*60)
+    print("🔄 Combining precipitation data + LLM insights...")
+    final_state = await response_generation_node(summarized_state)
+    print(f"✅ Response generation complete")
+    print(f"📏 Final response length: {len(final_state['agent_response'])} characters")
+    # Verify response contains precipitation-specific content
+    response = final_state["agent_response"]
+    assert "🌊 **Estrazione Dati OMIRL Completata**" in response
+    assert "🧠 **Analisi Intelligente:**" in response
+    print("   ✅ Response contains original precipitation data")
+    print("   ✅ Response contains LLM precipitation insights")
+    print("   ✅ Response contains data sources")
+    # Display final combined output
+    print("\n" + "="*60)
+    print("🎯 FINAL COMBINED RESPONSE")
+    print("="*60)
+    print(response)
+    # Summary statistics for precipitation
+    print("\n" + "="*60)
+    print("📊 PRECIPITATION WORKFLOW SUMMARY")
+    print("="*60)
+    print(f"🎯 User Query: '{precip_state['user_message']}'")
+    print(f"🔧 Tool Executed: {original_result.tool_name}")
+    print(f"🎛️ Mode: tables")
+    print(f"📋 Subtask: {original_result.metadata.get('subtask', 'Unknown')}")
+    print(f"🎯 Filters Applied: {original_result.metadata.get('filters_applied')}")
+    print(f"📊 Zona Records: {original_result.metadata.get('zona_allerta_records')}")
+    print(f"📊 Province Records: {original_result.metadata.get('province_records')}")
+    print(f"📝 Task Output: {len(original_result.summary_text)} chars")
+    print(f"🧠 LLM Insights: {len(enhanced_result.metadata.get('llm_insights', ''))} chars")
+    print(f"📄 Final Response: {len(response)} chars")
+    print(f"⚡ Processing Status: {final_state['processing_status']}")
+    return True
+async def run_all_tests():
+    """Run both temperature and precipitation workflow tests"""
+    print("🧪 PHASE 4 COMPREHENSIVE WORKFLOW TESTS")
+    print("="*80)
+    try:
+        # Test 1: Temperature query
+        print("TEST 1: Temperature workflow")
+        success1 = await test_full_workflow()
+        # Test 2: Precipitation query
+        print("\nTEST 2: Precipitation workflow")
+        success2 = await test_precipitation_workflow()
+        if success1 and success2:
+            print("\n🎉 All Phase 4 workflow tests successful!")
+            return True
+        else:
+            print("\n❌ Some Phase 4 tests failed")
+            return False
+    except Exception as e:
+        print(f"\n❌ Phase 4 tests failed with error: {e}")
+        import traceback
+        traceback.print_exc()
+        return False
+if __name__ == "__main__":
+    success = asyncio.run(run_all_tests())
+    if success:
+        print("\n🎉 All Phase 4 tests completed successfully!")
+    else:
+        print("\n❌ Some Phase 4 tests failed")

tests/debug_node.py ADDED Viewed

File without changes

tests/debug_state.py ADDED Viewed

File without changes

tests/omirl/performance_analysis.py ADDED Viewed

	@@ -0,0 +1,86 @@

+"""
+OMIRL Performance Test Analysis
+This script analyzes why OMIRL integration tests are slow and provides solutions.
+"""
+import asyncio
+import time
+async def analyze_omirl_performance():
+    """Analyze OMIRL test performance issues"""
+    print("🔍 OMIRL Test Performance Analysis")
+    print("=" * 50)
+    print("\n📊 Current Timing Breakdown:")
+    print("   • Browser initialization: ~2-3 seconds")
+    print("   • Page navigation: ~3-5 seconds")
+    print("   • AngularJS wait: 5 seconds (fixed)")
+    print("   • Network idle wait: 8 seconds (with timeout)")
+    print("   • Angular rendering wait: 2 seconds (fixed)")
+    print("   • Data extraction: ~1-2 seconds")
+    print("   • Rate limiting: 1 second")
+    print("   ─────────────────────────────────")
+    print("   • TOTAL PER TEST: ~22-26 seconds")
+    print("\n🐌 Performance Issues Identified:")
+    print("   1. Fixed waits instead of smart waiting")
+    print("   2. No browser session reuse between tests")
+    print("   3. Full web scraping on every test call")
+    print("   4. OMIRL website may be slow/unreliable")
+    print("   5. Potential browser session accumulation")
+    print("\n💡 Solutions Implemented:")
+    print("   ✅ Fast tests with mocked data (< 0.1s each)")
+    print("   ✅ Test timeouts to prevent hanging")
+    print("   ✅ Proper browser cleanup in finally blocks")
+    print("   ✅ Separate fast vs integration test suites")
+    print("\n⚡ Recommended Test Strategy:")
+    print("   🚀 Daily development: Use fast tests (test_fast.py)")
+    print("   🧪 CI/CD pipeline: Use fast tests + selective integration")
+    print("   🔍 Full validation: Run integration tests weekly")
+    print("   📊 Performance: Mock web calls, test logic only")
+    print("\n🎯 Test Performance Comparison:")
+    print("   • Fast tests (mocked): ~0.08 seconds")
+    print("   • Integration tests: ~22-26 seconds each")
+    print("   • Speed improvement: 275-325x faster!")
+    return True
+async def test_browser_cleanup():
+    """Test browser cleanup to prevent session accumulation"""
+    from services.web.browser import close_all_browser_sessions
+    print("\n🧹 Testing browser cleanup...")
+    try:
+        await close_all_browser_sessions()
+        print("✅ Browser cleanup completed successfully")
+        return True
+    except Exception as e:
+        print(f"⚠️ Browser cleanup warning: {e}")
+        return False
+async def main():
+    """Main analysis function"""
+    await analyze_omirl_performance()
+    print("\n" + "=" * 50)
+    print("🔧 Cleanup Test")
+    await test_browser_cleanup()
+    print("\n" + "=" * 50)
+    print("📋 Summary & Recommendations:")
+    print("   1. Use test_fast.py for regular development")
+    print("   2. Run integration tests only when needed")
+    print("   3. Add timeouts to prevent hanging tests")
+    print("   4. Consider mocking for CI/CD pipelines")
+    print("   5. Monitor OMIRL website availability")
+    print("\n✅ Analysis complete!")
+if __name__ == "__main__":
+    asyncio.run(main())

tests/{test_adapter_integration.py → omirl/test_adapter_integration.py} RENAMED Viewed

@@ -2,21 +2,26 @@
 """
 Test for OMIRL Adapter Integration
-Tests the updated adapter.py that uses the new valori_stazioni implementation
-with YAML-based validation. This focuses on the adapter layer without
-running multiple web scraping operations.
 Created: September 6, 2025
 Branch: omirl_refactor
-Purpose: Validate the adapter integration with new architecture
 """
 import sys
 import asyncio
 from pathlib import Path
-# Add the parent directory to sys.path so we can import the OMIRL modules
-sys.path.insert(0, str(Path(__file__).parent.parent))
 from tools.omirl.adapter import omirl_tool
@@ -55,6 +60,48 @@ async def test_adapter_basic():
         return False
 async def test_adapter_invalid_mode():
     """Test adapter error handling with invalid mode"""
     print("\n🧪 Testing adapter error handling (invalid mode)...")
@@ -105,15 +152,42 @@ async def test_adapter_invalid_sensor():
         return False
 async def main():
     """Run all adapter tests"""
     print("🚀 Starting OMIRL Adapter Integration Tests")
     print("===========================================")
     tests = [
-        ("Basic Functionality", test_adapter_basic),
         ("Invalid Mode Handling", test_adapter_invalid_mode),
         ("Invalid Sensor Handling", test_adapter_invalid_sensor),
     ]
     results = []

 """
 Test for OMIRL Adapter Integration
+Tests the updated adapter.py that supports both valori_stazioni and massimi_precipitazione
+subtasks with YAML-based validation. This comprehensive test covers:
+- Both valori_stazioni and massimi_precipitazione subtasks
+- Filter validation and routing
+- Error handling for invalid modes, sensors, and subtasks
+- Response format consistency
 Created: September 6, 2025
+Updated: September 7, 2025
 Branch: omirl_refactor
+Purpose: Validate the complete adapter integration with new architecture
 """
 import sys
 import asyncio
 from pathlib import Path
+# Add the project root directory to sys.path so we can import the OMIRL modules
+sys.path.insert(0, str(Path(__file__).parent.parent.parent))
 from tools.omirl.adapter import omirl_tool
         return False
+async def test_adapter_precipitation():
+    """Test adapter functionality with massimi_precipitazione subtask"""
+    print("🧪 Testing adapter with precipitation data...")
+    try:
+        result = await omirl_tool(
+            mode="tables",
+            subtask="massimi_precipitazione",
+            filters={"provincia": "GENOVA"},
+            language="it"
+        )
+        print(f"   Success: {'summary_text' in result and len(result.get('summary_text', '')) > 0}")
+        print(f"   Summary length: {len(result.get('summary_text', ''))}")
+        print(f"   Artifacts: {len(result.get('artifacts', []))}")
+        print(f"   Sources: {len(result.get('sources', []))}")
+        print(f"   Metadata keys: {list(result.get('metadata', {}).keys())}")
+        print(f"   Warnings: {len(result.get('warnings', []))}")
+        # Check required fields
+        required_fields = ['summary_text', 'artifacts', 'sources', 'metadata', 'warnings']
+        has_all_fields = all(field in result for field in required_fields)
+        print(f"   Has all required fields: {has_all_fields}")
+        print(f"   Subtask: {result.get('metadata', {}).get('subtask')}")
+        # Validate sources contain precipitation table
+        has_precipitation_source = any('maxtable' in source for source in result.get('sources', []))
+        print(f"   Has precipitation source: {has_precipitation_source}")
+        return (has_all_fields and
+                len(result.get('summary_text', '')) > 0 and
+                result.get('metadata', {}).get('subtask') == 'massimi_precipitazione' and
+                has_precipitation_source)
+    except Exception as e:
+        print(f"   ❌ Test failed with exception: {e}")
+        import traceback
+        traceback.print_exc()
+        return False
 async def test_adapter_invalid_mode():
     """Test adapter error handling with invalid mode"""
     print("\n🧪 Testing adapter error handling (invalid mode)...")
         return False
+async def test_adapter_invalid_subtask():
+    """Test adapter error handling with invalid subtask"""
+    print("\n🧪 Testing adapter error handling (invalid subtask)...")
+    try:
+        result = await omirl_tool(
+            mode="tables",
+            subtask="invalid_subtask",
+            filters={},
+            language="it"
+        )
+        error_keywords = ['non supportato', 'Invalid subtask', 'Sottotask non supportato']
+        has_error = any(keyword in result.get('summary_text', '') for keyword in error_keywords)
+        print(f"   Error detected: {has_error}")
+        print(f"   Summary: {result.get('summary_text', '')[:100]}...")
+        return has_error
+    except Exception as e:
+        print(f"   ❌ Test failed with exception: {e}")
+        return False
 async def main():
     """Run all adapter tests"""
     print("🚀 Starting OMIRL Adapter Integration Tests")
     print("===========================================")
     tests = [
+        ("Basic Functionality (Valori Stazioni)", test_adapter_basic),
+        ("Precipitation Functionality", test_adapter_precipitation),
         ("Invalid Mode Handling", test_adapter_invalid_mode),
         ("Invalid Sensor Handling", test_adapter_invalid_sensor),
+        ("Invalid Subtask Handling", test_adapter_invalid_subtask),
     ]
     results = []

tests/omirl/test_adapter_with_precipitation.py DELETED Viewed

@@ -1,178 +0,0 @@
-"""
-Test suite for OMIRL Adapter with Massimi Precipitazione support
-Tests the updated adapter functionality including:
-- Both valori_stazioni and massimi_precipitazione subtasks
-- Filter validation and routing
-- Response format consistency
-- Error handling
-"""
-import asyncio
-import sys
-from pathlib import Path
-# Add parent directories to path for imports
-sys.path.insert(0, str(Path(__file__).parent.parent.parent))
-from tools.omirl.adapter import omirl_tool
-class TestOMIRLAdapter:
-    """Test cases for OMIRL adapter functionality"""
-    async def test_valori_stazioni_subtask(self):
-        """Test valori_stazioni subtask (existing functionality)"""
-        print("\n🧪 Testing valori_stazioni subtask...")
-        result = await omirl_tool(
-            mode="tables",
-            subtask="valori_stazioni",
-            filters={"tipo_sensore": "Temperatura"},
-            language="it"
-        )
-        # Validate response structure
-        assert isinstance(result, dict)
-        assert "summary_text" in result
-        assert "artifacts" in result
-        assert "sources" in result
-        assert "metadata" in result
-        assert "warnings" in result
-        # Validate sources
-        assert "sensorstable" in result["sources"][0]
-        # Validate metadata
-        assert result["metadata"]["subtask"] == "valori_stazioni"
-        print("✅ Valori stazioni subtask works")
-        return result
-    async def test_massimi_precipitazione_subtask(self):
-        """Test massimi_precipitazione subtask (new functionality)"""
-        print("\n🧪 Testing massimi_precipitazione subtask...")
-        result = await omirl_tool(
-            mode="tables",
-            subtask="massimi_precipitazione",
-            filters={"provincia": "GENOVA"},
-            language="it"
-        )
-        # Validate response structure
-        assert isinstance(result, dict)
-        assert "summary_text" in result
-        assert "artifacts" in result
-        assert "sources" in result
-        assert "metadata" in result
-        assert "warnings" in result
-        # Validate sources
-        assert "maxtable" in result["sources"][0]
-        # Validate metadata
-        assert result["metadata"]["subtask"] == "massimi_precipitazione"
-        print("✅ Massimi precipitazione subtask works")
-        return result
-    async def test_zona_allerta_filter(self):
-        """Test zona d'allerta filtering"""
-        print("\n🧪 Testing zona d'allerta filter...")
-        result = await omirl_tool(
-            mode="tables",
-            subtask="massimi_precipitazione",
-            filters={"zona_allerta": "A"},
-            language="it"
-        )
-        assert isinstance(result, dict)
-        print("✅ Zona d'allerta filter works")
-        return result
-    async def test_invalid_subtask(self):
-        """Test invalid subtask handling"""
-        print("\n🧪 Testing invalid subtask...")
-        result = await omirl_tool(
-            mode="tables",
-            subtask="invalid_subtask",
-            filters={},
-            language="it"
-        )
-        # Should return error response
-        assert isinstance(result, dict)
-        assert "⚠️" in result["summary_text"]
-        assert result["metadata"]["success"] == False
-        print("✅ Invalid subtask handled correctly")
-        return result
-    async def test_sensor_validation_for_precipitation(self):
-        """Test that sensor validation is skipped for precipitation subtask"""
-        print("\n🧪 Testing sensor validation skip for precipitation...")
-        # This should work - sensor type should be ignored for precipitation
-        result = await omirl_tool(
-            mode="tables",
-            subtask="massimi_precipitazione",
-            filters={"tipo_sensore": "SomeInvalidSensor"},  # Should be ignored
-            language="it"
-        )
-        # Should succeed because sensor validation is skipped for precipitation
-        assert isinstance(result, dict)
-        print("✅ Sensor validation correctly skipped for precipitation")
-        return result
-# Integration test function
-async def test_adapter_integration():
-    """Integration test for updated adapter functionality"""
-    print("🧪 Running OMIRL adapter integration test...")
-    print("=" * 60)
-    tests = TestOMIRLAdapter()
-    try:
-        # Test 1: Valori stazioni (existing)
-        print("\n1️⃣ Testing valori_stazioni...")
-        result1 = await tests.test_valori_stazioni_subtask()
-        print(f"   Summary: {result1['summary_text'][:100]}...")
-        # Test 2: Massimi precipitazione (new)
-        print("\n2️⃣ Testing massimi_precipitazione...")
-        result2 = await tests.test_massimi_precipitazione_subtask()
-        print(f"   Summary: {result2['summary_text'][:100]}...")
-        # Test 3: Zona d'allerta filter
-        print("\n3️⃣ Testing zona_allerta filter...")
-        result3 = await tests.test_zona_allerta_filter()
-        print(f"   Summary: {result3['summary_text'][:100]}...")
-        # Test 4: Error handling
-        print("\n4️⃣ Testing error handling...")
-        result4 = await tests.test_invalid_subtask()
-        print(f"   Error: {result4['summary_text'][:100]}...")
-        # Test 5: Sensor validation
-        print("\n5️⃣ Testing sensor validation...")
-        result5 = await tests.test_sensor_validation_for_precipitation()
-        print(f"   Summary: {result5['summary_text'][:100]}...")
-        print("\n✅ All adapter tests completed successfully!")
-        return True
-    except Exception as e:
-        print(f"\n❌ Adapter test failed: {e}")
-        import traceback
-        traceback.print_exc()
-        return False
-if __name__ == "__main__":
-    # Run integration test directly
-    success = asyncio.run(test_adapter_integration())
-    sys.exit(0 if success else 1)

tests/omirl/test_fast.py ADDED Viewed

	@@ -0,0 +1,252 @@

+"""
+Fast OMIRL Tests with Mocked Web Calls
+This test module provides faster unit tests by mocking the slow web scraping calls.
+Use this for CI/CD and development, while keeping the integration tests for full validation.
+"""
+import pytest
+import sys
+from pathlib import Path
+from unittest.mock import Mock, patch, AsyncMock
+# Add parent directories to path for imports
+sys.path.insert(0, str(Path(__file__).parent.parent.parent))
+from tools.omirl.shared import OMIRLResult, OMIRLFilterSet
+from tools.omirl.adapter import omirl_tool
+class TestOMIRLAdapterFast:
+    """Fast tests for OMIRL adapter with mocked web calls"""
+    @pytest.mark.asyncio
+    @patch('services.web.table_scraper.fetch_omirl_stations')
+    async def test_valori_stazioni_fast(self, mock_fetch_stations):
+        """Test valori_stazioni with mocked data"""
+        print("\n🚀 Fast test: valori_stazioni...")
+        # Mock the web scraper response
+        mock_fetch_stations.return_value = [
+            {
+                "Nome": "Test Station 1",
+                "Codice": "TEST1",
+                "Comune": "Genova",
+                "Provincia": "GE",
+                "ultimo": "25.5",
+                "Max": "28.0",
+                "Min": "20.1"
+            },
+            {
+                "Nome": "Test Station 2",
+                "Codice": "TEST2",
+                "Comune": "Savona",
+                "Provincia": "SV",
+                "ultimo": "23.2",
+                "Max": "26.8",
+                "Min": "18.5"
+            }
+        ]
+        # Call the adapter
+        result = await omirl_tool(
+            mode="tables",
+            subtask="valori_stazioni",
+            filters={"tipo_sensore": "Temperatura", "provincia": "GE"},
+            language="it"
+        )
+        # Validate response structure
+        assert isinstance(result, dict)
+        assert "summary_text" in result
+        assert "artifacts" in result
+        assert "sources" in result
+        assert "metadata" in result
+        assert "warnings" in result
+        # Verify mock was called
+        mock_fetch_stations.assert_called_once_with("Temperatura")
+        print(f"✅ Fast test completed: {result['summary_text'][:50]}...")
+        return result
+    @pytest.mark.asyncio
+    @patch('services.web.table_scraper.fetch_omirl_massimi_precipitazioni')
+    async def test_massimi_precipitazione_fast(self, mock_fetch_precip):
+        """Test massimi_precipitazione with mocked data"""
+        print("\n🚀 Fast test: massimi_precipitazione...")
+        # Mock the precipitation data response
+        mock_fetch_precip.return_value = {
+            "zona_allerta": [
+                {
+                    "Max (mm)": "A",
+                    "5'": "0.0 [02:10] Station A1",
+                    "15'": "0.0 [02:10] Station A1",
+                    "30'": "0.0 [02:10] Station A1",
+                    "1h": "0.2 [05:45] Station A2",
+                    "3h": "0.4 [08:15] Station A2",
+                    "6h": "0.6 [12:30] Station A3",
+                    "12h": "0.8 [18:45] Station A3",
+                    "24h": "1.2 [06:00] Station A4"
+                }
+            ],
+            "province": [
+                {
+                    "Max (mm)": "Genova",
+                    "5'": "0.1 [03:20] Genova Station",
+                    "15'": "0.2 [08:15] Genova Station",
+                    "30'": "0.3 [09:00] Genova Station",
+                    "1h": "0.5 [11:30] Genova Station",
+                    "3h": "0.8 [14:45] Genova Station",
+                    "6h": "1.2 [18:00] Genova Station",
+                    "12h": "1.8 [22:15] Genova Station",
+                    "24h": "2.5 [08:30] Genova Station"
+                }
+            ]
+        }
+        # Call the adapter
+        result = await omirl_tool(
+            mode="tables",
+            subtask="massimi_precipitazione",
+            filters={"zona_allerta": "A"},
+            language="it"
+        )
+        # Validate response structure
+        assert isinstance(result, dict)
+        assert "summary_text" in result
+        assert "artifacts" in result
+        assert "sources" in result
+        assert "metadata" in result
+        # Verify mock was called
+        mock_fetch_precip.assert_called_once()
+        print(f"✅ Fast test completed: {result['summary_text'][:50]}...")
+        return result
+    @pytest.mark.asyncio
+    async def test_invalid_sensor_validation_fast(self):
+        """Test sensor validation without web calls"""
+        print("\n🚀 Fast test: validation...")
+        result = await omirl_tool(
+            mode="tables",
+            subtask="valori_stazioni",
+            filters={"tipo_sensore": "InvalidSensor"},
+            language="it"
+        )
+        # Should return error without making web calls
+        assert isinstance(result, dict)
+        assert "���️" in result["summary_text"]
+        assert "non valido" in result["summary_text"]
+        print(f"✅ Validation test completed: {result['summary_text'][:50]}...")
+        return result
+    @pytest.mark.asyncio
+    async def test_mode_validation_fast(self):
+        """Test mode validation without web calls"""
+        print("\n🚀 Fast test: mode validation...")
+        result = await omirl_tool(
+            mode="invalid_mode",
+            subtask="valori_stazioni",
+            filters={},
+            language="it"
+        )
+        # Should return error without making web calls
+        assert isinstance(result, dict)
+        assert "⚠️" in result["summary_text"]
+        assert result["metadata"]["success"] == False
+        print(f"✅ Mode validation test completed")
+        return result
+class TestOMIRLTasksFast:
+    """Fast tests for individual OMIRL tasks with mocked data"""
+    @pytest.mark.asyncio
+    @patch('services.web.table_scraper.fetch_omirl_stations')
+    async def test_valori_stazioni_task_fast(self, mock_fetch):
+        """Test valori_stazioni task directly with mocked data"""
+        from tools.omirl.tables.valori_stazioni import fetch_valori_stazioni_async
+        print("\n🚀 Fast task test: valori_stazioni...")
+        # Mock return data
+        mock_fetch.return_value = [
+            {"Nome": "Mock Station", "Codice": "MOCK", "Provincia": "GE"}
+        ]
+        # Test with filter set
+        filters = OMIRLFilterSet({"tipo_sensore": "Temperatura"})
+        result = await fetch_valori_stazioni_async(filters)
+        assert isinstance(result, OMIRLResult)
+        assert result.success
+        assert len(result.data) == 1
+        print("✅ Fast task test completed")
+        return result
+    @pytest.mark.asyncio
+    @patch('services.web.table_scraper.fetch_omirl_massimi_precipitazioni')
+    async def test_massimi_precipitazione_task_fast(self, mock_fetch):
+        """Test massimi_precipitazione task directly with mocked data"""
+        from tools.omirl.tables.massimi_precipitazione import fetch_massimi_precipitazione_async
+        print("\n🚀 Fast task test: massimi_precipitazione...")
+        # Mock return data
+        mock_fetch.return_value = {
+            "zona_allerta": [{"Max (mm)": "A", "24h": "0.5 [12:00] Test"}],
+            "province": []
+        }
+        # Test with filter set
+        filters = OMIRLFilterSet({"zona_allerta": "A"})
+        result = await fetch_massimi_precipitazione_async(filters)
+        assert isinstance(result, OMIRLResult)
+        assert result.success
+        print("✅ Fast task test completed")
+        return result
+# Fast integration test
+@pytest.mark.asyncio
+async def test_fast_integration():
+    """Fast integration test with all validation but no web calls"""
+    print("\n🚀 Running fast integration test...")
+    print("=" * 60)
+    tests = TestOMIRLAdapterFast()
+    try:
+        # Test validation (no web calls)
+        print("\n1️⃣ Testing validation...")
+        result1 = await tests.test_invalid_sensor_validation_fast()
+        print("\n2️⃣ Testing mode validation...")
+        result2 = await tests.test_mode_validation_fast()
+        print("\n✅ Fast integration completed successfully!")
+        print("📊 Tests completed in < 1 second vs 30+ seconds for full integration")
+        return True
+    except Exception as e:
+        print(f"\n❌ Fast integration failed: {e}")
+        return False
+if __name__ == "__main__":
+    # Run fast tests directly
+    import asyncio
+    success = asyncio.run(test_fast_integration())
+    print(f"\nFast test result: {'✅ PASSED' if success else '❌ FAILED'}")

tests/omirl/test_massimi_precipitazione.py CHANGED Viewed

@@ -6,6 +6,21 @@ Tests the massimi_precipitazione module functionality including:
 - Geographic filtering (zona d'allerta and province)
 - Data structure validation
 - Error handling
 """
 import pytest
 import sys
@@ -18,8 +33,9 @@ from tools.omirl.shared import OMIRLFilterSet
 from tools.omirl.tables.massimi_precipitazione import (
     fetch_massimi_precipitazione_async,
     fetch_massimi_precipitazione,
-    _apply_geographic_filters,
-    _parse_single_value
 )
@@ -27,57 +43,180 @@ class TestMassimiPrecipitazione:
     """Test cases for massimi precipitazione functionality"""
     @pytest.mark.asyncio
-    async def test_basic_extraction(self):
-        """Test basic data extraction without filters"""
-        print("\n🧪 Testing basic massimi precipitazione extraction...")
-        # Create empty filter set
-        filters = OMIRLFilterSet({})
-        # Fetch data
-        result = await fetch_massimi_precipitazione_async(filters)
-        # Validate result structure
-        assert result is not None
-        assert hasattr(result, 'success')
-        assert hasattr(result, 'data')
-        assert hasattr(result, 'message')
-        assert hasattr(result, 'metadata')
-        if result.success:
-            print(f"✅ Extraction successful: {result.message}")
-            # Validate data structure
-            assert isinstance(result.data, dict)
-            assert 'zona_allerta' in result.data
-            assert 'province' in result.data
-            zona_data = result.data['zona_allerta']
-            province_data = result.data['province']
-            print(f"📊 Zona d'Allerta records: {len(zona_data)}")
-            print(f"📊 Province records: {len(province_data)}")
-            # Validate zona d'allerta structure
-            if zona_data:
-                sample = zona_data[0]
-                assert 'Max (mm)' in sample
-                # Should have time period columns
-                time_periods = ["5'", "15'", "30'", "1h", "3h", "6h", "12h", "24h"]
-                for period in time_periods:
-                    assert period in sample
-                print(f"✅ Zona sample: {sample.get('Max (mm)')} with {len([k for k in sample.keys() if k in time_periods])} time periods")
-            # Validate province structure
-            if province_data:
-                sample = province_data[0]
-                assert 'Max (mm)' in sample
-                print(f"✅ Province sample: {sample.get('Max (mm)')}")
         else:
-            print(f"⚠️ Extraction failed: {result.message}")
-            # Don't fail test - this might be due to network issues
     def test_sync_wrapper(self):
         """Test the synchronous wrapper function"""
@@ -109,25 +248,26 @@ class TestMassimiPrecipitazione:
         # Test zona d'allerta filtering
         filters_zona = OMIRLFilterSet({"zona_allerta": "B"})
-        filtered = _apply_geographic_filters(sample_data, filters_zona)
         assert len(filtered["zona_allerta"]) == 1
         assert filtered["zona_allerta"][0]["Max (mm)"] == "B"
-        assert len(filtered["province"]) == 3  # No province filter, all included
         print("✅ Zona d'allerta filtering works")
         # Test province filtering
         filters_prov = OMIRLFilterSet({"provincia": "GENOVA"})
-        filtered = _apply_geographic_filters(sample_data, filters_prov)
         assert len(filtered["province"]) == 1
         assert filtered["province"][0]["Max (mm)"] == "Genova"
-        assert len(filtered["zona_allerta"]) == 3  # No zona filter, all included
         print("✅ Province filtering works")
         # Test province code mapping
         filters_code = OMIRLFilterSet({"provincia": "GE"})
-        filtered = _apply_geographic_filters(sample_data, filters_code)
         assert len(filtered["province"]) == 1
         assert filtered["province"][0]["Max (mm)"] == "Genova"
@@ -163,8 +303,116 @@ class TestMassimiPrecipitazione:
         assert result["value"] is None
         print("✅ Empty string handling works")
 # Integration test function that can be run independently
 async def test_massimi_precipitazione_integration():
     """Integration test for massimi precipitazione functionality"""
     print("🧪 Running massimi precipitazione integration test...")

 - Geographic filtering (zona d'allerta and province)
 - Data structure validation
 - Error handling
+TODO - BROWSER MANAGEMENT ISSUES:
+The integrated tests (test_format_precipitation_scenarios, test_invalid_input_scenarios)
+work correctly but occasionally get stuck during browser navigation due to:
+- Selenium WebDriver session management
+- AngularJS table loading timing issues
+- Network timeouts during OMIRL site interaction
+These tests validate the complete workflow but may need optimization for:
+- Browser session reuse across test scenarios
+- Better timeout handling for AngularJS data loading
+- Retry mechanisms for network-dependent operations
+For now, unit tests (test_format_precipitation_data_simple_unit) provide reliable
+validation of the formatting logic without browser dependencies.
 """
 import pytest
 import sys
 from tools.omirl.tables.massimi_precipitazione import (
     fetch_massimi_precipitazione_async,
     fetch_massimi_precipitazione,
+    _apply_filters_to_precipitation_data,
+    _parse_single_value,
+    format_precipitation_data_simple
 )
     """Test cases for massimi precipitazione functionality"""
     @pytest.mark.asyncio
+    async def test_format_precipitation_scenarios(self):
+        """Test formatting function with different input scenarios"""
+        print("\n🧪 Testing precipitation formatting scenarios...")
+        # Scenario 1: Only zona d'allerta
+        print("\n--- Scenario 1: Only zona d'allerta ---")
+        filters1 = OMIRLFilterSet({"zona_allerta": "A"})
+        result1 = await fetch_massimi_precipitazione_async(filters1)
+        if result1.success:
+            print(f"✅ Result: {result1.message}")
+            if result1.metadata.get('summary'):
+                print(f"📋 Summary: {result1.metadata['summary']}")
+        else:
+            print(f"❌ Failed: {result1.message}")
+        # Scenario 2: zona d'allerta + periodo
+        print("\n--- Scenario 2: zona d'allerta + periodo ---")
+        filters2 = OMIRLFilterSet({"zona_allerta": "A", "periodo": "1h"})
+        result2 = await fetch_massimi_precipitazione_async(filters2)
+        if result2.success:
+            print(f"✅ Result: {result2.message}")
+            if result2.metadata.get('summary'):
+                print(f"📋 Summary: {result2.metadata['summary']}")
+        else:
+            print(f"❌ Failed: {result2.message}")
+        # Scenario 3: Only provincia
+        print("\n--- Scenario 3: Only provincia ---")
+        filters3 = OMIRLFilterSet({"provincia": "Genova"})
+        result3 = await fetch_massimi_precipitazione_async(filters3)
+        if result3.success:
+            print(f"✅ Result: {result3.message}")
+            if result3.metadata.get('summary'):
+                print(f"📋 Summary: {result3.metadata['summary']}")
+        else:
+            print(f"❌ Failed: {result3.message}")
+        # Scenario 4: provincia + zona d'allerta (should prioritize zona_allerta)
+        print("\n--- Scenario 4: provincia + zona d'allerta ---")
+        filters4 = OMIRLFilterSet({"provincia": "Genova", "zona_allerta": "A"})
+        result4 = await fetch_massimi_precipitazione_async(filters4)
+        if result4.success:
+            print(f"✅ Result: {result4.message}")
+            if result4.metadata.get('summary'):
+                print(f"📋 Summary: {result4.metadata['summary']}")
         else:
+            print(f"❌ Failed: {result4.message}")
+        # Basic validation that at least one scenario worked
+        assert result1 is not None or result2 is not None or result3 is not None or result4 is not None
+    @pytest.mark.asyncio
+    async def test_invalid_input_scenarios(self):
+        """Test error handling with invalid inputs and edge cases"""
+        print("\n🧪 Testing invalid input scenarios...")
+        # Scenario 5: Missing required filters (no zona_allerta or provincia)
+        print("\n--- Scenario 5: Missing required filters ---")
+        filters5 = OMIRLFilterSet({"periodo": "1h"})  # Only periodo, missing geographic filter
+        result5 = await fetch_massimi_precipitazione_async(filters5)
+        print(f"Expected failure: {result5.message}")
+        assert not result5.success, "Should fail when missing required geographic filters"
+        assert "obbligatori mancanti" in result5.message.lower() or "required" in result5.message.lower()
+        # Scenario 6: Empty filters
+        print("\n--- Scenario 6: Empty filters ---")
+        filters6 = OMIRLFilterSet({})
+        result6 = await fetch_massimi_precipitazione_async(filters6)
+        print(f"Expected failure: {result6.message}")
+        assert not result6.success, "Should fail when no filters provided"
+        # Scenario 7: Invalid zona_allerta value
+        print("\n--- Scenario 7: Invalid zona_allerta ---")
+        filters7 = OMIRLFilterSet({"zona_allerta": "Z"})  # Z is not a valid zone
+        result7 = await fetch_massimi_precipitazione_async(filters7)
+        if result7.success:
+            # Extraction might succeed but should return no data
+            assert len(result7.data.get("zona_allerta", [])) == 0, "Should return empty data for invalid zone"
+            print(f"✅ Handled gracefully: Found {len(result7.data.get('zona_allerta', []))} records for invalid zone")
+        else:
+            print(f"❌ Failed as expected: {result7.message}")
+        # Scenario 8: Invalid provincia value
+        print("\n--- Scenario 8: Invalid provincia ---")
+        filters8 = OMIRLFilterSet({"provincia": "INVALID_PROVINCE"})
+        result8 = await fetch_massimi_precipitazione_async(filters8)
+        if result8.success:
+            # Extraction might succeed but should return no data
+            assert len(result8.data.get("province", [])) == 0, "Should return empty data for invalid province"
+            print(f"✅ Handled gracefully: Found {len(result8.data.get('province', []))} records for invalid province")
+        else:
+            print(f"❌ Failed as expected: {result8.message}")
+        # Scenario 9: Invalid periodo value
+        print("\n--- Scenario 9: Invalid periodo ---")
+        filters9 = OMIRLFilterSet({"zona_allerta": "A", "periodo": "99h"})  # Invalid time period
+        result9 = await fetch_massimi_precipitazione_async(filters9)
+        if result9.success:
+            # Should succeed but with no filtered data for the invalid period
+            filtered_record = result9.data.get("zona_allerta", [])
+            if filtered_record:
+                # Check if the invalid period was filtered out
+                has_invalid_period = any("99h" in str(record) for record in filtered_record)
+                assert not has_invalid_period, "Invalid period should be filtered out"
+            print(f"✅ Handled gracefully: Invalid periodo filtered appropriately")
+        else:
+            print(f"❌ Failed as expected: {result9.message}")
+        # Scenario 10: Valid filters but edge case combination
+        print("\n--- Scenario 10: Edge case - provincia + invalid periodo ---")
+        filters10 = OMIRLFilterSet({"provincia": "Genova", "periodo": "invalid_time"})
+        result10 = await fetch_massimi_precipitazione_async(filters10)
+        if result10.success:
+            print(f"✅ Handled edge case: {result10.message}")
+            # Should have data but no filtered period data
+            if result10.data.get("province"):
+                print(f"📊 Found province data but handled invalid periodo gracefully")
+        else:
+            print(f"❌ Failed as expected: {result10.message}")
+        print("\n✅ Invalid input scenarios testing completed")
+    def test_format_precipitation_data_simple_unit(self):
+        """Test the formatting function directly with mock data"""
+        print("\n🧪 Testing format_precipitation_data_simple function directly...")
+        # Mock data structure
+        mock_filtered_data = {
+            "zona_allerta": [{
+                "Max (mm)": "A",
+                "5'": "0.0 [02:10] Sella di Gouta",
+                "15'": "0.0 [02:10] Sella di Gouta",
+                "1h": "0.0 [02:10] Sella di Gouta",
+                "24h": "0.2 [03:05] Colle Belenda"
+            }],
+            "province": []
+        }
+        # Test scenario: zona_allerta without periodo
+        filters_zona = {"zona_allerta": "A"}
+        result_zona = format_precipitation_data_simple(mock_filtered_data, filters_zona)
+        print(f"📋 Zona without periodo:\n{result_zona}")
+        assert "Zona d'allerta A" in result_zona
+        assert "Riepilogo" in result_zona
+        assert "0.0mm alle 02:10 (Sella di Gouta)" in result_zona
+        assert "0.2mm alle 03:05 (Colle Belenda)" in result_zona
+        # Test scenario: zona_allerta with periodo
+        filters_zona_periodo = {"zona_allerta": "A", "periodo": "1h"}
+        result_zona_periodo = format_precipitation_data_simple(mock_filtered_data, filters_zona_periodo)
+        print(f"\n📋 Zona with periodo:\n{result_zona_periodo}")
+        assert "**1h**: 0.0mm alle 02:10 (Sella di Gouta)" in result_zona_periodo
+        assert "Riepilogo" not in result_zona_periodo  # Should not show summary when specific period requested
+        # Test empty data
+        empty_data = {"zona_allerta": [], "province": []}
+        result_empty = format_precipitation_data_simple(empty_data, filters_zona)
+        print(f"\n📋 Empty data:\n{result_empty}")
+        assert "Nessun dato trovato" in result_empty
+        print("✅ Unit tests for formatting function completed")
     def test_sync_wrapper(self):
         """Test the synchronous wrapper function"""
         # Test zona d'allerta filtering
         filters_zona = OMIRLFilterSet({"zona_allerta": "B"})
+        filters_dict = filters_zona.get_geographic_filters()
+        filtered = _apply_filters_to_precipitation_data(sample_data, filters_dict)
         assert len(filtered["zona_allerta"]) == 1
         assert filtered["zona_allerta"][0]["Max (mm)"] == "B"
         print("✅ Zona d'allerta filtering works")
         # Test province filtering
         filters_prov = OMIRLFilterSet({"provincia": "GENOVA"})
+        filters_dict = filters_prov.get_geographic_filters()
+        filtered = _apply_filters_to_precipitation_data(sample_data, filters_dict)
         assert len(filtered["province"]) == 1
         assert filtered["province"][0]["Max (mm)"] == "Genova"
         print("✅ Province filtering works")
         # Test province code mapping
         filters_code = OMIRLFilterSet({"provincia": "GE"})
+        filters_dict = filters_code.get_geographic_filters()
+        filtered = _apply_filters_to_precipitation_data(sample_data, filters_dict)
         assert len(filtered["province"]) == 1
         assert filtered["province"][0]["Max (mm)"] == "Genova"
         assert result["value"] is None
         print("✅ Empty string handling works")
+    def test_format_precipitation_data_scenarios(self):
+        """Test the new formatting function with different input scenarios"""
+        print("\n🧪 Testing format_precipitation_data_simple with different scenarios...")
+        # Scenario 1: Zona d'allerta with all time periods
+        print("\n📋 Scenario 1: Zona d'allerta A with all time periods")
+        zona_all_periods_data = {
+            "zona_allerta": [{
+                "Max (mm)": "A",
+                "5'": "0.1 [14:25] Colle del Melogno",
+                "15'": "0.2 [14:30] Colle del Melogno",
+                "30'": "0.3 [14:35] Colle del Melogno",
+                "1h": "0.5 [14:40] Colle del Melogno",
+                "3h": "1.2 [14:45] Colle del Melogno",
+                "6h": "2.1 [14:50] Colle del Melogno",
+                "12h": "3.5 [14:55] Colle del Melogno",
+                "24h": "6.2 [15:00] Colle del Melogno"
+            }],
+            "province": []
+        }
+        filters = {"zona_allerta": "A"}
+        result = format_precipitation_data_simple(zona_all_periods_data, filters)
+        print(result)
+        print()
+        # Scenario 2: Zona d'allerta with specific time period
+        print("📋 Scenario 2: Zona d'allerta B with specific period (1h)")
+        zona_specific_period_data = {
+            "zona_allerta": [{
+                "Max (mm)": "B",
+                "1h": "2.8 [13:15] Monte Settepani"
+            }],
+            "province": []
+        }
+        filters = {"zona_allerta": "B", "periodo": "1h"}
+        result = format_precipitation_data_simple(zona_specific_period_data, filters)
+        print(result)
+        print()
+        # Scenario 3: Province with all periods
+        print("📋 Scenario 3: Provincia Genova with all time periods")
+        province_all_periods_data = {
+            "zona_allerta": [],
+            "province": [{
+                "Max (mm)": "Genova",
+                "5'": "0.0 [10:00] Genova Centro",
+                "15'": "0.1 [10:05] Genova Centro",
+                "30'": "0.2 [10:10] Genova Centro",
+                "1h": "0.4 [10:15] Genova Centro",
+                "3h": "0.8 [10:20] Genova Centro",
+                "6h": "1.5 [10:25] Genova Centro",
+                "12h": "2.2 [10:30] Genova Centro",
+                "24h": "4.1 [10:35] Genova Centro"
+            }]
+        }
+        filters = {"provincia": "Genova"}
+        result = format_precipitation_data_simple(province_all_periods_data, filters)
+        print(result)
+        print()
+        # Scenario 4: Province with specific period but no data
+        print("📋 Scenario 4: Provincia Savona with specific period (3h) - no data")
+        province_no_data = {
+            "zona_allerta": [],
+            "province": [{
+                "Max (mm)": "Savona",
+                "3h": ""  # Empty data
+            }]
+        }
+        filters = {"provincia": "Savona", "periodo": "3h"}
+        result = format_precipitation_data_simple(province_no_data, filters)
+        print(result)
+        print()
+        # Scenario 5: Empty data
+        print("📋 Scenario 5: No data found")
+        empty_data = {"zona_allerta": [], "province": []}
+        filters = {"zona_allerta": "C"}
+        result = format_precipitation_data_simple(empty_data, filters)
+        print(result)
+        print()
+        # Scenario 6: Mixed data - both zona and province (shouldn't happen in practice but test anyway)
+        print("📋 Scenario 6: Mixed data (both zona and province)")
+        mixed_data = {
+            "zona_allerta": [{
+                "Max (mm)": "C",
+                "24h": "1.5 [09:00] Zona C Station"
+            }],
+            "province": [{
+                "Max (mm)": "Imperia",
+                "24h": "0.8 [09:00] Imperia Station"
+            }]
+        }
+        filters = {"zona_allerta": "C", "provincia": "Imperia"}  # Both filters (unusual)
+        result = format_precipitation_data_simple(mixed_data, filters)
+        print(result)
+        print()
+        print("✅ All formatting scenarios tested successfully")
 # Integration test function that can be run independently
+@pytest.mark.asyncio
 async def test_massimi_precipitazione_integration():
     """Integration test for massimi precipitazione functionality"""
     print("🧪 Running massimi precipitazione integration test...")

tests/omirl/test_validation.py ADDED Viewed

	@@ -0,0 +1,390 @@

+"""
+Test suite for OMIRL Validation System
+Tests the YAML-based validation architecture including:
+- Sensor type validation with suggestions
+- Province validation and code mapping
+- Zone validation
+- Period validation
+- Complete request validation
+- Error handling and suggestions
+"""
+import pytest
+import sys
+from pathlib import Path
+# Add parent directories to path for imports
+sys.path.insert(0, str(Path(__file__).parent.parent.parent))
+from tools.omirl.shared.validation import (
+    OMIRLValidator,
+    get_validator,
+    validate_sensor_type,
+    validate_provincia,
+    validate_zona,
+    validate_periodo,
+    validate_mode_task_combination,
+    get_valid_sensor_types,
+    get_valid_provinces,
+    get_validation_errors
+)
+class TestOMIRLValidation:
+    """Test cases for OMIRL validation functionality"""
+    def test_validator_initialization(self):
+        """Test that validator initializes correctly"""
+        print("\n🧪 Testing validator initialization...")
+        validator = get_validator()
+        assert validator is not None
+        assert hasattr(validator, 'parameters')
+        assert hasattr(validator, 'mode_tasks')
+        assert hasattr(validator, 'validation_rules')
+        print("✅ Validator initialized correctly")
+    def test_sensor_type_validation(self):
+        """Test sensor type validation with valid and invalid inputs"""
+        print("\n🧪 Testing sensor type validation...")
+        validator = get_validator()
+        # Test valid sensor types
+        valid_sensors = ["Temperatura", "Precipitazione", "Vento", "Umidità dell'aria"]
+        for sensor in valid_sensors:
+            is_valid, corrected, suggestions = validator.validate_sensor_type(sensor)
+            assert is_valid, f"Valid sensor '{sensor}' should pass validation"
+            assert corrected == sensor or corrected is None
+            print(f"   ✅ {sensor}: valid")
+        # Test invalid sensor types with suggestions
+        invalid_cases = [
+            ("Temperature", ["Temperatura"]),     # English vs Italian - should get suggestions
+            ("Temperatur", ["Temperatura"]),      # Typo - should get suggestions
+            ("Precipitazioni", ["Precipitazione"]), # Plural vs singular
+            ("Humidity", []),                      # Too different - may not get suggestions
+        ]
+        for invalid_sensor, expected_suggestions in invalid_cases:
+            is_valid, corrected, suggestions = validator.validate_sensor_type(invalid_sensor)
+            assert not is_valid, f"Invalid sensor '{invalid_sensor}' should fail validation"
+            assert corrected is None
+            if expected_suggestions:
+                assert len(suggestions) > 0, f"Should provide suggestions for '{invalid_sensor}'"
+                # Check if at least one expected suggestion is present
+                has_expected = any(exp in suggestions for exp in expected_suggestions)
+                assert has_expected, f"Expected suggestions {expected_suggestions} not found in {suggestions}"
+            print(f"   ❌ {invalid_sensor}: invalid, suggestions: {suggestions}")
+        # Test empty input
+        is_valid, corrected, suggestions = validator.validate_sensor_type("")
+        assert is_valid, "Empty sensor type should be valid (optional parameter)"
+        print("✅ Sensor type validation works correctly")
+    def test_province_validation(self):
+        """Test province validation and code mapping"""
+        print("\n🧪 Testing province validation...")
+        validator = get_validator()
+        # Test valid province codes
+        valid_codes = ["GE", "SV", "IM", "SP"]
+        for code in valid_codes:
+            is_valid, corrected, suggestions = validator.validate_provincia(code)
+            assert is_valid, f"Valid province code '{code}' should pass validation"
+            assert corrected == code
+            print(f"   ✅ {code}: valid code")
+        # Test valid province names (should be converted to codes)
+        province_mappings = {
+            "GENOVA": "GE",
+            "SAVONA": "SV",
+            "IMPERIA": "IM",
+            "LA SPEZIA": "SP"
+        }
+        for name, expected_code in province_mappings.items():
+            is_valid, corrected, suggestions = validator.validate_provincia(name)
+            assert is_valid, f"Valid province name '{name}' should pass validation"
+            assert corrected == expected_code, f"'{name}' should be corrected to '{expected_code}'"
+            print(f"   ✅ {name} → {corrected}: valid conversion")
+        # Test invalid provinces - use cases that might get suggestions
+        invalid_test_cases = [
+            ("GENOA", True),     # Similar to GENOVA - should get suggestions
+            ("SAVON", True),     # Similar to SAVONA - should get suggestions
+            ("ROMA", False),     # Too different - might not get suggestions
+            ("INVALID", False),  # Too different - might not get suggestions
+        ]
+        for invalid, should_have_suggestions in invalid_test_cases:
+            is_valid, corrected, suggestions = validator.validate_provincia(invalid)
+            assert not is_valid, f"Invalid province '{invalid}' should fail validation"
+            assert corrected is None
+            if should_have_suggestions:
+                assert len(suggestions) > 0, f"Should provide suggestions for '{invalid}'"
+            print(f"   ❌ {invalid}: invalid, suggestions: {suggestions}")
+        # Test empty input
+        is_valid, corrected, suggestions = validator.validate_provincia("")
+        assert is_valid, "Empty province should be valid (optional parameter)"
+        print("✅ Province validation works correctly")
+    def test_zone_validation(self):
+        """Test alert zone validation"""
+        print("\n🧪 Testing zone validation...")
+        validator = get_validator()
+        # Test valid zones
+        valid_zones = ["A", "B", "C", "C+", "C-", "D", "E"]
+        for zone in valid_zones:
+            is_valid, corrected, suggestions = validator.validate_zona(zone)
+            assert is_valid, f"Valid zone '{zone}' should pass validation"
+            print(f"   ✅ {zone}: valid zone")
+        # Test invalid zones
+        invalid_zones = ["F", "Z", "1", "AB"]
+        for invalid in invalid_zones:
+            is_valid, corrected, suggestions = validator.validate_zona(invalid)
+            assert not is_valid, f"Invalid zone '{invalid}' should fail validation"
+            print(f"   ❌ {invalid}: invalid, suggestions: {suggestions}")
+        print("✅ Zone validation works correctly")
+    def test_period_validation(self):
+        """Test time period validation"""
+        print("\n🧪 Testing period validation...")
+        validator = get_validator()
+        # Test valid periods
+        valid_periods = ["5'", "15'", "30'", "1h", "3h", "6h", "12h", "24h"]
+        for period in valid_periods:
+            is_valid, corrected, suggestions = validator.validate_periodo(period)
+            assert is_valid, f"Valid period '{period}' should pass validation"
+            print(f"   ✅ {period}: valid period")
+        # Test invalid periods
+        invalid_periods = ["2h", "48h", "1d", "invalid"]
+        for invalid in invalid_periods:
+            is_valid, corrected, suggestions = validator.validate_periodo(invalid)
+            assert not is_valid, f"Invalid period '{invalid}' should fail validation"
+            print(f"   ❌ {invalid}: invalid, suggestions: {suggestions}")
+        print("✅ Period validation works correctly")
+    def test_mode_task_validation(self):
+        """Test mode and task combination validation"""
+        print("\n🧪 Testing mode/task validation...")
+        validator = get_validator()
+        # Test valid combinations
+        valid_combinations = [
+            ("tables", "valori_stazioni"),
+            ("tables", "massimi_precipitazione")
+        ]
+        for mode, task in valid_combinations:
+            is_valid, valid_tasks = validator.validate_mode_task_combination(mode, task)
+            assert is_valid, f"Valid combination '{mode}/{task}' should pass validation"
+            assert task in valid_tasks
+            print(f"   ✅ {mode}/{task}: valid combination")
+        # Test invalid mode
+        is_valid, valid_tasks = validator.validate_mode_task_combination("invalid_mode", "task")
+        assert not is_valid, "Invalid mode should fail validation"
+        assert len(valid_tasks) == 0
+        print("   ❌ invalid_mode: invalid mode")
+        # Test invalid task for valid mode
+        is_valid, valid_tasks = validator.validate_mode_task_combination("tables", "invalid_task")
+        assert not is_valid, "Invalid task should fail validation"
+        assert len(valid_tasks) > 0  # Should still return valid tasks for the mode
+        print("   ❌ tables/invalid_task: invalid task")
+        print("✅ Mode/task validation works correctly")
+    def test_complete_request_validation(self):
+        """Test complete request validation"""
+        print("\n🧪 Testing complete request validation...")
+        validator = get_validator()
+        # Test valid valori_stazioni request
+        valid_request = {
+            "tipo_sensore": "Temperatura",
+            "provincia": "GENOVA"
+        }
+        is_valid, corrected, errors = validator.validate_complete_request(
+            "tables", "valori_stazioni", valid_request
+        )
+        assert is_valid, f"Valid request should pass validation, errors: {errors}"
+        assert corrected["provincia"] == "GE", "Province should be auto-corrected to code"
+        print(f"   ✅ Valid request: corrected filters = {corrected}")
+        # Test invalid request with multiple errors
+        invalid_request = {
+            "tipo_sensore": "InvalidSensor",
+            "provincia": "InvalidProvince",
+            "zona": "InvalidZone"
+        }
+        is_valid, corrected, errors = validator.validate_complete_request(
+            "tables", "valori_stazioni", invalid_request
+        )
+        assert not is_valid, "Invalid request should fail validation"
+        assert len(errors) > 0, "Should provide error messages"
+        print(f"   ❌ Invalid request: {len(errors)} errors = {errors}")
+        # Test massimi_precipitazione request
+        precip_request = {
+            "zona_allerta": "A",
+            "periodo": "24h"
+        }
+        is_valid, corrected, errors = validator.validate_complete_request(
+            "tables", "massimi_precipitazione", precip_request
+        )
+        assert is_valid, f"Valid precipitation request should pass, errors: {errors}"
+        print(f"   ✅ Valid precipitation request: {corrected}")
+        print("✅ Complete request validation works correctly")
+    def test_convenience_functions(self):
+        """Test convenience validation functions"""
+        print("\n🧪 Testing convenience functions...")
+        # Test validate_sensor_type function
+        assert validate_sensor_type("Temperatura"), "Should validate valid sensor"
+        assert not validate_sensor_type("Invalid"), "Should reject invalid sensor"
+        print("   ✅ validate_sensor_type works")
+        # Test validate_provincia function
+        is_valid, corrected = validate_provincia("GENOVA")
+        assert is_valid and corrected == "GE", "Should validate and correct province"
+        print("   ✅ validate_provincia works")
+        # Test validate_zona function
+        assert validate_zona("A"), "Should validate valid zone"
+        assert not validate_zona("Z"), "Should reject invalid zone"
+        print("   ✅ validate_zona works")
+        # Test validate_periodo function
+        assert validate_periodo("24h"), "Should validate valid period"
+        assert not validate_periodo("invalid"), "Should reject invalid period"
+        print("   ✅ validate_periodo works")
+        # Test validate_mode_task_combination function
+        assert validate_mode_task_combination("tables", "valori_stazioni"), "Should validate valid combination"
+        assert not validate_mode_task_combination("invalid", "task"), "Should reject invalid combination"
+        print("   ✅ validate_mode_task_combination works")
+        # Test get_valid_sensor_types function
+        valid_types = get_valid_sensor_types()
+        assert isinstance(valid_types, list), "Should return list"
+        assert len(valid_types) > 0, "Should have valid sensor types"
+        assert "Temperatura" in valid_types, "Should contain expected sensor type"
+        print(f"   ✅ get_valid_sensor_types works: {len(valid_types)} types")
+        # Test get_valid_provinces function
+        valid_provinces = get_valid_provinces()
+        assert isinstance(valid_provinces, dict), "Should return dict"
+        assert "GENOVA" in valid_provinces, "Should contain province mapping"
+        assert valid_provinces["GENOVA"] == "GE", "Should have correct mapping"
+        print(f"   ✅ get_valid_provinces works: {len(valid_provinces)} provinces")
+        # Test get_validation_errors function
+        filters_with_errors = {"tipo_sensore": "Invalid", "provincia": "Invalid"}
+        errors = get_validation_errors(filters_with_errors)
+        assert len(errors) > 0, "Should detect validation errors"
+        print(f"   ✅ get_validation_errors works: {len(errors)} errors detected")
+        print("✅ All convenience functions work correctly")
+    def test_error_messages_and_suggestions(self):
+        """Test that error messages include helpful suggestions"""
+        print("\n🧪 Testing error messages and suggestions...")
+        validator = get_validator()
+        # Test sensor type suggestions - use cases that should get suggestions
+        is_valid, corrected, suggestions = validator.validate_sensor_type("Temperature")
+        assert not is_valid
+        assert "Temperatura" in suggestions, "Should suggest closest match"
+        print(f"   ✅ 'Temperature' suggests: {suggestions}")
+        # Test province suggestions
+        is_valid, corrected, suggestions = validator.validate_provincia("Genova")
+        # This might be valid (converted to GE) or invalid depending on config
+        if not is_valid:
+            assert len(suggestions) > 0, "Should provide suggestions for invalid province"
+            print(f"   ✅ 'Genova' suggests: {suggestions}")
+        else:
+            print(f"   ✅ 'Genova' auto-corrected to: {corrected}")
+        # Test zone suggestions - use a case that should get suggestions
+        is_valid, corrected, suggestions = validator.validate_zona("AA")
+        assert not is_valid
+        assert len(suggestions) > 0, "Should suggest valid zones"
+        assert "A" in suggestions, "Should suggest actual zones"
+        print(f"   ✅ 'AA' suggests: {suggestions}")
+        print("✅ Error messages and suggestions work correctly")
+# Integration test
+def test_validation_integration():
+    """Integration test for the entire validation system"""
+    print("\n🧪 Running validation integration test...")
+    print("=" * 60)
+    try:
+        # Test validator instantiation
+        validator = get_validator()
+        print("✅ Validator created successfully")
+        # Test configuration loading
+        assert len(validator.get_valid_sensor_types()) > 0
+        print("✅ YAML configuration loaded successfully")
+        # Test a complete validation workflow
+        filters = {
+            "tipo_sensore": "Temperatura",
+            "provincia": "GENOVA",
+            "zona_allerta": "A"
+        }
+        is_valid, corrected, errors = validator.validate_complete_request(
+            "tables", "valori_stazioni", filters
+        )
+        if is_valid:
+            print(f"✅ Complete workflow successful: {corrected}")
+        else:
+            print(f"❌ Validation failed: {errors}")
+        print("✅ Integration test completed successfully")
+        return True
+    except Exception as e:
+        print(f"❌ Integration test failed: {e}")
+        import traceback
+        traceback.print_exc()
+        return False
+if __name__ == "__main__":
+    # Run integration test directly
+    success = test_validation_integration()
+    print(f"\nValidation system test: {'✅ PASSED' if success else '❌ FAILED'}")

tests/omirl/test_valori_stazioni.py ADDED Viewed

	@@ -0,0 +1,296 @@

+#!/usr/bin/env python3
+"""
+Test for OMIRL Valori Stazioni Task
+Tests the refactored valori_stazioni functionality that extracts station
+measurement data from OMIRL tables using the new YAML-based architecture.
+Created: September 5, 2025
+Branch: omirl_refactor
+Purpose: Validate the refactored valori_stazioni task implementation
+TODO - BROWSER MANAGEMENT ISSUES:
+Similar to massimi_precipitazione tests, the integrated tests that require
+live OMIRL data extraction may experience browser management issues:
+- Selenium WebDriver session handling
+- AngularJS table loading timing
+- Network-dependent test reliability
+The unit tests (test_format_station_scenarios, test_format_station_edge_cases)
+provide reliable validation of the formatting logic without browser dependencies.
+For live data tests, consider implementing retry mechanisms and better timeout handling.
+"""
+import sys
+from pathlib import Path
+# Add the parent directory to sys.path so we can import the OMIRL modules
+sys.path.insert(0, str(Path(__file__).parent.parent.parent))
+from tools.omirl.shared import OMIRLFilterSet
+from tools.omirl.tables.valori_stazioni import fetch_valori_stazioni
+def test_valori_stazioni_basic():
+    """Test basic valori_stazioni functionality with minimal filters"""
+    print("🧪 Testing basic valori_stazioni functionality...")
+    # Test with minimal filters
+    filter_dict = {
+        "tipo_sensore": "Temperatura"
+    }
+    filters = OMIRLFilterSet(filter_dict)
+    result = fetch_valori_stazioni(filters)
+    print(f"   Success: {result.success}")
+    print(f"   Message: {result.message}")
+    print(f"   Data count: {len(result.data) if result.data else 0}")
+    print(f"   Warnings: {result.warnings}")
+    print(f"   Metadata keys: {list(result.metadata.keys()) if result.metadata else []}")
+    return result.success
+def test_valori_stazioni_with_provincia():
+    """Test valori_stazioni with provincia filter"""
+    print("\n🧪 Testing valori_stazioni with provincia filter...")
+    filter_dict = {
+        "tipo_sensore": "Temperatura",
+        "provincia": "GE"
+    }
+    filters = OMIRLFilterSet(filter_dict)
+    result = fetch_valori_stazioni(filters)
+    print(f"   Success: {result.success}")
+    print(f"   Message: {result.message}")
+    print(f"   Data count: {len(result.data) if result.data else 0}")
+    return result.success
+def test_valori_stazioni_with_stazione():
+    """Test valori_stazioni with specific station"""
+    print("\n🧪 Testing valori_stazioni with specific station...")
+    filter_dict = {
+        "tipo_sensore": "Temperatura",
+        "provincia": "GE",
+        "stazione": "GENOVA CENTRO FUNZIONALE"
+    }
+    filters = OMIRLFilterSet(filter_dict)
+    result = fetch_valori_stazioni(filters)
+    print(f"   Success: {result.success}")
+    print(f"   Message: {result.message}")
+    print(f"   Data count: {len(result.data) if result.data else 0}")
+    return result.success
+def test_new_api_compatibility():
+    """Test the new OMIRLFilterSet API"""
+    print("\n🧪 Testing new OMIRLFilterSet API...")
+    # Create filters using new API
+    filters = OMIRLFilterSet({
+        "tipo_sensore": "Temperatura",
+        "provincia": "GE"
+    })
+    result = fetch_valori_stazioni(filters)
+    print(f"   Success: {result.success}")
+    print(f"   Message: {result.message}")
+    print(f"   Data count: {len(result.data) if result.data else 0}")
+    return result.success
+def test_invalid_filters():
+    """Test handling of invalid filters"""
+    print("\n🧪 Testing invalid filter handling...")
+    filter_dict = {
+        "tipo_sensore": "InvalidSensor",
+        "provincia": "InvalidProvince"
+    }
+    filters = OMIRLFilterSet(filter_dict)
+    result = fetch_valori_stazioni(filters)
+    print(f"   Success: {result.success}")
+    print(f"   Message: {result.message}")
+    print(f"   Expected failure: {'✅' if not result.success else '❌'}")
+    return not result.success  # We expect this to fail
+def test_format_station_scenarios():
+    """Test the new formatting function with different scenarios"""
+    print("\n🧪 Testing station formatting scenarios...")
+    # Import the formatting function
+    from tools.omirl.tables.valori_stazioni import format_station_data_simple
+    # Mock station data
+    mock_station_data = [
+        {
+            "Nome": "Stazione Test 1",
+            "Comune": "Genova",
+            "Provincia": "GE",
+            "ultimo": "22.5",
+            "max": "25.3",
+            "min": "18.7",
+            "unita": "°C"
+        },
+        {
+            "Nome": "Stazione Test 2",
+            "Comune": "Genova",
+            "Provincia": "GE",
+            "ultimo": "21.8",
+            "max": "24.1",
+            "min": "19.2",
+            "unita": "°C"
+        },
+        {
+            "Nome": "Stazione Savona",
+            "Comune": "Savona",
+            "Provincia": "SV",
+            "ultimo": "23.1",
+            "max": "26.0",
+            "min": "20.1",
+            "unita": "°C"
+        }
+    ]
+    # Scenario 1: Only tipo_sensore (show all data)
+    print("\n--- Scenario 1: Only tipo_sensore ---")
+    filters1 = OMIRLFilterSet({"tipo_sensore": "Temperatura"})
+    result1 = format_station_data_simple(mock_station_data, filters1, "Temperatura")
+    print(f"📋 All stations output:\n{result1}")
+    # Scenario 2: tipo_sensore + stazione (specific station details)
+    print("\n--- Scenario 2: tipo_sensore + stazione ---")
+    filters2 = OMIRLFilterSet({"tipo_sensore": "Temperatura", "stazione": "Stazione Test 1"})
+    result2 = format_station_data_simple([mock_station_data[0]], filters2, "Temperatura")
+    print(f"📋 Specific station output:\n{result2}")
+    # Scenario 3: tipo_sensore + comune
+    print("\n--- Scenario 3: tipo_sensore + comune ---")
+    filters3 = OMIRLFilterSet({"tipo_sensore": "Temperatura", "comune": "Genova"})
+    genova_stations = [s for s in mock_station_data if s["Comune"] == "Genova"]
+    result3 = format_station_data_simple(genova_stations, filters3, "Temperatura")
+    print(f"📋 Comune-filtered output:\n{result3}")
+    # Scenario 4: tipo_sensore + provincia
+    print("\n--- Scenario 4: tipo_sensore + provincia ---")
+    filters4 = OMIRLFilterSet({"tipo_sensore": "Temperatura", "provincia": "GE"})
+    ge_stations = [s for s in mock_station_data if s["Provincia"] == "GE"]
+    result4 = format_station_data_simple(ge_stations, filters4, "Temperatura")
+    print(f"📋 Provincia-filtered output:\n{result4}")
+    print("✅ Station formatting scenarios completed")
+def test_format_station_edge_cases():
+    """Test edge cases for station formatting"""
+    print("\n🧪 Testing station formatting edge cases...")
+    from tools.omirl.tables.valori_stazioni import format_station_data_simple
+    # Empty data
+    filters_empty = OMIRLFilterSet({"tipo_sensore": "Temperatura"})
+    result_empty = format_station_data_simple([], filters_empty, "Temperatura")
+    print(f"📋 Empty data result:\n{result_empty}")
+    assert "Nessun dato trovato" in result_empty
+    # Data with missing fields
+    incomplete_data = [{
+        "Nome": "Incomplete Station",
+        "Comune": "Unknown",
+        "ultimo": "N/A",
+        "max": None,
+        "min": "",
+        "unita": "°C"
+    }]
+    result_incomplete = format_station_data_simple(incomplete_data, filters_empty, "Temperatura")
+    print(f"\n📋 Incomplete data result:\n{result_incomplete}")
+    assert "N/A" in result_incomplete
+    print("✅ Edge cases testing completed")
+def test_valori_stazioni_invalid_inputs():
+    """Test error handling with invalid inputs"""
+    print("\n🧪 Testing valori_stazioni invalid inputs...")
+    # Missing tipo_sensore
+    print("\n--- Missing tipo_sensore ---")
+    filters1 = OMIRLFilterSet({"provincia": "GE"})
+    result1 = fetch_valori_stazioni(filters1)
+    print(f"Expected failure: {result1.message}")
+    assert not result1.success, "Should fail when tipo_sensore is missing"
+    # Invalid tipo_sensore
+    print("\n--- Invalid tipo_sensore ---")
+    filters2 = OMIRLFilterSet({"tipo_sensore": "InvalidSensor"})
+    result2 = fetch_valori_stazioni(filters2)
+    print(f"Result: {result2.message}")
+    # May succeed but return empty data, or fail validation
+    # Empty filters
+    print("\n--- Empty filters ---")
+    filters3 = OMIRLFilterSet({})
+    result3 = fetch_valori_stazioni(filters3)
+    print(f"Expected failure: {result3.message}")
+    assert not result3.success, "Should fail when no filters provided"
+    print("✅ Invalid inputs testing completed")
+if __name__ == "__main__":
+    print("🚀 Starting OMIRL Valori Stazioni Tests")
+    print("=====================================")
+    tests = [
+        test_valori_stazioni_basic,
+        test_valori_stazioni_with_provincia,
+        test_valori_stazioni_with_stazione,
+        test_new_api_compatibility,
+        test_invalid_filters,
+        test_format_station_scenarios,
+        test_format_station_edge_cases,
+        test_valori_stazioni_invalid_inputs
+    ]
+    results = []
+    try:
+        for test_func in tests:
+            try:
+                result = test_func()
+                results.append(result)
+            except Exception as e:
+                print(f"   ❌ Test failed with exception: {e}")
+                results.append(False)
+        # Summary
+        passed = sum(results)
+        total = len(results)
+        print(f"\n📊 Test Results: {passed}/{total} tests passed")
+        if passed == total:
+            print("✨ All tests completed successfully!")
+        else:
+            print(f"⚠️  {total - passed} tests failed")
+    except Exception as e:
+        print(f"\n❌ Test suite failed with error: {e}")
+        import traceback
+        traceback.print_exc()
+        sys.exit(1)

tests/test_llm_summarization_node.py ADDED Viewed

File without changes

tests/test_omirl_implementation.py CHANGED Viewed

@@ -122,7 +122,6 @@ if __name__ == "__main__":
         await test_massimi_precipitazione_zona()
         await test_massimi_precipitazione_provincia()
         await test_geographic_filtering_validation()
-        await test_task_agnostic_summarization()
         print("
 🏁 All manual tests completed!")

         await test_massimi_precipitazione_zona()
         await test_massimi_precipitazione_provincia()
         await test_geographic_filtering_validation()
         print("
 🏁 All manual tests completed!")

tests/test_phase4_workflow.py ADDED Viewed

File without changes

tests/test_valori_stazioni.py CHANGED Viewed

@@ -1,155 +0,0 @@
-#!/usr/bin/env python3
-"""
-Test for OMIRL Valori Stazioni Task
-Tests the refactored valori_stazioni functionality that extracts station
-measurement data from OMIRL tables using the new YAML-based architecture.
-Created: September 5, 2025
-Branch: omirl_refactor
-Purpose: Validate the refactored valori_stazioni task implementation
-"""
-import sys
-from pathlib import Path
-# Add the parent directory to sys.path so we can import the OMIRL modules
-sys.path.insert(0, str(Path(__file__).parent.parent))
-from tools.omirl.shared import OMIRLFilterSet
-from tools.omirl.tables.valori_stazioni import fetch_valori_stazioni, fetch_valori_stazioni_legacy
-def test_valori_stazioni_basic():
-    """Test basic valori_stazioni functionality with minimal filters"""
-    print("🧪 Testing basic valori_stazioni functionality...")
-    # Test with minimal filters
-    filter_dict = {
-        "tipo_sensore": "Temperatura"
-    }
-    filters = OMIRLFilterSet(filter_dict)
-    result = fetch_valori_stazioni(filters)
-    print(f"   Success: {result.success}")
-    print(f"   Message: {result.message}")
-    print(f"   Data count: {len(result.data) if result.data else 0}")
-    print(f"   Warnings: {result.warnings}")
-    print(f"   Metadata keys: {list(result.metadata.keys()) if result.metadata else []}")
-    return result.success
-def test_valori_stazioni_with_provincia():
-    """Test valori_stazioni with provincia filter"""
-    print("\n🧪 Testing valori_stazioni with provincia filter...")
-    filter_dict = {
-        "tipo_sensore": "Temperatura",
-        "provincia": "GE"
-    }
-    filters = OMIRLFilterSet(filter_dict)
-    result = fetch_valori_stazioni(filters)
-    print(f"   Success: {result.success}")
-    print(f"   Message: {result.message}")
-    print(f"   Data count: {len(result.data) if result.data else 0}")
-    return result.success
-def test_valori_stazioni_with_stazione():
-    """Test valori_stazioni with specific station"""
-    print("\n🧪 Testing valori_stazioni with specific station...")
-    filter_dict = {
-        "tipo_sensore": "Temperatura",
-        "provincia": "GE",
-        "stazione": "GENOVA CENTRO FUNZIONALE"
-    }
-    filters = OMIRLFilterSet(filter_dict)
-    result = fetch_valori_stazioni(filters)
-    print(f"   Success: {result.success}")
-    print(f"   Message: {result.message}")
-    print(f"   Data count: {len(result.data) if result.data else 0}")
-    return result.success
-def test_legacy_compatibility():
-    """Test the legacy API for backward compatibility"""
-    print("\n🧪 Testing legacy API compatibility...")
-    result = fetch_valori_stazioni_legacy(
-        tipo_sensore="Temperatura",
-        provincia="GE"
-    )
-    print(f"   Success: {result.success}")
-    print(f"   Message: {result.message}")
-    print(f"   Data count: {len(result.data) if result.data else 0}")
-    return result.success
-def test_invalid_filters():
-    """Test handling of invalid filters"""
-    print("\n🧪 Testing invalid filter handling...")
-    filter_dict = {
-        "tipo_sensore": "InvalidSensor",
-        "provincia": "InvalidProvince"
-    }
-    filters = OMIRLFilterSet(filter_dict)
-    result = fetch_valori_stazioni(filters)
-    print(f"   Success: {result.success}")
-    print(f"   Message: {result.message}")
-    print(f"   Expected failure: {'✅' if not result.success else '❌'}")
-    return not result.success  # We expect this to fail
-if __name__ == "__main__":
-    print("🚀 Starting OMIRL Valori Stazioni Tests")
-    print("=====================================")
-    tests = [
-        test_valori_stazioni_basic,
-        test_valori_stazioni_with_provincia,
-        test_valori_stazioni_with_stazione,
-        test_legacy_compatibility,
-        test_invalid_filters
-    ]
-    results = []
-    try:
-        for test_func in tests:
-            try:
-                result = test_func()
-                results.append(result)
-            except Exception as e:
-                print(f"   ❌ Test failed with exception: {e}")
-                results.append(False)
-        # Summary
-        passed = sum(results)
-        total = len(results)
-        print(f"\n📊 Test Results: {passed}/{total} tests passed")
-        if passed == total:
-            print("✨ All tests completed successfully!")
-        else:
-            print(f"⚠️  {total - passed} tests failed")
-    except Exception as e:
-        print(f"\n❌ Test suite failed with error: {e}")
-        import traceback
-        traceback.print_exc()
-        sys.exit(1)

tools/omirl/adapter.py CHANGED Viewed

@@ -9,14 +9,14 @@ and handles input validation, delegation, and output formatting.
 Purpose:
 - Validate agent requests against tool specification
 - Route requests to appropriate task-specific modules
-- Format responses using task-agnostic summarization
 - Handle graceful failure (never raise exceptions)
 - Manage browser sessions and cleanup
 Dependencies:
 - Uses YAML-based validation architecture
 - Delegates to task-specific modules in tables/ directory
-- Uses task-agnostic summarization service for all responses
 - Agent expects this interface to match the tool registry schema
 Input Contract:
@@ -29,7 +29,7 @@ Input Contract:
 Output Contract:
     {
-        "summary_text": "LLM-generated operational summary",
         "artifacts": ["path/to/generated/files"],
         "sources": ["https://omirl.regione.liguria.it/..."],
         "metadata": {"timestamp": "...", "filters_applied": "..."},
@@ -38,8 +38,8 @@ Output Contract:
 Task Architecture:
 - Each subtask (valori_stazioni, massimi_precipitazione) has its own module
-- All tasks use standardized TaskSummary and DataInsights formats
-- LLM-based summarization provides rich operational insights
 - Geographic resolution service handles municipality→province mapping
 Note: This is the ONLY file that should be imported by the agent registry.
@@ -69,7 +69,7 @@ async def omirl_tool(
     This function provides the standardized interface for the agent to access
     OMIRL weather station data. It validates inputs, delegates to appropriate
-    task-specific services, and formats responses with LLM-generated summaries.
     Args:
         mode: Operation mode ("tables" for station data extraction)
@@ -87,7 +87,7 @@ async def omirl_tool(
     Returns:
         Dict containing:
-        - summary_text: LLM-generated operational summary with insights
         - artifacts: List of generated JSON file paths
         - sources: List of OMIRL data source URLs
         - metadata: Extraction metadata and statistics
@@ -229,7 +229,7 @@ async def omirl_tool(
         if result.metadata and result.metadata.get("summary"):
             summary_data = result.metadata.get("summary")
-            # Handle new task-agnostic summary format
             if isinstance(summary_data, dict) and "summary_text" in summary_data:
                 summary_text = summary_data["summary_text"]
             elif isinstance(summary_data, str):
@@ -295,9 +295,6 @@ def _format_error_response(
     }
-# Tool specification for agent registry
 # Tool specification for agent registry
 OMIRL_TOOL_SPEC = {
     "name": "omirl_tool",

 Purpose:
 - Validate agent requests against tool specification
 - Route requests to appropriate task-specific modules
+- Format responses using task-specific formatting (no LLM dependency)
 - Handle graceful failure (never raise exceptions)
 - Manage browser sessions and cleanup
 Dependencies:
 - Uses YAML-based validation architecture
 - Delegates to task-specific modules in tables/ directory
+- Uses task-specific formatting for fast, reliable output
 - Agent expects this interface to match the tool registry schema
 Input Contract:
 Output Contract:
     {
+        "summary_text": "Task-specific formatted summary with data details",
         "artifacts": ["path/to/generated/files"],
         "sources": ["https://omirl.regione.liguria.it/..."],
         "metadata": {"timestamp": "...", "filters_applied": "..."},
 Task Architecture:
 - Each subtask (valori_stazioni, massimi_precipitazione) has its own module
+- All tasks provide immediate, formatted output without LLM dependencies
+- Task-specific formatting provides consistent bullet-point summaries
 - Geographic resolution service handles municipality→province mapping
 Note: This is the ONLY file that should be imported by the agent registry.
     This function provides the standardized interface for the agent to access
     OMIRL weather station data. It validates inputs, delegates to appropriate
+    task-specific services, and formats responses with task-specific summaries.
     Args:
         mode: Operation mode ("tables" for station data extraction)
     Returns:
         Dict containing:
+        - summary_text: Task-specific formatted summary with data details
         - artifacts: List of generated JSON file paths
         - sources: List of OMIRL data source URLs
         - metadata: Extraction metadata and statistics
         if result.metadata and result.metadata.get("summary"):
             summary_data = result.metadata.get("summary")
+            # Handle task-specific summary format
             if isinstance(summary_data, dict) and "summary_text" in summary_data:
                 summary_text = summary_data["summary_text"]
             elif isinstance(summary_data, str):
     }
 # Tool specification for agent registry
 OMIRL_TOOL_SPEC = {
     "name": "omirl_tool",

tools/omirl/tables/__init__.py CHANGED Viewed

@@ -5,9 +5,8 @@ This package contains all table-based data extraction tasks for OMIRL.
 These tasks correspond to the "Tabelle" section of the OMIRL website.
 """
-from .valori_stazioni import fetch_valori_stazioni, fetch_valori_stazioni_legacy
 __all__ = [
-    "fetch_valori_stazioni",
-    "fetch_valori_stazioni_legacy"  # For backward compatibility
 ]

 These tasks correspond to the "Tabelle" section of the OMIRL website.
 """
+from .valori_stazioni import fetch_valori_stazioni
 __all__ = [
+    "fetch_valori_stazioni"
 ]

tools/omirl/tables/massimi_precipitazione.py CHANGED Viewed

@@ -105,78 +105,10 @@ async def fetch_massimi_precipitazione_async(filters: OMIRLFilterSet) -> OMIRLRe
         result.data = filtered_data
         result.message = f"Estratti dati precipitazione massima con filtri: {all_filters}"
-                # Generate precipitation-specific summary using new task-agnostic service
         if filtered_data:
-            try:
-                # Import new summarization service
-                from services.text.task_agnostic_summarization import (
-                    create_massimi_precipitazione_summary,
-                    analyze_precipitation_trends,
-                    get_multi_task_summarizer
-                )
-                # Determine geographic and temporal scope
-                if all_filters.get('zona_allerta'):
-                    geographic_scope = f"Zona d'allerta {all_filters['zona_allerta']}"
-                else:
-                    geographic_scope = f"Provincia {all_filters.get('provincia', 'Unknown')}"
-                if all_filters.get('periodo'):
-                    temporal_scope = f"Period {all_filters['periodo']}"
-                else:
-                    temporal_scope = "All periods (5'-24h)"
-                # Analyze precipitation data for trends
-                data_insights = analyze_precipitation_trends(filtered_data)
-                # Create standardized task summary
-                task_summary = create_massimi_precipitazione_summary(
-                    geographic_scope=geographic_scope,
-                    temporal_scope=temporal_scope,
-                    data_insights=data_insights,
-                    filters_applied=all_filters
-                )
-                # For now, generate immediate summary (multi-task will be implemented in adapter)
-                summarizer = get_multi_task_summarizer()
-                summarizer.clear_results()  # Clear any previous results
-                summarizer.add_task_result(task_summary)
-                summary = await summarizer.generate_final_summary(query_context="massimi precipitazione")
-                result.update_metadata(summary=summary)
-            except ImportError as e:
-                logger.warning(f"⚠️ New summarization service not available: {e}")
-                # Fallback to simple summary
-                if all_filters.get('periodo'):
-                    # Specific time period was requested
-                    periodo = all_filters['periodo']
-                    zona_count = len(filtered_data.get("zona_allerta", []))
-                    province_count = len(filtered_data.get("province", []))
-                    if zona_count > 0:
-                        summary = f"🌧️ Precipitazione massima - Zona d'allerta: {zona_count} record trovati per periodo {periodo}"
-                    else:
-                        summary = f"🌧️ Precipitazione massima - Provincia: {province_count} record trovati per periodo {periodo}"
-                else:
-                    # All time periods included - summarize trends
-                    zona_count = len(filtered_data.get("zona_allerta", []))
-                    province_count = len(filtered_data.get("province", []))
-                    if zona_count > 0:
-                        zona_name = all_filters.get('zona_allerta', all_filters.get('zona'))
-                        summary = f"🌧️ Precipitazione massima - Zona d'allerta {zona_name}: dati completi per tutti i periodi temporali (5'-24h)"
-                    else:
-                        provincia_name = filters.provincia if hasattr(filters, 'provincia') and filters.provincia else all_filters.get('provincia')
-                        summary = f"🌧️ Precipitazione massima - Provincia {provincia_name}: dati completi per tutti i periodi temporali (5'-24h)"
-                result.update_metadata(summary=summary)
-            except Exception as e:
-                logger.error(f"❌ Error in precipitation summarization: {e}")
-                # Basic fallback summary if everything fails
-                zona_count = len(filtered_data.get("zona_allerta", []))
-                province_count = len(filtered_data.get("province", []))
-                result.update_metadata(summary=f"🌧️ Estratti dati precipitazione massima: {zona_count} zone d'allerta, {province_count} province")
         # Add detailed metadata
         result.update_metadata(
@@ -396,6 +328,11 @@ def _parse_single_value(raw_value: str) -> Dict[str, Optional[str]]:
                 "time": match.group(2).strip(),
                 "station": match.group(3).strip()
             }
         else:
             return {
                 "value": None,
@@ -407,4 +344,124 @@ def _parse_single_value(raw_value: str) -> Dict[str, Optional[str]]:
             "value": None,
             "time": None,
             "station": raw_value
-        }

         result.data = filtered_data
         result.message = f"Estratti dati precipitazione massima con filtri: {all_filters}"
+        # Generate simple formatted summary (no LLM dependency)
         if filtered_data:
+            summary = format_precipitation_data_simple(filtered_data, all_filters)
+            result.update_metadata(summary=summary)
         # Add detailed metadata
         result.update_metadata(
                 "time": match.group(2).strip(),
                 "station": match.group(3).strip()
             }
+            return {
+                "value": float(match.group(1)),
+                "time": match.group(2).strip(),
+                "station": match.group(3).strip()
+            }
         else:
             return {
                 "value": None,
             "value": None,
             "time": None,
             "station": raw_value
+        }
+def format_precipitation_data_simple(
+    filtered_data: Dict[str, List[Dict]],
+    filters: Dict[str, Any]
+) -> str:
+    """
+    Generate simple, readable summary of precipitation data without LLM.
+    This function provides task-specific formatting that turns raw precipitation
+    data into readable bullet points with basic statistics.
+    Args:
+        filtered_data: Dictionary with 'zona_allerta' and 'province' keys
+        filters: Applied filters (zona_allerta, provincia, periodo, etc.)
+    Returns:
+        Formatted string with bullet points and basic statistics
+    """
+    if not filtered_data or (not filtered_data.get("zona_allerta") and not filtered_data.get("province")):
+        return "🌧️ **Precipitazioni massime**: Nessun dato trovato per i filtri specificati"
+    lines = []
+    time_periods = ["5'", "15'", "30'", "1h", "3h", "6h", "12h", "24h"]
+    # Process zona d'allerta data
+    zona_data = filtered_data.get("zona_allerta", [])
+    if zona_data:
+        zona_name = filters.get('zona_allerta') or filters.get('zona', 'Unknown')
+        lines.append(f"🌧️ **Zona d'allerta {zona_name}**:")
+        for record in zona_data:
+            # Extract precipitation values for different time periods
+            precip_values = []
+            for period in time_periods:
+                if period in record and record[period]:
+                    # Parse the value (format: "value [time] station")
+                    raw_value = record[period]
+                    parsed = _parse_single_value(raw_value)
+                    if parsed["value"] is not None:
+                        precip_values.append({
+                            "period": period,
+                            "value": parsed["value"],
+                            "station": parsed["station"],
+                            "time": parsed["time"]
+                        })
+            if precip_values:
+                # Show range of values found
+                values_only = [pv["value"] for pv in precip_values]
+                min_val, max_val = min(values_only), max(values_only)
+                # Find the period with max value
+                max_period_data = max(precip_values, key=lambda x: x["value"])
+                if filters.get('periodo'):
+                    # Specific period requested
+                    periodo_data = [pv for pv in precip_values if pv["period"] == filters['periodo']]
+                    if periodo_data:
+                        pd = periodo_data[0]
+                        lines.append(f"  • **{filters['periodo']}**: {pd['value']}mm alle {pd['time']} ({pd['station']})")
+                    else:
+                        lines.append(f"  • **{filters['periodo']}**: Nessun dato disponibile")
+                else:
+                    # All periods - show exhaustive details for each period
+                    lines.append(f"  • **Riepilogo**: {min_val}-{max_val}mm su {len(precip_values)} periodi")
+                    for pv in sorted(precip_values, key=lambda x: time_periods.index(x["period"])):
+                        lines.append(f"  • **{pv['period']}**: {pv['value']}mm alle {pv['time']} ({pv['station']})")
+            else:
+                lines.append(f"  • Nessun dato di precipitazione disponibile")
+    # Process province data
+    province_data = filtered_data.get("province", [])
+    if province_data:
+        provincia_name = filters.get('provincia', 'Unknown')
+        if zona_data:  # Add spacing if we had zona data too
+            lines.append("")
+        lines.append(f"🌧️ **Provincia {provincia_name}**:")
+        for record in province_data:
+            # Extract precipitation values for different time periods
+            precip_values = []
+            for period in time_periods:
+                if period in record and record[period]:
+                    # Parse the value (format: "value [time] station")
+                    raw_value = record[period]
+                    parsed = _parse_single_value(raw_value)
+                    if parsed["value"] is not None:
+                        precip_values.append({
+                            "period": period,
+                            "value": parsed["value"],
+                            "station": parsed["station"],
+                            "time": parsed["time"]
+                        })
+            if precip_values:
+                # Show range of values found
+                values_only = [pv["value"] for pv in precip_values]
+                min_val, max_val = min(values_only), max(values_only)
+                # Find the period with max value
+                max_period_data = max(precip_values, key=lambda x: x["value"])
+                if filters.get('periodo'):
+                    # Specific period requested
+                    periodo_data = [pv for pv in precip_values if pv["period"] == filters['periodo']]
+                    if periodo_data:
+                        pd = periodo_data[0]
+                        lines.append(f"  • **{filters['periodo']}**: {pd['value']}mm alle {pd['time']} ({pd['station']})")
+                    else:
+                        lines.append(f"  • **{filters['periodo']}**: Nessun dato disponibile")
+                else:
+                    # All periods - show exhaustive details for each period
+                    lines.append(f"  • **Riepilogo**: {min_val}-{max_val}mm su {len(precip_values)} periodi")
+                    for pv in sorted(precip_values, key=lambda x: time_periods.index(x["period"])):
+                        lines.append(f"  • **{pv['period']}**: {pv['value']}mm alle {pv['time']} ({pv['station']})")
+            else:
+                lines.append(f"  • Nessun dato di precipitazione disponibile")
+    return "\n".join(lines)

tools/omirl/tables/valori_stazioni.py CHANGED Viewed

@@ -58,37 +58,10 @@ async def fetch_valori_stazioni_async(filters: OMIRLFilterSet) -> OMIRLResult:
             result.data = filtered_data
             result.message = f"Estratti {len(filtered_data)} record dalle stazioni meteorologiche"
-            # Generate summary using task-agnostic summarization
             if filtered_data:
-                try:
-                    from services.text.task_agnostic_summarization import (
-                        create_valori_stazioni_summary,
-                        analyze_station_data,
-                        get_multi_task_summarizer
-                    )
-                    # Analyze the station data for insights
-                    data_insights = analyze_station_data(filtered_data, sensor_type)
-                    # Create standardized summary
-                    task_summary = create_valori_stazioni_summary(
-                        geographic_scope=filters.provincia or filters.comune or "Liguria",
-                        data_insights=data_insights,
-                        filters_applied=all_filters
-                    )
-                    # Generate LLM-based summary using MultiTaskSummarizer
-                    summarizer = get_multi_task_summarizer()
-                    summarizer.clear_results()  # Clear any previous results
-                    summarizer.add_task_result(task_summary)
-                    summary = await summarizer.generate_final_summary(
-                        query_context=f"valori stazioni {sensor_type}"
-                    )
-                    result.update_metadata(summary=summary)
-                except ImportError:
-                    # Task-agnostic summarization service not available - continue without summary
-                    pass
             # Add filter metadata
             result.update_metadata(
@@ -151,23 +124,106 @@ def _apply_additional_filters(data: List[Dict], filters: OMIRLFilterSet) -> List
     return filtered_data
-# Backward compatibility function
-def fetch_valori_stazioni_legacy(tipo_sensore=None, provincia=None, comune=None, stazione=None):
     """
-    Legacy function for backward compatibility
-    This maintains the old API while using the new implementation internally.
     """
-    # Convert legacy parameters to new filter format
-    filter_dict = {}
-    if tipo_sensore:
-        filter_dict["tipo_sensore"] = tipo_sensore
-    if provincia:
-        filter_dict["provincia"] = provincia
-    if comune:
-        filter_dict["comune"] = comune
-    if stazione:
-        filter_dict["stazione"] = stazione
-    filters = OMIRLFilterSet(filter_dict)
-    return fetch_valori_stazioni(filters)

             result.data = filtered_data
             result.message = f"Estratti {len(filtered_data)} record dalle stazioni meteorologiche"
+            # Generate simple formatted summary (no LLM dependency)
             if filtered_data:
+                summary = format_station_data_simple(filtered_data, filters, sensor_type)
+                result.update_metadata(summary=summary)
             # Add filter metadata
             result.update_metadata(
     return filtered_data
+def format_station_data_simple(
+    filtered_data: List[Dict],
+    filters: OMIRLFilterSet,
+    sensor_type: str
+) -> str:
     """
+    Generate simple, readable summary of station data without LLM.
+    This function provides task-specific formatting that turns raw station
+    data into readable bullet points based on the filtering criteria.
+    Args:
+        filtered_data: List of station dictionaries
+        filters: OMIRLFilterSet with applied filters
+        sensor_type: Type of sensor (Temperatura, Precipitazione, etc.)
+    Returns:
+        Formatted string with bullet points based on filter specificity
     """
+    if not filtered_data:
+        return f"🌡️ **Stazioni {sensor_type}**: Nessun dato trovato per i filtri specificati"
+    lines = [f"🌡️ **Stazioni {sensor_type}** ({len(filtered_data)} record):"]
+    # Scenario 1: Only tipo_sensore provided - show all table content in bullet points
+    if not filters.stazione and not filters.comune and not filters.provincia:
+        # Group by province for better organization
+        by_province = {}
+        for station in filtered_data:
+            prov = station.get('Provincia', 'Unknown')
+            if prov not in by_province:
+                by_province[prov] = []
+            by_province[prov].append(station)
+        for province, stations in sorted(by_province.items()):
+            lines.append(f"  • **{province}**: {len(stations)} stazioni")
+            for station in stations[:10]:  # Limit to first 10 per province to avoid overwhelming output
+                ultimo = station.get('ultimo', 'N/A')
+                max_val = station.get('max', 'N/A')
+                min_val = station.get('min', 'N/A')
+                unit = station.get('unita', '')
+                nome = station.get('Nome', 'Unknown')
+                comune = station.get('Comune', 'Unknown')
+                lines.append(f"    - **{nome}** ({comune}): {ultimo}{unit} (max: {max_val}{unit}, min: {min_val}{unit})")
+            if len(stations) > 10:
+                lines.append(f"    ... e altre {len(stations) - 10} stazioni")
+    # Scenario 2: tipo_sensore + stazione - show specific station details
+    elif filters.stazione:
+        for station in filtered_data:
+            ultimo = station.get('ultimo', 'N/A')
+            max_val = station.get('max', 'N/A')
+            min_val = station.get('min', 'N/A')
+            unit = station.get('unita', '')
+            nome = station.get('Nome', 'Unknown')
+            comune = station.get('Comune', 'Unknown')
+            provincia = station.get('Provincia', 'Unknown')
+            lines.append(f"  • **{nome}** ({comune}, {provincia}):")
+            lines.append(f"    - **Ultimo**: {ultimo}{unit}")
+            lines.append(f"    - **Massimo**: {max_val}{unit}")
+            lines.append(f"    - **Minimo**: {min_val}{unit}")
+    # Scenario 3: tipo_sensore + comune - show all stations in that comune
+    elif filters.comune:
+        comune_name = filters.comune
+        lines.append(f"  • **Comune: {comune_name}**")
+        for station in filtered_data:
+            ultimo = station.get('ultimo', 'N/A')
+            max_val = station.get('max', 'N/A')
+            min_val = station.get('min', 'N/A')
+            unit = station.get('unita', '')
+            nome = station.get('Nome', 'Unknown')
+            lines.append(f"    - **{nome}**: ultimo {ultimo}{unit}, max {max_val}{unit}, min {min_val}{unit}")
+    # Scenario 4: tipo_sensore + provincia - show all stations in that provincia
+    elif filters.provincia:
+        provincia_name = filters.provincia
+        lines.append(f"  • **Provincia: {provincia_name}**")
+        # Group by comune within the provincia
+        by_comune = {}
+        for station in filtered_data:
+            comune = station.get('Comune', 'Unknown')
+            if comune not in by_comune:
+                by_comune[comune] = []
+            by_comune[comune].append(station)
+        for comune, stations in sorted(by_comune.items()):
+            lines.append(f"    - **{comune}**: {len(stations)} stazioni")
+            for station in stations:
+                ultimo = station.get('ultimo', 'N/A')
+                max_val = station.get('max', 'N/A')
+                min_val = station.get('min', 'N/A')
+                unit = station.get('unita', '')
+                nome = station.get('Nome', 'Unknown')
+                lines.append(f"      • **{nome}**: ultimo {ultimo}{unit}, max {max_val}{unit}, min {min_val}{unit}")
+    return "\n".join(lines)