Spaces:

BinKhoaLe1812
/

EdSummariser

Running

App Files Community

LiamKhoaLe committed on Sep 21, 2025

Commit

48a0d5a

1 Parent(s): 6f12b05

Update report CoT loop and fix bug

Browse files

Files changed (2) hide show

routes/reports.py +75 -12
utils/api/router.py +14 -6

routes/reports.py CHANGED Viewed

@@ -122,12 +122,12 @@ async def generate_report(
     logger.info("[REPORT] Starting CoT planning phase")
     update_report_status(session_id, "planning", "Planning action...", 25)
     # Use enhanced instructions for better CoT planning
-    cot_plan = await generate_cot_plan(enhanced_instructions, file_summary, context_text, web_context_block, nvidia_rotator)
     # Step 2: Execute detailed subtasks based on CoT plan
     logger.info("[REPORT] Executing detailed subtasks")
     update_report_status(session_id, "processing", "Processing data...", 40)
-    detailed_analysis = await execute_detailed_subtasks(cot_plan, context_text, web_context_block, eff_name, nvidia_rotator)
     # Step 3: Synthesize comprehensive report from detailed analysis
     logger.info("[REPORT] Synthesizing comprehensive report")
@@ -184,7 +184,7 @@ async def generate_report_pdf(
 # ────────────────────────────── Chain of Thought Report Generation ──────────────────
-async def generate_cot_plan(instructions: str, file_summary: str, context_text: str, web_context: str, nvidia_rotator) -> Dict[str, Any]:
     """Generate a detailed Chain of Thought plan for report generation using NVIDIA."""
     sys_prompt = """You are an expert research analyst and report planner. Given a user's request and available materials, create a comprehensive plan for generating a detailed, professional report.
@@ -262,23 +262,86 @@ Create a detailed plan for generating a comprehensive report that addresses the
     try:
         selection = {"provider": "nvidia", "model": "meta/llama-3.1-8b-instruct"}
-        response = await generate_answer_with_model(selection, sys_prompt, user_prompt, None, nvidia_rotator)
         # Parse JSON response
         import json
         json_text = response.strip()
         if json_text.startswith('```json'):
             json_text = json_text[7:-3].strip()
         elif json_text.startswith('```'):
             json_text = json_text[3:-3].strip()
         plan = json.loads(json_text)
         logger.info(f"[REPORT] CoT plan generated with {len(plan.get('report_structure', {}).get('sections', []))} sections")
         return plan
     except Exception as e:
         logger.warning(f"[REPORT] CoT planning failed: {e}")
-        # Fallback plan
         return {
             "analysis": {
                 "user_intent": instructions,
@@ -309,7 +372,7 @@ Create a detailed plan for generating a comprehensive report that addresses the
         }
-async def execute_detailed_subtasks(cot_plan: Dict[str, Any], context_text: str, web_context: str, filename: str, nvidia_rotator) -> Dict[str, Any]:
     """Execute detailed analysis for each subtask identified in the CoT plan."""
     detailed_analysis = {}
     synthesis_strategy = cot_plan.get("synthesis_strategy", {})
@@ -338,7 +401,7 @@ async def execute_detailed_subtasks(cot_plan: Dict[str, Any], context_text: str,
             # Generate comprehensive analysis for this subtask
             subtask_result = await analyze_subtask_comprehensive(
                 task, reasoning, sources_needed, depth, sub_actions, expected_output,
-                quality_checks, context_text, web_context, filename, nvidia_rotator
             )
             section_analysis["subtask_results"].append({
@@ -353,7 +416,7 @@ async def execute_detailed_subtasks(cot_plan: Dict[str, Any], context_text: str,
         # Generate section-level synthesis
         section_synthesis = await synthesize_section_analysis(
-            section_analysis, synthesis_strategy, nvidia_rotator
         )
         section_analysis["section_synthesis"] = section_synthesis
@@ -365,7 +428,7 @@ async def execute_detailed_subtasks(cot_plan: Dict[str, Any], context_text: str,
 async def analyze_subtask_comprehensive(task: str, reasoning: str, sources_needed: List[str], depth: str,
                                       sub_actions: List[str], expected_output: str, quality_checks: List[str],
-                                      context_text: str, web_context: str, filename: str, nvidia_rotator) -> str:
     """Analyze a specific subtask with comprehensive detail and sub-actions."""
     # Select appropriate context based on sources_needed
@@ -423,7 +486,7 @@ Perform the comprehensive analysis as specified, following all sub-actions and m
     try:
         selection = {"provider": "nvidia", "model": "meta/llama-3.1-8b-instruct"}
-        analysis = await generate_answer_with_model(selection, sys_prompt, user_prompt, None, nvidia_rotator)
         return analysis.strip()
     except Exception as e:
@@ -431,7 +494,7 @@ Perform the comprehensive analysis as specified, following all sub-actions and m
         return f"Analysis for '{task}' could not be completed due to processing error."
-async def synthesize_section_analysis(section_analysis: Dict[str, Any], synthesis_strategy: Dict[str, str], nvidia_rotator) -> str:
     """Synthesize all subtask results within a section into a coherent analysis."""
     section_title = section_analysis.get("title", "Unknown Section")
@@ -474,7 +537,7 @@ Synthesize these analyses into a comprehensive, coherent section that fulfills t
     try:
         selection = {"provider": "nvidia", "model": "meta/llama-3.1-8b-instruct"}
-        synthesis = await generate_answer_with_model(selection, sys_prompt, user_prompt, None, nvidia_rotator)
         return synthesis.strip()
     except Exception as e:

     logger.info("[REPORT] Starting CoT planning phase")
     update_report_status(session_id, "planning", "Planning action...", 25)
     # Use enhanced instructions for better CoT planning
+    cot_plan = await generate_cot_plan(enhanced_instructions, file_summary, context_text, web_context_block, nvidia_rotator, gemini_rotator)
     # Step 2: Execute detailed subtasks based on CoT plan
     logger.info("[REPORT] Executing detailed subtasks")
     update_report_status(session_id, "processing", "Processing data...", 40)
+    detailed_analysis = await execute_detailed_subtasks(cot_plan, context_text, web_context_block, eff_name, nvidia_rotator, gemini_rotator)
     # Step 3: Synthesize comprehensive report from detailed analysis
     logger.info("[REPORT] Synthesizing comprehensive report")
 # ────────────────────────────── Chain of Thought Report Generation ──────────────────
+async def generate_cot_plan(instructions: str, file_summary: str, context_text: str, web_context: str, nvidia_rotator, gemini_rotator) -> Dict[str, Any]:
     """Generate a detailed Chain of Thought plan for report generation using NVIDIA."""
     sys_prompt = """You are an expert research analyst and report planner. Given a user's request and available materials, create a comprehensive plan for generating a detailed, professional report.
     try:
         selection = {"provider": "nvidia", "model": "meta/llama-3.1-8b-instruct"}
+        response = await generate_answer_with_model(selection, sys_prompt, user_prompt, gemini_rotator, nvidia_rotator)
         # Parse JSON response
         import json
         json_text = response.strip()
+        logger.info(f"[REPORT] Raw CoT response length: {len(json_text)}")
+        logger.info(f"[REPORT] Raw CoT response preview: {json_text[:200]}...")
         if json_text.startswith('```json'):
             json_text = json_text[7:-3].strip()
         elif json_text.startswith('```'):
             json_text = json_text[3:-3].strip()
+        if not json_text:
+            raise ValueError("Empty response from model")
         plan = json.loads(json_text)
         logger.info(f"[REPORT] CoT plan generated with {len(plan.get('report_structure', {}).get('sections', []))} sections")
         return plan
     except Exception as e:
         logger.warning(f"[REPORT] CoT planning failed: {e}")
+        # Try a simpler fallback approach
+        try:
+            logger.info("[REPORT] Attempting simplified CoT planning")
+            simple_sys_prompt = """You are a report planner. Create a simple plan for a report based on the user's request.
+Return a JSON object with this structure:
+{
+  "analysis": {
+    "user_intent": "What the user wants to know",
+    "key_requirements": ["requirement1", "requirement2"],
+    "complexity_level": "intermediate",
+    "focus_areas": ["area1", "area2"]
+  },
+  "report_structure": {
+    "sections": [
+      {
+        "title": "Introduction",
+        "purpose": "Provide overview",
+        "subtasks": [{"task": "Summarize key points", "reasoning": "Set foundation", "sources_needed": ["local"], "depth": "detailed"}]
+      },
+      {
+        "title": "Main Analysis",
+        "purpose": "Address user's request",
+        "subtasks": [{"task": "Detailed analysis", "reasoning": "Core content", "sources_needed": ["local"], "depth": "comprehensive"}]
+      },
+      {
+        "title": "Conclusion",
+        "purpose": "Synthesize findings",
+        "subtasks": [{"task": "Summarize insights", "reasoning": "Provide closure", "sources_needed": ["local"], "depth": "detailed"}]
+      }
+    ]
+  },
+  "reasoning_flow": ["Analyze materials", "Extract insights", "Synthesize findings"]
+}"""
+            simple_user_prompt = f"""USER REQUEST: {instructions}
+FILE SUMMARY: {file_summary[:500]}
+Create a simple plan for this report."""
+            simple_response = await generate_answer_with_model(selection, simple_sys_prompt, simple_user_prompt, gemini_rotator, nvidia_rotator)
+            simple_json_text = simple_response.strip()
+            if simple_json_text.startswith('```json'):
+                simple_json_text = simple_json_text[7:-3].strip()
+            elif simple_json_text.startswith('```'):
+                simple_json_text = simple_json_text[3:-3].strip()
+            if simple_json_text:
+                simple_plan = json.loads(simple_json_text)
+                logger.info("[REPORT] Simplified CoT plan generated successfully")
+                return simple_plan
+        except Exception as simple_e:
+            logger.warning(f"[REPORT] Simplified CoT planning also failed: {simple_e}")
+        # Final fallback plan
+        logger.info("[REPORT] Using hardcoded fallback plan")
         return {
             "analysis": {
                 "user_intent": instructions,
         }
+async def execute_detailed_subtasks(cot_plan: Dict[str, Any], context_text: str, web_context: str, filename: str, nvidia_rotator, gemini_rotator) -> Dict[str, Any]:
     """Execute detailed analysis for each subtask identified in the CoT plan."""
     detailed_analysis = {}
     synthesis_strategy = cot_plan.get("synthesis_strategy", {})
             # Generate comprehensive analysis for this subtask
             subtask_result = await analyze_subtask_comprehensive(
                 task, reasoning, sources_needed, depth, sub_actions, expected_output,
+                quality_checks, context_text, web_context, filename, nvidia_rotator, gemini_rotator
             )
             section_analysis["subtask_results"].append({
         # Generate section-level synthesis
         section_synthesis = await synthesize_section_analysis(
+            section_analysis, synthesis_strategy, nvidia_rotator, gemini_rotator
         )
         section_analysis["section_synthesis"] = section_synthesis
 async def analyze_subtask_comprehensive(task: str, reasoning: str, sources_needed: List[str], depth: str,
                                       sub_actions: List[str], expected_output: str, quality_checks: List[str],
+                                      context_text: str, web_context: str, filename: str, nvidia_rotator, gemini_rotator) -> str:
     """Analyze a specific subtask with comprehensive detail and sub-actions."""
     # Select appropriate context based on sources_needed
     try:
         selection = {"provider": "nvidia", "model": "meta/llama-3.1-8b-instruct"}
+        analysis = await generate_answer_with_model(selection, sys_prompt, user_prompt, gemini_rotator, nvidia_rotator)
         return analysis.strip()
     except Exception as e:
         return f"Analysis for '{task}' could not be completed due to processing error."
+async def synthesize_section_analysis(section_analysis: Dict[str, Any], synthesis_strategy: Dict[str, str], nvidia_rotator, gemini_rotator) -> str:
     """Synthesize all subtask results within a section into a coherent analysis."""
     section_title = section_analysis.get("title", "Unknown Section")
     try:
         selection = {"provider": "nvidia", "model": "meta/llama-3.1-8b-instruct"}
+        synthesis = await generate_answer_with_model(selection, sys_prompt, user_prompt, gemini_rotator, nvidia_rotator)
         return synthesis.strip()
     except Exception as e:

utils/api/router.py CHANGED Viewed

@@ -54,9 +54,13 @@ async def generate_answer_with_model(selection: Dict[str, Any], system_prompt: s
         headers = {"Content-Type": "application/json"}
         data = await robust_post_json(url, headers, payload, gemini_rotator)
         try:
-            return data["candidates"][0]["content"]["parts"][0]["text"]
-        except Exception:
-            logger.warning(f"Unexpected Gemini response: {data}")
             return "I couldn't parse the model response."
     elif provider == "nvidia":
@@ -74,9 +78,13 @@ async def generate_answer_with_model(selection: Dict[str, Any], system_prompt: s
         headers = {"Content-Type": "application/json", "Authorization": f"Bearer {key}"}
         data = await robust_post_json(url, headers, payload, nvidia_rotator)
         try:
-            return data["choices"][0]["message"]["content"]
-        except Exception:
-            logger.warning(f"Unexpected NVIDIA response: {data}")
             return "I couldn't parse the model response."
     return "Unsupported provider."

         headers = {"Content-Type": "application/json"}
         data = await robust_post_json(url, headers, payload, gemini_rotator)
         try:
+            content = data["candidates"][0]["content"]["parts"][0]["text"]
+            if not content or content.strip() == "":
+                logger.warning(f"Empty content from Gemini model: {data}")
+                return "I received an empty response from the model."
+            return content
+        except Exception as e:
+            logger.warning(f"Unexpected Gemini response: {data}, error: {e}")
             return "I couldn't parse the model response."
     elif provider == "nvidia":
         headers = {"Content-Type": "application/json", "Authorization": f"Bearer {key}"}
         data = await robust_post_json(url, headers, payload, nvidia_rotator)
         try:
+            content = data["choices"][0]["message"]["content"]
+            if not content or content.strip() == "":
+                logger.warning(f"Empty content from NVIDIA model: {data}")
+                return "I received an empty response from the model."
+            return content
+        except Exception as e:
+            logger.warning(f"Unexpected NVIDIA response: {data}, error: {e}")
             return "I couldn't parse the model response."
     return "Unsupported provider."