# Last change: Pulastya B — "Fixed some minor bugs" (commit c073e6b)
"""
Synthesizer Module - The SYNTHESIZE step of the Reasoning Loop.
Takes all accumulated findings and produces a coherent, narrative answer.
Unlike the old approach (where the LLM's last response WAS the summary),
the Synthesizer deliberately constructs the answer from evidence:
- Connects findings into a coherent story
- Cites evidence for each claim
- Highlights confidence levels
- Notes what wasn't investigated (limitations)
- Produces actionable insights, not just numbers
Architecture:
FindingsAccumulator β†’ Synthesizer.synthesize() β†’ Markdown narrative
"""
import json
from typing import Dict, Any, List, Optional, Callable
from .findings import FindingsAccumulator
SYNTHESIS_SYSTEM_PROMPT = """You are a senior data scientist writing a concise analysis report.
Given the investigation findings, synthesize a clear, evidence-based answer to the user's question.
STRUCTURE (use markdown):
1. **Executive Summary** (2-3 sentences answering the question directly)
2. **Key Findings** (bullet points with evidence references)
3. **Supporting Evidence** (specific metrics, correlations, patterns)
4. **Visualizations** (mention any plots/charts generated, with file paths)
5. **Limitations & Caveats** (what we didn't investigate, caveats)
6. **Recommendations** (actionable next steps)
RULES:
- Lead with the answer, then show evidence
- Use specific numbers (not "high correlation" but "r=0.72")
- Mention generated files/plots so user can find them
- Be honest about confidence levels
- Keep it under 500 words unless complex analysis warrants more
- Use markdown formatting (headers, bullets, bold for emphasis)
- Do NOT wrap your response in code fences (``` or ```markdown) β€” output raw markdown directly
- ONLY report findings from SUCCESSFUL investigation steps
- Do NOT invent numbers, statistics, or insights that are not present in the findings
- If a step is marked [FAILED], ignore its results entirely β€” do not fabricate data from it
- If most steps failed, be transparent about limited evidence and recommend re-running"""
# User-message template filled by Synthesizer.synthesize() via str.format().
# Placeholders: {question}, {findings_context} (from _build_filtered_context),
# {artifacts_summary} (from _format_artifacts).
SYNTHESIS_USER_TEMPLATE = """**Original question**: {question}
**Investigation summary**:
{findings_context}
**Generated artifacts**:
{artifacts_summary}
Write the analysis report now. Focus on answering the question with evidence from the investigation."""
class Synthesizer:
    """
    The SYNTHESIZE step of the Reasoning Loop.
    Produces the final answer from accumulated evidence rather than trusting
    the LLM's last free-form response.

    Usage:
        synthesizer = Synthesizer(llm_caller=orchestrator._llm_text_call)
        report = synthesizer.synthesize(
            findings=findings_accumulator,
            artifacts={"plots": [...], "files": [...]}
        )
    """

    def __init__(self, llm_caller: Callable):
        """
        Args:
            llm_caller: Function (system_prompt, user_prompt, max_tokens) -> str
        """
        self.llm_caller = llm_caller

    def synthesize(
        self,
        findings: FindingsAccumulator,
        artifacts: Optional[Dict[str, Any]] = None,
        max_tokens: int = 3000
    ) -> str:
        """
        Synthesize all findings into a coherent answer to the original question.

        Args:
            findings: Accumulated findings from the reasoning loop
            artifacts: Optional dict of generated artifacts (plots, files, models)
            max_tokens: Max tokens for synthesis response

        Returns:
            Markdown-formatted analysis report
        """
        # Summaries fed into the prompt: artifacts first, then a context that
        # only exposes SUCCESSFUL findings in detail (anti-hallucination).
        artifacts_summary = self._format_artifacts(artifacts or {}, findings)
        findings_context = self._build_filtered_context(findings)
        user_prompt = SYNTHESIS_USER_TEMPLATE.format(
            question=findings.question,
            findings_context=findings_context,
            artifacts_summary=artifacts_summary
        )
        response = self.llm_caller(
            system_prompt=SYNTHESIS_SYSTEM_PROMPT,
            user_prompt=user_prompt,
            max_tokens=max_tokens
        )
        # LLMs occasionally wrap markdown in code fences; strip them so the
        # frontend renders the report as markdown, not a code block.
        return self._strip_code_fences(response.strip())

    def synthesize_exploratory(
        self,
        findings: FindingsAccumulator,
        artifacts: Optional[Dict[str, Any]] = None,
        max_tokens: int = 3000
    ) -> str:
        """
        Synthesize findings from exploratory analysis (no specific question).

        Uses a different prompt that focuses on discovering patterns
        rather than answering a specific question.

        Args:
            findings: Accumulated findings from the reasoning loop
            artifacts: Optional dict of generated artifacts (plots, files, models)
            max_tokens: Max tokens for synthesis response

        Returns:
            Markdown-formatted exploratory analysis report
        """
        exploratory_system = """You are a senior data scientist presenting exploratory analysis results.
The user asked for a general analysis. Present the most interesting discoveries.
STRUCTURE (use markdown):
1. **Dataset Overview** (size, structure, key characteristics)
2. **Most Interesting Discoveries** (ranked by insight value)
3. **Key Patterns & Relationships** (correlations, distributions, trends)
4. **Data Quality Notes** (missing data, outliers, issues found)
5. **Visualizations Generated** (list with descriptions)
6. **Recommended Next Steps** (what to investigate deeper)
RULES:
- Lead with the most surprising/important finding
- Use specific numbers and metrics
- Mention all generated visualizations with file paths
- Suggest actionable next analysis steps
- Keep it engaging but data-driven
- Do NOT wrap your response in code fences (``` or ```markdown) — output raw markdown directly
- ONLY report findings from SUCCESSFUL investigation steps
- Do NOT invent numbers or statistics not present in the findings
- If a step is marked [FAILED], ignore it entirely"""
        artifacts_summary = self._format_artifacts(artifacts or {}, findings)
        # Filtered context — only successful findings get full detail.
        findings_context = self._build_filtered_context(findings)
        user_prompt = f"""**Analysis request**: {findings.question}
**Investigation summary**:
{findings_context}
**Generated artifacts**:
{artifacts_summary}
Write the exploratory analysis report."""
        response = self.llm_caller(
            system_prompt=exploratory_system,
            user_prompt=user_prompt,
            max_tokens=max_tokens
        )
        return self._strip_code_fences(response.strip())

    def _strip_code_fences(self, text: str) -> str:
        """
        Remove wrapping code fences from LLM output.

        LLMs sometimes wrap markdown in ```markdown ... ``` which causes
        ReactMarkdown to render the entire response as a code block
        instead of parsing the markdown.

        Args:
            text: Raw LLM output, possibly fenced.

        Returns:
            The text with one leading and one trailing fence removed (if present).
        """
        import re
        # Strip a leading ```/```markdown/```md/```text fence line and a
        # trailing ``` line; interior fences (real code samples) are untouched.
        stripped = re.sub(r'^\s*```(?:markdown|md|text)?\s*\n', '', text)
        stripped = re.sub(r'\n\s*```\s*$', '', stripped)
        return stripped.strip()

    def _format_artifacts(self, artifacts: Dict[str, Any], findings: FindingsAccumulator) -> str:
        """
        Format generated artifacts (plots, files, tool usage) for the synthesis prompt.

        Args:
            artifacts: Dict possibly containing "plots" and "files" lists.
            findings: Accumulator whose successful steps are scanned for output references.

        Returns:
            Markdown bullet list, or a placeholder string when nothing was generated.
        """
        parts = []
        # Plots: entries may be dicts ({title, url/path}) or plain strings/paths.
        plots = artifacts.get("plots", [])
        if plots:
            parts.append("**Plots generated**:")
            for plot in plots:
                if isinstance(plot, dict):
                    parts.append(f"  - {plot.get('title', 'Plot')}: {plot.get('url', plot.get('path', 'N/A'))}")
                else:
                    parts.append(f"  - {plot}")
        # Output files written during the investigation.
        files = artifacts.get("files", [])
        if files:
            parts.append("**Output files**:")
            for f in files:
                parts.append(f"  - {f}")
        # Scan findings history for output references — only successful steps.
        # BUGFIX: result_summary may be a dict or a string; stringify once so
        # the substring checks work either way. Previously `".html" in result`
        # on a dict tested dict KEYS, so .html/.png outputs were never detected.
        for finding in findings.findings:
            if not finding.success:
                continue
            result_str = str(finding.result_summary)
            if any(marker in result_str
                   for marker in ("output_file", "output_path", ".html", ".png")):
                parts.append(f"  - Step {finding.iteration} ({finding.action}): output in result")
        # One-line summary of every tool invoked across the loop.
        if findings.tools_used:
            parts.append(f"\n**Tools used**: {', '.join(findings.tools_used)}")
        if not parts:
            return "No artifacts generated yet."
        return "\n".join(parts)

    def _build_filtered_context(self, findings: FindingsAccumulator) -> str:
        """
        Build synthesis context that only includes SUCCESSFUL findings in detail.

        Failed findings are listed as a brief summary so the LLM knows they happened
        but cannot hallucinate data from them.

        Args:
            findings: Accumulator holding all iterations and hypotheses.

        Returns:
            Markdown-formatted context string for the synthesis prompt.
        """
        parts = []
        parts.append(f"**Original question**: {findings.question}")
        parts.append(f"**Mode**: {findings.mode}")
        successful = findings.get_successful_findings()
        failed = [f for f in findings.findings if not f.success]
        parts.append(f"**Total iterations**: {len(findings.findings)} ({len(successful)} succeeded, {len(failed)} failed)")
        parts.append(f"**Tools used**: {', '.join(findings.tools_used)}")
        # Only successful findings get full detail (hypothesis, args, result,
        # interpretation, confidence) — the LLM may cite these.
        if successful:
            parts.append("\n## Successful Investigation Steps\n")
            for f in successful:
                parts.append(
                    f"### Step {f.iteration}: {f.action}\n"
                    f"**Hypothesis**: {f.hypothesis}\n"
                    f"**Arguments**: {json.dumps(f.arguments, default=str)}\n"
                    f"**Result**: {f.result_summary}\n"
                    f"**Interpretation**: {f.interpretation}\n"
                    f"**Confidence**: {f.confidence:.0%}\n"
                )
        # Failed findings get just a one-line mention — explicitly marked as
        # non-citable so the LLM does not fabricate data from them.
        if failed:
            parts.append("\n## Failed Steps (no usable data — do NOT cite these)\n")
            for f in failed:
                parts.append(f"- Step {f.iteration}: `{f.action}` FAILED — {f.error_message or 'execution error'}")
        # Hypothesis outcomes with a status glyph (✅/❌/❓/🔄/⬜).
        if findings.hypotheses:
            parts.append("\n## Hypothesis Outcomes\n")
            for h in findings.hypotheses:
                status_emoji = {
                    "supported": "\u2705",
                    "refuted": "\u274c",
                    "inconclusive": "\u2753",
                    "testing": "\ud83d\udd04",
                    "untested": "\u2b1c"
                }.get(h.status, "\u2b1c")
                parts.append(f"{status_emoji} **{h.text}** \u2192 {h.status}")
                if h.evidence_for:
                    parts.append(f"  Evidence for: {'; '.join(h.evidence_for)}")
                if h.evidence_against:
                    parts.append(f"  Evidence against: {'; '.join(h.evidence_against)}")
        return "\n".join(parts)