Spaces:

Hammad712
/

PSA

Sleeping

App Files Files Community

PSA / app /services /rivergen.py

Hammad712

Initial clean deployment: removed binary bloat

7e431a1 about 2 months ago

raw

history blame contribute delete

6.6 kB

	import time
	import json
	import logging
	from typing import Dict, Any, Optional

	# Import agents
	from app.core.agents import (
	router_agent, sql_agent, nosql_agent, multi_source_agent,
	big_data_agent, ml_agent, vector_store_agent, stream_agent, llm_judge
	)

	# 1. Setup Structured Logging
	logger = logging.getLogger("rivergen.orchestrator")
	logging.basicConfig(level=logging.INFO)

	# 2. Agent Registry
	AGENT_MAPPING = {
	"sql_agent": sql_agent,
	"nosql_agent": nosql_agent,
	"multi_source_agent": multi_source_agent,
	"big_data_agent": big_data_agent,
	"ml_agent": ml_agent,
	"vector_store_agent": vector_store_agent,
	"stream_agent": stream_agent
	}

	def run_rivergen_flow(payload: Dict[str, Any]) -> Dict[str, Any]:
	"""
	Main workflow orchestrator: Routing -> Execution -> Judging Loop.
	Tracks TOTAL token usage across all steps (Router + Agent Attempts + Judge).
	"""
	request_id = payload.get("request_id", "unknown_id")
	start_time = time.time()

	# --- 📊 Token Accumulators ---
	total_input_tokens = 0
	total_output_tokens = 0

	logger.info(f"🚀 [Orchestrator] Starting Flow for Request ID: {request_id}")

	# ------------------------------------------------------------------
	# ⚡ CRITICAL FIX: Normalize Data Sources for Blind Agents
	# ------------------------------------------------------------------
	if "data_sources" in payload:
	logger.info(f"🛠️ [Orchestrator] Normalizing {len(payload['data_sources'])} data sources...")

	for i, source in enumerate(payload["data_sources"]):
	# 1. Fix ID Mismatch (Agents might expect 'id' or 'source_id')
	if "data_source_id" in source:
	ds_id = source["data_source_id"]
	if "id" not in source:
	source["id"] = ds_id
	if "source_id" not in source:
	source["source_id"] = ds_id

	# 2. Log the Source Structure (For Debugging)
	# - visualizing how we map the IDs
	logger.info(f" 🔹 Source [{i}]: keys={list(source.keys())} \| type={source.get('type')}")

	# ------------------------------------------------------------------

	try:
	# --- Step 1: Router Agent ---
	router_output = router_agent(payload)

	# Accumulate Router Usage
	if "usage" in router_output:
	total_input_tokens += router_output["usage"].get("input_tokens", 0)
	total_output_tokens += router_output["usage"].get("output_tokens", 0)

	if "error" in router_output:
	logger.error(f"⛔ [Router Error] {request_id}: {router_output['error']}")
	return {"status": "error", "error": router_output["error"]}

	agent_name = router_output.get("selected_agent")
	confidence = router_output.get("confidence", 0.0)

	logger.info(f"🧭 [Router] {request_id} -> Selected: {agent_name} (Conf: {confidence})")

	# --- Step 2: Agent Dispatch ---
	agent_func = AGENT_MAPPING.get(agent_name)
	if not agent_func:
	error_msg = f"Agent '{agent_name}' is not supported."
	logger.critical(f"❌ [Dispatcher] {error_msg}")
	return {"status": "error", "error": error_msg}

	# --- Step 3-5: Generation & Validation Loop ---
	max_retries = 3
	current_feedback = None

	for attempt in range(1, max_retries + 1):
	logger.info(f"🔄 [Attempt {attempt}/{max_retries}] Agent '{agent_name}' working...")

	# A. Generate Plan
	plan = agent_func(payload, feedback=current_feedback)

	# Accumulate Agent Usage
	if "ai_metadata" in plan:
	total_input_tokens += plan["ai_metadata"].get("input_tokens", 0)
	total_output_tokens += plan["ai_metadata"].get("output_tokens", 0)

	# Check for Agent Crash
	if plan.get("error"):
	logger.warning(f"⚠️ [Agent Crash] Attempt {attempt} failed: {plan['error']}")
	current_feedback = f"Agent crashed with error: {plan['error']}"
	continue

	# B. Validate Plan (Judge)
	review = llm_judge(payload, plan)

	# Accumulate Judge Usage
	if "usage" in review:
	total_input_tokens += review["usage"].get("input_tokens", 0)
	total_output_tokens += review["usage"].get("output_tokens", 0)

	if review.get('approved'):
	duration = time.time() - start_time
	logger.info(f"✅ [Judge] Plan Approved for {request_id} in {duration:.2f}s")

	# C. Inject Execution Metadata
	plan["meta"] = {
	"attempts_used": attempt,
	"processing_time_ms": int(duration * 1000),
	"router_confidence": confidence,
	"judge_score": review.get("score", 1.0)
	}

	# Finalize Usage Totals
	if "ai_metadata" not in plan:
	plan["ai_metadata"] = {}

	plan["ai_metadata"]["input_tokens"] = total_input_tokens
	plan["ai_metadata"]["output_tokens"] = total_output_tokens
	plan["ai_metadata"]["total_tokens"] = total_input_tokens + total_output_tokens

	return plan

	else:
	feedback = review.get('feedback', 'Unknown rejection reason.')
	logger.info(f"❌ [Judge] Rejected attempt {attempt}. Feedback: {feedback}")
	current_feedback = feedback

	# --- Final Failure State ---
	logger.error(f"💀 [Failed] {request_id} exhausted {max_retries} attempts.")
	return {
	"status": "error",
	"error": "Plan generation failed validation after maximum retries.",
	"last_feedback": current_feedback,
	"request_id": request_id,
	"usage": {
	"input_tokens": total_input_tokens,
	"output_tokens": total_output_tokens,
	"total_tokens": total_input_tokens + total_output_tokens
	}
	}

	except Exception as e:
	logger.exception(f"🔥 [System Panic] Critical workflow failure for {request_id}")
	return {
	"status": "error",
	"error": "Internal Orchestration Error. Please check logs.",
	"details": str(e),
	"request_id": request_id
	}