Spaces:

stellar413
/

masterllm

Sleeping

App Files Files Community

masterllm / app.py

redhairedshanks1

Update app.py

9d6015f 4 months ago

raw

history blame

54.8 kB

	# # app.py - MasterLLM v2.0 with Bedrock Fallback System
	# """
	# MasterLLM Pipeline Orchestrator v2.0
	# - Bedrock (priority) + Gemini (fallback) for pipeline generation
	# - Bedrock LangChain (priority) + CrewAI (fallback) for execution
	# - MongoDB session management
	# - Complete REST API
	# - Gradio UI with fancy displays
	# """
	# import os
	# import json
	# import uuid
	# from datetime import datetime
	# from typing import List, Optional

	# import gradio as gr
	# from fastapi import FastAPI
	# from fastapi.middleware.cors import CORSMiddleware
	# from contextlib import asynccontextmanager
	# import asyncio

	# # Import our new services
	# from services.pipeline_generator import generate_pipeline, format_pipeline_for_display
	# from services.pipeline_executor import execute_pipeline_streaming
	# from services.session_manager import session_manager
	# from api_routes import router as api_router


	# # ========================
	# # BACKGROUND CLEANUP TASK
	# # ========================

	# async def periodic_cleanup():
	# """Cleanup old sessions every hour"""
	# while True:
	# await asyncio.sleep(3600) # Run every hour
	# try:
	# removed = session_manager.cleanup_old_sessions(max_age_hours=24)
	# if removed > 0:
	# print(f"🧹 Cleaned up {removed} inactive sessions")
	# except Exception as e:
	# print(f"⚠️ Cleanup error: {e}")


	# @asynccontextmanager
	# async def lifespan(app: FastAPI):
	# """Manage application lifecycle"""
	# # Startup
	# print("🚀 Starting MasterLLM v2.0...")
	# task = asyncio.create_task(periodic_cleanup())
	# yield
	# # Shutdown
	# task.cancel()
	# session_manager.close()
	# print("🛑 MasterLLM shut down gracefully")


	# # ========================
	# # FASTAPI APP
	# # ========================

	# app = FastAPI(
	# title="MasterLLM v2.0 - AI Pipeline Orchestrator",
	# description="Bedrock + Gemini fallback system with MongoDB sessions",
	# version="2.0.0",
	# lifespan=lifespan
	# )

	# # CORS Configuration
	# app.add_middleware(
	# CORSMiddleware,
	# allow_origins=[os.getenv("FRONTEND_ORIGIN", "http://localhost:3000")],
	# allow_credentials=True,
	# allow_methods=["*"],
	# allow_headers=["*"],
	# )

	# # Mount API routes
	# app.include_router(api_router)


	# # ========================
	# # CONVERSATION STATE
	# # ========================

	# class ConversationState:
	# INITIAL = "initial"
	# PIPELINE_PROPOSED = "pipeline_proposed"
	# PIPELINE_APPROVED = "pipeline_approved"
	# EXECUTING = "executing"
	# COMPLETED = "completed"
	# ERROR = "error"


	# # ========================
	# # GRADIO UI HANDLERS
	# # ========================

	# def create_new_session():
	# """Create a new session"""
	# return session_manager.create_session()


	# def handle_file_upload(file_path, session_id):
	# """Handle file upload"""
	# if not file_path:
	# return None, json.dumps({
	# "status": "error",
	# "message": "No file uploaded"
	# }, indent=2), session_id

	# if not session_id:
	# session_id = create_new_session()

	# file_name = os.path.basename(file_path)

	# # Update session
	# session_manager.update_session(session_id, {
	# "current_file": file_path,
	# "state": ConversationState.INITIAL
	# })

	# # Add system message
	# session_manager.add_message(
	# session_id,
	# "system",
	# f"File uploaded: {file_name}"
	# )

	# status = {
	# "status": "success",
	# "message": f"File '{file_name}' uploaded successfully",
	# "file_info": {
	# "name": file_name,
	# "path": file_path,
	# "size_bytes": os.path.getsize(file_path) if os.path.exists(file_path) else 0
	# },
	# "next_action": "💬 Now tell me what you'd like to do with this document"
	# }

	# return file_path, json.dumps(status, indent=2), session_id


	# def format_chat_history(history, new_user_msg, new_assistant_msg):
	# """
	# Convert chat history to new Gradio format (list of dicts with role/content)
	# Handles both old format (tuples) and new format (dicts)
	# """
	# messages = []

	# # Handle existing history - could be in old or new format
	# if history:
	# # Check if already in new format (list of dicts with 'role' and 'content')
	# if isinstance(history[0], dict) and 'role' in history[0]:
	# # Already in new format, just copy it
	# messages = list(history)
	# else:
	# # Old format (list of tuples), convert it
	# for item in history:
	# if isinstance(item, (list, tuple)) and len(item) == 2:
	# user_msg, bot_msg = item
	# messages.append({"role": "user", "content": user_msg})
	# messages.append({"role": "assistant", "content": bot_msg})

	# # Add new messages
	# messages.append({"role": "user", "content": new_user_msg})
	# messages.append({"role": "assistant", "content": new_assistant_msg})

	# return messages


	# def chatbot_response_streaming(message: str, history: List, session_id: str, file_path: str = None):
	# """
	# Handle chat messages with streaming updates
	# Uses Bedrock (priority) → Gemini (fallback) for both generation and execution
	# """
	# # Get or create session
	# session = session_manager.get_session(session_id)
	# if not session:
	# session_id = create_new_session()
	# session = session_manager.get_session(session_id)

	# # Update file path if provided
	# if file_path:
	# session_manager.update_session(session_id, {"current_file": file_path})
	# session = session_manager.get_session(session_id)

	# # Add user message to session
	# session_manager.add_message(session_id, "user", message)

	# current_state = session.get("state", ConversationState.INITIAL)

	# # ========================
	# # STATE: INITIAL - Generate Pipeline
	# # ========================
	# if current_state == ConversationState.INITIAL:
	# # Check if file is uploaded
	# if not session.get("current_file"):
	# response = {
	# "status": "error",
	# "message": "Please upload a document first",
	# "action": "📁 Click 'Upload Document' to begin"
	# }
	# response_text = f"```json\n{json.dumps(response, indent=2)}\n```"
	# session_manager.add_message(session_id, "assistant", response_text)
	# yield format_chat_history(history, message, response_text)
	# return

	# try:
	# # Generate pipeline using Bedrock → Gemini fallback
	# yield format_chat_history(history, message, "🤖 Generating pipeline with AI...\n⏳ Trying Bedrock first...")

	# pipeline = generate_pipeline(
	# user_input=message,
	# file_path=session.get("current_file"),
	# prefer_bedrock=True
	# )

	# # Save proposed pipeline to session
	# session_manager.update_session(session_id, {
	# "proposed_pipeline": pipeline,
	# "state": ConversationState.PIPELINE_PROPOSED
	# })

	# # Format for display
	# formatted_display = format_pipeline_for_display(pipeline)

	# # Create response with both fancy display and JSON
	# response_text = formatted_display + f"\n\n```json\n{json.dumps(pipeline, indent=2)}\n```"

	# session_manager.add_message(session_id, "assistant", response_text)
	# yield format_chat_history(history, message, response_text)
	# return

	# except Exception as e:
	# error_response = {
	# "status": "error",
	# "message": "Failed to generate pipeline",
	# "error": str(e),
	# "action": "Please try rephrasing your request"
	# }
	# response_text = f"```json\n{json.dumps(error_response, indent=2)}\n```"
	# session_manager.add_message(session_id, "assistant", response_text)
	# yield format_chat_history(history, message, response_text)
	# return

	# # ========================
	# # STATE: PIPELINE_PROPOSED - Handle Approval/Rejection
	# # ========================
	# elif current_state == ConversationState.PIPELINE_PROPOSED:
	# user_input = message.lower().strip()

	# # APPROVE - Execute the pipeline
	# if "approve" in user_input or "yes" in user_input:
	# session_manager.update_session(session_id, {"state": ConversationState.EXECUTING})

	# plan = session.get("proposed_pipeline", {})

	# # Initial status
	# initial_status = {
	# "status": "executing",
	# "message": "🚀 Starting pipeline execution...",
	# "pipeline": plan.get("pipeline_name", "unknown"),
	# "executor": "Attempting Bedrock LangChain first",
	# "steps": []
	# }
	# accumulated_response = f"```json\n{json.dumps(initial_status, indent=2)}\n```"
	# yield format_chat_history(history, message, accumulated_response)

	# steps_completed = []
	# final_payload = None
	# executor_used = "unknown"

	# try:
	# # Execute pipeline with Bedrock → CrewAI fallback
	# for event in execute_pipeline_streaming(
	# pipeline=plan,
	# file_path=session.get("current_file"),
	# session_id=session_id,
	# prefer_bedrock=True
	# ):
	# event_type = event.get("type")

	# # Info events (fallback notifications, etc.)
	# if event_type == "info":
	# info_status = {
	# "status": "info",
	# "message": event.get("message"),
	# "executor": event.get("executor", "unknown")
	# }
	# accumulated_response = f"```json\n{json.dumps(info_status, indent=2)}\n```"
	# yield format_chat_history(history, message, accumulated_response)

	# # Step updates
	# elif event_type == "step":
	# step_info = {
	# "step": event.get("step", 0),
	# "tool": event.get("tool", "processing"),
	# "status": event.get("status", "running"),
	# "executor": event.get("executor", "unknown")
	# }

	# # Add observation if available (tool output)
	# if "observation" in event:
	# step_info["observation"] = event.get("observation")

	# # Add tool input if available
	# if "input" in event:
	# step_info["input"] = event.get("input")

	# steps_completed.append(step_info)
	# executor_used = event.get("executor", executor_used)

	# # Create more informative status message
	# status_message = f"📍 Step {event.get('step', 0)}: {event.get('tool', 'processing')}"
	# if event.get('status') == 'completed' and 'observation' in event:
	# obs_preview = str(event.get('observation'))[:100]
	# status_message += f" ✅\n Output: {obs_preview}..."
	# elif event.get('status') == 'executing':
	# status_message += " ⏳"

	# progress_status = {
	# "status": "executing",
	# "message": status_message,
	# "pipeline": plan.get("pipeline_name", ""),
	# "executor": executor_used,
	# "current_step": step_info,
	# "steps_completed": steps_completed
	# }
	# accumulated_response = f"```json\n{json.dumps(progress_status, indent=2)}\n```"
	# yield format_chat_history(history, message, accumulated_response)


	# # Final result
	# elif event_type == "final":
	# final_payload = event.get("data")
	# executor_used = event.get("executor", executor_used)

	# # Error
	# elif event_type == "error":
	# error_result = {
	# "status": "failed",
	# "error": event.get("error"),
	# "steps_completed": steps_completed,
	# "executor": event.get("executor", "unknown")
	# }
	# final_response = f"```json\n{json.dumps(error_result, indent=2)}\n```"
	# session_manager.update_session(session_id, {"state": ConversationState.INITIAL})
	# session_manager.add_message(session_id, "assistant", final_response)
	# yield format_chat_history(history, message, final_response)
	# return

	# # Process final result
	# if final_payload:
	# session_manager.update_session(session_id, {
	# "pipeline_result": final_payload,
	# "state": ConversationState.INITIAL
	# })

	# # Save execution to MongoDB
	# session_manager.save_pipeline_execution(
	# session_id=session_id,
	# pipeline=plan,
	# result=final_payload,
	# file_path=session.get("current_file"),
	# executor=executor_used
	# )

	# # Format final response
	# final_display = {
	# "status": "completed",
	# "executor": executor_used,
	# "pipeline": plan.get("pipeline_name"),
	# "result": final_payload,
	# "summary": {
	# "total_steps": len(steps_completed),
	# "completed_successfully": len([s for s in steps_completed if s.get("status") == "completed"])
	# }
	# }
	# final_response = f"```json\n{json.dumps(final_display, indent=2)}\n```"
	# else:
	# final_response = f"```json\n{json.dumps({'status': 'completed', 'steps': steps_completed, 'executor': executor_used}, indent=2)}\n```"
	# session_manager.update_session(session_id, {"state": ConversationState.INITIAL})

	# session_manager.add_message(session_id, "assistant", final_response)
	# yield format_chat_history(history, message, final_response)
	# return

	# except Exception as e:
	# error_result = {
	# "error": str(e),
	# "status": "failed",
	# "message": "Pipeline execution failed",
	# "steps_completed": steps_completed
	# }
	# final_response = f"```json\n{json.dumps(error_result, indent=2)}\n```"
	# session_manager.update_session(session_id, {"state": ConversationState.INITIAL})
	# session_manager.add_message(session_id, "assistant", final_response)
	# yield format_chat_history(history, message, final_response)
	# return

	# # REJECT - Cancel the pipeline
	# elif "reject" in user_input or "no" in user_input:
	# session_manager.update_session(session_id, {
	# "state": ConversationState.INITIAL,
	# "proposed_pipeline": None
	# })
	# response_data = {
	# "status": "rejected",
	# "message": "Pipeline rejected by user",
	# "action": "💬 Please provide a new instruction"
	# }
	# response = f"```json\n{json.dumps(response_data, indent=2)}\n```"
	# session_manager.add_message(session_id, "assistant", response)
	# yield format_chat_history(history, message, response)
	# return

	# # EDIT - Request modifications
	# elif "edit" in user_input or "modify" in user_input:
	# current_pipeline = session.get("proposed_pipeline", {})
	# edit_help = {
	# "status": "edit_mode",
	# "message": "To modify the plan, describe your changes",
	# "current_plan": current_pipeline,
	# "examples": [
	# "Add summarization at the end",
	# "Remove table extraction",
	# "Only process pages 1-3",
	# "Translate to French instead of Spanish"
	# ],
	# "action": "Describe your changes, or say 'approve' to run as-is"
	# }
	# response = f"```json\n{json.dumps(edit_help, indent=2)}\n```"
	# session_manager.add_message(session_id, "assistant", response)
	# yield format_chat_history(history, message, response)
	# return

	# # Try to modify pipeline based on user input
	# else:
	# if len(message.strip()) > 5:
	# try:
	# original_plan = session.get("proposed_pipeline", {})
	# edit_context = f"Original: {original_plan.get('pipeline_name')}. User wants: {message}"

	# # Generate new pipeline with modification
	# new_pipeline = generate_pipeline(
	# user_input=edit_context,
	# file_path=session.get("current_file"),
	# prefer_bedrock=True
	# )

	# session_manager.update_session(session_id, {
	# "proposed_pipeline": new_pipeline,
	# "state": ConversationState.PIPELINE_PROPOSED
	# })

	# formatted = format_pipeline_for_display(new_pipeline)
	# response = formatted + f"\n\n```json\n{json.dumps(new_pipeline, indent=2)}\n```"
	# session_manager.add_message(session_id, "assistant", response)
	# yield format_chat_history(history, message, response)
	# return

	# except Exception as e:
	# error_response = {
	# "status": "edit_failed",
	# "error": str(e),
	# "message": "Could not modify the plan",
	# "action": "Try 'approve' to run as-is, or 'reject' to start over"
	# }
	# response = f"```json\n{json.dumps(error_response, indent=2)}\n```"
	# session_manager.add_message(session_id, "assistant", response)
	# yield format_chat_history(history, message, response)
	# return

	# # Default waiting message
	# response_data = {
	# "status": "waiting_for_confirmation",
	# "message": "Please type 'approve', 'reject', or describe changes",
	# "hint": "You can also say 'edit' for modification hints"
	# }
	# response = f"```json\n{json.dumps(response_data, indent=2)}\n```"
	# session_manager.add_message(session_id, "assistant", response)
	# yield format_chat_history(history, message, response)
	# return

	# # Default fallback
	# response = json.dumps({"status": "ready", "message": "Ready for your next instruction"}, indent=2)
	# session_manager.add_message(session_id, "assistant", response)
	# yield format_chat_history(history, message, response)


	# # ========================
	# # GRADIO UI
	# # ========================

	# # Simple Blocks initialization for HF Spaces compatibility (older Gradio version)
	# with gr.Blocks(title="MasterLLM v2.0 - AI Pipeline Orchestrator") as demo:
	# gr.Markdown("""
	# # 🤖 MasterLLM v2.0 - AI Pipeline Orchestrator

	# 🏆 Bedrock Priority with Gemini Fallback \| 💾 MongoDB Sessions \| 📡 Complete REST API

	# Upload a document, describe what you want, and watch AI orchestrate the perfect pipeline!
	# """)

	# # State management
	# session_id_state = gr.State(value=create_new_session())
	# file_state = gr.State(value=None)

	# with gr.Row():
	# with gr.Column(scale=3):
	# # Chat interface - Gradio auto-detects format from data structure
	# chatbot = gr.Chatbot(label="Chat")

	# # Text input
	# msg = gr.Textbox(
	# placeholder="💬 Type your instruction... (e.g., 'extract text from pages 1-5 and summarize')",
	# label="Your Message",
	# lines=2,
	# max_lines=4,
	# )

	# with gr.Row():
	# submit_btn = gr.Button("🚀 Send", variant="primary", scale=2)
	# clear_btn = gr.Button("🗑️ Clear Chat", scale=1)

	# with gr.Column(scale=1):
	# # File upload section
	# gr.Markdown("### 📁 Upload Document")
	# file_upload = gr.File(
	# label="PDF or Image",
	# file_types=[".pdf", ".png", ".jpg", ".jpeg", ".gif", ".bmp"],
	# type="filepath",
	# )

	# upload_status = gr.Textbox(
	# label="📊 Upload Status",
	# interactive=False,
	# lines=10,
	# max_lines=15,
	# )

	# # Session info
	# gr.Markdown("### 🔗 Session Info")
	# session_display = gr.Textbox(
	# label="Session ID",
	# interactive=False,
	# value=lambda: session_id_state.value[:8] + "...",
	# )

	# # Examples
	# gr.Markdown("### 💡 Example Pipelines")
	# gr.Examples(
	# examples=[
	# "extract text from pages 1-5",
	# "extract text and summarize",
	# "extract text, tables, and translate to Spanish",
	# "get tables from pages 2-4 and summarize",
	# "text-classify-ner from entire document",
	# "describe images and summarize findings",
	# "extract text, detect signatures and stamps",
	# ],
	# inputs=msg,
	# )

	# # System info
	# gr.Markdown("""
	# ### ℹ️ System Features
	# - ✅ Bedrock (Claude 3.5 Sonnet) priority
	# - ✅ Gemini (gemini-2.0-flash) fallback
	# - ✅ MongoDB session persistence
	# - ✅ Streaming real-time updates
	# - ✅ Component-level JSON output
	# - ✅ REST API for integration

	# ### 📊 Pipeline Flow:
	# 1. Upload your document
	# 2. Describe what you want
	# 3. Review AI-generated pipeline
	# 4. Approve to execute
	# 5. Watch streaming updates
	# 6. Get complete JSON results
	# """)

	# # Event handlers
	# file_upload.upload(
	# fn=handle_file_upload,
	# inputs=[file_upload, session_id_state],
	# outputs=[file_state, upload_status, session_id_state],
	# )

	# msg.submit(
	# fn=chatbot_response_streaming,
	# inputs=[msg, chatbot, session_id_state, file_state],
	# outputs=[chatbot],
	# ).then(
	# lambda: "",
	# outputs=msg,
	# )

	# submit_btn.click(
	# fn=chatbot_response_streaming,
	# inputs=[msg, chatbot, session_id_state, file_state],
	# outputs=[chatbot],
	# ).then(
	# lambda: "",
	# outputs=msg,
	# )

	# clear_btn.click(
	# fn=lambda: ([], create_new_session(), None, None, "", ""),
	# outputs=[chatbot, session_id_state, file_state, file_upload, msg, upload_status],
	# )

	# # Mount Gradio on FastAPI
	# app = gr.mount_gradio_app(app, demo, path="/")


	# # ========================
	# # LAUNCH
	# # ========================

	# if __name__ == "__main__":
	# import uvicorn
	# port = int(os.getenv("PORT", 7860))
	# print(f"""
	# ╔════════════════════════════════════════════════════════════╗
	# ║ ║
	# ║ 🚀 MasterLLM v2.0 Starting... ║
	# ║ ║
	# ║ 🌐 Gradio UI: http://localhost:{port} ║
	# ║ 📡 REST API: http://localhost:{port}/api/v1 ║
	# ║ 📚 API Docs: http://localhost:{port}/docs ║
	# ║ ║
	# ║ 🏆 Bedrock: Priority (Claude 3.5 Sonnet) ║
	# ║ 🔄 Gemini: Fallback (gemini-2.0-flash) ║
	# ║ 💾 MongoDB: Session management ║
	# ║ ║
	# ╚════════════════════════════════════════════════════════════╝
	# """)

	# uvicorn.run(app, host="0.0.0.0", port=port)

	# app.py - MasterLLM v2.0 with Bedrock Fallback System
	"""
	MasterLLM Pipeline Orchestrator v2.0
	- Bedrock (priority) + Gemini (fallback) for pipeline generation
	- Bedrock LangChain (priority) + CrewAI (fallback) for execution
	- MongoDB session management
	- Complete REST API
	- Gradio UI with fancy displays
	"""
	import os
	import json
	import uuid
	from datetime import datetime
	from typing import List, Optional

	import gradio as gr
	from fastapi import FastAPI
	from fastapi.middleware.cors import CORSMiddleware
	from contextlib import asynccontextmanager
	import asyncio

	# Import our new services
	from services.pipeline_generator import generate_pipeline, format_pipeline_for_display
	from services.pipeline_executor import execute_pipeline_streaming
	from services.session_manager import session_manager
	from services.intent_classifier import intent_classifier
	from api_routes import router as api_router
	from api_routes_v2 import router as api_router_v2


	# ========================
	# BACKGROUND CLEANUP TASK
	# ========================

	async def periodic_cleanup():
	    """Background loop that sweeps old sessions once per hour.

	    Each cycle sleeps first, then calls
	    ``session_manager.cleanup_old_sessions(max_age_hours=24)``. Any
	    ``Exception`` raised during a sweep is printed and the loop carries on;
	    the coroutine never returns on its own and is expected to be cancelled.
	    """
	    interval_seconds = 3600  # Run every hour
	    while True:
	        await asyncio.sleep(interval_seconds)
	        try:
	            purged = session_manager.cleanup_old_sessions(max_age_hours=24)
	            # Only report sweeps that actually removed something.
	            if purged > 0:
	                print(f"🧹 Cleaned up {purged} inactive sessions")
	        except Exception as exc:
	            print(f"⚠️ Cleanup error: {exc}")


	@asynccontextmanager
	async def lifespan(app: FastAPI):
	    """Manage application startup and shutdown.

	    Startup: announce the start and schedule ``periodic_cleanup`` as a
	    background task.

	    Shutdown: cancel that task, wait until the cancellation has actually
	    been processed, close ``session_manager`` and announce the shutdown.
	    The shutdown steps live in a ``finally`` clause so they also run when
	    an exception is thrown into the context manager at the ``yield``.

	    Args:
	        app: The FastAPI application this lifespan is attached to (not
	            used inside the body).
	    """
	    # Startup
	    print("🚀 Starting MasterLLM v2.0...")
	    task = asyncio.create_task(periodic_cleanup())
	    try:
	        yield
	    finally:
	        # Shutdown
	        task.cancel()
	        try:
	            # cancel() only *requests* cancellation; awaiting the task lets
	            # it finish unwinding before the session manager is closed.
	            await task
	        except asyncio.CancelledError:
	            pass
	        session_manager.close()
	        print("🛑 MasterLLM shut down gracefully")


	# ========================
	# FASTAPI APP
	# ========================

	# Application object; startup/shutdown work is delegated to `lifespan`.
	app = FastAPI(
	    lifespan=lifespan,
	    title="MasterLLM v2.0 - AI Pipeline Orchestrator",
	    description="Bedrock + Gemini fallback system with MongoDB sessions",
	    version="2.0.0",
	)

	# CORS: exactly one allowed origin, read from FRONTEND_ORIGIN with a
	# localhost default; every method and header is accepted from it.
	app.add_middleware(
	    CORSMiddleware,
	    allow_headers=["*"],
	    allow_methods=["*"],
	    allow_credentials=True,
	    allow_origins=[os.environ.get("FRONTEND_ORIGIN", "http://localhost:3000")],
	)

	# Register both generations of the REST API on the same application.
	app.include_router(api_router)  # V1 API (legacy)
	app.include_router(api_router_v2)  # V2 API (enhanced with intent classification)


	# ========================
	# CONVERSATION STATE
	# ========================

	class ConversationState:
	    """Plain string constants for the ``state`` field stored on a session."""

	    # Default state: used when a session has no "state" yet, and restored
	    # after an upload and after a run finishes, fails or is rejected.
	    INITIAL = "initial"

	    # A generated pipeline is waiting for the user to approve, reject or edit it.
	    PIPELINE_PROPOSED = "pipeline_proposed"

	    # NOTE(review): not referenced in the visible code - confirm whether still needed.
	    PIPELINE_APPROVED = "pipeline_approved"

	    # Set once the user approves and execution begins.
	    EXECUTING = "executing"

	    # NOTE(review): COMPLETED and ERROR are not referenced in the visible code.
	    COMPLETED = "completed"
	    ERROR = "error"


	# ========================
	# GRADIO UI HANDLERS
	# ========================

	def create_new_session():
	    """Ask ``session_manager`` for a brand-new session and return its result.

	    The return value is whatever ``session_manager.create_session()``
	    yields; callers in this file use it as a session id.
	    """
	    new_session = session_manager.create_session()
	    return new_session


	def handle_file_upload(file_path, session_id):
	    """Attach an uploaded file to a session and build a status report.

	    Args:
	        file_path: Path of the uploaded file; falsy when nothing was uploaded.
	        session_id: Identifier of the current session. When falsy, a new
	            session is created via ``create_new_session()``.

	    Returns:
	        A 3-tuple ``(file_path, status_json, session_id)``:
	        ``file_path`` is ``None`` when no file was supplied, otherwise the
	        path that was passed in; ``status_json`` is an indented JSON string
	        describing success or failure; ``session_id`` is the id that was
	        passed in or the newly created one.
	    """
	    if not file_path:
	        error = {
	            "status": "error",
	            "message": "No file uploaded",
	        }
	        return None, json.dumps(error, indent=2), session_id

	    if not session_id:
	        session_id = create_new_session()

	    file_name = os.path.basename(file_path)

	    # Point the session at the new file and reset it to the initial state.
	    session_manager.update_session(session_id, {
	        "current_file": file_path,
	        "state": ConversationState.INITIAL,
	    })

	    # Leave a system message in the session recording the upload.
	    session_manager.add_message(
	        session_id,
	        "system",
	        f"File uploaded: {file_name}",
	    )

	    # Ask for the size directly instead of exists()-then-getsize(): the file
	    # can disappear (or be unreadable) between the two calls, and a failed
	    # size lookup should not abort the upload handler.
	    try:
	        size_bytes = os.path.getsize(file_path)
	    except OSError:
	        size_bytes = 0

	    status = {
	        "status": "success",
	        "message": f"File '{file_name}' uploaded successfully",
	        "file_info": {
	            "name": file_name,
	            "path": file_path,
	            "size_bytes": size_bytes,
	        },
	        "next_action": "💬 Now tell me what you'd like to do with this document",
	    }

	    return file_path, json.dumps(status, indent=2), session_id


	def format_chat_history(history, new_user_msg, new_assistant_msg):
	    """Build a role/content message list from prior history plus one new exchange.

	    Each history item is normalised on its own, so a history that mixes
	    the two supported shapes is handled correctly:

	    * a dict containing a ``"role"`` key is kept as-is;
	    * a 2-item list/tuple ``(user_msg, bot_msg)`` is expanded into a user
	      message and an assistant message, skipping any side that is ``None``;
	    * anything else is ignored.

	    Args:
	        history: Existing chat history (list of dicts and/or 2-item pairs),
	            or a falsy value when there is none. It is not modified.
	        new_user_msg: Content of the new user message.
	        new_assistant_msg: Content of the new assistant message.

	    Returns:
	        A new list of ``{"role": ..., "content": ...}`` dicts ending with
	        the new user message followed by the new assistant message.
	    """
	    messages = []

	    for item in history or []:
	        if isinstance(item, dict) and "role" in item:
	            # Already a role/content message.
	            messages.append(item)
	        elif isinstance(item, (list, tuple)) and len(item) == 2:
	            # Pair format: a None side means "no message", so emit nothing
	            # for it rather than a message whose content is None.
	            user_msg, bot_msg = item
	            if user_msg is not None:
	                messages.append({"role": "user", "content": user_msg})
	            if bot_msg is not None:
	                messages.append({"role": "assistant", "content": bot_msg})

	    # Add new messages
	    messages.append({"role": "user", "content": new_user_msg})
	    messages.append({"role": "assistant", "content": new_assistant_msg})

	    return messages


	def chatbot_response_streaming(message: str, history: List, session_id: str, file_path: str = None):
	"""
	Handle chat messages with streaming updates
	Uses intent classification + Bedrock (priority) → Gemini (fallback) for both generation and execution
	"""
	# Get or create session
	session = session_manager.get_session(session_id)
	if not session:
	session_id = create_new_session()
	session = session_manager.get_session(session_id)

	# Update file path if provided
	if file_path:
	session_manager.update_session(session_id, {"current_file": file_path})
	session = session_manager.get_session(session_id)

	# Add user message to session
	session_manager.add_message(session_id, "user", message)

	current_state = session.get("state", ConversationState.INITIAL)

	# ========================
	# CLASSIFY USER INTENT
	# ========================
	intent_data = intent_classifier.classify_intent(message)

	# ========================
	# HANDLE CASUAL CHAT & QUESTIONS
	# ========================
	if intent_data["intent"] in ["casual_chat", "question"] and current_state == ConversationState.INITIAL:
	friendly_response = intent_classifier.get_friendly_response(intent_data["intent"], message)
	session_manager.add_message(session_id, "assistant", friendly_response)
	yield format_chat_history(history, message, friendly_response)
	return

	# ========================
	# HANDLE UNCLEAR INTENT
	# ========================
	if intent_data["intent"] == "unclear" and current_state == ConversationState.INITIAL:
	friendly_response = intent_classifier.get_friendly_response("unclear", message)
	session_manager.add_message(session_id, "assistant", friendly_response)
	yield format_chat_history(history, message, friendly_response)
	return

	# ========================
	# STATE: INITIAL - Generate Pipeline ONLY if intent requires it
	# ========================
	if current_state == ConversationState.INITIAL:
	# Only generate pipeline if user explicitly requested it
	if not intent_data.get("requires_pipeline", False):
	# Not a pipeline request - give friendly response
	friendly_response = "I'm here to help process documents! Please tell me what you'd like to do with your document.\n\nFor example:\n- 'extract text and summarize'\n- 'get tables from pages 2-5'\n- 'translate to Spanish'\n\nType 'help' to see all capabilities!"
	session_manager.add_message(session_id, "assistant", friendly_response)
	yield format_chat_history(history, message, friendly_response)
	return

	# Check if file is uploaded
	if not session.get("current_file"):
	response_text = "📁 Please upload a document first before I can process it!\n\nClick the 'Upload Document' button to get started."
	session_manager.add_message(session_id, "assistant", response_text)
	yield format_chat_history(history, message, response_text)
	return

	try:
	# Generate pipeline using Bedrock → Gemini fallback
	yield format_chat_history(history, message, "🤖 Analyzing your request and creating a pipeline...\n⏳ This will take just a moment...")

	pipeline = generate_pipeline(
	user_input=message,
	file_path=session.get("current_file"),
	prefer_bedrock=True
	)

	# Save proposed pipeline to session
	session_manager.update_session(session_id, {
	"proposed_pipeline": pipeline,
	"state": ConversationState.PIPELINE_PROPOSED
	})

	# Create user-friendly display
	pipeline_name = pipeline.get("pipeline_name", "Document Processing")
	steps_list = pipeline.get("pipeline_steps", [])
	steps_summary = "\n".join([f" {i+1}. {step.get('tool', 'Unknown')}" for i, step in enumerate(steps_list)])

	friendly_display = f"""🎯 Pipeline Created: {pipeline_name}

	Here's what I'll do:
	{steps_summary}

	Ready to proceed?
	- Type 'approve' or 'yes' to execute
	- Type 'reject' or 'no' to cancel
	- Describe changes to modify the plan"""

	# Add technical details in collapsible format
	response_text = friendly_display + f"\n\n<details>\n<summary>📊 Technical Details (for developers)</summary>\n\n```json\n{json.dumps(pipeline, indent=2)}\n```\n</details>"

	session_manager.add_message(session_id, "assistant", response_text)
	yield format_chat_history(history, message, response_text)
	return

	except Exception as e:
	error_response = f"❌ Oops! I encountered an error while creating the pipeline:\n\n{str(e)}\n\nPlease try rephrasing your request or type 'help' for examples."
	session_manager.add_message(session_id, "assistant", error_response)
	yield format_chat_history(history, message, error_response)
	return


	# ========================
	# STATE: PIPELINE_PROPOSED - Handle Approval/Rejection
	# ========================
	elif current_state == ConversationState.PIPELINE_PROPOSED:
	user_input = message.lower().strip()

	# APPROVE - Execute the pipeline
	if "approve" in user_input or "yes" in user_input:
	session_manager.update_session(session_id, {"state": ConversationState.EXECUTING})

	plan = session.get("proposed_pipeline", {})

	# Initial status - User-friendly
	initial_message = f"✅ Approved! Starting execution of: {plan.get('pipeline_name', 'pipeline')}\n\n🚀 Processingplease wait...\n_(Using {plan.get('_generator', 'AI')} - {plan.get('_model', 'model')})_"
	yield format_chat_history(history, message, initial_message)

	steps_completed = []
	final_payload = None
	executor_used = "unknown"
	progress_messages = []

	try:
	# Execute pipeline with Bedrock → CrewAI fallback
	for event in execute_pipeline_streaming(
	pipeline=plan,
	file_path=session.get("current_file"),
	session_id=session_id,
	prefer_bedrock=True
	):
	event_type = event.get("type")

	# Info events (fallback notifications, etc.)
	if event_type == "info":
	info_message = f"ℹ️ {event.get('message')}\n_(Executor: {event.get('executor', 'unknown')})_"
	progress_messages.append(info_message)
	accumulated_response = initial_message + "\n\n" + "\n".join(progress_messages)
	yield format_chat_history(history, message, accumulated_response)

	# Step updates
	elif event_type == "step":
	step_info = {
	"step": event.get("step", 0),
	"tool": event.get("tool", "processing"),
	"status": event.get("status", "running"),
	"executor": event.get("executor", "unknown")
	}

	# Add observation if available (tool output)
	if "observation" in event:
	step_info["observation"] = event.get("observation")

	# Add tool input if available
	if "input" in event:
	step_info["input"] = event.get("input")

	steps_completed.append(step_info)
	executor_used = event.get("executor", executor_used)

	# Create user-friendly progress message
	step_num = event.get('step', 0)
	tool_name = event.get('tool', 'processing')

	if event.get('status') == 'completed' and 'observation' in event:
	obs_preview = str(event.get('observation'))[:80]
	step_message = f"✅ Step {step_num}: {tool_name} - Completed!\n _Preview: {obs_preview}..._"
	elif event.get('status') == 'executing':
	step_message = f"⏳ Step {step_num}: {tool_name} - Processing..."
	else:
	step_message = f"📍 Step {step_num}: {tool_name}"

	progress_messages.append(step_message)
	accumulated_response = initial_message + "\n\n" + "\n\n".join(progress_messages)
	yield format_chat_history(history, message, accumulated_response)



	# Final result
	elif event_type == "final":
	final_payload = event.get("data")
	executor_used = event.get("executor", executor_used)

	# Error
	elif event_type == "error":
	error_msg = event.get("error", "Unknown error")
	friendly_error = f"❌ Pipeline Failed\n\nError: {error_msg}\n\nCompleted {len(steps_completed)} step(s) before failure.\n\nWhat would you like to do next?"
	session_manager.update_session(session_id, {"state": ConversationState.INITIAL})
	session_manager.add_message(session_id, "assistant", friendly_error)
	yield format_chat_history(history, message, friendly_error)
	return

	# Process final result
	if final_payload:
	session_manager.update_session(session_id, {
	"pipeline_result": final_payload,
	"state": ConversationState.INITIAL
	})

	# Save execution to MongoDB
	session_manager.save_pipeline_execution(
	session_id=session_id,
	pipeline=plan,
	result=final_payload,
	file_path=session.get("current_file"),
	executor=executor_used
	)

	# Create user-friendly final response
	success_count = len([s for s in steps_completed if s.get("status") == "completed"])
	friendly_final = f"""🎉 Pipeline Completed Successfully!

	Summary:
	- Pipeline: {plan.get('pipeline_name', 'Document Processing')}
	- Total Steps: {len(steps_completed)}
	- Successful: {success_count}
	- Executor: {executor_used}

	✅ All done! What else would you like me to help you with?

	<details>
	<summary>📊 Detailed Results (for developers)</summary>

	```json
	{json.dumps({"status": "completed", "executor": executor_used, "pipeline": plan.get("pipeline_name"), "result": final_payload, "steps": steps_completed}, indent=2)}
	```
	</details>"""
	final_response = friendly_final
	else:
	final_response = f"✅ Pipeline Completed!\n\nExecuted {len(steps_completed)} steps using {executor_used}.\n\nReady for your next task!"
	session_manager.update_session(session_id, {"state": ConversationState.INITIAL})

	session_manager.add_message(session_id, "assistant", final_response)
	yield format_chat_history(history, message, final_response)
	return

	except Exception as e:
	friendly_error = f"❌ Pipeline Execution Failed\n\nError: {str(e)}\n\nCompleted {len(steps_completed)} step(s) before failure.\n\n<details>\n<summary>📋 Error Details</summary>\n\n```\n{str(e)}\n```\n</details>\n\nWould you like to try again with a different approach?"
	session_manager.update_session(session_id, {"state": ConversationState.INITIAL})
	session_manager.add_message(session_id, "assistant", friendly_error)
	yield format_chat_history(history, message, friendly_error)
	return

	# REJECT - Cancel the pipeline
	elif "reject" in user_input or "no" in user_input:
	session_manager.update_session(session_id, {
	"state": ConversationState.INITIAL,
	"proposed_pipeline": None
	})
	friendly_rejection = "👍 No problem! Pipeline cancelled.\n\nWhat else would you like me to help you with?"
	session_manager.add_message(session_id, "assistant", friendly_rejection)
	yield format_chat_history(history, message, friendly_rejection)
	return

	# EDIT - Request modifications
	elif "edit" in user_input or "modify" in user_input:
	current_pipeline = session.get("proposed_pipeline", {})
	friendly_edit_help = f"""📝 Edit Mode

	Current pipeline: {current_pipeline.get('pipeline_name', 'Unknown')}

	Describe what you'd like to change. For example:
	- "Add summarization at the end"
	- "Remove table extraction"
	- "Only process pages 1-3"
	- "Translate to French instead of Spanish"

	Or type 'approve' to run the current plan as-is."""
	session_manager.add_message(session_id, "assistant", friendly_edit_help)
	yield format_chat_history(history, message, friendly_edit_help)
	return

	# Try to modify pipeline based on user input
	else:
	if len(message.strip()) > 5:
	try:
	original_plan = session.get("proposed_pipeline", {})
	edit_context = f"Original: {original_plan.get('pipeline_name')}. User wants: {message}"

	# Generate new pipeline with modification
	new_pipeline = generate_pipeline(
	user_input=edit_context,
	file_path=session.get("current_file"),
	prefer_bedrock=True
	)

	session_manager.update_session(session_id, {
	"proposed_pipeline": new_pipeline,
	"state": ConversationState.PIPELINE_PROPOSED
	})

	formatted = format_pipeline_for_display(new_pipeline)
	response = formatted + f"\n\n```json\n{json.dumps(new_pipeline, indent=2)}\n```"
	session_manager.add_message(session_id, "assistant", response)
	yield format_chat_history(history, message, response)
	return

	except Exception as e:
	error_response = {
	"status": "edit_failed",
	"error": str(e),
	"message": "Could not modify the plan",
	"action": "Try 'approve' to run as-is, or 'reject' to start over"
	}
	response = f"```json\n{json.dumps(error_response, indent=2)}\n```"
	session_manager.add_message(session_id, "assistant", response)
	yield format_chat_history(history, message, response)
	return

	# Default waiting message
	response_data = {
	"status": "waiting_for_confirmation",
	"message": "Please type 'approve', 'reject', or describe changes",
	"hint": "You can also say 'edit' for modification hints"
	}
	response = f"```json\n{json.dumps(response_data, indent=2)}\n```"
	session_manager.add_message(session_id, "assistant", response)
	yield format_chat_history(history, message, response)
	return

	# Default fallback
	response = json.dumps({"status": "ready", "message": "Ready for your next instruction"}, indent=2)
	session_manager.add_message(session_id, "assistant", response)
	yield format_chat_history(history, message, response)


	# ========================
	# GRADIO UI
	# ========================

	# Simple Blocks initialization for HF Spaces compatibility (older Gradio version)
	with gr.Blocks(title="MasterLLM v2.0 - AI Pipeline Orchestrator") as demo:
	    gr.Markdown("""
	# 🤖 MasterLLM v2.0 - AI Pipeline Orchestrator

	🏆 Bedrock Priority with Gemini Fallback | 💾 MongoDB Sessions | 📡 Complete REST API

	Upload a document, describe what you want, and watch AI orchestrate the perfect pipeline!
	""")

	    # State management
	    # The value below is evaluated once, when this module is imported, so on
	    # its own it would hand the SAME session id to every browser session.
	    # It is kept only as a fallback; the demo.load event further down
	    # replaces it with a fresh session on every page load.
	    session_id_state = gr.State(value=create_new_session())
	    file_state = gr.State(value=None)

	    def _short_session_id(session_id):
	        """Return the abbreviated id shown in the "Session ID" box ("" if unset)."""
	        return session_id[:8] + "..." if session_id else ""

	    def _start_session():
	        """Create a session for one page load.

	        Returns a (session id, display text) pair matching the
	        [session_id_state, session_display] outputs of the load event.
	        """
	        new_id = create_new_session()
	        return new_id, _short_session_id(new_id)

	    def _reset_chat():
	        """Clear the UI and start a new session.

	        The returned tuple follows the order of the clear_btn outputs list.
	        """
	        new_id = create_new_session()
	        return [], new_id, None, None, "", "", _short_session_id(new_id)

	    with gr.Row():
	        with gr.Column(scale=3):
	            # Chat interface - Gradio auto-detects format from data structure
	            chatbot = gr.Chatbot(label="Chat")

	            # Text input
	            msg = gr.Textbox(
	                placeholder="💬 Type your instruction... (e.g., 'extract text from pages 1-5 and summarize')",
	                label="Your Message",
	                lines=2,
	                max_lines=4,
	            )

	            with gr.Row():
	                submit_btn = gr.Button("🚀 Send", variant="primary", scale=2)
	                clear_btn = gr.Button("🗑️ Clear Chat", scale=1)

	        with gr.Column(scale=1):
	            # File upload section
	            gr.Markdown("### 📁 Upload Document")
	            file_upload = gr.File(
	                label="PDF or Image",
	                file_types=[".pdf", ".png", ".jpg", ".jpeg", ".gif", ".bmp"],
	                type="filepath",
	            )

	            upload_status = gr.Textbox(
	                label="📊 Upload Status",
	                interactive=False,
	                lines=10,
	                max_lines=15,
	            )

	            # Session info
	            gr.Markdown("### 🔗 Session Info")
	            # Static placeholder; the load / upload / clear events keep this
	            # box in sync with the per-user session_id_state.
	            session_display = gr.Textbox(
	                label="Session ID",
	                interactive=False,
	                value=_short_session_id(session_id_state.value),
	            )

	            # Examples
	            gr.Markdown("### 💡 Example Pipelines")
	            gr.Examples(
	                examples=[
	                    "extract text from pages 1-5",
	                    "extract text and summarize",
	                    "extract text, tables, and translate to Spanish",
	                    "get tables from pages 2-4 and summarize",
	                    "text-classify-ner from entire document",
	                    "describe images and summarize findings",
	                    "extract text, detect signatures and stamps",
	                ],
	                inputs=msg,
	            )

	            # System info
	            gr.Markdown("""
	### ℹ️ System Features
	- ✅ Bedrock (Claude 3.5 Sonnet) priority
	- ✅ Gemini (gemini-2.0-flash) fallback
	- ✅ MongoDB session persistence
	- ✅ Streaming real-time updates
	- ✅ Component-level JSON output
	- ✅ REST API for integration

	### 📊 Pipeline Flow:
	1. Upload your document
	2. Describe what you want
	3. Review AI-generated pipeline
	4. Approve to execute
	5. Watch streaming updates
	6. Get complete JSON results
	""")

	    # Event handlers

	    # Give every browser page load its own session instead of the shared
	    # import-time one, and show its abbreviated id.
	    demo.load(
	        fn=_start_session,
	        outputs=[session_id_state, session_display],
	    )

	    # The upload handler also writes session_id_state, so refresh the
	    # displayed id once it has finished.
	    file_upload.upload(
	        fn=handle_file_upload,
	        inputs=[file_upload, session_id_state],
	        outputs=[file_state, upload_status, session_id_state],
	    ).then(
	        _short_session_id,
	        inputs=session_id_state,
	        outputs=session_display,
	    )

	    # Pressing Enter in the textbox and clicking "Send" behave identically:
	    # stream the chatbot response, then empty the input box.
	    for send_event in (msg.submit, submit_btn.click):
	        send_event(
	            fn=chatbot_response_streaming,
	            inputs=[msg, chatbot, session_id_state, file_state],
	            outputs=[chatbot],
	        ).then(
	            lambda: "",
	            outputs=msg,
	        )

	    clear_btn.click(
	        fn=_reset_chat,
	        outputs=[
	            chatbot,
	            session_id_state,
	            file_state,
	            file_upload,
	            msg,
	            upload_status,
	            session_display,
	        ],
	    )

	# Mount the Gradio UI (`demo`) on the FastAPI application at the root path "/".
	# `app` is rebound to the object returned by gr.mount_gradio_app; that object
	# is what uvicorn.run() serves in the launch block below.
	app = gr.mount_gradio_app(app, demo, path="/")


	# ========================
	# LAUNCH
	# ========================

	if __name__ == "__main__":
	    # Script entry point: print a startup banner, then serve `app` with uvicorn.
	    import uvicorn

	    # The PORT environment variable overrides the default of 7860.
	    port = int(os.getenv("PORT", 7860))

	    startup_banner = f"""
	╔════════════════════════════════════════════════════════════╗
	║ ║
	║ 🚀 MasterLLM v2.0 Starting... ║
	║ ║
	║ 🌐 Gradio UI: http://localhost:{port} ║
	║ 📡 REST API: http://localhost:{port}/api/v1 ║
	║ 📚 API Docs: http://localhost:{port}/docs ║
	║ ║
	║ 🏆 Bedrock: Priority (Claude 3.5 Sonnet) ║
	║ 🔄 Gemini: Fallback (gemini-2.0-flash) ║
	║ 💾 MongoDB: Session management ║
	║ ║
	╚════════════════════════════════════════════════════════════╝
	"""
	    print(startup_banner)

	    # Listen on all interfaces on the chosen port.
	    uvicorn.run(app, host="0.0.0.0", port=port)