Spaces:

nothingworry
/

IntegraChat

Sleeping

App Files Files Community

IntegraChat / app.py

nothingworry

Fix Docker container startup conflicts and improve error diagnostics

62e82b2 8 days ago

raw

history blame

120 kB

	import gradio as gr
	import requests
	import json
	import os
	import sys
	from pathlib import Path
	from collections import Counter
	from datetime import datetime
	from dotenv import load_dotenv
	load_dotenv()

	# Plotly is optional: when the import fails, `go` is None and the
	# PLOTLY_AVAILABLE flag lets chart-building code skip itself.
	try:
	    import plotly.graph_objects as go
	except ImportError:
	    go = None
	PLOTLY_AVAILABLE = go is not None

	# Base URL of the backend API; taken from the environment when set.
	BACKEND_BASE_URL = os.environ.get("BACKEND_BASE_URL", "http://localhost:8000")

	# Role-based access control permissions
	DEFAULT_ROLE = "viewer"
	VALID_ROLES = [DEFAULT_ROLE, "editor", "admin", "owner"]

	def can_manage_rules(role: str) -> bool:
	    """Return True when *role* may manage rules (admin or owner only)."""
	    rule_managers = ("admin", "owner")
	    return role in rule_managers

	def can_ingest_documents(role: str) -> bool:
	    """Return True when *role* may ingest documents (editor, admin or owner)."""
	    ingest_roles = ("editor", "admin", "owner")
	    return role in ingest_roles

	def can_delete_documents(role: str) -> bool:
	    """Return True when *role* may delete documents (admin or owner only)."""
	    deleters = ("admin", "owner")
	    return role in deleters

	def can_view_analytics(role: str) -> bool:
	    """Return True when *role* may view analytics (any role in VALID_ROLES)."""
	    # Every known role is allowed; only unrecognised values are rejected.
	    is_known_role = role in VALID_ROLES
	    return is_known_role


	def convert_history_to_tuples(history):
	    """
	    Convert history from dict format to tuple format for Gradio 4.20.0 compatibility.

	    Input format: [{"role": "user", "content": "..."}, {"role": "assistant", "content": "..."}]
	    Output format: [("user message", "assistant response"), ...]

	    No user or assistant message is dropped: a message that has no partner
	    (an assistant message with no preceding user message, a user message
	    that never got a reply, or a second consecutive assistant message) is
	    emitted as its own pair with "" on the missing side. Dicts with any
	    other role, and items that are neither dicts nor 2-element sequences,
	    are skipped.

	    Args:
	        history: Chat history in dict format, in tuple format, or empty/None.

	    Returns:
	        A list of (user, assistant) pairs. If ``history`` is already in
	        tuple format (judged by its first item) the same object is returned
	        unchanged, not a copy.
	    """
	    if not history:
	        return []

	    # If already in tuple format, return as-is
	    first_item = history[0]
	    if isinstance(first_item, (tuple, list)) and len(first_item) == 2:
	        return history

	    def as_pair(user_text, assistant_text):
	        """Build a pair, replacing a missing (None) side with an empty string."""
	        return (
	            "" if user_text is None else user_text,
	            "" if assistant_text is None else assistant_text,
	        )

	    result = []
	    pending_user = None
	    pending_assistant = None

	    for item in history:
	        if isinstance(item, dict):
	            item_role = item.get("role")
	            if item_role == "user":
	                # A new user turn closes whatever pair was being assembled,
	                # even if that pair never received an assistant reply.
	                if pending_user is not None or pending_assistant is not None:
	                    result.append(as_pair(pending_user, pending_assistant))
	                pending_user = item.get("content", "")
	                pending_assistant = None
	            elif item_role == "assistant":
	                # A second assistant message in a row starts a new pair
	                # instead of overwriting the previous reply.
	                if pending_assistant is not None:
	                    result.append(as_pair(pending_user, pending_assistant))
	                    pending_user = None
	                pending_assistant = item.get("content", "")
	        elif isinstance(item, (tuple, list)) and len(item) == 2:
	            # Already in tuple format: flush the pending pair first so the
	            # output keeps the input order.
	            if pending_user is not None or pending_assistant is not None:
	                result.append(as_pair(pending_user, pending_assistant))
	                pending_user = None
	                pending_assistant = None
	            result.append(tuple(item))

	    # Add the last pair if one is still pending
	    if pending_user is not None or pending_assistant is not None:
	        result.append(as_pair(pending_user, pending_assistant))

	    return result


	def append_to_history(history, role, content):
	    """
	    Add one message to a tuple-format history (Gradio 4.20.0 style).

	    A "user" message opens a new (content, "") pair. An "assistant" message
	    replaces the assistant half of the last pair, or opens ("", content)
	    when there is no usable last pair. Any other role leaves the history
	    untouched. The normalised history list is returned.
	    """
	    pairs = convert_history_to_tuples(history)

	    if role == "user":
	        # New turn: the assistant slot stays empty until a reply arrives.
	        pairs.append((content, ""))
	        return pairs

	    if role != "assistant":
	        return pairs

	    if pairs and len(pairs[-1]) == 2:
	        # Keep the user half of the last pair, swap in the new reply.
	        pairs[-1] = (pairs[-1][0], content)
	    else:
	        # No user message to attach to: pair the reply with an empty user.
	        pairs.append(("", content))
	    return pairs


	def update_last_assistant_message(history, content):
	    """
	    Replace the assistant half of the final pair in a tuple-format history.

	    The history is normalised first; when it is empty or its last entry is
	    not a 2-item pair, it is returned without modification.
	    """
	    pairs = convert_history_to_tuples(history)
	    if not pairs or len(pairs[-1]) != 2:
	        return pairs
	    last_user = pairs[-1][0]
	    pairs[-1] = (last_user, content)
	    return pairs


	def chat_with_agent(message, tenant_id, role, history):
	    """
	    Send a message to the backend agent streaming endpoint and stream the reply.

	    The request goes to ``{BACKEND_BASE_URL}/agent/message/stream``. The
	    response is read line by line: ``data: {...}`` lines carry either a
	    status message (shown temporarily with an hourglass prefix), a
	    ``token`` to append to the reply, or a ``done`` flag; ``error:{...}``
	    lines end the stream with an error message. Failures are reported as
	    the assistant's reply rather than raised.

	    Note: ``conversation_history`` is always sent empty, so earlier turns
	    are not forwarded to the backend by this function.

	    Args:
	        message: User's message text.
	        tenant_id: Tenant ID, sent in the payload and the x-tenant-id header.
	        role: User role for the x-user-role header; DEFAULT_ROLE when empty.
	        history: Chat history (dict or tuple format; converted to tuples).

	    Yields:
	        The tuple-format chat history after each update.
	    """
	    # Convert history to tuple format for Gradio 4.20.0 compatibility
	    history = convert_history_to_tuples(history)

	    if not message or not message.strip():
	        yield history
	        return

	    if not tenant_id or not tenant_id.strip():
	        error_msg = "Please enter a Tenant ID before sending a message."
	        history = append_to_history(history, "user", message)
	        history = append_to_history(history, "assistant", error_msg)
	        yield history
	        return

	    # Add user message to history
	    history = append_to_history(history, "user", message)

	    # Backend streaming endpoint
	    backend_url = f"{BACKEND_BASE_URL}/agent/message/stream"

	    # Prepare request payload
	    payload = {
	        "tenant_id": tenant_id.strip(),
	        "message": message,
	        "user_id": None,
	        "conversation_history": [],
	        "temperature": 0.0
	    }

	    # Prepare headers with role
	    headers = {
	        "Content-Type": "application/json",
	        "x-tenant-id": tenant_id.strip(),
	        "x-user-role": role if role else DEFAULT_ROLE
	    }

	    try:
	        # The context manager closes the streamed connection on every exit
	        # path: normal end, early break, error, or the consumer closing
	        # this generator.
	        with requests.post(
	            backend_url,
	            json=payload,
	            headers=headers,
	            stream=True,
	            timeout=120
	        ) as response:
	            if response.status_code != 200:
	                error_msg = f"Error {response.status_code}: {response.text}"
	                history = append_to_history(history, "assistant", error_msg)
	                yield history
	                return

	            # Initialize assistant message
	            assistant_message = ""
	            history = append_to_history(history, "assistant", assistant_message)
	            yield history  # Yield initial empty message

	            for line_bytes in response.iter_lines():
	                if not line_bytes:
	                    continue
	                try:
	                    line = line_bytes.decode('utf-8').strip()
	                except UnicodeDecodeError:
	                    continue
	                if not line:
	                    continue

	                if line.startswith('data: '):
	                    try:
	                        data = json.loads(line[6:])  # Remove 'data: ' prefix
	                    except json.JSONDecodeError:
	                        continue
	                    if not isinstance(data, dict):
	                        # Only JSON objects carry status/token/done fields.
	                        continue

	                    # Handle status messages
	                    if 'status' in data:
	                        status_msg = data.get('message', '')
	                        if status_msg:
	                            # Show status in the message temporarily
	                            history = update_last_assistant_message(history, f"⏳ {status_msg}")
	                            yield history
	                        continue

	                    # Handle tokens
	                    token = data.get('token', '')
	                    if token:
	                        assistant_message += token
	                        # Update the last message in history
	                        history = update_last_assistant_message(history, assistant_message)
	                        yield history

	                    if data.get('done', False):
	                        break
	                elif line.startswith('error:'):
	                    # Only the parsing is guarded. The yield stays outside
	                    # the try so a GeneratorExit raised at the yield is
	                    # never swallowed.
	                    try:
	                        error_data = json.loads(line[6:])
	                        error_msg = error_data.get('error', 'Unknown error')
	                    except (json.JSONDecodeError, AttributeError):
	                        continue
	                    history = update_last_assistant_message(history, f"❌ Error: {error_msg}")
	                    yield history
	                    break

	    except requests.exceptions.ConnectionError:
	        error_msg = (
	            "❌ Connection Error: Could not connect to backend. "
	            f"Please ensure the FastAPI server is running at {BACKEND_BASE_URL}"
	        )
	        history = append_to_history(history, "assistant", error_msg)
	        yield history

	    except requests.exceptions.Timeout:
	        error_msg = "⏱️ Request Timeout: The backend took longer than 2 minutes to respond. This may happen if:\n- The LLM is processing a complex query\n- Multiple tools (RAG, Web Search) are being used\n- The backend is under heavy load\n\nPlease try again with a simpler query, or check if the backend services (Ollama, MCP servers) are running properly."
	        history = append_to_history(history, "assistant", error_msg)
	        yield history

	    except requests.exceptions.RequestException as e:
	        error_msg = f"❌ Request Error: {str(e)}"
	        history = append_to_history(history, "assistant", error_msg)
	        yield history

	    except Exception as e:
	        error_msg = f"❌ Unexpected Error: {str(e)}"
	        history = append_to_history(history, "assistant", error_msg)
	        yield history


	def get_reasoning_trace(tenant_id: str, role: str, message: str):
	    """
	    Fetch the reasoning trace and tool traces for a message from the
	    backend ``/agent/debug`` endpoint and format them as markdown.

	    The markdown has up to three sections: the reasoning path (one entry
	    per step), the tool invocations, and the final decision including any
	    routing hints, latency estimate and execution plan found in it.

	    Args:
	        tenant_id: Tenant ID, sent in the payload and the x-tenant-id header.
	        role: User role for the x-user-role header; DEFAULT_ROLE when empty.
	        message: The message to trace.

	    Returns:
	        The formatted markdown string, or an error string when the tenant
	        ID is missing, the backend answers with a non-200 status, or any
	        exception occurs while fetching or formatting.
	    """
	    if not tenant_id or not tenant_id.strip():
	        return "❗ Tenant ID is required."

	    try:
	        import re

	        headers = {
	            "Content-Type": "application/json",
	            "x-tenant-id": tenant_id.strip(),
	            "x-user-role": role if role else DEFAULT_ROLE
	        }
	        http_response = requests.post(
	            f"{BACKEND_BASE_URL}/agent/debug",
	            json={
	                "tenant_id": tenant_id.strip(),
	                "message": message,
	                "conversation_history": [],
	                "temperature": 0.0
	            },
	            headers=headers,
	            timeout=60
	        )

	        if http_response.status_code != 200:
	            return f"❌ Error {http_response.status_code}: {http_response.text}"

	        data = http_response.json()
	        response_data = data.get("response", {})
	        reasoning_trace = response_data.get("reasoning_trace", [])
	        tool_traces = response_data.get("tool_traces", [])
	        decision = response_data.get("decision", {})

	        # Markdown fragments, joined once at the end.
	        parts = ["## 🧠 Reasoning Path\n\n"]

	        # Format reasoning trace with latency predictions and context hints
	        for idx, step in enumerate(reasoning_trace, 1):
	            step_name = step.get("step", "unknown")
	            parts.append(f"### {idx}. {step_name.replace('_', ' ').title()}\n")

	            if step.get("intent"):
	                parts.append(f"- Intent: {step['intent']}\n")
	            if step.get("match_count"):
	                parts.append(f"- Rule Matches: {step['match_count']}\n")
	            if step.get("hit_count"):
	                parts.append(f"- RAG Hits: {step['hit_count']}\n")
	            if step.get("top_score"):
	                parts.append(f"- Top RAG Score: {step['top_score']:.3f}\n")
	            if step.get("latency_ms"):
	                parts.append(f"- Actual Latency: {step['latency_ms']}ms\n")
	            if step.get("decision"):
	                dec = step["decision"]
	                parts.append(f"- Tool: {dec.get('tool', 'N/A')}\n")
	                parts.append(f"- Action: {dec.get('action', 'N/A')}\n")
	                # Show latency prediction if available
	                if dec.get("tool_input") and isinstance(dec["tool_input"], dict):
	                    est_latency = dec["tool_input"].get("_estimated_latency_ms")
	                    if est_latency:
	                        parts.append(f"- ⚡ Estimated Latency: {est_latency}ms\n")
	            parts.append("\n")

	        # Format tool traces with schema information
	        if tool_traces:
	            parts.append("## ⚙️ Tool Invocations\n\n")
	            for idx, tool in enumerate(tool_traces, 1):
	                tool_name = tool.get("tool", tool.get("tool_name", "unknown"))
	                # Distinct name so the HTTP response is not shadowed. A
	                # non-dict payload is treated as "no details" instead of
	                # aborting the whole trace.
	                tool_response = tool.get("response", {})
	                if not isinstance(tool_response, dict):
	                    tool_response = {}
	                latency = tool.get("latency_ms", tool_response.get("latency_ms", 0))
	                status = tool.get("status", "success")

	                parts.append(f"### {idx}. {tool_name.upper()}\n")
	                parts.append(f"- Status: {status}\n")
	                parts.append(f"- Latency: {latency}ms\n")

	                # Show latency reported inside the tool response
	                if tool_response.get("latency_ms"):
	                    actual = tool_response["latency_ms"]
	                    parts.append(f"- ⚡ Actual vs Estimated: {actual}ms\n")

	                # Show schema-validated output structure
	                if tool_name == "rag" and "results" in tool_response:
	                    parts.append("- 📊 Schema: Valid RAG output\n")
	                    parts.append(f"- Results: {len(tool_response.get('results', []))} chunks\n")
	                    parts.append(f"- Top Score: {tool_response.get('top_score', 0):.3f}\n")
	                elif tool_name == "web" and "results" in tool_response:
	                    parts.append("- 📊 Schema: Valid Web output\n")
	                    parts.append(f"- Results: {len(tool_response.get('results', []))} items\n")
	                elif tool_name == "admin" and "violations" in tool_response:
	                    parts.append("- 📊 Schema: Valid Admin output\n")
	                    parts.append(f"- Violations: {len(tool_response.get('violations', []))}\n")
	                elif tool_name == "llm" and "text" in tool_response:
	                    parts.append("- 📊 Schema: Valid LLM output\n")
	                    parts.append(f"- Tokens: {tool_response.get('tokens_used', 0)}\n")

	                if tool.get("result_count"):
	                    parts.append(f"- Result Count: {tool['result_count']}\n")
	                parts.append("\n")

	        # Format decision with context-aware routing and latency info
	        if decision:
	            parts.append("## 🎯 Final Decision\n\n")
	            parts.append(f"- Tool: {decision.get('tool', 'N/A')}\n")
	            parts.append(f"- Action: {decision.get('action', 'N/A')}\n")
	            if decision.get("reason"):
	                reason = decision["reason"]
	                parts.append(f"- Reason: {reason}\n")
	                reason_lower = reason.lower()

	                # Extract and highlight context-aware routing hints
	                if "context:" in reason_lower:
	                    parts.append("\n### 🧠 Context-Aware Routing:\n")
	                    if "skip web" in reason_lower or "rag high" in reason_lower:
	                        parts.append("- ⚡ RAG high score → Web search skipped\n")
	                    if "skip rag" in reason_lower or "memory" in reason_lower:
	                        parts.append("- 💾 Relevant memory available → RAG skipped\n")
	                    if "skip reasoning" in reason_lower or "critical" in reason_lower:
	                        parts.append("- 🚨 Critical violation → Agent reasoning skipped\n")

	                # Extract latency estimates
	                if "latency:" in reason_lower or "est." in reason_lower:
	                    latency_match = re.search(r'latency[:\s]+(\d+)ms', reason, re.IGNORECASE)
	                    if latency_match:
	                        parts.append("\n### ⚡ Latency Prediction:\n")
	                        parts.append(f"- Estimated Total Latency: {latency_match.group(1)}ms\n")

	            # Show tool sequence with latency estimates
	            tool_input = decision.get("tool_input")
	            if tool_input and isinstance(tool_input, dict):
	                steps = tool_input.get("steps", [])
	                if steps:
	                    parts.append("\n### 📋 Tool Execution Plan:\n")
	                    total_est_latency = 0
	                    for step_idx, plan_step in enumerate(steps, 1):
	                        if not isinstance(plan_step, dict):
	                            continue
	                        if "parallel" in plan_step:
	                            parts.append(f"{step_idx}. Parallel Execution: RAG + Web\n")
	                            total_est_latency += max(90, 800)  # Max of RAG and Web
	                        elif plan_step.get("tool"):
	                            planned_tool = plan_step["tool"]
	                            step_input = plan_step.get("input", {})
	                            est_lat = (
	                                step_input.get("_estimated_latency_ms", 0)
	                                if isinstance(step_input, dict)
	                                else 0
	                            )
	                            if est_lat:
	                                total_est_latency += est_lat
	                                parts.append(f"{step_idx}. {planned_tool.upper()} (est. {est_lat}ms)\n")
	                            else:
	                                parts.append(f"{step_idx}. {planned_tool.upper()}\n")
	                    if total_est_latency > 0:
	                        parts.append(f"\n- Total Estimated Latency: {total_est_latency}ms\n")

	        return "".join(parts)
	    except Exception as e:
	        return f"❌ Error fetching reasoning trace: {str(e)}"


	def ingest_document(
	    tenant_id: str,
	    role: str,
	    source_type: str,
	    content: str,
	    document_url: str,
	    filename: str,
	    doc_id: str,
	    metadata_json: str
	):
	    """
	    Send a document to the backend ``/rag/ingest-document`` endpoint.

	    Args:
	        tenant_id: Tenant ID (required).
	        role: User role; DEFAULT_ROLE is used when empty. Must satisfy
	            can_ingest_documents.
	        source_type: Source kind; when it is "url" and ``document_url`` is
	            given, the URL is sent as the content.
	        content: Document text (used unless replaced by the URL).
	        document_url: Optional URL, also stored in the metadata.
	        filename: Optional filename stored in the metadata.
	        doc_id: Optional document ID stored in the metadata.
	        metadata_json: Optional JSON object merged into the metadata.

	    Returns:
	        A user-facing status string: a success message (with any extracted
	        metadata the backend returned) or a description of the failure.
	    """
	    # Debug: Log the role value
	    print(f"🔍 DEBUG: ingest_document received role='{role}' (type: {type(role)})", file=sys.stderr)

	    if not BACKEND_BASE_URL:
	        return "❌ Backend URL is not configured. Please set BACKEND_BASE_URL environment variable or ensure it defaults to http://localhost:8000"

	    if not tenant_id or not tenant_id.strip():
	        return "❗ Tenant ID is required to ingest documents."

	    # Ensure role is not None or empty
	    if not role or not role.strip():
	        role = DEFAULT_ROLE
	        print(f"⚠️ WARNING: Role was empty/None in ingest_document, defaulting to '{role}'", file=sys.stderr)
	    role = role.strip()

	    if not can_ingest_documents(role):
	        return "❌ Access Denied: You need Editor, Admin, or Owner role to ingest documents."

	    tenant_id = tenant_id.strip()

	    payload_content = content or ""
	    if source_type == "url" and document_url:
	        payload_content = document_url.strip()

	    metadata = {}
	    if filename:
	        metadata["filename"] = filename.strip()
	    if document_url:
	        metadata["url"] = document_url.strip()
	    if doc_id:
	        metadata["doc_id"] = doc_id.strip()

	    if metadata_json:
	        try:
	            extra_metadata = json.loads(metadata_json)
	        except json.JSONDecodeError as exc:
	            return f"❗ Invalid metadata JSON: {exc}"
	        if not isinstance(extra_metadata, dict):
	            return "❗ Metadata JSON must represent an object (key/value pairs)."
	        metadata.update(extra_metadata)

	    payload = {
	        "action": "ingest_document",
	        "tenant_id": tenant_id,
	        "source_type": source_type,
	        "content": payload_content,
	        "metadata": metadata
	    }

	    try:
	        # `role` was already normalised above, so it is used directly.
	        print(f"🔍 DEBUG: Sending request with role='{role}' in x-user-role header", file=sys.stderr)

	        headers = {
	            "Content-Type": "application/json",
	            "x-tenant-id": tenant_id,
	            "x-user-role": role
	        }
	        response = requests.post(
	            f"{BACKEND_BASE_URL}/rag/ingest-document",
	            json=payload,
	            headers=headers,
	            timeout=60
	        )
	        if response.status_code == 200:
	            data = response.json()
	            message = f"✅ Document ingested successfully.\n\n{data.get('message', '')}"

	            # Display extracted metadata if available
	            extracted_metadata = data.get('extracted_metadata', {})
	            if extracted_metadata:
	                message += "\n\n### 🤖 AI-Generated Metadata:\n"
	                if extracted_metadata.get('title'):
	                    message += f"- Title: {extracted_metadata['title']}\n"
	                if extracted_metadata.get('summary'):
	                    message += f"- Summary: {extracted_metadata['summary'][:200]}...\n"
	                if extracted_metadata.get('tags'):
	                    tags = ', '.join(extracted_metadata['tags'][:5])
	                    message += f"- Tags: {tags}\n"
	                if extracted_metadata.get('topics'):
	                    topics = ', '.join(extracted_metadata['topics'][:3])
	                    message += f"- Topics: {topics}\n"
	                if extracted_metadata.get('quality_score'):
	                    quality = extracted_metadata['quality_score']
	                    # Ten-cell bar: filled cells scale with the score.
	                    filled = int(quality * 10)
	                    quality_bar = "█" * filled + "░" * (10 - filled)
	                    message += f"- Quality Score: {quality:.2f} {quality_bar}\n"
	                if extracted_metadata.get('detected_date'):
	                    message += f"- Detected Date: {extracted_metadata['detected_date']}\n"
	                if extracted_metadata.get('extraction_method'):
	                    method = extracted_metadata['extraction_method'].upper()
	                    message += f"- Extraction Method: {method}\n"

	            return message
	        elif response.status_code == 403:
	            # Permission denied - show clear message. Fall back to the raw
	            # body when it is not a JSON object.
	            try:
	                error_detail = response.json().get('detail', response.text)
	            except (ValueError, AttributeError):
	                error_detail = response.text
	            return f"🔒 Permission Denied (403):\n\n{error_detail}\n\nSolution: Change your User Role dropdown (top right) from 'viewer' to 'editor', 'admin', or 'owner' and try again."
	        return f"❌ Ingestion failed ({response.status_code}): {response.text}"
	    except requests.exceptions.ConnectionError:
	        return "❌ Could not reach the backend. Make sure the FastAPI server is running."
	    except requests.exceptions.Timeout:
	        return "⏱️ The ingestion request timed out. Please try again."
	    except Exception as exc:
	        return f"❌ Unexpected error during ingestion: {exc}"


	def ingest_file(tenant_id: str, role: str, file_obj):
	    """
	    Upload a file to the backend ``/rag/ingest-file`` endpoint.

	    Args:
	        tenant_id: Tenant ID (required).
	        role: User role; stripped, DEFAULT_ROLE when empty. Must satisfy
	            can_ingest_documents.
	        file_obj: The uploaded file: either a path (str / path-like) or an
	            object whose ``name`` attribute is the path on disk.

	    Returns:
	        A user-facing status string: a success message (with any extracted
	        metadata the backend returned) or a description of the failure.
	    """
	    if not BACKEND_BASE_URL:
	        return "❌ Backend URL is not configured. Please set BACKEND_BASE_URL environment variable or ensure it defaults to http://localhost:8000"

	    if not tenant_id or not tenant_id.strip():
	        return "❗ Tenant ID is required to ingest files."
	    if file_obj is None:
	        return "❗ Please select a file to upload."

	    # Normalise the role the same way ingest_document does, so the
	    # permission check and the header always see the same value.
	    role = role.strip() if role and role.strip() else DEFAULT_ROLE

	    if not can_ingest_documents(role):
	        return "❌ Access Denied: You need Editor, Admin, or Owner role to ingest files."

	    tenant_id = tenant_id.strip()

	    try:
	        # A plain path has no usable `.name` (str) or a basename-only one
	        # (Path), so paths are taken as-is.
	        if isinstance(file_obj, (str, os.PathLike)):
	            file_path = Path(file_obj)
	        else:
	            file_path = Path(file_obj.name)
	        with open(file_path, "rb") as f:
	            file_bytes = f.read()

	        files = {
	            "file": (file_path.name, file_bytes, "application/octet-stream")
	        }
	        headers = {
	            "x-tenant-id": tenant_id,
	            "x-user-role": role
	        }
	        response = requests.post(
	            f"{BACKEND_BASE_URL}/rag/ingest-file",
	            files=files,
	            headers=headers,
	            timeout=120
	        )
	        if response.status_code == 200:
	            data = response.json()
	            message = f"✅ File ingested successfully.\n\n{data.get('message', '')}"

	            # Display extracted metadata if available
	            extracted_metadata = data.get('extracted_metadata', {})
	            if extracted_metadata:
	                message += "\n\n### 🤖 AI-Generated Metadata:\n"
	                if extracted_metadata.get('title'):
	                    message += f"- Title: {extracted_metadata['title']}\n"
	                if extracted_metadata.get('summary'):
	                    message += f"- Summary: {extracted_metadata['summary'][:200]}...\n"
	                if extracted_metadata.get('tags'):
	                    tags = ', '.join(extracted_metadata['tags'][:5])
	                    message += f"- Tags: {tags}\n"
	                if extracted_metadata.get('topics'):
	                    topics = ', '.join(extracted_metadata['topics'][:3])
	                    message += f"- Topics: {topics}\n"
	                if extracted_metadata.get('quality_score'):
	                    quality = extracted_metadata['quality_score']
	                    # Ten-cell bar: filled cells scale with the score.
	                    filled = int(quality * 10)
	                    quality_bar = "█" * filled + "░" * (10 - filled)
	                    message += f"- Quality Score: {quality:.2f} {quality_bar}\n"
	                if extracted_metadata.get('detected_date'):
	                    message += f"- Detected Date: {extracted_metadata['detected_date']}\n"
	                if extracted_metadata.get('extraction_method'):
	                    method = extracted_metadata['extraction_method'].upper()
	                    message += f"- Extraction Method: {method}\n"

	            return message
	        return f"❌ File ingestion failed ({response.status_code}): {response.text}"
	    except FileNotFoundError:
	        return "❌ Could not read the uploaded file."
	    except requests.exceptions.ConnectionError:
	        return "❌ Could not reach the backend. Make sure the FastAPI server is running."
	    except requests.exceptions.Timeout:
	        return "⏱️ File ingestion timed out. Please try again."
	    except Exception as exc:
	        return f"❌ Unexpected error during file ingestion: {exc}"


	def _format_rules_table(rules: list[str]) -> list[list]:
	    """Turn a list of rules into table rows of [1-based number, rule]."""
	    table = []
	    for number, rule in enumerate(rules, start=1):
	        table.append([number, rule])
	    return table


	def fetch_admin_rules(tenant_id: str, role: str) -> tuple[str, list[list]]:
	    """
	    Load the tenant's admin rules from the backend ``/admin/rules`` endpoint.

	    Returns a (summary, rows) pair: a markdown/status string and the table
	    rows built by _format_rules_table. On any failure the rows are empty
	    and the summary describes the problem.
	    """
	    if not (tenant_id and tenant_id.strip()):
	        return "❗ Tenant ID is required.", []

	    tenant_id = tenant_id.strip()
	    try:
	        request_headers = {
	            "x-tenant-id": tenant_id,
	            "x-user-role": role if role else DEFAULT_ROLE,
	        }
	        response = requests.get(
	            f"{BACKEND_BASE_URL}/admin/rules",
	            headers=request_headers,
	            timeout=30,
	        )
	        # Anything other than 200 is reported verbatim.
	        if response.status_code != 200:
	            return f"❌ Error {response.status_code}: {response.text}", []

	        rules = response.json().get("rules", [])
	        if rules:
	            return f"### Current Rules ({len(rules)})", _format_rules_table(rules)
	        return "✅ No admin rules have been configured yet.", []
	    except requests.exceptions.ConnectionError:
	        return "❌ Could not reach backend. Ensure the FastAPI server is running.", []
	    except requests.exceptions.Timeout:
	        return "⏱️ Request timed out. Please try again.", []
	    except Exception as exc:
	        return f"❌ Unexpected error: {exc}", []


	def extract_rules_from_file(file_path) -> str:
	    """
	    Extract rules text from an uploaded file (TXT, MD, PDF, DOC, DOCX).

	    Args:
	        file_path: A path (str or path-like), an object whose ``name``
	            attribute is the path on disk, or None.

	    Returns:
	        The extracted text; "" when ``file_path`` is None; or an error
	        message starting with "❌" when the file is missing, has an
	        unsupported extension, or cannot be read. Callers tell errors
	        apart by that prefix.
	    """
	    if file_path is None:
	        return ""

	    try:
	        # Paths are used as-is. Only non-path objects are resolved through
	        # `.name`; a pathlib.Path also has `.name`, but that is just the
	        # basename, so it must not take that branch.
	        if isinstance(file_path, (str, os.PathLike)):
	            file_path = Path(file_path)
	        else:
	            file_path = Path(file_path.name if hasattr(file_path, 'name') else file_path)

	        if not file_path.exists():
	            return f"❌ File not found: {file_path}"

	        file_ext = file_path.suffix.lower()

	        if file_ext in ('.txt', '.md'):
	            # Plain text files; undecodable bytes are dropped.
	            return file_path.read_text(encoding='utf-8', errors='ignore')

	        if file_ext == '.pdf':
	            # PDF files - use PyPDF2
	            try:
	                import PyPDF2
	                with open(file_path, 'rb') as f:
	                    pdf_reader = PyPDF2.PdfReader(f)
	                    # A page without extractable text contributes an empty
	                    # line rather than breaking the join.
	                    return '\n'.join(
	                        page.extract_text() or "" for page in pdf_reader.pages
	                    )
	            except ImportError:
	                return "❌ PDF extraction requires PyPDF2. Install with: pip install PyPDF2"
	            except Exception as e:
	                return f"❌ Failed to extract text from PDF: {str(e)}"

	        if file_ext in ('.doc', '.docx'):
	            # DOC/DOCX files - use python-docx
	            try:
	                from docx import Document
	                doc = Document(file_path)
	                return '\n'.join(paragraph.text for paragraph in doc.paragraphs)
	            except ImportError:
	                return "❌ DOCX extraction requires python-docx. Install with: pip install python-docx"
	            except Exception as e:
	                return f"❌ Failed to extract text from DOCX: {str(e)}"

	        return f"❌ Unsupported file type: {file_ext}. Supported: .txt, .md, .pdf, .doc, .docx"

	    except Exception as e:
	        return f"❌ Error reading file: {str(e)}"


	def add_admin_rules(tenant_id: str, role: str, rules_text: str, enhance: bool = True) -> str:
	    """
	    Add one or more admin rules for a tenant.

	    ``rules_text`` is split into lines; blank lines and lines starting with
	    "#" are ignored. A single rule is posted to ``/admin/rules``; several
	    rules are posted to ``/admin/rules/bulk`` in chunks of five so that one
	    request does not have to cover every rule.

	    Args:
	        tenant_id: Tenant ID (required).
	        role: User role; must satisfy can_manage_rules.
	        rules_text: Rules, one per line.
	        enhance: Sent to the backend as the ``enhance`` query parameter;
	            also selects the longer request timeouts.

	    Returns:
	        A user-facing summary of added rules, enhancement notes and errors,
	        or a validation / access-denied message.
	    """
	    if not tenant_id or not tenant_id.strip():
	        return "❗ Tenant ID is required."
	    if not rules_text or not rules_text.strip():
	        return "❗ Provide at least one rule to upload."

	    if not can_manage_rules(role):
	        return "❌ Access Denied: You need Admin or Owner role to manage rules."

	    tenant_id = tenant_id.strip()
	    # Filter out comment lines (starting with #) and empty lines
	    rules = [
	        rule.strip()
	        for rule in rules_text.splitlines()
	        if rule.strip() and not rule.strip().startswith("#")
	    ]
	    if not rules:
	        return "❗ No valid rules detected. (Comment lines starting with # are ignored)"

	    added = []
	    enhanced = []
	    errors = []

	    # Process rules in chunks to avoid timeout
	    CHUNK_SIZE = 5  # Process 5 rules at a time
	    total_rules = len(rules)

	    # Identical for every request below, so built once.
	    headers = {
	        "x-tenant-id": tenant_id,
	        "x-user-role": role if role else DEFAULT_ROLE
	    }
	    enhance_flag = "true" if enhance else "false"

	    if total_rules == 1:
	        # Single rule - use regular endpoint
	        only_rule = rules[0]
	        try:
	            resp = requests.post(
	                f"{BACKEND_BASE_URL}/admin/rules",
	                params={"rule": only_rule, "enhance": enhance_flag},
	                headers=headers,
	                timeout=60 if enhance else 15
	            )
	            if resp.status_code == 200:
	                data = resp.json()
	                added_rule = data.get("added_rule", only_rule)
	                added.append(added_rule)
	                if data.get("enhanced"):
	                    edge_cases = data.get("edge_cases", [])
	                    improvements = data.get("improvements", [])
	                    explanation = data.get("explanation", "")
	                    examples = data.get("examples", [])
	                    missing_patterns = data.get("missing_patterns", [])

	                    if explanation:
	                        enhanced.append(f"💡 Explanation: {explanation}")
	                    if examples:
	                        examples_list = "\n".join([f" • {ex}" for ex in examples[:5]])
	                        enhanced.append(f"📋 Examples:\n{examples_list}")
	                    if missing_patterns:
	                        patterns_list = "\n".join([f" • {p}" for p in missing_patterns[:5]])
	                        enhanced.append(f"🔍 Suggested Patterns:\n{patterns_list}")
	                    if edge_cases or improvements:
	                        enhanced.append(f"{added_rule}:")
	                        if improvements:
	                            enhanced.append(f" • Improvements: {', '.join(improvements[:3])}")
	                        if edge_cases:
	                            enhanced.append(f" • Edge cases identified: {len(edge_cases)}")
	            else:
	                errors.append(f"{only_rule} -> {resp.status_code}: {resp.text}")
	        except Exception as exc:
	            errors.append(f"{only_rule} -> {exc}")
	    else:
	        # Multiple rules - process in chunks
	        total_chunks = (total_rules + CHUNK_SIZE - 1) // CHUNK_SIZE
	        # Timeout per chunk: longer when enhancement is requested.
	        chunk_timeout = 180 if enhance else 30
	        for i in range(0, total_rules, CHUNK_SIZE):
	            chunk = rules[i:i + CHUNK_SIZE]
	            chunk_num = (i // CHUNK_SIZE) + 1

	            try:
	                resp = requests.post(
	                    f"{BACKEND_BASE_URL}/admin/rules/bulk",
	                    json={"rules": chunk},
	                    headers=headers,
	                    params={"enhance": enhance_flag},
	                    timeout=chunk_timeout
	                )
	                if resp.status_code == 200:
	                    data = resp.json()
	                    added.extend(data.get("added_rules", []))
	                    if data.get("enhanced"):
	                        chunk_enhanced = data.get("enhancement_summary", [])
	                        enhanced.extend([f"[Chunk {chunk_num}/{total_chunks}] {e}" for e in chunk_enhanced])

	                        # Add explanations for bulk rules if available
	                        if data.get("explanations"):
	                            for exp in data["explanations"][:3]:  # Show first 3 explanations
	                                if exp.get("explanation"):
	                                    enhanced.append(f"\n💡 {exp.get('rule', 'Rule')} Explanation: {exp['explanation']}")
	                                if exp.get("examples"):
	                                    examples_list = "\n".join([f" • {ex}" for ex in exp['examples'][:3]])
	                                    enhanced.append(f"📋 Examples:\n{examples_list}")
	                                if exp.get("missing_patterns"):
	                                    patterns_list = "\n".join([f" • {p}" for p in exp['missing_patterns'][:3]])
	                                    enhanced.append(f"🔍 Suggested Patterns:\n{patterns_list}")
	                else:
	                    errors.append(f"Chunk {chunk_num}/{total_chunks} failed: {resp.status_code}: {resp.text}")
	            except requests.exceptions.Timeout:
	                # Report the timeout that was actually applied.
	                errors.append(f"Chunk {chunk_num}/{total_chunks} timed out after {chunk_timeout}s. Try adding rules without enhancement (set enhance=false) or add fewer rules at once.")
	            except Exception as exc:
	                errors.append(f"Chunk {chunk_num}/{total_chunks} error: {exc}")

	    summary = []
	    if added:
	        summary.append(f"✅ Added {len(added)}/{total_rules} rule(s):\n" + "\n".join([f"- {r}" for r in added[:10]]))
	        if len(added) > 10:
	            summary.append(f"... and {len(added) - 10} more")
	    if enhanced:
	        summary.append("\n🤖 LLM Enhancement Applied:\n" + "\n".join(enhanced[:5]))
	        if len(enhanced) > 5:
	            summary.append(f"... and {len(enhanced) - 5} more enhancements")

	    if errors:
	        summary.append("\n⚠️ Errors:\n" + "\n".join(errors))

	    return "\n\n".join(summary) if summary else "No rules were added."


	def delete_admin_rule(tenant_id: str, role: str, rule: str) -> str:
	    """
	    Delete one admin rule, identified by its text or by its 1-based number.

	    When ``rule`` consists only of digits, the current rules are fetched
	    and the number is translated into the rule text at that position.
	    Returns a user-facing status string.
	    """
	    if not (tenant_id and tenant_id.strip()):
	        return "❗ Tenant ID is required."
	    if not (rule and rule.strip()):
	        return "❗ Provide the exact rule text to delete."

	    if not can_manage_rules(role):
	        return "❌ Access Denied: You need Admin or Owner role to delete rules."

	    tenant_id = tenant_id.strip()
	    rule = rule.strip()

	    # If user entered just a number, try to find the rule by index
	    if rule.isdigit():
	        try:
	            lookup_headers = {
	                "x-tenant-id": tenant_id,
	                "x-user-role": role if role else DEFAULT_ROLE,
	            }
	            listing = requests.get(
	                f"{BACKEND_BASE_URL}/admin/rules",
	                headers=lookup_headers,
	                timeout=15,
	            )
	            # A failed listing is not an error here: the digits are then
	            # used as the literal rule text below.
	            if listing.status_code == 200:
	                current_rules = listing.json().get("rules", [])
	                position = int(rule)
	                if not 1 <= position <= len(current_rules):
	                    return f"❌ Invalid rule number. Please enter a number between 1 and {len(current_rules)}, or enter the full rule text."
	                rule = current_rules[position - 1]
	        except Exception as e:
	            return f"❌ Error fetching rules: {e}"

	    try:
	        delete_headers = {
	            "x-tenant-id": tenant_id,
	            "x-user-role": role if role else DEFAULT_ROLE,
	        }
	        # URL encode the rule text to handle special characters
	        from urllib.parse import quote
	        rule_in_path = quote(rule, safe='')
	        resp = requests.delete(
	            f"{BACKEND_BASE_URL}/admin/rules/{rule_in_path}",
	            headers=delete_headers,
	            timeout=15,
	        )
	        status_code = resp.status_code
	        if status_code == 404:
	            return f"❌ Rule not found: '{rule}'. Please check the rules table and enter the exact rule text (or rule number)."
	        if status_code != 200:
	            return f"❌ Error {resp.status_code}: {resp.text}"
	        return f"🗑️ Deleted rule: {rule}"
	    except requests.exceptions.ConnectionError:
	        return "❌ Could not reach backend. Ensure the FastAPI server is running."
	    except requests.exceptions.Timeout:
	        return "⏱️ Delete request timed out. Please try again."
	    except Exception as exc:
	        return f"❌ Unexpected error: {exc}"


	def add_rules_from_file(tenant_id: str, role: str, file_path, enhance: bool = True):
	    """
	    Extract rules from an uploaded file, add them, and refresh the rules list.

	    Args:
	        tenant_id: Tenant ID (required).
	        role: User role, passed to both the add and the refresh call.
	        file_path: Uploaded file, as accepted by extract_rules_from_file.
	        enhance: Forwarded to add_admin_rules.

	    Returns:
	        A (status, summary, rows) tuple: the outcome message, followed by
	        the summary and table rows from fetch_admin_rules (a fixed hint
	        and an empty table when validation fails before any request).
	    """
	    if not tenant_id or not tenant_id.strip():
	        return "❗ Tenant ID is required.", "👉 Click Refresh Rules to see existing entries.", []

	    if file_path is None:
	        return "❗ Please select a file to upload.", "👉 Click Refresh Rules to see existing entries.", []

	    # Extract text from file
	    extracted_text = extract_rules_from_file(file_path)

	    if extracted_text.startswith("❌"):
	        # Error occurred during extraction; still refresh the table.
	        # fetch_admin_rules requires the role as its second argument.
	        summary, rows = fetch_admin_rules(tenant_id, role)
	        return extracted_text, summary, rows

	    if not extracted_text or not extracted_text.strip():
	        summary, rows = fetch_admin_rules(tenant_id, role)
	        return "❗ No text could be extracted from the file.", summary, rows

	    # Add rules from extracted text
	    status = add_admin_rules(tenant_id, role, extracted_text, enhance=enhance)
	    summary, rows = fetch_admin_rules(tenant_id, role)
	    return status, summary, rows


	def add_rules_and_refresh(tenant_id: str, role: str, rules_text: str, enhance: bool = True):
	    """Add the given rules, then return (status, summary, rows) with the refreshed rules list."""
	    outcome = add_admin_rules(tenant_id, role, rules_text, enhance=enhance)
	    # The refresh runs after the add so the table includes the new rules.
	    refreshed_summary, refreshed_rows = fetch_admin_rules(tenant_id, role)
	    return outcome, refreshed_summary, refreshed_rows


	def delete_rule_and_refresh(tenant_id: str, role: str, rule: str):
	    """Delete the given rule, then return (status, summary, rows) with the refreshed rules list."""
	    outcome = delete_admin_rule(tenant_id, role, rule)
	    # The refresh runs after the delete so the table no longer lists the rule.
	    refreshed_summary, refreshed_rows = fetch_admin_rules(tenant_id, role)
	    return outcome, refreshed_summary, refreshed_rows


	# Bar colours keyed by backend tool name; tools not listed use the grey fallback.
	_ANALYTICS_TOOL_COLORS = {
	    "rag": "#3b82f6",
	    "rag.search": "#2563eb",
	    "rag.ingest": "#1d4ed8",
	    "rag.list": "#1e40af",
	    "web.search": "#06b6d4",
	    "admin": "#a855f7",
	    "llm": "#10b981",
	}
	_ANALYTICS_FALLBACK_COLOR = "#6b7280"


	def _analytics_number(value, default=0):
	    """Return ``value`` when it is an int/float, otherwise ``default`` (e.g. for JSON null)."""
	    return value if isinstance(value, (int, float)) else default


	def _analytics_dict(value):
	    """Return ``value`` when it is a dict, otherwise a fresh empty dict."""
	    return value if isinstance(value, dict) else {}


	def _analytics_fetch_json(endpoint, headers):
	    """GET ``/analytics/<endpoint>`` and return ``(payload_dict, error_text_or_None)``."""
	    try:
	        resp = requests.get(
	            f"{BACKEND_BASE_URL}/analytics/{endpoint}",
	            headers=headers,
	            timeout=30
	        )
	        if resp.status_code == 200:
	            return _analytics_dict(resp.json()), None
	        return {}, f"❌ Error fetching {endpoint}: {resp.status_code}"
	    except Exception as exc:
	        # Network failures and undecodable bodies both end up here.
	        return {}, f"❌ Error: {str(exc)}"


	def _analytics_bar_layout(title, x_title, y_title, height):
	    """Return the ``update_layout`` keyword arguments shared by the analytics bar charts."""
	    return dict(
	        title={
	            "text": title,
	            "x": 0.5,
	            "xanchor": "center",
	            "font": {"size": 16, "color": "#1f2937"}
	        },
	        xaxis_title=x_title,
	        yaxis_title=y_title,
	        height=height,
	        showlegend=False,
	        margin=dict(l=50, r=20, t=60, b=50),
	        plot_bgcolor="rgba(0,0,0,0)",
	        paper_bgcolor="rgba(0,0,0,0)",
	        font=dict(color="#374151", size=12),
	        xaxis=dict(gridcolor="rgba(0,0,0,0.1)"),
	        yaxis=dict(gridcolor="rgba(0,0,0,0.1)")
	    )


	def _analytics_usage_chart(tool_usage):
	    """Build the per-tool call-count bar chart; return None if it cannot be built."""
	    try:
	        labels, counts, colors = [], [], []
	        for tool_name, stats in tool_usage.items():
	            labels.append(tool_name.replace(".", " ").title())
	            counts.append(_analytics_number(_analytics_dict(stats).get("count")))
	            colors.append(_ANALYTICS_TOOL_COLORS.get(tool_name, _ANALYTICS_FALLBACK_COLOR))
	        if not labels:
	            return None
	        fig = go.Figure()
	        fig.add_trace(go.Bar(
	            x=labels,
	            y=counts,
	            name="Usage Count",
	            marker_color=colors,
	            text=counts,
	            textposition='outside',
	            hovertemplate='<b>%{x}</b><br>Count: %{y}<br><extra></extra>'
	        ))
	        fig.update_layout(**_analytics_bar_layout("Tool Usage Count", "Tool", "Count", 380))
	        return fig
	    except Exception:
	        # Charts are optional decoration; the text summary must still be returned.
	        return None


	def _analytics_latency_chart(tool_usage):
	    """Build the average-latency bar chart for tools with a positive latency; None otherwise."""
	    try:
	        labels, latencies, colors = [], [], []
	        for tool_name, stats in tool_usage.items():
	            avg_latency = _analytics_number(_analytics_dict(stats).get("avg_latency_ms"))
	            if avg_latency > 0:
	                labels.append(tool_name.replace(".", " ").title())
	                latencies.append(round(avg_latency, 2))
	                colors.append(_ANALYTICS_TOOL_COLORS.get(tool_name, _ANALYTICS_FALLBACK_COLOR))
	        if not labels:
	            return None
	        fig = go.Figure()
	        fig.add_trace(go.Bar(
	            x=labels,
	            y=latencies,
	            name="Avg Latency (ms)",
	            marker_color=colors,
	            text=[f"{value}ms" for value in latencies],
	            textposition='outside',
	            hovertemplate='<b>%{x}</b><br>Avg Latency: %{y}ms<extra></extra>'
	        ))
	        fig.update_layout(**_analytics_bar_layout("Average Tool Latency", "Tool", "Latency (ms)", 380))
	        return fig
	    except Exception:
	        return None


	def _analytics_rag_chart(rag_quality):
	    """Build the RAG quality bar chart (scores scaled by 100); return None on failure."""
	    try:
	        metrics = ["Avg Hits", "Avg Score", "Avg Top Score"]
	        values = [
	            _analytics_number(rag_quality.get("avg_hits_per_search")),
	            _analytics_number(rag_quality.get("avg_score")) * 100,  # Convert to percentage
	            _analytics_number(rag_quality.get("avg_top_score")) * 100
	        ]
	        fig = go.Figure(data=[go.Bar(
	            x=metrics,
	            y=values,
	            marker_color=["#3b82f6", "#10b981", "#f59e0b"],
	            text=[f"{v:.2f}" for v in values],
	            textposition='outside',
	            hovertemplate='<b>%{x}</b><br>Value: %{y:.2f}<extra></extra>'
	        )])
	        fig.update_layout(**_analytics_bar_layout("RAG Quality Metrics", "Metric", "Value", 350))
	        return fig
	    except Exception:
	        return None


	def fetch_admin_analytics(tenant_id: str, role: str):
	    """Fetch analytics data and return formatted results with visualizations.

	    Queries the backend ``/analytics/overview``, ``/analytics/tool-usage``,
	    ``/analytics/redflags`` and ``/analytics/activity`` endpoints. Values in
	    the overview payload take precedence; the other three payloads are only
	    used as fallbacks for keys the overview does not contain.

	    Args:
	        tenant_id: Tenant identifier, sent as the ``x-tenant-id`` header.
	        role: Role sent as ``x-user-role``; ``DEFAULT_ROLE`` is used when empty.

	    Returns:
	        A 6-tuple ``(summary_markdown, tool_usage, tool_chart, latency_chart,
	        rag_chart, error_msg)``. Charts are ``None`` when Plotly is missing,
	        there is no data, or building them fails. ``error_msg`` is ``None``
	        unless the overview request failed. With a blank tenant ID the
	        result is ``(message, {}, None, None, None, None)``.
	    """
	    if not tenant_id or not tenant_id.strip():
	        error_msg = "❗ Tenant ID is required to view analytics."
	        return error_msg, {}, None, None, None, None

	    # All roles can view analytics (matching backend permissions)
	    # No access check needed here

	    headers = {
	        "x-tenant-id": tenant_id.strip(),
	        "x-user-role": role if role else DEFAULT_ROLE
	    }

	    # Only an overview failure is surfaced to the user.
	    overview_data, error_msg = _analytics_fetch_json("overview", headers)

	    # The remaining endpoints are best-effort fallbacks: failures are logged
	    # to stderr instead of being silently discarded.
	    fallback = {}
	    for endpoint in ("tool-usage", "redflags", "activity"):
	        payload, problem = _analytics_fetch_json(endpoint, headers)
	        if problem:
	            print(f"⚠️ WARNING: analytics endpoint '{endpoint}' failed: {problem}", file=sys.stderr)
	        fallback[endpoint] = payload

	    # Extract data for visualizations
	    overview = _analytics_dict(overview_data.get("overview"))
	    tool_usage = _analytics_dict(
	        overview.get("tool_usage", fallback["tool-usage"].get("tool_usage", {}))
	    )
	    rag_quality = _analytics_dict(overview.get("rag_quality"))
	    activity = _analytics_dict(fallback["activity"].get("activity"))

	    tool_chart = None
	    latency_chart = None
	    rag_chart = None
	    if PLOTLY_AVAILABLE:
	        if tool_usage:
	            tool_chart = _analytics_usage_chart(tool_usage)
	            latency_chart = _analytics_latency_chart(tool_usage)
	        if rag_quality:
	            rag_chart = _analytics_rag_chart(rag_quality)

	    # Format summary text
	    total_queries = overview.get("total_queries", activity.get("total_queries", 0))
	    active_users = overview.get("active_users", activity.get("active_users", 0))
	    redflag_count = overview.get("redflag_count", fallback["redflags"].get("count", 0))
	    last_query = overview.get("last_query", activity.get("last_query"))
	    last_query_display = last_query if last_query else "N/A"

	    # Null-safe per-tool view so one malformed entry cannot break the totals.
	    per_tool = {name: _analytics_dict(stats) for name, stats in tool_usage.items()}

	    # Calculate total tool usage
	    total_tool_calls = sum(_analytics_number(stats.get("count")) for stats in per_tool.values())
	    total_success = sum(_analytics_number(stats.get("success_count")) for stats in per_tool.values())
	    total_errors = sum(_analytics_number(stats.get("error_count")) for stats in per_tool.values())

	    success_rate = (total_success / total_tool_calls * 100) if total_tool_calls > 0 else 0

	    rag_total_searches = rag_quality.get("total_searches", 0)
	    rag_avg_hits = _analytics_number(rag_quality.get("avg_hits_per_search"))
	    rag_avg_score = _analytics_number(rag_quality.get("avg_score"))
	    rag_avg_top = _analytics_number(rag_quality.get("avg_top_score"))
	    rag_avg_latency = _analytics_number(rag_quality.get("avg_latency_ms"))

	    summary_text = f"""
	#### 📈 Activity Metrics
	- Total Queries: `{total_queries}`
	- Active Users: `{active_users}`
	- Red Flags: `{redflag_count}`
	- Last Query: `{last_query_display}`

	---

	#### 🔧 Tool Usage Overview
	- Total Tool Calls: `{total_tool_calls}`
	- Successful Calls: `{total_success}` ✅
	- Failed Calls: `{total_errors}` {'⚠️' if total_errors > 0 else ''}
	- Success Rate: `{success_rate:.1f}%` {'🟢' if success_rate >= 95 else '🟡' if success_rate >= 80 else '🔴'}

	---

	#### 🔍 RAG Quality Metrics
	- Total Searches: `{rag_total_searches}`
	- Avg Hits per Search: `{rag_avg_hits:.2f}`
	- Avg Relevance Score: `{rag_avg_score:.3f}`
	- Avg Top Score: `{rag_avg_top:.3f}`
	- Avg Search Latency: `{rag_avg_latency:.2f}ms`

	---

	#### 📊 Tool Breakdown
	"""

	    # Add individual tool stats to summary, busiest tool first
	    ranked_tools = sorted(
	        per_tool.items(),
	        key=lambda item: _analytics_number(item[1].get("count")),
	        reverse=True
	    )
	    breakdown_lines = []
	    for tool_name, stats in ranked_tools:
	        tool_display = tool_name.replace(".", " ").title()
	        count = _analytics_number(stats.get("count"))
	        latency = _analytics_number(stats.get("avg_latency_ms"))
	        success = _analytics_number(stats.get("success_count"))
	        errors = _analytics_number(stats.get("error_count"))
	        status_icon = "✅" if errors == 0 else "⚠️"
	        breakdown_lines.append(
	            f"- {tool_display} {status_icon}<br> └ {count} calls • {latency:.1f}ms avg • {success} success • {errors} errors\n"
	        )
	    summary_text += "".join(breakdown_lines)

	    return summary_text, tool_usage, tool_chart, latency_chart, rag_chart, error_msg


	def _kb_guess_document_type(text):
	    """Classify document text as "link", "faq", "pdf" or "text" from simple substring cues."""
	    lowered = text.lower()
	    if "http://" in lowered or "https://" in lowered or "www." in lowered:
	        return "link"
	    if any(marker in lowered for marker in ("q:", "question:", "faq", "frequently asked")):
	        return "faq"
	    if ".pdf" in lowered or "pdf document" in lowered:
	        return "pdf"
	    return "text"


	def _kb_type_pie_chart(type_counts):
	    """Build the document-type donut chart; return None if it cannot be built."""
	    try:
	        labels = list(type_counts.keys())
	        values = list(type_counts.values())
	        colors = {
	            "text": "#3b82f6",  # blue
	            "pdf": "#ef4444",  # red
	            "faq": "#a855f7",  # purple
	            "link": "#06b6d4"  # cyan
	        }
	        chart_colors = [colors.get(label, "#6b7280") for label in labels]

	        fig = go.Figure(data=[go.Pie(
	            labels=labels,
	            values=values,
	            hole=0.4,
	            marker=dict(colors=chart_colors),
	            textinfo='label+percent+value',
	            textfont=dict(size=12),
	            hovertemplate='<b>%{label}</b><br>Count: %{value}<br>Percentage: %{percent}<extra></extra>'
	        )])
	        fig.update_layout(
	            title={
	                "text": "Document Type Distribution",
	                "x": 0.5,
	                "xanchor": "center",
	                "font": {"size": 16}
	            },
	            height=400,
	            showlegend=True,
	            margin=dict(l=20, r=20, t=50, b=20)
	        )
	        return fig
	    except Exception:
	        # The chart is optional; the listing itself must still be returned.
	        return None


	def list_documents(tenant_id: str, role: str, limit: int = 1000, offset: int = 0):
	    """
	    List all documents for a tenant.

	    Sends ``GET /rag/list`` with the tenant, ``limit`` and ``offset`` and
	    formats the returned documents as rows of
	    ``[id, type, preview, length, created_date]``.

	    Returns a tuple of (status_message, documents_list, total_count, stats_dict, chart_fig).
	    ``stats_dict`` holds ``total`` (as reported by the backend), ``types``
	    (count per detected type), ``total_chars`` and ``avg_length``; the latter
	    two are computed over the documents actually returned in this response.
	    On any failure the tuple is ``(error_message, [], 0, {}, None)``.
	    """
	    if not tenant_id or not tenant_id.strip():
	        return "❗ Tenant ID is required.", [], 0, {}, None

	    tenant_id = tenant_id.strip()
	    try:
	        headers = {
	            "x-tenant-id": tenant_id,
	            "x-user-role": role if role else DEFAULT_ROLE
	        }
	        response = requests.get(
	            f"{BACKEND_BASE_URL}/rag/list",
	            params={"tenant_id": tenant_id, "limit": limit, "offset": offset},
	            headers=headers,
	            timeout=30
	        )

	        if response.status_code != 200:
	            error_msg = f"❌ Error {response.status_code}: {response.text}"
	            return error_msg, [], 0, {}, None

	        data = response.json()
	        documents = data.get("documents") or []
	        total = data.get("total", 0)

	        # Format documents for display and collect stats
	        formatted_docs = []
	        type_counts = Counter()
	        total_length = 0

	        for doc in documents:
	            doc_id = doc.get("id", "N/A")
	            # A JSON null must not abort the whole listing.
	            text = doc.get("text") or ""
	            created_at = doc.get("created_at") or ""
	            preview = text[:200] + "..." if len(text) > 200 else text

	            doc_type = _kb_guess_document_type(text)
	            type_counts[doc_type] += 1
	            total_length += len(text)

	            # Format as list for Gradio Dataframe (list of lists)
	            formatted_docs.append([
	                doc_id,
	                doc_type,
	                preview,
	                len(text),
	                str(created_at)[:10] if created_at else "N/A"
	            ])

	        # Create statistics dictionary
	        stats = {
	            "total": total,
	            "types": dict(type_counts),
	            # total_length covers only this page of results, so average over
	            # the page size rather than the backend-wide total.
	            "avg_length": total_length // len(documents) if documents else 0,
	            "total_chars": total_length
	        }

	        # Create pie chart for document types
	        chart_fig = None
	        if type_counts and PLOTLY_AVAILABLE:
	            chart_fig = _kb_type_pie_chart(type_counts)

	        status = f"✅ Found {total} document(s)"
	        return status, formatted_docs, total, stats, chart_fig
	    except requests.exceptions.ConnectionError:
	        return "❌ Could not reach backend. Ensure the FastAPI server is running.", [], 0, {}, None
	    except requests.exceptions.Timeout:
	        return "⏱️ Request timed out. Please try again.", [], 0, {}, None
	    except Exception as exc:
	        return f"❌ Unexpected error: {exc}", [], 0, {}, None


	def delete_document(tenant_id: str, role: str, document_id: int):
	    """Delete a specific document by ID.

	    Validation order: tenant ID, then document ID, then role (via
	    ``can_delete_documents``). Only after all three pass is
	    ``DELETE /rag/delete/<id>`` sent to the backend.

	    Args:
	        tenant_id: Tenant identifier; required and stripped before use.
	        role: Caller role; must satisfy ``can_delete_documents``.
	        document_id: Positive document ID. Integral floats and numeric
	            strings are accepted and normalised to ``int``; anything else
	            is rejected as invalid.

	    Returns:
	        A human-readable status string; this function does not raise for
	        validation or request failures.
	    """
	    if not tenant_id or not tenant_id.strip():
	        return "❗ Tenant ID is required."

	    # Normalise the ID to a positive int so that non-numeric input is
	    # reported as invalid (instead of raising on the comparison) and the
	    # request URL never contains a value such as "5.0".
	    invalid_id_msg = "❗ Invalid document ID."
	    if isinstance(document_id, bool):
	        return invalid_id_msg
	    if isinstance(document_id, float) and not document_id.is_integer():
	        return invalid_id_msg
	    try:
	        document_id = int(document_id)
	    except (TypeError, ValueError, OverflowError):
	        return invalid_id_msg
	    if document_id <= 0:
	        return invalid_id_msg

	    if not can_delete_documents(role):
	        return "❌ Access Denied: You need Admin or Owner role to delete documents."

	    tenant_id = tenant_id.strip()
	    try:
	        headers = {
	            "x-tenant-id": tenant_id,
	            "x-user-role": role if role else DEFAULT_ROLE
	        }
	        response = requests.delete(
	            f"{BACKEND_BASE_URL}/rag/delete/{document_id}",
	            params={"tenant_id": tenant_id},
	            headers=headers,
	            timeout=30
	        )

	        if response.status_code == 200:
	            return f"✅ Document {document_id} deleted successfully."
	        elif response.status_code == 404:
	            return f"❌ Document {document_id} not found or access denied."
	        else:
	            # Prefer the structured error body when the backend sent JSON.
	            error_data = response.json() if response.headers.get("content-type", "").startswith("application/json") else {}
	            error_msg = error_data.get("detail", error_data.get("error", response.text))
	            return f"❌ Error {response.status_code}: {error_msg}"
	    except requests.exceptions.ConnectionError:
	        return "❌ Could not reach backend. Ensure the FastAPI server is running."
	    except requests.exceptions.Timeout:
	        return "⏱️ Request timed out. Please try again."
	    except Exception as exc:
	        return f"❌ Unexpected error: {exc}"


	def delete_all_documents(tenant_id: str, role: str):
	    """Remove every document belonging to a tenant.

	    Requires a non-blank tenant ID and a role accepted by
	    ``can_delete_documents``; then issues ``DELETE /rag/delete-all`` with a
	    60-second timeout. Always returns a status string describing the
	    outcome (success with the deleted count, or an error message).
	    """
	    if not (tenant_id and tenant_id.strip()):
	        return "❗ Tenant ID is required."

	    tenant_id = tenant_id.strip()

	    role_allowed = can_delete_documents(role)
	    if not role_allowed:
	        return "❌ Access Denied: You need Admin or Owner role to delete documents."

	    try:
	        request_headers = {
	            "x-tenant-id": tenant_id,
	            "x-user-role": role or DEFAULT_ROLE
	        }
	        reply = requests.delete(
	            f"{BACKEND_BASE_URL}/rag/delete-all",
	            params={"tenant_id": tenant_id},
	            headers=request_headers,
	            timeout=60
	        )

	        if reply.status_code != 200:
	            # Use the structured body only when the backend declared JSON.
	            if reply.headers.get("content-type", "").startswith("application/json"):
	                failure_body = reply.json()
	            else:
	                failure_body = {}
	            failure_detail = failure_body.get("detail", failure_body.get("error", reply.text))
	            return f"❌ Error {reply.status_code}: {failure_detail}"

	        removed = reply.json().get("deleted_count", 0)
	        return f"✅ Deleted {removed} document(s) successfully."
	    except requests.exceptions.ConnectionError:
	        return "❌ Could not reach backend. Ensure the FastAPI server is running."
	    except requests.exceptions.Timeout:
	        return "⏱️ Request timed out. Please try again."
	    except Exception as exc:
	        return f"❌ Unexpected error: {exc}"


	def search_knowledge_base(tenant_id: str, role: str, query: str):
	    """Search the knowledge base using RAG semantic search with cross-encoder re-ranking.

	    Posts ``{"tenant_id", "query", "threshold": 0.3}`` to ``/rag/search`` and
	    formats each hit as ``{"Rank", "Text", "Relevance"}``. ``Text`` is cut
	    to 300 characters (plus ``...``). ``Relevance`` is taken from the hit's
	    ``relevance`` field, falling back to ``score``, and shown with three
	    decimals; it is ``"N/A"`` only when no numeric score is present.

	    Returns:
	        ``(status_message, results)`` where ``results`` is a list of dicts;
	        on validation or request failure ``results`` is ``[]``.
	    """
	    if not tenant_id or not tenant_id.strip():
	        return "❗ Tenant ID is required.", []

	    if not query or not query.strip():
	        return "❗ Please enter a search query.", []

	    tenant_id = tenant_id.strip()
	    query = query.strip()

	    try:
	        headers = {
	            "x-tenant-id": tenant_id,
	            "x-user-role": role if role else DEFAULT_ROLE,
	            "Content-Type": "application/json"
	        }
	        response = requests.post(
	            f"{BACKEND_BASE_URL}/rag/search",
	            json={"tenant_id": tenant_id, "query": query, "threshold": 0.3},
	            headers=headers,
	            timeout=30
	        )

	        if response.status_code != 200:
	            error_msg = f"❌ Error {response.status_code}: {response.text}"
	            return error_msg, []

	        data = response.json()
	        results = data.get("results", [])

	        formatted_results = []
	        for idx, result in enumerate(results, 1):
	            # A JSON null text must not discard every other hit.
	            text = result.get("text") or ""
	            relevance = result.get("relevance")
	            if relevance is None:
	                relevance = result.get("score")
	            # Test for a number rather than truthiness so that a genuine
	            # score of 0 is displayed instead of being reported as missing.
	            if isinstance(relevance, (int, float)):
	                relevance_display = f"{relevance:.3f}"
	            else:
	                relevance_display = "N/A"
	            formatted_results.append({
	                "Rank": idx,
	                "Text": text[:300] + "..." if len(text) > 300 else text,
	                "Relevance": relevance_display
	            })

	        status = f"✅ Found {len(results)} result(s) for '{query}' (re-ranked with cross-encoder)"
	        return status, formatted_results
	    except requests.exceptions.ConnectionError:
	        return "❌ Could not reach backend. Ensure the FastAPI server is running.", []
	    except requests.exceptions.Timeout:
	        return "⏱️ Request timed out. Please try again.", []
	    except Exception as exc:
	        return f"❌ Unexpected error: {exc}", []


	# Create Gradio interface
	# Note: some Gradio versions (especially older ones) do not support the `theme` argument
	# on `Blocks`. To keep the Docker image compatible across environments, we rely on
	# custom CSS for styling instead of passing a `theme` kwarg here.
	with gr.Blocks(
	title="IntegraChat — MCP Autonomous Agent",
	css="""
	/* Global dark theme with simpler, basic colors */
	body, .gradio-container {
	font-family: 'Inter', system-ui, -apple-system, sans-serif;
	background: #020617;
	color: #e5e7eb;
	}

	/* Remove default card backgrounds so our custom sections stand out */
	.gradio-container .block {
	background: transparent;
	}

	/* Header styling */
	.header-section {
	background: #020617;
	padding: 28px 24px;
	border-radius: 18px;
	margin-bottom: 24px;
	box-shadow: 0 18px 60px rgba(15, 23, 42, 0.9);
	border: 1px solid rgba(148, 163, 184, 0.25);
	}

	.header-section h1 {
	color: #e5e7eb;
	font-size: 2.4rem;
	font-weight: 700;
	margin-bottom: 8px;
	letter-spacing: 0.02em;
	}

	.header-section p {
	color: #cbd5f5;
	font-size: 0.98rem;
	max-width: 720px;
	}

	/* Input fields strip */
	.input-container {
	background: #020617;
	padding: 18px 20px 22px 20px;
	border-radius: 14px;
	border: 1px solid rgba(148, 163, 184, 0.35);
	backdrop-filter: blur(18px);
	box-shadow: 0 12px 40px rgba(15, 23, 42, 0.9);
	margin-bottom: 18px;
	}

	/* Tenant / role cards */
	.tenant-card,
	.role-card {
	background: #020617;
	border-radius: 14px;
	padding: 16px 16px 14px 16px;
	border: 1px solid rgba(148, 163, 184, 0.6);
	box-shadow: 0 8px 26px rgba(15, 23, 42, 0.9);
	display: flex;
	flex-direction: column;
	transition: border-color 0.15s ease, box-shadow 0.15s ease, transform 0.15s ease;
	}

	# .tenant-card:hover,
	# .role-card:hover {
	# border-color: #38bdf8;
	# box-shadow: 0 12px 36px rgba(56, 189, 248, 0.35);
	# transform: translateY(-1px);
	# }

	.field-label-pill {
	display: inline-flex;
	align-items: center;
	gap: 8px;
	padding: 6px 12px;
	border-radius: 999px;
	background: #0f172a;
	color: #e5e7eb;
	font-size: 0.8rem;
	font-weight: 600;
	letter-spacing: 0.08em;
	text-transform: uppercase;
	border: 1px solid #38bdf8;
	}

	.field-label-pill span.icon {
	font-size: 1rem;
	}

	.field-label-subtitle {
	margin-top: 4px;
	margin-bottom: 4px;
	color: #9ca3af;
	font-size: 0.8rem;
	}

	/* Reduce spacing for dropdown in role card */
	.role-card .field-label-subtitle {
	margin-bottom: 6px;
	}

	.role-card select,
	.role-card .gradio-dropdown {
	margin-top: 2px;
	}

	/* Left/right columns in Chat tab */
	.chat-row > .col:nth-child(1) {
	min-width: 0;
	}

	/* Stat cards */
	.stat-card {
	background: #020617;
	padding: 22px;
	border-radius: 16px;
	color: white;
	text-align: left;
	box-shadow: 0 12px 32px rgba(15, 23, 42, 0.9);
	transition: transform 0.2s ease, box-shadow 0.2s ease, border-color 0.2s ease;
	border: 1px solid rgba(248, 250, 252, 0.25);
	}
	.stat-card:hover {
	transform: translateY(-3px) scale(1.01);
	box-shadow: 0 16px 40px rgba(15, 23, 42, 0.95);
	border-color: #38bdf8;
	}
	.stat-card h3 {
	margin: 0 0 6px 0;
	font-size: 0.78rem;
	opacity: 0.9;
	font-weight: 600;
	letter-spacing: 0.16em;
	text-transform: uppercase;
	}
	.stat-card strong {
	font-size: 1.8rem;
	font-weight: 700;
	display: block;
	margin-top: 8px;
	}

	/* Summary / debug panel */
	.summary-box {
	background: #020617;
	padding: 24px;
	border-radius: 18px;
	border: 1px solid rgba(148, 163, 184, 0.7);
	max-height: 520px;
	overflow-y: auto;
	box-shadow: 0 18px 48px rgba(15, 23, 42, 0.95);
	color: #e5e7eb;
	backdrop-filter: blur(18px);
	transition: border-color 0.15s ease, box-shadow 0.15s ease, transform 0.15s ease;
	}
	.summary-box::-webkit-scrollbar {
	width: 8px;
	}
	.summary-box::-webkit-scrollbar-track {
	background: rgba(15, 23, 42, 1);
	border-radius: 999px;
	}
	.summary-box::-webkit-scrollbar-thumb {
	background: rgba(148, 163, 184, 0.7);
	border-radius: 999px;
	}

	.summary-box:hover {
	border-color: #38bdf8;
	box-shadow: 0 22px 60px rgba(15, 23, 42, 1);
	transform: translateY(-1px);
	}
	.summary-box h3, .summary-box h4 {
	margin-top: 0;
	margin-bottom: 12px;
	color: #f9fafb;
	font-weight: 600;
	}
	.summary-box p,
	.summary-box li {
	color: #e5e7eb;
	margin: 8px 0;
	line-height: 1.7;
	}
	.summary-box code {
	background-color: rgba(15, 23, 42, 0.9);
	color: #22c55e;
	padding: 3px 7px;
	border-radius: 6px;
	font-family: 'Fira Code', 'Courier New', monospace;
	font-size: 0.78rem;
	border: 1px solid rgba(148, 163, 184, 0.45);
	}

	/* Chart titles / section headings */
	.chart-title {
	margin-bottom: 8px;
	margin-top: 0;
	font-weight: 600;
	color: #e5e7eb;
	text-align: center;
	font-size: 1rem;
	}

	/* Primary buttons */
	button.primary {
	background: #0ea5e9;
	border: none;
	box-shadow: 0 8px 26px rgba(15, 23, 42, 0.9);
	transition: transform 0.15s ease, box-shadow 0.15s ease, filter 0.15s ease;
	border-radius: 999px;
	font-weight: 600;
	}
	button.primary:hover {
	transform: translateY(-1px);
	filter: brightness(1.08);
	box-shadow: 0 12px 32px rgba(15, 23, 42, 1);
	}

	/* Tabs */
	.tab-nav {
	border-bottom: 1px solid rgba(148, 163, 184, 0.35);
	}

	/* Role badges */
	.role-badge {
	display: inline-block;
	padding: 5px 11px;
	border-radius: 999px;
	font-size: 0.7rem;
	font-weight: 600;
	text-transform: uppercase;
	letter-spacing: 0.1em;
	}
	.role-viewer {
	background: linear-gradient(135deg, #64748b 0%, #475569 100%);
	color: white;
	}
	.role-editor {
	background: linear-gradient(135deg, #06b6d4 0%, #0891b2 100%);
	color: white;
	}
	.role-admin {
	background: linear-gradient(135deg, #8b5cf6 0%, #7c3aed 100%);
	color: white;
	}
	.role-owner {
	background: linear-gradient(135deg, #f59e0b 0%, #d97706 100%);
	color: white;
	}

	/* Inputs */
	input[type="text"], textarea, select {
	border-radius: 10px !important;
	border: 1px solid rgba(148, 163, 184, 0.5) !important;
	background: rgba(15, 23, 42, 0.92) !important;
	color: #e5e7eb !important;
	transition: border-color 0.2s ease, box-shadow 0.2s ease, background 0.2s ease !important;
	}
	input[type="text"]::placeholder,
	textarea::placeholder {
	color: rgba(148, 163, 184, 0.65) !important;
	}
	input[type="text"]:focus, textarea:focus, select:focus {
	border-color: #06b6d4 !important;
	box-shadow: 0 0 0 1px rgba(6, 182, 212, 0.65) !important;
	background: rgba(15, 23, 42, 1) !important;
	}

	/* Reduce spacing in dropdown menu items */
	.gradio-dropdown ul,
	.gradio-dropdown .dropdown-menu,
	select option {
	padding: 4px 8px !important;
	margin: 0 !important;
	}

	/* Reduce gap between dropdown and label */
	.role-card .gradio-dropdown {
	margin-top: 4px !important;
	}

	/* Generic section card */
	.section-card {
	background: #020617;
	padding: 22px;
	border-radius: 16px;
	border: 1px solid rgba(148, 163, 184, 0.4);
	margin-bottom: 18px;
	backdrop-filter: blur(14px);
	box-shadow: 0 14px 40px rgba(15, 23, 42, 0.95);
	transition: border-color 0.15s ease, box-shadow 0.15s ease, transform 0.15s ease;
	}

	.section-card:hover {
	border-color: #38bdf8;
	box-shadow: 0 18px 52px rgba(15, 23, 42, 1);
	transform: translateY(-1px);
	}

	/* Chatbot + message bubbles */
	.chatbot {
	border-radius: 18px !important;
	border: 1px solid rgba(148, 163, 184, 0.7) !important;
	background: #020617 !important;
	box-shadow: 0 18px 60px rgba(15, 23, 42, 1);
	}

	/* Keep Gradio's default layout, only adjust colors lightly */
	.chatbot .message.user {
	background: #0ea5e9;
	color: #0b1020;
	}

	.chatbot .message.bot {
	background: #020617;
	border-color: rgba(148, 163, 184, 0.8);
	color: #e5e7eb;
	}

	.chatbot .message.error {
	background: rgba(239, 68, 68, 0.18);
	border-color: rgba(248, 113, 113, 0.9);
	}
	"""
	) as demo:
	with gr.Column(elem_classes=["header-section"]):
	gr.Markdown(
	"""
	# 🤖 IntegraChat — MCP Autonomous Agent

	Enterprise-grade AI with autonomous agents, secure multi-tenant RAG, real-time web search, and governance.
	"""
	)
	gr.Markdown(
	"""
	<div style="background: rgba(6, 182, 212, 0.1); padding: 16px; border-radius: 10px; border-left: 4px solid #06b6d4; margin-top: 16px;">
	<strong>🔐 Role-Based Access Control:</strong> Features are automatically shown/hidden based on your role:
	<ul style="margin: 8px 0 0 0; padding-left: 24px;">
	<li><strong>👤 Viewer:</strong> Chat only</li>
	<li><strong>✏️ Editor:</strong> Chat + Document Ingestion (no delete)</li>
	<li><strong>🛡️ Admin/Owner:</strong> Full access to all features</li>
	</ul>
	</div>
	"""
	)

	with gr.Row(elem_classes=["input-container"]):
	with gr.Column(scale=2, elem_classes=["tenant-card"]):
	gr.Markdown(
	"""
	<div class="field-label-pill">
	<span class="icon">🏢</span>
	<span>Tenant ID</span>
	</div>
	<div class="field-label-subtitle">
	Required for all operations. Use a unique ID per customer / environment.
	</div>
	"""
	)
	tenant_id_input = gr.Textbox(
	label="",
	placeholder="Enter your tenant ID (e.g., tenant123)",
	value="",
	interactive=True,
	scale=2,
	show_label=False,
	)
	with gr.Column(scale=1, elem_classes=["role-card"]):
	gr.Markdown(
	"""
	<div class="field-label-pill">
	<span class="icon">👤</span>
	<span>User Role</span>
	</div>
	<div class="field-label-subtitle">
	Select your role to automatically unlock the right capabilities.
	</div>
	"""
	)
	role_input = gr.Dropdown(
	label="",
	choices=VALID_ROLES,
	value=DEFAULT_ROLE,
	interactive=True,
	scale=1,
	show_label=False,
	)

	with gr.Tabs():
	with gr.Tab("Chat"):
	# Access denied for Editor role - Editor should only see Document Ingestion
	chat_access_denied = gr.Markdown(
	"""
	<div style="background: linear-gradient(135deg, rgba(239, 68, 68, 0.2) 0%, rgba(220, 38, 38, 0.2) 100%); padding: 40px; border-radius: 16px; border: 2px solid rgba(239, 68, 68, 0.4); text-align: center; margin: 20px 0;">
	<h2 style="color: #fca5a5; margin-bottom: 16px;">🔒 Access Denied</h2>
	<p style="color: #f1f5f9; font-size: 16px; margin-bottom: 12px;">
	<strong>Editor role can only access Document Ingestion.</strong>
	</p>
	<p style="color: #cbd5e1; font-size: 14px;">
	Please switch to Owner or Admin role to access Chat functionality, or go to the Document Ingestion tab.
	</p>
	</div>
	""",
	visible=False
	)

	chat_content = gr.Column(visible=True)

	with chat_content:
	# Two-column layout: chat on the left, guidance panel on the right
	with gr.Row(elem_classes=["chat-row"]):
	with gr.Column(scale=2, elem_classes=["section-card"]):
	chatbot = gr.Chatbot(
	label="Chat with Agent",
	height=500,
	show_label=True,
	container=True,
	elem_classes=["chatbot"]
	)

	with gr.Row():
	message_input = gr.Textbox(
	label="Message",
	placeholder="Type your message here...",
	scale=4,
	show_label=False,
	container=False
	)
	send_button = gr.Button("Send", variant="primary", scale=1)

	with gr.Column(scale=1, elem_classes=["summary-box"]):
	gr.Markdown(
	"""
	### 📝 Chat Instructions
	1. Enter your Tenant ID and Role above
	2. Ask a question or give a task to the agent
	3. The MCP agent will automatically select tools (RAG, Web, etc.)

	### ⚡ Features
	- ✨ Real-time character-by-character streaming responses
	- 🚀 Query caching for faster repeated queries
	- 🔍 Query expansion for ambiguous terms (Al→AI, ML→machine learning)
	- 🌐 Multi-query web search with parallel execution
	- 🧠 Multi-step planning & reasoning
	- 🔍 Automatic tool selection with latency prediction
	- 🧠 Context-aware routing (intelligent tool skipping)
	- 💾 Conversation memory
	- 📊 Reasoning visualization (see Debug tab)
	- ⚡ Per-tool latency estimates (RAG: 60-120ms, Web: 400-1800ms)
	- 📋 Schema-validated tool outputs
	- 🛡️ Enhanced error handling with actionable messages
	"""
	)

	# Reasoning trace viewer
	reasoning_trace_viewer = gr.Markdown(
	"💡 Tip: Use the Debug tab to view detailed reasoning traces for your messages.",
	visible=True
	)

	# Event handlers for chat tab with streaming
	def send_message(message, tenant_id, role, history):
	    """Relay streamed agent output to the chatbot and blank the message box.

	    Generator: for every history snapshot produced by ``chat_with_agent`` it
	    yields ``(snapshot, "")``. If iterating the stream raises, it yields one
	    final pair whose history is the incoming ``history`` (converted with
	    ``convert_history_to_tuples``) plus an assistant entry carrying the
	    error text.
	    """
	    cleared_input = ""  # second output: empties the message textbox
	    try:
	        stream = chat_with_agent(message, tenant_id, role, history)
	        for snapshot in stream:
	            yield snapshot, cleared_input
	    except Exception as exc:
	        # Fallback if streaming fails
	        failure_text = f"Streaming error: {str(exc)}"
	        fallback_history = append_to_history(
	            convert_history_to_tuples(history), "assistant", failure_text
	        )
	        yield fallback_history, cleared_input

	send_button.click(
	fn=send_message,
	inputs=[message_input, tenant_id_input, role_input, chatbot],
	outputs=[chatbot, message_input]
	)

	message_input.submit(
	fn=send_message,
	inputs=[message_input, tenant_id_input, role_input, chatbot],
	outputs=[chatbot, message_input]
	)

	# Function to update Chat tab visibility based on role (Editor sees access denied)
	def update_chat_visibility(role):
	    """Return visibility updates for the Chat tab based on the selected role.

	    Produces two ``gr.update`` objects, in order: the access-denied banner
	    (visible only when ``role`` is ``"editor"``) and the chat content
	    (visible for every other role).
	    """
	    editor_selected = role == "editor"
	    denied_banner = gr.update(visible=editor_selected)
	    chat_panel = gr.update(visible=not editor_selected)
	    return denied_banner, chat_panel

	role_input.change(
	fn=update_chat_visibility,
	inputs=[role_input],
	outputs=[chat_access_denied, chat_content]
	)

	with gr.Tab("🔍 Debug & Reasoning"):
	gr.Markdown(
	"""
	<div style="background: linear-gradient(135deg, rgba(139, 92, 246, 0.1) 0%, rgba(124, 58, 237, 0.1) 100%); padding: 20px; border-radius: 12px; border: 1px solid rgba(139, 92, 246, 0.2); margin-bottom: 20px;">
	### 🔍 Agent Reasoning Debugger
	View the complete reasoning path, tool invocations, and decision-making process for any message.

	Features:
	- 🧠 Step-by-step reasoning trace
	- ⚙️ Tool invocation timeline with schema-validated outputs
	- ⚡ Per-tool latency predictions (RAG: 60-120ms, Web: 400-1800ms, Admin: <20ms)
	- 🧠 Context-aware routing hints (skip web if RAG high, skip RAG if memory available)
	- 📊 Tool output schemas for easier debugging
	- 🎯 Final decision breakdown with estimated latency
	- 📊 Performance metrics
	</div>
	"""
	)

	debug_message = gr.Textbox(
	label="Message to Debug",
	placeholder="Enter the same message you sent in Chat to see its reasoning path...",
	lines=2
	)
	debug_button = gr.Button("🔍 Analyze Reasoning", variant="primary")
	debug_output = gr.Markdown("👉 Enter a message and click 'Analyze Reasoning' to see the agent's reasoning path.")

	def analyze_reasoning(message, tenant_id, role):
	    """Validate the debug inputs, then return the reasoning trace.

	    A blank message is reported first, then a blank tenant ID; when both are
	    present the result of ``get_reasoning_trace(tenant_id, role, message)``
	    is returned unchanged.
	    """
	    message_present = bool(message and message.strip())
	    if not message_present:
	        return "❗ Please enter a message to analyze."

	    tenant_present = bool(tenant_id and tenant_id.strip())
	    if not tenant_present:
	        return "❗ Please enter a Tenant ID."

	    trace = get_reasoning_trace(tenant_id, role, message)
	    return trace

	debug_button.click(
	fn=analyze_reasoning,
	inputs=[debug_message, tenant_id_input, role_input],
	outputs=[debug_output]
	)

	debug_message.submit(
	fn=analyze_reasoning,
	inputs=[debug_message, tenant_id_input, role_input],
	outputs=[debug_output]
	)

	with gr.Tab("📚 Document Ingestion"):
	gr.Markdown(
	"""
	<div style="background: linear-gradient(135deg, rgba(16, 185, 129, 0.1) 0%, rgba(5, 150, 105, 0.1) 100%); padding: 20px; border-radius: 12px; border: 1px solid rgba(16, 185, 129, 0.2); margin-bottom: 20px;">
	### 📚 Knowledge Base Ingestion
	Ingest documents so the MCP agent can reference tenant-private knowledge.

	📄 Supported Formats:
	- Raw text / URLs: Use the fields below
	- Files: PDF, DOCX, TXT, Markdown
	- Metadata: Optional JSON metadata for better organization

	🤖 AI-Generated Metadata (Automatic):
	- ✨ Title extraction from filename, content, or URL
	- 📝 Summary generation (2-3 sentences via LLM)
	- 🏷️ Tags extraction (5-8 relevant tags)
	- 📚 Topics identification (3-5 main themes)
	- 📅 Date detection (multiple formats)
	- ⭐ Quality score (0.0-1.0 based on structure and completeness)
	- 🔄 Intelligent fallback when LLM is unavailable

	⚠️ Note: Editor role and above can ingest. Admin/Owner can delete.
	</div>
	"""
	)

	ingestion_mode = gr.Radio(
	["Raw Text", "URL", "File Upload"],
	value="Raw Text",
	label="Select Ingestion Mode"
	)

	with gr.Row():
	doc_filename = gr.Textbox(label="Filename (optional)")
	doc_id = gr.Textbox(label="Document ID (optional)")

	document_url = gr.Textbox(
	label="Document URL (for URL ingestion)",
	placeholder="https://example.com/policy",
	visible=False
	)

	doc_content = gr.Textbox(
	label="Content / Notes",
	placeholder="Paste the document text here...",
	lines=8,
	visible=True
	)

	metadata_json = gr.Textbox(
	label="Additional Metadata (JSON)",
	placeholder='{"department": "HR", "tags": ["policy", "benefits"]}'
	)

	ingest_doc_button = gr.Button("Ingest Text / URL Document", variant="primary")

	document_status = gr.Markdown("")

	def handle_ingest_document(
	    tenant_id,
	    role,
	    mode,
	    content,
	    doc_url,
	    filename,
	    doc_id_value,
	    metadata
	):
	    """Ingest a raw-text or URL document and return the status message.

	    Logs the received role to stderr, substitutes ``DEFAULT_ROLE`` for a
	    missing or blank role, maps the UI mode to a source type ("Raw Text" ->
	    ``raw_text``, anything else -> ``url``) and forwards everything to
	    ``ingest_document``. When the result contains "✅", a tip pointing to
	    the Knowledge Base Library tab is appended.
	    """
	    # Debug: Log the role value received
	    print(f"🔍 DEBUG: handle_ingest_document received role='{role}' (type: {type(role)})", file=sys.stderr)

	    # Ensure role is not None or empty
	    if not (role and role.strip() != ""):
	        role = DEFAULT_ROLE
	        print(f"⚠️ WARNING: Role was empty/None, defaulting to '{role}'", file=sys.stderr)

	    if mode == "Raw Text":
	        source_type = "raw_text"
	    else:
	        source_type = "url"

	    effective_role = role.strip() if role else DEFAULT_ROLE
	    outcome = ingest_document(
	        tenant_id=tenant_id,
	        role=effective_role,
	        source_type=source_type,
	        content=content,
	        document_url=doc_url,
	        filename=filename,
	        doc_id=doc_id_value,
	        metadata_json=metadata
	    )

	    # Add note about refreshing Knowledge Base Library
	    if "✅" not in outcome:
	        return outcome
	    outcome += "\n\n💡 Tip: Go to the 'Knowledge Base Library' tab to view your ingested documents."
	    return outcome

	# The inputs are passed positionally, so their order must match the
	# parameter order of handle_ingest_document.
	ingest_doc_button.click(
	fn=handle_ingest_document,
	inputs=[
	tenant_id_input,
	role_input,
	ingestion_mode,
	doc_content,
	document_url,
	doc_filename,
	doc_id,
	metadata_json
	],
	outputs=document_status
	)

	# File-upload widgets are created hidden; toggle_source_fields reveals them
	# when the "File Upload" mode is selected.
	file_section = gr.Markdown("#### 📁 File Upload (PDF, DOCX, TXT, Markdown)", visible=False)
	file_upload = gr.File(
	label="Upload File",
	file_types=[".pdf", ".docx", ".txt", ".md", ".markdown"],
	visible=False
	)
	ingest_file_button = gr.Button("Upload & Ingest File", visible=False)

	def handle_file_ingestion(tenant_id, role, file_obj):
	    """Ingest an uploaded file and return the status text.

	    Delegates to ``ingest_file``; when the result contains the "✅" marker
	    a hint pointing at the Knowledge Base Library tab is appended.
	    """
	    outcome = ingest_file(tenant_id, role, file_obj)
	    if "✅" not in outcome:
	        return outcome
	    # Successful upload: tell the user where the document can be found.
	    return outcome + "\n\n💡 Tip: Go to the 'Knowledge Base Library' tab to view your ingested documents."

	# File ingestion reports into the same status area as text/URL ingestion.
	ingest_file_button.click(
	fn=handle_file_ingestion,
	inputs=[tenant_id_input, role_input, file_upload],
	outputs=document_status
	)

	def toggle_source_fields(mode):
	    """Return eight visibility updates for the selected ingestion mode.

	    The tuple order matches the outputs wired to the mode radio: content
	    box, URL box, filename, document id, text/URL ingest button, then the
	    file section heading, file picker and file ingest button.
	    """
	    file_mode = mode == "File Upload"
	    text_url_widgets = not file_mode
	    visibility_flags = (
	        mode == "Raw Text",   # content box
	        mode == "URL",        # URL box
	        text_url_widgets,     # filename
	        text_url_widgets,     # document id
	        text_url_widgets,     # text/URL ingest button
	        file_mode,            # file section heading
	        file_mode,            # file picker
	        file_mode,            # file ingest button
	    )
	    return tuple(gr.update(visible=flag) for flag in visibility_flags)

	# The outputs list must stay in the same order as the tuple returned by
	# toggle_source_fields (one visibility update per component).
	ingestion_mode.change(
	fn=toggle_source_fields,
	inputs=[ingestion_mode],
	outputs=[
	doc_content,
	document_url,
	doc_filename,
	doc_id,
	ingest_doc_button,
	file_section,
	file_upload,
	ingest_file_button,
	]
	)

	with gr.Tab("📖 Knowledge Base Library"):
	# Access denied for Editor role
	# (created hidden; the real initial visibility is assigned just below)
	kb_access_denied = gr.Markdown(
	"""
	<div style="background: linear-gradient(135deg, rgba(239, 68, 68, 0.2) 0%, rgba(220, 38, 38, 0.2) 100%); padding: 40px; border-radius: 16px; border: 2px solid rgba(239, 68, 68, 0.4); text-align: center; margin: 20px 0;">
	<h2 style="color: #fca5a5; margin-bottom: 16px;">🔒 Access Denied</h2>
	<p style="color: #f1f5f9; font-size: 16px; margin-bottom: 12px;">
	<strong>Editor role can only access Document Ingestion.</strong>
	</p>
	<p style="color: #cbd5e1; font-size: 14px;">
	Please switch to Owner or Admin role to access Knowledge Base Library.
	</p>
	</div>
	""",
	visible=False
	)

	# Set initial visibility based on default role
	# Editor should NOT see Knowledge Base Library content
	# Exactly one of the banner / content column is visible at start-up.
	initial_is_editor = (DEFAULT_ROLE or "").lower().strip() == "editor"
	kb_access_denied.visible = initial_is_editor # Show access denied for editor
	kb_library_content = gr.Column(visible=not initial_is_editor)

	# Everything in this column is shown or hidden together via kb_library_content.
	with kb_library_content:
	gr.Markdown(
	"""
	<div style="background: linear-gradient(135deg, rgba(139, 92, 246, 0.1) 0%, rgba(124, 58, 237, 0.1) 100%); padding: 20px; border-radius: 12px; border: 1px solid rgba(139, 92, 246, 0.2); margin-bottom: 20px;">
	### 📖 Knowledge Base Library
	View, search, and manage all ingested documents for your tenant with visual analytics.

	Features:
	- 📊 Statistics: View document counts, types, and distribution
	- 🔍 Search: Use semantic search with cross-encoder re-ranking for better results
	- 🤖 AI Metadata: Documents include auto-extracted title, summary, tags, topics, and quality scores
	- 🔽 Filter: Filter documents by type (text, PDF, FAQ, link)
	- 🗑️ Delete: Remove individual documents or delete all at once (Admin/Owner only)
	</div>
	"""
	)

	# Statistics Section
	# Placeholder cards; refresh_documents rewrites their markdown with real counts.
	with gr.Row():
	kb_total_docs = gr.Markdown("### 📄 Total Documents\n0", elem_classes=["stat-card"])
	kb_text_docs = gr.Markdown("### 📝 Text Documents\n0", elem_classes=["stat-card"])
	kb_pdf_docs = gr.Markdown("### 📄 PDF Documents\n0", elem_classes=["stat-card"])
	kb_faq_docs = gr.Markdown("### ❓ FAQ Documents\n0", elem_classes=["stat-card"])
	kb_link_docs = gr.Markdown("### 🔗 Link Documents\n0", elem_classes=["stat-card"])

	# Chart and Search Section
	with gr.Row():
	# Left column: distribution chart plus the refresh / delete-all actions.
	with gr.Column(scale=1):
	kb_chart = gr.Plot(label="Document Type Distribution", show_label=True)
	kb_refresh_button = gr.Button("🔄 Refresh Documents", variant="primary", size="lg")
	kb_delete_all_button = gr.Button("🗑️ Delete All Documents", variant="stop")

	# Right column: search box, its status line and the result table.
	with gr.Column(scale=1):
	kb_search_query = gr.Textbox(
	label="🔍 Search Knowledge Base",
	placeholder="Enter a search query (e.g., 'admin', 'policy', 'FAQ')...",
	show_label=True
	)
	kb_search_button = gr.Button("Search", variant="primary")
	kb_search_status = gr.Markdown("")
	kb_search_results = gr.Dataframe(
	headers=["Rank", "Text", "Relevance"],
	datatype=["number", "str", "str"],
	interactive=False,
	label="Search Results",
	wrap=True
	)

	# Status and Filter Section
	kb_status = gr.Markdown("👉 Click Refresh Documents to load your knowledge base.")

	with gr.Row():
	with gr.Column(scale=2):
	# Changing this radio re-runs the document refresh with the chosen type.
	kb_filter_type = gr.Radio(
	["all", "text", "pdf", "faq", "link"],
	value="all",
	label="Filter by Type",
	info="Filter documents by detected type"
	)
	with gr.Column(scale=1):
	kb_avg_length = gr.Markdown("Average Length: 0 characters")

	# Documents Table
	kb_documents_table = gr.Dataframe(
	headers=["ID", "Type", "Preview", "Length", "Created"],
	datatype=["number", "str", "str", "number", "str"],
	interactive=False,
	label="Documents",
	wrap=True
	)

	# Delete Section (Admin/Owner only)
	# Kept as a named Row so the role-change handler can hide it as a unit.
	kb_delete_section = gr.Row()
	with kb_delete_section:
	kb_delete_id = gr.Number(
	label="Delete Document by ID",
	value=None,
	precision=0,
	info="Enter document ID to delete",
	scale=3
	)
	kb_delete_button = gr.Button("Delete Document", variant="stop", scale=1)

	# Receives the message returned by the delete handlers.
	kb_delete_status = gr.Markdown("")

	# Function to update KB tab visibility based on role
	def update_kb_visibility(role):
	    """Return visibility updates for the two delete controls.

	    Both the delete-all button and the delete section are shown only when
	    ``can_delete_documents(role)`` is true.
	    """
	    deletion_allowed = can_delete_documents(role)
	    delete_all_update = gr.update(visible=deletion_allowed)
	    delete_section_update = gr.update(visible=deletion_allowed)
	    return (delete_all_update, delete_section_update)

	def refresh_documents(tenant_id, role, filter_type="all"):
	    """Load the tenant's documents and build every Knowledge Base output.

	    Calls ``list_documents`` and, when ``filter_type`` is not "all", keeps
	    only rows whose type column matches it (case-insensitive).  The
	    statistics cards always reflect the unfiltered stats payload.

	    Returns a 9-tuple in the order the refresh outputs are wired:
	    status markdown, table rows, total/text/pdf/faq/link card markdown,
	    average-length markdown, and the chart figure.
	    """
	    status, docs, total, stats, chart_fig = list_documents(tenant_id, role)

	    # Tolerate a missing or malformed stats payload instead of raising
	    # AttributeError while formatting the cards.
	    if not isinstance(stats, dict):
	        stats = {}

	    # Filter documents by type if not "all".
	    # docs is a list of rows: [ID, Type, Preview, Length, Created]
	    if filter_type != "all" and docs:
	        wanted = filter_type.lower()
	        # str() guards against a non-string type cell (e.g. None).
	        docs = [
	            doc for doc in docs
	            if len(doc) > 1 and str(doc[1]).lower() == wanted
	        ]
	        status = f"✅ Found {len(docs)} {filter_type} document(s) (out of {total} total)"

	    # Update statistics cards
	    type_counts = stats.get("types") or {}
	    total_md = f"### 📄 Total Documents\n{total}"
	    text_md = f"### 📝 Text Documents\n{type_counts.get('text', 0)}"
	    pdf_md = f"### 📄 PDF Documents\n{type_counts.get('pdf', 0)}"
	    faq_md = f"### ❓ FAQ Documents\n{type_counts.get('faq', 0)}"
	    link_md = f"### 🔗 Link Documents\n{type_counts.get('link', 0)}"
	    # `or 0` keeps the thousands-separator format spec from failing on None.
	    avg_length_md = f"Average Length: {stats.get('avg_length') or 0:,} characters"

	    # The backslash is doubled so the emitted text is unchanged (backslash +
	    # pipe) without relying on the invalid "\|" escape sequence.
	    status_msg = f"{status}\n\nTotal Documents: {total} \\| Total Characters: {stats.get('total_chars') or 0:,}"

	    return (
	        status_msg, docs, total_md, text_md, pdf_md, faq_md, link_md,
	        avg_length_md, chart_fig
	    )

	def filter_documents(tenant_id, role, filter_type):
	    """Re-run the document refresh with the type chosen in the filter radio."""
	    refreshed_outputs = refresh_documents(tenant_id, role, filter_type)
	    return refreshed_outputs

	def search_kb(tenant_id, role, query):
	    """Run a knowledge-base search and return ``(status, results)``."""
	    outcome = search_knowledge_base(tenant_id, role, query)
	    # Unpack explicitly so an unexpected result shape still fails loudly here.
	    status, results = outcome
	    return (status, results)

	def delete_doc(tenant_id, role, doc_id):
	    """Delete one document by id, then refresh the document views.

	    Returns ten values: the delete status message followed by the nine
	    outputs of ``refresh_documents``.  When ``doc_id`` is missing or not
	    positive, nothing is deleted and the nine refresh outputs are left as
	    they are.
	    """
	    if doc_id is None or doc_id <= 0:
	        # The click handler is wired to ten outputs, so ten values must be
	        # returned.  A bare gr.update() leaves each of the other nine
	        # components untouched instead of blanking the table and cards.
	        return (
	            "❗ Please enter a valid document ID.",
	            *(gr.update() for _ in range(9)),
	        )
	    result = delete_document(tenant_id, role, int(doc_id))
	    # Refresh document list after deletion
	    return (result, *refresh_documents(tenant_id, role, "all"))

	def delete_all_docs(tenant_id, role):
	    """Delete every document for the tenant, then refresh the document views.

	    Returns the deletion message followed by the nine outputs of
	    ``refresh_documents`` (unfiltered).
	    """
	    deletion_message = delete_all_documents(tenant_id, role)
	    # Reload the list only after the deletion call has returned.
	    refreshed_outputs = refresh_documents(tenant_id, role, "all")
	    return (deletion_message,) + tuple(refreshed_outputs)

	# Refresh and filter share the same nine outputs, in the order returned by
	# refresh_documents.
	kb_refresh_button.click(
	fn=refresh_documents,
	inputs=[tenant_id_input, role_input, kb_filter_type],
	outputs=[
	kb_status, kb_documents_table, kb_total_docs, kb_text_docs,
	kb_pdf_docs, kb_faq_docs, kb_link_docs, kb_avg_length, kb_chart
	]
	)

	kb_filter_type.change(
	fn=filter_documents,
	inputs=[tenant_id_input, role_input, kb_filter_type],
	outputs=[
	kb_status, kb_documents_table, kb_total_docs, kb_text_docs,
	kb_pdf_docs, kb_faq_docs, kb_link_docs, kb_avg_length, kb_chart
	]
	)

	# Search can be triggered by the button or by pressing Enter in the query box.
	kb_search_button.click(
	fn=search_kb,
	inputs=[tenant_id_input, role_input, kb_search_query],
	outputs=[kb_search_status, kb_search_results]
	)

	kb_search_query.submit(
	fn=search_kb,
	inputs=[tenant_id_input, role_input, kb_search_query],
	outputs=[kb_search_status, kb_search_results]
	)

	# Both delete handlers target ten outputs: kb_delete_status first, then the
	# same nine components used by the refresh wiring above.
	kb_delete_button.click(
	fn=delete_doc,
	inputs=[tenant_id_input, role_input, kb_delete_id],
	outputs=[
	kb_delete_status, kb_status, kb_documents_table, kb_total_docs,
	kb_text_docs, kb_pdf_docs, kb_faq_docs, kb_link_docs, kb_avg_length, kb_chart
	]
	)

	kb_delete_all_button.click(
	fn=delete_all_docs,
	inputs=[tenant_id_input, role_input],
	outputs=[
	kb_delete_status, kb_status, kb_documents_table, kb_total_docs,
	kb_text_docs, kb_pdf_docs, kb_faq_docs, kb_link_docs, kb_avg_length, kb_chart
	]
	)

	# Update visibility when role changes
	def update_kb_full_visibility(role):
	    """Return the four visibility updates for the Knowledge Base tab.

	    The role is lower-cased and stripped first (``DEFAULT_ROLE`` is used
	    when it is empty).  Order of the returned updates: access-denied
	    banner, library content, delete-all button, delete section.
	    """
	    normalized_role = (role or DEFAULT_ROLE).lower().strip()
	    editor_locked_out = normalized_role == "editor"
	    deletion_allowed = can_delete_documents(normalized_role)

	    visibility_flags = (
	        editor_locked_out,       # access-denied banner (editor only)
	        not editor_locked_out,   # library content for every other role
	        deletion_allowed,        # delete-all button
	        deletion_allowed,        # delete section
	    )
	    return tuple(gr.update(visible=flag) for flag in visibility_flags)

	# Output order mirrors the tuple returned by update_kb_full_visibility.
	role_input.change(
	fn=update_kb_full_visibility,
	inputs=[role_input],
	outputs=[kb_access_denied, kb_library_content, kb_delete_all_button, kb_delete_section]
	)

	with gr.Tab("📊 Admin Analytics"):
	# Access-denied banner. It is created hidden, and update_analytics_visibility
	# (defined later in this tab) keeps it hidden for every role.
	analytics_access_denied = gr.Markdown(
	"""
	<div style="background: linear-gradient(135deg, rgba(239, 68, 68, 0.2) 0%, rgba(220, 38, 38, 0.2) 100%); padding: 40px; border-radius: 16px; border: 2px solid rgba(239, 68, 68, 0.4); text-align: center; margin: 20px 0;">
	<h2 style="color: #fca5a5; margin-bottom: 16px;">🔒 Access Denied</h2>
	<p style="color: #f1f5f9; font-size: 16px; margin-bottom: 12px;">
	<strong>Analytics is available to all roles.</strong>
	</p>
	<p style="color: #cbd5e1; font-size: 14px;">
	If you're seeing this message, there may be a configuration issue.
	</p>
	</div>
	""",
	visible=False
	)

	# Analytics content. It is created visible, and update_analytics_visibility
	# keeps it visible for every role.
	analytics_content = gr.Column(visible=True)

	with analytics_content:
	# NOTE(review): the banner text below says "Admin and Owner roles only",
	# but the visibility handler in this tab shows the content to all roles.
	# Confirm which is intended before changing the user-facing text.
	gr.Markdown(
	"""
	<div style="background: linear-gradient(135deg, rgba(245, 158, 11, 0.1) 0%, rgba(217, 119, 6, 0.1) 100%); padding: 24px; border-radius: 12px; border: 1px solid rgba(245, 158, 11, 0.2); margin-bottom: 20px;">
	# 📊 Admin Analytics Dashboard

	Comprehensive tenant-level analytics with visual insights, performance metrics, and detailed tool usage statistics.

	🔒 Access: Admin and Owner roles only
	</div>
	"""
	)

	# Refresh Button at Top
	with gr.Row():
	analytics_refresh = gr.Button("🔄 Fetch Analytics Snapshot", variant="primary", size="lg")
	gr.Markdown("")

	# Statistics Cards
	# Placeholder values; format_analytics rewrites the markdown of each card.
	gr.Markdown("### 📈 Key Metrics")
	with gr.Row():
	analytics_total_queries = gr.Markdown("### 📊 Total Queries\n0", elem_classes=["stat-card"])
	analytics_active_users = gr.Markdown("### 👥 Active Users\n0", elem_classes=["stat-card"])
	analytics_redflags = gr.Markdown("### 🚩 Red Flags\n0", elem_classes=["stat-card"])
	analytics_rag_searches = gr.Markdown("### 🔍 RAG Searches\n0", elem_classes=["stat-card"])

	# Charts Section
	gr.Markdown("### 📊 Performance Charts")
	with gr.Row():
	with gr.Column(scale=1):
	gr.Markdown("#### 📈 Tool Usage Count", elem_classes=["chart-title"])
	analytics_tool_chart = gr.Plot(label="", show_label=False)
	with gr.Column(scale=1):
	gr.Markdown("#### ⚡ Average Tool Latency", elem_classes=["chart-title"])
	analytics_latency_chart = gr.Plot(label="", show_label=False)

	# RAG Quality and Summary Section
	with gr.Row():
	with gr.Column(scale=1):
	gr.Markdown("#### 🔍 RAG Quality Metrics", elem_classes=["chart-title"])
	analytics_rag_chart = gr.Plot(label="", show_label=False)

	with gr.Column(scale=1):
	gr.Markdown("### 📋 Analytics Summary")
	analytics_summary = gr.Markdown(
	"👉 Click Fetch Analytics Snapshot to load data.",
	elem_classes=["summary-box"]
	)

	# Tool Usage Details Table
	gr.Markdown("### 🔧 Detailed Tool Usage")
	analytics_tool_table = gr.Dataframe(
	headers=["Tool", "Count", "Avg Latency (ms)", "Success", "Errors", "Total Tokens"],
	datatype=["str", "number", "number", "number", "number", "number"],
	interactive=False,
	label="",
	wrap=True
	)

	# NOTE(review): this hidden component is not among the outputs of the
	# analytics refresh wiring in this tab; errors are written to
	# analytics_summary instead. Confirm whether it is still needed.
	analytics_error = gr.Markdown("", visible=False)

	def format_analytics(tenant_id, role):
	    """Fetch analytics and shape them for the nine dashboard outputs.

	    Returns a 9-tuple in the order the refresh button is wired: summary
	    markdown, four stat-card markdown strings (total queries, active users,
	    red flags, RAG searches), the tool-usage, latency and RAG charts, and
	    the rows for the tool-usage table.

	    When ``fetch_admin_analytics`` reports an error, the error text takes
	    the place of the summary and every other output is blanked.  A failure
	    of the follow-up overview request is logged and the cards fall back
	    to zeros.
	    """
	    summary, tool_usage, tool_chart, latency_chart, rag_chart, error = fetch_admin_analytics(tenant_id, role)

	    if error:
	        return (error, "", "", "", "", None, None, None, [])

	    # Extract overview data - fetch_admin_analytics already fetched it, but
	    # we need it again for the cards.
	    overview_data = {}
	    try:
	        resp = requests.get(
	            f"{BACKEND_BASE_URL}/analytics/overview",
	            headers={
	                "x-tenant-id": tenant_id,
	                "x-user-role": role if role else DEFAULT_ROLE,
	            },
	            timeout=30,
	        )
	        if resp.status_code == 200:
	            data = resp.json()
	            # The API returns {"overview": {...}} or a direct overview object
	            overview_data = data.get("overview", data) if isinstance(data, dict) else {}
	            # Debug: print to see what we're getting
	            print(f"DEBUG: Overview data keys: {overview_data.keys() if isinstance(overview_data, dict) else 'Not a dict'}")
	    except Exception as e:
	        # Best effort: the cards are optional, so log and continue with zeros.
	        print(f"Error fetching overview: {e}")

	    # Anything that is not a mapping is treated as "no overview available".
	    if not isinstance(overview_data, dict):
	        overview_data = {}
	    total_queries = overview_data.get("total_queries", 0)
	    active_users = overview_data.get("active_users", 0)
	    redflag_count = overview_data.get("redflag_count", 0)
	    rag_quality = overview_data.get("rag_quality", {})
	    rag_searches = rag_quality.get("total_searches", 0) if isinstance(rag_quality, dict) else 0

	    # Format statistics cards
	    queries_md = f"### 📊 Total Queries\n{total_queries}"
	    users_md = f"### 👥 Active Users\n{active_users}"
	    redflags_md = f"### 🚩 Red Flags\n{redflag_count}"
	    rag_md = f"### 🔍 RAG Searches\n{rag_searches}"

	    # Format tool usage table.  A missing usage mapping or a malformed
	    # per-tool entry yields an empty table / zeroed row rather than an error.
	    usage_by_tool = tool_usage if isinstance(tool_usage, dict) else {}
	    tool_table_data = []
	    for tool_name, stats in usage_by_tool.items():
	        if not isinstance(stats, dict):
	            stats = {}
	        tool_table_data.append({
	            "Tool": tool_name.replace(".", " ").title(),
	            "Count": stats.get("count", 0),
	            # `or 0` keeps round() from raising on an explicit None latency.
	            "Avg Latency (ms)": round(stats.get("avg_latency_ms") or 0, 2),
	            "Success": stats.get("success_count", 0),
	            "Errors": stats.get("error_count", 0),
	            "Total Tokens": stats.get("total_tokens", 0)
	        })

	    return (
	        summary, queries_md, users_md, redflags_md, rag_md,
	        tool_chart, latency_chart, rag_chart, tool_table_data
	    )

	# The nine outputs are listed in the same order as the tuple returned by
	# format_analytics.
	analytics_refresh.click(
	fn=format_analytics,
	inputs=[tenant_id_input, role_input],
	outputs=[
	analytics_summary,
	analytics_total_queries,
	analytics_active_users,
	analytics_redflags,
	analytics_rag_searches,
	analytics_tool_chart,
	analytics_latency_chart,
	analytics_rag_chart,
	analytics_tool_table
	]
	)

	# Function to update Analytics tab visibility based on role (all roles can view)
	def update_analytics_visibility(role):
	    """Return visibility updates for the Analytics tab.

	    Analytics is open to every role, so the result does not depend on
	    ``role``: the access-denied banner is always hidden and the analytics
	    content is always shown.  The parameter is kept because the handler is
	    wired to the role selector's change event.
	    """
	    return (
	        gr.update(visible=False),  # No access denied message
	        gr.update(visible=True),   # Analytics content visible for all
	    )

	# Update visibility when role changes
	# (output order: access-denied banner, then analytics content)
	role_input.change(
	fn=update_analytics_visibility,
	inputs=[role_input],
	outputs=[analytics_access_denied, analytics_content]
	)


	with gr.Tab("🛡️ Admin Rules & Compliance"):
	# Access denied for Editor role
	# NOTE(review): the banner is created hidden and rules_content is created
	# visible, so as far as this section shows the rules UI is displayed for any
	# role until role_input fires a change event. The Knowledge Base tab derives
	# its initial visibility from DEFAULT_ROLE; confirm whether this tab should too.
	rules_access_denied = gr.Markdown(
	"""
	<div style="background: linear-gradient(135deg, rgba(239, 68, 68, 0.2) 0%, rgba(220, 38, 38, 0.2) 100%); padding: 40px; border-radius: 16px; border: 2px solid rgba(239, 68, 68, 0.4); text-align: center; margin: 20px 0;">
	<h2 style="color: #fca5a5; margin-bottom: 16px;">🔒 Access Denied</h2>
	<p style="color: #f1f5f9; font-size: 16px; margin-bottom: 12px;">
	<strong>Editor role can only access Document Ingestion.</strong>
	</p>
	<p style="color: #cbd5e1; font-size: 14px;">
	Admin Rules & Compliance is restricted to Admin and Owner roles only.
	</p>
	</div>
	""",
	visible=False
	)

	# Container for the whole rules UI so it can be shown or hidden as a unit.
	rules_content = gr.Column(visible=True)

	with rules_content:
	gr.Markdown(
	"""
	<div style="background: linear-gradient(135deg, rgba(239, 68, 68, 0.1) 0%, rgba(220, 38, 38, 0.1) 100%); padding: 20px; border-radius: 12px; border: 1px solid rgba(239, 68, 68, 0.2); margin-bottom: 20px;">
	### 🛡️ Admin Rules & Regulations
	Upload or manage tenant-specific governance rules (red-flag patterns, compliance policies, etc.).

	📤 Upload Methods:
	- Text Input: Enter one rule per line in the text box
	- File Upload: Upload rules from TXT, PDF, DOC, or DOCX files

	✨ Features:
	- 🤖 Rules are automatically enhanced by LLM (identifies edge cases, improves patterns)
	- 💬 Comment lines (starting with #) are automatically ignored
	- 🗑️ Use the delete box to remove an exact rule
	- 🔄 Refresh anytime to view the latest rule set

	🔒 Access: Admin and Owner roles only
	</div>
	"""
	)

	# Current rule set: a summary line, the rule table, and a status line that
	# the add/delete handlers write to.
	rules_summary = gr.Markdown("👉 Click Refresh Rules to see existing entries.")
	rules_table = gr.Dataframe(
	headers=["#", "Rule"],
	datatype=["number", "str"],
	interactive=False,
	value=[]
	)
	rules_status = gr.Markdown("")

	with gr.Row():
	refresh_rules_button = gr.Button("Refresh Rules", variant="secondary")
	gr.Markdown("")

	with gr.Row():
	# Left column: add rules typed into a text box.
	with gr.Column(scale=1):
	rules_input = gr.Textbox(
	label="Rules / Regulations (Text Input)",
	placeholder="Enter one rule per line...",
	lines=6
	)
	enhance_rules_checkbox = gr.Checkbox(
	label="🤖 Enable LLM Enhancement (slower but provides better patterns and explanations)",
	value=True,
	info="Uncheck to add rules quickly without LLM enhancement"
	)
	upload_rules_button = gr.Button("Upload / Append Rules", variant="primary")

	# Right column: add rules from an uploaded file. type="filepath" means the
	# handler receives a path string rather than a file object.
	with gr.Column(scale=1):
	gr.Markdown("OR")
	rules_file_upload = gr.File(
	label="Upload Rules File",
	file_types=[".txt", ".pdf", ".doc", ".docx"],
	type="filepath"
	)
	enhance_file_checkbox = gr.Checkbox(
	label="🤖 Enable LLM Enhancement",
	value=True,
	info="Uncheck to add rules quickly without LLM enhancement"
	)
	upload_file_button = gr.Button("Upload Rules from File", variant="primary")

	# Deletion accepts either a rule number or the full rule text (per the placeholder).
	delete_rule_input = gr.Textbox(
	label="Delete Rule",
	placeholder="Enter rule number (e.g., 1) or the full rule text to remove..."
	)
	delete_rule_button = gr.Button("Delete Rule", variant="stop")

	# Refresh only updates the summary and the table.
	refresh_rules_button.click(
	fn=fetch_admin_rules,
	inputs=[tenant_id_input, role_input],
	outputs=[rules_summary, rules_table]
	)

	# The three mutating actions below all write a status message and then the
	# refreshed summary and table.
	upload_rules_button.click(
	fn=add_rules_and_refresh,
	inputs=[tenant_id_input, role_input, rules_input, enhance_rules_checkbox],
	outputs=[rules_status, rules_summary, rules_table]
	)

	# NOTE(review): the lambda forwards its four arguments unchanged, so passing
	# add_rules_from_file directly looks equivalent - confirm before simplifying.
	upload_file_button.click(
	fn=lambda tenant_id, role, file_path, enhance: add_rules_from_file(tenant_id, role, file_path, enhance),
	inputs=[tenant_id_input, role_input, rules_file_upload, enhance_file_checkbox],
	outputs=[rules_status, rules_summary, rules_table]
	)

	delete_rule_button.click(
	fn=delete_rule_and_refresh,
	inputs=[tenant_id_input, role_input, delete_rule_input],
	outputs=[rules_status, rules_summary, rules_table]
	)

	# Function to update Admin Rules tab visibility based on role
	def update_rules_visibility(role):
	    """Return visibility updates for the Admin Rules tab.

	    The role is lower-cased and stripped before the permission check
	    (``DEFAULT_ROLE`` is used when it is empty), matching how the Knowledge
	    Base tab normalizes the role.  Order of the returned updates:
	    access-denied banner, then rules content.
	    """
	    # Normalize so values such as "Admin" or " owner " are recognized.
	    role_lower = (role or DEFAULT_ROLE).lower().strip()
	    # can_manage_rules only accepts admin/owner, so editors (and viewers)
	    # are already denied without a separate editor check.
	    has_access = can_manage_rules(role_lower)
	    return (
	        gr.update(visible=not has_access),  # Access denied for everyone else
	        gr.update(visible=has_access),      # Rules content for Admin/Owner only
	    )

	# Output order mirrors the tuple returned by update_rules_visibility.
	role_input.change(
	fn=update_rules_visibility,
	inputs=[role_input],
	outputs=[rules_access_denied, rules_content]
	)

	# Static page footer.
	gr.Markdown(
	"""
	<div style="margin-top: 40px; padding: 24px; background: linear-gradient(135deg, rgba(15, 23, 42, 0.5) 0%, rgba(30, 41, 59, 0.5) 100%); border-radius: 12px; border: 1px solid rgba(148, 163, 184, 0.1); text-align: center;">
	<p style="margin: 0; color: #94a3b8; font-size: 14px;">
	Built with ❤️ using <a href="https://modelcontextprotocol.io/" target="_blank" style="color: #06b6d4; text-decoration: none; font-weight: 600;">Model Context Protocol (MCP)</a>
	</p>
	<p style="margin: 8px 0 0 0; color: #64748b; font-size: 12px;">
	Enterprise-Grade MCP Autonomous Agent Platform
	</p>
	</div>
	"""
	)

	if __name__ == "__main__":
	    import os
	    import threading
	    import time
	    import requests

	    # Environment detection:
	    # - Hugging Face Spaces sets SPACE_ID.
	    # - Inside Docker the entrypoint script manages the backend services, so
	    #   they must not be auto-started from here.
	    is_hf_space = os.getenv("SPACE_ID") is not None
	    is_docker = os.path.exists("/.dockerenv") or os.getenv("DOCKER_CONTAINER") == "1"

	    # Bind to all interfaces on Spaces/Docker; stay on loopback for local dev.
	    if is_hf_space or is_docker:
	        server_name = "0.0.0.0"
	    else:
	        server_name = "127.0.0.1"

	    # Start backend services only on HF Spaces outside Docker.
	    if is_hf_space and not is_docker:

	        def _spawn_uvicorn(app_path, port_env, default_port, label):
	            """Launch one uvicorn app as a child process; log a warning on failure."""
	            try:
	                import sys
	                import subprocess
	                # Popen returns immediately, so the service runs in the
	                # background; no stdout/stderr redirection is requested.
	                command = [
	                    sys.executable, "-m", "uvicorn",
	                    app_path,
	                    "--host", "0.0.0.0",
	                    "--port", os.getenv(port_env, default_port),
	                    "--log-level", "info",
	                ]
	                subprocess.Popen(command)
	            except Exception as e:
	                print(f"Warning: Could not start {label} server: {e}")

	        def start_mcp_server():
	            """Start MCP server in a background process."""
	            _spawn_uvicorn("backend.mcp_server.server:app", "MCP_PORT", "8900", "MCP")

	        def start_fastapi_server():
	            """Start FastAPI server in a background process."""
	            _spawn_uvicorn("backend.api.main:app", "API_PORT", "8000", "FastAPI")

	        # Start services in background threads
	        print("Starting backend services...")
	        mcp_thread = threading.Thread(target=start_mcp_server, daemon=True)
	        api_thread = threading.Thread(target=start_fastapi_server, daemon=True)

	        mcp_thread.start()
	        # Give the MCP server time to start before the API is launched.
	        time.sleep(4)
	        api_thread.start()
	        # Give FastAPI extra time on a first cold boot (model downloads etc.)
	        time.sleep(10)

	    demo.launch(
	        server_name=server_name,
	        server_port=7860,
	        share=False,
	        show_error=True,
	    )