Spaces:

Pipalskill
/

Support-Ticket-AI-Agent

Sleeping

App Files Files Community

Support-Ticket-AI-Agent / agent_langchain.py

Pipalskill

Update agent_langchain.py

2760115 verified 3 months ago

raw

history blame contribute delete

19.6 kB

	import os
	os.environ["TOKENIZERS_PARALLELISM"] = "false"
	os.environ["TRANSFORMERS_CACHE"] = "/tmp/transformers"
	os.environ["HF_HOME"] = "/tmp/huggingface"
	os.environ["SENTENCE_TRANSFORMERS_HOME"] = "/tmp/sentence_transformers"
	os.environ["TORCH_HOME"] = "/tmp/torch"

	import json
	import requests
	import torch
	import time
	from transformers import AutoTokenizer, AutoModelForSequenceClassification
	import numpy as np
	from sentence_transformers import SentenceTransformer
	import chromadb
	from chromadb.config import Settings
	from langchain_google_genai import ChatGoogleGenerativeAI
	from langchain.agents.react.agent import create_react_agent
	from langchain.agents.agent import AgentExecutor

	from langchain.tools import Tool
	from langchain.prompts import PromptTemplate
	import threading
	from datetime import datetime
	import firebase_admin
	from firebase_admin import credentials, firestore
	from typing import Optional, Dict, Any

	# Environment
	GEMINI_API_KEY = os.environ.get("GEMINI_API_KEY")
	ROUTING_URL = os.environ.get("ROUTING_URL")
	SPACE_URL = os.environ.get("SPACE_URL", "http://localhost:7860")
	FIREBASE_CREDS_PATH = os.environ.get("FIREBASE_CREDS_PATH")
	firebase_creds_json = os.getenv("FIREBASE_CREDS_JSON")

	# Initialize Firebase
	db = None
	if firebase_creds_json:
	try:
	creds_dict = json.loads(firebase_creds_json)
	cred = credentials.Certificate(creds_dict)

	if not firebase_admin._apps:
	firebase_admin.initialize_app(cred)
	db = firestore.client()
	print("✅ Firebase initialized from FIREBASE_CREDS_JSON")
	except Exception as e:
	import traceback
	print(f"⚠️ Firebase init failed: {e}")
	traceback.print_exc()
	else:
	print("⚠️ FIREBASE_CREDS_JSON not found in environment variables")

	# Label Dictionary
	LABEL_DICTIONARY = {
	"I1": "Low Impact", "I2": "Medium Impact", "I3": "High Impact", "I4": "Critical Impact",
	"U1": "Low Urgency", "U2": "Medium Urgency", "U3": "High Urgency", "U4": "Critical Urgency",
	"T1": "Information", "T2": "Incident", "T3": "Problem", "T4": "Request", "T5": "Question"
	}

	# Classification Model
	clf_model_name = "DavinciTech/BERT_Categorizer"
	clf_tokenizer = AutoTokenizer.from_pretrained(clf_model_name, cache_dir="/tmp/transformers")
	clf_model = AutoModelForSequenceClassification.from_pretrained(clf_model_name, cache_dir="/tmp/transformers")

	def classify_ticket(text):
	"""Classify ticket into Impact, Urgency, and Type."""
	inputs = clf_tokenizer(text, return_tensors="pt", truncation=True)
	outputs = clf_model(**inputs)
	logits = outputs.logits[0]
	impact_idx = torch.argmax(logits[:4]).item() + 1
	urgency_idx = torch.argmax(logits[4:8]).item() + 1
	type_idx = torch.argmax(logits[8:]).item() + 1
	return {
	"impact": LABEL_DICTIONARY[f"I{impact_idx}"],
	"urgency": LABEL_DICTIONARY[f"U{urgency_idx}"],
	"type": LABEL_DICTIONARY[f"T{type_idx}"]
	}

	# Routing Function
	def call_routing(text, retries=3, delay=5):
	"""Route ticket to appropriate department."""
	url = ROUTING_URL if ROUTING_URL else f"{SPACE_URL}/route"
	for attempt in range(retries):
	try:
	resp = requests.post(url, json={"text": text}, timeout=30)
	resp.raise_for_status()
	return resp.json().get("department", "General IT")
	except Exception as e:
	print(f"Routing attempt {attempt+1} failed: {e}")
	if attempt < retries - 1:
	time.sleep(delay)
	return "General IT"

	# Knowledge Base
	CHROMA_PATH = "/tmp/chroma"
	COLLECTION_NAME = "knowledge_base"
	kb_collection = None
	kb_lock = threading.Lock()
	encoder = SentenceTransformer("all-MiniLM-L6-v2", cache_folder="/tmp/sentence_transformers")

	def get_kb_collection():
	global kb_collection
	if kb_collection is None:
	with kb_lock:
	if kb_collection is None:
	try:
	chroma_client = chromadb.PersistentClient(
	path=CHROMA_PATH,
	settings=Settings(anonymized_telemetry=False, allow_reset=True)
	)
	kb_collection = chroma_client.get_or_create_collection(COLLECTION_NAME)
	except Exception as e:
	print(f"Could not get KB collection: {e}")
	return kb_collection

	def query_kb(text: str, top_k: int = 1):
	"""Query KB and return answer with confidence."""
	collection = get_kb_collection()
	if not collection or collection.count() == 0:
	return {"answer": None, "confidence": 0.0}

	try:
	query_embedding = encoder.encode([text])[0].tolist()
	results = collection.query(
	query_embeddings=[query_embedding],
	n_results=top_k,
	include=["documents", "distances", "metadatas"]
	)

	if not results or not results.get("documents") or len(results["documents"][0]) == 0:
	return {"answer": None, "confidence": 0.0}

	answer = results["documents"][0][0]
	distance = results["distances"][0][0] if results.get("distances") else 1.0
	confidence = max(0.0, 1.0 - (distance / 2.0))

	return {"answer": answer, "confidence": round(float(confidence), 3)}
	except Exception as e:
	print(f"KB query failed: {e}")
	return {"answer": None, "confidence": 0.0}

	# Firestore Helper
	def save_ticket_to_firestore(ticket_data: Dict[str, Any]):
	"""Save resolved/escalated ticket to Firestore."""
	if not db:
	print("⚠️ Firestore not initialized, skipping save")
	return None

	try:
	ticket_ref = db.collection('tickets').document()
	ticket_data['created_at'] = firestore.SERVER_TIMESTAMP
	ticket_data['updated_at'] = firestore.SERVER_TIMESTAMP
	ticket_ref.set(ticket_data)
	print(f"✅ Ticket saved to Firestore: {ticket_ref.id}")
	return ticket_ref.id
	except Exception as e:
	print(f"❌ Firestore save failed: {e}")
	return None

	# Gemini LLM
	llm = ChatGoogleGenerativeAI(
	model="gemini-2.5-flash",
	temperature=0.3,
	google_api_key=GEMINI_API_KEY
	)

	# Global conversation storage
	conversations = {}

	# Tool Functions for Agent
	def classify_tool(query: str) -> str:
	"""Analyzes ticket severity, impact, urgency, and type. Use when you need to understand ticket priority."""
	result = classify_ticket(query)
	return f"Impact: {result['impact']}, Urgency: {result['urgency']}, Type: {result['type']}"

	def routing_tool(query: str) -> str:
	"""Identifies which IT department should handle this issue. Use when you need to know responsible team."""
	dept = call_routing(query)
	return f"Department: {dept}"

	def kb_tool(query: str) -> str:
	"""Searches knowledge base for solutions. Returns answer with confidence score. Use when you need technical solutions."""
	result = query_kb(query)
	if result["answer"] and result["confidence"] > 0.5:
	return f"[KB Confidence: {result['confidence']}]\n{result['answer']}"
	return f"[KB Confidence: {result['confidence']}] No relevant solution found in knowledge base."

	def escalation_tool(reason: str) -> str:
	"""Creates escalation ticket for human agent. Use ONLY when KB confidence is below 0.6 AND issue is truly complex. Always try KB first!"""
	ticket_id = f"TKT-{datetime.now().strftime('%Y%m%d-%H%M%S')}"
	return f"ESCALATED: Ticket {ticket_id} created. Reason: {reason}. Human agent will respond in 2-4 hours."

	# Define Tools
	tools = [
	Tool(
	name="ClassifyTicket",
	func=classify_tool,
	description="Analyzes ticket to determine impact level, urgency, and type. Use this when you need to understand the severity or priority of an issue."
	),
	Tool(
	name="RouteTicket",
	func=routing_tool,
	description="Determines which IT department should handle this ticket. Use this when you need to identify the responsible team."
	),
	Tool(
	name="SearchKnowledgeBase",
	func=kb_tool,
	description="Searches internal knowledge base for solutions. Returns answer with confidence score (0-1). ALWAYS USE THIS FIRST before escalating. Use this when you need to find technical solutions or troubleshooting steps."
	),
	Tool(
	name="EscalateToHuman",
	func=escalation_tool,
	description="Creates an escalation ticket for human agent review. CRITICAL: Use this ONLY as a LAST RESORT when: 1) KB confidence score is below 0.6 AND you've already tried KB, 2) Issue is extremely complex and unusual, 3) User explicitly confirms the KB solution failed after trying it. DO NOT escalate if KB has a reasonable solution (confidence > 0.6)."
	)
	]

	# IMPROVED Agent Prompt
	AGENT_PROMPT = """You are an intelligent IT Helpdesk AI Agent. Your PRIMARY goal is to resolve tickets using the Knowledge Base. Escalation is a LAST RESORT.

	AVAILABLE TOOLS:
	{tools}

	TOOL NAMES: {tool_names}

	CRITICAL RULES:
	1. ALWAYS search Knowledge Base FIRST - This is your primary tool for resolution
	2. Trust KB solutions with confidence >= 0.6 - These are reliable solutions, provide them to users
	3. ONLY escalate when ABSOLUTELY necessary:
	- KB confidence is below 0.6 AND no solution found
	- Issue is extremely unusual or complex beyond KB scope
	- User explicitly tried your KB solution and reports it failed
	4. Be thorough with KB - If first search doesn't work, try rephrasing the query
	5. Maintain context - Remember conversation history for follow-ups

	DECISION WORKFLOW:
	NEW TICKET → Search KB → If confidence >= 0.6 → Provide solution → Mark RESOLVED
	↓
	If confidence < 0.6 → Try rephrasing search → Still low? → Classify & Route → THEN escalate

	FOLLOW-UP → Check if user tried solution → Worked? → Mark RESOLVED
	↓
	Failed? → Search KB again with different query → Still failing? → THEN escalate

	IMPORTANT:
	- Don't mention tool names or confidence scores to users
	- Provide clear, step-by-step instructions from KB
	- Be conversational and helpful
	- Escalation means you couldn't solve it - avoid this outcome!

	FORMAT:
	Question: the user's input
	Thought: your reasoning about what to do next
	Action: the tool to use (must be one of [{tool_names}])
	Action Input: the input for that tool
	Observation: the tool's output
	... (repeat Thought/Action/Observation as needed)
	Thought: I now have enough information to respond
	Final Answer: your complete response to the user

	Begin!

	Question: {input}
	Thought: {agent_scratchpad}"""

	prompt = PromptTemplate.from_template(AGENT_PROMPT)

	# Create Agent
	agent = create_react_agent(llm=llm, tools=tools, prompt=prompt)
	agent_executor = AgentExecutor(
	agent=agent,
	tools=tools,
	verbose=True,
	max_iterations=6,
	handle_parsing_errors="Check your output and make sure it conforms to the format instructions!",
	return_intermediate_steps=True,
	early_stopping_method="force"
	)

	# Main Processing Function
	def process_with_agent(
	user_message: str,
	conversation_id: str = None,
	user_email: str = None,
	callback=None
	):
	"""Process user message through autonomous AI agent."""

	if not conversation_id:
	conversation_id = f"conv_{datetime.now().strftime('%Y%m%d_%H%M%S')}_{hash(user_message) % 10000}"

	if conversation_id not in conversations:
	conversations[conversation_id] = {
	"messages": [],
	"ticket_info": {},
	"created_at": datetime.now().isoformat(),
	"user_email": user_email,
	"status": "open"
	}

	conv = conversations[conversation_id]

	conv["messages"].append({
	"role": "user",
	"content": user_message,
	"timestamp": datetime.now().isoformat()
	})

	if callback:
	callback({"type": "status", "message": "Agent is thinking..."})

	# Build context for follow-ups
	if len(conv["messages"]) > 1:
	context = f"CONVERSATION HISTORY:\n"
	for msg in conv["messages"][-6:-1]:
	context += f"{msg['role'].upper()}: {msg['content']}\n"
	context += f"\nCURRENT MESSAGE: {user_message}"
	agent_input = context
	else:
	agent_input = user_message

	try:
	result = agent_executor.invoke({"input": agent_input})

	agent_response = result.get("output", "I apologize, I encountered an error.")
	intermediate_steps = result.get("intermediate_steps", [])

	# IMPROVED: Check tool usage to determine status
	status = "in_progress"
	should_save = False
	escalated = False
	used_escalation_tool = False

	# First, check if EscalateToHuman tool was actually used
	for action, observation in intermediate_steps:
	if action.tool == "EscalateToHuman":
	used_escalation_tool = True
	print("🔍 Detected EscalateToHuman tool usage")
	break

	# Determine final status
	if used_escalation_tool:
	# Tool was used - definitely escalated
	status = "escalated"
	should_save = True
	escalated = True
	print("🔴 Ticket ESCALATED (tool used) - Saving to Firebase")
	elif "ESCALATED" in agent_response or "TKT-" in agent_response:
	# Fallback: Check response text
	status = "escalated"
	should_save = True
	escalated = True
	print("🔴 Ticket ESCALATED (text match) - Saving to Firebase")
	elif any(phrase in agent_response.lower() for phrase in [
	"resolved", "you're all set", "should work now", "problem solved",
	"this should fix", "try these steps", "follow these steps"
	]):
	# Resolution detected
	status = "resolved"
	should_save = True
	print("✅ Ticket RESOLVED - Saving to Firebase")
	else:
	# Still in progress
	print("⏳ Ticket IN PROGRESS - Not saving yet")

	# Extract ticket info from tools
	ticket_info = conv.get("ticket_info", {})
	kb_confidence = None
	escalation_reason = None

	for action, observation in intermediate_steps:
	if action.tool == "ClassifyTicket":
	parts = str(observation).split(", ")
	for part in parts:
	if "Impact:" in part:
	ticket_info["impact"] = part.split(": ")[1]
	elif "Urgency:" in part:
	ticket_info["urgency"] = part.split(": ")[1]
	elif "Type:" in part:
	ticket_info["type"] = part.split(": ")[1]

	elif action.tool == "RouteTicket":
	ticket_info["department"] = str(observation).replace("Department: ", "")

	elif action.tool == "SearchKnowledgeBase":
	# Extract confidence from KB response
	if "[KB Confidence:" in str(observation):
	try:
	conf_str = str(observation).split("[KB Confidence: ")[1].split("]")[0]
	kb_confidence = float(conf_str)
	ticket_info["kb_confidence"] = kb_confidence
	except:
	pass

	elif action.tool == "EscalateToHuman":
	# Capture escalation reason
	escalation_reason = action.tool_input

	conv["ticket_info"] = ticket_info
	conv["status"] = status

	# Build reasoning trace for debugging
	reasoning_trace = []
	for action, observation in intermediate_steps:
	reasoning_trace.append({
	"tool": action.tool,
	"input": action.tool_input,
	"output": str(observation)[:200]
	})

	if callback:
	callback({
	"type": "tool_use",
	"tool": action.tool,
	"input": action.tool_input
	})

	conv["messages"].append({
	"role": "assistant",
	"content": agent_response,
	"timestamp": datetime.now().isoformat(),
	"reasoning": reasoning_trace
	})

	# Save to Firestore if resolved OR escalated
	firestore_id = None
	if should_save:
	print(f"💾 Preparing to save ticket - Status: {status}, Escalated: {escalated}")

	firestore_data = {
	"conversation_id": conversation_id,
	"status": status,
	"user_email": user_email or "anonymous",
	"ticket_info": ticket_info,
	"messages": conv["messages"],
	"resolution": agent_response,
	"created_at_iso": conv["created_at"],
	"escalated": escalated,
	"reasoning_trace": reasoning_trace
	}

	# Add escalation reason if escalated
	if escalated:
	if escalation_reason:
	firestore_data["escalation_reason"] = escalation_reason
	elif kb_confidence is not None and kb_confidence < 0.6:
	firestore_data["escalation_reason"] = f"Low KB confidence: {kb_confidence}"
	else:
	firestore_data["escalation_reason"] = "Complex issue requiring human intervention"

	print(f"🔼 Saving escalated ticket - Reason: {firestore_data['escalation_reason']}")

	firestore_id = save_ticket_to_firestore(firestore_data)

	if firestore_id:
	print(f"✅ Successfully saved to Firestore with ID: {firestore_id}")
	else:
	print("❌ Failed to save to Firestore")

	if callback:
	callback({
	"type": "saved",
	"firestore_id": firestore_id,
	"status": status
	})
	else:
	print(f"⏭️ Not saving - Status: {status}, Should save: {should_save}")

	return {
	"conversation_id": conversation_id,
	"response": agent_response,
	"status": status,
	"message_count": len(conv["messages"]),
	"reasoning_trace": reasoning_trace,
	"ticket_info": ticket_info,
	"firestore_id": firestore_id,
	"escalated": escalated
	}

	except Exception as e:
	print(f"❌ Agent error: {e}")
	import traceback
	traceback.print_exc()

	error_response = "I apologize, I encountered an error. Please try again or I can escalate this to a human agent."
	conv["messages"].append({
	"role": "assistant",
	"content": error_response,
	"timestamp": datetime.now().isoformat()
	})

	if callback:
	callback({"type": "error", "message": str(e)})

	return {
	"conversation_id": conversation_id,
	"response": error_response,
	"status": "error",
	"error": str(e)
	}

	def get_conversation_history(conversation_id: str):
	"""Get conversation history."""
	return conversations.get(conversation_id)