Spaces:

Pipalskill
/

Support-Ticket-AI-Agent

Sleeping

File size: 19,608 Bytes

import os
os.environ["TOKENIZERS_PARALLELISM"] = "false"
os.environ["TRANSFORMERS_CACHE"] = "/tmp/transformers"
os.environ["HF_HOME"] = "/tmp/huggingface"
os.environ["SENTENCE_TRANSFORMERS_HOME"] = "/tmp/sentence_transformers"
os.environ["TORCH_HOME"] = "/tmp/torch"

import json
import requests
import torch
import time
from transformers import AutoTokenizer, AutoModelForSequenceClassification
import numpy as np
from sentence_transformers import SentenceTransformer
import chromadb
from chromadb.config import Settings
from langchain_google_genai import ChatGoogleGenerativeAI
from langchain.agents.react.agent import create_react_agent
from langchain.agents.agent import AgentExecutor

from langchain.tools import Tool
from langchain.prompts import PromptTemplate
import threading
from datetime import datetime
import firebase_admin
from firebase_admin import credentials, firestore
from typing import Optional, Dict, Any

# Environment
GEMINI_API_KEY = os.environ.get("GEMINI_API_KEY")
ROUTING_URL = os.environ.get("ROUTING_URL")
SPACE_URL = os.environ.get("SPACE_URL", "http://localhost:7860")
FIREBASE_CREDS_PATH = os.environ.get("FIREBASE_CREDS_PATH")
firebase_creds_json = os.getenv("FIREBASE_CREDS_JSON")

# Initialize Firebase
db = None
if firebase_creds_json:
    try:
        creds_dict = json.loads(firebase_creds_json)
        cred = credentials.Certificate(creds_dict)

        if not firebase_admin._apps:
            firebase_admin.initialize_app(cred)
        db = firestore.client()
        print("✅ Firebase initialized from FIREBASE_CREDS_JSON")
    except Exception as e:
        import traceback
        print(f"⚠️ Firebase init failed: {e}")
        traceback.print_exc()
else:
    print("⚠️ FIREBASE_CREDS_JSON not found in environment variables")

# Label Dictionary
LABEL_DICTIONARY = {
    "I1": "Low Impact", "I2": "Medium Impact", "I3": "High Impact", "I4": "Critical Impact",
    "U1": "Low Urgency", "U2": "Medium Urgency", "U3": "High Urgency", "U4": "Critical Urgency",
    "T1": "Information", "T2": "Incident", "T3": "Problem", "T4": "Request", "T5": "Question"
}

# Classification Model
clf_model_name = "DavinciTech/BERT_Categorizer"
clf_tokenizer = AutoTokenizer.from_pretrained(clf_model_name, cache_dir="/tmp/transformers")
clf_model = AutoModelForSequenceClassification.from_pretrained(clf_model_name, cache_dir="/tmp/transformers")

def classify_ticket(text):
    """Classify ticket into Impact, Urgency, and Type."""
    inputs = clf_tokenizer(text, return_tensors="pt", truncation=True)
    outputs = clf_model(**inputs)
    logits = outputs.logits[0]
    impact_idx = torch.argmax(logits[:4]).item() + 1
    urgency_idx = torch.argmax(logits[4:8]).item() + 1
    type_idx = torch.argmax(logits[8:]).item() + 1
    return {
        "impact": LABEL_DICTIONARY[f"I{impact_idx}"],
        "urgency": LABEL_DICTIONARY[f"U{urgency_idx}"],
        "type": LABEL_DICTIONARY[f"T{type_idx}"]
    }

# Routing Function
def call_routing(text, retries=3, delay=5):
    """Route ticket to appropriate department."""
    url = ROUTING_URL if ROUTING_URL else f"{SPACE_URL}/route"
    for attempt in range(retries):
        try:
            resp = requests.post(url, json={"text": text}, timeout=30)
            resp.raise_for_status()
            return resp.json().get("department", "General IT")
        except Exception as e:
            print(f"Routing attempt {attempt+1} failed: {e}")
            if attempt < retries - 1:
                time.sleep(delay)
    return "General IT"

# Knowledge Base
CHROMA_PATH = "/tmp/chroma"
COLLECTION_NAME = "knowledge_base"
kb_collection = None
kb_lock = threading.Lock()
encoder = SentenceTransformer("all-MiniLM-L6-v2", cache_folder="/tmp/sentence_transformers")

def get_kb_collection():
    global kb_collection
    if kb_collection is None:
        with kb_lock:
            if kb_collection is None:
                try:
                    chroma_client = chromadb.PersistentClient(
                        path=CHROMA_PATH,
                        settings=Settings(anonymized_telemetry=False, allow_reset=True)
                    )
                    kb_collection = chroma_client.get_or_create_collection(COLLECTION_NAME)
                except Exception as e:
                    print(f"Could not get KB collection: {e}")
    return kb_collection

def query_kb(text: str, top_k: int = 1):
    """Query KB and return answer with confidence."""
    collection = get_kb_collection()
    if not collection or collection.count() == 0:
        return {"answer": None, "confidence": 0.0}
    
    try:
        query_embedding = encoder.encode([text])[0].tolist()
        results = collection.query(
            query_embeddings=[query_embedding],
            n_results=top_k,
            include=["documents", "distances", "metadatas"]
        )
        
        if not results or not results.get("documents") or len(results["documents"][0]) == 0:
            return {"answer": None, "confidence": 0.0}
        
        answer = results["documents"][0][0]
        distance = results["distances"][0][0] if results.get("distances") else 1.0
        confidence = max(0.0, 1.0 - (distance / 2.0))
        
        return {"answer": answer, "confidence": round(float(confidence), 3)}
    except Exception as e:
        print(f"KB query failed: {e}")
        return {"answer": None, "confidence": 0.0}

# Firestore Helper
def save_ticket_to_firestore(ticket_data: Dict[str, Any]):
    """Save resolved/escalated ticket to Firestore."""
    if not db:
        print("⚠️ Firestore not initialized, skipping save")
        return None
    
    try:
        ticket_ref = db.collection('tickets').document()
        ticket_data['created_at'] = firestore.SERVER_TIMESTAMP
        ticket_data['updated_at'] = firestore.SERVER_TIMESTAMP
        ticket_ref.set(ticket_data)
        print(f"✅ Ticket saved to Firestore: {ticket_ref.id}")
        return ticket_ref.id
    except Exception as e:
        print(f"❌ Firestore save failed: {e}")
        return None

# Gemini LLM
llm = ChatGoogleGenerativeAI(
    model="gemini-2.5-flash",
    temperature=0.3,
    google_api_key=GEMINI_API_KEY
)

# Global conversation storage
conversations = {}

# Tool Functions for Agent
def classify_tool(query: str) -> str:
    """Analyzes ticket severity, impact, urgency, and type. Use when you need to understand ticket priority."""
    result = classify_ticket(query)
    return f"Impact: {result['impact']}, Urgency: {result['urgency']}, Type: {result['type']}"

def routing_tool(query: str) -> str:
    """Identifies which IT department should handle this issue. Use when you need to know responsible team."""
    dept = call_routing(query)
    return f"Department: {dept}"

def kb_tool(query: str) -> str:
    """Searches knowledge base for solutions. Returns answer with confidence score. Use when you need technical solutions."""
    result = query_kb(query)
    if result["answer"] and result["confidence"] > 0.5:
        return f"[KB Confidence: {result['confidence']}]\n{result['answer']}"
    return f"[KB Confidence: {result['confidence']}] No relevant solution found in knowledge base."

def escalation_tool(reason: str) -> str:
    """Creates escalation ticket for human agent. Use ONLY when KB confidence is below 0.6 AND issue is truly complex. Always try KB first!"""
    ticket_id = f"TKT-{datetime.now().strftime('%Y%m%d-%H%M%S')}"
    return f"ESCALATED: Ticket {ticket_id} created. Reason: {reason}. Human agent will respond in 2-4 hours."

# Define Tools
tools = [
    Tool(
        name="ClassifyTicket",
        func=classify_tool,
        description="Analyzes ticket to determine impact level, urgency, and type. Use this when you need to understand the severity or priority of an issue."
    ),
    Tool(
        name="RouteTicket",
        func=routing_tool,
        description="Determines which IT department should handle this ticket. Use this when you need to identify the responsible team."
    ),
    Tool(
        name="SearchKnowledgeBase",
        func=kb_tool,
        description="Searches internal knowledge base for solutions. Returns answer with confidence score (0-1). ALWAYS USE THIS FIRST before escalating. Use this when you need to find technical solutions or troubleshooting steps."
    ),
    Tool(
        name="EscalateToHuman",
        func=escalation_tool,
        description="Creates an escalation ticket for human agent review. CRITICAL: Use this ONLY as a LAST RESORT when: 1) KB confidence score is below 0.6 AND you've already tried KB, 2) Issue is extremely complex and unusual, 3) User explicitly confirms the KB solution failed after trying it. DO NOT escalate if KB has a reasonable solution (confidence > 0.6)."
    )
]

# IMPROVED Agent Prompt
AGENT_PROMPT = """You are an intelligent IT Helpdesk AI Agent. Your PRIMARY goal is to resolve tickets using the Knowledge Base. Escalation is a LAST RESORT.

AVAILABLE TOOLS:
{tools}

TOOL NAMES: {tool_names}

CRITICAL RULES:
1. **ALWAYS search Knowledge Base FIRST** - This is your primary tool for resolution
2. **Trust KB solutions with confidence >= 0.6** - These are reliable solutions, provide them to users
3. **ONLY escalate when ABSOLUTELY necessary**:
   - KB confidence is below 0.6 AND no solution found
   - Issue is extremely unusual or complex beyond KB scope
   - User explicitly tried your KB solution and reports it failed
4. **Be thorough with KB** - If first search doesn't work, try rephrasing the query
5. **Maintain context** - Remember conversation history for follow-ups

DECISION WORKFLOW:
NEW TICKET → Search KB → If confidence >= 0.6 → Provide solution → Mark RESOLVED
         ↓
   If confidence < 0.6 → Try rephrasing search → Still low? → Classify & Route → THEN escalate

FOLLOW-UP → Check if user tried solution → Worked? → Mark RESOLVED
                                      ↓
                              Failed? → Search KB again with different query → Still failing? → THEN escalate

IMPORTANT: 
- Don't mention tool names or confidence scores to users
- Provide clear, step-by-step instructions from KB
- Be conversational and helpful
- Escalation means you couldn't solve it - avoid this outcome!

FORMAT:
Question: the user's input
Thought: your reasoning about what to do next
Action: the tool to use (must be one of [{tool_names}])
Action Input: the input for that tool
Observation: the tool's output
... (repeat Thought/Action/Observation as needed)
Thought: I now have enough information to respond
Final Answer: your complete response to the user

Begin!

Question: {input}
Thought: {agent_scratchpad}"""

prompt = PromptTemplate.from_template(AGENT_PROMPT)

# Create Agent
agent = create_react_agent(llm=llm, tools=tools, prompt=prompt)
agent_executor = AgentExecutor(
    agent=agent,
    tools=tools,
    verbose=True,
    max_iterations=6,
    handle_parsing_errors="Check your output and make sure it conforms to the format instructions!",
    return_intermediate_steps=True,
    early_stopping_method="force"
)

# Main Processing Function
def process_with_agent(
    user_message: str, 
    conversation_id: str = None,
    user_email: str = None,
    callback=None
):
    """Process user message through autonomous AI agent."""
    
    if not conversation_id:
        conversation_id = f"conv_{datetime.now().strftime('%Y%m%d_%H%M%S')}_{hash(user_message) % 10000}"
    
    if conversation_id not in conversations:
        conversations[conversation_id] = {
            "messages": [],
            "ticket_info": {},
            "created_at": datetime.now().isoformat(),
            "user_email": user_email,
            "status": "open"
        }
    
    conv = conversations[conversation_id]
    
    conv["messages"].append({
        "role": "user",
        "content": user_message,
        "timestamp": datetime.now().isoformat()
    })
    
    if callback:
        callback({"type": "status", "message": "Agent is thinking..."})
    
    # Build context for follow-ups
    if len(conv["messages"]) > 1:
        context = f"CONVERSATION HISTORY:\n"
        for msg in conv["messages"][-6:-1]:
            context += f"{msg['role'].upper()}: {msg['content']}\n"
        context += f"\nCURRENT MESSAGE: {user_message}"
        agent_input = context
    else:
        agent_input = user_message
    
    try:
        result = agent_executor.invoke({"input": agent_input})
        
        agent_response = result.get("output", "I apologize, I encountered an error.")
        intermediate_steps = result.get("intermediate_steps", [])
        
        # IMPROVED: Check tool usage to determine status
        status = "in_progress"
        should_save = False
        escalated = False
        used_escalation_tool = False
        
        # First, check if EscalateToHuman tool was actually used
        for action, observation in intermediate_steps:
            if action.tool == "EscalateToHuman":
                used_escalation_tool = True
                print("🔍 Detected EscalateToHuman tool usage")
                break
        
        # Determine final status
        if used_escalation_tool:
            # Tool was used - definitely escalated
            status = "escalated"
            should_save = True
            escalated = True
            print("🔴 Ticket ESCALATED (tool used) - Saving to Firebase")
        elif "ESCALATED" in agent_response or "TKT-" in agent_response:
            # Fallback: Check response text
            status = "escalated"
            should_save = True
            escalated = True
            print("🔴 Ticket ESCALATED (text match) - Saving to Firebase")
        elif any(phrase in agent_response.lower() for phrase in [
            "resolved", "you're all set", "should work now", "problem solved", 
            "this should fix", "try these steps", "follow these steps"
        ]):
            # Resolution detected
            status = "resolved"
            should_save = True
            print("✅ Ticket RESOLVED - Saving to Firebase")
        else:
            # Still in progress
            print("⏳ Ticket IN PROGRESS - Not saving yet")
        
        # Extract ticket info from tools
        ticket_info = conv.get("ticket_info", {})
        kb_confidence = None
        escalation_reason = None
        
        for action, observation in intermediate_steps:
            if action.tool == "ClassifyTicket":
                parts = str(observation).split(", ")
                for part in parts:
                    if "Impact:" in part:
                        ticket_info["impact"] = part.split(": ")[1]
                    elif "Urgency:" in part:
                        ticket_info["urgency"] = part.split(": ")[1]
                    elif "Type:" in part:
                        ticket_info["type"] = part.split(": ")[1]
            
            elif action.tool == "RouteTicket":
                ticket_info["department"] = str(observation).replace("Department: ", "")
            
            elif action.tool == "SearchKnowledgeBase":
                # Extract confidence from KB response
                if "[KB Confidence:" in str(observation):
                    try:
                        conf_str = str(observation).split("[KB Confidence: ")[1].split("]")[0]
                        kb_confidence = float(conf_str)
                        ticket_info["kb_confidence"] = kb_confidence
                    except:
                        pass
            
            elif action.tool == "EscalateToHuman":
                # Capture escalation reason
                escalation_reason = action.tool_input
        
        conv["ticket_info"] = ticket_info
        conv["status"] = status
        
        # Build reasoning trace for debugging
        reasoning_trace = []
        for action, observation in intermediate_steps:
            reasoning_trace.append({
                "tool": action.tool,
                "input": action.tool_input,
                "output": str(observation)[:200]
            })
            
            if callback:
                callback({
                    "type": "tool_use",
                    "tool": action.tool,
                    "input": action.tool_input
                })
        
        conv["messages"].append({
            "role": "assistant",
            "content": agent_response,
            "timestamp": datetime.now().isoformat(),
            "reasoning": reasoning_trace
        })
        
        # Save to Firestore if resolved OR escalated
        firestore_id = None
        if should_save:
            print(f"💾 Preparing to save ticket - Status: {status}, Escalated: {escalated}")
            
            firestore_data = {
                "conversation_id": conversation_id,
                "status": status,
                "user_email": user_email or "anonymous",
                "ticket_info": ticket_info,
                "messages": conv["messages"],
                "resolution": agent_response,
                "created_at_iso": conv["created_at"],
                "escalated": escalated,
                "reasoning_trace": reasoning_trace
            }
            
            # Add escalation reason if escalated
            if escalated:
                if escalation_reason:
                    firestore_data["escalation_reason"] = escalation_reason
                elif kb_confidence is not None and kb_confidence < 0.6:
                    firestore_data["escalation_reason"] = f"Low KB confidence: {kb_confidence}"
                else:
                    firestore_data["escalation_reason"] = "Complex issue requiring human intervention"
                
                print(f"🔼 Saving escalated ticket - Reason: {firestore_data['escalation_reason']}")
            
            firestore_id = save_ticket_to_firestore(firestore_data)
            
            if firestore_id:
                print(f"✅ Successfully saved to Firestore with ID: {firestore_id}")
            else:
                print("❌ Failed to save to Firestore")
            
            if callback:
                callback({
                    "type": "saved",
                    "firestore_id": firestore_id,
                    "status": status
                })
        else:
            print(f"⏭️  Not saving - Status: {status}, Should save: {should_save}")
        
        return {
            "conversation_id": conversation_id,
            "response": agent_response,
            "status": status,
            "message_count": len(conv["messages"]),
            "reasoning_trace": reasoning_trace,
            "ticket_info": ticket_info,
            "firestore_id": firestore_id,
            "escalated": escalated
        }
        
    except Exception as e:
        print(f"❌ Agent error: {e}")
        import traceback
        traceback.print_exc()
        
        error_response = "I apologize, I encountered an error. Please try again or I can escalate this to a human agent."
        conv["messages"].append({
            "role": "assistant",
            "content": error_response,
            "timestamp": datetime.now().isoformat()
        })
        
        if callback:
            callback({"type": "error", "message": str(e)})
        
        return {
            "conversation_id": conversation_id,
            "response": error_response,
            "status": "error",
            "error": str(e)
        }

def get_conversation_history(conversation_id: str):
    """Get conversation history."""
    return conversations.get(conversation_id)