File size: 5,613 Bytes
2380f6f
 
 
 
 
 
a453c29
2380f6f
 
870d2ba
2380f6f
 
 
a453c29
 
 
 
7218dd0
2380f6f
 
a453c29
2380f6f
 
 
ce133a0
e2251fd
 
870d2ba
ce133a0
 
 
870d2ba
2380f6f
 
 
a453c29
2380f6f
 
 
 
 
 
 
 
 
 
870d2ba
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2380f6f
 
 
 
a453c29
2380f6f
 
 
 
 
a453c29
2380f6f
 
 
 
 
 
 
 
 
 
 
a453c29
 
 
 
 
 
 
 
 
 
2380f6f
 
 
 
 
 
 
 
 
a453c29
2380f6f
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
"""Service for topic extraction from text using LangChain Groq"""

import logging
from typing import Optional, List
from langchain_core.messages import HumanMessage, SystemMessage
from langchain_groq import ChatGroq
from pydantic import BaseModel, Field
from langsmith import traceable

from config import GROQ_API_KEY, GROQ_TOPIC_MODEL

logger = logging.getLogger(__name__)


class TopicOutput(BaseModel):
    """Pydantic schema for topic extraction output"""
    # Required field (Field(...) = no default): the single-sentence topic
    # the LLM must return; structured output is bound to this schema in
    # TopicService.initialize().
    topic: str = Field(..., description="A specific, detailed topic description")

class TopicService:
    """Service for extracting topics from text arguments.

    Wraps a LangChain ``ChatGroq`` model bound to the ``TopicOutput``
    structured-output schema. Initialization is lazy: the LLM is only
    constructed on the first call to :meth:`extract_topic` (or an explicit
    :meth:`initialize`), trying the configured model first and then a list
    of fallback models.
    """

    def __init__(self):
        # LLM handle; created lazily in initialize(), None until then.
        self.llm = None
        # Use valid Groq model - defaults from config, fallback to stable model
        self.model_name = GROQ_TOPIC_MODEL if GROQ_TOPIC_MODEL else "llama3-70b-8192"
        # Fallback models to try if primary fails (using current/available Groq models)
        self.fallback_models = [
            "llama3-70b-8192",  # Stable production model (same as chat)
            "llama-3.1-8b-instant",  # Faster, smaller alternative
            "openai/gpt-oss-20b"  # Alternative OpenAI OSS model
        ]
        self.initialized = False

    def initialize(self, model_name: Optional[str] = None):
        """Initialize the Groq LLM with structured output.

        Args:
            model_name: Optional override for the configured model name.
                Tried first, before the fallback list.

        Raises:
            ValueError: If GROQ_API_KEY is missing from the environment.
            RuntimeError: If neither the primary model nor any fallback
                could be constructed (last underlying error is chained).
        """
        if self.initialized:
            logger.info("Topic service already initialized")
            return

        if not GROQ_API_KEY:
            raise ValueError("GROQ_API_KEY not found in environment variables")

        if model_name:
            self.model_name = model_name

        # Try primary model first, then fallbacks (deduplicated against primary).
        models_to_try = [self.model_name] + [
            m for m in self.fallback_models if m != self.model_name
        ]

        last_error: Optional[Exception] = None
        for model_to_try in models_to_try:
            try:
                # Lazy %s args: formatting deferred until the record is emitted.
                logger.info("Initializing topic extraction service with model: %s", model_to_try)

                llm = ChatGroq(
                    model=model_to_try,
                    api_key=GROQ_API_KEY,
                    temperature=0.0,  # deterministic extraction
                    max_tokens=512,
                )

                # Bind structured output directly to the model
                self.llm = llm.with_structured_output(TopicOutput)
                self.model_name = model_to_try  # Update to successful model
                self.initialized = True

                logger.info("✓ Topic extraction service initialized successfully with model: %s", model_to_try)
                return

            except Exception as e:
                last_error = e
                logger.warning("Failed to initialize with model %s: %s", model_to_try, e)
                continue

        # All models failed: surface the last underlying error, chained as the
        # cause so the original traceback is preserved for debugging.
        logger.error("Error initializing topic service with all models: %s", last_error)
        raise RuntimeError(
            f"Failed to initialize topic service with any model. Last error: {str(last_error)}"
        ) from last_error

    @traceable(name="extract_topic")
    def extract_topic(self, text: str) -> str:
        """
        Extract a topic from the given text/argument

        Args:
            text: The input text/argument to extract topic from

        Returns:
            The extracted topic string

        Raises:
            ValueError: If ``text`` is not a non-empty string.
            RuntimeError: If the LLM call fails (cause chained).
        """
        if not self.initialized:
            self.initialize()

        if not text or not isinstance(text, str):
            raise ValueError("Text must be a non-empty string")

        text = text.strip()
        if not text:  # whitespace-only input
            raise ValueError("Text cannot be empty")

        system_message = """You are an information extraction model.
Extract a topic from the user text. The topic should be a single sentence that captures the main idea of the text in simple english.

Examples:
- Text: "Governments should subsidize electric cars to encourage adoption."
  Output: topic="government subsidies for electric vehicle adoption"

- Text: "Raising the minimum wage will hurt small businesses and cost jobs."
  Output: topic="raising the minimum wage and its economic impact on small businesses"
"""

        try:
            result = self.llm.invoke(
                [
                    SystemMessage(content=system_message),
                    HumanMessage(content=text),
                ]
            )

            # result is a TopicOutput instance (structured output binding).
            return result.topic

        except Exception as e:
            logger.error("Error extracting topic: %s", e)
            raise RuntimeError(f"Topic extraction failed: {str(e)}") from e

    def batch_extract_topics(self, texts: List[str]) -> List[Optional[str]]:
        """
        Extract topics from multiple texts

        Failures are per-item: a text whose extraction raises yields ``None``
        in the corresponding output slot instead of aborting the batch
        (hence the ``Optional[str]`` elements).

        Args:
            texts: List of input texts/arguments

        Returns:
            List of extracted topics, with ``None`` for failed items.

        Raises:
            ValueError: If ``texts`` is not a non-empty list.
        """
        if not self.initialized:
            self.initialize()

        if not texts or not isinstance(texts, list):
            raise ValueError("Texts must be a non-empty list")

        results: List[Optional[str]] = []
        for text in texts:
            try:
                topic = self.extract_topic(text)
                results.append(topic)
            except Exception as e:
                logger.error("Error extracting topic for text '%s...': %s", text[:50], e)
                results.append(None)  # Or raise, depending on desired behavior

        return results


# Module-level singleton shared by all importers. Constructing it is cheap
# and side-effect free: the Groq LLM is only created lazily on first use
# (initialize() / extract_topic()), so importing this module does no I/O.
topic_service = TopicService()