Spaces:

karim323
/

nlp-analysis-api

Running

File size: 3,918 Bytes

e4eb82b

"""
Pydantic models for request and response validation
"""
from pydantic import BaseModel, Field, validator
from typing import Optional, List


class TextInput(BaseModel):
    """Input model for text-based operations"""
    text: str = Field(
        ..., 
        min_length=1, 
        max_length=5000,
        description="The text to process (max 5000 characters)"
    )
    
    @validator('text')
    def validate_text(cls, v):
        """Validate and sanitize text input"""
        # Strip whitespace
        v = v.strip()
        
        # Check if empty after stripping
        if not v:
            raise ValueError("Text cannot be empty or only whitespace")
            
        return v


class BatchTextInput(BaseModel):
    """Input model for batch text processing"""
    texts: List[str] = Field(
        ..., 
        min_items=1, 
        max_items=100,
        description="List of texts to process (max 100 items)"
    )
    
    @validator('texts')
    def validate_texts(cls, v):
        """Validate each text in the batch"""
        for text in v:
            if not text or not text.strip():
                raise ValueError("All texts must be non-empty")
            if len(text) > 5000:
                raise ValueError("Each text must be under 5000 characters")
        return v


class TranslationInput(BaseModel):
    """Input model for translation"""
    text: str = Field(
        ..., 
        min_length=1, 
        max_length=3000,
        description="The text to translate (max 3000 characters)"
    )
    source_lang: str = Field(
        default="en", 
        min_length=2, 
        max_length=5,
        description="Source language code (e.g., 'en', 'es', 'fr')"
    )
    target_lang: str = Field(
        default="ar", 
        min_length=2, 
        max_length=5,
        description="Target language code (e.g., 'en', 'es', 'fr')"
    )
    
    @validator('text')
    def validate_text(cls, v):
        """Validate and sanitize translation text"""
        v = v.strip()
        if not v:
            raise ValueError("Text cannot be empty")
        return v


class SentimentResponse(BaseModel):
    """Response model for sentiment analysis"""
    sentiment: str = Field(..., description="The detected sentiment (Positive/Negative/Neutral)")
    confidence: float = Field(..., ge=0.0, le=1.0, description="Confidence score")
    all_scores: Optional[List[dict]] = Field(default=None, description="All sentiment scores")


class TranslationResponse(BaseModel):
    """Response model for translation"""
    translated_text: str = Field(..., description="The translated text")


class Entity(BaseModel):
    """Model for a named entity"""
    text: str = Field(..., description="The entity text")
    label: str = Field(..., description="The entity label/type")
    score: float = Field(..., ge=0.0, le=1.0, description="Confidence score")


class NERResponse(BaseModel):
    """Response model for Named Entity Recognition"""
    entities: List[Entity] = Field(..., description="List of detected entities")
    text: str = Field(..., description="The original text")


class BatchSentimentResult(BaseModel):
    """Result for a single text in batch analysis"""
    text: str = Field(..., description="The analyzed text")
    sentiment: str = Field(..., description="The detected sentiment")
    confidence: float = Field(..., ge=0.0, le=1.0, description="Confidence score")


class BatchSentimentResponse(BaseModel):
    """Response model for batch sentiment analysis"""
    results: List[BatchSentimentResult] = Field(..., description="Results for each text")

class ParaphraseResponse(BaseModel):
    """Response model for paraphrasing"""
    paraphrased_text: str = Field(..., description="The paraphrased text")

class SummarizationResponse(BaseModel):
    """Response model for text summarization"""
    summary_text: str = Field(..., description="The summarized text")