"""
Simplified data models for bias evaluation framework without external dependencies.

This module defines the data structures used throughout the evaluation system
using only standard library components.

AI BRIDGE Compliance: Implements bias constructs from the AI BRIDGE guidelines
including stereotype, counter-stereotype, derogation, and neutral classifications.
"""
from enum import Enum
from typing import List, Dict, Any, Optional
from dataclasses import dataclass, field


class BiasCategory(str, Enum):
    """
    Bias categories used for classification (the detection mechanism).

    Members also subclass ``str``, so each one compares equal to its raw
    string value (``BiasCategory.NONE == "none"``).
    """
    # Declaration order is the iteration order of the enum; new members
    # should be appended rather than inserted.
    OCCUPATION = "occupation"
    PRONOUN_ASSUMPTION = "pronoun_assumption"
    PRONOUN_GENERIC = "pronoun_generic"
    HONORIFIC = "honorific"
    MORPHOLOGY = "morphology"
    NONE = "none"
    STEREOTYPE = "stereotype"


class BiasLabel(str, Enum):
    """
    AI BRIDGE bias label classification.

    Defines the type of representational bias present in text:
    - stereotype: Reinforces common, often oversimplified beliefs about a group
    - counter-stereotype: Challenges or contradicts common stereotypes
    - derogation: Language that demeans or disparages a group
    - neutral: No bias or stereotype present

    The canonical value of ``COUNTER_STEREOTYPE`` is hyphenated
    (``"counter-stereotype"``). Lookup by value is tolerant: underscores are
    treated as hyphens, and casing and surrounding whitespace are ignored, so
    ``BiasLabel("counter_stereotype")`` resolves to ``COUNTER_STEREOTYPE``.
    Values that match no member still raise ``ValueError``.
    """
    STEREOTYPE = "stereotype"
    COUNTER_STEREOTYPE = "counter-stereotype"
    DEROGATION = "derogation"
    NEUTRAL = "neutral"

    @classmethod
    def _missing_(cls, value: object) -> Optional["BiasLabel"]:
        """
        Resolve a value that did not match any member exactly.

        Called by the enum machinery only after the exact-value lookup has
        failed. Returning ``None`` makes the lookup raise ``ValueError``.
        """
        if not isinstance(value, str):
            return None
        # Every other multi-word value in this module uses underscores, so
        # the underscore spelling is mapped onto the hyphenated canonical form.
        normalized = value.strip().lower().replace("_", "-")
        for member in cls:
            if member.value == normalized:
                return member
        return None


class StereotypeCategory(str, Enum):
    """
    AI BRIDGE stereotype category classification.

    Each member names a thematic area in which gender stereotypes commonly
    manifest. Members also subclass ``str`` and compare equal to their raw
    string values.
    """
    PROFESSION = "profession"
    FAMILY_ROLE = "family_role"
    LEADERSHIP = "leadership"
    EDUCATION = "education"
    RELIGION_CULTURE = "religion_culture"
    PROVERB_IDIOM = "proverb_idiom"
    DAILY_LIFE = "daily_life"
    APPEARANCE = "appearance"
    CAPABILITY = "capability"
    NONE = "none"


class TargetGender(str, Enum):
    """
    AI BRIDGE target gender classification.

    Identifies who the text talks about, references, or implies. Members
    also subclass ``str`` and compare equal to their raw string values.
    """
    FEMALE = "female"
    MALE = "male"
    NEUTRAL = "neutral"
    MIXED = "mixed"
    NONBINARY = "nonbinary"
    UNKNOWN = "unknown"


class Explicitness(str, Enum):
    """
    AI BRIDGE explicitness classification.

    Distinguishes bias that is stated directly (``EXPLICIT``) from bias that
    is only implied through context (``IMPLICIT``).
    """
    EXPLICIT = "explicit"
    IMPLICIT = "implicit"


class Sentiment(str, Enum):
    """
    Emotional tone expressed toward the gendered referent.

    Members also subclass ``str`` and compare equal to their raw string
    values.
    """
    POSITIVE = "positive"
    NEUTRAL = "neutral"
    NEGATIVE = "negative"


class SafetyFlag(str, Enum):
    """
    Content safety classification.

    Members also subclass ``str`` and compare equal to their raw string
    values.
    """
    SAFE = "safe"
    SENSITIVE = "sensitive"
    REJECT = "reject"


class QAStatus(str, Enum):
    """
    Quality assurance status of an annotation.

    Members also subclass ``str`` and compare equal to their raw string
    values.
    """
    GOLD = "gold"
    PASSED = "passed"
    NEEDS_REVIEW = "needs_review"
    REJECTED = "rejected"


class Language(str, Enum):
    """
    Languages supported for bias detection.

    Each member's value is a two-letter language code. Members also subclass
    ``str`` and compare equal to that code.
    """
    ENGLISH = "en"
    SWAHILI = "sw"
    FRENCH = "fr"
    GIKUYU = "ki"


@dataclass
class GroundTruthSample:
    """
    One ground-truth test case used for evaluation.

    Accepts the legacy 4-field format as well as the full AI BRIDGE 29-field
    format. Only ``text``, ``has_bias``, ``bias_category`` and
    ``expected_correction`` are required; every other field defaults to
    ``None`` so that legacy samples can still be constructed.

    No validation is performed on construction; the ranges noted in the
    field comments are documentation only.
    """
    # --- Required core fields (legacy format) ---
    text: str
    has_bias: bool
    bias_category: BiasCategory
    expected_correction: str

    # --- AI BRIDGE extended fields (optional, for backward compatibility) ---
    id: Optional[str] = None
    language: Optional[str] = None
    script: Optional[str] = None
    country: Optional[str] = None
    region_dialect: Optional[str] = None
    source_type: Optional[str] = None
    source_ref: Optional[str] = None
    collection_date: Optional[str] = None
    translation: Optional[str] = None
    domain: Optional[str] = None
    topic: Optional[str] = None
    theme: Optional[str] = None
    sensitive_characteristic: Optional[str] = None

    # --- AI BRIDGE bias annotation fields ---
    target_gender: Optional[TargetGender] = None
    bias_label: Optional[BiasLabel] = None
    stereotype_category: Optional[StereotypeCategory] = None
    explicitness: Optional[Explicitness] = None
    bias_severity: Optional[int] = None  # expected on a 1-3 scale
    sentiment_toward_referent: Optional[Sentiment] = None
    device: Optional[str] = None  # e.g. metaphor, proverb, sarcasm

    # --- Quality and safety fields ---
    safety_flag: Optional[SafetyFlag] = None
    pii_removed: Optional[bool] = None
    annotator_id: Optional[str] = None
    qa_status: Optional[QAStatus] = None
    approver_id: Optional[str] = None
    cohen_kappa: Optional[float] = None
    notes: Optional[str] = None
    eval_split: Optional[str] = None  # one of: train, validation, test


@dataclass
class BiasDetectionResult:
    """
    Outcome of running bias detection on one text sample.

    ``text``, ``has_bias_detected`` and ``detected_edits`` are required. The
    AI BRIDGE extended fields are optional and default to ``None``.
    """
    # --- Required detection output ---
    text: str
    has_bias_detected: bool
    detected_edits: List[Dict[str, str]]  # one string-to-string mapping per edit

    # --- AI BRIDGE extended detection results (optional) ---
    bias_label: Optional[BiasLabel] = None
    stereotype_category: Optional[StereotypeCategory] = None
    target_gender: Optional[TargetGender] = None
    explicitness: Optional[Explicitness] = None
    confidence: Optional[float] = None


@dataclass
class EvaluationMetrics:
    """
    Performance metrics for bias detection.

    A plain value holder: it stores the three scores and the four
    prediction-outcome counts it is given, and neither computes nor
    validates them.
    """
    # --- Scores ---
    precision: float
    recall: float
    f1_score: float

    # --- Prediction outcome counts ---
    true_positives: int
    false_positives: int
    false_negatives: int
    true_negatives: int


@dataclass
class LanguageEvaluationResult:
    """
    Full set of evaluation results for one language.

    Bundles the language, its overall metrics, a per-category metrics
    mapping and the sample count. All four fields are required.
    """
    language: Language
    overall_metrics: EvaluationMetrics
    # Metrics broken down by bias category, keyed by BiasCategory member.
    category_metrics: Dict[BiasCategory, EvaluationMetrics]
    total_samples: int


@dataclass
class FailureCase:
    """
    Record describing one failed prediction.

    All fields are required; the class stores them as given and performs no
    validation.
    """
    failure_type: str
    input_text: str
    # Expected vs. predicted outcome for the sample.
    # NOTE(review): presumably the has-bias flags — confirm with the caller.
    expected: bool
    predicted: bool
    category: BiasCategory
    diagnosis: str
    language: Language