"""
reasoning.py

The ReasoningCompiler per Section 7 of the architecture document.

Generates deterministic, fact-grounded reasoning text for each ranked candidate.

Pre-write audits:
  1. Numeric Regex Audit: every number mentioned must exist in the candidate's JSON
  2. N-Gram Collision: difflib.SequenceMatcher to guarantee structural variation

Tone controlled by score percentile in the local score distribution.
No network calls. No LLM. Pure template + fact extraction.
"""

from __future__ import annotations

import difflib
import hashlib
import json
import math
import re
from typing import Any, Dict, List, Optional, Tuple

from features import FEATURE_COLUMNS



# Alternative phrasings for the "low credibility" concern.
# `_select_low_cred_variant` indexes into this list with a hash of the
# candidate id, so the ORDER and LENGTH of the list determine which phrasing a
# given candidate receives — appending or reordering entries changes outputs.
_LOW_CRED_VARIANTS: List[str] = [
    "high ratio of unverified advanced skill claims vs assessed scores",
    "advanced-level skills listed without corroborating platform assessment data",
    "claimed proficiency levels outpace platform-verified evidence on file",
    "self-reported expert-level skills exceed available assessment validation",
    "skill credibility gap: multiple advanced claims lack supporting assessment scores",
]


def _select_low_cred_variant(candidate_id: str) -> str:
    """Pick the low_credibility phrasing assigned to ``candidate_id``.

    The choice is derived from the leading 8 hex characters of the MD5 digest
    of the UTF-8 encoded id, reduced modulo the number of variants. Because
    MD5 is not affected by Python's per-process hash randomisation, the same
    id yields the same variant on every run and on every machine.
    """
    id_bytes = candidate_id.encode("utf-8", errors="ignore")
    hex_prefix = hashlib.md5(id_bytes).hexdigest()[:8]
    slot = int(hex_prefix, 16) % len(_LOW_CRED_VARIANTS)
    return _LOW_CRED_VARIANTS[slot]



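# Tone bands, expressed as rank from the TOP of the local score distribution:
# top 10% = strong, 10-40% = positive, 40-70% = neutral,
# 70-90% = cautious, bottom 10% (90-100%) = weak.
# Equivalently, in percentile terms (0 = worst, 1 = best): >= 0.90 strong,
# >= 0.60 positive, >= 0.30 neutral, >= 0.10 cautious, otherwise weak.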


# (minimum percentile, tone label) pairs, listed from the highest floor to the
# lowest. `_get_tone` scans them in this order and returns the label of the
# first pair whose floor is <= the percentile, so the descending order matters.
_TONE_THRESHOLDS = [
    (0.90, "strong"),
    (0.60, "positive"),
    (0.30, "neutral"),
    (0.10, "cautious"),
    (0.00, "weak"),
]


def _get_tone(percentile: float) -> str:
    """
    Map a score percentile (0 = worst, 1 = best) to its tone label.

    The thresholds table is scanned top-down and the first band whose floor
    the percentile reaches wins. Anything that reaches no band at all (for
    example a negative or NaN percentile) is labelled "weak".
    """
    reached = (label for floor, label in _TONE_THRESHOLDS if percentile >= floor)
    return next(reached, "weak")


# Opening phrases grouped by tone label; the keys are the same labels that
# `_TONE_THRESHOLDS` / `_get_tone` produce. `ReasoningCompiler.__init__` seeds
# one rotation counter per key of this dict.
# NOTE(review): in the code visible in this file, `ReasoningCompiler.compile`
# never reads these phrases — confirm whether they are still meant to be used.
_OPENING_BY_TONE = {
    "strong": [
        "Highly competitive profile with direct production experience in",
        "Outstanding match: verified depth in",
        "Top-tier candidate demonstrating hands-on expertise in",
    ],
    "positive": [
        "Strong candidate showing relevant experience in",
        "Well-qualified profile with demonstrated skills in",
        "Solid match with measurable background in",
    ],
    "neutral": [
        "Candidate presents relevant background in",
        "Profile shows applicable experience touching",
        "Partial alignment with job requirements, including",
    ],
    "cautious": [
        "Limited but present signal in",
        "Early-stage profile with some relevant exposure to",
        "Candidate shows initial familiarity with",
    ],
    "weak": [
        "Minimal alignment with target requirements;",
        "Profile does not strongly match the core JD criteria;",
        "Significant gaps identified relative to the job requirements;",
    ],
}


def _extract_candidate_numbers(candidate: dict) -> set:
    """
    Collect every numeric token that appears in the candidate's JSON.

    The candidate is serialised with ``json.dumps`` and scanned with the same
    number pattern the numeric audit applies to generated text, so numbers
    nested at any depth — including digits embedded in string values — are
    picked up.

    In addition to each literal token, a token whose fractional part is all
    zeros (e.g. ``"30.0"``) also contributes its integer spelling (``"30"``).
    The reasoning templates print whole-valued floats as integers, and without
    this the audit would reject a number that genuinely comes from the data.

    Args:
        candidate: JSON-serialisable candidate record.

    Returns:
        Set of number strings (e.g. ``{"30.0", "30", "4.5"}``).

    Raises:
        TypeError: if ``candidate`` contains values ``json.dumps`` cannot
            serialise.
    """
    numbers: set = set()
    raw_json = json.dumps(candidate)
    for match in re.finditer(r'\b(\d+(?:\.\d+)?)\b', raw_json):
        token = match.group(1)
        numbers.add(token)
        whole, dot, fraction = token.partition(".")
        # "30.0" / "30.00" -> also allow "30"; "4.5" contributes nothing extra.
        if dot and not fraction.strip("0"):
            numbers.add(str(int(whole)))
    return numbers


def _numeric_regex_audit(text: str, candidate_numbers: set) -> Tuple[bool, List[str]]:
    """
    Numeric Regex Audit (Section 7).
    Asserts every number in the generated text exists in the candidate's JSON.

    Violations are reported once each, in the order they first appear in
    ``text``. (Collecting them through a ``set`` would make the order depend
    on string hash randomisation and therefore differ between interpreter
    runs, which is at odds with this module's determinism guarantee.)

    Args:
        text: Generated reasoning text to check.
        candidate_numbers: Number strings allowed to appear, as produced by
            ``_extract_candidate_numbers``.

    Returns:
        (passed: bool, violations: List[str])
    """
    # dict.fromkeys de-duplicates while keeping first-seen order.
    text_numbers = dict.fromkeys(re.findall(r'\b(\d+(?:\.\d+)?)\b', text))
    violations = [n for n in text_numbers if n not in candidate_numbers]
    return not violations, violations


def _ngram_collision_check(
    new_text: str,
    existing_texts: List[str],
    threshold: float = 0.65,
) -> Tuple[bool, float]:
    """
    N-Gram Collision Check (Section 7).

    Compares ``new_text`` against each previously generated text using
    ``difflib.SequenceMatcher(...).ratio()`` and keeps the highest ratio.

    Returns:
        ``(passes, max_similarity)`` where ``passes`` is True only when the
        highest ratio is strictly below ``threshold``. With no prior texts
        the check passes with a similarity of 0.0.
    """
    if not existing_texts:
        return True, 0.0

    ratios = [
        difflib.SequenceMatcher(None, new_text, prior).ratio()
        for prior in existing_texts
    ]
    peak = max(0.0, *ratios)
    return peak < threshold, peak


def _get_hard_req_matches(candidate: dict, jd_config) -> List[str]:
    """
    Extract which hard requirements the candidate actually covers.

    A requirement counts as covered when any of its aliases either equals one
    of the candidate's skill names exactly, or occurs as a substring of the
    concatenated career-history descriptions. Both sides of the comparison are
    lowercased (aliases are normalised the same way
    ``_build_jd_relevant_names`` normalises them); blank aliases are ignored
    because an empty string is a substring of every text.

    Missing or ``None`` values for ``skills``, ``career_history``, a skill's
    ``name`` or an entry's ``description`` are treated as empty.

    Args:
        candidate: Candidate record.
        jd_config: Object exposing ``hard_requirements`` as a mapping of
            canonical requirement name -> iterable of alias strings.

    Returns:
        Canonical requirement names that matched, in the iteration order of
        ``jd_config.hard_requirements``.
    """
    skill_names = {
        (skill.get("name") or "").lower().strip()
        for skill in candidate.get("skills") or []
    }
    career_text = " ".join(
        (entry.get("description") or "").lower()
        for entry in candidate.get("career_history") or []
    )

    matched = []
    for canonical_name, aliases in jd_config.hard_requirements.items():
        normalised = [a.lower().strip() for a in aliases if a and a.strip()]
        if any(a in skill_names or a in career_text for a in normalised):
            matched.append(canonical_name)
    return matched


# Memoised JD-relevant name sets, keyed by id(jd_config). An entry is removed
# when its config object is garbage-collected (see _build_jd_relevant_names),
# so a later object that happens to reuse the same id cannot read stale data.
_JD_RELEVANT_CACHE: Dict[int, frozenset] = {}


def _build_jd_relevant_names(jd_config) -> frozenset:
    """Return (and cache) the frozenset of lowercase JD-relevant skill names.

    The set is the union of ``jd_config.get_all_query_terms()`` and every
    alias in ``jd_config.hard_requirements``, each lowercased and stripped.

    Results are memoised per config *instance* (by ``id``). Because CPython
    may hand a freed object's id to a new object, a finalizer is registered
    that drops the cache entry when the config is collected. Configs that do
    not support weak references simply keep their entry for the life of the
    process, as before.

    The cached set is not refreshed if ``jd_config`` is mutated after the
    first call.
    """
    import weakref

    key = id(jd_config)
    cached = _JD_RELEVANT_CACHE.get(key)
    if cached is not None:
        return cached

    names = {term.lower().strip() for term in jd_config.get_all_query_terms()}
    for aliases in jd_config.hard_requirements.values():
        names.update(alias.lower().strip() for alias in aliases)

    result = frozenset(names)
    _JD_RELEVANT_CACHE[key] = result
    try:
        finalizer = weakref.finalize(jd_config, _JD_RELEVANT_CACHE.pop, key, None)
    except TypeError:
        # Object cannot be weakly referenced; fall back to an un-evicted entry.
        pass
    else:
        # Nothing to clean up at interpreter shutdown.
        finalizer.atexit = False
    return result


def _get_top_skills(candidate: dict, n: int = 3, jd_config=None) -> List[str]:
    """Get top N skill names, JD-relevant first then by tenure.

    Skills without a name are discarded *before* ranking, so they can never
    occupy one of the ``n`` slots (previously they were dropped after slicing,
    which could return fewer than ``n`` names even when more named skills were
    available).

    When ``jd_config`` is supplied and yields a non-empty relevance set:
      Pass 1 — JD-relevant skills sorted by duration_months DESC.
      Pass 2 — non-relevant skills by duration_months DESC (backfill only).

    The relevance set comes from ``_build_jd_relevant_names``, which memoises
    it per jd_config instance. Otherwise the ranking is by tenure alone.
    A missing/None ``duration_months`` counts as 0; ties keep the candidate's
    original listing order.

    Args:
        candidate: Candidate record; ``skills`` may be missing or None.
        n: Maximum number of names to return; values <= 0 return ``[]``.
        jd_config: Optional parsed JD configuration.

    Returns:
        Up to ``n`` skill names.
    """
    named = [s for s in candidate.get("skills") or [] if s.get("name")]
    if not named or n <= 0:
        return []

    def tenure(skill: dict):
        return skill.get("duration_months") or 0

    # sorted() is stable, so equal tenures keep their listing order.
    ranked = sorted(named, key=tenure, reverse=True)

    if jd_config is not None:
        relevant_names = _build_jd_relevant_names(jd_config)
        if relevant_names:
            relevant = [s for s in ranked if s["name"].lower().strip() in relevant_names]
            others = [s for s in ranked if s["name"].lower().strip() not in relevant_names]
            ranked = relevant + others

    return [s["name"] for s in ranked[:n]]



# Skill category -> phrase template used when a candidate matches exactly ONE
# category. Each key is a frozenset of lowercase skill names forming the
# category; `{matched}` is filled by `get_specific_jd_match` with the
# candidate's own spelling of the matching skill.
# Categories are evaluated in the order written here. Note that
# "sentence transformers" belongs to two categories (embeddings and
# transformers); `get_specific_jd_match` lets a skill satisfy only one.
SKILL_JD_PHRASES = {
    frozenset(["faiss", "milvus", "qdrant", "weaviate", "pinecone", "opensearch", "elasticsearch", "chroma"]): 
        "production vector search infrastructure ({matched})",
    frozenset(["sentence transformers", "embeddings", "bge", "e5", "text embeddings", "dense retrieval"]): 
        "embedding model depth for semantic search ({matched})",
    frozenset(["bm25", "information retrieval", "tf-idf", "tfidf", "lucene", "sparse retrieval"]): 
        "information retrieval foundation the JD centers on ({matched})",
    frozenset(["fine-tuning llms", "lora", "qlora", "peft", "instruction tuning"]): 
        "LLM fine-tuning experience (preferred by JD) ({matched})",
    frozenset(["hugging face transformers", "transformers", "sentence transformers"]): 
        "transformer model infrastructure ({matched})",
    frozenset(["recommendation systems", "recommender systems", "collaborative filtering"]): 
        "recommendation system background applicable to the role ({matched})",
    frozenset(["mlops", "kubeflow", "weights & biases", "mlflow"]): 
        "ML production operations experience ({matched})",
}

# Skill category -> short phrase (no placeholder) used when a candidate matches
# TWO OR MORE categories and the phrases are joined into one sentence.
# `get_specific_jd_match` looks entries up with keys taken from
# SKILL_JD_PHRASES, so the key sets here must stay identical to the ones there
# or the lookup raises KeyError.
SKILL_COMBINED_PHRASES = {
    frozenset(["faiss", "milvus", "qdrant", "weaviate", "pinecone", "opensearch", "elasticsearch", "chroma"]): 
        "production vector search infrastructure",
    frozenset(["sentence transformers", "embeddings", "bge", "e5", "text embeddings", "dense retrieval"]): 
        "embedding model depth for semantic search",
    frozenset(["bm25", "information retrieval", "tf-idf", "tfidf", "lucene", "sparse retrieval"]): 
        "classical IR foundation",
    frozenset(["fine-tuning llms", "lora", "qlora", "peft", "instruction tuning"]): 
        "LLM fine-tuning experience",
    frozenset(["hugging face transformers", "transformers", "sentence transformers"]): 
        "transformer model infrastructure",
    frozenset(["recommendation systems", "recommender systems", "collaborative filtering"]): 
        "recommendation system background",
    frozenset(["mlops", "kubeflow", "weights & biases", "mlflow"]): 
        "ML production operations experience",
}

def get_specific_jd_match(candidate: dict, jd_config=None) -> str:
    """Describe how the candidate's listed skills line up with the JD.

    Each category in ``SKILL_JD_PHRASES`` is checked in declaration order. For
    a category, the first of the candidate's skills (in the order the
    candidate lists them) that belongs to it and has not already been claimed
    by an earlier category is taken as the match. Choosing by the candidate's
    order — rather than by iterating the category frozenset — keeps the
    result identical across interpreter runs regardless of string hash
    randomisation.

    Returns:
        * no category matched: ``"covers N% of JD hard requirements"``, with N
          computed by ``jd_parser.hard_req_coverage_score``;
        * one category matched: that category's ``SKILL_JD_PHRASES`` template
          with ``{matched}`` set to the candidate's spelling of the skill;
        * several matched: ``"<skill> + <skill> combination — <phrases>"``
          built from ``SKILL_COMBINED_PHRASES``.

    NOTE(review): the percentage in the fallback text is derived, not copied
    from the candidate record, so a caller that strips numbers absent from the
    candidate JSON may remove it — confirm the intended handling.
    """
    # normalised name -> candidate's own spelling, in listing order
    candidate_skills: Dict[str, str] = {}
    for skill in candidate.get("skills", []) or []:
        name = skill.get("name")
        if name:
            candidate_skills[name.lower().strip()] = name

    matched_categories = []
    matched_skills = []
    used_skills = set()

    for category in SKILL_JD_PHRASES:
        for key, display_name in candidate_skills.items():
            if key in category and key not in used_skills:
                used_skills.add(key)
                matched_categories.append(category)
                matched_skills.append(display_name)
                break

    if not matched_categories:
        from jd_parser import hard_req_coverage_score
        coverage = hard_req_coverage_score(candidate, jd_config)
        hard_req_coverage_pct = coverage * 100
        return f"covers {hard_req_coverage_pct:.0f}% of JD hard requirements"

    if len(matched_categories) == 1:
        return SKILL_JD_PHRASES[matched_categories[0]].format(matched=matched_skills[0])

    skills_str = " + ".join(matched_skills)
    phrases = [SKILL_COMBINED_PHRASES[cat] for cat in matched_categories]
    if len(phrases) == 2:
        phrases_str = f"{phrases[0]} alongside {phrases[1]}"
    else:
        phrases_str = ", ".join(phrases[:-1]) + f" alongside {phrases[-1]}"
    return f"{skills_str} combination — {phrases_str}"

def _get_severity_ranked_concern(
    feature_vector: Dict[str, float],
    candidate: dict,
) -> Optional[str]:
    """
    Priority concern selection logic.
    Evaluates in a strict order and returns the first matching concern.

    Order of checks:
      1. notice period above 90 days
      2. outside India, not willing to relocate
      3. outside India, willing to relocate
      4. in India but location mentions neither Noida nor Pune
      5. ``flag_langchain_dabbler`` > 0.5
      6. ``flag_consulting_only`` > 0.5
      7. ``flag_title_desc_mismatch`` > 0.5
      8. a skill claimed as "advanced" whose assessment score is below 50
      9. ``Param_E_Credibility`` >= 5.0

    ``profile``, ``redrob_signals`` and ``skills`` may be missing or None; they
    are then treated as empty. A missing country is reported as
    "unknown country" and is therefore handled as outside India. Values that
    cannot be converted to a finite number are skipped rather than raising.

    Args:
        feature_vector: Feature name -> value; absent flags default to 0.0.
        candidate: Candidate record.

    Returns:
        Concern sentence (without trailing period), or None if nothing fires.
    """
    signals = candidate.get("redrob_signals") or {}
    profile = candidate.get("profile") or {}

    # Priority 1: notice period > 90 days
    notice_days = signals.get("notice_period_days")
    if notice_days is not None:
        try:
            notice_days_int = int(float(notice_days))
        except (TypeError, ValueError, OverflowError):
            # non-numeric, NaN or infinite -> no usable notice period
            notice_days_int = None
        if notice_days_int is not None and notice_days_int > 90:
            return f"Notice period of {notice_days_int} days is significantly above the JD's preferred sub-thirty threshold — confirm whether buyout is feasible before advancing"

    location = profile.get("location") or "unknown location"
    country = profile.get("country") or "unknown country"
    is_india = str(country).lower().strip() in ("india", "in")
    willing_to_relocate = bool(signals.get("willing_to_relocate", False))

    # Priorities 2 and 3: outside India, split on relocation willingness
    if not is_india:
        if not willing_to_relocate:
            return f"Based in {location}, {country} — outside the JD's India-only scope with no relocation willingness flagged. No visa sponsorship offered per JD"
        return f"Based in {location}, {country} — outside the JD's India-only scope, but relocation willingness is flagged; confirm transition feasibility"

    # Priority 4: in India but outside Noida/Pune
    loc_lower = str(location).lower()
    if "noida" not in loc_lower and "pune" not in loc_lower:
        return f"Based in {location} — outside the Noida/Pune preference zone; confirm relocation willingness before shortlisting"

    # Priority 5: Langchain dabbler
    if feature_vector.get("flag_langchain_dabbler", 0.0) > 0.5:
        return "AI skill profile is weighted toward LLM-era tools without evidence of pre-LLM IR or ML fundamentals — a specific JD disqualifier"

    # Priority 6: Consulting only
    if feature_vector.get("flag_consulting_only", 0.0) > 0.5:
        return "Career is predominantly at IT-services/consulting firms — the JD explicitly prefers product-company background"

    # Priority 7: Title-desc mismatch
    if feature_vector.get("flag_title_desc_mismatch", 0.0) > 0.5:
        return "Job title and role descriptions show significant domain mismatch across career history — verify directly with candidate"

    # Priority 8: advanced claim contradicted by an assessment score < 50
    assessments = signals.get("skill_assessment_scores") or {}
    if isinstance(assessments, dict):
        scores_by_name = {str(k).lower().strip(): v for k, v in assessments.items()}
        for skill in candidate.get("skills") or []:
            proficiency = (skill.get("proficiency") or "").lower().strip()
            name = (skill.get("name") or "").lower().strip()
            if proficiency != "advanced" or name not in scores_by_name:
                continue
            try:
                score_val = float(scores_by_name[name])
                if score_val < 50:
                    # Spelled "one hundred" so the sentence introduces no
                    # digit that is absent from the candidate record.
                    return f"Claims advanced proficiency in {skill.get('name')} but platform assessment score is {int(score_val)} out of one hundred — inconsistent with self-reported level"
            except (TypeError, ValueError, OverflowError):
                continue

    # Priority 9: Capped Param_E credibility >= 5.0
    if feature_vector.get("Param_E_Credibility", 0.0) >= 5.0:
        return "High ratio of advanced skill claims relative to platform-verified assessment data on file"

    return None


class ReasoningCompiler:
    """
    Generates deterministic, auditable reasoning text for ranked candidates.
    Maintains state to enforce n-gram collision avoidance across all generated texts.

    State kept between ``compile`` calls:
      * ``_generated_texts`` — every text returned so far, used by the
        collision check;
      * ``_last_template_idx`` — template used for the previous candidate, so
        two consecutive candidates never share a template.

    ``all_scores`` and ``_opening_rotation`` are initialised here but are not
    read by ``compile`` in this class.
    """

    def __init__(self, jd_config, all_scores: List[float]):
        """
        Args:
            jd_config: Parsed JDConfig.
            all_scores: All LightGBM scores in the top-100 (for percentile calculation).
        """
        self.jd_config = jd_config
        self.all_scores = sorted(all_scores)
        self._generated_texts: List[str] = []
        self._opening_rotation: Dict[str, int] = {
            tone: 0 for tone in _OPENING_BY_TONE
        }
        self._last_template_idx: Optional[int] = None

    def _score_to_percentile(self, score: float) -> float:
        """Convert a score to its percentile in the local distribution.

        Returns the fraction of stored scores strictly below ``score``, or 0.5
        when no scores are stored.
        """
        if not self.all_scores:
            return 0.5
        n = len(self.all_scores)
        below = sum(1 for s in self.all_scores if s < score)
        return below / n

    @staticmethod
    def _format_years(raw) -> str:
        """Render years of experience; "0" when missing, non-positive or unparsable."""
        if raw is None:
            return "0"
        try:
            years = float(raw)
            if years > 0:
                # Whole values print without a decimal point; others verbatim.
                return str(int(years)) if years == int(years) else str(raw)
        except (TypeError, ValueError, OverflowError):
            pass
        return "0"

    @staticmethod
    def _format_notice(raw) -> str:
        """Render the notice period as whole days; "0" when missing or unparsable."""
        if raw is None:
            return "0"
        try:
            return str(int(float(raw)))
        except (TypeError, ValueError, OverflowError):
            return "0"

    @staticmethod
    def _pick_verifiable_point(signals: dict, feature_vector: Dict[str, float]) -> str:
        """Choose the evidence phrase for template 3.

        Preference order: GitHub activity score above 30, then the first
        non-negative platform assessment score, then a positive
        ``prod_signal_log`` feature, else a generic phrase.
        """
        github_raw = signals.get("github_activity_score")
        if github_raw is not None:
            try:
                github = float(github_raw)
                if github > 30:
                    shown = str(int(github)) if github == int(github) else str(github_raw)
                    return f"a strong GitHub activity score of {shown}"
            except (TypeError, ValueError, OverflowError):
                pass

        assessments = signals.get("skill_assessment_scores") or {}
        if isinstance(assessments, dict):
            for skill, raw_score in assessments.items():
                try:
                    score = float(raw_score)
                    if not score >= 0:  # also skips NaN
                        continue
                    shown = str(int(score)) if score == int(score) else str(raw_score)
                except (TypeError, ValueError, OverflowError):
                    continue
                if skill:
                    # The scale is spelled out: a literal "100" is usually
                    # absent from the candidate JSON, so the numeric audit in
                    # compile() would strip it and leave a dangling "/".
                    return (
                        f"a verified platform assessment score of {shown} "
                        f"out of one hundred in {skill}"
                    )
                break  # only the first usable score is considered

        if feature_vector.get("prod_signal_log", 0.0) > 0:
            return "proven production engineering credentials in career history descriptions"
        return "strong technical skills"

    def compile(
        self,
        candidate: dict,
        feature_vector: Dict[str, float],
        lgbm_score: float,
        rank: int,
    ) -> str:
        """
        Generate reasoning text for a candidate using one of 4 distinct templates.

        The template is chosen from an MD5 hash of ``candidate_id`` (stable
        across runs) and bumped to the next one if it equals the template used
        for the previous call. After rendering, numbers not found in the
        candidate JSON are stripped, and the text is prefixed with
        ``[Rank N]`` if it is too similar to an earlier output.

        Args:
            candidate: Candidate record; ``profile`` / ``redrob_signals`` may
                be missing or None.
            feature_vector: Feature name -> value.
            lgbm_score: Model score (accepted for interface compatibility; not
                used when rendering).
            rank: 1-based rank, used only for the collision prefix.

        Returns:
            The reasoning text, which is also recorded for later collision checks.
        """
        candidate_id = str(candidate.get("candidate_id") or "")
        stable_hash = int(
            hashlib.md5(candidate_id.encode("utf-8", errors="ignore")).hexdigest()[:8], 16
        )
        template_idx = stable_hash % 4
        if template_idx == self._last_template_idx:
            template_idx = (template_idx + 1) % 4
        self._last_template_idx = template_idx

        profile = candidate.get("profile") or {}
        signals = candidate.get("redrob_signals") or {}

        jd_match = get_specific_jd_match(candidate, self.jd_config)
        location = profile.get("location") or "unknown location"
        concern = _get_severity_ranked_concern(feature_vector, candidate)
        yoe_str = self._format_years(profile.get("years_of_experience"))
        notice_str = self._format_notice(signals.get("notice_period_days"))

        if template_idx == 0:
            reasoning = (
                f"The candidate's profile demonstrates {jd_match}. "
                f"With {yoe_str} years of experience, the candidate is based in {location} "
                f"and is available in {notice_str} days."
            )
            if concern:
                reasoning += f" Primary concern: {concern}."

        elif template_idx == 1:
            closing = (
                f"Available in {notice_str} days, the primary concern is: {concern}."
                if concern
                else f"The candidate is available in {notice_str} days."
            )
            reasoning = (
                f"With {yoe_str} years of experience, the candidate is currently based in {location}. "
                f"The profile demonstrates strong JD alignment, showing {jd_match}. "
                + closing
            )

        elif template_idx == 2:
            opening = (
                f"The primary concern for this profile is {concern}. "
                f"Despite this, the technical profile shows {jd_match}. "
                if concern
                else f"The technical profile shows {jd_match}. "
            )
            reasoning = opening + (
                f"The candidate has {yoe_str} years of experience, is based in {location}, "
                f"and is available in {notice_str} days."
            )

        else:
            verifiable_point = self._pick_verifiable_point(signals, feature_vector)
            reasoning = (
                f"Backed by {verifiable_point}, the profile features {jd_match}. "
                f"Based in {location}, the candidate has {yoe_str} years of experience "
                f"and is available in {notice_str} days."
            )
            if concern:
                reasoning += f" Primary concern: {concern}."

        # Pre-write audit 1: drop any number that is not in the candidate JSON.
        candidate_numbers = _extract_candidate_numbers(candidate)
        audit_passed, violations = _numeric_regex_audit(reasoning, candidate_numbers)
        if not audit_passed:
            for v in violations:
                # The lookarounds stop a violation such as "8" from biting
                # into a legitimate decimal like "8.5" or "3.8".
                reasoning = re.sub(
                    r'(?<!\d\.)\b' + re.escape(v) + r'\b(?!\.\d)\.?',
                    '',
                    reasoning,
                ).strip()

            reasoning = re.sub(r'  +', ' ', reasoning)
            # Legacy placeholder clean-up, kept for output compatibility.
            reasoning = re.sub(r'\[N\]', '', reasoning).strip()

        reasoning = reasoning.replace("..", ".").replace(" .", ".").strip()

        # Pre-write audit 2: tag near-duplicates of earlier outputs.
        collision_ok, _similarity = _ngram_collision_check(reasoning, self._generated_texts)
        if not collision_ok:
            reasoning = f"[Rank {rank}] " + reasoning
        self._generated_texts.append(reasoning)

        return reasoning

    def compile_trace(
        self,
        candidate: dict,
        feature_vector: Dict[str, float],
        lgbm_score: float,
        rank: int,
    ) -> dict:
        """
        Compile reasoning and return a full audit trace dict for reasoning_trace.jsonl.
        Used for top 30 candidates (Section 8.3).

        ``top_feature_drivers`` lists the three feature names with the largest
        absolute values in ``feature_vector``. Calling this also records the
        reasoning text for collision checks, exactly as ``compile`` does.
        """
        reasoning = self.compile(candidate, feature_vector, lgbm_score, rank)

        by_magnitude = sorted(
            feature_vector.items(),
            key=lambda item: abs(item[1]),
            reverse=True,
        )
        top_drivers = [name for name, _ in by_magnitude[:3]]

        return {
            "candidate_id": candidate.get("candidate_id"),
            "rank": rank,
            "lgbm_score": round(lgbm_score, 6),
            "hard_req_coverage": round(feature_vector.get("hard_req_coverage", 0.0), 4),
            "consistency_score": round(feature_vector.get("consistency_score", 1.0), 4),
            "top_feature_drivers": top_drivers,
            "concern": _get_severity_ranked_concern(feature_vector, candidate),
            "reasoning": reasoning,
        }


if __name__ == "__main__":
    # Manual smoke test: builds three synthetic candidates, compiles a
    # reasoning trace for each and prints the result. Requires the project's
    # `jd_parser` and `features` modules and data/skill_aliases.json next to
    # this file.
    import os

    from features import build_feature_vector
    from jd_parser import parse_jd

    base_dir = os.path.dirname(os.path.abspath(__file__))
    jd = parse_jd(os.path.join(base_dir, "data", "skill_aliases.json"))

    def make_candidate(cid, yoe, location, country, notice, github, skills, hard_req_frac):
        # Build a minimal candidate record. `hard_req_frac` is accepted for
        # call-site readability but is not stored in the record.
        return {
            "candidate_id": cid,
            "profile": {
                "years_of_experience": yoe,
                "location": location,
                "country": country,
                "current_title": "ML Engineer",
                "current_company": "Startup",
                "current_company_size": "11-50",
                "current_industry": "Technology",
                "headline": "ML Engineer",
                "summary": "",
                "anonymized_name": "Test User",
            },
            "career_history": [{
                "company": "Startup", "title": "ML Engineer",
                "start_date": "2021-01-01", "end_date": None,
                "duration_months": int(yoe * 12), "is_current": True,
                "industry": "Technology", "company_size": "11-50",
                "description": "Deployed BM25 and FAISS ranking pipeline at production scale with low latency."
            }],
            "skills": skills,
            "redrob_signals": {
                "signup_date": "2021-01-01", "last_active_date": "2025-12-01",
                "recruiter_response_rate": 0.8, "open_to_work_flag": True,
                "connection_count": 200, "search_appearance_30d": 80,
                "endorsements_received": 15, "notice_period_days": notice,
                "expected_salary_range_inr_lpa": {"min": 20.0, "max": 40.0},
                "github_activity_score": github,
                "skill_assessment_scores": {},
                "profile_completeness_score": 75,
                "profile_views_received_30d": 10,
                "applications_submitted_30d": 2,
                "avg_response_time_hours": 12.0,
                "preferred_work_mode": "remote",
                "willing_to_relocate": True,
                "saved_by_recruiters_30d": 3,
                "interview_completion_rate": 0.9,
                "offer_acceptance_rate": 0.8,
                "verified_email": True,
                "verified_phone": True,
                "linkedin_connected": True,
            }
        }

    c_strong = make_candidate(
        "CAND_0000001", 8, "Pune", "India", 30, 85,
        [{"name": "FAISS", "proficiency": "advanced", "endorsements": 20, "duration_months": 48},
         {"name": "BM25", "proficiency": "advanced", "endorsements": 15, "duration_months": 36},
         {"name": "Python", "proficiency": "expert", "endorsements": 40, "duration_months": 72}],
        0.8
    )

    c_mid = make_candidate(
        "CAND_0000002", 4, "Bangalore", "India", 60, 40,
        [{"name": "Python", "proficiency": "advanced", "endorsements": 12, "duration_months": 36},
         {"name": "NLP", "proficiency": "intermediate", "endorsements": 5, "duration_months": 18}],
        0.4
    )

    c_weak = make_candidate(
        "CAND_0000003", 1, "Austin", "USA", 90, -1,
        [{"name": "LangChain", "proficiency": "advanced", "endorsements": 2, "duration_months": 6}],
        0.1
    )

    # Candidates paired with their scores, already in rank order (best first).
    ranked = [(c_strong, 0.9), (c_mid, 0.5), (c_weak, 0.1)]
    scores = [score for _, score in ranked]

    compiler = ReasoningCompiler(jd, all_scores=scores)

    # Rank comes from list position, so tied scores still get distinct ranks.
    for rank, (candidate, score) in enumerate(ranked, start=1):
        fv = build_feature_vector(candidate, jd, bm25_score=score * 15, stage1_bm25_median=7.5)
        trace = compiler.compile_trace(candidate, fv, score, rank=rank)
        print(f"\n=== {candidate['candidate_id']} (score={score}, rank={rank}) ===")
        print(f"Reasoning: {trace['reasoning']}")
        print(f"Top drivers: {trace['top_feature_drivers']}")
        print(f"Concern: {trace['concern']}")