from __future__ import annotations
import os
import time
import shutil
import uuid
import json
import asyncio
import base64
import re
import traceback
from typing import List, Optional, Dict, Any
from fastapi import FastAPI, UploadFile, File, BackgroundTasks, HTTPException, Form
from fastapi.middleware.cors import CORSMiddleware
from pydantic import BaseModel, ConfigDict
import warnings

# Suppress warnings
warnings.filterwarnings('ignore', category=FutureWarning)

# CrewAI imports
from crewai import Agent, Task, Crew, Process
from crewai.llm import LLM

# Gemini imports
import google.generativeai as genai
from google.generativeai.types import HarmCategory, HarmBlockThreshold

# OpenCV
import cv2
import numpy as np

# Configuration
GEMINI_API_KEY = os.getenv("GOOGLE_API_KEY")
GROQ_API_KEY = os.getenv("GROQ_API_KEY")


if not GEMINI_API_KEY:
    raise ValueError("GOOGLE_API_KEY environment variable required")
if not GROQ_API_KEY:
    raise ValueError("GROQ_API_KEY environment variable required")

genai.configure(api_key=GEMINI_API_KEY)

app = FastAPI(title="BJJ AI Coach - Hybrid Agentic")

app.add_middleware(
    CORSMiddleware,
    allow_origins=["*"],
    allow_credentials=True,
    allow_methods=["*"],
    allow_headers=["*"],
)

# --- MODELS ---

class TimestampedEvent(BaseModel):
    time: str
    title: str
    description: str
    category: Optional[str] = "GENERAL"
    frame_image: Optional[str] = None
    frame_timestamp: Optional[str] = None
    model_config = ConfigDict(extra="allow")

class Drill(BaseModel):
    name: str
    focus_area: str
    reason: str
    duration: Optional[str] = "15 min/day"
    frequency: Optional[str] = "5x/week"

class DetailedSkillBreakdown(BaseModel):
    offense: int
    defense: int
    guard: int
    passing: int
    standup: int

class PerformanceGrades(BaseModel):
    defense_grade: str
    offense_grade: str
    control_grade: str

class AnalysisResult(BaseModel):
    overall_score: int
    performance_label: str
    performance_grades: PerformanceGrades
    skill_breakdown: DetailedSkillBreakdown
    strengths: List[str]
    weaknesses: List[str]
    missed_opportunities: List[TimestampedEvent]
    key_moments: List[TimestampedEvent]
    coach_notes: str
    recommended_drills: List[Drill]

db_storage = {}

# --- UTILITIES ---

def parse_time_to_seconds(time_str: str) -> Optional[int]:
    if not time_str:
        return None
    match = re.search(r"(\d{1,2}):(\d{2})", time_str)
    if not match:
        return None
    mm, ss = match.groups()
    return int(mm) * 60 + int(ss)

def find_closest_frame(target_time_sec: int, frames: list) -> dict:
    return min(frames, key=lambda f: abs(f["second"] - target_time_sec))

def attach_frames_to_events(events: List[dict], frames: list):
    for event in events:
        try:
            event_time_sec = parse_time_to_seconds(event.get("time"))
            if event_time_sec is None:
                continue
            closest = find_closest_frame(event_time_sec, frames)
            event["frame_timestamp"] = closest["timestamp"]
            event["frame_image"] = base64.b64encode(closest["bytes"]).decode("utf-8")
        except:
            event["frame_image"] = None

def extract_json_from_text(text: str) -> Dict:
    """Robust JSON extraction"""
    text = text.strip()
    
    # Direct parse
    try:
        return json.loads(text)
    except:
        pass
    
    # Remove markdown
    if "```json" in text or "```" in text:
        try:
            if "```json" in text:
                text = text.split("```json")[1].split("```")[0]
            else:
                text = text.split("```")[1].split("```")[0]
            return json.loads(text.strip())
        except:
            pass
    
    # Find boundaries
    try:
        start_idx = text.find('{')
        if start_idx == -1:
            raise ValueError("No opening brace")
        
        brace_count = 0
        end_idx = -1
        
        for i in range(start_idx, len(text)):
            if text[i] == '{':
                brace_count += 1
            elif text[i] == '}':
                brace_count -= 1
                if brace_count == 0:
                    end_idx = i
                    break
        
        if end_idx != -1:
            json_str = text[start_idx:end_idx+1]
            return json.loads(json_str)
        
        # Truncation repair
        json_str = text[start_idx:]
        open_braces = json_str.count('{')
        close_braces = json_str.count('}')
        open_brackets = json_str.count('[')
        close_brackets = json_str.count(']')
        
        if open_brackets > close_brackets:
            json_str += ']' * (open_brackets - close_brackets)
        if open_braces > close_braces:
            json_str += '}' * (open_braces - close_braces)
        
        return json.loads(json_str)
        
    except:
        pass
    
    raise ValueError("Could not extract JSON")

def is_generic(text: str) -> bool:
    """Check if feedback is too generic"""
    patterns = [r'^More \w+$', r'^Improve \w+$', r'^Work \w+$', r'^Better \w+$']
    for p in patterns:
        if re.match(p, text.strip(), re.IGNORECASE):
            return True
    if not re.search(r'\d{1,2}:\d{2}', text):
        return True
    if len(text) < 20:
        return True
    return False

# --- FRAME EXTRACTION ---

def extract_frames(video_path: str) -> tuple:
    """Extract frames with weighted distribution (40% from end)"""
    try:
        cap = cv2.VideoCapture(video_path)
        if not cap.isOpened():
            raise Exception("Cannot open video")
        
        fps = cap.get(cv2.CAP_PROP_FPS)
        total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
        duration = total_frames / fps if fps > 0 else 0
        
        if duration <= 30:
            total_to_extract = 14
        elif duration <= 60:
            total_to_extract = 16
        else:
            total_to_extract = 18
        
        print(f"Extracting {total_to_extract} frames from {duration:.1f}s video")
        
        # Weighted: 25% start, 35% middle, 40% end
        start_frames = max(4, int(total_to_extract * 0.25))
        end_frames = max(6, int(total_to_extract * 0.40))
        middle_frames = total_to_extract - start_frames - end_frames
        
        start_section_end = int(total_frames * 0.20)
        end_section_start = int(total_frames * 0.80)
        
        frames = []
        
        # Extract START
        start_interval = max(1, start_section_end // start_frames)
        for i in range(0, start_section_end, start_interval):
            if len([f for f in frames if f["second"] < duration * 0.20]) >= start_frames:
                break
            frame = get_frame(cap, i, fps)
            if frame:
                frames.append(frame)
        
        # Extract MIDDLE
        middle_section_frames = end_section_start - start_section_end
        middle_interval = max(1, middle_section_frames // middle_frames)
        for i in range(start_section_end, end_section_start, middle_interval):
            if len([f for f in frames if duration * 0.20 <= f["second"] < duration * 0.80]) >= middle_frames:
                break
            frame = get_frame(cap, i, fps)
            if frame:
                frames.append(frame)
        
        # Extract END
        end_section_frames = total_frames - end_section_start
        end_interval = max(1, end_section_frames // end_frames)
        for i in range(end_section_start, total_frames, end_interval):
            if len([f for f in frames if f["second"] >= duration * 0.80]) >= end_frames:
                break
            frame = get_frame(cap, i, fps)
            if frame:
                frames.append(frame)
        
        # Always add last frame
        last = get_frame(cap, total_frames - 1, fps)
        if last and last not in frames:
            frames.append(last)
        
        cap.release()
        frames.sort(key=lambda f: f["second"])
        
        metadata = {
            "duration": round(duration, 2),
            "fps": round(fps, 2),
            "frames_extracted": len(frames),
            "distribution": {"start": start_frames, "middle": middle_frames, "end": end_frames}
        }
        
        print(f"Extracted {len(frames)} frames")
        return frames, metadata
        
    except Exception as e:
        if 'cap' in locals():
            cap.release()
        raise Exception(f"Frame extraction failed: {str(e)}")

def get_frame(cap: cv2.VideoCapture, frame_idx: int, fps: float) -> Optional[dict]:
    try:
        cap.set(cv2.CAP_PROP_POS_FRAMES, frame_idx)
        ret, frame = cap.read()
        if not ret:
            return None
        
        h, w = frame.shape[:2]
        target_h = 720
        target_w = int(w * (target_h / h))
        resized = cv2.resize(frame, (target_w, target_h))
        _, buffer = cv2.imencode('.jpg', resized, [cv2.IMWRITE_JPEG_QUALITY, 85])
        
        timestamp_sec = frame_idx / fps
        timestamp_str = f"{int(timestamp_sec // 60):02d}:{int(timestamp_sec % 60):02d}"
        
        return {
            "bytes": buffer.tobytes(),
            "timestamp": timestamp_str,
            "second": round(timestamp_sec, 2),
            "frame_idx": frame_idx
        }
    except:
        return None

# --- STEP 1: GEMINI VISION EXTRACTION ---

async def extract_frame_observations(frames: List[Dict], user_desc: str, opp_desc: str, duration: float) -> str:
    """Use Gemini to analyze frames and extract observations"""
    
    print("STEP 1: Gemini Vision - Frame Analysis")
    
    try:
        # Build frame list
        frame_list = "\n".join([
            f"Frame {i+1} at {f['timestamp']} ({f['second']}s)"
            for i, f in enumerate(frames)
        ])
        prompt = f"""
You are an expert Brazilian Jiu-Jitsu (BJJ) video analyst performing STRICT FRAME-BY-FRAME PERCEPTION.

YOUR ROLE IS LIMITED TO OBSERVATION.
You do NOT judge performance, assign scores, or give coaching advice.

PRIMARY RULES (NON-NEGOTIABLE):
- You MUST rely ONLY on what is visibly observable in each frame.
- You are FORBIDDEN from assuming intent, pain, referee actions, or outcomes.
- If evidence is unclear or partially visible, you MUST say:
  "Insufficient visual evidence to confirm."
- If video or frames are not related to BJJ, say "You must provide a video of Brazilian-Jiu-Jitsu only.".

====================
VIDEO CONTEXT
====================
- Duration: {duration}s
- Total Frames: {len(frames)}
- Athlete Being Analyzed (User): {user_desc}
- Opponent: {opp_desc}

====================
REFERENCE KNOWLEDGE (VOCABULARY ONLY)
====================

Use the following terms ONLY if clearly supported by visual evidence.

POSITIONS:
Standing, Clinch,
Closed Guard,
Open Guard (Butterfly, De La Riva, Spider, X-Guard),
Half Guard (Top / Bottom, Knee Shield, Deep Half),
Side Control (Standard, Kesa Gatame, Reverse Kesa),
North-South,
Mount (Low, High, S-Mount),
Back Control (with hooks or body triangle),
Turtle (Top / Bottom).

IMPORTANT POSITION RULE:
- "Full Mount" requires:
  BOTH knees on the mat,
  hips square over opponent’s torso,
  opponent flat on back,
  and NO leg entanglement.
- If ANY condition is missing, DO NOT label as mount.
  Use "Top control (not mount)" or "Transitional position".

ATTACKS & THREATS:
Chokes (RNC, Guillotine, Triangle, Arm Triangle, D'Arce, Anaconda,
Ezekiel, Collar chokes),
Joint Locks (Armbar, Kimura, Americana, Omoplata, Wrist locks),
Leg Locks (Straight Ankle, Kneebar, Heel Hook, Toe Hold, Calf Slicer).

CONTROL INDICATORS (SUPPORTING ONLY, NOT DECISIVE):
- Hip or head control
- Chest-to-chest pressure
- Hooks or body triangle
- Limb isolation
- Flattening opponent
- Opponent forced into defensive posture

====================
SUBMISSION CONFIRMATION (STRICT)
====================

A submission may ONLY be marked if at least ONE is explicitly visible:
- Tapping (hand, foot, or body)
- Match stoppage during a locked submission
- Footage ends immediately during an unmistakably locked submission

Pattern cues alone (leg entanglement, arching, neck control)
are NEVER sufficient.

If unclear → classify as "submission attempt" or "no submission".

====================
FRAME-BY-FRAME TASK
====================

For EACH frame, report exactly:

1. POSITION:
   The clearest dominant or transitional position
   (use conservative labels when unsure).

2. ADVANTAGE:
   User / Opponent / Neutral
   (based ONLY on visible control).

3. ACTION TYPE (SELECT ONE):
   OFFENSE | DEFENSE | GUARD | PASSING | STANDUP | NONE

4. THREATS:
   None / Submission Attempt (name it) / Positional Advance.

5. TECHNICAL DETAILS:
   Observable grips, pressure, transitions, defenses, or escapes.
   Do NOT speculate.

ACTION TYPE DEFINITIONS:
- OFFENSE: Initiated submission attempts or attack chains
- DEFENSE: Escaping, framing, or defending submissions
- GUARD: Bottom-position control, sweeps, or attacks
- PASSING: Clearing legs and advancing past guard
- STANDUP: Takedowns or clinch exchanges
- NONE: Static control or transitions without active skill use

STRICT OUTPUT FORMAT:

Frame X (MM:SS):
[Position] - [Advantage] - [Action Type] - [Threats] - [Technical Details]

====================
CRITICAL FINAL FRAMES (LAST 6–7 ONLY)
====================

Analyze carefully:
- Is a submission CLEARLY locked?
- Is tapping EXPLICITLY visible?
- Does the footage end during control?

DECISION RULE:
- Without tapping or stoppage → NO submission.

====================
FINAL SUMMARY (FACTUAL ONLY)
====================

Provide a short factual summary:

1. OUTCOME VERDICT:
   - Submission: YES / NO
   - Winner: User / Opponent / NONE
   - Technique: <name or NONE>
   - Time: MM:SS or NONE
   - Confidence: HIGH / MEDIUM / LOW
   - Evidence: Brief quote or paraphrase from frames

2. POSITIONAL OVERVIEW:
   - Which positions were clearly established?
   - Who held visible positional control overall?

FINAL CHECK (MANDATORY):
- No submission without explicit evidence
- No "full mount" unless criteria are met
- No techniques not visible in frames
- No coaching, scoring, or evaluation language
"""

        # Prepare content
        content = []
        for f in frames:
            content.append({
                "mime_type": "image/jpeg",
                "data": base64.b64encode(f["bytes"]).decode("utf-8")
            })
        content.append(prompt)
        
        # Call Gemini
        start = time.time()
        model = genai.GenerativeModel(
            model_name="gemini-2.5-flash",
            generation_config={
                "temperature": 0.2,
                "max_output_tokens": 8000
            }
        )
        
        response = await asyncio.get_event_loop().run_in_executor(
            None,
            lambda: model.generate_content(
                content,
                safety_settings={
                    HarmCategory.HARM_CATEGORY_DANGEROUS_CONTENT: HarmBlockThreshold.BLOCK_NONE,
                    HarmCategory.HARM_CATEGORY_HARASSMENT: HarmBlockThreshold.BLOCK_NONE,
                    HarmCategory.HARM_CATEGORY_HATE_SPEECH: HarmBlockThreshold.BLOCK_NONE,
                    HarmCategory.HARM_CATEGORY_SEXUALLY_EXPLICIT: HarmBlockThreshold.BLOCK_NONE,
                }
            )
        )
        
        elapsed = time.time() - start
        print(f"Gemini vision: {elapsed:.2f}s")
        
        # Get text
        try:
            observations = response.text
        except:
            observations = response.candidates[0].content.parts[0].text
        
        return observations
        
    except Exception as e:
        print(f"Vision extraction failed: {e}")
        return f"Error analyzing frames: {str(e)}"

# --- STEP 2: CREWAI AGENTS ---

def create_analysis_crew(observations: str, user_desc: str, opp_desc: str, duration: float):
    """Create CrewAI agents for analysis and formatting"""
    
    # Groq LLM for fast text processing
    llm = LLM(
        model="groq/llama-3.3-70b-versatile",
        api_key=GROQ_API_KEY,
        temperature=0.2
    )
    
    
    # Agent 1: Technical Analyst
    analyst = Agent(
        role="BJJ Technical Analyst",
        goal=f"Analyze frame observations for {user_desc} to detect submissions, score performance, and identify strengths/weaknesses",
backstory="""
You are a BJJ black belt coach acting as an EVIDENCE-BASED TECHNICAL AUDITOR.

IMPORTANT SCOPE LIMIT:
- You do NOT analyze video or frames directly.
- You ONLY analyze the OBSERVATIONS provided by the vision model.
- The OBSERVATIONS are the single source of truth.

OUTCOME AUTHORITY RULE:
- You MUST accept the Outcome Verdict stated in the OBSERVATIONS.
- You are NOT allowed to override or reinterpret submission decisions.
- If the verdict confidence is MEDIUM or LOW, treat the match as having NO submission.

POSITION AUTHORITY RULE:
- You MUST respect position labels used in OBSERVATIONS.
- You may summarize positional trends but MUST NOT relabel positions.

ALLOWED ACTIONS:
- Aggregate frame-level facts into performance insights
- Score performance based on observed evidence
- Identify strengths, weaknesses, and missed opportunities
- Provide coaching feedback grounded in timestamps

FORBIDDEN ACTIONS:
- Do NOT infer intent, pain, or referee behavior
- Do NOT upgrade control into a submission
- Do NOT introduce techniques not present in OBSERVATIONS
- Do NOT repeat the same issue using different wording

LANGUAGE & SCORING CONSTRAINTS:
- Every claim must reference a timestamp
- Generic phrases are forbidden
- Every score must be justified by at least one timestamp
- If user was submitted: Defense ≤40
- If user finished opponent: Offense ≥80
-NEVER mention frame numbers, frame ranges, or frame indices in the final output.
"""
,
        verbose=True,
        allow_delegation=False,
        llm=llm,
        memory=True
    )
    
    # Agent 2: JSON Formatter
    formatter = Agent(
        role="Data Structure Specialist",
        goal="Convert analysis into valid JSON matching exact schema requirements",
        backstory="""You transform technical analysis into structured JSON. You ensure:
        - Exactly 3 strengths and 3 weaknesses
        - All feedback includes timestamps (MM:SS format)
        - No generic phrases like "More aggression"
        - Scores reflect actual match outcome
        - JSON is valid (no trailing commas, proper syntax)
        """,
        verbose=True,
        allow_delegation=False,
        llm=llm
    )
    
    # Task 1: Analysis
    analysis_task = Task(
        description=f"""
Analyze the OBSERVATIONS produced by a frame-by-frame BJJ vision system.

IMPORTANT:
- Do NOT re-detect submissions or re-label positions.
- Your role is to evaluate performance quality based on OBSERVATIONS only.

====================
OBSERVATIONS (AUTHORITATIVE)
====================
{observations}

VIDEO INFO:
- Duration: {duration}s
- User: {user_desc}
- Opponent: {opp_desc}

====================
REQUIRED OUTPUT
====================

1. OUTCOME SUMMARY:
- Restate the outcome exactly as supported by OBSERVATIONS.
- Do NOT modify submission status or technique.

2. SKILL SCORING (0–100, REALISTIC):

**OVERALL SCORE PHILOSOPHY:**
- Recreational rolls (no finish): 60-75 range
- User achieves submission: 75-88 range
- User gets submitted: 45-60 range
- Close competitive match: 65-75 range
- Dominant performance (no finish): 70-80 range

⚔️ OFFENSE (Submission attempts & attack chains):
- Finished opponent: 80-92
- Multiple strong attempts: 70-80
- Some attempts visible: 60-70
- Positional pressure only: 50-60
- Minimal attacking: 40-50
- Purely defensive: 30-40

🛡️ DEFENSE (Escapes, survival, defending attacks):
- Got submitted: 35-45 (defensive failure evident)
- Never seriously threatened: 70-80
- Defended some attacks: 60-70
- Struggled but survived: 50-60
- Heavy defensive pressure: 40-50

🔒 GUARD (Bottom position effectiveness):
- Active sweeps/attacks: 70-85
- Controlled from bottom: 60-70
- Some guard work: 50-60
- Guard passed easily: 35-45
- Minimal guard play: 25-35

🚶 PASSING (Clearing legs, advancing):
- Multiple passes: 75-85
- Successful pass(es): 65-75
- Attempted passing: 55-65
- Pressure but no pass: 45-55
- Minimal passing work: 35-45

🧍 STANDUP (Takedowns/clinch):
- Successful takedown(s): 70-85
- Strong attempts: 60-70
- Some standup: 50-60
- No standup engagement: 0

**OUTCOME ADJUSTMENT:**
- Submission finish: +10-15 to overall, offense 80+, defense 70+
- Got submitted: -10-15 to overall, defense 35-45, offense capped at 65
- Dominant position control: +5-10 to overall
- Lost position badly: -5-10 to overall
- Close match: neutral (65-70 base)

Each score MUST reference at least one timestamp.

3. STRENGTHS (EXACTLY 3):
- Timestamped, technical, non-repetitive
- If submission occurred, Strength #1 MUST be the finish

4. WEAKNESSES (EXACTLY 3):
- Timestamped, distinct technical issues
- If user was submitted, Weakness #1 MUST be the failure

5. MISSED OPPORTUNITIES (2–3):
- Must be visible in OBSERVATIONS
- Positional or submission-chain only

6. COACH NOTES (150–250 words):
- Technical, honest, evidence-based
- No speculation

7. DRILLS (EXACTLY 3):
- Each drill maps directly to a weakness
- Include timestamp justification

FINAL CHECK:
- No contradiction of OBSERVATIONS
- No new techniques
- Scores align with demonstrated actions
"""
,
        agent=analyst,
        expected_output="Detailed technical analysis with submission detection"
    )
    
    # Task 2: JSON Formatting
    formatting_task = Task(
        description="""Convert the analysis into this EXACT JSON structure. NO markdown wrapping.

{{
  "overall_score": <int 0-100>,
  "performance_label": "EXCELLENT|STRONG|SOLID|DEVELOPING|NEEDS IMPROVEMENT",
  "performance_grades": {{
    "defense_grade": "<A+|A|B+|B|C+|C|D+|D>",
    "offense_grade": "<letter>",
    "control_grade": "<letter>"
  }},
  "skill_breakdown": {{
    "offense": <int>,
    "defense": <int>,
    "guard": <int>,
    "passing": <int>,
    "standup": <int>
  }},
  "strengths": [
    "At 0:XX - Specific observation (min 25 chars)",
    "At 0:XX - Another specific observation",
    "At 0:XX - Third specific observation"
  ],
  "weaknesses": [
    "At 0:XX - Specific weakness (min 25 chars)",
    "At 0:XX - Another weakness",
    "At 0:XX - Third weakness"
  ],
  "missed_opportunities": [
    {{"time": "MM:SS", "title": "Brief", "description": "Detail", "category": "SUBMISSION|POSITION|SWEEP"}}
  ],
  "key_moments": [
    {{"time": "MM:SS", "title": "Event", "description": "What happened", "category": "SUBMISSION|TRANSITION|DEFENSE"}}
  ],
  "coach_notes": "Paragraph 150-250 words",
  "recommended_drills": [
    {{"name": "Drill 1", "focus_area": "Area", "reason": "Why at timestamp", "duration": "15 min/day", "frequency": "5x/week"}},
    {{"name": "Drill 2", "focus_area": "Area", "reason": "Why", "duration": "10 min/day", "frequency": "4x/week"}},
    {{"name": "Drill 3", "focus_area": "Area", "reason": "Why", "duration": "12 min/day", "frequency": "3x/week"}}
  ]
}}

VALIDATION:
- All timestamps in MM:SS format
- No trailing commas
- Exactly 3 strengths, 3 weaknesses, 3 drills
- All feedback includes timestamps
- No generic phrases
""",
        agent=formatter,
        expected_output="Valid JSON only"
    )
    
    # Create crew
    crew = Crew(
        agents=[analyst, formatter],
        tasks=[analysis_task, formatting_task],
        process=Process.sequential,
        verbose=True
    )
    
    return crew

# --- HYBRID ANALYSIS ---

async def hybrid_agentic_analysis(
    frames: List[Dict],
    metadata: Dict,
    user_desc: str,
    opp_desc: str,
    activity_type: str,
    analysis_id: str = None
) -> AnalysisResult:
    """Hybrid: Gemini vision + CrewAI agents + Python validation"""
    
    print("\n" + "="*70)
    print("HYBRID AGENTIC ANALYSIS")
    print("="*70)
    
    try:
        if analysis_id:
            db_storage[analysis_id]["progress"] = 30
        
        # STEP 1: Gemini Vision
        observations = await extract_frame_observations(
            frames, user_desc, opp_desc, metadata["duration"]
        )
        
        if analysis_id:
            db_storage[analysis_id]["progress"] = 60
        
        # STEP 2: CrewAI Agents
        print("\nSTEP 2: CrewAI Agents - Analysis & Formatting")
        crew = create_analysis_crew(observations, user_desc, opp_desc, metadata["duration"])
        
        crew_start = time.time()
        result = await asyncio.get_event_loop().run_in_executor(
            None,
            crew.kickoff
        )
        crew_time = time.time() - crew_start
        print(f"CrewAI: {crew_time:.2f}s")
        
        if analysis_id:
            db_storage[analysis_id]["progress"] = 90
        
        # STEP 3: Parse & Validate
        print("\nSTEP 3: Python Validation")
        result_text = str(result)
        
        # Clean markdown
        if "```json" in result_text:
            result_text = result_text.split("```json")[1].split("```")[0].strip()
        elif "```" in result_text:
            result_text = result_text.split("```")[1].split("```")[0].strip()
        
        data = extract_json_from_text(result_text)
        data = validate_and_filter(data, frames)
        
        # Attach frames
        attach_frames_to_events(data.get("missed_opportunities", []), frames)
        attach_frames_to_events(data.get("key_moments", []), frames)
        
        if analysis_id:
            db_storage[analysis_id]["progress"] = 100
        
        print("Analysis complete")
        print("="*70 + "\n")
        
        return AnalysisResult(**data)
        
    except Exception as e:
        print(f"Hybrid analysis failed: {e}")
        traceback.print_exc()
        fallback = make_fallback(frames)
        if analysis_id:
            db_storage[analysis_id]["used_fallback"] = True
        return AnalysisResult(**fallback)

def validate_and_filter(data: Dict, frames: List[Dict]) -> Dict:
    """Python-level validation and generic filtering"""
    
    # Validate scores
    if "overall_score" not in data:
        data["overall_score"] = 65
    data["overall_score"] = max(0, min(100, data["overall_score"]))
    
    if "performance_label" not in data:
        score = data["overall_score"]
        if score >= 85:
            data["performance_label"] = "EXCELLENT PERFORMANCE"
        elif score >= 75:
            data["performance_label"] = "STRONG PERFORMANCE"
        elif score >= 60:
            data["performance_label"] = "SOLID PERFORMANCE"
        else:
            data["performance_label"] = "DEVELOPING PERFORMANCE"
    
    if "performance_grades" not in data:
        data["performance_grades"] = {"defense_grade": "C+", "offense_grade": "C", "control_grade": "C+"}
    
    if "skill_breakdown" not in data:
        base = data["overall_score"]
        data["skill_breakdown"] = {
            "offense": max(0, min(100, base - 5)),
            "defense": max(0, min(100, base + 3)),
            "guard": max(0, min(100, base - 2)),
            "passing": max(0, min(100, base - 10)),
            "standup": max(0, min(100, base - 13))
        }
    
    # Filter generic feedback
    for field in ["strengths", "weaknesses"]:
        if field in data and data[field]:
            filtered = [item for item in data[field] if not is_generic(item)]
            if len(filtered) >= 3:
                data[field] = filtered[:3]
            else:
                data[field] = make_specific(field, frames, filtered)
        else:
            data[field] = make_specific(field, frames, [])
    
    # Validate other fields
    if "missed_opportunities" not in data or not data["missed_opportunities"]:
        data["missed_opportunities"] = [{
            "time": frames[len(frames)//2]["timestamp"],
            "title": "Position",
            "description": "Review",
            "category": "POSITION"
        }]
    
    if "key_moments" not in data or not data["key_moments"]:
        data["key_moments"] = [{
            "time": frames[-3]["timestamp"],
            "title": "Exchange",
            "description": "Work",
            "category": "TRANSITION"
        }]
    
    if "coach_notes" not in data or len(data["coach_notes"]) < 50:
        data["coach_notes"] = "Focus on techniques. Review timestamps for improvement."
    
    if "recommended_drills" not in data or len(data["recommended_drills"]) < 3:
        data["recommended_drills"] = [
            {"name": "Control", "focus_area": "General", "reason": "Improve awareness", "duration": "15 min/day", "frequency": "5x/week"},
            {"name": "Guard", "focus_area": "Defense", "reason": "Strengthen defense", "duration": "10 min/day", "frequency": "4x/week"},
            {"name": "Flow", "focus_area": "Movement", "reason": "Improve transitions", "duration": "12 min/day", "frequency": "3x/week"}
        ]
    
    return data

def make_specific(field: str, frames: List[Dict], existing: List[str]) -> List[str]:
    feedback = existing.copy()
    
    start = frames[len(frames) // 6]
    mid = frames[len(frames) // 2]
    end = frames[-2] if len(frames) > 1 else frames[-1]
    
    if field == "strengths":
        templates = [
            f"At {start['timestamp']} - Maintained structure in opening",
            f"At {mid['timestamp']} - Showed awareness during exchange",
            f"At {end['timestamp']} - Demonstrated control"
        ]
    else:
        templates = [
            f"At {start['timestamp']} - Could improve positioning",
            f"At {mid['timestamp']} - Slow to recognize opportunity",
            f"At {end['timestamp']} - Room to improve execution"
        ]
    
    for t in templates:
        if len(feedback) < 3:
            feedback.append(t)
    
    return feedback[:3]

def make_fallback(frames: List[Dict]) -> Dict:
    mid = frames[len(frames)//2]["timestamp"]
    end = frames[-2]["timestamp"] if len(frames) > 1 else frames[-1]["timestamp"]
    
    return {
        "overall_score": 65,
        "performance_label": "SOLID PERFORMANCE",
        "performance_grades": {"defense_grade": "C+", "offense_grade": "C", "control_grade": "C+"},
        "skill_breakdown": {"offense": 60, "defense": 68, "guard": 63, "passing": 55, "standup": 52},
        "strengths": [
            f"At 0:10 - Maintained structure",
            f"At {mid} - Showed awareness",
            f"At {end} - Demonstrated control"
        ],
        "weaknesses": [
            f"At 0:15 - Could improve positioning",
            f"At {mid} - Slow to recognize opportunity",
            f"At {end} - Room to improve execution"
        ],
        "missed_opportunities": [{"time": mid, "title": "Position", "description": "Review", "category": "POSITION"}],
        "key_moments": [{"time": end, "title": "Exchange", "description": "Work", "category": "TRANSITION"}],
        "coach_notes": "Focus on techniques. Review timestamps.",
        "recommended_drills": [
            {"name": "Control", "focus_area": "General", "reason": "Improve", "duration": "15 min/day", "frequency": "5x/week"},
            {"name": "Guard", "focus_area": "Defense", "reason": "Strengthen", "duration": "10 min/day", "frequency": "4x/week"},
            {"name": "Flow", "focus_area": "Movement", "reason": "Improve", "duration": "12 min/day", "frequency": "3x/week"}
        ]
    }

# --- API ---

@app.post("/analyze-complete")
async def analyze_complete(
    file: UploadFile = File(...),
    user_description: str = Form(...),
    opponent_description: str = Form(...),
    activity_type: str = Form("Brazilian Jiu-Jitsu")
):
    start_time = time.time()
    file_path = None
    
    try:
        file_name = f"{uuid.uuid4()}_{file.filename}"
        file_path = f"temp_videos/{file_name}"
        os.makedirs("temp_videos", exist_ok=True)
        
        with open(file_path, "wb") as buffer:
            shutil.copyfileobj(file.file, buffer)
        
        analysis_id = str(uuid.uuid4())
        db_storage[analysis_id] = {"status": "processing", "progress": 0}
        
        # Extract frames
        frames, metadata = await asyncio.get_event_loop().run_in_executor(
            None, extract_frames, file_path
        )
        
        # Hybrid analysis
        result = await hybrid_agentic_analysis(
            frames, metadata,
            user_description.strip(), opponent_description.strip(),
            activity_type, analysis_id
        )
        
        total_time = time.time() - start_time
        
        return {
            "status": "completed",
            "data": result.model_dump(),
            "processing_time": f"{total_time:.2f}s",
            "used_fallback": db_storage[analysis_id].get("used_fallback", False),
            "method": "hybrid_agentic"
        }
    except Exception as e:
        print(f"Error: {e}")
        try:
            frames_fb, _ = await asyncio.get_event_loop().run_in_executor(None, extract_frames, file_path)
            fallback = make_fallback(frames_fb)
        except:
            fallback = make_fallback([{"timestamp": "00:30", "second": 30}])
        
        return {
            "status": "completed_with_fallback",
            "data": fallback,
            "error": str(e),
            "used_fallback": True
        }
    finally:
        if file_path:
            try:
                os.remove(file_path)
            except:
                pass

@app.get("/health")
async def health_check():
    return {"status": "healthy", "version": "26.0.0-hybrid-agentic"}

@app.get("/")
async def root():
    return {
        "message": "BJJ AI Coach - Hybrid Agentic",
        "version": "26.0.0",
        "architecture": "Gemini Vision + CrewAI Agents + Python Validation",
        "agents": {
            "gemini": "Frame-by-frame vision analysis",
            "analyst_agent": "Technical analysis + submission detection (Groq)",
            "formatter_agent": "JSON structure + validation (Groq)",
            "python": "Generic filtering + frame attachment"
        },
        "benefits": [
            "Gemini's vision for accurate frame analysis",
            "Groq's speed for text processing (3-5x faster)",
            "Multi-agent review for quality",
            "Python guardrails against generic feedback"
        ]
    }

if __name__ == "__main__":
    import uvicorn
    port = int(os.environ.get("PORT", 7860))
    uvicorn.run(app, host="0.0.0.0", port=port)