# Copyright: Shayekh Bin Islam. KAIST, South Korea. 2026.

MAX_TEXT_CHAR = 1500

model_id = "Qwen/Qwen3.5-9B"
# model_id = "Qwen/Qwen3.5-2B"

try:
    import spaces
    IS_HF = True
except ImportError:
    IS_HF = False


if not IS_HF:
    class spaces:
        @staticmethod
        def GPU(*args, **kwargs):
            def decorator(func):
                return func
            if len(args) == 1 and callable(args[0]) and not kwargs:
                return args[0]
            return decorator
else:
    import os, sys, subprocess
    os.environ['SUPERTONIC_CACHE_DIR']  = '/home/user/huggingface'
    os.environ["HF_HOME"] = "/home/user/huggingface"
    os.environ['XDG_CACHE_HOME'] = "/home/user/huggingface"
    
    os.environ['PLAYWRIGHT_BROWSERS_PATH'] = "/home/user/huggingface/ms-playwright"
    # os.system("playwright install chromium")
    result = subprocess.run(
        ["python", "-m", "playwright", "install", "chromium"],
        env={**os.environ},
        check=True,
        stdout=subprocess.PIPE,
        stderr=subprocess.PIPE
    )

import gradio as gr
import fitz  # PyMuPDF
from PIL import Image
import io
import json
import base64
import soundfile as sf
import torch
import os
import tempfile
import re as re_module

if IS_HF:
    LOG_DIR = tempfile.gettempdir()
else:
    LOG_DIR = "log"
os.makedirs(LOG_DIR, exist_ok=True)

from supertonic import TTS
from transformers import AutoProcessor, AutoModelForImageTextToText

# model = None
# processor = None
# tts = None
# voice_style = None

global_stop_thinking = [False]
global_kill_threads = [False]

def set_stop_thinking():
    global_stop_thinking[0] = True
    print(f"[STOP-THINK] set_stop_thinking CALLED! Flag is now: {global_stop_thinking[0]}")
    return gr.update(value="⚡ Forcing generation...")

def reset_stop_thinking_after_delay():
    """Wait 5 seconds then restore the button text so the user can click it again."""
    import time
    time.sleep(5)
    return gr.update(value="⚡ Stop thinking, Generate now")

def set_kill_threads():
    global_kill_threads[0] = True
    print(f"[KILL] set_kill_threads CALLED! Flag is now: {global_kill_threads[0]}")
    return gr.update(value="🛑 Stopping...")

def reset_generation_flags():
    """Reset all generation control flags at the start of a new generation."""
    global_stop_thinking[0] = False
    global_kill_threads[0] = False
    print("[FLAGS] Reset stop_thinking and kill_threads to False")


def extract_pdf_content(pdf_path, max_pages=2):
    """Extract text and images from up to max_pages of a PDF."""
    doc = fitz.open(pdf_path)
    text = ""
    images = []
    for i in range(min(max_pages, len(doc))):
        page = doc[i]
        text += page.get_text() + "\n"
        pix = page.get_pixmap(dpi=150)
        img = Image.frombytes("RGB", [pix.width, pix.height], pix.samples)
        images.append(img)
    return text, images

def is_youtube_url(url):
    """Check if a URL is a YouTube link."""
    if not url:
        return False
    youtube_patterns = [
        r'(https?://)?(www\.)?youtube\.com/watch',
        r'(https?://)?(www\.)?youtube\.com/shorts/',
        r'(https?://)?youtu\.be/',
        r'(https?://)?(www\.)?youtube\.com/embed/',
        r'(https?://)?m\.youtube\.com/',
    ]
    for pattern in youtube_patterns:
        if re_module.search(pattern, url):
            return True
    return False

def extract_youtube_audio(url, max_duration_sec=300, cookiefile=None):
    """Extract audio from YouTube video (first max_duration_sec seconds).
    Returns path to the downloaded audio file.
    cookiefile: optional path to a Netscape-format cookies.txt to bypass bot filtering.
    """
    import yt_dlp
    from yt_dlp.utils import download_range_func
    
    os.makedirs("log", exist_ok=True)
    output_path = os.path.join("log", "yt_audio")
    
    ydl_opts = {
        'format': 'bestaudio/best',
        'postprocessors': [{
            'key': 'FFmpegExtractAudio',
            'preferredcodec': 'wav',
            'preferredquality': '192',
        }],
        'download_ranges': download_range_func(None, [(0, max_duration_sec)]),
        'force_keyframes_at_cuts': True,
        'outtmpl': output_path + '.%(ext)s',
        'quiet': True,
        'no_warnings': True,
    }
    
    if cookiefile:
        ydl_opts['cookiefile'] = cookiefile
    
    with yt_dlp.YoutubeDL(ydl_opts) as ydl:
        info = ydl.extract_info(url, download=True)
        title = info.get('title', 'YouTube Video')
    
    # The output file will be output_path.wav after postprocessing
    wav_path = output_path + '.wav'
    if not os.path.exists(wav_path):
        # Sometimes the extension might differ, search for it
        for ext in ['wav', 'mp3', 'opus', 'webm', 'm4a']:
            candidate = output_path + '.' + ext
            if os.path.exists(candidate):
                wav_path = candidate
                break
    
    if not os.path.exists(wav_path):
        raise FileNotFoundError(f"Could not find downloaded audio file at {output_path}.*")
    
    return wav_path, title

@spaces.GPU(duration=180)
def transcribe_audio_with_asr(audio_path):
    """Transcribe audio file using Cohere ASR model via transformers."""
    global asr_model, asr_processor
    from transformers.audio_utils import load_audio
    
    audio = load_audio(audio_path, sampling_rate=16000)
    
    inputs = asr_processor(audio, language="ko", sampling_rate=16000, return_tensors="pt")
    inputs = inputs.to(asr_model.device, dtype=asr_model.dtype)
    
    outputs = asr_model.generate(**inputs, max_new_tokens=2048)
    texts = asr_processor.decode(outputs, skip_special_tokens=True)
    # text = texts[0] if isinstance(texts, list) else texts
    # join texts
    # Filter the lines in texts which are english only and no korean
    if isinstance(texts, list):
        # Filter out lines that are purely English/symbols (no Korean characters)
        # Korean Unicode range: AC00-D7A3 (Syllables), 1100-11FF (Jamo), 3130-318F (Compatibility Jamo)
        korean_re = re_module.compile(r'[가-힣ㄱ-ㅎㅏ-ㅣ]')
        texts = [line for line in texts if korean_re.search(line)]
        

    text = "\n".join(texts) if isinstance(texts, list) else texts
    
    
    return text.strip()

def extract_website_content(url, max_images=2):
    """Extract text and images from a website URL."""
    import requests
    from bs4 import BeautifulSoup
    import io
    
    headers = {
        'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36'
    }
    
    html_content = ""
    try:
        from playwright.sync_api import sync_playwright
        with sync_playwright() as p:
            browser = p.chromium.launch(headless=True)
            page = browser.new_page(user_agent=headers['User-Agent'])
            # Wait until there are no network connections for at least 500 ms (so JS can finish)
            page.goto(url, timeout=30000, wait_until="networkidle")
            html_content = page.content()
            browser.close()
    except Exception as e:
        print(f"Playwright headless fetch failed: {e}. Falling back to requests...")
        response = requests.get(url, headers=headers, timeout=10)
        response.raise_for_status()
        html_content = response.content
        
    soup = BeautifulSoup(html_content, 'html.parser')
    
    for script in soup(["script", "style", "nav", "footer", "header", "noscript"]):
        script.extract()
        
    text = soup.get_text(separator='\n')
    lines = (line.strip() for line in text.splitlines())
    chunks = (phrase.strip() for line in lines for phrase in line.split("  "))
    text = '\n'.join(chunk for chunk in chunks if chunk)
    
    images = []
    img_tags = soup.find_all('img')
    for img in img_tags:
        if len(images) >= max_images:
            break
        src = img.get('src') or img.get('data-src')
        if src:
            if src.startswith('//'):
                src = 'https:' + src
            elif src.startswith('/'):
                from urllib.parse import urljoin
                src = urljoin(url, src)
                
            try:
                img_resp = requests.get(src, headers=headers, timeout=5)
                if img_resp.status_code == 200:
                    pil_img = Image.open(io.BytesIO(img_resp.content))
                    if pil_img.mode != 'RGB':
                        pil_img = pil_img.convert('RGB')
                    if pil_img.width >= 100 and pil_img.height >= 100:
                        images.append(pil_img)
            except Exception as e:
                print(f"Failed to load image {src}: {e}")
                
    return text, images

def get_base64_image(image):
    buffered = io.BytesIO()
    image.save(buffered, format="JPEG")
    img_str = base64.b64encode(buffered.getvalue()).decode("utf-8")
    return f"data:image/jpeg;base64,{img_str}"

@spaces.GPU(duration=180)
def extract_vocabulary(pdf_text, images, translit_lang, translit_format, target_lang, max_text_char=1500, repetition_penalty_val=1.1, partial_assistant_text=None, auto_force_chars=1000, enable_thinking=True):
    """Use Transformers to extract vocabulary from text and images."""
    global model, processor
    
    os.makedirs("log", exist_ok=True)
    
    if len(pdf_text.strip()) == 0:
        pdf_text = '''"No Text available, see provided Images only."'''
    
    no_img = ""
    if len(images) == 0:
        no_img = '''\n"No Images available, see provided Text only."'''

    non_english = ""
    if translit_lang.upper() != "ENGLISH":
        non_english = f" CRITICAL: You MUST use the native alphabet/script of {translit_lang.upper()}, do NOT use English letters unless requested."
    
    prompt_text = f"""Text:

<scrpated-content>
{pdf_text[:int(max_text_char)]}
</scrpated-content>{no_img}

Extract at least 10 key Korean words or phrases from the following text and images.
Focus on meaningful vocabulary that is highly helpful for a new language learner (e.g., common nouns, verbs, adjectives, or useful expressions).
CRITICAL: Do NOT extract website template words, navigation menus, boilerplate text, UI elements, or titles like 'Home page', 'News', 'Menu'.

Return ONLY a valid JSON list of dictionaries, where each dictionary has four keys:
- 'korean' (the Korean text)
- 'transliteration' (the pronunciation transliterated into {translit_lang.upper()} script/characters, formatted as {translit_format}.{non_english})
- 'translation' (the brief translation into {target_lang.upper()})
- 'explanation' (a brief grammar or context note in {target_lang.upper()}).

Just output raw JSON with ```json and ``` markers, as the user will load in python. Example:

```json
[
  {{
    "korean": "날씨",
    "transliteration": "nal-ssi",
    "translation": "weather",
    "explanation": "Common noun used to describe weather conditions."
  }},
  {{
    "korean": "맛있다",
    "transliteration": "ma-sit-da",
    "translation": "to be delicious",
    "explanation": "Descriptive verb. Polite form: 맛있어요. Used to compliment food."
  }}
]
```

CRITICAL: Do NOT overthink. Do NOT deliberate over conditions, edge cases, or reasoning. Keep your thinking extremely brief (a few words at most). Output the JSON array IMMEDIATELY without lengthy analysis.


"""
    
    # DEBUG: Log prompt text
    if not IS_HF:
        with open(os.path.join(LOG_DIR, "debug_vlm_prompt.txt"), "w", encoding="utf-8") as f:
            f.write(prompt_text)

    content = []
    pil_images = []
    
    for i, img in enumerate(images):
        # DEBUG: Log images
        img.save(os.path.join(LOG_DIR, f"debug_image_{i}.png"), format="PNG")
        pil_images.append(img)
        
        content.append({
            "type": "image",
        })
        
    content += [{"type": "text", "text": prompt_text}]

    messages = [
        {
            "role": "user",
            "content": content
        }
    ]

    try:
        model.to("cuda")
        text = processor.apply_chat_template(messages, tokenize=False, add_generation_prompt=True, enable_thinking=enable_thinking)
        if not enable_thinking:
            # Non-think mode: force JSON output immediately
            text += "```json\n[\n"
        elif partial_assistant_text:
            text += partial_assistant_text + "\nReady to generate.\n</think>\n\n```json\n[\n"
            
        inputs = processor(
            text=[text],
            images=pil_images if pil_images else None,
            return_tensors="pt",
            padding=True
        ).to("cuda")
        
        from transformers import TextIteratorStreamer, StoppingCriteria, StoppingCriteriaList
        from threading import Thread
        import queue

        local_stop = [False]
        
        class LocalKillCriteria(StoppingCriteria):
            def __call__(self, input_ids, scores, **kwargs):
                return local_stop[0] or global_kill_threads[0]

        def run_generation(cur_inputs, cur_streamer, cur_local_stop):
            """Run model.generate in a thread, always calling streamer.end() on exit."""
            kill_criteria = StoppingCriteriaList([LocalKillCriteria()])
            gen_kwargs = dict(
                **cur_inputs,
                streamer=cur_streamer,
                max_new_tokens=2048*16,
                do_sample=True,
                repetition_penalty=repetition_penalty_val,
                stopping_criteria=kill_criteria
            )
            if len(images) > 0:
                gen_kwargs.update(dict(temperature=0.6, top_p=0.95, top_k=20, min_p=0.0))
            else:
                gen_kwargs.update(dict(temperature=1.0, top_p=0.95, top_k=20, min_p=0.0))
            try:
                model.generate(**gen_kwargs)
            except Exception as e:
                import traceback
                print(f"\n[THREAD ERROR] model.generate crashed: {e}")
                traceback.print_exc()
            finally:
                try:
                    cur_streamer.end()
                except Exception:
                    pass

        output_text = partial_assistant_text + "\n</think>\n\n```json\n[\n" if partial_assistant_text else ("" if enable_thinking else "")

        streamer = TextIteratorStreamer(processor.tokenizer, skip_prompt=True, skip_special_tokens=True)
        thread = Thread(target=run_generation, args=(inputs, streamer, local_stop))
        thread.start()
        
        force_triggered = False
        AUTO_FORCE_CHARS = auto_force_chars
        for new_text in streamer:
            output_text += new_text
            yield output_text, None
            
            # Auto-force JSON if thinking exceeds 300 chars without producing JSON
            should_auto_force = (
                enable_thinking
                and not force_triggered
                and not partial_assistant_text
                and len(output_text) > AUTO_FORCE_CHARS
                and '```json' not in output_text
            )
            
            # Check if user clicked "Stop thinking" OR auto-force threshold reached
            if (global_stop_thinking[0] or should_auto_force) and not force_triggered:
                force_triggered = True
                reason = f"auto-force (>{AUTO_FORCE_CHARS} chars)" if should_auto_force else "user clicked stop"
                print(f"[STOP-THINK] Force triggered ({reason})! Killing current generation...")
                
                # 1. Kill the current generation thread
                local_stop[0] = True
                # Drain queue so the thread can exit
                while not streamer.text_queue.empty():
                    try:
                        streamer.text_queue.get_nowait()
                    except queue.Empty:
                        break
                thread.join(timeout=5)
                print("[STOP-THINK] Old thread joined. Starting forced JSON generation...")
                
                # 2. Reset flags
                global_stop_thinking[0] = False
                local_stop[0] = False
                
                # 3. Append the think-closing + JSON prefix
                output_text += "\nReady to generate.\n</think>\n\n```json\n[\n"
                yield output_text, None
                
                # 4. Build new prompt with partial assistant text
                text2 = processor.apply_chat_template(messages, tokenize=False, add_generation_prompt=True)
                text2 += output_text
                inputs2 = processor(
                    text=[text2],
                    images=pil_images if pil_images else None,
                    return_tensors="pt",
                    padding=True
                ).to("cuda")
                
                # 5. Start new generation thread with force-JSON context
                # This loop also monitors stop_thinking so user can force again if model keeps thinking
                streamer2 = TextIteratorStreamer(processor.tokenizer, skip_prompt=True, skip_special_tokens=True)
                thread2 = Thread(target=run_generation, args=(inputs2, streamer2, local_stop))
                thread2.start()
                
                HARD_FORCE_CHARS = 10_000
                for new_text2 in streamer2:
                    output_text += new_text2
                    yield output_text, None
                    
                    # Hard auto-force: if total output exceeds 10K chars,
                    # the model has been rambling too long — force again regardless
                    # of JSON state (the model may complete JSON then start over).
                    should_hard_force = len(output_text) > HARD_FORCE_CHARS
                    
                    # Allow user to force again OR hard auto-force kicks in
                    if global_stop_thinking[0] or global_kill_threads[0] or should_hard_force:
                        reason = "hard auto-force (>10K chars)" if should_hard_force and not global_stop_thinking[0] else "user/kill flag"
                        print(f"[STOP-THINK] Flag detected in forced generation loop ({reason})! Killing...")
                        local_stop[0] = True
                        while not streamer2.text_queue.empty():
                            try:
                                streamer2.text_queue.get_nowait()
                            except queue.Empty:
                                break
                        thread2.join(timeout=5)
                        global_stop_thinking[0] = False
                        local_stop[0] = False
                        
                        # Force JSON prefix again
                        output_text += "\nReady to generate.\n</think>\n\n```json\n[\n"
                        yield output_text, None
                        
                        text3 = processor.apply_chat_template(messages, tokenize=False, add_generation_prompt=True)
                        text3 += output_text
                        inputs3 = processor(
                            text=[text3],
                            images=pil_images if pil_images else None,
                            return_tensors="pt",
                            padding=True
                        ).to("cuda")
                        
                        streamer3 = TextIteratorStreamer(processor.tokenizer, skip_prompt=True, skip_special_tokens=True)
                        thread3 = Thread(target=run_generation, args=(inputs3, streamer3, local_stop))
                        thread3.start()
                        
                        for new_text3 in streamer3:
                            output_text += new_text3
                            yield output_text, None
                        
                        thread3.join(timeout=10)
                        break
                else:
                    thread2.join(timeout=10)
                break  # Exit the outer streamer loop
        
        if not force_triggered:
            thread.join()
        
        # Reset flag in case it was set but generation finished naturally
        global_stop_thinking[0] = False

        # DEBUG: Log raw output text
        if not IS_HF:
            with open(os.path.join(LOG_DIR, "debug_vlm_output.txt"), "w", encoding="utf-8") as f:
                f.write(output_text)
            
    except Exception as e:
        print(f"Error during Transformers inference: {e}")
        yield f"Error during Transformers inference: {e}", []
        return

    try:
        import re
        # Extract JSON from markdown code fences or raw output
        json_matches = list(re.finditer(r'```(?:json)?\s*([\s\S]*?)```', output_text))
        if json_matches:
            clean_text = json_matches[-1].group(1).strip()
        else:
            # Fallback: find last [ ... ] or { ... } block
            json_matches = list(re.finditer(r'(\[[\s\S]*\]|\{[\s\S]*\})', output_text))
            clean_text = json_matches[-1].group(1).strip() if json_matches else output_text.strip()
        try:
            data = json.loads(clean_text)
        except:
            import jiter
            # Get bytes from string
            data = jiter.from_json(clean_text.encode("utf-8"), partial_mode=True)
        
        if not isinstance(data, list):
            data = [data]
        yield output_text, data
    except Exception as e:
        print(f"Error parsing JSON: {e}\nRaw output: {output_text}")
        yield output_text, []

def translate_vocabulary(korean_words, translit_lang, translit_format, target_lang, repetition_penalty_val=1.1, enable_thinking=True):
    """Use Transformers text-only inference to translate/transliterate Korean words."""
    global model, processor
    
    non_english = ""
    if translit_lang.upper() != "ENGLISH":
        non_english = f" CRITICAL: You MUST use the native alphabet/script of {translit_lang.upper()}, do NOT use English letters unless requested."
    
    words_str = ", ".join(korean_words)
    prompt_text = f"""Translate and transliterate the following Korean words.
Return ONLY a valid JSON list of dictionaries, where each dictionary has four keys:
- 'korean' (the original Korean text)
- 'transliteration' (the pronunciation transliterated into {translit_lang.upper()} script/characters, formatted as {translit_format}.{non_english})
- 'translation' (the translation into {target_lang.upper()})
- 'explanation' (a brief grammar or context note in {target_lang.upper()}).
No markdown formatting, just raw JSON with ```json and ``` markers.
CRITICAL: Do NOT overthink. Do NOT deliberate over conditions, edge cases, or reasoning. Keep your thinking extremely brief (5 paragraphs at most). Output the JSON array IMMEDIATELY without lengthy analysis.

Korean words:
{words_str}
"""

    # DEBUG: Log translation prompt text
    if not IS_HF:
        with open(os.path.join(LOG_DIR, "debug_translate_prompt.txt"), "w", encoding="utf-8") as f:
            f.write(prompt_text)

    messages = [
        {
            "role": "user",
            "content": [{"type": "text", "text": prompt_text}]
        }
    ]

    try:
        model.to("cuda")
        text = processor.apply_chat_template(messages, tokenize=False, add_generation_prompt=True, enable_thinking=enable_thinking)
        if not enable_thinking:
            text += "```json\n[\n"
        inputs = processor(
            text=[text],
            images=None,
            return_tensors="pt",
            padding=True
        ).to("cuda")

        generated_ids = model.generate(
            **inputs,
            # max_new_tokens=2048*16,
            max_new_tokens=2048*2,
            # temperature=1.0,
            # top_p=0.95,
            temperature=1.0, top_p=0.95, top_k=20, min_p=0.0, 
            # presence_penalty=1.5, 
            repetition_penalty=repetition_penalty_val,
            do_sample=True
        )
        
        generated_ids = [
            output_ids[len(input_ids):] for input_ids, output_ids in zip(inputs.input_ids, generated_ids)
        ]
        output_text = processor.batch_decode(generated_ids, skip_special_tokens=True)[0]
        
        # DEBUG: Log raw translation output text
        if not IS_HF:
            with open(os.path.join(LOG_DIR, "debug_translate_output.txt"), "w", encoding="utf-8") as f:
                f.write(output_text)
            
    except Exception as e:
        print(f"Error during Transformers text inference: {e}")
        return []

    try:
        import re
        json_matches = list(re.finditer(r'```(?:json)?\s*([\s\S]*?)```', output_text))
        if json_matches:
            clean_text = json_matches[-1].group(1).strip()
        else:
            json_matches = list(re.finditer(r'(\[[\s\S]*\]|\{[\s\S]*\})', output_text))
            clean_text = json_matches[-1].group(1).strip() if json_matches else output_text.strip()
            
        try:
            data = json.loads(clean_text)
        except:
            import jiter
            data = jiter.from_json(clean_text.encode("utf-8"), partial_mode=True)
            
        if not isinstance(data, list):
            data = [data]
        return data
    except Exception as e:
        print(f"Error parsing JSON: {e}\nRaw output: {output_text}")
        return []

def numpy_to_base64_audio(wav, sample_rate):
    wav = wav.squeeze()
    buffer = io.BytesIO()
    sf.write(buffer, wav, sample_rate, format='WAV')
    buffer.seek(0)
    audio_base64 = base64.b64encode(buffer.read()).decode('utf-8')
    return f"data:audio/wav;base64,{audio_base64}"

import hashlib

def hash_file(filepath):
    with open(filepath, 'rb') as f:
        return hashlib.md5(f.read(1024*1024)).hexdigest()

@spaces.GPU(duration=180)
def process_pdf(pdf_file, url_input, audio_file_input, yt_url_input, yt_cookies_file, translit_lang, translit_format, target_lang, max_text_char, repetition_penalty_val, auto_force_chars_val, last_source_hash, last_korean_words, active_tab, enable_thinking=True, progress=gr.Progress()):
    global tts, voice_style
    
    # Clean language choices from "Family - Language" to just "Language"
    if " - " in translit_lang:
        translit_lang = translit_lang.split(" - ")[-1]
    if " - " in target_lang:
        target_lang = target_lang.split(" - ")[-1]
        
    os.makedirs(LOG_DIR, exist_ok=True)
    
    # Reset flags at start of new generation
    reset_generation_flags()
    
    # Determine input source based on active tab
    is_url = (active_tab == "Website URL") and bool(url_input and url_input.strip())
    is_youtube = (active_tab == "YouTube Link") and bool(yt_url_input and yt_url_input.strip() and is_youtube_url(yt_url_input.strip()))
    is_audio_upload = (active_tab == "Upload Audio") and (audio_file_input is not None)
    is_pdf = (active_tab == "Upload PDF") and (pdf_file is not None)
    
    if not is_url and not is_youtube and not is_audio_upload and not is_pdf:
        yield "<p>Please provide input in the active tab.</p>", None, None, "", "", [], None
        return
        
    if is_youtube:
        current_source_hash = hashlib.md5(yt_url_input.strip().encode()).hexdigest()
    elif is_audio_upload:
        current_source_hash = hash_file(audio_file_input)
    elif is_url:
        current_source_hash = hashlib.md5(url_input.strip().encode()).hexdigest()
    else:
        current_source_hash = hash_file(pdf_file.name)
        
    vocab_list = []
    extracted_audio_path = None

    try:
        if is_youtube:
            progress(0, desc="Downloading YouTube audio (first 5 min)...")
            cookies_path = yt_cookies_file.name if yt_cookies_file else None
            audio_path, yt_title = extract_youtube_audio(yt_url_input.strip(), max_duration_sec=300, cookiefile=cookies_path)
            
            progress(0.1, desc=f"Transcribing audio with Cohere ASR...")
            content_text = transcribe_audio_with_asr(audio_path)
            images = []
            extracted_audio_path = audio_path
                
            if not content_text.strip():
                yield "<p>Could not transcribe any text from the YouTube video.</p>", current_source_hash, None, "", "", [], extracted_audio_path
                return
                
            # Log the transcription
            if not IS_HF:
                with open(os.path.join(LOG_DIR, "debug_yt_transcription.txt"), "w", encoding="utf-8") as f:
                    f.write(f"Title: {yt_title}\n\n{content_text}")
        elif is_audio_upload:
            progress(0, desc="Transcribing uploaded audio with Cohere ASR...")
            content_text = transcribe_audio_with_asr(audio_file_input)
            images = []
            extracted_audio_path = audio_file_input
                
            if not content_text.strip():
                yield "<p>Could not transcribe any text from the uploaded audio.</p>", current_source_hash, None, "", "", [], extracted_audio_path
                return
                
            if not IS_HF:
                with open(os.path.join(LOG_DIR, "debug_audio_transcription.txt"), "w", encoding="utf-8") as f:
                    f.write(content_text)
        elif is_url:
            progress(0, desc="Fetching Website...")
            content_text, images = extract_website_content(url_input.strip())
        else:
            progress(0, desc="Reading PDF...")
            content_text, images = extract_pdf_content(pdf_file.name)
            
        if not content_text.strip() and not images:
            yield "<p>No content found.</p>", current_source_hash, None, "", "", [], extracted_audio_path
            return
    except Exception as e:
        import traceback
        traceback.print_exc()
        yield f"<p>Error reading content: {e}</p>", None, None, "", "", [], None
        return

    vocab_list = []
    stream_text = ""
    for attempt in range(1, 4):
        if global_kill_threads[0]:
            print("[KILL] Kill flag detected, stopping extraction attempts.")
            break
        progress(0.2, desc=f"Extracting vocabulary (Attempt {attempt}/3)...")
        for stream_t, v_list in extract_vocabulary(content_text, images, translit_lang, translit_format, target_lang, max_text_char, repetition_penalty_val, auto_force_chars=auto_force_chars_val, enable_thinking=enable_thinking):
            stream_text = stream_t
            if v_list is not None:
                vocab_list = v_list
            yield "", current_source_hash, None, stream_text, content_text, images, extracted_audio_path
            
        if vocab_list:
            break

    # Reset kill flag after extraction so TTS can proceed
    global_kill_threads[0] = False

    # If generation was killed but we don't have vocab yet, try to salvage JSON from stream_text
    if not vocab_list and stream_text:
        print("[KILL] Attempting to salvage JSON from partial generation output...")
        try:
            import re
            json_matches = list(re.finditer(r'```(?:json)?\s*([\s\S]*?)```', stream_text))
            if json_matches:
                clean_text = json_matches[-1].group(1).strip()
            else:
                json_matches = list(re.finditer(r'(\[[\s\S]*\]|\{[\s\S]*\})', stream_text))
                clean_text = json_matches[-1].group(1).strip() if json_matches else ""
            
            if clean_text:
                try:
                    data = json.loads(clean_text)
                except:
                    import jiter
                    data = jiter.from_json(clean_text.encode("utf-8"), partial_mode=True)
                if not isinstance(data, list):
                    data = [data]
                if data and isinstance(data[0], dict) and 'korean' in data[0]:
                    vocab_list = data
                    print(f"[KILL] Salvaged {len(vocab_list)} vocab items from partial output!")
        except Exception as e:
            print(f"[KILL] Could not salvage JSON: {e}")

    if not vocab_list:
        yield "<p>Failed to extract or translate vocabulary after 3 attempts.</p>", current_source_hash, None, stream_text, content_text, images, extracted_audio_path
        return

    progress(0.6, desc="Generating TTS audio...")
    # Pre-generate TTS audio
    for i, item in enumerate(vocab_list):
        korean = item.get("korean", "")
        # Add dot
        if not korean.endswith("."):
            korean += "."
            
        try:
            wav, dur = tts.synthesize(
                korean, voice_style=voice_style, lang="ko",
                total_steps=12,
                speed=0.7,
            )
            
            # DEBUG: Save audio locally
            if not IS_HF:
                wav_1d = wav.squeeze()
                sf.write(os.path.join(LOG_DIR, f"debug_audio_{i}.wav"), wav_1d, tts.sample_rate, format='WAV')
            
            audio_data_uri = numpy_to_base64_audio(wav, tts.sample_rate)
            item['audio_uri'] = audio_data_uri
        except Exception as e:
            print(f"TTS error for '{korean}': {e}")
            item['audio_uri'] = None

    cards_json = json.dumps(vocab_list).replace("</", "<\\/")

    iframe_html = f"""
    <!DOCTYPE html>
    <html>
    <head>
    <!-- Flaticon UIcons CDN -->
    <link rel='stylesheet' href='https://cdn-uicons.flaticon.com/uicons-regular-rounded/css/uicons-regular-rounded.css'>
    <style>
        body {{
            margin: 0;
            padding: 0;
            background: transparent;
        }}
        .flashcard-container {{
            perspective: 1000px;
            width: 100%;
            max-width: 500px;
            margin: 0 auto;
            font-family: 'Inter', sans-serif;
            padding-top: 20px;
        }}
        .flashcard {{
            width: 100%;
            min-height: 400px;
            display: grid;
            transition: transform 0.6s cubic-bezier(0.4, 0.2, 0.2, 1);
            transform-style: preserve-3d;
            cursor: pointer;
        }}
        .flashcard.is-flipped {{
            transform: rotateY(180deg);
        }}
        .card-face {{
            grid-area: 1 / 1;
            width: 100%;
            backface-visibility: hidden;
            display: flex;
            flex-direction: column;
            justify-content: center;
            align-items: center;
            border-radius: 20px;
            box-shadow: 0 10px 30px rgba(0,0,0,0.1);
            padding: 30px;
            box-sizing: border-box;
            background: rgba(15, 23, 42, 0.6);
            backdrop-filter: blur(15px);
            border: 1px solid rgba(255, 255, 255, 0.1);
            text-align: center;
            box-shadow: inset 0 0 0 1px rgba(255, 255, 255, 0.05), 0 10px 40px rgba(0, 0, 0, 0.5);
        }}
        .card-front {{
            background: linear-gradient(135deg, rgba(30, 41, 59, 0.9) 0%, rgba(15, 23, 42, 0.9) 100%);
            border-top: 2px solid rgba(139, 92, 246, 0.5);
        }}
        .card-back {{
            transform: rotateY(180deg);
            background: linear-gradient(135deg, rgba(30, 58, 138, 0.9) 0%, rgba(15, 23, 42, 0.9) 100%);
            border-top: 2px solid rgba(56, 189, 248, 0.5);
            color: #f8fafc;
        }}
        .korean-text {{
            font-size: 54px;
            font-weight: 700;
            color: #ffffff;
            text-shadow: 0 0 20px rgba(139, 92, 246, 0.6);
            margin-bottom: 20px;
        }}
        .english-text {{
            font-size: 34px;
            font-weight: 700;
            color: #ffffff;
            text-shadow: 0 0 15px rgba(56, 189, 248, 0.6);
            margin-bottom: 5px;
        }}
        .translit-text {{
            font-size: 20px;
            font-style: italic;
            color: #fca5a5;
            margin-bottom: 15px;
            letter-spacing: 1px;
        }}
        .explanation-text {{
            font-size: 16px;
            color: #cbd5e1;
            line-height: 1.6;
            background: rgba(0,0,0,0.2);
            padding: 15px;
            border-radius: 12px;
            border: 1px solid rgba(255,255,255,0.05);
        }}
        .nav-buttons {{
            display: flex;
            justify-content: space-between;
            margin-top: 30px;
            width: 100%;
            max-width: 500px;
            margin-left: auto;
            margin-right: auto;
        }}
        .nav-btn {{
            padding: 14px 28px;
            border: none;
            border-radius: 16px;
            background: rgba(139, 92, 246, 0.2);
            backdrop-filter: blur(5px);
            border: 1px solid rgba(139, 92, 246, 0.5);
            color: white;
            font-weight: 600;
            cursor: pointer;
            text-transform: uppercase;
            letter-spacing: 1px;
            transition: all 0.3s ease;
            box-shadow: 0 4px 15px rgba(0,0,0,0.2);
        }}
        .nav-btn:hover {{
            background: rgba(139, 92, 246, 0.5);
            transform: translateY(-2px);
            box-shadow: 0 6px 20px rgba(139, 92, 246, 0.4);
        }}
            transition: all 0.2s;
            box-shadow: 0 4px 12px rgba(124, 58, 237, 0.3);
            flex: 1;
            margin: 0 10px;
            display: flex;
            align-items: center;
            justify-content: center;
            gap: 8px;
        }}
        .nav-btn:hover {{
            background: #6d28d9;
            transform: translateY(-2px);
        }}
        .nav-btn:disabled {{
            background: #ccc;
            cursor: not-allowed;
            transform: none;
            box-shadow: none;
        }}
        .audio-btn {{
            margin-top: 15px;
            padding: 12px 24px;
            background: rgba(56, 189, 248, 0.2);
            color: #38bdf8;
            border: 1px solid rgba(56, 189, 248, 0.4);
            border-radius: 20px;
            font-size: 15px;
            font-weight: 600;
            cursor: pointer;
            transition: all 0.3s cubic-bezier(0.4, 0, 0.2, 1);
            display: flex;
            align-items: center;
            justify-content: center;
            gap: 8px;
            text-transform: uppercase;
            letter-spacing: 1px;
        }}
        .audio-btn:hover {{
            background: rgba(56, 189, 248, 0.4);
            transform: scale(1.05) translateY(-2px);
            box-shadow: 0 5px 15px rgba(56, 189, 248, 0.3);
        }}
        .progress {{
            text-align: center;
            margin-top: 15px;
            color: #666;
            font-size: 14px;
            font-weight: 600;
        }}
        .copy-icon {{
            cursor: pointer;
            color: #a0a0a0;
            font-size: 24px;
            transition: color 0.2s, transform 0.2s;
        }}
        .copy-icon:hover {{
            color: #7c3aed;
            transform: scale(1.1);
        }}
    </style>
    </head>
    <body>
    <div id="flashcard-app">
        <div class="flashcard-container">
            <div class="flashcard" id="card" onclick="flipCard()">
                <div class="card-face card-front">
                    <div style="display: flex; align-items: center; justify-content: center; gap: 15px; margin-bottom: 20px; width: 100%;">
                        <div class="korean-text" id="front-text" style="margin-bottom: 0;"><i class="fi fi-rr-spinner-third fa-spin"></i> Loading...</div>
                        <i class="fi fi-rr-copy copy-icon" id="copy-ko" onclick="copyText('front-text', event, this)" title="Copy text" style="display:none;"></i>
                    </div>
                    <button class="audio-btn" onclick="playAudio(event)" id="audio-btn" style="display:none;"><i class="fi fi-rr-play-circle"></i> Play Audio</button>
                    <p style="margin-top:20px; color:#999; font-size:13px; display:flex; align-items:center; gap:5px;"><i class="fi fi-rr-rotate-right"></i> Click card to flip 🎯</p>
                </div>
                <div class="card-face card-back">
                    <div style="display: flex; align-items: center; justify-content: center; gap: 15px; margin-bottom: 5px; width: 100%;">
                        <div class="english-text" id="back-en" style="margin-bottom: 0;"></div>
                        <i class="fi fi-rr-copy copy-icon" id="copy-en" onclick="copyText('back-en', event, this)" title="Copy text" style="display:none;"></i>
                    </div>
                    <div class="translit-text" id="back-translit"></div>
                    <div class="explanation-text"><i class="fi fi-rr-lightbulb-on" style="color:#f1c40f;"></i> <span id="back-exp"></span></div>
                </div>
            </div>
        </div>
        <div class="nav-buttons">
            <button class="nav-btn" id="prev-btn" onclick="prevCard()"><i class="fi fi-rr-angle-left"></i> Previous</button>
            <button class="nav-btn" id="next-btn" onclick="nextCard()">Next <i class="fi fi-rr-angle-right"></i></button>
        </div>
        <div class="progress" id="progress-text"></div>
    </div>

    <script>
        const cards = {cards_json};
        let currentIndex = 0;
        let audioPlayer = new Audio();

        function updateCard() {{
            if (!cards || cards.length === 0) {{
                document.getElementById('front-text').innerHTML = "No vocabulary found 😥";
                document.getElementById('prev-btn').disabled = true;
                document.getElementById('next-btn').disabled = true;
                if(document.getElementById('copy-ko')) document.getElementById('copy-ko').style.display = 'none';
                if(document.getElementById('copy-en')) document.getElementById('copy-en').style.display = 'none';
                return;
            }}
            const card = cards[currentIndex];
            document.getElementById('front-text').innerText = card.korean || "No word";
            document.getElementById('back-en').innerText = card.translation || card.english || "";
            document.getElementById('back-translit').innerText = card.transliteration ? `[${{card.transliteration}}]` : "";
            document.getElementById('back-exp').innerText = card.explanation || "";
            
            if(document.getElementById('copy-ko')) document.getElementById('copy-ko').style.display = 'block';
            if(document.getElementById('copy-en')) document.getElementById('copy-en').style.display = 'block';
            
            document.getElementById('prev-btn').disabled = currentIndex === 0;
            document.getElementById('next-btn').disabled = currentIndex === cards.length - 1;
            document.getElementById('progress-text').innerHTML = `📚 Card ${{currentIndex + 1}} of ${{cards.length}}`;
            
            const cardEl = document.getElementById('card');
            cardEl.classList.remove('is-flipped');
            
            if(card.audio_uri) {{
                audioPlayer.src = card.audio_uri;
                document.getElementById('audio-btn').style.display = 'flex';
            }} else {{
                document.getElementById('audio-btn').style.display = 'none';
            }}
        }}

        function flipCard() {{
            if (!cards || cards.length === 0) return;
            document.getElementById('card').classList.toggle('is-flipped');
        }}

        function playAudio(e) {{
            e.stopPropagation(); 
            audioPlayer.play().catch(err => console.log("Audio play error:", err));
        }}

        function nextCard() {{
            if (currentIndex < cards.length - 1) {{
                currentIndex++;
                updateCard();
            }}
        }}

        function prevCard() {{
            if (currentIndex > 0) {{
                currentIndex--;
                updateCard();
            }}
        }}

        function copyText(elementId, e, iconEl) {{
            e.stopPropagation();
            const textToCopy = document.getElementById(elementId).innerText;
            navigator.clipboard.writeText(textToCopy).then(() => {{
                const oldClass = iconEl.className;
                iconEl.className = "fi fi-rr-check copy-icon";
                iconEl.style.color = "#27ae60";
                setTimeout(() => {{
                    iconEl.className = oldClass;
                    iconEl.style.color = "";
                }}, 1500);
            }}).catch(err => console.log('Copy failed', err));
        }}

        window.onload = function() {{
            updateCard();
        }};
    </script>
    </body>
    </html>
    """
    
    fc_html = build_flashcard_html(vocab_list)
    yield fc_html, current_source_hash, vocab_list, stream_text, content_text, images, extracted_audio_path

LANGUAGE_DATA = """Indo-European	Bengali, English, French, Portuguese, German, Romanian, Swedish, Danish, Bulgarian, Russian, Czech, Greek, Ukrainian, Spanish, Dutch, Slovak, Croatian, Polish, Lithuanian, Norwegian Bokmål, Norwegian Nynorsk, Persian, Slovenian, Gujarati, Latvian, Italian, Occitan, Nepali, Marathi, Belarusian, Serbian, Luxembourgish, Venetian, Assamese, Welsh, Silesian, Asturian, Chhattisgarhi, Awadhi, Maithili, Bhojpuri, Sindhi, Irish, Faroese, Hindi, Punjabi, Oriya, Tajik, Eastern Yiddish, Lombard, Ligurian, Sicilian, Friulian, Sardinian, Galician, Catalan, Icelandic, Tosk Albanian, Limburgish, Dari, Afrikaans, Macedonian, Sinhala, Urdu, Magahi, Bosnian, Armenian, Latgalian, Scottish Gaelic, Central Kurdish, Northern Kurdish, Southern Pashto, Sanskrit, Dhundari, Marwari, Ahirani, Bagheli, Bagri, Bundeli, Braj, Kumaoni, Kashmiri
Sino-Tibetan	Chinese (Simplified), Chinese (Traditional), Cantonese, Burmese, Standard Tibetan, Meitei
Afro-Asiatic	Arabic (Standard), Arabic (Najdi), Arabic (Levantine), Arabic (Egyptian), Arabic (Moroccan), Arabic (Mesopotamian), Arabic (Ta’izzi-Adeni), Arabic (Tunisian), Arabic (Gulf), Arabic (Algerian), Arabic (Sudanese), Arabic (Libyan), Hebrew, Maltese, Amharic, Tigrinya, Kabyle, Somali, West Central Oromo, Hausa
Austronesian	Indonesian, Malay, Tagalog, Cebuano, Javanese, Sundanese, Minangkabau, Balinese, Banjar, Pangasinan, Iloko, Waray (Philippines), Plateau Malagasy, Malagasy, Buginese, Maori, Samoan, Hawaiian, Fijian
Dravidian	Tamil, Telugu, Kannada, Malayalam
Turkic	Turkish, North Azerbaijani, Northern Uzbek, Kazakh, Bashkir, Tatar, Crimean Tatar, Kyrgyz, Turkmen, Uyghur
Tai-Kadai	Thai, Lao, Shan
Uralic	Finnish, Estonian, Hungarian, Meadow Mari
Austroasiatic	Vietnamese, Khmer
Niger–Congo	Yoruba, Ewe, Kinyarwanda, Lingala, Northern Sotho, Nyanja, Shona, Southern Sotho, Tswana, Xhosa, Zulu, Luganda, Swati, Tsonga, Tumbuka, Venda, Chokwe, Luba-Kasai, Rundi, Umbundu, Kikuyu, Kongo, Nigerian Fulfulde, Wolof, Fon, Kabiyè, Mossi, Akan, Twi, Bambara, Igbo"""
# Other	Japanese, Korean, Georgian, Basque, Haitian, Papiamento, Kabuverdianu, Tok Pisin, Swahili, Central Aymara, Tulu, Nagamese, Nigerian Pidgin, Mauritian Creole, Sango, Ayacucho Quechua, Halh Mongolian, Southwestern Dinka, Nuer, Guarani

LANGUAGE_CHOICES = []
for line in LANGUAGE_DATA.strip().split('\n'):
    family, langs = line.split('\t')
    for lang in langs.split(', '):
        LANGUAGE_CHOICES.append(f"{family} - {lang}")

import urllib.request

def get_example_pdf():
    url = "https://raw.githubusercontent.com/ShayekhBinIslam/file-host/main/cnp_korean_page7.pdf"
    file_path = "cnp_korean_page7.pdf"
    if not os.path.exists(file_path):
        try:
            urllib.request.urlretrieve(url, file_path)
        except Exception as e:
            print(f"Failed to download example PDF: {e}")
    return file_path if os.path.exists(file_path) else None

def get_example_audio():
    url = "https://raw.githubusercontent.com/ShayekhBinIslam/file-host/main/new_1min.wav"
    file_path = "new_1min.wav"
    if not os.path.exists(file_path):
        try:
            urllib.request.urlretrieve(url, file_path)
        except Exception as e:
            print(f"Failed to download example audio: {e}")
    return file_path if os.path.exists(file_path) else None

@spaces.GPU(duration=180)
def process_pdf_force(partial_text, pdf_file, url_input, translit_lang, translit_format, target_lang, max_text_char, repetition_penalty_val, last_source_state, last_korean_words_state):
    """Force JSON generation using the current partial stream_box text."""
    is_url = bool(url_input and url_input.strip())
    
    current_source_hash = ""
    if is_url:
        current_source_hash = "url:" + url_input.strip()
    elif pdf_file is not None:
        import hashlib
        with open(pdf_file.name, "rb") as f:
            current_source_hash = "pdf:" + hashlib.md5(f.read()).hexdigest()
            
    try:
        if is_url:
            progress(0, desc="Fetching Website...")
            content_text, images = extract_website_content(url_input.strip())
        else:
            progress(0, desc="Reading PDF...")
            content_text, images = extract_pdf_content(pdf_file.name)
            
        if not content_text.strip() and not images:
            yield "<p>No content found.</p>", current_source_hash, None, partial_text, "", [], None
            return
    except Exception as e:
        yield f"<p>Error reading content: {e}</p>", None, None, partial_text, "", [], None
        return

    vocab_list = []
    stream_text = partial_text
    
    progress(0.2, desc="Extracting vocabulary (Forced JSON)...")
    for stream_t, v_list in extract_vocabulary(content_text, images, translit_lang, translit_format, target_lang, max_text_char, repetition_penalty_val, partial_assistant_text=partial_text):
        stream_text = stream_t
        if v_list is not None:
            vocab_list = v_list
        yield "", current_source_hash, None, stream_text, content_text, images, None

    if not vocab_list:
        yield "<p>Failed to parse forced JSON.</p>", current_source_hash, None, stream_text, content_text, images, None
        return

    progress(0.6, desc="Generating TTS audio...")
    for i, item in enumerate(vocab_list):
        korean = item.get("korean", "")
        if korean and tts is not None:
            progress(0.6 + 0.3 * (i / len(vocab_list)), desc=f"Generating audio {i+1}/{len(vocab_list)}...")
            try:
                wav, dur = tts.synthesize(
                    korean, voice_style=voice_style, lang="ko",
                    total_steps=12,
                    speed=0.7,
                )
                import numpy as np
                import soundfile as sf
                
                if not IS_HF:
                    audio_path = os.path.join(LOG_DIR, f"audio_{i}.wav")
                    sf.write(audio_path, wav, 24000)
                item["audio_uri"] = numpy_to_base64_audio(wav, tts.sample_rate)
            except Exception as e:
                print(f"Failed to generate audio for {korean}: {e}")
                item["audio_uri"] = None

    progress(1.0, desc="Rendering flashcards...")
    fc_html = build_flashcard_html(vocab_list)
    yield fc_html, current_source_hash, vocab_list, stream_text, content_text, images, None


def build_flashcard_html(vocab_list):
    """Build the flashcard SPA with spaced repetition (SM-2 lite via localStorage)."""
    import html as _html
    cards_json = json.dumps(vocab_list).replace("</", "<\\/")

    iframe_html = f"""<!DOCTYPE html>
<html>
<head>
<meta charset="utf-8">
<link rel='stylesheet' href='https://cdn-uicons.flaticon.com/uicons-regular-rounded/css/uicons-regular-rounded.css'>
<style>
  * {{ box-sizing:border-box; margin:0; padding:0; }}
  body {{ background:transparent; font-family:'Outfit','Inter',sans-serif; color:#f8fafc; padding:12px 8px; }}
  .sr-header {{ display:flex; align-items:center; gap:10px; margin-bottom:12px; }}
  .sr-bar-wrap {{ flex:1; height:7px; background:rgba(255,255,255,.1); border-radius:4px; overflow:hidden; }}
  .sr-bar-fill {{ height:100%; background:linear-gradient(90deg,#22c55e,#3b82f6); border-radius:4px; transition:width .5s ease; }}
  .sr-stats-txt {{ font-size:12px; color:#94a3b8; white-space:nowrap; }}
  .due-btn {{ padding:5px 13px; border-radius:20px; border:1px solid rgba(56,189,248,.4); background:rgba(56,189,248,.1); color:#38bdf8; font-size:12px; font-weight:700; cursor:pointer; transition:all .2s; white-space:nowrap; }}
  .due-btn.active {{ background:rgba(56,189,248,.3); border-color:#38bdf8; box-shadow:0 0 10px rgba(56,189,248,.4); }}
  .due-btn:hover {{ background:rgba(56,189,248,.25); }}
  .fc-container {{ perspective:1000px; width:100%; max-width:520px; margin:0 auto; }}
  .flashcard {{ width:100%; min-height:330px; display:grid; transition:transform .6s cubic-bezier(.4,.2,.2,1); transform-style:preserve-3d; cursor:pointer; }}
  .flashcard.is-flipped {{ transform:rotateY(180deg); }}
  .card-face {{ grid-area:1/1; width:100%; backface-visibility:hidden; display:flex; flex-direction:column; justify-content:center; align-items:center; border-radius:20px; padding:28px; box-sizing:border-box; text-align:center; }}
  .card-front {{ background:linear-gradient(135deg,rgba(30,41,59,.95) 0%,rgba(15,23,42,.95) 100%); border-top:2px solid rgba(139,92,246,.6); box-shadow:0 10px 40px rgba(0,0,0,.5),inset 0 0 0 1px rgba(255,255,255,.05); position:relative; }}
  .card-back {{ transform:rotateY(180deg); background:linear-gradient(135deg,rgba(30,58,138,.95) 0%,rgba(15,23,42,.95) 100%); border-top:2px solid rgba(56,189,248,.6); box-shadow:0 10px 40px rgba(0,0,0,.5),inset 0 0 0 1px rgba(255,255,255,.05); }}
  .sr-badge {{ position:absolute; top:12px; right:14px; font-size:10px; padding:3px 9px; border-radius:12px; font-weight:800; letter-spacing:.5px; }}
  .badge-new {{ background:rgba(139,92,246,.3); color:#c084fc; }}
  .badge-learning {{ background:rgba(239,68,68,.3); color:#fca5a5; }}
  .badge-known {{ background:rgba(34,197,94,.3); color:#86efac; }}
  .badge-due {{ background:rgba(251,191,36,.3); color:#fde68a; }}
  .ko-text {{ font-size:50px; font-weight:800; color:#fff; text-shadow:0 0 20px rgba(139,92,246,.7); margin-bottom:14px; line-height:1.2; }}
  .en-text {{ font-size:28px; font-weight:800; color:#fff; text-shadow:0 0 15px rgba(56,189,248,.7); margin-bottom:6px; }}
  .tr-text {{ font-size:17px; font-style:italic; color:#fca5a5; margin-bottom:12px; letter-spacing:1px; }}
  .exp-text {{ font-size:14px; color:#cbd5e1; line-height:1.6; background:rgba(0,0,0,.25); padding:12px 15px; border-radius:12px; border:1px solid rgba(255,255,255,.06); max-width:100%; }}
  .flip-hint {{ margin-top:14px; color:#475569; font-size:12px; display:flex; align-items:center; gap:5px; }}
  .audio-btn {{ margin-top:10px; padding:9px 20px; background:rgba(56,189,248,.15); color:#38bdf8; border:1px solid rgba(56,189,248,.4); border-radius:20px; font-size:13px; font-weight:700; cursor:pointer; transition:all .3s; display:flex; align-items:center; gap:6px; text-transform:uppercase; letter-spacing:.5px; }}
  .audio-btn:hover {{ background:rgba(56,189,248,.35); transform:scale(1.04); box-shadow:0 5px 15px rgba(56,189,248,.3); }}
  .copy-icon {{ cursor:pointer; color:#475569; font-size:18px; transition:color .2s,transform .2s; flex-shrink:0; }}
  .copy-icon:hover {{ color:#8b5cf6; transform:scale(1.15); }}
  .sr-actions {{ display:flex; justify-content:center; gap:10px; margin-top:18px; width:100%; max-width:520px; margin-left:auto; margin-right:auto; }}
  .sr-btn {{ flex:1; padding:12px 8px; border:none; border-radius:14px; font-weight:700; font-size:13px; cursor:pointer; transition:all .25s cubic-bezier(.4,0,.2,1); display:flex; align-items:center; justify-content:center; gap:5px; font-family:inherit; }}
  .sr-dk {{ background:rgba(239,68,68,.2); border:1px solid rgba(239,68,68,.5); color:#fca5a5; }}
  .sr-dk:hover {{ background:rgba(239,68,68,.4); transform:translateY(-2px); box-shadow:0 6px 20px rgba(239,68,68,.3); }}
  .sr-sk {{ background:rgba(100,116,139,.2); border:1px solid rgba(100,116,139,.5); color:#94a3b8; }}
  .sr-sk:hover {{ background:rgba(100,116,139,.4); transform:translateY(-2px); }}
  .sr-kn {{ background:rgba(34,197,94,.2); border:1px solid rgba(34,197,94,.5); color:#86efac; }}
  .sr-kn:hover {{ background:rgba(34,197,94,.4); transform:translateY(-2px); box-shadow:0 6px 20px rgba(34,197,94,.3); }}
  .nav-buttons {{ display:flex; justify-content:space-between; align-items:center; margin-top:10px; width:100%; max-width:520px; margin-left:auto; margin-right:auto; gap:10px; }}
  .nav-btn {{ padding:9px 18px; border-radius:14px; background:rgba(139,92,246,.15); border:1px solid rgba(139,92,246,.4); color:white; font-weight:700; cursor:pointer; transition:all .25s; display:flex; align-items:center; gap:5px; font-size:13px; font-family:inherit; }}
  .nav-btn:hover {{ background:rgba(139,92,246,.4); transform:translateY(-2px); box-shadow:0 5px 15px rgba(139,92,246,.3); }}
  .nav-btn:disabled {{ background:rgba(100,116,139,.1); border-color:rgba(100,116,139,.2); color:#334155; cursor:not-allowed; transform:none; box-shadow:none; }}
  .progress {{ text-align:center; margin-top:8px; color:#475569; font-size:13px; font-weight:600; }}
</style>
</head>
<body>
<div id="fc-app">
  <div class="sr-header">
    <div class="sr-bar-wrap"><div class="sr-bar-fill" id="sr-fill" style="width:0%"></div></div>
    <span class="sr-stats-txt" id="sr-stats"></span>
    <button class="due-btn" id="due-btn" onclick="toggleReview()">📅 Due Cards</button>
  </div>
  <div class="fc-container">
    <div class="flashcard" id="card" onclick="flipCard()">
      <div class="card-face card-front">
        <span class="sr-badge badge-new" id="sr-badge">🆕 NEW</span>
        <div style="display:flex;align-items:center;gap:10px;margin-bottom:14px;width:100%;justify-content:center;">
          <div class="ko-text" id="front-text"><i class="fi fi-rr-spinner-third"></i></div>
          <i class="fi fi-rr-copy copy-icon" id="copy-ko" onclick="copyText('front-text',event,this)" style="display:none;"></i>
        </div>
        <button class="audio-btn" onclick="playAudio(event)" id="audio-btn" style="display:none;"><i class="fi fi-rr-play-circle"></i> Play</button>
        <p class="flip-hint"><i class="fi fi-rr-rotate-right"></i> Click card to flip 🎯</p>
      </div>
      <div class="card-face card-back">
        <div style="display:flex;align-items:center;gap:10px;margin-bottom:6px;width:100%;justify-content:center;">
          <div class="en-text" id="back-en"></div>
          <i class="fi fi-rr-copy copy-icon" id="copy-en" onclick="copyText('back-en',event,this)" style="display:none;"></i>
        </div>
        <div class="tr-text" id="back-tr"></div>
        <div class="exp-text"><i class="fi fi-rr-lightbulb-on" style="color:#f1c40f;"></i> <span id="back-exp"></span></div>
      </div>
    </div>
  </div>
  <div class="sr-actions">
    <button class="sr-btn sr-dk" onclick="markDontKnow()">❌ Don't Know</button>
    <button class="sr-btn sr-sk" onclick="skipCard()">⏭ Skip</button>
    <button class="sr-btn sr-kn" onclick="markKnow()">✅ Know</button>
  </div>
  <div class="nav-buttons">
    <button class="nav-btn" id="prev-btn" onclick="prevCard()"><i class="fi fi-rr-angle-left"></i> Prev</button>
    <button class="nav-btn" id="next-btn" onclick="nextCard()">Next <i class="fi fi-rr-angle-right"></i></button>
  </div>
  <div class="progress" id="prog"></div>
</div>
<script>
  const ALL = {cards_json};
  let disp=[...ALL], idx=0, reviewMode=false;
  const aud=new Audio();

  function srKey(k){{ return 'sr_'+encodeURIComponent(k); }}
  function getSR(k){{ const s=localStorage.getItem(srKey(k)); return s?JSON.parse(s):{{interval:1,ef:2.5,due:null,status:'new'}}; }}
  function setSR(k,s){{ localStorage.setItem(srKey(k),JSON.stringify(s)); }}
  function today(){{ return new Date().toISOString().slice(0,10); }}
  function daysLater(n){{ const d=new Date(); d.setDate(d.getDate()+n); return d.toISOString().slice(0,10); }}
  function isDue(s){{ return !s.due||s.status==='new'||s.due<=today(); }}

  function markKnow(){{
    if(!disp.length) return;
    const k=disp[idx].korean; let s=getSR(k);
    s.interval=Math.round((s.interval||1)*(s.ef||2.5));
    s.ef=Math.min(2.5,(s.ef||2.5)+0.1);
    s.due=daysLater(s.interval); s.status='known';
    setSR(k,s); afterAction();
  }}
  function markDontKnow(){{
    if(!disp.length) return;
    const k=disp[idx].korean; let s=getSR(k);
    s.interval=1; s.ef=Math.max(1.3,(s.ef||2.5)-0.2);
    s.due=daysLater(1); s.status='learning';
    setSR(k,s); afterAction();
  }}
  function skipCard(){{ if(!disp.length) return; afterAction(); }}
  function afterAction(){{
    if(reviewMode){{ refreshDue(); }}
    else {{ if(idx<disp.length-1){{ idx++; }} else {{ idx=0; }} showCard(); }}
    updateHeader();
  }}

  function toggleReview(){{
    reviewMode=!reviewMode;
    const btn=document.getElementById('due-btn');
    if(reviewMode){{ btn.classList.add('active'); btn.textContent='📖 All Cards'; refreshDue(); }}
    else{{ btn.classList.remove('active'); btn.textContent='📅 Due Cards'; disp=[...ALL]; idx=0; showCard(); }}
    updateHeader();
  }}
  function refreshDue(){{
    const due=ALL.filter(c=>isDue(getSR(c.korean)));
    if(!due.length){{
      disp=[];
      document.getElementById('front-text').innerHTML='🎉 All caught up!';
      ['audio-btn','copy-ko','copy-en','sr-badge'].forEach(id=>{{ const el=document.getElementById(id); if(el) el.style.display='none'; }});
      document.getElementById('prev-btn').disabled=true;
      document.getElementById('next-btn').disabled=true;
      document.getElementById('prog').textContent='✨ Nothing due today!';
      return;
    }}
    disp=due; if(idx>=disp.length) idx=0; showCard();
  }}

  function updateHeader(){{
    const total=ALL.length; if(!total) return;
    const known=ALL.filter(c=>getSR(c.korean).status==='known').length;
    const due=ALL.filter(c=>isDue(getSR(c.korean))).length;
    document.getElementById('sr-fill').style.width=Math.round(known/total*100)+'%';
    document.getElementById('sr-stats').textContent=`✅ ${{known}}/${{total}} · 📅 ${{due}} due`;
    if(!reviewMode){{
      const db=document.getElementById('due-btn');
      db.textContent=due>0?`📅 Due (${{due}})`:'📅 Due Cards';
    }}
  }}

  function showCard(){{
    if(!disp.length) return;
    const c=disp[idx];
    document.getElementById('front-text').innerText=c.korean||'—';
    document.getElementById('back-en').innerText=c.translation||c.english||'';
    document.getElementById('back-tr').innerText=c.transliteration?`[${{c.transliteration}}]`:'';
    document.getElementById('back-exp').innerText=c.explanation||'';
    const s=getSR(c.korean);
    const badge=document.getElementById('sr-badge');
    badge.style.display='block';
    if(s.status==='known'){{ badge.textContent=isDue(s)?'⏰ DUE':'✅ KNOWN'; badge.className=isDue(s)?'sr-badge badge-due':'sr-badge badge-known'; }}
    else if(s.status==='learning'){{ badge.textContent='📖 LEARNING'; badge.className='sr-badge badge-learning'; }}
    else{{ badge.textContent='🆕 NEW'; badge.className='sr-badge badge-new'; }}
    document.getElementById('copy-ko').style.display='block';
    document.getElementById('copy-en').style.display='block';
    document.getElementById('prev-btn').disabled=idx===0;
    document.getElementById('next-btn').disabled=idx===disp.length-1;
    document.getElementById('prog').innerHTML=`📚 Card ${{idx+1}} of ${{disp.length}}`;
    document.getElementById('card').classList.remove('is-flipped');
    if(c.audio_uri){{ aud.src=c.audio_uri; document.getElementById('audio-btn').style.display='flex'; }}
    else {{ document.getElementById('audio-btn').style.display='none'; }}
    updateHeader();
  }}

  function flipCard(){{ if(disp.length) document.getElementById('card').classList.toggle('is-flipped'); }}
  function playAudio(e){{ e.stopPropagation(); aud.play().catch(()=>{{}}); }}
  function nextCard(){{ if(idx<disp.length-1){{ idx++; showCard(); }} }}
  function prevCard(){{ if(idx>0){{ idx--; showCard(); }} }}
  function copyText(id,e,el){{
    e.stopPropagation();
    navigator.clipboard.writeText(document.getElementById(id).innerText).then(()=>{{
      const old=el.className; el.className='fi fi-rr-check copy-icon'; el.style.color='#22c55e';
      setTimeout(()=>{{ el.className=old; el.style.color=''; }},1500);
    }}).catch(()=>{{}});
  }}
  window.onload=function(){{ if(ALL.length) showCard(); updateHeader(); }};
</script>
</body>
</html>"""

    safe_srcdoc = _html.escape(iframe_html)
    return f'<iframe srcdoc="{safe_srcdoc}" style="width:100%; height:700px; border:none; overflow-y:auto;"></iframe>'


def build_quiz_html(vocab_list):
    """Build a 5-question multiple-choice quiz SPA."""
    import html as _html
    import random as rnd

    if not vocab_list or len(vocab_list) < 2:
        return "<p style='color:#94a3b8;text-align:center;padding:30px;font-family:Outfit,sans-serif;font-size:16px;'>⚠️ Need at least 2 flashcards to start a quiz.<br>Generate or import a deck first!</p>"

    nq = min(5, len(vocab_list))
    q_cards = rnd.sample(vocab_list, nq)
    quiz_data = []
    for qc in q_cards:
        correct = qc.get('translation', '') or qc.get('english', '')
        wrong_pool = [c for c in vocab_list if c is not qc and (c.get('translation', '') or c.get('english', '')) != correct]
        wrongs = rnd.sample(wrong_pool, min(3, len(wrong_pool)))
        choices = [correct] + [w.get('translation', '') or w.get('english', '') for w in wrongs]
        rnd.shuffle(choices)
        quiz_data.append({
            'korean': qc.get('korean', ''),
            'transliteration': qc.get('transliteration', ''),
            'choices': choices,
            'correct': choices.index(correct),
        })

    quiz_json = json.dumps(quiz_data).replace("</", "<\\/")

    iframe_html = f"""<!DOCTYPE html>
<html>
<head>
<meta charset="utf-8">
<link rel='stylesheet' href='https://cdn-uicons.flaticon.com/uicons-regular-rounded/css/uicons-regular-rounded.css'>
<style>
  * {{ box-sizing:border-box; margin:0; padding:0; }}
  body {{ background:transparent; font-family:'Outfit','Inter',sans-serif; color:#f8fafc; padding:14px 10px; }}
  .quiz-hdr {{ text-align:center; margin-bottom:18px; }}
  .quiz-title {{ font-size:20px; font-weight:800; background:linear-gradient(to right,#c084fc,#60a5fa); -webkit-background-clip:text; -webkit-text-fill-color:transparent; margin-bottom:8px; }}
  .qpbar {{ width:100%; height:5px; background:rgba(255,255,255,.1); border-radius:3px; overflow:hidden; margin-bottom:4px; }}
  .qpfill {{ height:100%; background:linear-gradient(90deg,#8b5cf6,#3b82f6); border-radius:3px; transition:width .4s ease; }}
  .qptxt {{ font-size:12px; color:#64748b; }}
  .q-card {{ background:linear-gradient(135deg,rgba(30,41,59,.95) 0%,rgba(15,23,42,.95) 100%); border:1px solid rgba(139,92,246,.3); border-top:2px solid rgba(139,92,246,.7); border-radius:20px; padding:26px; text-align:center; margin-bottom:18px; box-shadow:0 10px 40px rgba(0,0,0,.5); }}
  .q-label {{ font-size:11px; text-transform:uppercase; letter-spacing:2px; color:#8b5cf6; font-weight:800; margin-bottom:10px; }}
  .q-word {{ font-size:52px; font-weight:800; color:#fff; text-shadow:0 0 25px rgba(139,92,246,.7); margin-bottom:7px; }}
  .q-tr {{ font-size:15px; color:#fca5a5; font-style:italic; letter-spacing:1px; }}
  .choices-grid {{ display:grid; grid-template-columns:1fr 1fr; gap:10px; margin-bottom:14px; }}
  .choice-btn {{ padding:14px 12px; border-radius:14px; border:1px solid rgba(139,92,246,.3); background:rgba(139,92,246,.1); color:#e2e8f0; font-size:14px; font-weight:600; cursor:pointer; transition:all .25s; text-align:center; line-height:1.3; font-family:inherit; }}
  .choice-btn:hover:not(:disabled) {{ background:rgba(139,92,246,.3); border-color:rgba(139,92,246,.7); transform:translateY(-2px); box-shadow:0 5px 15px rgba(139,92,246,.3); }}
  .choice-btn.correct {{ background:rgba(34,197,94,.3)!important; border-color:#22c55e!important; color:#86efac!important; transform:scale(1.02); box-shadow:0 0 20px rgba(34,197,94,.4)!important; }}
  .choice-btn.wrong {{ background:rgba(239,68,68,.2)!important; border-color:rgba(239,68,68,.5)!important; color:#fca5a5!important; }}
  .choice-btn:disabled {{ cursor:default; }}
  .fb-txt {{ font-size:15px; font-weight:700; text-align:center; min-height:22px; margin-bottom:6px; }}
  .nxt-btn {{ width:100%; padding:13px; border:none; border-radius:14px; background:linear-gradient(135deg,#8b5cf6,#3b82f6); color:white; font-size:14px; font-weight:800; cursor:pointer; transition:all .3s; letter-spacing:.5px; text-transform:uppercase; display:none; font-family:inherit; }}
  .nxt-btn:hover {{ transform:translateY(-2px); box-shadow:0 8px 25px rgba(139,92,246,.5); }}
  #score-screen {{ display:none; text-align:center; padding:28px 16px; }}
  .score-em {{ font-size:70px; margin-bottom:14px; animation:pop .6s cubic-bezier(.68,-.55,.265,1.55); }}
  @keyframes pop {{ from {{ transform:scale(0); opacity:0; }} to {{ transform:scale(1); opacity:1; }} }}
  .score-ttl {{ font-size:26px; font-weight:800; background:linear-gradient(to right,#c084fc,#60a5fa); -webkit-background-clip:text; -webkit-text-fill-color:transparent; margin-bottom:6px; }}
  .score-sub {{ font-size:14px; color:#94a3b8; margin-bottom:20px; }}
  .score-details {{ background:rgba(139,92,246,.1); border:1px solid rgba(139,92,246,.3); border-radius:16px; padding:16px; margin-bottom:20px; }}
  .s-row {{ display:flex; justify-content:space-between; padding:5px 0; border-bottom:1px solid rgba(255,255,255,.05); font-size:13px; }}
  .s-row:last-child {{ border-bottom:none; }}
  .s-ko {{ color:#e2e8f0; }} .s-ok {{ color:#86efac; font-weight:700; }} .s-no {{ color:#fca5a5; font-weight:700; }}
  .restart-btn {{ padding:13px 28px; border:none; border-radius:14px; background:linear-gradient(135deg,#8b5cf6,#3b82f6); color:white; font-size:14px; font-weight:800; cursor:pointer; transition:all .3s; text-transform:uppercase; letter-spacing:1px; font-family:inherit; }}
  .restart-btn:hover {{ transform:translateY(-2px); box-shadow:0 8px 25px rgba(139,92,246,.5); }}
</style>
</head>
<body>
<div id="quiz-app">
  <div id="question-screen">
    <div class="quiz-hdr">
      <div class="quiz-title">🧠 Vocabulary Quiz</div>
      <div class="qpbar"><div class="qpfill" id="qp-fill" style="width:0%"></div></div>
      <div class="qptxt" id="qp-txt">Question 1 of {nq}</div>
    </div>
    <div class="q-card">
      <div class="q-label">What does this word mean?</div>
      <div class="q-word" id="q-word"></div>
      <div class="q-tr" id="q-tr"></div>
    </div>
    <div class="choices-grid" id="choices"></div>
    <div class="fb-txt" id="fb"></div>
    <button class="nxt-btn" id="nxt-btn" onclick="nextQ()">Next →</button>
  </div>
  <div id="score-screen">
    <div class="score-em" id="s-em"></div>
    <div class="score-ttl" id="s-ttl"></div>
    <div class="score-sub" id="s-sub"></div>
    <div class="score-details" id="s-det"></div>
    <button class="restart-btn" onclick="restart()">🔄 Try Again</button>
  </div>
</div>
<script>
  const QD={quiz_json};
  let qi=0,score=0,res=[],answered=false;
  const NQ=QD.length;
  function loadQ(){{
    if(qi>=NQ){{ showScore(); return; }}
    answered=false;
    const q=QD[qi];
    document.getElementById('q-word').textContent=q.korean;
    document.getElementById('q-tr').textContent=q.transliteration?`[${{q.transliteration}}]`:'';
    document.getElementById('qp-fill').style.width=(qi/NQ*100)+'%';
    document.getElementById('qp-txt').textContent=`Question ${{qi+1}} of ${{NQ}}`;
    document.getElementById('fb').innerHTML='';
    document.getElementById('nxt-btn').style.display='none';
    const ch=document.getElementById('choices'); ch.innerHTML='';
    q.choices.forEach((c,i)=>{{
      const b=document.createElement('button'); b.className='choice-btn';
      b.textContent=c; b.onclick=()=>pick(i,b); ch.appendChild(b);
    }});
  }}
  function pick(ci,btn){{
    if(answered) return; answered=true;
    const q=QD[qi]; const ok=ci===q.correct;
    document.querySelectorAll('.choice-btn').forEach(b=>b.disabled=true);
    document.querySelectorAll('.choice-btn')[q.correct].classList.add('correct');
    if(ok){{ score++; document.getElementById('fb').innerHTML='✅ <span style="color:#86efac">Correct!</span>'; res.push({{k:q.korean,ok:true}}); }}
    else{{ btn.classList.add('wrong'); document.getElementById('fb').innerHTML=`❌ <span style="color:#fca5a5">Wrong!</span> → <strong>${{q.choices[q.correct]}}</strong>`; res.push({{k:q.korean,ok:false,ans:q.choices[q.correct]}}); }}
    const nb=document.getElementById('nxt-btn'); nb.style.display='block';
    nb.textContent=qi<NQ-1?'Next Question →':'See Results 🎉';
  }}
  function nextQ(){{ qi++; loadQ(); }}
  function showScore(){{
    document.getElementById('question-screen').style.display='none';
    document.getElementById('score-screen').style.display='block';
    const p=score/NQ;
    const data=p===1?['🏆','Perfect Score!','You nailed every question!']:p>=.8?['⭐','Excellent!','Almost perfect!']:p>=.6?['👍','Good Work!','Keep practicing!']:p>=.4?['📚','Keep Studying!','Review the flashcards!']:['💪','Keep Going!',"Practice makes perfect!"];
    document.getElementById('s-em').textContent=data[0];
    document.getElementById('s-ttl').textContent=`${{score}}/${{NQ}} — ${{data[1]}}`;
    document.getElementById('s-sub').textContent=data[2];
    document.getElementById('s-det').innerHTML=res.map(r=>`<div class="s-row"><span class="s-ko">${{r.k}}</span><span class="${{r.ok?'s-ok':'s-no'}}">${{r.ok?'✅ Correct':'❌ '+r.ans}}</span></div>`).join('');
  }}
  function restart(){{
    qi=0; score=0; res=[]; answered=false;
    document.getElementById('question-screen').style.display='block';
    document.getElementById('score-screen').style.display='none';
    loadQ();
  }}
  window.onload=loadQ;
</script>
</body>
</html>"""

    safe_srcdoc = _html.escape(iframe_html)
    return f'<iframe srcdoc="{safe_srcdoc}" style="width:100%; height:700px; border:none; overflow-y:auto;"></iframe>'


def export_json_file_fn(vocab_list):
    """Export current vocab list to a JSON file for download."""
    if not vocab_list:
        gr.Warning("No flashcards to export. Generate or import a deck first!")
        return gr.update(visible=False)
    
    export_data = [{k: v for k, v in item.items() if k != 'audio_uri'} for item in vocab_list]
    
    # Create a unique temporary file
    temp_fd, temp_path = tempfile.mkstemp(suffix=".json", prefix="flashcards_export_")
    with os.fdopen(temp_fd, "w", encoding="utf-8") as f:
        json.dump(export_data, f, ensure_ascii=False, indent=2)
        
    return gr.update(value=temp_path, visible=True)


def export_anki_file_fn(vocab_list):
    """Export current vocab list to an Anki .apkg file for download."""
    if not vocab_list:
        gr.Warning("No flashcards to export. Generate or import a deck first!")
        return gr.update(visible=False)
    try:
        import genanki
        import random as rnd
    except ImportError:
        gr.Warning("genanki not installed. Run: pip install genanki")
        return gr.update(visible=False)
    model = genanki.Model(
        rnd.randrange(1 << 30, 1 << 31),
        'LocalDuo Korean Vocab',
        fields=[{'name': 'Korean'}, {'name': 'Translation'}, {'name': 'Transliteration'}, {'name': 'Explanation'}],
        templates=[{
            'name': 'Card 1',
            'qfmt': '<div style="font-size:42px;text-align:center;font-weight:bold;color:#4a0e8f;padding:20px;">{{Korean}}</div>',
            'afmt': '{{FrontSide}}<hr id=answer><div style="font-size:24px;font-weight:bold;color:#1a56db;">{{Translation}}</div><div style="color:#888;font-style:italic;margin:8px 0;">{{Transliteration}}</div><div style="font-size:14px;color:#555;background:#f5f5f5;padding:10px;border-radius:8px;">{{Explanation}}</div>',
        }]
    )
    deck = genanki.Deck(rnd.randrange(1 << 30, 1 << 31), 'LocalDuo - Korean Vocabulary')
    for item in vocab_list:
        deck.add_note(genanki.Note(model=model, fields=[
            item.get('korean', ''),
            item.get('translation', '') or item.get('english', ''),
            item.get('transliteration', ''),
            item.get('explanation', ''),
        ]))
    
    # Create a unique temporary file
    temp_fd, temp_path = tempfile.mkstemp(suffix=".apkg", prefix="flashcards_export_")
    os.close(temp_fd) # Close it so genanki can write to it
    
    genanki.Package(deck).write_to_file(temp_path)
    return gr.update(value=temp_path, visible=True)


def import_deck_fn(json_file, anki_file):
    """Load a flashcard deck from a JSON or Anki .apkg file."""
    if json_file is not None:
        try:
            with open(json_file, "r", encoding="utf-8") as f:
                data = json.load(f)
            if not isinstance(data, list):
                data = [data]
            for item in data:
                if 'audio_uri' not in item:
                    item['audio_uri'] = None
            return build_flashcard_html(data), data
        except Exception as e:
            return f"<p style='color:#fca5a5;padding:20px;font-family:Outfit,sans-serif;'>❌ Error loading JSON: {e}</p>", None
    elif anki_file is not None:
        try:
            import zipfile, sqlite3, tempfile
            with tempfile.TemporaryDirectory() as tmpdir:
                with zipfile.ZipFile(anki_file, 'r') as z:
                    z.extractall(tmpdir)
                db_path = os.path.join(tmpdir, 'collection.anki2')
                if not os.path.exists(db_path):
                    db_path = os.path.join(tmpdir, 'collection.anki21')
                conn = sqlite3.connect(db_path)
                rows = conn.execute("SELECT flds FROM notes").fetchall()
                conn.close()
            vocab_list = []
            for row in rows:
                fields = row[0].split('\x1f')
                vocab_list.append({
                    'korean': fields[0] if len(fields) > 0 else '',
                    'translation': fields[1] if len(fields) > 1 else '',
                    'transliteration': fields[2] if len(fields) > 2 else '',
                    'explanation': fields[3] if len(fields) > 3 else '',
                    'audio_uri': None,
                })
            if not vocab_list:
                return "<p style='color:#fca5a5;padding:20px;font-family:Outfit,sans-serif;'>❌ No notes found in Anki deck.</p>", None
            return build_flashcard_html(vocab_list), vocab_list
        except Exception as e:
            return f"<p style='color:#fca5a5;padding:20px;font-family:Outfit,sans-serif;'>❌ Error loading Anki deck: {e}</p>", None
    return "<p style='color:#94a3b8;padding:20px;text-align:center;font-family:Outfit,sans-serif;'>⚠️ Please upload a JSON or Anki (.apkg) file above.</p>", None


# ─── Bootstrap demo content (shown before any generation) ───
BOOTSTRAP_VOCAB = [
    {"korean": "안녕하세요", "translation": "Hello", "transliteration": "an-nyeong-ha-se-yo", "explanation": "The most common formal greeting in Korean, used when meeting someone.", "audio_uri": None},
    {"korean": "감사합니다", "translation": "Thank you", "transliteration": "gam-sa-ham-ni-da", "explanation": "The standard polite way to express gratitude.", "audio_uri": None},
    {"korean": "사랑", "translation": "Love", "transliteration": "sa-rang", "explanation": "A fundamental word for love or affection, used in many K-pop songs.", "audio_uri": None},
    {"korean": "학교", "translation": "School", "transliteration": "hak-gyo", "explanation": "Refers to a school or educational institution. 학 means 'study', 교 means 'teach'.", "audio_uri": None},
    {"korean": "음식", "translation": "Food", "transliteration": "eum-sik", "explanation": "General word for food or cuisine. Korean 음식 (food) is world-famous!", "audio_uri": None},
    {"korean": "친구", "translation": "Friend", "transliteration": "chin-gu", "explanation": "Means a friend or buddy. In Korean culture, 친구 specifically refers to someone the same age.", "audio_uri": None},
    {"korean": "물", "translation": "Water", "transliteration": "mul", "explanation": "Essential vocabulary — 물 주세요 (mul ju-se-yo) means 'Water, please'.", "audio_uri": None},
    {"korean": "시간", "translation": "Time", "transliteration": "si-gan", "explanation": "Means time or hour. 시 (si) = hour, 간 (gan) = interval.", "audio_uri": None},
    {"korean": "행복", "translation": "Happiness", "transliteration": "haeng-bok", "explanation": "Means happiness or bliss. 행복하다 (haeng-bok-ha-da) = to be happy.", "audio_uri": None},
    {"korean": "여행", "translation": "Travel", "transliteration": "yeo-haeng", "explanation": "Means travel or trip. 여행하다 (yeo-haeng-ha-da) = to travel.", "audio_uri": None},
]

DEMO_EXTRACTED_TEXT = """[Demo Content — Common Korean Words]

안녕하세요! 오늘은 한국어를 배워봅시다.
(Hello! Let's learn Korean today.)

한국 음식은 정말 맛있습니다. 친구와 함께 학교 근처 식당에서 점심을 먹었습니다.
(Korean food is really delicious. I had lunch at a restaurant near the school with a friend.)

여행을 가면 항상 행복합니다. 새로운 곳에서 새로운 사람들을 만나는 것이 좋습니다.
(I'm always happy when I travel. I enjoy meeting new people in new places.)

물 주세요! 감사합니다.
(Water, please! Thank you.)

시간이 빨리 갑니다. 사랑하는 사람과 함께하면 더 빨리 갑니다.
(Time flies. It goes even faster when you're with someone you love.)
"""


def create_demo():
    example_pdf = get_example_pdf()
    example_audio = get_example_audio()
    
    custom_theme = gr.themes.Soft(
        primary_hue="amber",
        secondary_hue="stone",
        neutral_hue="stone",
        font=[gr.themes.GoogleFont("Outfit"), gr.themes.GoogleFont("Noto Serif KR"), "ui-sans-serif", "sans-serif"]
    )

    css = """
    /* ── 한국 (Hanguk) Inspired Theme ── */
    @import url('https://fonts.googleapis.com/css2?family=Noto+Serif+KR:wght@400;700;900&family=Outfit:wght@400;600;700;800&display=swap');

    /* ── Animated Background — ink wash 수묵화 ── */
    @keyframes gradientBG {
        0% { background-position: 0% 50%; }
        50% { background-position: 100% 50%; }
        100% { background-position: 0% 50%; }
    }

    body, .gradio-container {
        background: linear-gradient(-45deg, #0a0a0f, #1a1008, #0d1a12, #12080a, #0f0f1a) !important;
        background-size: 400% 400% !important;
        animation: gradientBG 20s ease infinite !important;
        background-attachment: fixed !important;
        color: #e8e0d4 !important;
        font-family: 'Outfit', 'Noto Serif KR', sans-serif !important;

        /* Force internal Gradio variables */
        --block-label-background-fill: transparent !important;
        --block-title-background-fill: transparent !important;
        --background-fill-primary: transparent !important;
        --background-fill-secondary: transparent !important;
        --block-background-fill: transparent !important;
        --input-background-fill: rgba(0, 0, 0, 0.25) !important;
        --input-background-fill-focus: rgba(0, 0, 0, 0.35) !important;
        --panel-background-fill: transparent !important;
        --checkbox-background-color: rgba(0, 0, 0, 0.2) !important;
        --table-even-background-fill: transparent !important;
        --table-odd-background-fill: rgba(0, 0, 0, 0.1) !important;
    }

    /* ── AGGRESSIVE BACKGROUND OVERRIDES FOR FIREFOX ── */
    .gradio-container .tabitem,
    .gradio-container .wrap,
    .gradio-container .form,
    .gradio-container .panel,
    .gradio-container .box,
    .gradio-container input,
    .gradio-container textarea,
    .gradio-container select,
    .gradio-container .dropdown-container,
    .gradio-container .block,
    .gradio-container .secondary-wrap,
    .gradio-container .contain {
        background: rgba(15, 12, 8, 0.5) !important;
        background-color: rgba(15, 12, 8, 0.5) !important;
    }

    /* ── FILE UPLOAD / PREVIEW — fix white backgrounds ── */
    .gradio-container .file-preview,
    .gradio-container .file-preview *,
    .gradio-container .file-preview table,
    .gradio-container .file-preview tr,
    .gradio-container .file-preview td,
    .gradio-container .file-preview th,
    .gradio-container .file-preview tbody,
    .gradio-container .file-preview thead,
    .gradio-container .upload-button,
    .gradio-container .file-upload,
    .gradio-container [data-testid="file"],
    .gradio-container [data-testid="file"] *,
    .gradio-container .file,
    .gradio-container .file *,
    .gradio-container .upload-text,
    .gradio-container .icon-wrap,
    .gradio-container .waveform-container,
    .gradio-container .empty,
    .gradio-container .empty *,
    .gradio-container .wrap.default {
        background: rgba(10, 8, 5, 0.4) !important;
        background-color: rgba(10, 8, 5, 0.4) !important;
        color: #e8e0d4 !important;
        border-color: rgba(196, 164, 105, 0.15) !important;
    }
    .gradio-container .file-preview a,
    .gradio-container .file a {
        color: #c4a469 !important;
    }

    /* ── Glassmorphism Panels — hanji paper texture feel ── */
    .gradio-container .form,
    .gradio-container .panel,
    .gradio-container .box {
        background: rgba(15, 12, 8, 0.45) !important;
        backdrop-filter: blur(20px) !important;
        -webkit-backdrop-filter: blur(20px) !important;
        border-radius: 16px !important;
        border: 1px solid rgba(196, 164, 105, 0.12) !important;
        box-shadow: 0 12px 30px rgba(0, 0, 0, 0.3), inset 0 0 0 1px rgba(196, 164, 105, 0.05) !important;
    }

    /* ── Selection — warm gold ── */
    ::selection {
        background: rgba(196, 164, 105, 0.45) !important;
        color: #ffffff !important;
    }
    ::-moz-selection {
        background: rgba(196, 164, 105, 0.45) !important;
        color: #ffffff !important;
    }

    /* ── GLOBAL BACKGROUND OVERRIDES ── */
    .gradio-container label,
    .gradio-container .label-wrap,
    .gradio-container .block label,
    .gradio-container .block-info,
    .gradio-container .block-title,
    .gradio-container .form > .block > .label-wrap,
    .gradio-container .form .label-wrap {
        background: transparent !important;
        background-color: transparent !important;
        border: none !important;
        box-shadow: none !important;
    }

    /* ── GLOBAL TEXT — warm parchment tones ── */
    .gradio-container,
    .gradio-container label,
    .gradio-container .label-wrap,
    .gradio-container .label-wrap span,
    .gradio-container span,
    .gradio-container p,
    .gradio-container h2,
    .gradio-container h3,
    .gradio-container h4,
    .gradio-container h5,
    .gradio-container h6,
    .gradio-container .prose,
    .gradio-container .prose *,
    .gradio-container .block label span,
    .gradio-container .block .label-wrap span,
    .gradio-container button,
    .gradio-container button span,
    .gradio-container input,
    .gradio-container select,
    .gradio-container textarea {
        color: #e8e0d4 !important;
    }

    /* ── Heading — 서예 calligraphy style ── */
    h1 {
        text-align: center;
        background: linear-gradient(135deg, #c4a469, #e8c97a, #a0825a);
        -webkit-background-clip: text;
        -webkit-text-fill-color: transparent;
        font-weight: 900 !important;
        font-size: 2.4em !important;
        margin-bottom: 0.3em !important;
        letter-spacing: 1px;
        line-height: 1.2 !important;
        font-family: 'Noto Serif KR', 'Outfit', serif !important;
    }

    /* ── TAB LABELS — 단청 style ── */
    .gradio-container .tabs .tab-nav button,
    .gradio-container .tabs .tab-nav button span {
        color: #8a7a65 !important;
        font-weight: 600 !important;
        font-size: 14px !important;
        padding: 10px 16px !important;
        background: transparent !important;
        border: none !important;
        border-bottom: 2px solid transparent !important;
        transition: all 0.3s ease !important;
    }
    .gradio-container .tabs .tab-nav button.selected,
    .gradio-container .tabs .tab-nav button.selected span,
    .gradio-container .tabs .tab-nav button[aria-selected="true"],
    .gradio-container .tabs .tab-nav button[aria-selected="true"] span {
        color: #c4a469 !important;
        border-bottom-color: #c4a469 !important;
        background: rgba(196, 164, 105, 0.08) !important;
    }
    .gradio-container .tabs .tab-nav button:hover,
    .gradio-container .tabs .tab-nav button:hover span {
        color: #e8e0d4 !important;
        background: rgba(196, 164, 105, 0.05) !important;
    }
    .gradio-container .tabs .tab-nav {
        background: transparent !important;
        border-bottom: 1px solid rgba(196, 164, 105, 0.15) !important;
    }

    /* ── SLIDER / RANGE LABELS ── */
    .gradio-container input[type="range"] + .rangeSlider,
    .gradio-container .range-slider,
    .gradio-container input[type="number"],
    .gradio-container input[type="number"]::-moz-placeholder {
        color: #e8e0d4 !important;
    }
    .gradio-container .wrap.default span,
    .gradio-container .head span,
    .gradio-container .range_slider span {
        color: #8a7a65 !important;
    }

    /* ── ACCORDION HEADERS ── */
    .gradio-container .accordion > button,
    .gradio-container .accordion > .label-wrap,
    .gradio-container details > summary,
    .gradio-container details > summary span {
        color: #e8e0d4 !important;
        font-weight: 600 !important;
    }

    /* ── MARKDOWN / PROSE ── */
    .gradio-container .md,
    .gradio-container .md p,
    .gradio-container .md li,
    .gradio-container .md strong,
    .gradio-container .md em,
    .gradio-container .md h3,
    .gradio-container .md h2 {
        color: #d4cbbe !important;
    }
    .gradio-container .md strong {
        color: #f0e8da !important;
    }
    .gradio-container .md a {
        color: #c4a469 !important;
    }
    .gradio-container .prose h3,
    .gradio-container h3 {
        color: #c4a469 !important;
        font-weight: 700 !important;
        font-size: 1.05em !important;
    }

    /* ── HINT TEXT ── */
    .hint-text, .hint-text p, .hint-text * {
        color: #6b5e4f !important;
        font-size: 13px !important;
    }

    /* ── FILE UPLOAD ── */
    .gradio-container .file-upload,
    .gradio-container .upload-button {
        background: rgba(0, 0, 0, 0.25) !important;
        border: 1px dashed rgba(196, 164, 105, 0.2) !important;
        color: #8a7a65 !important;
        border-radius: 12px !important;
    }

    /* ── DROPDOWN / SELECT ── */
    .gradio-container .dropdown-container,
    .gradio-container .secondary-wrap,
    .gradio-container ul[role="listbox"] {
        background: rgba(15, 12, 8, 0.95) !important;
        border: 1px solid rgba(196, 164, 105, 0.15) !important;
        color: #e8e0d4 !important;
    }
    .gradio-container ul[role="listbox"] li {
        color: #e8e0d4 !important;
    }
    .gradio-container ul[role="listbox"] li:hover {
        background: rgba(196, 164, 105, 0.15) !important;
    }

    /* ── BUTTONS — 한복 inspired ── */
    button.primary {
        background: linear-gradient(135deg, #b8860b, #c4a469, #8b6914) !important;
        border: none !important;
        box-shadow: 0 0 20px rgba(196, 164, 105, 0.35) !important;
        transition: all 0.3s cubic-bezier(0.4, 0, 0.2, 1) !important;
        font-weight: 700 !important;
        letter-spacing: 1px !important;
        text-transform: uppercase;
        border-radius: 12px !important;
        color: #0a0a0f !important;
    }
    button.primary:hover {
        transform: translateY(-3px) scale(1.02) !important;
        box-shadow: 0 0 30px rgba(196, 164, 105, 0.6) !important;
        color: #0a0a0f !important;
    }
    button.secondary {
        background: rgba(100, 90, 70, 0.15) !important;
        border: 1px solid rgba(196, 164, 105, 0.2) !important;
        color: #e8e0d4 !important;
        border-radius: 12px !important;
        font-weight: 600 !important;
        transition: all 0.25s ease !important;
    }
    button.secondary:hover {
        background: rgba(196, 164, 105, 0.12) !important;
        border-color: rgba(196, 164, 105, 0.35) !important;
        color: #f0e8da !important;
        transform: translateY(-2px) !important;
    }
    button.stop {
        background: linear-gradient(135deg, #8b2020, #c0392b) !important;
        border: none !important;
        box-shadow: 0 0 20px rgba(192, 57, 43, 0.4) !important;
        transition: all 0.3s cubic-bezier(0.4, 0, 0.2, 1) !important;
        font-weight: 700 !important;
        text-transform: uppercase;
        letter-spacing: 1px !important;
        border-radius: 12px !important;
        color: #f0e8da !important;
    }
    button.stop:hover {
        transform: translateY(-3px) scale(1.02) !important;
        box-shadow: 0 0 30px rgba(192, 57, 43, 0.6) !important;
    }

    /* ── INPUTS ── */
    textarea, input[type="text"], input[type="number"], select {
        background: rgba(0, 0, 0, 0.3) !important;
        border: 1px solid rgba(196, 164, 105, 0.12) !important;
        border-radius: 10px !important;
        color: #f0e8da !important;
        transition: all 0.3s cubic-bezier(0.4, 0, 0.2, 1) !important;
    }
    textarea:focus, input[type="text"]:focus {
        border-color: #c4a469 !important;
        box-shadow: 0 0 15px rgba(196, 164, 105, 0.25), inset 0 0 0 1px rgba(196, 164, 105, 0.25) !important;
    }
    .gradio-container .textbox label span,
    .gradio-container .input-label {
        color: #c4a469 !important;
        font-weight: 600 !important;
    }

    /* ── EXPORT / DOWNLOAD FILE COMPONENT ── */
    .gradio-container .download,
    .gradio-container .file a {
        color: #c4a469 !important;
    }

    /* ── GALLERY ── */
    .gradio-container .gallery-item {
        background: rgba(0, 0, 0, 0.3) !important;
        border: 1px solid rgba(196, 164, 105, 0.1) !important;
        border-radius: 10px !important;
    }

    /* ── INFO / TOOLTIP ── */
    .gradio-container .info,
    .gradio-container .wrap .info {
        color: #6b5e4f !important;
    }

    /* ── BLOCK BACKGROUNDS ── */
    .gradio-container .block {
        background: transparent !important;
    }
    .gradio-container .contain {
        background: transparent !important;
    }
    .gradio-container .tabitem {
        background: transparent !important;
    }

    /* ── AUDIO PLAYER ── */
    .gradio-container audio {
        filter: invert(0.85) hue-rotate(180deg) sepia(0.15);
        border-radius: 8px;
    }

    /* ── Hide Stream Box Duplicate Progress ── */
    #stream_box .progress-text,
    #stream_box .progress-level,
    #stream_box .progress,
    #stream_box .progress-container {
        display: none !important;
    }

    /* ── MAIN PROGRESS BAR ── */
    .gradio-container .progress-container,
    .gradio-container .progress-text {
        color: #ffffff !important;
        font-weight: 700 !important;
        text-shadow: 0px 1px 4px rgba(0,0,0,0.9) !important;
    }
    .gradio-container .progress-level {
        background: linear-gradient(90deg, #b8860b, #c4a469) !important;
    }

    /* ── SCROLLBAR — ink brush style ── */
    * {
        scrollbar-width: thin;
        scrollbar-color: rgba(196, 164, 105, 0.3) transparent;
    }
    ::-webkit-scrollbar { width: 5px; height: 5px; }
    ::-webkit-scrollbar-track { background: transparent; }
    ::-webkit-scrollbar-thumb { background: rgba(196, 164, 105, 0.3); border-radius: 3px; }
    ::-webkit-scrollbar-thumb:hover { background: rgba(196, 164, 105, 0.5); }

    /* ── CHECKBOX ── */
    .gradio-container input[type="checkbox"] {
        appearance: none !important;
        -webkit-appearance: none !important;
        width: 20px !important;
        height: 20px !important;
        border: 2px solid rgba(196, 164, 105, 0.4) !important;
        border-radius: 5px !important;
        background: rgba(0, 0, 0, 0.3) !important;
        cursor: pointer !important;
        position: relative !important;
        transition: all 0.2s ease !important;
    }
    .gradio-container input[type="checkbox"]:checked {
        background: linear-gradient(135deg, #b8860b, #c4a469) !important;
        border-color: #c4a469 !important;
    }
    .gradio-container input[type="checkbox"]:checked::after {
        content: "✓" !important;
        position: absolute !important;
        top: 50% !important;
        left: 50% !important;
        transform: translate(-50%, -50%) !important;
        color: #0a0a0f !important;
        font-size: 14px !important;
        font-weight: 900 !important;
    }
    .gradio-container input[type="checkbox"]:hover {
        border-color: #c4a469 !important;
        box-shadow: 0 0 8px rgba(196, 164, 105, 0.3) !important;
    }

    /* ── Korean decorative border on main content ── */
    .gradio-container > .main {
        border-top: 3px solid transparent !important;
        border-image: linear-gradient(90deg, transparent, rgba(196, 164, 105, 0.3), rgba(192, 57, 43, 0.2), rgba(196, 164, 105, 0.3), transparent) 1 !important;
    }
    """
    # Force dark mode via JavaScript so Gradio's internal CSS variables default to dark
    dark_mode_js = """
    function() {
        document.body.classList.add('dark');
        document.documentElement.classList.add('dark');
    }
    """
    
    with gr.Blocks(title="LocalDuo", theme=custom_theme, css=css, js=dark_mode_js) as demo:
        gr.Markdown("# LocalDuo — Learn Korean from PDFs, Websites & YouTube")
        gr.Markdown("🇰🇷✨ Enter a website URL 🌐, upload a PDF 📄, upload an audio file 🎵, or paste a YouTube link 🎬. The app uses a **Vision-Language Model (VLM)** 🧠, **ASR** 🎤, and **TTS** 🗣️ to generate vocabulary flashcards.")
        
        active_tab = gr.State("Website URL")
        
        with gr.Row():
            with gr.Column(scale=1):
                with gr.Tabs() as input_tabs:
                    with gr.Tab("Website URL", id="tab_url") as tab_url:
                        url_input = gr.Textbox(label="Enter a Website URL 🌐",
                        placeholder=r"e.g. https://www.bbc.com/korean/articles/cn0p7rkvxdgo",
                        value=r"https://www.bbc.com/korean/articles/cn0p7rkvxdgo")

                    with gr.Tab("Upload PDF", id="tab_pdf") as tab_pdf:
                        pdf_input = gr.File(label="Upload Book PDF 📚", file_types=[".pdf"], value=example_pdf)

                    with gr.Tab("Upload Audio", id="tab_audio") as tab_audio:
                        audio_file_input = gr.File(label="Upload Audio File 🎵", file_types=[".wav", ".mp3", ".m4a", ".ogg", ".flac", ".opus", ".webm"], value=example_audio)
                        gr.Markdown("*Upload a Korean audio file. It will be transcribed using Cohere ASR and vocabulary will be extracted from the transcript.*", elem_classes=["hint-text"])

                    with gr.Tab("YouTube Link", id="tab_yt") as tab_yt:
                        yt_url_input = gr.Textbox(label="Enter a YouTube Link 🎬",
                        placeholder=r"e.g. https://www.youtube.com/watch?v=...",
                        value="https://www.youtube.com/watch?v=9Nj7l73PBWE",
                        info="Audio from the first 5 minutes will be transcribed using Cohere ASR")
                        yt_cookies_input = gr.File(label="YouTube Cookies (cookies.txt)", file_types=[".txt"], value=None,
                            type="filepath")
                        gr.Markdown("*Optional. Helps bypass YouTube bot detection. Install the [cookies.txt](https://addons.mozilla.org/firefox/addon/cookies-txt/) extension, go to youtube.com while logged in, click the extension → 'Current Site' to export.*", elem_classes=["hint-text"])

                    with gr.Tab("📂 Import Deck", id="tab_import") as tab_import:
                        gr.Markdown("### Load a saved deck into the app")
                        gr.Markdown("Upload a previously exported **JSON file** or an **Anki .apkg deck** to reload flashcards without regenerating.")
                        import_json_file_in = gr.File(label="📄 JSON Deck (.json)", file_types=[".json"])
                        import_anki_file_in = gr.File(label="📦 Anki Deck (.apkg)", file_types=[".apkg"])
                        import_load_btn = gr.Button("📂 Load Deck", variant="primary")

                # Track active tab
                tab_url.select(fn=lambda: "Website URL", inputs=None, outputs=active_tab)
                tab_pdf.select(fn=lambda: "Upload PDF", inputs=None, outputs=active_tab)
                tab_audio.select(fn=lambda: "Upload Audio", inputs=None, outputs=active_tab)
                tab_yt.select(fn=lambda: "YouTube Link", inputs=None, outputs=active_tab)
                tab_import.select(fn=lambda: "Import Deck", inputs=None, outputs=active_tab)

                gr.Markdown("### ⚙️ Customization Settings")
                max_text_char_input = gr.Slider(minimum=1000, maximum=30000, step=1000, value=1500, label="Max Input Text Length (Characters)")
                repetition_penalty_input = gr.Slider(minimum=0.1, maximum=2.0, step=0.1, value=1.2, label="Repetition Penalty")
                auto_force_chars_input = gr.Slider(minimum=1_000, maximum=10_000, step=100, value=4_000, label="Auto-force JSON after (chars of thinking)")
                enable_thinking_checkbox = gr.Checkbox(label="🧠 Enable Thinking (longer but more accurate)", value=True)

                with gr.Accordion("🔧 Advanced", open=False):
                    translit_lang = gr.Dropdown(
                        label="Word Transliteration Language",
                        choices=LANGUAGE_CHOICES,
                        value="Indo-European - English"
                    )
                    translit_format = gr.Dropdown(label="Transliteration Format", choices=["dashed syllable", "regular word with space"], value="dashed syllable")
                    target_lang = gr.Dropdown(
                        label="Target Language (Full App)",
                        choices=LANGUAGE_CHOICES,
                        value="Indo-European - English"
                    )

                submit_btn = gr.Button("✨ Generate Flashcards ✨", variant="primary")
                
                with gr.Accordion("🛑 Generation Controls", open=False):
                    with gr.Row():
                        stop_thinking_btn = gr.Button("⚡ Stop thinking, Generate now", variant="secondary")
                        stop_btn = gr.Button("🛑 Stop Generation", variant="stop")

            with gr.Column(scale=2):
                with gr.Tabs() as output_tabs:
                    with gr.Tab("📖 Flashcards"):
                        bootstrap_html = build_flashcard_html(BOOTSTRAP_VOCAB)
                        output_html = gr.HTML(label="Flashcards will appear here", value=bootstrap_html)
                        gr.Markdown("**Export current deck:**")
                        with gr.Row():
                            export_json_btn = gr.Button("📥 Export JSON", variant="secondary", size="sm")
                            export_anki_btn = gr.Button("📦 Export Anki (.apkg)", variant="secondary", size="sm")
                        export_json_out = gr.File(label="⬇️ JSON Download", visible=False, interactive=False)
                        export_anki_out = gr.File(label="⬇️ Anki Deck Download", visible=False, interactive=False)

                    with gr.Tab("❓ Quiz"):
                        gr.Markdown("**Test your knowledge** with a randomized 5-question multiple-choice quiz from the current deck.")
                        start_quiz_btn = gr.Button("🧪 Start 5-Question Quiz", variant="primary")
                        bootstrap_quiz_html = build_quiz_html(BOOTSTRAP_VOCAB)
                        quiz_output_html = gr.HTML(label="Quiz", value=bootstrap_quiz_html)

                stream_box = gr.Textbox(label="Live Model Generation 🧠", lines=10, max_lines=20, interactive=False, autoscroll=True, elem_id="stream_box")

                with gr.Accordion("📄 Extracted Source Content", open=True):
                    extracted_text_box = gr.Textbox(label="Extracted Text", lines=10, max_lines=15, interactive=False, value=DEMO_EXTRACTED_TEXT)
                    extracted_images_gallery = gr.Gallery(label="Extracted Images", columns=4, height="auto", object_fit="contain")
                    extracted_audio_player = gr.Audio(label="Extracted Audio (YouTube / Uploaded)", type="filepath", interactive=False)

        last_source_state = gr.State(None)
        last_korean_words_state = gr.State(BOOTSTRAP_VOCAB)

        def reset_btn_text():
            return gr.update(value="⚡ Stop thinking, Generate now"), gr.update(value="🛑 Stop Generation")

        submit_btn.click(fn=reset_btn_text, inputs=None, outputs=[stop_thinking_btn, stop_btn], queue=False)

        generate_event = submit_btn.click(
            fn=process_pdf,
            inputs=[pdf_input, url_input, audio_file_input, yt_url_input, yt_cookies_input, translit_lang, translit_format, target_lang, max_text_char_input, repetition_penalty_input, auto_force_chars_input, last_source_state, last_korean_words_state, active_tab, enable_thinking_checkbox],
            outputs=[output_html, last_source_state, last_korean_words_state, stream_box, extracted_text_box, extracted_images_gallery, extracted_audio_player]
        )

        stop_thinking_btn.click(fn=set_stop_thinking, inputs=None, outputs=stop_thinking_btn, queue=False).then(
            fn=reset_stop_thinking_after_delay, inputs=None, outputs=stop_thinking_btn
        )
        stop_btn.click(fn=set_kill_threads, inputs=None, outputs=stop_btn, queue=False)

        # Export events
        export_json_btn.click(fn=export_json_file_fn, inputs=[last_korean_words_state], outputs=[export_json_out])
        export_anki_btn.click(fn=export_anki_file_fn, inputs=[last_korean_words_state], outputs=[export_anki_out])

        # Import event
        import_load_btn.click(
            fn=import_deck_fn,
            inputs=[import_json_file_in, import_anki_file_in],
            outputs=[output_html, last_korean_words_state]
        )

        # Quiz event
        start_quiz_btn.click(fn=build_quiz_html, inputs=[last_korean_words_state], outputs=[quiz_output_html])

        # Force autoscroll using Custom JS
        stream_box.change(
            fn=None,
            js="""
            function() {
                const ta = document.querySelector('#stream_box textarea');
                if (ta) {
                    ta.scrollTop = ta.scrollHeight;
                }
            }
            """
        )
    return demo


if __name__ == "__main__":
    global model, processor, tts, voice_style, asr_model, asr_processor
    
    
    model_id = "Qwen/Qwen3.5-9B"
    # model_id = "Qwen/Qwen3.5-2B"
    
    print(f"Loading {model_id} model via Transformers...")
    
    processor = AutoProcessor.from_pretrained(model_id, trust_remote_code=True)
    
    # try:
    #     with open("chat_template.jinja", "r", encoding="utf-8") as f:
    #         processor.chat_template = f.read()
    # except Exception as e:
    #     print("Could not load custom chat template:", e)
    processor.chat_template = """
{%- set image_count = namespace(value=0) %}
{%- set video_count = namespace(value=0) %}
{%- macro render_content(content, do_vision_count, is_system_content=false) %}
    {%- if content is string %}
        {{- content }}
    {%- elif content is iterable and content is not mapping %}
        {%- for item in content %}
            {%- if 'image' in item or 'image_url' in item or item.type == 'image' %}
                {%- if is_system_content %}
                    {{- raise_exception('System message cannot contain images.') }}
                {%- endif %}
                {%- if do_vision_count %}
                    {%- set image_count.value = image_count.value + 1 %}
                {%- endif %}
                {%- if add_vision_id %}
                    {{- 'Picture ' ~ image_count.value ~ ': ' }}
                {%- endif %}
                {{- '<|vision_start|><|image_pad|><|vision_end|>' }}
            {%- elif 'video' in item or item.type == 'video' %}
                {%- if is_system_content %}
                    {{- raise_exception('System message cannot contain videos.') }}
                {%- endif %}
                {%- if do_vision_count %}
                    {%- set video_count.value = video_count.value + 1 %}
                {%- endif %}
                {%- if add_vision_id %}
                    {{- 'Video ' ~ video_count.value ~ ': ' }}
                {%- endif %}
                {{- '<|vision_start|><|video_pad|><|vision_end|>' }}
            {%- elif 'text' in item %}
                {{- item.text }}
            {%- else %}
                {{- raise_exception('Unexpected item type in content.') }}
            {%- endif %}
        {%- endfor %}
    {%- elif content is none or content is undefined %}
        {{- '' }}
    {%- else %}
        {{- raise_exception('Unexpected content type.') }}
    {%- endif %}
{%- endmacro %}
{%- if not messages %}
    {{- raise_exception('No messages provided.') }}
{%- endif %}
{%- if tools and tools is iterable and tools is not mapping %}
    {{- '<|im_start|>system\n' }}
    {{- "# Tools\n\nYou have access to the following functions:\n\n<tools>" }}
    {%- for tool in tools %}
        {{- "\n" }}
        {{- tool | tojson }}
    {%- endfor %}
    {{- "\n</tools>" }}
    {{- '\n\nIf you choose to call a function ONLY reply in the following format with NO suffix:\n\n<tool_call>\n<function=example_function_name>\n<parameter=example_parameter_1>\nvalue_1\n</parameter>\n<parameter=example_parameter_2>\nThis is the value for the second parameter\nthat can span\nmultiple lines\n</parameter>\n</function>\n</tool_call>\n\n<IMPORTANT>\nReminder:\n- Function calls MUST follow the specified format: an inner <function=...></function> block must be nested within <tool_call></tool_call> XML tags\n- Required parameters MUST be specified\n- You may provide optional reasoning for your function call in natural language BEFORE the function call, but NOT after\n- If there is no function call available, answer the question like normal with your current knowledge and do not tell the user about function calls\n</IMPORTANT>' }}
    {%- if messages[0].role == 'system' %}
        {%- set content = render_content(messages[0].content, false, true)|trim %}
        {%- if content %}
            {{- '\n\n' + content }}
        {%- endif %}
    {%- endif %}
    {{- '<|im_end|>\n' }}
{%- else %}
    {%- if messages[0].role == 'system' %}
        {%- set content = render_content(messages[0].content, false, true)|trim %}
        {{- '<|im_start|>system\n' + content + '<|im_end|>\n' }}
    {%- endif %}
{%- endif %}
{%- set ns = namespace(multi_step_tool=true, last_query_index=messages|length - 1) %}
{%- for message in messages[::-1] %}
    {%- set index = (messages|length - 1) - loop.index0 %}
    {%- if ns.multi_step_tool and message.role == "user" %}
        {%- set content = render_content(message.content, false)|trim %}
        {%- if not(content.startswith('<tool_response>') and content.endswith('</tool_response>')) %}
            {%- set ns.multi_step_tool = false %}
            {%- set ns.last_query_index = index %}
        {%- endif %}
    {%- endif %}
{%- endfor %}
{%- if ns.multi_step_tool %}
    {{- raise_exception('No user query found in messages.') }}
{%- endif %}
{%- for message in messages %}
    {%- set content = render_content(message.content, true)|trim %}
    {%- if message.role == "system" %}
        {%- if not loop.first %}
            {{- raise_exception('System message must be at the beginning.') }}
        {%- endif %}
    {%- elif message.role == "user" %}
        {{- '<|im_start|>' + message.role + '\n' + content + '<|im_end|>' + '\n' }}
    {%- elif message.role == "assistant" %}
        {%- set reasoning_content = '' %}
        {%- if message.reasoning_content is string %}
            {%- set reasoning_content = message.reasoning_content %}
        {%- else %}
            {%- if '</think>' in content %}
                {%- set reasoning_content = content.split('</think>')[0].rstrip('\n').split('<think>')[-1].lstrip('\n') %}
                {%- set content = content.split('</think>')[-1].lstrip('\n') %}
            {%- endif %}
        {%- endif %}
        {%- set reasoning_content = reasoning_content|trim %}
        {%- if loop.index0 > ns.last_query_index %}
            {{- '<|im_start|>' + message.role + '\n<think>\n' + reasoning_content + '\n</think>\n\n' + content }}
        {%- else %}
            {{- '<|im_start|>' + message.role + '\n' + content }}
        {%- endif %}
        {%- if message.tool_calls and message.tool_calls is iterable and message.tool_calls is not mapping %}
            {%- for tool_call in message.tool_calls %}
                {%- if tool_call.function is defined %}
                    {%- set tool_call = tool_call.function %}
                {%- endif %}
                {%- if loop.first %}
                    {%- if content|trim %}
                        {{- '\n\n<tool_call>\n<function=' + tool_call.name + '>\n' }}
                    {%- else %}
                        {{- '<tool_call>\n<function=' + tool_call.name + '>\n' }}
                    {%- endif %}
                {%- else %}
                    {{- '\n<tool_call>\n<function=' + tool_call.name + '>\n' }}
                {%- endif %}
                {%- if tool_call.arguments is defined %}
                    {%- for args_name, args_value in tool_call.arguments|items %}
                        {{- '<parameter=' + args_name + '>\n' }}
                        {%- set args_value = args_value | tojson | safe if args_value is mapping or (args_value is sequence and args_value is not string) else args_value | string %}
                        {{- args_value }}
                        {{- '\n</parameter>\n' }}
                    {%- endfor %}
                {%- endif %}
                {{- '</function>\n</tool_call>' }}
            {%- endfor %}
        {%- endif %}
        {{- '<|im_end|>\n' }}
    {%- elif message.role == "tool" %}
        {%- if loop.previtem and loop.previtem.role != "tool" %}
            {{- '<|im_start|>user' }}
        {%- endif %}
        {{- '\n<tool_response>\n' }}
        {{- content }}
        {{- '\n</tool_response>' }}
        {%- if not loop.last and loop.nextitem.role != "tool" %}
            {{- '<|im_end|>\n' }}
        {%- elif loop.last %}
            {{- '<|im_end|>\n' }}
        {%- endif %}
    {%- else %}
        {{- raise_exception('Unexpected message role.') }}
    {%- endif %}
{%- endfor %}
{%- if add_generation_prompt %}
    {{- '<|im_start|>assistant\n' }}
    {%- if enable_thinking is defined and enable_thinking is false %}
        {{- '<think>\n\n</think>\n\n' }}
    {%- else %}
        {{- '<think>\n' }}
    {%- endif %}
{%- endif %}
""".strip()
        
    model = AutoModelForImageTextToText.from_pretrained(
        model_id, 
        torch_dtype=torch.bfloat16, 
        device_map="cpu", 
        trust_remote_code=True
    )

    print("Loading Cohere ASR model...")
    from transformers import CohereAsrForConditionalGeneration
    asr_processor = AutoProcessor.from_pretrained("CohereLabs/cohere-transcribe-03-2026")
    asr_model = CohereAsrForConditionalGeneration.from_pretrained(
        "CohereLabs/cohere-transcribe-03-2026",
        device_map="cpu",
    )

    print("Loading Supertonic TTS...")
    tts = TTS(model="supertonic-3")
    try:
        voice_style = tts.get_voice_style("F1")
    except Exception:
        voice_style = tts.get_voice_style(tts.voice_style_names[0])
        
    print("Generating audio for BOOTSTRAP_VOCAB...")
    for item in BOOTSTRAP_VOCAB:
        korean_word = item.get("korean", "")
        if korean_word and tts is not None:
            try:
                wav, dur = tts.synthesize(
                    text=korean_word,
                    voice_style=voice_style,
                    lang="ko",
                    speed=0.7,
                    total_steps=12,
                )
                item["audio_uri"] = numpy_to_base64_audio(wav, tts.sample_rate)
            except Exception as e:
                print(f"Failed to generate audio for {korean_word}: {e}")
                

    demo = create_demo()
    if IS_HF:
        demo.launch(allowed_paths=[LOG_DIR])
    else:
        demo.launch(server_name="0.0.0.0", server_port=7865, allowed_paths=[LOG_DIR])