"""
Evaluation queue for the Gradio Space: FIFO jobs, bounded memory.

Evaluations dispatch to **Hugging Face Hub Jobs** when ``FFASR_REMOTE_JOBS=1`` (see ``remote_jobs``).
The Space does not import torch or run ASR locally.

Optional moderation: when FFASR_MODERATION=1 and FFASR_MODERATOR_SECRET is set, new jobs stay in
pending_moderation until the moderator approves (then they enter the work queue).

Job state is persisted to the Hub bucket (results/jobs_state.csv) so moderation and queue survive
Space restarts.
"""

from __future__ import annotations

import csv
import hmac
import io
import json
import os
import time
import queue
import threading
import uuid
from dataclasses import dataclass
from datetime import datetime, timezone
from enum import Enum
from typing import Any

# --- Moderation (Space secrets / env) ---
# In HF Space: Settings → Variables and secrets → Secrets
#   FFASR_MODERATION=1
#   FFASR_MODERATOR_SECRET=<long random string>
MODERATION_ENABLED = os.environ.get("FFASR_MODERATION", "").strip().lower() in (
    "1",
    "true",
    "yes",
    "on",
)
MODERATOR_SECRET = os.environ.get("FFASR_MODERATOR_SECRET", "").strip()


class JobStatus(str, Enum):
    pending_moderation = "pending_moderation"
    queued = "queued"
    running = "running"
    dispatching = "dispatching"
    remote_running = "remote_running"
    collecting = "collecting"
    done = "done"
    failed = "failed"


@dataclass
class Job:
    id: str
    model_id: str
    family_id: str
    status: JobStatus
    created_at: str
    updated_at: str = ""
    error: str | None = None
    result: dict[str, Any] | None = None
    submission_notes: str = ""
    contact_email: str = ""
    extra_requirements: str = ""
    setup_script: str = ""
    custom_script: str = ""
    recipe_id: str = ""
    is_gated: bool = False
    run_custom_script: bool = False
    # Progress (not persisted; only meaningful while running)
    progress_done: int = 0
    progress_total: int = 0
    progress_condition: str = ""
    hf_remote_job_id: str | None = None
    remote_artifact_path: str | None = None
    # Set by moderator retry: skip duplicate guard and replace CSV row on success.
    replace_leaderboard: bool = False
    # Subset of PACKED_FILES keys; None means evaluate all conditions.
    eval_conditions: tuple[str, ...] | None = None


_jobs: dict[str, Job] = {}
_jobs_lock = threading.Lock()
_jobs_file_lock = threading.Lock()
_work_queue: queue.Queue[str] = queue.Queue()
_running_job_id: str | None = None
_worker_started = False
_worker_lock = threading.Lock()
_jobs_loaded = False
# Per Space job id: monotonic deadline for remote Hub Job polling (not persisted).
_remote_deadlines: dict[str, float] = {}

_MAX_JOBS_TRACKED = 400
_MAX_QUEUE_BACKLOG = 32
_MAX_PENDING_MODERATION = 64
_DEFAULT_REMOTE_MAX_CONCURRENT = 4
_MAX_CUSTOM_SCRIPT_BYTES = 32 * 1024
_MAX_REQUIREMENT_LINE_LEN = 200
_MAX_REQUIREMENT_LINES = 50

_JOBS_CSV_FIELDS = [
    "job_id",
    "model_id",
    "family_id",
    "status",
    "created_at",
    "updated_at",
    "error",
    "submission_notes",
    "contact_email",
    "extra_requirements",
    "setup_script_b64",
    "custom_script_b64",
    "recipe_id",
    "is_gated",
    "run_custom_script",
    "hf_remote_job_id",
    "remote_artifact_path",
    "eval_conditions",
]


def parse_requirements_lines(text: str) -> list[str]:
    """One package spec per line (requirements.txt style); ignores blanks and # comments."""
    out: list[str] = []
    for raw in (text or "").splitlines():
        line = raw.strip()
        if not line or line.startswith("#"):
            continue
        if len(line) > _MAX_REQUIREMENT_LINE_LEN:
            line = line[:_MAX_REQUIREMENT_LINE_LEN]
        out.append(line)
        if len(out) >= _MAX_REQUIREMENT_LINES:
            break
    return out


def sanitize_custom_script(text: str) -> str:
    """Trim and cap custom script body for storage."""
    from backends.custom_eval import normalize_custom_script_compat

    s = normalize_custom_script_compat((text or "").strip())
    if not s:
        return ""
    enc = s.encode("utf-8")
    if len(enc) > _MAX_CUSTOM_SCRIPT_BYTES:
        enc = enc[:_MAX_CUSTOM_SCRIPT_BYTES]
        s = enc.decode("utf-8", errors="ignore")
    return s


def sanitize_contact_email(text: str) -> str:
    """Trim and validate a required submitter email address."""
    s = (text or "").strip()[:254]
    if not s:
        raise ValueError("Contact email is required.")
    if s.count("@") != 1:
        raise ValueError("Invalid email address.")
    local, domain = s.split("@", 1)
    if not local or not domain or "." not in domain:
        raise ValueError("Invalid email address.")
    return s


def sanitize_setup_script(text: str) -> str:
    """Trim and cap one-time setup script (shell or Python) for storage."""
    s = (text or "").strip()
    if not s:
        return ""
    enc = s.encode("utf-8")
    if len(enc) > _MAX_CUSTOM_SCRIPT_BYTES:
        enc = enc[:_MAX_CUSTOM_SCRIPT_BYTES]
        s = enc.decode("utf-8", errors="ignore")
    return s


def custom_script_deprecated_api_warning(text: str) -> str | None:
    """Return a short warning if the script uses kwargs removed from current HF Hub."""
    s = (text or "").strip()
    if not s:
        return None
    if "use_auth_token" in s or "authentication_token" in s:
        return (
            "Your script uses <code>use_auth_token</code> (deprecated). "
            "It will be rewritten to <code>token=</code> automatically; prefer "
            "<code>token=os.environ['HF_TOKEN']</code> for gated models."
        )
    return None


def custom_script_argparse_warning(text: str) -> str | None:
    """Warn when a script references ``args.`` without defining argparse (common clone mistake)."""
    s = (text or "").strip()
    if not s or "args." not in s:
        return None
    try:
        import ast

        tree = ast.parse(s)
    except SyntaxError:
        return None

    defines_args = False
    calls_parse_args = False
    for node in ast.walk(tree):
        if isinstance(node, ast.Assign):
            for t in node.targets:
                if isinstance(t, ast.Name) and t.id == "args":
                    defines_args = True
        if isinstance(node, ast.AnnAssign) and isinstance(node.target, ast.Name):
            if node.target.id == "args":
                defines_args = True
        if isinstance(node, ast.Call):
            func = node.func
            if isinstance(func, ast.Attribute) and func.attr == "parse_args":
                calls_parse_args = True
            if isinstance(func, ast.Name) and func.id == "parse_args":
                calls_parse_args = True

    if defines_args or calls_parse_args:
        return None
    return (
        "Your script uses <code>args.something</code> but FFASR does not run "
        "<code>argparse</code> — replace with literal values (e.g. "
        "<code>routing_enabled=True</code>) or call <code>parse_args()</code> "
        "before using <code>args</code>. For Mega-ASR, use the recipe evaluator "
        "in <code>recipes/mega_asr/evaluate.py</code>."
    )


def custom_script_defines_evaluate(text: str) -> bool:
    """Best-effort check that the script defines a top-level ``evaluate`` function."""
    s = (text or "").strip()
    if not s:
        return True
    try:
        import ast

        tree = ast.parse(s)
    except SyntaxError:
        return False
    return any(
        isinstance(node, ast.FunctionDef) and node.name == "evaluate"
        for node in tree.body
    )


def _bool_to_csv(flag: bool) -> str:
    return "1" if flag else "0"


def _bool_from_csv(raw: str) -> bool:
    return (raw or "").strip().lower() in ("1", "true", "yes", "on")


def _encode_script_b64(script: str) -> str:
    if not script:
        return ""
    import base64

    return base64.b64encode(script.encode("utf-8")).decode("ascii")


def _decode_script_b64(raw: str) -> str:
    raw = (raw or "").strip()
    if not raw:
        return ""
    import base64

    try:
        return base64.b64decode(raw.encode("ascii")).decode("utf-8")
    except Exception:
        return ""


def _now_iso() -> str:
    return datetime.now(timezone.utc).isoformat()


def _touch(job: Job) -> None:
    job.updated_at = _now_iso()


def moderation_active() -> bool:
    """True when moderation is enabled and a secret is configured."""
    return MODERATION_ENABLED and bool(MODERATOR_SECRET)


def moderation_misconfigured() -> bool:
    """Enabled in UI but secret missing; submissions should be rejected."""
    return MODERATION_ENABLED and not MODERATOR_SECRET


def _check_moderator_secret(provided: str) -> bool:
    if not MODERATOR_SECRET or provided is None:
        return False
    a = provided.strip().encode("utf-8")
    b = MODERATOR_SECRET.encode("utf-8")
    if len(a) != len(b):
        return False
    return hmac.compare_digest(a, b)


def _prune_jobs() -> None:
    if len(_jobs) <= _MAX_JOBS_TRACKED:
        return
    terminal = [
        jid
        for jid, j in _jobs.items()
        if j.status in (JobStatus.done, JobStatus.failed)
    ]
    terminal.sort(key=lambda jid: _jobs[jid].created_at)
    for jid in terminal[: max(0, len(_jobs) - _MAX_JOBS_TRACKED // 2)]:
        _jobs.pop(jid, None)


def _persist_jobs() -> None:
    """Write all tracked jobs to Hub bucket CSV (best-effort)."""
    from storage import (
        HF_BUCKET_ID,
        HF_TOKEN,
        JOBS_STATE_PATH,
        STORAGE_BACKEND,
        batch_bucket_files,
        upload_to_bucket,
    )

    if STORAGE_BACKEND != "hf_bucket" or batch_bucket_files is None:
        return
    with _jobs_lock:
        rows: list[dict[str, str]] = []
        for jid, j in _jobs.items():
            rows.append(
                {
                    "job_id": j.id,
                    "model_id": j.model_id,
                    "family_id": j.family_id,
                    "status": j.status.value,
                    "created_at": j.created_at,
                    "updated_at": j.updated_at or j.created_at,
                    "error": (j.error or "").replace("\n", " ")[:2000],
                    "submission_notes": (j.submission_notes or "").replace("\n", " ")[:4000],
                    "contact_email": (j.contact_email or "").replace("\n", " ")[:254],
                    "extra_requirements": (j.extra_requirements or "").replace("\r\n", "\n")[:8000],
                    "setup_script_b64": _encode_script_b64(j.setup_script or ""),
                    "custom_script_b64": _encode_script_b64(j.custom_script or ""),
                    "recipe_id": (j.recipe_id or "").strip()[:64],
                    "is_gated": _bool_to_csv(j.is_gated),
                    "run_custom_script": _bool_to_csv(j.run_custom_script),
                    "hf_remote_job_id": (j.hf_remote_job_id or "").strip(),
                    "remote_artifact_path": (j.remote_artifact_path or "").strip(),
                    "eval_conditions": ",".join(j.eval_conditions)
                    if j.eval_conditions
                    else "",
                }
            )
        rows.sort(key=lambda r: r["created_at"])
    buf = io.StringIO()
    w = csv.DictWriter(buf, fieldnames=_JOBS_CSV_FIELDS, extrasaction="ignore")
    w.writeheader()
    w.writerows(rows)
    content = buf.getvalue().encode("utf-8")
    try:
        with _jobs_file_lock:
            upload_to_bucket(
                HF_BUCKET_ID,
                add=[(content, JOBS_STATE_PATH)],
                token=HF_TOKEN,
            )
    except Exception:
        pass


def _load_persisted_jobs_once() -> None:
    """Restore jobs from bucket and re-queue work that was queued or interrupted."""
    global _jobs_loaded
    if _jobs_loaded:
        return
    _jobs_loaded = True

    from storage import STORAGE_BACKEND, download_bucket_file, JOBS_STATE_PATH

    if STORAGE_BACKEND != "hf_bucket":
        return
    try:
        import os as _os

        local_path = download_bucket_file(JOBS_STATE_PATH)
        with open(local_path, "r", encoding="utf-8") as f:
            disk_rows = list(csv.DictReader(f))
        _os.unlink(local_path)
    except Exception:
        return

    if not disk_rows:
        return

    # Last row wins if duplicate job_id
    by_id: dict[str, dict] = {}
    for row in disk_rows:
        jid = (row.get("job_id") or "").strip()
        if jid:
            by_id[jid] = row

    to_queue: list[tuple[str, str]] = []

    with _jobs_lock:
        for jid, row in by_id.items():
            st_raw = (row.get("status") or "").strip()
            try:
                st = JobStatus(st_raw)
            except ValueError:
                continue
            err = (row.get("error") or "").strip() or None
            notes = (row.get("submission_notes") or "").strip()
            email = (row.get("contact_email") or "").strip()[:254]
            extra_req = (row.get("extra_requirements") or "").strip()
            setup = _decode_script_b64(row.get("setup_script_b64") or "")
            script = _decode_script_b64(row.get("custom_script_b64") or "")
            recipe_id = (row.get("recipe_id") or "").strip()
            is_gated = _bool_from_csv(row.get("is_gated") or "")
            run_custom = _bool_from_csv(row.get("run_custom_script") or "")
            created = (row.get("created_at") or _now_iso()).strip()
            updated = (row.get("updated_at") or created).strip()
            mid = (row.get("model_id") or "").strip()
            fid = (row.get("family_id") or "").strip()
            hf_rid = (row.get("hf_remote_job_id") or "").strip() or None
            art_path = (row.get("remote_artifact_path") or "").strip() or None
            eval_conds = _parse_eval_conditions_csv(row.get("eval_conditions") or "")
            if not mid:
                continue

            if st == JobStatus.running:
                st = JobStatus.queued
                extra = "Re-queued after Space restart (was running)."
                err = f"{err}; {extra}" if err else extra

            if st in (JobStatus.dispatching, JobStatus.remote_running, JobStatus.collecting):
                st = JobStatus.queued
                extra = "Re-queued after Space restart (remote job resume)."
                err = f"{err}; {extra}" if err else extra

            job = Job(
                id=jid,
                model_id=mid,
                family_id=fid,
                status=st,
                created_at=created,
                updated_at=updated,
                error=err,
                submission_notes=notes,
                contact_email=email,
                extra_requirements=extra_req,
                setup_script=setup,
                custom_script=script,
                recipe_id=recipe_id,
                is_gated=is_gated,
                run_custom_script=run_custom,
                hf_remote_job_id=hf_rid,
                remote_artifact_path=art_path,
                eval_conditions=eval_conds,
            )
            _jobs[jid] = job

            if st == JobStatus.queued:
                to_queue.append((created, jid))

    to_queue.sort(key=lambda x: x[0])
    for _, jid in to_queue:
        _work_queue.put(jid)


def _progress_update(job_id: str, done: int, total: int, condition: str) -> None:
    """Cheap in-memory progress update; throttling is done by the UI timer."""
    with _jobs_lock:
        j = _jobs.get(job_id)
        if j is None:
            return
        j.progress_done = int(done)
        j.progress_total = int(total)
        j.progress_condition = condition or ""


def _leaderboard_sort_rows_inplace(rows: list[dict]) -> None:
    """Sort leaderboard CSV rows by Pareto layer (asc), then FFAS score (desc)."""
    from analytics import sort_leaderboard_rows_inplace

    sort_leaderboard_rows_inplace(rows)


def _remote_poll_interval_s() -> float:
    raw = os.environ.get("FFASR_REMOTE_JOB_POLL_S", "10").strip()
    try:
        return float(raw) if raw else 10.0
    except ValueError:
        return 10.0


_DEFAULT_REMOTE_JOB_MAX_WAIT_S = 86400.0  # 24 hours; previously 8h / 4h.
# Extra slack past the Space-side deadline before we declare a timeout.
# Absorbs the brief gap between a worker script exiting cleanly (artifact
# uploaded) and the Hub flipping the job stage to COMPLETED.
_REMOTE_DEADLINE_GRACE_S = 90.0


def _remote_max_wait_s() -> float:
    raw = os.environ.get(
        "FFASR_REMOTE_JOB_MAX_WAIT_S", str(_DEFAULT_REMOTE_JOB_MAX_WAIT_S)
    ).strip()
    try:
        return float(raw) if raw else _DEFAULT_REMOTE_JOB_MAX_WAIT_S
    except ValueError:
        return _DEFAULT_REMOTE_JOB_MAX_WAIT_S


def remote_max_concurrent_jobs() -> int:
    """Max Hub Jobs in flight at once when ``FFASR_REMOTE_JOBS=1`` (default 4)."""
    raw = os.environ.get(
        "FFASR_REMOTE_MAX_CONCURRENT_JOBS", str(_DEFAULT_REMOTE_MAX_CONCURRENT)
    ).strip()
    try:
        n = int(raw) if raw else _DEFAULT_REMOTE_MAX_CONCURRENT
    except ValueError:
        n = _DEFAULT_REMOTE_MAX_CONCURRENT
    return max(1, min(n, 32))


def _remote_in_flight_statuses() -> tuple[JobStatus, ...]:
    return (JobStatus.dispatching, JobStatus.remote_running, JobStatus.collecting)


def _count_remote_in_flight() -> int:
    with _jobs_lock:
        return sum(1 for j in _jobs.values() if j.status in _remote_in_flight_statuses())


def _list_remote_in_flight_ids() -> list[str]:
    with _jobs_lock:
        return [
            j.id
            for j in _jobs.values()
            if j.status in _remote_in_flight_statuses()
        ]


def _list_active_eval_jobs() -> list[Job]:
    """Jobs currently using a remote or in-process eval slot."""
    with _jobs_lock:
        return [
            j
            for j in _jobs.values()
            if j.status
            in (
                JobStatus.running,
                *_remote_in_flight_statuses(),
            )
        ]


def _fail_job(job_id: str, error: str, *, finish_queue: bool = True) -> None:
    with _jobs_lock:
        j = _jobs.get(job_id)
        if j:
            j.status = JobStatus.failed
            j.error = (error or "Unknown error")[:8000]
            _touch(j)
        _prune_jobs()
    _remote_deadlines.pop(job_id, None)
    _persist_jobs()
    if finish_queue:
        try:
            _work_queue.task_done()
        except ValueError:
            pass


def _succeed_job(job_id: str, result: dict) -> None:
    with _jobs_lock:
        j = _jobs.get(job_id)
        if j:
            j.status = JobStatus.done
            j.result = result
            j.error = None
            j.progress_condition = ""
            _touch(j)
        _prune_jobs()
    _remote_deadlines.pop(job_id, None)
    _persist_jobs()
    try:
        _work_queue.task_done()
    except ValueError:
        pass


def _merge_eval_result_to_leaderboard(
    result: dict,
    submitted_at_iso: str,
    submission_notes: str,
    contact_email: str = "",
    *,
    replace_existing: bool = False,
    merge_partial: bool = False,
) -> None:
    from init import (
        invalidate_results_cache,
        leaderboard_row_from_eval_result,
        load_raw_results,
        merge_leaderboard_row_from_eval_result,
        normalize_legacy_csv_row,
        save_raw_results,
    )

    if merge_partial:
        merge_leaderboard_row_from_eval_result(
            result,
            submitted_at_iso,
            submission_notes=submission_notes,
            contact_email=contact_email,
        )
        return

    model_id = str(result.get("model_id", "")).strip()
    rows = load_raw_results()
    if replace_existing and model_id:
        existing = [i for i, r in enumerate(rows) if (r.get("model_id") or "").strip() == model_id]
        for i in sorted(existing, reverse=True):
            rows.pop(i)

    new_row = leaderboard_row_from_eval_result(
        result,
        submitted_at_iso,
        submission_notes=submission_notes,
        contact_email=contact_email,
    )
    normalize_legacy_csv_row(new_row)
    rows.append(new_row)
    _leaderboard_sort_rows_inplace(rows)
    save_raw_results(rows)
    invalidate_results_cache()


def _parse_eval_conditions_csv(raw: str) -> tuple[str, ...] | None:
    from benchmark.dataset import resolve_condition_keys

    parts = [p.strip() for p in (raw or "").split(",") if p.strip()]
    if not parts:
        return None
    keys = resolve_condition_keys(parts)
    from benchmark.dataset import PACKED_FILES

    if set(keys) == set(PACKED_FILES.keys()):
        return None
    return keys


def _encode_eval_conditions_csv(keys: tuple[str, ...] | None) -> str:
    if not keys:
        return ""
    return ",".join(keys)


def normalize_moderator_eval_conditions(
    selected: list[str] | None,
) -> tuple[str, ...] | None:
    """``None`` = all packed conditions; otherwise a validated non-empty subset."""
    from benchmark.dataset import PACKED_FILES, resolve_condition_keys

    if not selected:
        return None
    keys = resolve_condition_keys(selected)
    if not keys:
        raise ValueError("Select at least one dataset to evaluate.")
    if set(keys) == set(PACKED_FILES.keys()):
        return None
    return keys


def eval_condition_checkbox_defaults() -> tuple[list[str], list[str]]:
    """(labels, values) for Gradio CheckboxGroup defaults (all selected)."""
    from benchmark.dataset import CONDITION_UI_CHOICES

    labels = [lbl for lbl, _ in CONDITION_UI_CHOICES]
    values = [key for _, key in CONDITION_UI_CHOICES]
    return labels, values


def _job_is_partial_eval(job: Job | None) -> bool:
    return bool(job and job.eval_conditions)


def _load_artifact_json_from_bucket(artifact_path: str) -> dict:
    """Download and parse a remote eval JSON artifact from the Hub bucket."""
    from storage import STORAGE_BACKEND, download_bucket_file

    if STORAGE_BACKEND != "hf_bucket":
        raise RuntimeError("Artifact import requires STORAGE_BACKEND='hf_bucket'.")
    local_path = download_bucket_file(artifact_path)
    try:
        with open(local_path, "r", encoding="utf-8") as f:
            return json.load(f)
    finally:
        try:
            os.unlink(local_path)
        except Exception:
            pass


def _submission_fields_for_artifact_import(
    data: dict, artifact_path: str, notes_override: str, email_override: str
) -> tuple[str, str]:
    notes = (notes_override or "").strip()[:4000]
    email = (email_override or "").strip()[:254]
    if notes and email:
        return notes, email
    space_job_id = str(data.get("job_id") or "").strip()
    with _jobs_lock:
        for j in _jobs.values():
            if space_job_id and j.id == space_job_id:
                if not notes:
                    notes = (j.submission_notes or "").strip()[:4000]
                if not email:
                    email = (j.contact_email or "").strip()[:254]
                return notes, email
            if (j.remote_artifact_path or "").strip() == artifact_path:
                if not notes:
                    notes = (j.submission_notes or "").strip()[:4000]
                if not email:
                    email = (j.contact_email or "").strip()[:254]
                return notes, email
    return notes, email


def _submission_notes_for_artifact_import(
    data: dict, artifact_path: str, override: str
) -> str:
    notes, _ = _submission_fields_for_artifact_import(data, artifact_path, override, "")
    return notes


def _mark_job_done_for_artifact(
    data: dict, artifact_path: str, result: dict
) -> str | None:
    """If a tracked queue job matches, mark it done. Returns matched job id or None."""
    space_job_id = str(data.get("job_id") or "").strip()
    matched: Job | None = None
    with _jobs_lock:
        for j in _jobs.values():
            if space_job_id and j.id == space_job_id:
                matched = j
                break
            if (j.remote_artifact_path or "").strip() == artifact_path:
                matched = j
                break
        if matched is not None:
            matched.status = JobStatus.done
            matched.result = result
            matched.error = None
            if not (matched.remote_artifact_path or "").strip():
                matched.remote_artifact_path = artifact_path
            _touch(matched)
    if matched is not None:
        _persist_jobs()
        return matched.id
    return None


def import_artifact_to_leaderboard(
    artifact_ref: str,
    secret: str,
    *,
    replace_existing: bool = False,
    submission_notes: str = "",
) -> tuple[bool, str]:
    """
    Moderator-only: load a bucket JSON artifact and merge its result into leaderboard.csv.

    ``artifact_ref`` may be a file name (``abc123.json``), job id (``abc123``), or full bucket path.
    """
    ok, msg = _moderator_secret_ok(secret)
    if not ok:
        return False, msg

    from evaluation.remote_artifact import extract_result_or_raise, normalize_artifact_bucket_path
    from init import (
        invalidate_results_cache,
        leaderboard_row_from_eval_result,
        load_raw_results,
        normalize_legacy_csv_row,
        save_raw_results,
    )
    import analytics

    try:
        artifact_path = normalize_artifact_bucket_path(artifact_ref)
    except ValueError as e:
        return False, str(e)

    try:
        data = _load_artifact_json_from_bucket(artifact_path)
    except Exception as e:
        return False, f"Could not load artifact <code>{_escape_html(artifact_path)}</code>: {e}"

    try:
        result = extract_result_or_raise(data)
    except Exception as e:
        return False, f"Artifact is not a successful evaluation: {e}"

    model_id = str(result.get("model_id", "")).strip()
    if not model_id:
        return False, "Artifact result is missing model_id."

    notes, email = _submission_fields_for_artifact_import(
        data, artifact_path, submission_notes, ""
    )
    rows = load_raw_results()
    existing = [i for i, r in enumerate(rows) if (r.get("model_id") or "").strip() == model_id]

    if existing and not replace_existing:
        row = dict(rows[existing[0]])
        normalize_legacy_csv_row(row)
        avg = analytics._avg_wer_for_row(row)
        avg_txt = f"{avg * 100:.2f}%" if avg != float("inf") else "N/A"
        return False, (
            f"Model <code>{_escape_html(model_id)}</code> is already on the leaderboard "
            f"(Avg WER {avg_txt}). Enable "
            f"<strong>Replace existing row</strong> to overwrite."
        )

    if existing and replace_existing:
        for i in sorted(existing, reverse=True):
            rows.pop(i)

    submitted_at = _now_iso()
    new_row = leaderboard_row_from_eval_result(
        result, submitted_at, submission_notes=notes, contact_email=email
    )
    normalize_legacy_csv_row(new_row)
    rows.append(new_row)
    _leaderboard_sort_rows_inplace(rows)
    save_raw_results(rows)
    invalidate_results_cache()

    avg = analytics._avg_wer_for_row(new_row)
    avg_txt = f"{avg * 100:.2f}%" if avg != float("inf") else "N/A"
    action = "Replaced" if existing else "Added"
    matched_job = _mark_job_done_for_artifact(data, artifact_path, result)
    job_bit = f" Matched queue job <code>{_escape_html(matched_job)}</code> marked done." if matched_job else ""

    return True, (
        f"{action} <strong>{_escape_html(model_id)}</strong> from "
        f"<code>{_escape_html(artifact_path)}</code>. "
        f"Average WER: <strong>{avg_txt}</strong>.{job_bit}"
    )


def _remote_collect_result(job_id: str, hf_id: str, jobs_token: str) -> dict:
    from evaluation.remote_artifact import extract_result_or_raise
    from storage import download_bucket_file

    with _jobs_lock:
        j = _jobs.get(job_id)
        if not j:
            raise RuntimeError("internal: job not found")
        artifact_path = str(j.remote_artifact_path or "").strip()
    if not artifact_path:
        raise RuntimeError("internal: missing remote artifact path")

    with _jobs_lock:
        j2 = _jobs.get(job_id)
        if j2:
            j2.status = JobStatus.collecting
            _touch(j2)
    _persist_jobs()

    # HF dataset bucket uploads are sometimes briefly not readable right after
    # the worker uploaded the JSON (especially with Xet). Retry a few times
    # with light backoff so a single 404 doesn't permanently fail an otherwise
    # successful run.
    last_err: Exception | None = None
    local_path: str | None = None
    for attempt in range(5):
        try:
            local_path = download_bucket_file(artifact_path)
            break
        except Exception as e:
            last_err = e
            msg = str(e).lower()
            transient = (
                "404" in msg
                or "not found" in msg
                or "entrynotfound" in msg
                or "no such" in msg
                or "timed out" in msg
                or "timeout" in msg
            )
            if not transient or attempt == 4:
                raise
            time.sleep(2.0 * (2 ** attempt))
    if local_path is None:
        # Shouldn't reach here, but keep mypy / runtime safe.
        raise last_err or RuntimeError("artifact download failed")

    try:
        with open(local_path, "r", encoding="utf-8") as f:
            data = json.load(f)
    finally:
        try:
            os.unlink(local_path)
        except Exception:
            pass

    return extract_result_or_raise(data)


def _remote_dispatch_job(job_id: str, mid: str, fid: str, jobs_token: str) -> str:
    """Submit Hub Job if needed; return ``hf_remote_job_id``."""
    import remote_jobs
    from evaluation.remote_artifact import default_remote_artifact_path

    with _jobs_lock:
        j = _jobs.get(job_id)
        if not j:
            raise RuntimeError("internal: job not found")
        if not (j.remote_artifact_path or "").strip():
            j.remote_artifact_path = default_remote_artifact_path(job_id)
            _touch(j)
        artifact_path = str(j.remote_artifact_path).strip()
        existing_hf = (j.hf_remote_job_id or "").strip()

    if existing_hf:
        with _jobs_lock:
            j2 = _jobs.get(job_id)
            if j2 and j2.status != JobStatus.remote_running:
                j2.status = JobStatus.remote_running
                _touch(j2)
        _persist_jobs()
        _remote_deadlines[job_id] = time.monotonic() + _remote_max_wait_s()
        return existing_hf

    with _jobs_lock:
        j3 = _jobs.get(job_id)
        if j3:
            j3.status = JobStatus.dispatching
            _touch(j3)
    _persist_jobs()

    with _jobs_lock:
        j_dispatch = _jobs.get(job_id)
        extra_req = (j_dispatch.extra_requirements or "") if j_dispatch else ""
        setup_script = (j_dispatch.setup_script or "") if j_dispatch else ""
        custom_script = (j_dispatch.custom_script or "") if j_dispatch else ""
        recipe_id = (j_dispatch.recipe_id or "") if j_dispatch else ""
        run_custom = bool(j_dispatch and j_dispatch.run_custom_script)
        eval_conds = j_dispatch.eval_conditions if j_dispatch else None

    info = remote_jobs.submit_eval_job(
        model_id=mid,
        family_id=fid,
        space_job_id=job_id,
        artifact_path=artifact_path,
        token=jobs_token,
        extra_requirements=extra_req,
        setup_script=setup_script,
        custom_script=custom_script,
        recipe_id=recipe_id,
        run_custom_script=run_custom,
        eval_conditions=eval_conds,
    )
    hf_id = info.id
    with _jobs_lock:
        j4 = _jobs.get(job_id)
        if j4:
            j4.hf_remote_job_id = hf_id
            j4.status = JobStatus.remote_running
            _touch(j4)
    _persist_jobs()
    _remote_deadlines[job_id] = time.monotonic() + _remote_max_wait_s()
    return hf_id


def _remote_start_queued_job(job_id: str, jobs_token: str) -> None:
    """Move a queued job onto Hub Jobs (duplicate check + dispatch)."""
    from init import load_raw_results

    with _jobs_lock:
        j = _jobs.get(job_id)
        if j is None or j.status != JobStatus.queued:
            try:
                _work_queue.task_done()
            except ValueError:
                pass
            return
        mid = j.model_id
        fid = j.family_id
        notes = j.submission_notes or ""
        email = j.contact_email or ""
        j.status = JobStatus.running
        j.progress_done = 0
        j.progress_total = 0
        j.progress_condition = ""
        _touch(j)
    _persist_jobs()

    rows = load_raw_results()
    with _jobs_lock:
        j_chk = _jobs.get(job_id)
        replace_lb = bool(j_chk and j_chk.replace_leaderboard)
        partial = _job_is_partial_eval(j_chk)
    if not replace_lb and not partial and any(r["model_id"] == mid for r in rows):
        _fail_job(job_id, "Model already on leaderboard (skipped duplicate race).")
        return

    global _running_job_id
    _running_job_id = job_id

    try:
        _remote_dispatch_job(job_id, mid, fid, jobs_token)
    except Exception as e:
        _fail_job(job_id, str(e))
    finally:
        with _jobs_lock:
            if _running_job_id == job_id:
                _running_job_id = None


def _remote_tick_job(job_id: str, jobs_token: str) -> None:
    """Poll one remote job once; on completion merge CSV or mark failed."""
    import remote_jobs
    from huggingface_hub._jobs_api import JobStage

    with _jobs_lock:
        j = _jobs.get(job_id)
        if j is None or j.status not in _remote_in_flight_statuses():
            return
        hf_id = (j.hf_remote_job_id or "").strip()
        if not hf_id:
            return
        mid = j.model_id
        fid = j.family_id
        notes = j.submission_notes or ""
        email = j.contact_email or ""

    # Grace window absorbs the brief gap between the worker script returning
    # rc=0 (and uploading the JSON artifact) and the Hub flipping the job's
    # stage to COMPLETED. Without this, a tick that arrives ε seconds past
    # the deadline would fail an already-successful run with a misleading
    # "exceeded max wait" message.
    deadline = _remote_deadlines.get(job_id)
    deadline_hit = (
        deadline is not None
        and time.monotonic() > deadline + _REMOTE_DEADLINE_GRACE_S
    )

    try:
        info = remote_jobs.inspect_job_once(hf_id, token=jobs_token)
    except Exception:
        # If the Hub API is unavailable AND we're already past the wait
        # budget, give up cleanly. Otherwise wait for the next tick.
        if deadline_hit:
            _fail_job(
                job_id,
                f"Remote Hub Job exceeded max wait ({_remote_max_wait_s():.0f}s); "
                "Hub inspect_job unavailable.",
            )
        return

    stage = info.status.stage if info.status else None

    # 1) Always honor a terminal Hub state, even if the Space-side deadline
    #    already elapsed -- a completed job's artifact should be collected,
    #    not thrown away.
    if stage == JobStage.COMPLETED:
        try:
            result = _remote_collect_result(job_id, hf_id, jobs_token)
            with _jobs_lock:
                j_done = _jobs.get(job_id)
                replace_lb = bool(j_done and j_done.replace_leaderboard)
                partial = _job_is_partial_eval(j_done)
            _merge_eval_result_to_leaderboard(
                result,
                _now_iso(),
                notes,
                email,
                replace_existing=replace_lb and not partial,
                merge_partial=partial,
            )
            with _jobs_lock:
                j_clr = _jobs.get(job_id)
                if j_clr:
                    j_clr.replace_leaderboard = False
            _succeed_job(job_id, result)
        except Exception as e:
            _fail_job(job_id, str(e))
        return

    if stage in (JobStage.ERROR, JobStage.CANCELED, JobStage.DELETED):
        _fail_job(job_id, remote_jobs.describe_job_failure(info, token=jobs_token))
        return

    # 2) Job is genuinely still running. Only now enforce the Space-side
    #    deadline (the Hub has its own FFASR_REMOTE_JOB_TIMEOUT as a backstop).
    if deadline_hit:
        try:
            remote_jobs.cancel_remote_job(hf_id, token=jobs_token)
        except Exception:
            pass
        _fail_job(job_id, f"Remote Hub Job exceeded max wait ({_remote_max_wait_s():.0f}s).")
        return


def _remote_parallel_worker_loop() -> None:
    """Dispatch up to N Hub Jobs and poll them concurrently (N = remote_max_concurrent_jobs)."""
    import remote_jobs
    from storage import HF_TOKEN, require_token_for_ffasr_jobs

    jobs_token = require_token_for_ffasr_jobs()
    if not HF_TOKEN:
        raise RuntimeError("HF_TOKEN is required when FFASR_REMOTE_JOBS=1.")

    poll_s = _remote_poll_interval_s()
    max_slots = remote_max_concurrent_jobs()

    while True:
        while _count_remote_in_flight() < max_slots:
            try:
                job_id = _work_queue.get_nowait()
            except queue.Empty:
                break
            _remote_start_queued_job(job_id, jobs_token)

        active = _list_remote_in_flight_ids()
        if active:
            for jid in active:
                _remote_tick_job(jid, jobs_token)
            time.sleep(poll_s)
            continue

        if _work_queue.qsize() == 0:
            try:
                job_id = _work_queue.get(timeout=poll_s)
            except queue.Empty:
                continue
            _remote_start_queued_job(job_id, jobs_token)
        else:
            time.sleep(min(poll_s, 2.0))


def ensure_worker_started() -> None:
    """Start background Hub Jobs worker after restoring persisted queue (once per process)."""
    global _worker_started
    _load_persisted_jobs_once()
    with _worker_lock:
        if _worker_started:
            return
        import remote_jobs as _rj

        if not _rj.remote_jobs_enabled():
            raise RuntimeError(
                "FFASR_REMOTE_JOBS=1 is required. This Space dispatches evaluations to "
                "Hugging Face Hub Jobs and does not run ASR models locally."
            )
        t = threading.Thread(target=_remote_parallel_worker_loop, name="ffasr-remote-worker", daemon=True)
        t.start()
        _worker_started = True


def _ensure_worker() -> None:
    """Alias used by queue UI helpers."""
    ensure_worker_started()


def _worker_unavailable_html(exc: Exception) -> str:
    return (
        "<p style='color:orange'><strong>Queue unavailable:</strong> "
        f"{_escape_html(str(exc))}</p>"
    )


def _model_in_flight(model_id: str) -> bool:
    with _jobs_lock:
        for j in _jobs.values():
            if j.model_id != model_id:
                continue
            if j.status in (
                JobStatus.pending_moderation,
                JobStatus.queued,
                JobStatus.running,
                JobStatus.dispatching,
                JobStatus.remote_running,
                JobStatus.collecting,
            ):
                return True
    return False


def _pending_moderation_count() -> int:
    with _jobs_lock:
        return sum(1 for j in _jobs.values() if j.status == JobStatus.pending_moderation)


def enqueue(
    model_id: str,
    family_id: str,
    submission_notes: str = "",
    *,
    contact_email: str = "",
    extra_requirements: str = "",
    setup_script: str = "",
    custom_script: str = "",
    recipe_id: str = "",
    is_gated: bool = False,
) -> tuple[str, int, str | None, bool]:
    """
    Enqueue an evaluation job.

    Returns (job_id, position_or_count, error_message, awaiting_moderation).
    When awaiting_moderation is True, the job is not in the execution queue yet.
    """
    import remote_jobs

    if not remote_jobs.remote_jobs_enabled():
        return "", 0, "remote_jobs_required", False

    _ensure_worker()

    from init import load_raw_results

    if moderation_misconfigured():
        return "", 0, "moderation_misconfigured", False

    if _work_queue.qsize() >= _MAX_QUEUE_BACKLOG and not moderation_active():
        return "", 0, "queue_full", False

    if _model_in_flight(model_id):
        return "", 0, f"Model '{model_id}' is already submitted, queued, or running.", False

    existing = load_raw_results()
    for row in existing:
        if row["model_id"] == model_id:
            return "", 0, "already_in_csv", False

    if moderation_active() and _pending_moderation_count() >= _MAX_PENDING_MODERATION:
        return "", 0, "pending_moderation_full", False

    job_id = str(uuid.uuid4())[:8]
    created = _now_iso()
    notes_clean = (submission_notes or "").strip()[:4000]
    try:
        email_clean = sanitize_contact_email(contact_email)
        from recipes.registry import apply_recipe_to_submission

        req_lines = parse_requirements_lines(extra_requirements)
        extra_req_clean = "\n".join(req_lines)
        setup_clean = sanitize_setup_script(setup_script)
        script_clean = sanitize_custom_script(custom_script)
        extra_req_clean, setup_clean, script_clean, resolved_recipe = apply_recipe_to_submission(
            model_id,
            recipe_id or None,
            extra_req_clean,
            setup_clean,
            script_clean,
        )
        recipe_clean = (resolved_recipe or recipe_id or "").strip().lower()[:64]
    except Exception as e:
        return "", 0, f"Invalid submission fields: {e}", False

    awaiting = moderation_active()
    status = JobStatus.pending_moderation if awaiting else JobStatus.queued

    uses_custom_stack = bool(
        script_clean.strip() or setup_clean.strip() or recipe_clean
    )

    job = Job(
        id=job_id,
        model_id=model_id,
        family_id=family_id,
        status=status,
        created_at=created,
        updated_at=created,
        submission_notes=notes_clean,
        contact_email=email_clean,
        extra_requirements=extra_req_clean,
        setup_script=setup_clean,
        custom_script=script_clean,
        recipe_id=recipe_clean,
        is_gated=bool(is_gated),
        run_custom_script=uses_custom_stack,
    )

    with _jobs_lock:
        _jobs[job_id] = job

    _persist_jobs()

    if awaiting:
        pos = _pending_moderation_count()
        return job_id, pos, None, True

    if _work_queue.qsize() >= _MAX_QUEUE_BACKLOG:
        with _jobs_lock:
            _jobs.pop(job_id, None)
        return "", 0, "queue_full", False

    _work_queue.put(job_id)
    position = _work_queue.qsize()
    return job_id, position, None, False


def approve_job(
    job_id: str,
    secret: str,
    *,
    run_custom_script: bool = False,
    eval_conditions: list[str] | None = None,
) -> tuple[bool, str]:
    """Move a pending job into the execution queue (moderator only)."""
    if not moderation_active():
        return False, "Moderation is not active on this Space."
    if not _check_moderator_secret(secret):
        return False, "Invalid moderator secret."
    job_id = job_id.strip()
    if not job_id:
        return False, "Enter a job ID."

    try:
        conds = normalize_moderator_eval_conditions(eval_conditions)
    except ValueError as e:
        return False, str(e)

    with _jobs_lock:
        job = _jobs.get(job_id)
        if not job or job.status != JobStatus.pending_moderation:
            return False, "Job not found or not awaiting approval."
        if _work_queue.qsize() >= _MAX_QUEUE_BACKLOG:
            return False, "Execution queue is full; try again in a moment."

        job.status = JobStatus.queued
        # Use custom stack when evaluate/setup/recipe is provided.
        job.run_custom_script = bool(
            (job.custom_script or "").strip()
            or (job.setup_script or "").strip()
            or (job.recipe_id or "").strip()
        )
        job.eval_conditions = conds
        job.replace_leaderboard = False
        _touch(job)

    _work_queue.put(job_id)
    _persist_jobs()
    _ensure_worker()
    max_n = remote_max_concurrent_jobs()
    custom_note = ""
    cond_note = ""
    with _jobs_lock:
        j = _jobs.get(job_id)
        if j and j.run_custom_script and (j.custom_script or "").strip():
            custom_note = " Custom script will run on the Hub Job."
        if j and j.eval_conditions:
            cond_note = f" Evaluating: {', '.join(j.eval_conditions)} (others unchanged on success)."
    return True, (
        f"Approved job {job_id}. Up to {max_n} Hub Jobs may run in parallel; "
        f"this job starts when a slot is free.{custom_note}{cond_note}"
    )


def reject_job(job_id: str, secret: str) -> tuple[bool, str]:
    """Reject a pending job (moderator only)."""
    if not moderation_active():
        return False, "Moderation is not active on this Space."
    if not _check_moderator_secret(secret):
        return False, "Invalid moderator secret."
    job_id = job_id.strip()
    if not job_id:
        return False, "Enter a job ID."

    with _jobs_lock:
        job = _jobs.get(job_id)
        if not job or job.status != JobStatus.pending_moderation:
            return False, "Job not found or not awaiting approval."
        job.status = JobStatus.failed
        job.error = "Rejected by moderator."
        _touch(job)
        _prune_jobs()

    _persist_jobs()
    return True, f"Rejected job {job_id}."


def verify_moderator_secret(secret: str) -> tuple[bool, str]:
    """Check moderator secret for UI unlock and privileged actions."""
    if not MODERATOR_SECRET:
        return False, "Moderator secret is not configured (set FFASR_MODERATOR_SECRET)."
    if not _check_moderator_secret(secret):
        return False, "Invalid moderator secret."
    return True, ""


def _moderator_secret_ok(secret: str) -> tuple[bool, str]:
    """Shared gate for destructive / queue actions (needs FFASR_MODERATOR_SECRET)."""
    return verify_moderator_secret(secret)


def moderation_locked_placeholder_html() -> str:
    """Neutral HTML shown before the moderator secret unlocks the panel."""
    return "<p><em>Moderator tools are locked. Enter the secret above and click Unlock.</em></p>"


def _job_can_retry(status: JobStatus) -> bool:
    """Moderator may re-run jobs that are not actively executing on Hub."""
    if status in (
        JobStatus.running,
        JobStatus.dispatching,
        JobStatus.remote_running,
        JobStatus.collecting,
        JobStatus.pending_moderation,
    ):
        return False
    return status in (JobStatus.failed, JobStatus.done, JobStatus.queued)


def retry_failed_job(
    job_id: str,
    secret: str,
    *,
    eval_conditions: list[str] | None = None,
) -> tuple[bool, str]:
    """Re-queue a job for another evaluation run (moderator only).

    Allowed for failed, done, and queued jobs. Successful re-runs replace the
    existing leaderboard row for that model when one is present.
    """
    ok, msg = _moderator_secret_ok(secret)
    if not ok:
        return False, msg
    job_id = job_id.strip()
    if not job_id:
        return False, "Select a job."

    try:
        conds = normalize_moderator_eval_conditions(eval_conditions)
    except ValueError as e:
        return False, str(e)

    with _jobs_lock:
        job = _jobs.get(job_id)
        if not job:
            return False, "Job not found."
        if not _job_can_retry(job.status):
            return (
                False,
                "Cannot retry while the job is running or awaiting moderation. "
                "Wait for it to finish, or approve/reject pending jobs first.",
            )
        if _work_queue.qsize() >= _MAX_QUEUE_BACKLOG:
            return False, "Execution queue is full; try again later."
        was_queued = job.status == JobStatus.queued
        job.status = JobStatus.queued
        job.error = None
        job.result = None
        job.hf_remote_job_id = None
        job.remote_artifact_path = None
        job.progress_done = 0
        job.progress_total = 0
        job.progress_condition = ""
        job.eval_conditions = conds
        job.replace_leaderboard = conds is None
        _touch(job)

    if not was_queued:
        _work_queue.put(job_id)
    _persist_jobs()
    _ensure_worker()
    cond_note = ""
    with _jobs_lock:
        j = _jobs.get(job_id)
        if j and j.eval_conditions:
            cond_note = (
                f" Only {', '.join(j.eval_conditions)} will run; "
                "existing leaderboard WER columns for other datasets are kept."
            )
        elif j and j.replace_leaderboard:
            cond_note = " Full re-eval; the leaderboard row will be replaced on success."
    return (
        True,
        f"Re-queued job {job_id}; it will run after jobs ahead of it.{cond_note}"
    )


def retry_all_eligible_jobs(secret: str) -> tuple[bool, str]:
    """Re-queue every retry-eligible job against the full benchmark (all datasets).

    "Retry-eligible" matches :func:`_job_can_retry` — i.e. ``failed``, ``done``, or
    ``queued``. Jobs that are running, dispatching, awaiting moderation, etc. are left
    untouched. ``eval_conditions`` is forced to ``None`` (full benchmark) so that on
    success the existing leaderboard row is replaced — matching the semantics
    described in the moderator panel for a full re-run.

    Stops early (with a partial-success message) if the work queue fills up, so we
    never silently drop retries on the floor.
    """
    ok, msg = _moderator_secret_ok(secret)
    if not ok:
        return False, msg

    requeued: list[str] = []
    skipped_running: list[str] = []
    skipped_pending: list[str] = []
    capacity_hit = False

    job_ids_to_enqueue: list[str] = []

    with _jobs_lock:
        snapshot = list(_jobs.values())
        snapshot.sort(key=lambda j: j.updated_at or j.created_at)
        for job in snapshot:
            if job.status == JobStatus.pending_moderation:
                skipped_pending.append(job.id)
                continue
            if not _job_can_retry(job.status):
                skipped_running.append(job.id)
                continue
            # Approximate current backlog while we still hold the lock; this keeps
            # us within ``_MAX_QUEUE_BACKLOG`` even when several retries land at once.
            if _work_queue.qsize() + len(job_ids_to_enqueue) >= _MAX_QUEUE_BACKLOG:
                capacity_hit = True
                break
            was_queued = job.status == JobStatus.queued
            job.status = JobStatus.queued
            job.error = None
            job.result = None
            job.hf_remote_job_id = None
            job.remote_artifact_path = None
            job.progress_done = 0
            job.progress_total = 0
            job.progress_condition = ""
            job.eval_conditions = None
            job.replace_leaderboard = True
            _touch(job)
            requeued.append(job.id)
            if not was_queued:
                job_ids_to_enqueue.append(job.id)

    for jid in job_ids_to_enqueue:
        _work_queue.put(jid)
    if requeued:
        _persist_jobs()
        _ensure_worker()

    parts: list[str] = []
    if requeued:
        parts.append(
            f"Re-queued {len(requeued)} job(s) against the full benchmark; "
            "on success each leaderboard row will be replaced."
        )
    else:
        parts.append("No retry-eligible jobs were found.")
    if skipped_pending:
        parts.append(
            f"Skipped {len(skipped_pending)} job(s) awaiting moderation "
            "(approve or reject those manually)."
        )
    if skipped_running:
        parts.append(
            f"Skipped {len(skipped_running)} job(s) currently running or dispatching."
        )
    if capacity_hit:
        parts.append(
            f"Stopped early: the execution queue hit its backlog cap "
            f"({_MAX_QUEUE_BACKLOG}); re-click to enqueue the rest once it drains."
        )
    return bool(requeued), " ".join(parts)


def remove_job_entry(job_id: str, secret: str) -> tuple[bool, str]:
    """Remove a job from tracking (not allowed while running). Moderator only."""
    ok, msg = _moderator_secret_ok(secret)
    if not ok:
        return False, msg
    job_id = job_id.strip()
    if not job_id:
        return False, "Select a job."

    with _jobs_lock:
        job = _jobs.get(job_id)
        if not job:
            return False, "Job not found."
        if job.status == JobStatus.running:
            return False, "Cannot remove a running job; wait for it to finish."
        _jobs.pop(job_id, None)
        _prune_jobs()

    _persist_jobs()
    return True, f"Removed job {job_id} from the list."


def list_pending_moderation_jobs() -> list[Job]:
    with _jobs_lock:
        return [j for j in _jobs.values() if j.status == JobStatus.pending_moderation]


_JOB_NON_EDITABLE_STATUSES = (
    JobStatus.running,
    JobStatus.dispatching,
    JobStatus.remote_running,
    JobStatus.collecting,
)


def update_job_script_and_requirements(
    job_id: str,
    secret: str,
    *,
    extra_requirements: str,
    setup_script: str = "",
    custom_script: str,
    recipe_id: str = "",
) -> tuple[bool, str]:
    """Update stored script/requirements for a job (moderator only)."""
    ok, msg = _moderator_secret_ok(secret)
    if not ok:
        return False, msg
    job_id = job_id.strip()
    if not job_id:
        return False, "No job selected."

    with _jobs_lock:
        job = _jobs.get(job_id)
        if not job:
            return False, "Job not found."

    try:
        from recipes.registry import apply_recipe_to_submission

        setup = sanitize_setup_script(setup_script)
        script = sanitize_custom_script(custom_script)
        reqs = extra_requirements or ""
        reqs, setup, script, resolved_recipe = apply_recipe_to_submission(
            job.model_id,
            recipe_id or None,
            reqs,
            setup,
            script,
        )
        recipe_clean = (resolved_recipe or recipe_id or "").strip().lower()[:64]
    except Exception as e:
        return False, f"Invalid submission fields: {e}"

    with _jobs_lock:
        job = _jobs.get(job_id)
        if not job:
            return False, "Job not found."
        if job.status in _JOB_NON_EDITABLE_STATUSES:
            return (
                False,
                "Cannot edit submission while the job is running or dispatching.",
            )
        job.extra_requirements = reqs
        job.setup_script = setup
        job.custom_script = script
        job.recipe_id = recipe_clean
        job.run_custom_script = bool(
            script.strip() or setup.strip() or recipe_clean
        )
        _touch(job)

    _persist_jobs()
    return True, f"Saved submission details for job {job_id}."


def _ensure_jobs_loaded_for_display() -> None:
    """Load persisted job state without starting the remote worker (moderator read-only UI)."""
    _load_persisted_jobs_once()


def pending_job_dropdown_choices() -> list[tuple[str, str]]:
    """Gradio (label, value) pairs for pending job IDs."""
    try:
        _ensure_jobs_loaded_for_display()
    except Exception:
        return [("(Queue unavailable)", "")]
    jobs = list_pending_moderation_jobs()
    jobs.sort(key=lambda j: j.created_at)
    if not jobs:
        return [("(No pending jobs)", "")]
    out: list[tuple[str, str]] = []
    for j in jobs:
        label = f"{j.id}: {j.model_id} ({j.family_id})"
        out.append((label, j.id))
    return out


def moderation_action_job_choices() -> list[tuple[str, str]]:
    """Recent jobs for retry/remove dropdown (label shows id, model, status)."""
    try:
        _ensure_jobs_loaded_for_display()
    except Exception:
        return [("(Queue unavailable)", "")]
    with _jobs_lock:
        items = list(_jobs.values())
    items.sort(key=lambda j: j.updated_at or j.created_at, reverse=True)
    items = items[:60]
    if not items:
        return [("(No jobs)", "")]
    out: list[tuple[str, str]] = []
    for j in items:
        short_model = j.model_id.split("/")[-1][:32]
        label = f"{j.id}: {short_model} ({j.status.value})"
        out.append((label, j.id))
    return out


def _escape_html(s: str) -> str:
    return (
        s.replace("&", "&amp;")
        .replace("<", "&lt;")
        .replace(">", "&gt;")
        .replace('"', "&quot;")
    )


def _hub_job_link_html(hf_job_id: str | None) -> str:
    if not (hf_job_id or "").strip():
        return ""
    try:
        import remote_jobs as rj

        url = rj.hub_job_page_url(hf_job_id.strip())
    except Exception:
        return ""
    return (
        f"<a href=\"{_escape_html(url)}\" target=\"_blank\" rel=\"noopener noreferrer\">"
        f"Open Hub Job logs</a>"
    )


def _bucket_artifacts_link_html() -> str:
    try:
        import remote_jobs as rj

        url = rj.bucket_artifact_browser_url()
    except Exception:
        return ""
    return (
        f"<a href=\"{_escape_html(url)}\" target=\"_blank\" rel=\"noopener noreferrer\">"
        f"remote_artifacts folder</a>"
    )


def moderation_list_html() -> str:
    """HTML table of jobs awaiting approval."""
    try:
        _ensure_jobs_loaded_for_display()
    except Exception as e:
        return _worker_unavailable_html(e)
    jobs = list_pending_moderation_jobs()
    jobs.sort(key=lambda j: j.created_at)
    if not jobs:
        return "<p><em>No jobs awaiting approval.</em></p>"
    rows = []
    for j in jobs:
        note = (j.submission_notes or "").strip()
        note_cell = _escape_html(note[:200] + ("…" if len(note) > 200 else "")) if note else "N/A"
        gated = " <span style='color:#b45309'>[gated]</span>" if j.is_gated else ""
        req_n = len(parse_requirements_lines(j.extra_requirements or ""))
        req_bit = f"{req_n} extra req(s)" if req_n else ""
        extras = req_bit if req_bit else "—"
        script_raw = (j.custom_script or "").strip()
        if script_raw:
            max_script = 12000
            truncated = len(script_raw) > max_script
            script_body = script_raw[:max_script]
            if truncated:
                script_body += "\n… (truncated)"
            script_cell = (
                "<details><summary>View script</summary>"
                f"<pre style='max-height:240px;overflow:auto;font-size:0.75em;"
                f"white-space:pre-wrap;margin:0.25rem 0'>{_escape_html(script_body)}</pre>"
                "</details>"
            )
        else:
            script_cell = "—"
        rows.append(
            f"<tr><td><code>{_escape_html(j.id)}</code></td>"
            f"<td><code>{_escape_html(j.model_id)}</code>{gated}</td>"
            f"<td><code>{_escape_html(j.family_id)}</code></td>"
            f"<td style='max-width:140px;font-size:0.85em'>{_escape_html(extras)}</td>"
            f"<td style='max-width:320px;font-size:0.8em;vertical-align:top'>{script_cell}</td>"
            f"<td style='max-width:280px;font-size:0.9em'>{note_cell}</td>"
            f"<td>{_escape_html(j.created_at)}</td></tr>"
        )
    body = "".join(rows)
    return (
        "<table style='width:100%;border-collapse:collapse;font-size:0.95em'>"
        "<thead><tr><th>Job ID</th><th>Model</th><th>Family</th><th>Extras</th>"
        "<th>Script</th><th>Notes</th><th>Submitted (UTC)</th></tr></thead>"
        f"<tbody>{body}</tbody></table>"
    )


def next_up_html(limit: int = 5) -> str:
    """Ordered list of models next in the approved execution queue (Submit tab)."""
    try:
        _ensure_worker()
    except Exception as e:
        return _worker_unavailable_html(e)
    with _jobs_lock:
        queued = [j for j in _jobs.values() if j.status == JobStatus.queued]
    queued.sort(key=lambda j: j.created_at)
    queued = queued[: max(1, int(limit))]
    if not queued:
        return (
            "<div class='next-up-panel' style='font-size:0.9em;opacity:0.85'>"
            "<p><em>No models are waiting in the evaluation queue.</em></p></div>"
        )
    items = "".join(
        f"<li><code>{_escape_html(j.model_id)}</code> "
        f"<span style='opacity:0.75'>(job {_escape_html(j.id)})</span></li>"
        for j in queued
    )
    return (
        "<div class='next-up-panel' style='font-size:0.9em'>"
        f"<p><strong>Next models to evaluate</strong> ({len(queued)} shown):</p>"
        f"<ol style='margin:0.25rem 0 0 1.1rem'>{items}</ol></div>"
    )


_JOB_ROW_STATUS_CLASS: dict[str, str] = {
    "pending_moderation": "ffasr-job-status-pending",
    "queued": "ffasr-job-status-queued",
    "running": "ffasr-job-status-active",
    "dispatching": "ffasr-job-status-active",
    "remote_running": "ffasr-job-status-active",
    "collecting": "ffasr-job-status-active",
    "done": "ffasr-job-status-done",
    "failed": "ffasr-job-status-failed",
}


def job_row_elem_classes(status: str) -> str:
    """CSS classes for a moderator job row (status background + layout)."""
    key = (status or "").strip().lower()
    specific = _JOB_ROW_STATUS_CLASS.get(key, "ffasr-job-status-unknown")
    return f"ffasr-job-row {specific}"


def _job_uses_custom_stack(job: Job) -> bool:
    return bool(
        (job.custom_script or "").strip()
        or (job.setup_script or "").strip()
        or (job.recipe_id or "").strip()
    )


def pending_jobs_for_render(limit: int = 60) -> list[dict[str, Any]]:
    """Structured pending jobs for Gradio @gr.render rows (Approve / Reject / Check)."""
    try:
        _ensure_jobs_loaded_for_display()
    except Exception:
        return []
    jobs = list_pending_moderation_jobs()
    jobs.sort(key=lambda j: j.created_at)
    out: list[dict[str, Any]] = []
    for j in jobs[: max(1, int(limit))]:
        note = (j.submission_notes or "").strip()
        out.append(
            {
                "id": j.id,
                "model_id": j.model_id,
                "family_id": j.family_id,
                "created_at": (j.created_at or "")[:19],
                "contact_email": (j.contact_email or "").strip(),
                "is_gated": j.is_gated,
                "req_count": len(parse_requirements_lines(j.extra_requirements or "")),
                "notes_preview": (
                    note[:120] + ("…" if len(note) > 120 else "") if note else ""
                ),
                "has_custom_script": _job_uses_custom_stack(j),
                "status": JobStatus.pending_moderation.value,
            }
        )
    return out


def recent_jobs_for_render(limit: int = 30) -> list[dict[str, Any]]:
    """Structured recent jobs for Gradio @gr.render rows (Retry / Remove)."""
    try:
        _ensure_jobs_loaded_for_display()
    except Exception:
        return []
    with _jobs_lock:
        items = list(_jobs.values())
    items.sort(key=lambda j: j.updated_at or j.created_at, reverse=True)
    out: list[dict[str, Any]] = []
    for j in items[: max(1, int(limit))]:
        err = (j.error or "").strip()
        try:
            hub = _hub_job_link_html(j.hf_remote_job_id)
        except Exception:
            hub = ""
        out.append(
            {
                "id": j.id,
                "model_id": j.model_id,
                "status": j.status.value,
                "contact_email": (j.contact_email or "").strip(),
                "error": err[:200] + ("…" if len(err) > 200 else ""),
                "hub_link_html": hub,
                "updated_at": (j.updated_at or j.created_at)[:19],
                "can_retry": _job_can_retry(j.status),
                "can_remove": j.status != JobStatus.running,
                "has_custom_script": _job_uses_custom_stack(j),
            }
        )
    return out


def recent_jobs_html(limit: int = 25, *, with_heading: bool = True) -> str:
    """Recent jobs with status (for spotting stuck or failed runs)."""
    try:
        _ensure_jobs_loaded_for_display()
    except Exception as e:
        return _worker_unavailable_html(e)
    with _jobs_lock:
        items = list(_jobs.values())
    items.sort(key=lambda j: j.updated_at or j.created_at, reverse=True)
    items = items[:limit]
    if not items:
        empty = (
            "<p><em>No job history loaded yet. Open <strong>Submit</strong> (queue status refreshes automatically) "
            "or click <strong>Refresh</strong> here to load persisted jobs from storage.</em></p>"
        )
        return empty
    rows = []
    for j in items:
        err = (j.error or "").strip()
        err_cell = _escape_html(err[:120] + ("…" if len(err) > 120 else "")) if err else "N/A"
        hub_link = _hub_job_link_html(j.hf_remote_job_id)
        links = hub_link if hub_link else "N/A"
        if j.status == JobStatus.done and (j.remote_artifact_path or "").strip():
            art = (j.remote_artifact_path or "").strip()
            try:
                from storage import HF_BUCKET_ID

                art_url = f"https://huggingface.co/datasets/{HF_BUCKET_ID}/resolve/main/{art}"
                links = (
                    f"{hub_link} · <a href=\"{_escape_html(art_url)}\" target=\"_blank\" "
                    f"rel=\"noopener noreferrer\">artifact</a>"
                    if hub_link
                    else f"<a href=\"{_escape_html(art_url)}\" target=\"_blank\" "
                    f"rel=\"noopener noreferrer\">artifact</a>"
                )
            except Exception:
                pass
        rows.append(
            f"<tr><td><code>{_escape_html(j.id)}</code></td>"
            f"<td><code>{_escape_html(j.model_id)}</code></td>"
            f"<td>{_escape_html(j.status.value)}</td>"
            f"<td style='max-width:240px;font-size:0.85em'>{err_cell}</td>"
            f"<td style='font-size:0.85em'>{links}</td>"
            f"<td style='font-size:0.85em'>{_escape_html((j.updated_at or j.created_at)[:19])}</td></tr>"
        )
    body = "".join(rows)
    table = (
        "<table style='width:100%;border-collapse:collapse;font-size:0.9em'>"
        "<thead><tr><th>Job</th><th>Model</th><th>Status</th><th>Error / detail</th>"
        "<th>Hub / bucket</th><th>Updated (UTC)</th></tr></thead>"
        f"<tbody>{body}</tbody></table>"
    )
    if with_heading:
        return (
            "<p style='font-size:0.9em;opacity:0.9'><strong>Recent jobs</strong> "
            "(newest first; persisted across restarts)</p>" + table
        )
    return table


def progress_html() -> str:
    """Live progress bar for the currently running job (empty when idle)."""
    try:
        _ensure_worker()
    except Exception as e:
        return _worker_unavailable_html(e)
    active = _list_active_eval_jobs()
    if len(active) > 1:
        max_n = remote_max_concurrent_jobs()
        lines = [
            "<div style='padding:0.5rem 0;font-size:0.9em'>"
            f"<p><strong>{len(active)} evaluations in progress</strong> "
            f"(up to {max_n} parallel Hub Jobs):</p><ul style='margin:0.25rem 0 0.5rem 1.1rem'>"
        ]
        for j in sorted(active, key=lambda x: x.updated_at or x.created_at, reverse=True)[:10]:
            hub = _hub_job_link_html(j.hf_remote_job_id)
            hub_bit = f" · {hub}" if hub else ""
            lines.append(
                f"<li><code>{_escape_html(j.model_id)}</code> "
                f"(job <code>{_escape_html(j.id)}</code>, {j.status.value}){hub_bit}</li>"
            )
        lines.append("</ul></div>")
        return "".join(lines)

    with _jobs_lock:
        jid = _running_job_id
        j = _jobs.get(jid) if jid else None
        if j is None and active:
            j = active[0]
        if j is None:
            return (
                "<div style='padding:0.5rem 0;font-size:0.9em;opacity:0.85'>"
                "<em>No evaluation is currently running.</em></div>"
            )
        done = int(j.progress_done or 0)
        total = int(j.progress_total or 0)
        model = j.model_id
        fam = j.family_id
        cond = j.progress_condition or ""
        job_label = j.id
        status = j.status
        hf_rid = (j.hf_remote_job_id or "").strip() or None
        art_path = (j.remote_artifact_path or "").strip() or None

    remote_extra = ""
    try:
        import remote_jobs as rj

        remote_mode = rj.remote_jobs_enabled()
    except Exception:
        remote_mode = False
    if remote_mode and status in (
        JobStatus.running,
        JobStatus.dispatching,
        JobStatus.remote_running,
        JobStatus.collecting,
    ):
        hub = _hub_job_link_html(hf_rid)
        bucket = _bucket_artifacts_link_html()
        remote_extra = (
            "<p style='margin:0.35rem 0 0 0;font-size:0.9em'>"
            f"<strong>Remote eval:</strong> status <code>{_escape_html(status.value)}</code>"
        )
        if hub:
            remote_extra += f" · {hub}"
        elif status == JobStatus.dispatching:
            remote_extra += " · submitting Hub Job…"
        if art_path:
            remote_extra += (
                f" · expected artifact <code>{_escape_html(art_path)}</code> "
                f"(uploaded only on success; browse {_bucket_artifacts_link_html()})"
            )
        elif bucket:
            remote_extra += f" · bucket {_bucket_artifacts_link_html()}"
        remote_extra += "</p>"

    if total <= 0:
        inner = (
            "<div style='width:40%;height:100%;background:#38BFA1;"
            "background-image:linear-gradient(90deg,#38BFA1,#3DFFA3,#38BFA1);"
            "background-size:200% 100%;animation:ffasr-indet 1.6s linear infinite;'></div>"
        )
        pct_label = "preparing…"
    else:
        pct = max(0.0, min(100.0, 100.0 * done / total))
        inner = (
            f"<div style='height:100%;width:{pct:.1f}%;background:#38BFA1;"
            "transition:width 0.4s ease-out'></div>"
        )
        cond_txt = f"; current condition: <code>{_escape_html(cond)}</code>" if cond else ""
        pct_label = f"{done}/{total} samples ({pct:.1f}%){cond_txt}"

    return (
        "<style>@keyframes ffasr-indet{0%{background-position:200% 0}100%{background-position:-200% 0}}</style>"
        "<div style='padding:0.25rem 0'>"
        f"<p style='margin:0 0 0.4rem 0'><strong>Running:</strong> "
        f"<code>{_escape_html(model)}</code> "
        f"(family <code>{_escape_html(fam)}</code>, job <code>{_escape_html(job_label)}</code>): {pct_label}</p>"
        f"{remote_extra}"
        "<div style='width:100%;background:#e6e6e6;border:1px solid #d0d0d0;border-radius:6px;"
        "overflow:hidden;height:14px'>"
        f"{inner}"
        "</div></div>"
    )


def status_html(*, start_worker: bool = True) -> str:
    """Short HTML snippet for the Submit tab (queue + current runner + recent activity)."""
    if start_worker:
        try:
            _ensure_worker()
        except Exception as e:
            return (
                "<div class='queue-status'><p style='color:orange'>"
                f"<strong>Queue unavailable:</strong> {_escape_html(str(e))}</p></div>"
            )
    active = _list_active_eval_jobs()
    with _jobs_lock:
        waiting = _work_queue.qsize()
        pending_mod = sum(1 for j in _jobs.values() if j.status == JobStatus.pending_moderation)
        # Do not call _count_remote_in_flight() while holding _jobs_lock; that helper
        # also acquires the lock and would deadlock Gradio callbacks/timers.
        in_flight = sum(1 for j in _jobs.values() if j.status in _remote_in_flight_statuses())

        if len(active) == 0:
            run_line = "<p><strong>Running:</strong> none</p>"
        elif len(active) == 1:
            running = active[0]
            done = int(running.progress_done or 0)
            total = int(running.progress_total or 0)
            progress_txt = (
                f"; progress <strong>{done}/{total}</strong> ({(100.0 * done / total):.1f}%)"
                if total > 0
                else "; preparing…"
            )
            run_line = (
                f"<p><strong>Running:</strong> <code>{running.model_id}</code> "
                f"(family: <code>{running.family_id}</code>, job <code>{running.id}</code>)"
                f"{progress_txt}</p>"
            )
        else:
            max_n = remote_max_concurrent_jobs()
            models = ", ".join(f"<code>{_escape_html(j.model_id)}</code>" for j in active[:4])
            if len(active) > 4:
                models += f" … (+{len(active) - 4} more)"
            run_line = (
                f"<p><strong>Running:</strong> {len(active)} evaluations "
                f"({in_flight} on Hub Jobs, max {max_n} parallel): {models}</p>"
            )
        wait_line = f"<p><strong>Waiting to run (approved queue):</strong> {waiting}</p>"
        mod_line = ""
        if moderation_active():
            mod_line = (
                f"<p><strong>Awaiting moderator approval:</strong> {pending_mod}</p>"
                "<p style='font-size:0.9em;opacity:0.85'>New submissions stay pending until approved on the <strong>Moderate</strong> tab.</p>"
            )
        elif MODERATION_ENABLED and not MODERATOR_SECRET:
            mod_line = (
                "<p style='color:orange'><strong>Moderation misconfigured:</strong> "
                "set secret <code>FFASR_MODERATOR_SECRET</code> in Space settings.</p>"
            )
        max_n = remote_max_concurrent_jobs()
        hint = (
            "<p style='font-size:0.9em;opacity:0.85'>Evaluations run as "
            "<strong>Hugging Face Hub Jobs</strong> "
            "(<code>FFASR_REMOTE_JOBS=1</code>) with results written to the bucket. "
            "Set Space secrets <code>token_for_ffasr_jobs</code> (Jobs billing) and "
            "<code>HF_TOKEN</code> (bucket). Up to "
            f"<strong>{max_n}</strong> models evaluate in parallel "
            "(<code>FFASR_REMOTE_MAX_CONCURRENT_JOBS</code>). The Space does not run ASR locally.</p>"
        )
    recent = recent_jobs_html(20)
    return f"<div class='queue-status'>{run_line}{wait_line}{mod_line}{hint}{recent}</div>"


def peek_job(job_id: str) -> Job | None:
    try:
        _ensure_jobs_loaded_for_display()
    except Exception:
        pass
    with _jobs_lock:
        return _jobs.get(job_id)