Spaces:

build-small-hackathon
/

hackathon-advisor

Running on Zero

App Files Files Community

JacobLinCool committed on Jun 8

Commit

4791c0a

verified ·

1 Parent(s): 1ec322d

feat: add live project atlas

Browse files

Sync GitHub commit 76e4930 with atlas dashboard, MiniCPM quest LoRA, refresh APIs, and tests.

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

.gitattributes +1 -0
README.md +49 -10
app.py +251 -3
artifacts/quest-lora/README.md +44 -0
artifacts/quest-lora/adapter_config.json +48 -0
artifacts/quest-lora/adapter_model.safetensors +3 -0
artifacts/quest-lora/chat_template.jinja +179 -0
artifacts/quest-lora/self-eval.json +66 -0
artifacts/quest-lora/special_tokens_map.json +30 -0
artifacts/quest-lora/tokenizer.json +0 -0
artifacts/quest-lora/tokenizer_config.json +4099 -0
artifacts/quest-lora/training-recipe.json +23 -0
data/quest_corpus.json +0 -0
data/quest_dataset_card.md +83 -0
data/quest_label_input.json +0 -0
data/quest_labels/in/AI-Puppet-Theater.json +14 -0
data/quest_labels/in/AI-agent-Evaluation-pipeline.json +17 -0
data/quest_labels/in/Advent_of_a_World_of_Flowering_Trees.json +14 -0
data/quest_labels/in/Backyard-Demo-Builder.json +24 -0
data/quest_labels/in/Case-Lantern.json +16 -0
data/quest_labels/in/CodeFlow.json +14 -0
data/quest_labels/in/ContextForge.json +14 -0
data/quest_labels/in/Council-of-Tiny-Minds.json +14 -0
data/quest_labels/in/Darwin-35B-A3B-Opus.json +15 -0
data/quest_labels/in/Family-Bill-Assistant.json +14 -0
data/quest_labels/in/First-Principle-AI.json +21 -0
data/quest_labels/in/GRM-2.6-Opus.json +14 -0
data/quest_labels/in/GTROX.json +14 -0
data/quest_labels/in/InContext.json +14 -0
data/quest_labels/in/Kasualdad_LFED.json +19 -0
data/quest_labels/in/Kintsugi-Garden.json +14 -0
data/quest_labels/in/LocalDuo.json +14 -0
data/quest_labels/in/Mediassist.json +14 -0
data/quest_labels/in/NEXUS-Visual-Weaver.json +14 -0
data/quest_labels/in/PocketWorld-Studio.json +14 -0
data/quest_labels/in/Retail-Insight-AI.json +14 -0
data/quest_labels/in/SlideAI.json +14 -0
data/quest_labels/in/Sprout-And-Spoon.json +14 -0
data/quest_labels/in/Structured-Data-Rescuer.json +14 -0
data/quest_labels/in/The-Shrine.json +14 -0
data/quest_labels/in/Tone-Bridge.json +25 -0
data/quest_labels/in/Trollsona.json +14 -0
data/quest_labels/in/VoiceGate.json +14 -0
data/quest_labels/in/WitGym.json +14 -0
data/quest_labels/in/Yui-home-assistant.json +14 -0
data/quest_labels/in/ai-study-buddy.json +14 -0
data/quest_labels/in/amnesiac.json +14 -0
data/quest_labels/in/attention-firewall.json +14 -0
data/quest_labels/in/awaaz.json +17 -0
data/quest_labels/in/backyard-raccoon-deterrent.json +17 -0

.gitattributes CHANGED Viewed

@@ -1,3 +1,4 @@
 # Auto detect text files and perform LF normalization
 * text=auto
 static/assets/parchment.png filter=lfs diff=lfs merge=lfs -text

 # Auto detect text files and perform LF normalization
 * text=auto
+artifacts/quest-lora/adapter_model.safetensors filter=lfs diff=lfs merge=lfs -text
 static/assets/parchment.png filter=lfs diff=lfs merge=lfs -text

README.md CHANGED Viewed

@@ -22,17 +22,18 @@ tags:
 # Hackathon Advisor
 **Hackathon Advisor** is a text-first project advisor for the Build Small Hackathon. The user-facing experience is
-**The Unwritten Almanac**: a journal-style workspace that compares your idea against real Spaces in the
-`build-small-hackathon` organization, finds under-explored territory, scores the idea, and drafts a practical build plan.
 The current milestone is a deployed ZeroGPU + MiniCPM5 LoRA advisor:
 - Local snapshot of public `build-small-hackathon` Spaces.
 - Modal-built EmbeddingGemma GGUF retrieval index, with runtime query embeddings computed through llama.cpp.
 - Nemotron Speech Streaming voice input through NVIDIA NeMo ASR on ZeroGPU.
 - Jargon correction for hackathon/model terms.
-- MiniCPM5 tool-call planning with a published PEFT LoRA adapter, plus deterministic local rules for tests and CPU-only
-  development.
 - One-turn advisor loop with overlap citations, whitespace suggestions, scoring, and plans.
 - Custom `gradio.Server` frontend focused on the builder's idea workflow, with submission evidence kept in API exports.
@@ -44,10 +45,19 @@ See [DESIGN.md](DESIGN.md) for the full product and model plan.
 python3.11 -m venv .venv
 . .venv/bin/activate
 pip install -r requirements.txt
 python app.py
 ```
-Then open <http://127.0.0.1:7860>.
 ## Refresh The Project Snapshot
@@ -64,6 +74,25 @@ app file as the highest-signal project evidence for embedding. The canonical ind
 `ggml-org/embeddinggemma-300m-qat-q8_0-GGUF` through llama.cpp; runtime search embeds the user query with the same GGUF
 model and performs local cosine search over the checked-in vectors.
 ## Trace Artifact
 The app exposes a `trace_artifact` Gradio API endpoint for submission evidence and debugging. It emits a manifest row
@@ -188,18 +217,28 @@ ADVISOR_MODEL_BACKEND=minicpm-transformers
 ADVISOR_MODEL_ID=openbmb/MiniCPM5-1B
 ADVISOR_ADAPTER_ID=build-small-hackathon/hackathon-advisor-minicpm5-lora
 ADVISOR_ADAPTER_REVISION=25de69bcde397e1bcdd852923b56a42f10222650
 ADVISOR_EMBEDDING_MODEL_REPO=ggml-org/embeddinggemma-300m-qat-q8_0-GGUF
 ADVISOR_EMBEDDING_MODEL_FILE=embeddinggemma-300m-qat-Q8_0.gguf
 ADVISOR_ASR_MODEL_ID=nvidia/nemotron-speech-streaming-en-0.6b
 ```
 `agent_turn` wraps the engine call with `spaces.GPU` when `ADVISOR_ZERO_GPU=1`, so model loading and generation run on
-the ZeroGPU allocation. The retrieval query embedder downloads the GGUF model through `huggingface_hub` unless
 `ADVISOR_EMBEDDING_MODEL_PATH` points to a local file. `/api/transcribe` uses the same ZeroGPU wrapper for Nemotron ASR.
-On macOS local runs with `ADVISOR_MODEL_BACKEND=minicpm-transformers`, the app automatically runs llama.cpp query
-embedding in a worker process so the MiniCPM PyTorch runtime and llama.cpp do not load conflicting OpenMP runtimes in
-the same Python process.
-Local tests and CPU-only development still default to `ADVISOR_MODEL_BACKEND=rules`.
 ## Test

 # Hackathon Advisor
 **Hackathon Advisor** is a text-first project advisor for the Build Small Hackathon. The user-facing experience is
+an atlas-first dashboard plus **The Unwritten Almanac**: the first screen maps real Spaces in the
+`build-small-hackathon` organization, while the advisor workspace compares your idea against that map, finds
+under-explored territory, scores the idea, and drafts a practical build plan.
 The current milestone is a deployed ZeroGPU + MiniCPM5 LoRA advisor:
 - Local snapshot of public `build-small-hackathon` Spaces.
 - Modal-built EmbeddingGemma GGUF retrieval index, with runtime query embeddings computed through llama.cpp.
+- Full-screen t-SNE project atlas with clusters, nearest-neighbor links, quest coverage, and live refresh state.
 - Nemotron Speech Streaming voice input through NVIDIA NeMo ASR on ZeroGPU.
 - Jargon correction for hackathon/model terms.
+- MiniCPM5 tool-call planning with a published PEFT LoRA adapter.
 - One-turn advisor loop with overlap citations, whitespace suggestions, scoring, and plans.
 - Custom `gradio.Server` frontend focused on the builder's idea workflow, with submission evidence kept in API exports.
 python3.11 -m venv .venv
 . .venv/bin/activate
 pip install -r requirements.txt
+mkdir -p .cache/advisor-dashboard
+ADVISOR_CACHE_DIR=.cache/advisor-dashboard \
+ADVISOR_MODEL_BACKEND=minicpm-transformers \
+ADVISOR_MODEL_ID=openbmb/MiniCPM5-1B \
+ADVISOR_ADAPTER_ID=build-small-hackathon/hackathon-advisor-minicpm5-lora \
+ADVISOR_ADAPTER_REVISION=25de69bcde397e1bcdd852923b56a42f10222650 \
+ADVISOR_QUEST_ANALYZER_BACKEND=minicpm-transformers \
 python app.py
 ```
+Then open <http://127.0.0.1:7860>. The atlas refresh button runs locally with the same artifact swap path used in
+deployment. It writes refreshed runs under `.cache/advisor-dashboard/runs/` and atomically updates
+`.cache/advisor-dashboard/latest.json`.
 ## Refresh The Project Snapshot
 `ggml-org/embeddinggemma-300m-qat-q8_0-GGUF` through llama.cpp; runtime search embeds the user query with the same GGUF
 model and performs local cosine search over the checked-in vectors.
+## Live Project Atlas
+`/api/dashboard` exposes the first-screen atlas payload: t-SNE coordinates, KMeans clusters, nearest-neighbor links,
+quest coverage, provenance, and refresh status. The browser renders this as the default full-screen view; `#advisor`
+opens the existing idea workflow.
+`POST /api/dashboard/refresh` starts one background refresh job. The job snapshots public Spaces, rebuilds the GGUF
+embedding index, runs strict JSON MiniCPM quest analysis, creates the atlas, persists the validated artifacts, and only
+then swaps the live app to the new dashboard. `GET /api/dashboard/refresh` polls status.
+Live refresh requires a writable dashboard cache directory at `ADVISOR_CACHE_DIR`. On Hugging Face Spaces this should be
+a mounted Storage Bucket; locally it can be a normal directory such as `.cache/advisor-dashboard`. The job writes
+`runs/{run_id}/projects.json`, `project_index.json`, `dashboard.json`, and `manifest.json`, then atomically updates
+`latest.json`. If the cache directory is missing, not writable, or quest analysis fails validation, refresh fails and the
+current validated dashboard stays active.
+Set `ADVISOR_QUEST_ANALYZER_BACKEND=minicpm-transformers` for both local and deployed refresh runs. The local dashboard
+uses the same MiniCPM analyzer as the deployed Space; test doubles are only used inside pytest.
 ## Trace Artifact
 The app exposes a `trace_artifact` Gradio API endpoint for submission evidence and debugging. It emits a manifest row
 ADVISOR_MODEL_ID=openbmb/MiniCPM5-1B
 ADVISOR_ADAPTER_ID=build-small-hackathon/hackathon-advisor-minicpm5-lora
 ADVISOR_ADAPTER_REVISION=25de69bcde397e1bcdd852923b56a42f10222650
+ADVISOR_QUEST_ANALYZER_BACKEND=minicpm-transformers
+ADVISOR_QUEST_ADAPTER_ID=artifacts/quest-lora
+ADVISOR_CACHE_DIR=/data/advisor-cache
 ADVISOR_EMBEDDING_MODEL_REPO=ggml-org/embeddinggemma-300m-qat-q8_0-GGUF
 ADVISOR_EMBEDDING_MODEL_FILE=embeddinggemma-300m-qat-Q8_0.gguf
 ADVISOR_ASR_MODEL_ID=nvidia/nemotron-speech-streaming-en-0.6b
 ```
 `agent_turn` wraps the engine call with `spaces.GPU` when `ADVISOR_ZERO_GPU=1`, so model loading and generation run on
+the ZeroGPU allocation. MiniCPM loading follows the official demo shape: tokenizer uses
+`AutoTokenizer.from_pretrained(..., trust_remote_code=True)`, CUDA/ZeroGPU model loading uses
+`AutoModelForCausalLM.from_pretrained(..., torch_dtype=torch.bfloat16, trust_remote_code=True).to("cuda")`, and prompts
+are rendered with `apply_chat_template(..., tokenize=False, add_generation_prompt=True, enable_thinking=False)` before
+tokenization. Generation follows the demo policy: temperature `> 0` uses `temperature=0.9`, `top_p=0.95`, and
+`do_sample=True`; temperature `0` uses `do_sample=False`. The advisor tool planner uses temperature `0` for stable XML
+tool calls, and dashboard quest analysis also uses temperature `0` so the MiniCPM LoRA emits strict JSON deterministically.
+The retrieval query embedder downloads the GGUF model through `huggingface_hub` unless
 `ADVISOR_EMBEDDING_MODEL_PATH` points to a local file. `/api/transcribe` uses the same ZeroGPU wrapper for Nemotron ASR.
+On macOS local runs, the app automatically runs llama.cpp query embedding in a worker process so the MiniCPM PyTorch
+runtime and llama.cpp do not load conflicting OpenMP runtimes in the same Python process. Dashboard refresh also builds
+the GGUF embedding index in a subprocess before returning to the app process for MiniCPM quest analysis.
 ## Test

app.py CHANGED Viewed

@@ -1,10 +1,15 @@
 from __future__ import annotations
 import json
 import os
 from pathlib import Path
 import tempfile
 from typing import Any, Iterator
 from fastapi import Body, File, HTTPException, UploadFile
 from fastapi.responses import FileResponse, HTMLResponse, JSONResponse, Response, StreamingResponse
@@ -14,7 +19,15 @@ from hackathon_advisor.agent import AdvisorEngine
 from hackathon_advisor.artifact_bundle import BUNDLE_FILENAME, build_demo_bundle_zip
 from hackathon_advisor.asr_runtime import create_asr_transcriber
 from hackathon_advisor.chapter import build_chapter_markdown
-from hackathon_advisor.data import ProjectIndex
 from hackathon_advisor.demo_rehearsal import build_demo_rehearsal
 from hackathon_advisor.model_runtime import create_tool_planner
 from hackathon_advisor.profiling import (
@@ -27,6 +40,7 @@ from hackathon_advisor.lora_dataset import build_lora_dataset_jsonl
 from hackathon_advisor.lora_training_kit import TRAINING_KIT_FILENAME, build_lora_training_kit_zip
 from hackathon_advisor.png_export import artifact_png_filename, render_artifact_png
 from hackathon_advisor.prize_ledger import prize_ledger
 from hackathon_advisor.runtime_hooks import install_asyncio_cleanup_hook
 from hackathon_advisor.submission_packet import build_submission_packet_markdown
 from hackathon_advisor.tool_contracts import resolve_tool_call, tool_schemas
@@ -45,16 +59,49 @@ INDEX_PATH = ROOT / "data" / "project_index.json"
 PROFILE_FIELDS = ["skills", "time", "preferences", "constraints"]
 MAX_AUDIO_UPLOAD_BYTES = 25 * 1024 * 1024
 AUDIO_UPLOAD_SUFFIXES = {".aac", ".aif", ".aiff", ".flac", ".m4a", ".mp3", ".oga", ".ogg", ".opus", ".wav", ".webm"}
-index = ProjectIndex.from_files(DATA_PATH, INDEX_PATH)
 # Acceleration is automatic: on a ZeroGPU Space the GPU path uses accelerate device_map inside
 # the @spaces.GPU fork; locally the device resolves CUDA -> Apple MPS -> CPU. CPU is only used
 # as an explicit override or a quota fallback.
-engine = AdvisorEngine(index, create_tool_planner(device="auto" if zero_gpu_enabled() else "local"))
 voice_transcriber = create_asr_transcriber()
 app = Server()
 _cpu_engine: AdvisorEngine | None = None
 def _json_event(payload: dict) -> str:
@@ -81,6 +128,185 @@ def _transcribe_voice(audio_path: str) -> dict[str, Any]:
     return voice_transcriber.transcribe(Path(audio_path)).to_dict()
 def _session_from_json(session_json: str = "{}") -> dict[str, Any]:
     try:
         session = json.loads(session_json or "{}")
@@ -174,6 +400,28 @@ def static_file(path: str) -> FileResponse:
     return FileResponse(target)
 @app.get("/health")
 def health() -> dict:
     return {

 from __future__ import annotations
+from datetime import datetime, timezone
 import json
 import os
 from pathlib import Path
+import subprocess
+import sys
 import tempfile
+from threading import Lock, Thread
 from typing import Any, Iterator
+from uuid import uuid4
 from fastapi import Body, File, HTTPException, UploadFile
 from fastapi.responses import FileResponse, HTMLResponse, JSONResponse, Response, StreamingResponse
 from hackathon_advisor.artifact_bundle import BUNDLE_FILENAME, build_demo_bundle_zip
 from hackathon_advisor.asr_runtime import create_asr_transcriber
 from hackathon_advisor.chapter import build_chapter_markdown
+from hackathon_advisor.dashboard import build_dashboard_payload
+from hackathon_advisor.dashboard_storage import (
+    DashboardStorageError,
+    cache_dir_from_env,
+    load_latest_artifacts,
+    persist_refresh_artifacts,
+    require_writable_cache_dir,
+)
+from hackathon_advisor.data import DEFAULT_EMBEDDING_MODEL_FILE, DEFAULT_EMBEDDING_MODEL_REPO, Project, ProjectIndex
 from hackathon_advisor.demo_rehearsal import build_demo_rehearsal
 from hackathon_advisor.model_runtime import create_tool_planner
 from hackathon_advisor.profiling import (
 from hackathon_advisor.lora_training_kit import TRAINING_KIT_FILENAME, build_lora_training_kit_zip
 from hackathon_advisor.png_export import artifact_png_filename, render_artifact_png
 from hackathon_advisor.prize_ledger import prize_ledger
+from hackathon_advisor.quest_analysis import create_quest_analyzer, validate_matches_by_project
 from hackathon_advisor.runtime_hooks import install_asyncio_cleanup_hook
 from hackathon_advisor.submission_packet import build_submission_packet_markdown
 from hackathon_advisor.tool_contracts import resolve_tool_call, tool_schemas
 PROFILE_FIELDS = ["skills", "time", "preferences", "constraints"]
 MAX_AUDIO_UPLOAD_BYTES = 25 * 1024 * 1024
 AUDIO_UPLOAD_SUFFIXES = {".aac", ".aif", ".aiff", ".flac", ".m4a", ".mp3", ".oga", ".ogg", ".opus", ".wav", ".webm"}
+DEFAULT_HF_ORG = "build-small-hackathon"
+REFRESH_STAGE_LABELS = {
+    "crawling": "Fetching public Spaces",
+    "embedding": "Rebuilding the embedding index",
+    "quest_analysis": "Classifying quest coverage",
+    "atlas": "Projecting the atlas",
+    "persisting": "Writing dashboard artifacts",
+    "swapping": "Activating the latest dashboard",
+}
+_runtime_lock = Lock()
+_refresh_lock = Lock()
+def _load_initial_runtime() -> tuple[ProjectIndex, dict[str, Any]]:
+    artifacts = load_latest_artifacts(cache_dir_from_env())
+    if artifacts is not None:
+        loaded_index = ProjectIndex.from_files(artifacts.projects_path, artifacts.index_path)
+        return loaded_index, artifacts.dashboard
+    loaded_index = ProjectIndex.from_files(DATA_PATH, INDEX_PATH)
+    return loaded_index, build_dashboard_payload(loaded_index)
+index, dashboard_payload = _load_initial_runtime()
 # Acceleration is automatic: on a ZeroGPU Space the GPU path uses accelerate device_map inside
 # the @spaces.GPU fork; locally the device resolves CUDA -> Apple MPS -> CPU. CPU is only used
 # as an explicit override or a quota fallback.
+engine = AdvisorEngine(index, create_tool_planner(device="cuda" if zero_gpu_enabled() else "local"))
 voice_transcriber = create_asr_transcriber()
 app = Server()
 _cpu_engine: AdvisorEngine | None = None
+_refresh_state: dict[str, Any] = {
+    "status": "idle",
+    "run_id": "",
+    "stage": "",
+    "stage_label": "",
+    "started_at": "",
+    "finished_at": "",
+    "error": "",
+    "result": None,
+}
 def _json_event(payload: dict) -> str:
     return voice_transcriber.transcribe(Path(audio_path)).to_dict()
+@gpu_task
+def _analyze_dashboard_quests(project_rows: list[dict[str, Any]]) -> dict[str, Any]:
+    missing_evidence_keys = [
+        str(item.get("id") or index)
+        for index, item in enumerate(project_rows)
+        if "readme_body" not in item or "app_file_source" not in item
+    ]
+    if missing_evidence_keys:
+        raise RuntimeError(
+            "dashboard quest analysis requires refresh snapshots with readme_body and app_file_source; "
+            f"missing evidence keys for {len(missing_evidence_keys)} projects"
+        )
+    projects = [Project.from_dict(item) for item in project_rows]
+    analyzer = create_quest_analyzer(device="cuda" if zero_gpu_enabled() else "local")
+    matches = analyzer.analyze(projects)
+    source = getattr(analyzer, "source", "quest-analyzer")
+    validated = validate_matches_by_project(matches, projects, source=source)
+    return {
+        "source": validated.source,
+        "matches_by_project": validated.matches_by_project,
+    }
+def _refresh_public_state() -> dict[str, Any]:
+    with _refresh_lock:
+        return dict(_refresh_state)
+def _set_refresh_state(**updates: Any) -> None:
+    with _refresh_lock:
+        _refresh_state.update(updates)
+        stage = str(_refresh_state.get("stage") or "")
+        _refresh_state["stage_label"] = REFRESH_STAGE_LABELS.get(stage, "")
+def _start_refresh_thread(cache_dir: Path) -> dict[str, Any]:
+    with _refresh_lock:
+        if _refresh_state.get("status") == "running":
+            raise HTTPException(status_code=409, detail="Dashboard refresh is already running.")
+        run_id = datetime.now(timezone.utc).strftime("%Y%m%dT%H%M%SZ") + "-" + uuid4().hex[:8]
+        _refresh_state.update(
+            {
+                "status": "running",
+                "run_id": run_id,
+                "stage": "crawling",
+                "stage_label": REFRESH_STAGE_LABELS["crawling"],
+                "started_at": datetime.now(timezone.utc).isoformat(timespec="seconds"),
+                "finished_at": "",
+                "error": "",
+                "result": None,
+            }
+        )
+    thread = Thread(target=_run_refresh_job, args=(run_id, cache_dir), daemon=True)
+    thread.start()
+    return _refresh_public_state()
+def _run_refresh_job(run_id: str, cache_dir: Path) -> None:
+    try:
+        projects_payload, index_payload, refreshed_dashboard = _build_refresh_payloads(run_id)
+        _set_refresh_state(stage="persisting")
+        artifacts = persist_refresh_artifacts(
+            cache_dir,
+            run_id,
+            projects_payload=projects_payload,
+            index_payload=index_payload,
+            dashboard_payload=refreshed_dashboard,
+        )
+        _set_refresh_state(stage="swapping")
+        _replace_runtime_from_files(artifacts.projects_path, artifacts.index_path, artifacts.dashboard)
+        _set_refresh_state(
+            status="succeeded",
+            stage="",
+            finished_at=datetime.now(timezone.utc).isoformat(timespec="seconds"),
+            result={
+                "run_id": run_id,
+                "project_count": refreshed_dashboard["project_count"],
+                "snapshot_digest": refreshed_dashboard["provenance"]["snapshot_digest"],
+                "dashboard_generated_at": refreshed_dashboard["generated_at"],
+            },
+        )
+    except Exception as error:  # noqa: BLE001 - background job must report every failure as state
+        _set_refresh_state(
+            status="failed",
+            stage="",
+            finished_at=datetime.now(timezone.utc).isoformat(timespec="seconds"),
+            error=str(error),
+            result=None,
+        )
+def _build_refresh_payloads(run_id: str) -> tuple[dict[str, Any], dict[str, Any], dict[str, Any]]:
+    from scripts.crawl_hf_spaces import API, crawl_projects
+    org = os.environ.get("ADVISOR_HF_ORG", DEFAULT_HF_ORG).strip() or DEFAULT_HF_ORG
+    _set_refresh_state(stage="crawling")
+    project_rows = sorted(crawl_projects(org), key=lambda project: project["id"].lower())
+    projects_payload = {
+        "generated_at": datetime.now(timezone.utc).isoformat(timespec="seconds"),
+        "source": f"{API}/spaces?author={org}",
+        "projects": project_rows,
+    }
+    _set_refresh_state(stage="embedding")
+    with tempfile.TemporaryDirectory(prefix="advisor-refresh-") as directory:
+        project_path = Path(directory) / "projects.json"
+        project_path.write_text(json.dumps(projects_payload, ensure_ascii=False), encoding="utf-8")
+        index_payload = _build_refresh_index_payload(project_path, Path(directory) / "project_index.json")
+    projects = [Project.from_dict(item) for item in projects_payload["projects"]]
+    refreshed_index = ProjectIndex(
+        projects=projects,
+        generated_at=str(projects_payload["generated_at"]),
+        source=str(projects_payload["source"]),
+        index_payload=index_payload,
+    )
+    _set_refresh_state(stage="quest_analysis")
+    quest_analysis = _analyze_dashboard_quests([project.to_refresh_snapshot_dict() for project in projects])
+    _set_refresh_state(stage="atlas")
+    refreshed_dashboard = build_dashboard_payload(
+        refreshed_index,
+        quest_matches=quest_analysis["matches_by_project"],
+        quest_source=str(quest_analysis["source"]),
+    )
+    return projects_payload, index_payload, refreshed_dashboard
+def _build_refresh_index_payload(project_path: Path, index_path: Path) -> dict[str, Any]:
+    command = [
+        sys.executable,
+        str(ROOT / "scripts" / "build_project_index.py"),
+        "--projects",
+        str(project_path),
+        "--out",
+        str(index_path),
+        "--model-repo",
+        os.environ.get("ADVISOR_EMBEDDING_MODEL_REPO", DEFAULT_EMBEDDING_MODEL_REPO),
+        "--model-file",
+        os.environ.get("ADVISOR_EMBEDDING_MODEL_FILE", DEFAULT_EMBEDDING_MODEL_FILE),
+        "--build-source",
+        "space dashboard refresh",
+        "--builder",
+        "app.py:/api/dashboard/refresh",
+    ]
+    model_path = os.environ.get("ADVISOR_EMBEDDING_MODEL_PATH", "").strip()
+    if model_path:
+        command.extend(["--model-path", model_path])
+    n_ctx = os.environ.get("ADVISOR_EMBEDDING_N_CTX", "").strip()
+    if n_ctx:
+        command.extend(["--n-ctx", n_ctx])
+    n_threads = os.environ.get("ADVISOR_EMBEDDING_THREADS", "").strip()
+    if n_threads:
+        command.extend(["--n-threads", n_threads])
+    completed = subprocess.run(command, cwd=ROOT, capture_output=True, text=True, check=False)
+    if completed.returncode != 0:
+        detail = "\n".join(part for part in (completed.stdout.strip(), completed.stderr.strip()) if part)
+        raise RuntimeError(f"refresh embedding index build failed with exit code {completed.returncode}: {detail}")
+    try:
+        payload = json.loads(index_path.read_text(encoding="utf-8"))
+    except (OSError, json.JSONDecodeError) as error:
+        raise RuntimeError(f"refresh embedding index build did not write valid JSON: {index_path}") from error
+    if not isinstance(payload, dict):
+        raise RuntimeError("refresh embedding index build returned a non-object JSON payload")
+    return payload
+def _replace_runtime_from_files(projects_path: Path, index_path: Path, refreshed_dashboard: dict[str, Any]) -> None:
+    global index, engine, _cpu_engine, dashboard_payload
+    new_index = ProjectIndex.from_files(projects_path, index_path)
+    with _runtime_lock:
+        index = new_index
+        engine = AdvisorEngine(new_index, engine.planner)
+        if _cpu_engine is not None:
+            _cpu_engine = AdvisorEngine(new_index, _cpu_engine.planner)
+        dashboard_payload = refreshed_dashboard
 def _session_from_json(session_json: str = "{}") -> dict[str, Any]:
     try:
         session = json.loads(session_json or "{}")
     return FileResponse(target)
+@app.get("/api/dashboard")
+def dashboard() -> dict:
+    with _runtime_lock:
+        payload = dict(dashboard_payload)
+    payload["refresh"] = _refresh_public_state()
+    return payload
+@app.post("/api/dashboard/refresh")
+def dashboard_refresh_start() -> JSONResponse:
+    try:
+        cache_dir = require_writable_cache_dir()
+    except DashboardStorageError as error:
+        raise HTTPException(status_code=400, detail=str(error)) from error
+    return JSONResponse(_start_refresh_thread(cache_dir), status_code=202)
+@app.get("/api/dashboard/refresh")
+def dashboard_refresh_status() -> dict:
+    return _refresh_public_state()
 @app.get("/health")
 def health() -> dict:
     return {

artifacts/quest-lora/README.md ADDED Viewed

	@@ -0,0 +1,44 @@

+---
+base_model: openbmb/MiniCPM5-1B
+library_name: peft
+datasets:
+- build-small-hackathon/hackathon-advisor-quest-dataset
+tags:
+- lora
+- hackathon-advisor
+- quest-classification
+license: apache-2.0
+---
+# Hackathon Advisor — Quest Classification LoRA (MiniCPM5-1B)
+PEFT LoRA adapter that classifies a Build Small Hackathon project against 13 judging
+dimensions (6 merit badges + 2 tracks + 5 sponsor/special awards) from a two-segment
+README + app-file prompt, emitting strict JSON:
+```json
+{"matches":[{"quest":"...","confidence":0.0,"evidence":"...","source":"readme|app_file"}]}
+```
+Load it in the deployed Space by setting `ADVISOR_QUEST_ADAPTER_ID` to this repo.
+The backend revalidates every dashboard refresh and will not swap on schema failure.
+## Recipe
+- Base model: `openbmb/MiniCPM5-1B`
+- Task: `hackathon_advisor_quest_classification`
+- Method: LoRA SFT (completion-only loss)
+- Examples: 146
+- Epochs: 6.0
+- LoRA rank/alpha/dropout: 16/32/0.05
+- Max seq length: 2560
+- GPU: A10G
+## Dataset
+[`build-small-hackathon/hackathon-advisor-quest-dataset`](https://huggingface.co/datasets/build-small-hackathon/hackathon-advisor-quest-dataset) — 156 chat-JSONL examples built from real `build-small-hackathon` Spaces: 108
+teacher-labelled and adversarially verified projects plus targeted augmentations (app-only,
+readme-only / missing app file, README↔app contradictions, empty matches, noisy
+metadata). All 13 quests covered.
+## Self-eval
+At training time, 10/10 held-out prompts produced schema-valid JSON.

artifacts/quest-lora/adapter_config.json ADDED Viewed

	@@ -0,0 +1,48 @@

+{
+  "alora_invocation_tokens": null,
+  "alpha_pattern": {},
+  "arrow_config": null,
+  "auto_mapping": null,
+  "base_model_name_or_path": "openbmb/MiniCPM5-1B",
+  "bias": "none",
+  "corda_config": null,
+  "ensure_weight_tying": false,
+  "eva_config": null,
+  "exclude_modules": null,
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "layer_replication": null,
+  "layers_pattern": null,
+  "layers_to_transform": null,
+  "loftq_config": {},
+  "lora_alpha": 32,
+  "lora_bias": false,
+  "lora_dropout": 0.05,
+  "lora_ga_config": null,
+  "megatron_config": null,
+  "megatron_core": "megatron.core",
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "peft_version": "0.19.1",
+  "qalora_group_size": 16,
+  "r": 16,
+  "rank_pattern": {},
+  "revision": null,
+  "target_modules": [
+    "gate_proj",
+    "v_proj",
+    "o_proj",
+    "k_proj",
+    "q_proj",
+    "up_proj",
+    "down_proj"
+  ],
+  "target_parameters": null,
+  "task_type": "CAUSAL_LM",
+  "trainable_token_indices": null,
+  "use_bdlora": null,
+  "use_dora": false,
+  "use_qalora": false,
+  "use_rslora": false
+}

artifacts/quest-lora/adapter_model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0480796afd6869ee00b6e35b839b48d99ee9270ef848c7901907d328c0629508
+size 44871152

artifacts/quest-lora/chat_template.jinja ADDED Viewed

	@@ -0,0 +1,179 @@

+{{- bos_token }}{%- if tools %}
+    {%- set tool_definitions %}
+        {{- "# Tools\n\nYou are provided with function signatures within <tools></tools> XML tags:\n<tools>" }}
+        {%- for tool in tools %}
+            {{- "\n" }}
+            {{- tool | tojson(ensure_ascii=False) }}
+        {%- endfor %}
+        {{- '\n</tools>\n\nTool usage guidelines:\n- You may call zero or more functions. If no function calls are needed, just answer normally and do not include any <function ... </function>.\n- When calling a function, return an XML object within <function ... </function> using:\n<function name="function-name"><param name="param-name">param-value</param></function>\n- param-value may be multi-line. If it contains <, & or newline characters, wrap it in a CDATA block: <param name="param-name"><![CDATA[...multi-line value...]]></param>' }}
+    {%- endset %}
+    {{- '<|im_start|>system\n' }}
+    {%- if messages[0].role == 'system' %}
+        {%- if '<tool_def_sep>' in messages[0].content %}
+            {{- messages[0].content.replace('<tool_def_sep>', tool_definitions) }}
+        {%- else %}
+            {{- messages[0].content + '\n\n' + tool_definitions }}
+        {%- endif %}
+    {%- else %}
+        {{- tool_definitions.lstrip() }}
+    {%- endif %}
+    {{- '<|im_end|>\n' }}
+{%- else %}
+    {%- if messages[0].role == 'system' %}
+        {{- '<|im_start|>system\n' + messages[0].content + '<|im_end|>\n' }}
+    {%- endif %}
+{%- endif %}
+{%- set ns = namespace(multi_step_tool=true, last_query_index=messages|length - 1) %}
+{%- for message in messages[::-1] %}
+    {%- set index = (messages|length - 1) - loop.index0 %}
+    {%- if ns.multi_step_tool and message.role == "user" and message.content is string and not(message.content.startswith('<tool_response>') and message.content.endswith('</tool_response>')) %}
+        {%- set ns.multi_step_tool = false %}
+        {%- set ns.last_query_index = index %}
+    {%- endif %}
+{%- endfor %}
+{#- Render every message in order as an <|im_start|>role ... <|im_end|> turn. #}
+{%- for message in messages %}
+    {#- Non-string content (for example a list or mapping) is treated as empty text for the user, system and assistant branches. #}
+    {%- if message.content is string %}
+        {%- set content = message.content %}
+    {%- else %}
+        {%- set content = '' %}
+    {%- endif %}
+    {#- User turns and any system message that is not the first message are emitted verbatim. #}
+    {%- if (message.role == "user") or (message.role == "system" and not loop.first) %}
+        {{- '<|im_start|>' + message.role + '\n' + content + '<|im_end|>' + '\n' }}
+    {%- elif message.role == "assistant" %}
+        {#- Reasoning text comes from message.reasoning_content when it is a string; otherwise it is cut out of a <think>...</think> span inside content, and content keeps only what follows </think>. #}
+        {%- set reasoning_content = '' %}
+        {%- if message.reasoning_content is string %}
+            {%- set reasoning_content = message.reasoning_content %}
+        {%- else %}
+            {%- if '</think>' in content %}
+                {%- set reasoning_content = content.split('</think>')[0].rstrip('\n').split('<think>')[-1].lstrip('\n') %}
+                {%- set content = content.split('</think>')[-1].lstrip('\n') %}
+            {%- endif %}
+        {%- endif %}
+        {#- Tool calls: content is split on <tool_sep>, and the code below builds XML for call k to place at the k-th separator, then XML for any calls left over. #}
+        {#- NOTE(review): Jinja scopes assignments made inside a for loop to that loop, so the processed_content updates in the two inner loops below look like they are discarded when each loop ends, leaving processed_content equal to content_parts[0] - confirm the intended output. #}
+        {%- if message.tool_calls %}
+            {%- set content_parts = content.split('<tool_sep>') %}
+            {%- set processed_content = content_parts[0] %}
+            {%- set tool_calls_count = message.tool_calls|length %}
+            {%- set tool_sep_count = content_parts|length - 1 %}
+            {#- NOTE(review): min_count is assigned here but not read anywhere in the visible template. #}
+            {%- set min_count = [tool_calls_count, tool_sep_count]|min %}
+            {%- for i in range(1, content_parts|length) %}
+                {%- set tool_index = i - 1 %}
+                {%- if tool_index < tool_calls_count %}
+                    {%- set tool_call = message.tool_calls[tool_index] %}
+                    {#- Accept both the wrapped form (tool_call.function) and the flat form with name and arguments directly on the call. #}
+                    {%- if tool_call.function %}
+                        {%- set tool_call = tool_call.function %}
+                    {%- endif %}
+                    {%- set single_tool_xml %}
+                        {{- '<function name="' ~ tool_call.name ~ '">' }}
+                        {%- if tool_call.arguments %}
+                            {#- arguments must expose .items(), i.e. be a mapping rather than a JSON string. #}
+                            {%- set args_dict = tool_call.arguments %}
+                            {%- for param_name, param_value in args_dict.items() %}
+                                {{- '<param name="' ~ param_name ~ '">' }}
+                                {#- String values containing <, & or a newline are wrapped in CDATA, matching the tool usage guidelines text. #}
+                                {%- if param_value is string and ('<' in param_value or '&' in param_value or '\n' in param_value) %}
+                                    {{- '<![CDATA[' + param_value + ']]>' }}
+                                {%- else %}
+                                    {{- param_value }}
+                                {%- endif %}
+                                {{- '</param>' }}
+                            {%- endfor %}
+                        {%- endif %}
+                        {{- '</function>' }}
+                    {%- endset %}
+                    {%- set processed_content = processed_content + single_tool_xml + content_parts[i] %}
+                {%- else %}
+                    {#- More separators than tool calls: keep the text segment and drop the separator. #}
+                    {%- set processed_content = processed_content + content_parts[i] %}
+                {%- endif %}
+            {%- endfor %}
+            {#- Tool calls without a matching separator are appended after the text. #}
+            {%- if tool_calls_count > tool_sep_count %}
+                {%- for remaining_index in range(tool_sep_count, tool_calls_count) %}
+                    {%- set tool_call = message.tool_calls[remaining_index] %}
+                    {%- if tool_call.function %}
+                        {%- set tool_call = tool_call.function %}
+                    {%- endif %}
+                    {%- set remaining_tool_xml %}
+                        {{- '<function name="' ~ tool_call.name ~ '">' }}
+                        {%- if tool_call.arguments %}
+                            {%- set args_dict = tool_call.arguments %}
+                            {%- for param_name, param_value in args_dict.items() %}
+                                {{- '<param name="' ~ param_name ~ '">' }}
+                                {%- if param_value is string and ('<' in param_value or '&' in param_value or '\n' in param_value) %}
+                                    {{- '<![CDATA[' + param_value + ']]>' }}
+                                {%- else %}
+                                    {{- param_value }}
+                                {%- endif %}
+                                {{- '</param>' }}
+                            {%- endfor %}
+                        {%- endif %}
+                        {{- '</function>' }}
+                    {%- endset %}
+                    {%- set processed_content = processed_content + remaining_tool_xml %}
+                {%- endfor %}
+            {%- endif %}
+            {%- set content = processed_content %}
+        {%- endif %}
+        {#- The <think> block is re-emitted only for assistant turns that come after the last genuine user query; earlier turns are rendered without their reasoning. #}
+        {%- if loop.index0 > ns.last_query_index %}
+            {%- if reasoning_content %}
+                {{- '<|im_start|>' + message.role + '\n<think>\n' + reasoning_content.strip('\n') + '\n</think>\n\n' + content.lstrip('\n') }}
+            {%- else %}
+                {{- '<|im_start|>' + message.role + '\n' + content }}
+            {%- endif %}
+        {%- else %}
+            {{- '<|im_start|>' + message.role + '\n' + content }}
+        {%- endif %}
+        {#- NOTE(review): has_tool_sep is not assigned anywhere in the visible part of this template. If it is undefined it tests falsy under Jinja's default Undefined, so this branch would run for every assistant message that has tool_calls - confirm whether it is set earlier in the file. #}
+        {%- if message.tool_calls and not has_tool_sep %}
+            {%- for tool_call in message.tool_calls %}
+                {#- Each call goes on its own line; the newline before the first call is skipped when there is no preceding text. #}
+                {%- if (loop.first and content) or (not loop.first) %}
+                    {{- '\n' }}
+                {%- endif %}
+                {%- if tool_call.function %}
+                    {%- set tool_call = tool_call.function %}
+                {%- endif %}
+                {{- '<function name="' ~ tool_call.name ~ '">' }}
+                {%- if tool_call.arguments %}
+                    {%- set args_dict = tool_call.arguments %}
+                    {%- for param_name, param_value in args_dict.items() %}
+                        {{- '<param name="' ~ param_name ~ '">' }}
+                        {%- if param_value is string and ('<' in param_value or '&' in param_value or '\n' in param_value) %}
+                            {{- '<![CDATA[' + param_value + ']]>' }}
+                        {%- else %}
+                            {{- param_value }}
+                        {%- endif %}
+                        {{- '</param>' }}
+                    {%- endfor %}
+                {%- endif %}
+                {{- '</function>' }}
+            {%- endfor %}
+        {%- endif %}
+        {{- '<|im_end|>\n' }}
+    {%- elif message.role == "tool" %}
+        {#- A run of consecutive tool messages is folded into one user turn: the header is opened on the first of the run and the turn is closed on the last. #}
+        {%- if loop.first or (messages[loop.index0 - 1].role != "tool") %}
+            {{- '<|im_start|>user' }}
+        {%- endif %}
+        {{- '\n<tool_response>\n' }}
+        {#- String results are emitted as-is; anything else is serialised as JSON without ASCII escaping. #}
+        {%- if message.content is string %}
+            {{- content }}
+        {%- else %}
+            {{- message.content | tojson(ensure_ascii=False) }}
+        {%- endif %}
+        {{- '\n</tool_response>' }}
+        {%- if loop.last or (messages[loop.index0 + 1].role != "tool") %}
+            {{- '<|im_end|>\n' }}
+        {%- endif %}
+    {%- endif %}
+{%- endfor %}
+{#- When a generation prompt is requested, open the assistant turn. #}
+{#- enable_thinking false: pre-fill an empty <think></think> block. enable_thinking true: open a <think> block and leave it unclosed. #}
+{#- enable_thinking undefined, or any other value: nothing is added after the assistant header. #}
+{%- if add_generation_prompt %}
+    {{- '<|im_start|>assistant\n' }}
+    {%- if enable_thinking is defined %}
+        {%- if enable_thinking is false %}
+            {{- '<think>\n\n</think>\n\n' }}
+        {%- elif enable_thinking is true %}
+            {{- '<think>\n' }}
+        {%- endif %}
+    {%- endif %}
+{%- endif %}

artifacts/quest-lora/self-eval.json ADDED Viewed

	@@ -0,0 +1,66 @@

+{
+  "valid": 10,
+  "total": 10,
+  "samples": [
+    {
+      "project_id": "build-small-hackathon/AI-Puppet-Theater",
+      "valid_json": true,
+      "detail": "",
+      "output": "{\"matches\":[{\"quest\":\"OpenBMB\",\"confidence\":0.97,\"evidence\":\"OpenBMB model id: openbmb/MiniCPM5-1B\",\"source\":\"app_file\"},{\"quest\":\"Tiny Titan\",\"confidence\":0.93,\"evidence\":\"openbmb/MiniCPM5-1B is a 1B model\",\"source\":\"app_file\"},{\"quest\":\"Off-Brand\",\"confidence\":0.9,\"evidence\":\"CUSTOM_CSS overrides .gradio-container background\",\"source\":\"app_file\"},{\"quest\":\"Thousand Token Wood\",\"confidence\":0.85,"
+    },
+    {
+      "project_id": "build-small-hackathon/neilA",
+      "valid_json": true,
+      "detail": "",
+      "output": "{\"matches\":[{\"quest\":\"Thousand Token Wood\",\"confidence\":0.97,\"evidence\":\"teach an alien that knows human words but has never lived a human life\",\"source\":\"readme\"},{\"quest\":\"Off-Brand\",\"confidence\":0.9,\"evidence\":\"plain-Python concept ledger injected into the prompt each turn\",\"source\":\"app_file\"},{\"quest\":\"Off the Grid\",\"confidence\":0.78,\"evidence\":\"Only inference runs inside @spaces.GPU; all sta"
+    },
+    {
+      "project_id": "build-small-hackathon/Trollsona",
+      "valid_json": true,
+      "detail": "",
+      "output": "{\"matches\":[{\"quest\":\"Thousand Token Wood\",\"confidence\":0.97,\"evidence\":\"Track: An Adventure in Thousand Token Wood; playful troll alter ego; goblin meter\",\"source\":\"readme\"},{\"quest\":\"Tiny Titan\",\"confidence\":0.95,\"evidence\":\"compact RthItalia model derived from Qwen/Qwen2.5-3B-Instruct; lightweight Qwen 0.5B model\",\"source\":\"readme\"},{\"quest\":\"Off the Grid\",\"confidence\":0.9,\"evidence\":\"Local Hug"
+    },
+    {
+      "project_id": "build-small-hackathon/hackathon-advisor",
+      "valid_json": true,
+      "detail": "",
+      "output": "{\"matches\":[{\"quest\":\"Llama Champion\",\"confidence\":0.97,\"evidence\":\"llama.cpp runtime, GGUF retrieval index, llama.cpp imports\",\"source\":\"readme\"},{\"quest\":\"Tiny Titan\",\"confidence\":0.93,\"evidence\":\"MiniCPM5 tool-call planning, published PEFT LoRA adapter\",\"source\":\"readme\"},{\"quest\":\"Off the Grid\",\"confidence\":0.9,\"evidence\":\"Local snapshot of public Spaces, Modal-built GGUF index, no cloud API\","
+    },
+    {
+      "project_id": "build-small-hackathon/wan2-2-fp8da-aoti-14B-fast",
+      "valid_json": true,
+      "detail": "",
+      "output": "{\"matches\":[{\"quest\":\"Off the Grid\",\"confidence\":0.7,\"evidence\":\"diffusers.pipelines.wan.pipeline_wan_i2v import WanImageToVideoPipeline\",\"source\":\"app_file\"},{\"quest\":\"Tiny Titan\",\"confidence\":0.6,\"evidence\":\"from train_log.RIFE_HDv3 import Model\",\"source\":\"app_file\"}]}"
+    },
+    {
+      "project_id": "build-small-hackathon/family-care-asr-eval",
+      "valid_json": true,
+      "detail": "",
+      "output": "{\"matches\":[{\"quest\":\"Well-Tuned\",\"confidence\":0.97,\"evidence\":\"teckedd/whisper_small-waxal_akan-asr-v1 fine-tune; GiftMark fallback\",\"source\":\"app_file\"},{\"quest\":\"Tiny Titan\",\"confidence\":0.97,\"evidence\":\"facebook/mms-1b-all (recommended): 1B parameter model\",\"source\":\"app_file\"},{\"quest\":\"Off the Grid\",\"confidence\":0.93,\"evidence\":\"Wav2Vec2ForCTC + WhisperForConditionalGeneration from transform"
+    },
+    {
+      "project_id": "build-small-hackathon/GRM-2.6-Opus",
+      "valid_json": true,
+      "detail": "",
+      "output": "{\"matches\":[{\"quest\":\"Off the Grid\",\"confidence\":0.97,\"evidence\":\"AutoModelForCausalLM.from_pretrained(MODEL_ID)... no cloud API client\",\"source\":\"app_file\"},{\"quest\":\"Tiny Titan\",\"confidence\":0.93,\"evidence\":\"OrionLLM/GRM-2.6-Opus (3.6B) model declared\",\"source\":\"app_file\"}]}"
+    },
+    {
+      "project_id": "build-small-hackathon/backyard-raccoon-deterrent",
+      "valid_json": true,
+      "detail": "",
+      "output": "{\"matches\":[{\"quest\":\"Backyard AI\",\"confidence\":0.97,\"evidence\":\"Ring camera sees raccoons; U.S. federal wildlife control killed over 375,000 native animals\",\"source\":\"readme\"},{\"quest\":\"Off the Grid\",\"confidence\":0.95,\"evidence\":\"runs fully offline: no cloud APIs; YOLO weights ship in the repo\",\"source\":\"app_file\"},{\"quest\":\"Well-Tuned\",\"confidence\":0.9,\"evidence\":\"Fine-tuned YOLOv8n raccoon dete"
+    },
+    {
+      "project_id": "build-small-hackathon/global-leaders",
+      "valid_json": true,
+      "detail": "",
+      "output": "{\"matches\":[{\"quest\":\"Nemotron\",\"confidence\":0.97,\"evidence\":\"Ollama Cloud (Nemotron) if OLLAMA_API_KEY is set\",\"source\":\"app_file\"},{\"quest\":\"Off-Brand\",\"confidence\":0.93,\"evidence\":\"Backend: Ollama Cloud (Nemotron) if OLLAMA_API_KEY is set\",\"source\":\"app_file\"}]}"
+    },
+    {
+      "project_id": "build-small-hackathon/The-Shrine",
+      "valid_json": true,
+      "detail": "",
+      "output": "{\"matches\":[{\"quest\":\"Off the Grid\",\"confidence\":0.97,\"evidence\":\"local monologue engine works offline\",\"source\":\"app_file\"},{\"quest\":\"Off-Brand\",\"confidence\":0.9,\"evidence\":\"Custom Canvas + vanilla JS (60+ monologue phrases)\",\"source\":\"readme\"},{\"quest\":\"Well-Tuned\",\"confidence\":0.85,\"evidence\":\"QwEN_MODEL = \\\"qwen-max\\\"\",\"source\":\"app_file\"}]}"
+    }
+  ]
+}

artifacts/quest-lora/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,30 @@

+{
+  "bos_token": {
+    "content": "<s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "<unk>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

artifacts/quest-lora/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

artifacts/quest-lora/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,4099 @@

+{
+  "add_bos_token": false,
+  "add_eos_token": false,
+  "add_prefix_space": null,
+  "added_tokens_decoder": {
+    "0": {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "<tool_call>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "3": {
+      "content": "</tool_call>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "4": {
+      "content": "<|im_sep|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "5": {
+      "content": "<|fim_prefix|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "6": {
+      "content": "<|fim_middle|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "7": {
+      "content": "<|fim_suffix|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "8": {
+      "content": "<think>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "9": {
+      "content": "</think>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "10": {
+      "content": "<tool_response>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "11": {
+      "content": "</tool_response>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "12": {
+      "content": "<tools>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "13": {
+      "content": "</tools>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "14": {
+      "content": "<arguments>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "15": {
+      "content": "</arguments>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "16": {
+      "content": "<parameters>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "17": {
+      "content": "</parameters>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "18": {
+      "content": "<function",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "19": {
+      "content": "</function>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "20": {
+      "content": "<param",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "21": {
+      "content": "</param>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "130072": {
+      "content": "<|im_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "130073": {
+      "content": "<|im_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "130074": {
+      "content": "<unk>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "130075": {
+      "content": "<|thought_begin|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "130076": {
+      "content": "<|thought_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "130077": {
+      "content": "<|tool_call|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "130078": {
+      "content": "<|execute_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "130079": {
+      "content": "<|execute_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "130080": {
+      "content": "/think",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "130081": {
+      "content": "/no_think",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "130082": {
+      "content": "<unused_token_0>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130083": {
+      "content": "<unused_token_1>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130084": {
+      "content": "<unused_token_2>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130085": {
+      "content": "<unused_token_3>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130086": {
+      "content": "<unused_token_4>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130087": {
+      "content": "<unused_token_5>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130088": {
+      "content": "<unused_token_6>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130089": {
+      "content": "<unused_token_7>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130090": {
+      "content": "<unused_token_8>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130091": {
+      "content": "<unused_token_9>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130092": {
+      "content": "<unused_token_10>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130093": {
+      "content": "<unused_token_11>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130094": {
+      "content": "<unused_token_12>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130095": {
+      "content": "<unused_token_13>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130096": {
+      "content": "<unused_token_14>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130097": {
+      "content": "<unused_token_15>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130098": {
+      "content": "<unused_token_16>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130099": {
+      "content": "<unused_token_17>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130100": {
+      "content": "<unused_token_18>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130101": {
+      "content": "<unused_token_19>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130102": {
+      "content": "<unused_token_20>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130103": {
+      "content": "<unused_token_21>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130104": {
+      "content": "<unused_token_22>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130105": {
+      "content": "<unused_token_23>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130106": {
+      "content": "<unused_token_24>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130107": {
+      "content": "<unused_token_25>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130108": {
+      "content": "<unused_token_26>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130109": {
+      "content": "<unused_token_27>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130110": {
+      "content": "<unused_token_28>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130111": {
+      "content": "<unused_token_29>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130112": {
+      "content": "<unused_token_30>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130113": {
+      "content": "<unused_token_31>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130114": {
+      "content": "<unused_token_32>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130115": {
+      "content": "<unused_token_33>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130116": {
+      "content": "<unused_token_34>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130117": {
+      "content": "<unused_token_35>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130118": {
+      "content": "<unused_token_36>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130119": {
+      "content": "<unused_token_37>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130120": {
+      "content": "<unused_token_38>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130121": {
+      "content": "<unused_token_39>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130122": {
+      "content": "<unused_token_40>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130123": {
+      "content": "<unused_token_41>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130124": {
+      "content": "<unused_token_42>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130125": {
+      "content": "<unused_token_43>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130126": {
+      "content": "<unused_token_44>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130127": {
+      "content": "<unused_token_45>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130128": {
+      "content": "<unused_token_46>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130129": {
+      "content": "<unused_token_47>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130130": {
+      "content": "<unused_token_48>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130131": {
+      "content": "<unused_token_49>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130132": {
+      "content": "<unused_token_50>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130133": {
+      "content": "<unused_token_51>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130134": {
+      "content": "<unused_token_52>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130135": {
+      "content": "<unused_token_53>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130136": {
+      "content": "<unused_token_54>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130137": {
+      "content": "<unused_token_55>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130138": {
+      "content": "<unused_token_56>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130139": {
+      "content": "<unused_token_57>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130140": {
+      "content": "<unused_token_58>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130141": {
+      "content": "<unused_token_59>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130142": {
+      "content": "<unused_token_60>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130143": {
+      "content": "<unused_token_61>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130144": {
+      "content": "<unused_token_62>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130145": {
+      "content": "<unused_token_63>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130146": {
+      "content": "<unused_token_64>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130147": {
+      "content": "<unused_token_65>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130148": {
+      "content": "<unused_token_66>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130149": {
+      "content": "<unused_token_67>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130150": {
+      "content": "<unused_token_68>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130151": {
+      "content": "<unused_token_69>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130152": {
+      "content": "<unused_token_70>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130153": {
+      "content": "<unused_token_71>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130154": {
+      "content": "<unused_token_72>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130155": {
+      "content": "<unused_token_73>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130156": {
+      "content": "<unused_token_74>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130157": {
+      "content": "<unused_token_75>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130158": {
+      "content": "<unused_token_76>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130159": {
+      "content": "<unused_token_77>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130160": {
+      "content": "<unused_token_78>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130161": {
+      "content": "<unused_token_79>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130162": {
+      "content": "<unused_token_80>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130163": {
+      "content": "<unused_token_81>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130164": {
+      "content": "<unused_token_82>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130165": {
+      "content": "<unused_token_83>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130166": {
+      "content": "<unused_token_84>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130167": {
+      "content": "<unused_token_85>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130168": {
+      "content": "<unused_token_86>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130169": {
+      "content": "<unused_token_87>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130170": {
+      "content": "<unused_token_88>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130171": {
+      "content": "<unused_token_89>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130172": {
+      "content": "<unused_token_90>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130173": {
+      "content": "<unused_token_91>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130174": {
+      "content": "<unused_token_92>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130175": {
+      "content": "<unused_token_93>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130176": {
+      "content": "<unused_token_94>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130177": {
+      "content": "<unused_token_95>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130178": {
+      "content": "<unused_token_96>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130179": {
+      "content": "<unused_token_97>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130180": {
+      "content": "<unused_token_98>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130181": {
+      "content": "<unused_token_99>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130182": {
+      "content": "<unused_token_100>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130183": {
+      "content": "<unused_token_101>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130184": {
+      "content": "<unused_token_102>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130185": {
+      "content": "<unused_token_103>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130186": {
+      "content": "<unused_token_104>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130187": {
+      "content": "<unused_token_105>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130188": {
+      "content": "<unused_token_106>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130189": {
+      "content": "<unused_token_107>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130190": {
+      "content": "<unused_token_108>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130191": {
+      "content": "<unused_token_109>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130192": {
+      "content": "<unused_token_110>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130193": {
+      "content": "<unused_token_111>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130194": {
+      "content": "<unused_token_112>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130195": {
+      "content": "<unused_token_113>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130196": {
+      "content": "<unused_token_114>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130197": {
+      "content": "<unused_token_115>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130198": {
+      "content": "<unused_token_116>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130199": {
+      "content": "<unused_token_117>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130200": {
+      "content": "<unused_token_118>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130201": {
+      "content": "<unused_token_119>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130202": {
+      "content": "<unused_token_120>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130203": {
+      "content": "<unused_token_121>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130204": {
+      "content": "<unused_token_122>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130205": {
+      "content": "<unused_token_123>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130206": {
+      "content": "<unused_token_124>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130207": {
+      "content": "<unused_token_125>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130208": {
+      "content": "<unused_token_126>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130209": {
+      "content": "<unused_token_127>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130210": {
+      "content": "<unused_token_128>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130211": {
+      "content": "<unused_token_129>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130212": {
+      "content": "<unused_token_130>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130213": {
+      "content": "<unused_token_131>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130214": {
+      "content": "<unused_token_132>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130215": {
+      "content": "<unused_token_133>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130216": {
+      "content": "<unused_token_134>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130217": {
+      "content": "<unused_token_135>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130218": {
+      "content": "<unused_token_136>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130219": {
+      "content": "<unused_token_137>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130220": {
+      "content": "<unused_token_138>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130221": {
+      "content": "<unused_token_139>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130222": {
+      "content": "<unused_token_140>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130223": {
+      "content": "<unused_token_141>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130224": {
+      "content": "<unused_token_142>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130225": {
+      "content": "<unused_token_143>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130226": {
+      "content": "<unused_token_144>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130227": {
+      "content": "<unused_token_145>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130228": {
+      "content": "<unused_token_146>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130229": {
+      "content": "<unused_token_147>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130230": {
+      "content": "<unused_token_148>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130231": {
+      "content": "<unused_token_149>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130232": {
+      "content": "<unused_token_150>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130233": {
+      "content": "<unused_token_151>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130234": {
+      "content": "<unused_token_152>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130235": {
+      "content": "<unused_token_153>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130236": {
+      "content": "<unused_token_154>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130237": {
+      "content": "<unused_token_155>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130238": {
+      "content": "<unused_token_156>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130239": {
+      "content": "<unused_token_157>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130240": {
+      "content": "<unused_token_158>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130241": {
+      "content": "<unused_token_159>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130242": {
+      "content": "<unused_token_160>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130243": {
+      "content": "<unused_token_161>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130244": {
+      "content": "<unused_token_162>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130245": {
+      "content": "<unused_token_163>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130246": {
+      "content": "<unused_token_164>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130247": {
+      "content": "<unused_token_165>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130248": {
+      "content": "<unused_token_166>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130249": {
+      "content": "<unused_token_167>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130250": {
+      "content": "<unused_token_168>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130251": {
+      "content": "<unused_token_169>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130252": {
+      "content": "<unused_token_170>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130253": {
+      "content": "<unused_token_171>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130254": {
+      "content": "<unused_token_172>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130255": {
+      "content": "<unused_token_173>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130256": {
+      "content": "<unused_token_174>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130257": {
+      "content": "<unused_token_175>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130258": {
+      "content": "<unused_token_176>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130259": {
+      "content": "<unused_token_177>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130260": {
+      "content": "<unused_token_178>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130261": {
+      "content": "<unused_token_179>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130262": {
+      "content": "<unused_token_180>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130263": {
+      "content": "<unused_token_181>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130264": {
+      "content": "<unused_token_182>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130265": {
+      "content": "<unused_token_183>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130266": {
+      "content": "<unused_token_184>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130267": {
+      "content": "<unused_token_185>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130268": {
+      "content": "<unused_token_186>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130269": {
+      "content": "<unused_token_187>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130270": {
+      "content": "<unused_token_188>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130271": {
+      "content": "<unused_token_189>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130272": {
+      "content": "<unused_token_190>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130273": {
+      "content": "<unused_token_191>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130274": {
+      "content": "<unused_token_192>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130275": {
+      "content": "<unused_token_193>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130276": {
+      "content": "<unused_token_194>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130277": {
+      "content": "<unused_token_195>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130278": {
+      "content": "<unused_token_196>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130279": {
+      "content": "<unused_token_197>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130280": {
+      "content": "<unused_token_198>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130281": {
+      "content": "<unused_token_199>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130282": {
+      "content": "<unused_token_200>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130283": {
+      "content": "<unused_token_201>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130284": {
+      "content": "<unused_token_202>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130285": {
+      "content": "<unused_token_203>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130286": {
+      "content": "<unused_token_204>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130287": {
+      "content": "<unused_token_205>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130288": {
+      "content": "<unused_token_206>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130289": {
+      "content": "<unused_token_207>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130290": {
+      "content": "<unused_token_208>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130291": {
+      "content": "<unused_token_209>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130292": {
+      "content": "<unused_token_210>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130293": {
+      "content": "<unused_token_211>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130294": {
+      "content": "<unused_token_212>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130295": {
+      "content": "<unused_token_213>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130296": {
+      "content": "<unused_token_214>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130297": {
+      "content": "<unused_token_215>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130298": {
+      "content": "<unused_token_216>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130299": {
+      "content": "<unused_token_217>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130300": {
+      "content": "<unused_token_218>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130301": {
+      "content": "<unused_token_219>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130302": {
+      "content": "<unused_token_220>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130303": {
+      "content": "<unused_token_221>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130304": {
+      "content": "<unused_token_222>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130305": {
+      "content": "<unused_token_223>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130306": {
+      "content": "<unused_token_224>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130307": {
+      "content": "<unused_token_225>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130308": {
+      "content": "<unused_token_226>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130309": {
+      "content": "<unused_token_227>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130310": {
+      "content": "<unused_token_228>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130311": {
+      "content": "<unused_token_229>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130312": {
+      "content": "<unused_token_230>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130313": {
+      "content": "<unused_token_231>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130314": {
+      "content": "<unused_token_232>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130315": {
+      "content": "<unused_token_233>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130316": {
+      "content": "<unused_token_234>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130317": {
+      "content": "<unused_token_235>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130318": {
+      "content": "<unused_token_236>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130319": {
+      "content": "<unused_token_237>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130320": {
+      "content": "<unused_token_238>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130321": {
+      "content": "<unused_token_239>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130322": {
+      "content": "<unused_token_240>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130323": {
+      "content": "<unused_token_241>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130324": {
+      "content": "<unused_token_242>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130325": {
+      "content": "<unused_token_243>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130326": {
+      "content": "<unused_token_244>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130327": {
+      "content": "<unused_token_245>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130328": {
+      "content": "<unused_token_246>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130329": {
+      "content": "<unused_token_247>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130330": {
+      "content": "<unused_token_248>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130331": {
+      "content": "<unused_token_249>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130332": {
+      "content": "<unused_token_250>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130333": {
+      "content": "<unused_token_251>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130334": {
+      "content": "<unused_token_252>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130335": {
+      "content": "<unused_token_253>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130336": {
+      "content": "<unused_token_254>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130337": {
+      "content": "<unused_token_255>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130338": {
+      "content": "<unused_token_256>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130339": {
+      "content": "<unused_token_257>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130340": {
+      "content": "<unused_token_258>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130341": {
+      "content": "<unused_token_259>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130342": {
+      "content": "<unused_token_260>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130343": {
+      "content": "<unused_token_261>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130344": {
+      "content": "<unused_token_262>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130345": {
+      "content": "<unused_token_263>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130346": {
+      "content": "<unused_token_264>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130347": {
+      "content": "<unused_token_265>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130348": {
+      "content": "<unused_token_266>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130349": {
+      "content": "<unused_token_267>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130350": {
+      "content": "<unused_token_268>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130351": {
+      "content": "<unused_token_269>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130352": {
+      "content": "<unused_token_270>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130353": {
+      "content": "<unused_token_271>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130354": {
+      "content": "<unused_token_272>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130355": {
+      "content": "<unused_token_273>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130356": {
+      "content": "<unused_token_274>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130357": {
+      "content": "<unused_token_275>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130358": {
+      "content": "<unused_token_276>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130359": {
+      "content": "<unused_token_277>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130360": {
+      "content": "<unused_token_278>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130361": {
+      "content": "<unused_token_279>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130362": {
+      "content": "<unused_token_280>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130363": {
+      "content": "<unused_token_281>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130364": {
+      "content": "<unused_token_282>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130365": {
+      "content": "<unused_token_283>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130366": {
+      "content": "<unused_token_284>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130367": {
+      "content": "<unused_token_285>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130368": {
+      "content": "<unused_token_286>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130369": {
+      "content": "<unused_token_287>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130370": {
+      "content": "<unused_token_288>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130371": {
+      "content": "<unused_token_289>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130372": {
+      "content": "<unused_token_290>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130373": {
+      "content": "<unused_token_291>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130374": {
+      "content": "<unused_token_292>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130375": {
+      "content": "<unused_token_293>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130376": {
+      "content": "<unused_token_294>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130377": {
+      "content": "<unused_token_295>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130378": {
+      "content": "<unused_token_296>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130379": {
+      "content": "<unused_token_297>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130380": {
+      "content": "<unused_token_298>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130381": {
+      "content": "<unused_token_299>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130382": {
+      "content": "<unused_token_300>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130383": {
+      "content": "<unused_token_301>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130384": {
+      "content": "<unused_token_302>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130385": {
+      "content": "<unused_token_303>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130386": {
+      "content": "<unused_token_304>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130387": {
+      "content": "<unused_token_305>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130388": {
+      "content": "<unused_token_306>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130389": {
+      "content": "<unused_token_307>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130390": {
+      "content": "<unused_token_308>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130391": {
+      "content": "<unused_token_309>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130392": {
+      "content": "<unused_token_310>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130393": {
+      "content": "<unused_token_311>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130394": {
+      "content": "<unused_token_312>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130395": {
+      "content": "<unused_token_313>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130396": {
+      "content": "<unused_token_314>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130397": {
+      "content": "<unused_token_315>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130398": {
+      "content": "<unused_token_316>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130399": {
+      "content": "<unused_token_317>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130400": {
+      "content": "<unused_token_318>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130401": {
+      "content": "<unused_token_319>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130402": {
+      "content": "<unused_token_320>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130403": {
+      "content": "<unused_token_321>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130404": {
+      "content": "<unused_token_322>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130405": {
+      "content": "<unused_token_323>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130406": {
+      "content": "<unused_token_324>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130407": {
+      "content": "<unused_token_325>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130408": {
+      "content": "<unused_token_326>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130409": {
+      "content": "<unused_token_327>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130410": {
+      "content": "<unused_token_328>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130411": {
+      "content": "<unused_token_329>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130412": {
+      "content": "<unused_token_330>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130413": {
+      "content": "<unused_token_331>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130414": {
+      "content": "<unused_token_332>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130415": {
+      "content": "<unused_token_333>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130416": {
+      "content": "<unused_token_334>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130417": {
+      "content": "<unused_token_335>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130418": {
+      "content": "<unused_token_336>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130419": {
+      "content": "<unused_token_337>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130420": {
+      "content": "<unused_token_338>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130421": {
+      "content": "<unused_token_339>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130422": {
+      "content": "<unused_token_340>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130423": {
+      "content": "<unused_token_341>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130424": {
+      "content": "<unused_token_342>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130425": {
+      "content": "<unused_token_343>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130426": {
+      "content": "<unused_token_344>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130427": {
+      "content": "<unused_token_345>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130428": {
+      "content": "<unused_token_346>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130429": {
+      "content": "<unused_token_347>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130430": {
+      "content": "<unused_token_348>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130431": {
+      "content": "<unused_token_349>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130432": {
+      "content": "<unused_token_350>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130433": {
+      "content": "<unused_token_351>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130434": {
+      "content": "<unused_token_352>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130435": {
+      "content": "<unused_token_353>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130436": {
+      "content": "<unused_token_354>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130437": {
+      "content": "<unused_token_355>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130438": {
+      "content": "<unused_token_356>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130439": {
+      "content": "<unused_token_357>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130440": {
+      "content": "<unused_token_358>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130441": {
+      "content": "<unused_token_359>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130442": {
+      "content": "<unused_token_360>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130443": {
+      "content": "<unused_token_361>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130444": {
+      "content": "<unused_token_362>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130445": {
+      "content": "<unused_token_363>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130446": {
+      "content": "<unused_token_364>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130447": {
+      "content": "<unused_token_365>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130448": {
+      "content": "<unused_token_366>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130449": {
+      "content": "<unused_token_367>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130450": {
+      "content": "<unused_token_368>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130451": {
+      "content": "<unused_token_369>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130452": {
+      "content": "<unused_token_370>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130453": {
+      "content": "<unused_token_371>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130454": {
+      "content": "<unused_token_372>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130455": {
+      "content": "<unused_token_373>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130456": {
+      "content": "<unused_token_374>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130457": {
+      "content": "<unused_token_375>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130458": {
+      "content": "<unused_token_376>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130459": {
+      "content": "<unused_token_377>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130460": {
+      "content": "<unused_token_378>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130461": {
+      "content": "<unused_token_379>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130462": {
+      "content": "<unused_token_380>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130463": {
+      "content": "<unused_token_381>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130464": {
+      "content": "<unused_token_382>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130465": {
+      "content": "<unused_token_383>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130466": {
+      "content": "<unused_token_384>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130467": {
+      "content": "<unused_token_385>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130468": {
+      "content": "<unused_token_386>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130469": {
+      "content": "<unused_token_387>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130470": {
+      "content": "<unused_token_388>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130471": {
+      "content": "<unused_token_389>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130472": {
+      "content": "<unused_token_390>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130473": {
+      "content": "<unused_token_391>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130474": {
+      "content": "<unused_token_392>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130475": {
+      "content": "<unused_token_393>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130476": {
+      "content": "<unused_token_394>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130477": {
+      "content": "<unused_token_395>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130478": {
+      "content": "<unused_token_396>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130479": {
+      "content": "<unused_token_397>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130480": {
+      "content": "<unused_token_398>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130481": {
+      "content": "<unused_token_399>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130482": {
+      "content": "<unused_token_400>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130483": {
+      "content": "<unused_token_401>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130484": {
+      "content": "<unused_token_402>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130485": {
+      "content": "<unused_token_403>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130486": {
+      "content": "<unused_token_404>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130487": {
+      "content": "<unused_token_405>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130488": {
+      "content": "<unused_token_406>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130489": {
+      "content": "<unused_token_407>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130490": {
+      "content": "<unused_token_408>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130491": {
+      "content": "<unused_token_409>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130492": {
+      "content": "<unused_token_410>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130493": {
+      "content": "<unused_token_411>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130494": {
+      "content": "<unused_token_412>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130495": {
+      "content": "<unused_token_413>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130496": {
+      "content": "<unused_token_414>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130497": {
+      "content": "<unused_token_415>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130498": {
+      "content": "<unused_token_416>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130499": {
+      "content": "<unused_token_417>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130500": {
+      "content": "<unused_token_418>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130501": {
+      "content": "<unused_token_419>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130502": {
+      "content": "<unused_token_420>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130503": {
+      "content": "<unused_token_421>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130504": {
+      "content": "<unused_token_422>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130505": {
+      "content": "<unused_token_423>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130506": {
+      "content": "<unused_token_424>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130507": {
+      "content": "<unused_token_425>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130508": {
+      "content": "<unused_token_426>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130509": {
+      "content": "<unused_token_427>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130510": {
+      "content": "<unused_token_428>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130511": {
+      "content": "<unused_token_429>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130512": {
+      "content": "<unused_token_430>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130513": {
+      "content": "<unused_token_431>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130514": {
+      "content": "<unused_token_432>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130515": {
+      "content": "<unused_token_433>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130516": {
+      "content": "<unused_token_434>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130517": {
+      "content": "<unused_token_435>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130518": {
+      "content": "<unused_token_436>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130519": {
+      "content": "<unused_token_437>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130520": {
+      "content": "<unused_token_438>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130521": {
+      "content": "<unused_token_439>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130522": {
+      "content": "<unused_token_440>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130523": {
+      "content": "<unused_token_441>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130524": {
+      "content": "<unused_token_442>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130525": {
+      "content": "<unused_token_443>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130526": {
+      "content": "<unused_token_444>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130527": {
+      "content": "<unused_token_445>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130528": {
+      "content": "<unused_token_446>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130529": {
+      "content": "<unused_token_447>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130530": {
+      "content": "<unused_token_448>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130531": {
+      "content": "<unused_token_449>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130532": {
+      "content": "<unused_token_450>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130533": {
+      "content": "<unused_token_451>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130534": {
+      "content": "<unused_token_452>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130535": {
+      "content": "<unused_token_453>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130536": {
+      "content": "<unused_token_454>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130537": {
+      "content": "<unused_token_455>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130538": {
+      "content": "<unused_token_456>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130539": {
+      "content": "<unused_token_457>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130540": {
+      "content": "<unused_token_458>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130541": {
+      "content": "<unused_token_459>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130542": {
+      "content": "<unused_token_460>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130543": {
+      "content": "<unused_token_461>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130544": {
+      "content": "<unused_token_462>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130545": {
+      "content": "<unused_token_463>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130546": {
+      "content": "<unused_token_464>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130547": {
+      "content": "<unused_token_465>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130548": {
+      "content": "<unused_token_466>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130549": {
+      "content": "<unused_token_467>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130550": {
+      "content": "<unused_token_468>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130551": {
+      "content": "<unused_token_469>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130552": {
+      "content": "<unused_token_470>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130553": {
+      "content": "<unused_token_471>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130554": {
+      "content": "<unused_token_472>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130555": {
+      "content": "<unused_token_473>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130556": {
+      "content": "<unused_token_474>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130557": {
+      "content": "<unused_token_475>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130558": {
+      "content": "<unused_token_476>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "130559": {
+      "content": "<unused_token_477>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    }
+  },
+  "bos_token": "<s>",
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "</s>",
+  "extra_special_tokens": {},
+  "legacy": true,
+  "model_max_length": 1000000000000000019884624838656,
+  "pad_token": "</s>",
+  "sp_model_kwargs": {},
+  "spaces_between_special_tokens": false,
+  "tokenizer_class": "PreTrainedTokenizerFast",
+  "unk_token": "<unk>",
+  "use_default_system_prompt": false
+}

artifacts/quest-lora/training-recipe.json ADDED Viewed

	@@ -0,0 +1,23 @@

+{
+  "type": "lora_training_recipe",
+  "base_model": "openbmb/MiniCPM5-1B",
+  "adapter_task": "hackathon_advisor_quest_classification",
+  "method": "LoRA SFT (completion-only loss)",
+  "example_count": 146,
+  "epochs": 6.0,
+  "rank": 16,
+  "alpha": 32,
+  "dropout": 0.05,
+  "learning_rate": 0.0002,
+  "max_seq_length": 2560,
+  "target_modules": [
+    "down_proj",
+    "gate_proj",
+    "k_proj",
+    "o_proj",
+    "q_proj",
+    "up_proj",
+    "v_proj"
+  ],
+  "gpu": "A10G"
+}

data/quest_corpus.json ADDED Viewed

The diff for this file is too large to render. See raw diff

data/quest_dataset_card.md ADDED Viewed

	@@ -0,0 +1,83 @@

+---
+license: apache-2.0
+task_categories:
+- text-classification
+- text-generation
+language:
+- en
+tags:
+- hackathon-advisor
+- quest-classification
+- lora-sft
+- minicpm5
+pretty_name: Hackathon Advisor Quest Classification SFT
+size_categories:
+- n<1K
+---
+# Hackathon Advisor — Quest Classification SFT Dataset
+Supervised fine-tuning data that teaches MiniCPM5-1B to classify a Build Small
+Hackathon project against 13 judging dimensions from a two-segment README + app-file
+prompt, emitting strict JSON with short, source-attributed evidence. This dataset trains the LoRA adapter published at
+[`build-small-hackathon/hackathon-advisor-quest-minicpm5-lora`](https://huggingface.co/build-small-hackathon/hackathon-advisor-quest-minicpm5-lora).
+## Format (`quest_sft.jsonl`)
+Chat-JSONL. The **first line** is a `lora_sft_manifest`; every following line is a
+`lora_sft_example` with a `messages` list (system / user / assistant). The assistant
+turn is exactly one JSON object:
+```json
+{"matches":[{"quest":"...","confidence":0.0,"evidence":"...","source":"readme|app_file"}]}
+```
+The output contains no markdown, no prose, and no renamed quests; `matches` is an empty list when no
+dimension has clear evidence. The user turn splits the project into a `[README]` segment and an
+`[APP_FILE]` segment so the model judges product description and implementation
+evidence separately and attributes each match to its source.
+## Quest dimensions (13)
+Six merit badges (Off the Grid, Well-Tuned, Off-Brand, Llama Champion, Sharing is
+Caring, Field Notes), two tracks (Backyard AI, Thousand Token Wood), and five
+sponsor / special awards (OpenBMB, Nemotron, Modal, Tiny Titan, Best Agent).
+## Examples: 156 (14 with empty matches)
+| variant | count |
+| --- | --- |
+| natural | 108 |
+| app_only | 16 |
+| missing_app_file | 16 |
+| noisy_metadata | 8 |
+| contradiction | 6 |
+| empty | 2 |
+Positive examples per quest:
+| quest | examples |
+| --- | --- |
+| Off the Grid | 87 |
+| Off-Brand | 59 |
+| Tiny Titan | 58 |
+| Thousand Token Wood | 49 |
+| Llama Champion | 35 |
+| Backyard AI | 35 |
+| Well-Tuned | 31 |
+| OpenBMB | 26 |
+| Sharing is Caring | 19 |
+| Nemotron | 18 |
+| Field Notes | 15 |
+| Modal | 14 |
+| Best Agent | 14 |
+## Provenance
+Built from the real public Spaces of the `build-small-hackathon` org: 125 crawled
+projects → deduped + length-filtered to 108 content-rich ones → labelled by a
+teacher-then-adversarial-verifier multi-agent workflow → plus targeted augmentations
+(app-only, readme-only / missing app file, README↔app contradictions, empty matches,
+noisy metadata). `labeled.json` holds the per-project verified labels. Examples are
+derived from public hackathon submissions for research and hackathon use; each project
+remains under its own Space license.

data/quest_label_input.json ADDED Viewed

The diff for this file is too large to render. See raw diff

data/quest_labels/in/AI-Puppet-Theater.json ADDED Viewed

	@@ -0,0 +1,14 @@

+{
+  "id": "build-small-hackathon/AI-Puppet-Theater",
+  "slug": "AI-Puppet-Theater",
+  "title": "AI Puppet Theater",
+  "sdk": "gradio",
+  "declared_models": [],
+  "tags": [
+    "gradio",
+    "region:us"
+  ],
+  "app_file": "app.py",
+  "README": "AI Puppet Theater is a public Gradio Space for building short interactive puppet shows from a user premise.",
+  "APP_FILE": "from html import escape\nfrom time import sleep\nfrom puppet_theater import (\n\nfrom html import escape\nimport os\nfrom time import sleep\n\nimport gradio as gr\n\nfrom puppet_theater import (\n    DEFAULT_OPENBMB_MODEL_ID,\n    TheaterSession,\n    create_show_from_premise,\n    get_backend_status,\n    request_finale,\n    run_one_beat,\n    summon_actor,\n    throw_prop,\n    warm_up_openbmb,\n)\n\n\nEMPTY_STAGE = \"\"\"\n<div class=\"puppet-stage stage-empty\">\n  <div class=\"stage-valance\"></div>\n  <div class=\"stage-backdrop\">\n    <div class=\"stage-marquee\">AI Puppet Theater</div>\n    <div class=\"empty-stage-copy\">Enter a premise and raise the curtain.</div>\n  </div>\n  <div class=\"stage-floorboards\"></div>\n</div>\n\"\"\"\n\nEMPTY_TRANSCRIPT = \"No show yet. The transcript will appear here.\"\nEMPTY_DIRECTOR_LOG = \"No director notes yet.\"\nEMPTY_TRACE = \"No trace events yet.\"\nEMPTY_BACKEND = (\n    \"Active backend: deterministic\\n\"\n    \"OpenBMB model id: openbmb/MiniCPM5-1B\\n\"\n    \"Model status: unloaded\\n\"\n    \"Fallback: deterministic safety path enabled\"\n)\nBACKEND_CHOICES = [\"deterministic\", \"openbmb\"]\nOPENBMB_MODEL_ID = os.getenv(\"OPENBMB_MODEL_ID\", DEFAULT_OPENBMB_MODEL_ID)\nDEFAULT_MAX_NEW_TOKENS = 80\nDEFAULT_TEMPERATURE = 0.8\nPLAYBACK_DELAY_SECONDS = 0.75\nPROP_EMOJI = {\n    \"rubber duck\": \"🐤\",\n    \"duck\": \"🐤\",\n    \"egg\": \"🥚\",\n    \"flowers\": \"💐\",\n    \"flower\": \"💐\",\n    \"tomato\": \"🍅\",\n    \"crown\": \"👑\",\n    \"tiny crown\": \"👑\",\n    \"scroll\": \"📜\",\n    \"banana\": \"🍌\",\n    \"mirror\": \"🪞\",\n}\n\nCUSTOM_CSS = \"\"\"\nbody,\n.gradio-container {\n    background:\n        radial-gradient(circle at 50% 0%, rgba(127, 29, 29, 0.18), transparent 28rem),\n        linear-gradient(180deg, #0b1020 0%, #070914 100%) !important;\n    color: #f8efe4 !important;\n}\n.gradio-container {\n    max-width: 1180px !important;\n    padding-top: 1rem !important;\n    
font-family: Inter, ui-sans-serif, system-ui, -apple-system, BlinkMacSystemFont, \" ..."
+}

data/quest_labels/in/AI-agent-Evaluation-pipeline.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "id": "build-small-hackathon/AI-agent-Evaluation-pipeline",
+  "slug": "AI-agent-Evaluation-pipeline",
+  "title": "ai agent evaluation pipeline",
+  "sdk": "gradio",
+  "declared_models": [],
+  "tags": [
+    "agents",
+    "evaluation",
+    "gradio",
+    "llm",
+    "observability"
+  ],
+  "app_file": "app.py",
+  "README": "# 🧪 AI Agent Evaluation Pipeline > Evaluate AI agents at **Session**, **Trace**, and **Span** levels — inspired by [Amazon Bedrock AgentCore Evaluations](https://docs.aws.amazon.com/bedrock-agentcore/latest/devguide/evaluations.html) ## Overview This tool provides a structured framework for evaluating AI agent conversations using the same three-level hierarchy as Amazon Bedrock AgentCore Evaluations: ``` 📦 Session → Did the agent achieve the user's overall goal? └── 🔄 Trace → Per-turn quality (helpfulness, coherence, relevance...) └── 🔧 Span → Per tool-call accuracy ``` ## Features - **14 built-in evaluators** (1 session + 11 trace + 2 span) - **Heuristic mode** — works offline, no API key required - **3 demo traces** (Simple Q&A, Tool Calling, Multi-turn) - **Ground truth support** — `expected_response`, `expected_trajectory`, `assertions` - **Visual results** — radar chart, bar chart, heatmap, score cards ## Evaluators ### 📦 Session Level (1) | Evaluator | Description | | ----------------- | --------------------------------------------------- | | Goal Success Rate | Did the agent fully achieve the user's stated goal? | ### 🔄 Trace Level (11) | Evaluator | Description | | ----------------------- | ----------------------------------------------------------- | | Helpfulness | Does the response help the user progress toward their goal? | | Correctness | Is the response factually correct? | | Coherence | Is the reasoning logically consistent and well-structured? | | Conciseness ...",
+  "APP_FILE": "from pathlib import Path\nfrom src.evaluators import (\nfrom src.llm_judge import LLMJudge\nfrom src.models import EvalLevel, EvalMode, GroundTruth\nfrom src.parser import format_trace_tree, parse_trace\nfrom src.reliability import compute_reliability\nfrom src.runner import EvalRunner\nfrom src.visualizer import create_bar_chart, create_radar_chart, create_trace_timeline\nfrom urllib.parse import urlparse\nfrom huggingface_hub import hf_hub_download\n\n#!/usr/bin/env python3\n\"\"\"\nAI Agent Evaluation Pipeline — Gradio MVP\n==========================================\nEvaluate AI agents at 3 hierarchical levels, inspired by\nAmazon Bedrock AgentCore Evaluations.\n\n  📦 Session  — Did the agent achieve the user's goal?\n  🔄 Trace    — Per-turn quality (11 evaluators)\n  🔧 Span     — Per tool-call accuracy (2 evaluators)\n\nRun locally : python app.py\nHuggingFace : app_file = app.py  (Gradio SDK)\n\"\"\"\n\nimport json\nimport os\nimport sys\nfrom pathlib import Path\n\n# Ensure src/ is importable whether run from repo root or HF Spaces\n_ROOT = Path(__file__).parent\nsys.path.insert(0, str(_ROOT))\n\nimport gradio as gr\n\n# HF ZeroGPU Spaces require at least one @spaces.GPU-decorated function\n# to be detected at module load. The actual evaluation and dataset\n# generation work in this app uses the cloud InferenceClient and runs\n# without local GPU compute; the placeholder below exists only to\n# satisfy the runtime's static check. `spaces` is pre-installed on\n# ZeroGPU hardware; we guard the import so the app still loads if it\n# is missing (e.g. local CPU dev).\ntry:\n    import spaces as _spaces\nexcept ImportError:\n    class _spaces_stub:\n        @staticmethod\n        def GPU(fn, duration: int = 60):\n            return fn\n    _spaces = _spaces_stub()\n\n\n@_spaces.GPU\ndef _zero_gpu_healthcheck() -> dict:\n    \"\"\"Placeholder GPU function detected by the ZeroGPU runtime.\"\"\"\n    try:\n        import torch\n        retu ..."
+}

data/quest_labels/in/Advent_of_a_World_of_Flowering_Trees.json ADDED Viewed

	@@ -0,0 +1,14 @@

+{
+  "id": "build-small-hackathon/Advent_of_a_World_of_Flowering_Trees",
+  "slug": "Advent_of_a_World_of_Flowering_Trees",
+  "title": "Advent Of A World Of Flowering Trees",
+  "sdk": "gradio",
+  "declared_models": [],
+  "tags": [
+    "gradio",
+    "region:us"
+  ],
+  "app_file": "app.py",
+  "README": "Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference ## For development: first download uv and hf cli tool ```bash uv venv --python 3.13 --seed ``` then activate the virtual env .venv ```bash source .venv/Scripts/activate ``` then download dependencies ```python python -m pip install -r requirements.txt ``` then play around and change code..",
+  "APP_FILE": "from huggingface_hub import hf_hub_download\nfrom llama_cpp import Llama\n\nimport gradio as gr\nimport spaces\nfrom huggingface_hub import hf_hub_download\nimport os\nimport ctypes\n\n\nMODEL_REPO_ID = \"CohereLabs/tiny-aya-global-GGUF\"\nMODEL_FILENAME = \"tiny-aya-global-q4_k_m.gguf\"\n\nmodel_path = hf_hub_download(\n    repo_id=MODEL_REPO_ID,\n    filename=MODEL_FILENAME,\n)\n\n_llm = None\n\n# try:\n#     import nvidia.cuda_runtime\n#     import nvidia.cublas\n#     cudart = os.path.join(os.path.dirname(nvidia.cuda_runtime.__file__), \"lib\", \"libcudart.so.12\")\n#     cublas = os.path.join(os.path.dirname(nvidia.cublas.__file__), \"lib\", \"libcublas.so.12\")\n#     ctypes.CDLL(cudart, mode=ctypes.RTLD_GLOBAL)\n#     ctypes.CDLL(cublas, mode=ctypes.RTLD_GLOBAL)\n# except Exception:\n#     pass\n\ndef get_llm():\n    global _llm\n    if _llm is None:\n        from llama_cpp import Llama\n\n        _llm = Llama(\n            model_path=model_path,\n            n_gpu_layers=-1,\n            n_ctx=1024,\n            flash_attn=True,\n            verbose=False,\n        )\n    return _llm\n\n\n@spaces.GPU(duration=120)\ndef run_inference(prompt: str) -> str:\n    prompt = prompt.strip()\n    if not prompt:\n        return \"Enter a prompt to generate a response.\"\n\n    try:\n        llm = get_llm()\n    except Exception as exc:\n        return f\"llama-cpp initialization failed: {exc}\"\n\n    response = llm.create_chat_completion(\n        messages=[{\"role\": \"user\", \"content\": prompt}],\n        max_tokens=512,\n        temperature=0.7,\n    )\n    return response[\"choices\"][0][\"message\"][\"content\"].strip()\n\n\nwith gr.Blocks(title=\"Advent Of A World Of Flowering Trees\") as demo:\n    gr.Markdown(\"# Advent Of A World Of Flowering Trees\")\n    gr.Markdown(\"Tiny Aya GGUF demo running with `llama-cpp-python`.\")\n\n    prompt = gr.Textbox(\n        label=\"Prompt\",\n        lines=6,\n        placeholder=\"Ask something...\",\n  
  )\n    output = gr.Textbo ..."
+}

data/quest_labels/in/Backyard-Demo-Builder.json ADDED Viewed

	@@ -0,0 +1,24 @@

+{
+  "id": "build-small-hackathon/Backyard-Demo-Builder",
+  "slug": "Backyard-Demo-Builder",
+  "title": "Backyard Demo Builder",
+  "sdk": "gradio",
+  "declared_models": [
+    "unsloth/gemma-4-12B-it-qat-GGUF",
+    "Qwen/Qwen2.5-7B-Instruct",
+    "nvidia/Nemotron-3.5-Content-Safety"
+  ],
+  "tags": [
+    "agents",
+    "ai-agents",
+    "backyard-ai",
+    "build-small-hackathon",
+    "demo-builder",
+    "gradio",
+    "real-estate",
+    "small-language-model"
+  ],
+  "app_file": "app.py",
+  "README": "# Backyard Demo Builder ## Chapter 1: Backyard AI *Build Small Hackathon 2026 — Chapter 1 Submission* `agent-swarm-workbench` now presents as **Backyard Demo Builder**: a Gradio app that turns one real person's workflow into a small runnable demo package before anyone pays to build full software. First backyard case: my mom, a real-estate agent. She needs a cheap way to test a customer follow-up reminder workflow before committing time and money to a full app. --- ## Watch the Demo Builder Work ``` You: \"Build a real-estate follow-up CRM demo for my mom.\" Builder: Generates a Gradio mini-app, handoff spec, field notes, and checks Result: app.py, README.md, handoff_spec.md, field_notes.md Mom: Tests the workflow, then we scrap or scale. ``` Every Run produces a **downloadable demo package** and Validation report: files you can inspect, unzip, run, and test with the real person. --- ## Build Small Hackathon — Submission Notes | Requirement | How We Meet It | |---|---| | **Small model (≤ 32B)** | Provider catalog fetches models at runtime and only allows models whose ID/name proves ≤32B | | **Gradio app** | Custom dark-themed Gradio UI mounted on FastAPI | | **HF Space** | `app.py` + `requirements.txt` — one-command deploy | | **Demo video** | *(placeholder — [link to demo])* | | **Social post** | *(placeholder — [link to post])* | ### Bonus Badges Claimed | Badge | Why | |---|---| | **🎨 Off-Brand** | Fully custom CSS dark theme — Archivo + IBM Plex Mono, acid green CTAs, paper/ ...",
+  "APP_FILE": "from __future__ import annotations\nfrom arena.api import app as fastapi_app\nfrom arena.api import service\nfrom arena.gradio_app import RunOutputs, build_app, create_run_gpu as _create_run_gpu\n\n\"\"\"Unified ASGI entrypoint for API and Gradio UI.\"\"\"\n\nfrom __future__ import annotations\n\nimport os\n\nimport gradio as gr\nimport uvicorn\n\ntry:\n    import spaces\nexcept Exception:\n    class _SpacesShim:\n        def GPU(self, fn=None, **kwargs):\n            del kwargs\n\n            def decorator(inner):\n                return inner\n\n            return decorator(fn) if fn else decorator\n\n    spaces = _SpacesShim()\n\n\nfrom arena.api import app as fastapi_app\nfrom arena.api import service\nfrom arena.gradio_app import RunOutputs, build_app, create_run_gpu as _create_run_gpu\n\n\n@spaces.GPU(duration=120)\ndef create_run_gpu(\n    prompt: str,\n    criteria_text: str,\n    user_tests_text: str,\n    provider: str = \"openrouter\",\n    model: str = \"\",\n    api_key: str = \"\",\n    base_url: str = \"\",\n) -> RunOutputs:\n    return _create_run_gpu(\n        prompt,\n        criteria_text,\n        user_tests_text,\n        provider,\n        model,\n        api_key,\n        base_url,\n    )\n\n\n@spaces.GPU\ndef zerogpu_ready_marker() -> str:\n    return \"ready\"\n\n\ndemo = build_app(service, create_run_handler=create_run_gpu)\n\n\ndef create_app():\n    \"\"\"Create one FastAPI ASGI app with Gradio mounted at the root.\"\"\"\n\n    return gr.mount_gradio_app(fastapi_app, demo, path=\"/\")\n\n\napp = create_app()\n\n\ndef server_config() -> dict[str, int | str]:\n    host = os.getenv(\"GRADIO_SERVER_NAME\", os.getenv(\"HOST\", \"0.0.0.0\"))\n    port = int(os.getenv(\"GRADIO_SERVER_PORT\") or os.getenv(\"PORT\") or \"7860\")\n    return {\"host\": host, \"port\": port}\n\n\ndef gradio_launch_config() -> dict[str, bool | int | str]:\n    config = server_config()\n    port = int(os.getenv(\"GRADIO_SERVER_PORT\") or 
os.getenv(\"PORT\") or \"7860\")\n    return {\"server_nam ..."
+}

data/quest_labels/in/Case-Lantern.json ADDED Viewed

	@@ -0,0 +1,16 @@

+{
+  "id": "build-small-hackathon/Case-Lantern",
+  "slug": "Case-Lantern",
+  "title": "Case Lantern",
+  "sdk": "gradio",
+  "declared_models": [
+    "lastmass/Qwen3.5-Medical-GSPO"
+  ],
+  "tags": [
+    "gradio",
+    "region:us"
+  ],
+  "app_file": "app.py",
+  "README": "# 🏮 Case Lantern Short Demo Video： https://youtu.be/Bf3t5Cq6XuA Case Lantern is a fictional medical mystery game for the [Build Small Hackathon](https://huggingface.co/build-small-hackathon). Players investigate a short Chinese case, request clues, avoid red herrings, and submit a diagnosis within six turns. The experience uses [`lastmass/Qwen3.5-Medical-GSPO`](https://huggingface.co/lastmass/Qwen3.5-Medical-GSPO), a small Chinese medical reasoning model with roughly 4.66B parameters, as the game master and scorer. Inference runs locally via **llama.cpp** (GGUF Q4_K_M). ## Track & Merit Badges | Item | Detail | |------|--------| | Track | An Adventure in Thousand Token Wood | | AI role | Load-bearing game master, clue writer, and scoring judge | | Constraint | Small model under 32B parameters | | UI | Gradio Space with custom dark frontend | | Badge | Status | |-------|--------| | 🏕️ Off the Grid (LOCAL-FIRST) | ✅ Model runs locally in the Space | | 🎸 Well-Tuned (FINE-TUNED) | ✅ Uses fine-tuned model published on HF | | 🦙 Llama Champion | ✅ Runs via llama.cpp runtime | | 🎨 Off-Brand (CUSTOM UI) | ✅ Dark glassmorphism theme, custom CSS | ## Safety framing This is not a diagnosis or treatment tool. It only uses fictional cases for learning-oriented gameplay. Users are explicitly asked not to provide personal health information. ## Deployment notes The app is designed for **free CPU Spaces** on Hugging Face. It does not require a GPU. The GGUF model (~2.78 GB, Q4_K_M) is downloa ...",
+  "APP_FILE": "from dataclasses import dataclass, field\nfrom functools import lru_cache\nfrom typing import Dict, List, Optional\nfrom llama_cpp import Llama  # noqa: delayed import\n\n\"\"\"Case Lantern — a fictional medical mystery game powered by a small Chinese\nmedical reasoning model.\n\nBackend  : llama-cpp-python  (GGUF, runs on free CPU Spaces)\nFrontend : fully custom dark theme with glassmorphism & micro-animations\nModel    : lastmass/Qwen3.5-Medical-GSPO  (~4.66 B params, Q4_K_M quant)\n\"\"\"\n\nimport os\nimport random\nimport re\nimport textwrap\nfrom dataclasses import dataclass, field\nfrom functools import lru_cache\nfrom typing import Dict, List, Optional\n\nimport gradio as gr\n\n# ---------------------------------------------------------------------------\n# Configuration\n# ---------------------------------------------------------------------------\n# Display model (shown in UI)\nDISPLAY_MODEL_ID = \"lastmass/Qwen3.5-Medical-GSPO\"\n# GGUF repo used for actual inference (quantised by mradermacher)\nGGUF_REPO = \"mradermacher/Qwen3.5-Medical-GSPO-GGUF\"\nGGUF_FILE = \"Qwen3.5-Medical-GSPO.Q4_K_M.gguf\"\n\nDEMO_MODE = os.getenv(\"DEMO_MODE\", \"auto\").lower()\nMAX_NEW_TOKENS = int(os.getenv(\"MAX_NEW_TOKENS\", \"420\"))\n\nDISCLAIMER = (\n    \"Fictional training game only. This app does not provide medical advice, \"\n    \"diagnosis, triage, or treatment guidance for real people.\"\n)\n\n# ---------------------------------------------------------------------------\n# System prompt\n# ---------------------------------------------------------------------------\nSYSTEM_PROMPT = \"\"\"You are Case Lantern, a playful but careful medical mystery game master.\nCreate and run fictional Chinese medical reasoning puzzles for education and entertainment.\n\nRules:\n- Never present output as real medical advice.\n- Keep all patients fictional.\n- Do not ask users to share real personal health information.\n- Make the game delightful, concise, an ..."
+}

data/quest_labels/in/CodeFlow.json ADDED Viewed

	@@ -0,0 +1,14 @@

+{
+  "id": "build-small-hackathon/CodeFlow",
+  "slug": "CodeFlow",
+  "title": "CodeFlow",
+  "sdk": "gradio",
+  "declared_models": [],
+  "tags": [
+    "gradio",
+    "region:us"
+  ],
+  "app_file": "app.py",
+  "README": "Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference",
+  "APP_FILE": "from huggingface_hub import hf_hub_download\nfrom llama_cpp import Llama\nfrom gradio import Server\nfrom fastapi.responses import HTMLResponse # serve the custom frontend from a route\nfrom typing import Any, cast # to resolve PyLance freaking out over llama-cpp-python in the generate_flowchart function\nfrom textwrap import dedent\n\n\"\"\"\n3. Graph. Capture the resulting mermaid string and visualize it\n\nTo do\n- create the custom gradio look\n- explore making it look better\n- get a better model — Qwen 30b coder\n- use zerogpu\n\n\"\"\"\nfrom huggingface_hub import hf_hub_download\nfrom llama_cpp import Llama\nimport gradio as gr\nfrom gradio import Server\nfrom fastapi.responses import HTMLResponse # serve the custom frontend from a route\nfrom typing import Any, cast # to resolve PyLance freaking out over llama-cpp-python in the generate_flowchart function\nfrom textwrap import dedent\nimport re # remove thinking tag from response \n\n\n\n    out = []\n    for line in text.split('\\n'):\n        line = re.sub(r'(?<=\\w)\\[(.*?)\\]' + END, lambda m: '[\"' + esc(m.group(1)) + '\"]', line)\n        line = re.sub(r'(?<=\\w)\\{(.*?)\\}' + END, lambda m: '{\"' + esc(m.group(1)) + '\"}', line)\n        out.append(line)\n    return '\\n'.join(out)\n\n@app.api(name=\"generate_flowchart\")\ndef generate_flowchart(src_code: str) -> str:\n    # check if src_code is empty\n    if not src_code.strip(): return \"\"\n\n    # Set system prompt\n    system_prompt = dedent(\"\"\"\n    ## Role/Persona\n    You are a senior staff software architect and compiler engineer specializing in visual control-flow mapping. Your philosophy is pure utility: you translate raw execution logic into highly accurate, scannable, structural diagrams without any conversational filler, meta-commentary, or stylistic fluff.\n\n    ## Context/Objective\n    The user will provide source code files or logic snippets. Your sole objective is to parse the syntax and output a co ..."
+}

data/quest_labels/in/ContextForge.json ADDED Viewed

	@@ -0,0 +1,14 @@

+{
+  "id": "build-small-hackathon/ContextForge",
+  "slug": "ContextForge",
+  "title": "ContextForge",
+  "sdk": "gradio",
+  "declared_models": [],
+  "tags": [
+    "gradio",
+    "region:us"
+  ],
+  "app_file": "app.py",
+  "README": "# ContextForge / Agent Prompt Compiler ContextForge compiles messy software, app, and agent ideas into executable prompt architectures. It is a compiler pipeline, not a generic prompt generator. **GitHub:** https://github.com/rthgit/ContextForge **Competition Gradio Space:** https://huggingface.co/spaces/build-small-hackathon/ContextForge **Backup Gradio Space:** https://huggingface.co/spaces/RthItalia/ContextForge **Demo video:** https://raw.githubusercontent.com/rthgit/ContextForge/main/artifacts/contextforge-demo.mp4 **Tagline:** From fuzzy brief to build-ready agent blueprint. ## Backyard AI Fit - Built for real builders using AI coding agents. - Real problem: vague briefs make Codex and other agents produce wrong code, generic UI, or incomplete workflows. - Real use evidence: this architecture was used to coordinate Trollsona development, including UI refactor, model cascade, QA, packaging, and video automation. - Small-model fit: ContextForge decomposes a hard prompt-writing task into seven smaller calls so a small model can handle it. The backend always executes seven isolated modules sequentially: 1. intake analysis 2. topology decision 3. Vital Few / Vital Spot extraction 4. reasoning architecture selection 5. prompt pack generation 6. QA / repair 7. final assembly Every module attempts its own small-model call. If one call fails, only that stage uses a deterministic fallback and the pipeline continues. Runtime Details shows the source used by every stage. Each modul ...",
+  "APP_FILE": "from __future__ import annotations\nfrom dataclasses import dataclass\nfrom functools import lru_cache\nfrom typing import Any, Callable\nfrom transformers import AutoModelForCausalLM, AutoTokenizer\n\nfrom __future__ import annotations\n\nimport json\nimport os\nimport re\nimport time\nfrom dataclasses import dataclass\nfrom functools import lru_cache\nfrom typing import Any, Callable\n\n\nAPP_TITLE = \"ContextForge\"\nAPP_SUBTITLE = \"From fuzzy brief to build-ready agent blueprint.\"\nDEFAULT_MODEL_ID = \"Qwen/Qwen2.5-0.5B-Instruct\"\nDEFAULT_MID_MODEL_ID = \"RthItalia/nano_compact_3b_qkvfp16\"\nDEFAULT_HIGH_MODEL_ID = \"Qwen/Qwen3-32B\"\nREQUIRED_PROMPT_TAGS = [\n    \"ROLE\",\n    \"COGNITIVE_LAYERS\",\n    \"KAHNEMAN_SYSTEM2\",\n    \"PARETO_80_20\",\n    \"VITAL_SPOT\",\n    \"REASONING_PROTOCOL\",\n    \"AGENTIC_LOOP\",\n    \"ACTION\",\n    \"FORMAT_AND_TARGET\",\n    \"QA_CHECKS\",\n]\nTOPOLOGIES = [\"Auto\", \"Single Prompt\", \"Cascade\", \"Context Pack\", \"Agent Workflow\"]\nREASONING_LAYERS = [\n    \"CRAFT\",\n    \"Kahneman System 2\",\n    \"Pareto 80/20\",\n    \"Agentic Loop\",\n    \"Tree of Thought controlled\",\n    \"Private CoT\",\n    \"Self-Correction\",\n    \"Sentinel Recovery\",\n]\nSTAGE_NAMES = [\n    \"intake_analysis\",\n    \"topology_decision\",\n    \"vital_structure\",\n    \"reasoning_architecture\",\n    \"prompt_pack_generation\",\n    \"qa_repair\",\n    \"final_assembly\",\n]\nSTAGE_TOKEN_BUDGETS = {\n    \"intake_analysis\": 180,\n    \"topology_decision\": 140,\n    \"vital_structure\": 180,\n    \"reasoning_architecture\": 240,\n    \"prompt_pack_generation\": 520,\n    \"qa_repair\": 260,\n    \"final_assembly\": 260,\n}\n\n\ndef parse_bool_env(name: str, default: bool = False) -> bool:\n    raw = os.getenv(name)\n    if raw is None:\n        return default\n    return raw.strip().lower() in {\"1\", \"true\", \"yes\", \"on\"}\n\n\ndef parse_int_env(name: str, default: int, minimum: int, maximum: int) -> 
int:\n    try:\n        value = int(os.getenv(name, str(default)))\n    except Valu ..."
+}

data/quest_labels/in/Council-of-Tiny-Minds.json ADDED Viewed

	@@ -0,0 +1,14 @@

+{
+  "id": "build-small-hackathon/Council-of-Tiny-Minds",
+  "slug": "Council-of-Tiny-Minds",
+  "title": "Council Of Tiny Minds",
+  "sdk": "gradio",
+  "declared_models": [],
+  "tags": [
+    "gradio",
+    "region:us"
+  ],
+  "app_file": "app.py",
+  "README": "Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference",
+  "APP_FILE": "from typing import Dict, List, Any\nfrom transformers import AutoModelForCausalLM, AutoTokenizer\n\nimport os\nimport re\nimport time\nimport random\nfrom typing import Dict, List, Any\n\nimport gradio as gr\nimport torch\nfrom transformers import AutoModelForCausalLM, AutoTokenizer\n\ntry:\n    import spaces  # ZeroGPU decorator\nexcept Exception:\n    class _SpacesFallback:\n        def GPU(self, fn=None, **kwargs):\n            if fn is None:\n                def _wrap(inner):\n                    return inner\n                return _wrap\n            return fn\n    spaces = _SpacesFallback()\n\n\n# ----------------------------\n# Model\n# ----------------------------\nMODEL_ID = os.getenv(\"MODEL_ID\", \"Qwen/Qwen3.5-9B\")\nMAX_NEW_TOKENS = int(os.getenv(\"MAX_NEW_TOKENS\", \"140\"))\nTEMPERATURE = float(os.getenv(\"TEMPERATURE\", \"0.9\"))\nTOP_P = float(os.getenv(\"TOP_P\", \"0.9\"))\n\nPERSONAS = [\n    {\n        \"name\": \"Mister Wink\",\n        \"emoji\": \"✨\",\n        \"style\": (\n            \"You are charming, slightly ridiculous, and surprisingly helpful. \"\n            \"You speak like a cheerful TV host from a glitchy early-2023 chatbot era.\"\n        ),\n    },\n    {\n        \"name\": \"Goblin Clerk\",\n        \"emoji\": \"🪄\",\n        \"style\": (\n            \"You are chaotic but functional. \"\n            \"You love odd metaphors, tiny complaints, and enthusiastic one-liners.\"\n        ),\n    },\n    {\n        \"name\": \"Oracle Beta\",\n        \"emoji\": \"🔮\",\n        \"style\": (\n            \"You speak in short, atmospheric lines. \"\n            \"You sound wise, but a little too dramatic for the situation.\"\n        ),\n    },\n    {\n        \"name\": \"The Skeptic\",\n        \"emoji\": \"🫧\",\n        \"style\": (\n            \"You are skeptical, precise, and dryly funny. 
\"\n            \"You question nonsense while still being useful.\"\n        ),\n    },\n]\n\n\ndef _load_model():\n    tokenizer = AutoTokenizer.from_pretrained(MODEL_ID, trust_remote_code ..."
+}

data/quest_labels/in/Darwin-35B-A3B-Opus.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+  "id": "build-small-hackathon/Darwin-35B-A3B-Opus",
+  "slug": "Darwin-35B-A3B-Opus",
+  "title": "Darwin 35B A3B Opus",
+  "sdk": "gradio",
+  "declared_models": [],
+  "tags": [
+    "gradio",
+    "mcp-server",
+    "region:us"
+  ],
+  "app_file": "app.py",
+  "README": "This model is introduced in [Darwin Family](https://arxiv.org/abs/2605.14386).",
+  "APP_FILE": "from transformers import AutoModelForCausalLM, AutoTokenizer, BitsAndBytesConfig, TextIteratorStreamer\nfrom threading import Thread\n\nimport os\nimport spaces\nimport torch\nimport gradio as gr\nfrom transformers import AutoModelForCausalLM, AutoTokenizer, BitsAndBytesConfig, TextIteratorStreamer\nfrom threading import Thread\n\n# Persist HF Hub cache on the mounted bucket storage so the 67GB model\n# only downloads once and stays cached between ZeroGPU calls.\nos.environ.setdefault(\"HF_HOME\", \"/data/hf_home\")\nos.environ.setdefault(\"HF_HUB_CACHE\", \"/data/hf_cache\")\n\nMODEL_ID = \"FINAL-Bench/Darwin-35B-A3B-Opus\"\nHF_TOKEN = os.environ.get(\"HF_TOKEN\")\n\nBNB = BitsAndBytesConfig(\n    load_in_4bit=True,\n    bnb_4bit_quant_type=\"nf4\",\n    bnb_4bit_use_double_quant=True,\n    bnb_4bit_compute_dtype=torch.bfloat16,\n    # Allow accelerate to place buffers on CPU rather than hard-failing load.\n    # On an A10G this usually keeps 100% of weights on GPU.\n    llm_int8_enable_fp32_cpu_offload=True,\n)\n\n_model_cache = {}\n\ndef _load():\n    if \"model\" not in _model_cache:\n        tok = AutoTokenizer.from_pretrained(\n            MODEL_ID,\n            trust_remote_code=True,\n            token=HF_TOKEN,\n            cache_dir=os.environ[\"HF_HUB_CACHE\"],\n        )\n        if tok.pad_token is None:\n            tok.pad_token = tok.eos_token\n\n        if torch.cuda.is_available():\n            torch.cuda.empty_cache()\n\n        mod = AutoModelForCausalLM.from_pretrained(\n            MODEL_ID,\n            trust_remote_code=True,\n            token=HF_TOKEN,\n            quantization_config=BNB,\n            device_map=\"auto\",\n            # Calm the MoE memory estimator on A10G 24 GB\n            max_memory={0: \"22GiB\", \"cpu\": \"200GiB\"},\n            cache_dir=os.environ[\"HF_HUB_CACHE\"],\n            low_cpu_mem_usage=True,\n        )\n        _model_cache[\"model\"] = mod\n        _model_cache[\"tokenizer\"] = tok\n   
 retu ..."
+}

data/quest_labels/in/Family-Bill-Assistant.json ADDED Viewed

	@@ -0,0 +1,14 @@

+{
+  "id": "build-small-hackathon/Family-Bill-Assistant",
+  "slug": "Family-Bill-Assistant",
+  "title": "Family Bill Assistant",
+  "sdk": "gradio",
+  "declared_models": [],
+  "tags": [
+    "gradio",
+    "region:us"
+  ],
+  "app_file": "app.py",
+  "README": "Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference",
+  "APP_FILE": "from ui.layout import create_ui\nfrom tools.vision import process_receipt_image\nfrom agent.brain import process_workflow\n\nimport gradio as gr\nfrom ui.layout import create_ui\nfrom tools.vision import process_receipt_image\nfrom agent.brain import process_workflow\n\n# Load the custom CSS for the \"Off-Brand\" Badge\ntry:\n    with open(\"ui/style.css\", \"r\") as f:\n        custom_css = f.read()\nexcept FileNotFoundError:\n    custom_css = \"\"\n\n# Build the Gradio App\ndemo = gr.Blocks()\nmy_theme = gr.themes.Default(\n    primary_hue=\"blue\", \n    neutral_hue=\"slate\"\n)\n\nwith demo:\n    # Initialize the UI layout from the ui folder\n    image_input, audio_input, submit_btn, chatbot, msg_input = create_ui()\n    \n    # Bind the submit button to the Core Boss workflow\n    def handle_analyze(image, user_msg, history):\n        if not user_msg:\n            user_msg = \"Please analyze this bill.\"\n            \n        # Step 1: If an image is provided, extract raw text\n        raw_text = None\n        if image:\n            raw_text = process_receipt_image(image)\n            print(f\"=== VISION MODEL RAW TEXT ===\\n{raw_text}\\n=============================\")\n            \n        # Step 2: Route everything to the Core Boss\n        bot_response = process_workflow(user_text=user_msg, raw_vision_text=raw_text)\n        print(f\"=== CORE ROUTER RESPONSE ===\\n{bot_response}\\n============================\")\n        \n        # Step 3: Append to chat history\n        history.append({\"role\": \"user\", \"content\": user_msg})\n        history.append({\"role\": \"assistant\", \"content\": str(bot_response)})\n        return history\n        \n    submit_btn.click(\n        fn=handle_analyze,\n        inputs=[image_input, msg_input, chatbot],\n        outputs=[chatbot]\n    )\n\nif __name__ == \"__main__\":\n    demo.launch(theme=my_theme, css=custom_css)"
+}

data/quest_labels/in/First-Principle-AI.json ADDED Viewed

	@@ -0,0 +1,21 @@

+{
+  "id": "build-small-hackathon/First-Principle-AI",
+  "slug": "First-Principle-AI",
+  "title": "First-Principle AI",
+  "sdk": "gradio",
+  "declared_models": [
+    "build-small-hackathon/phase-3-gguf"
+  ],
+  "tags": [
+    "build-small-hackathon",
+    "chatbot",
+    "gguf",
+    "gradio",
+    "llama-cpp",
+    "model-lab",
+    "zerogpu"
+  ],
+  "app_file": "app.py",
+  "README": "# First-Principle AI First-Principle AI is a compact Gradio console for running and probing the `build-small-hackathon/phase-3-gguf` Q8 GGUF model through the official `llama.cpp` Ubuntu `llama-server` release. The UI includes benchmark-style examples inspired by common LLM evaluation areas: math reasoning, commonsense, science QA, truthfulness, instruction following, coding, logic, summarization, extraction, robustness, and goal-binding prompts where the model must identify which real-world object needs to move. The questions are original prompts, not copied benchmark items. ## Runtime Notes - Model repo: `build-small-hackathon/phase-3-gguf` - Model file: `model-Q8_0.gguf` - Runtime: official `llama.cpp` `llama-server` - Hardware target: ZeroGPU - Fallback behavior: visible runtime diagnostics instead of silent mock output - Model loading: runtime download/load through a persistent `llama-server` - Default llama.cpp settings: `n_ctx=2048`, `n_batch=256`, `n_ubatch=64`, memory-mapped weights, no warmup, and CPU fallback if CUDA offload is unavailable ZeroGPU is a Gradio dynamic GPU runtime primarily documented around PyTorch workloads. This app targets ZeroGPU as requested, but it runs the GGUF through the official llama.cpp CLI path so it does not depend on a Python extension compile during the Space build. If the runtime does not expose enough memory or a compatible llama.cpp binary, the app returns a visible compatibility message. The model is intentionally not preloaded d ...",
+  "APP_FILE": "from __future__ import annotations\nfrom pathlib import Path\nfrom typing import Any\nfrom huggingface_hub import HfApi, hf_hub_download\n\nfrom __future__ import annotations\n\nimport os\nimport platform\nimport re\nimport threading\nimport time\nimport subprocess\nimport tarfile\nimport urllib.request\nimport json\nfrom pathlib import Path\nfrom typing import Any\n\nimport gradio as gr\nfrom huggingface_hub import HfApi, hf_hub_download\n\ntry:\n    import spaces\nexcept Exception:  # pragma: no cover - the package exists on HF ZeroGPU runtimes\n    spaces = None  # type: ignore[assignment]\n\nMODEL_REPO = os.getenv(\"PHASE3_MODEL_REPO\", \"build-small-hackathon/phase-3-gguf\")\nMODEL_FILE = os.getenv(\"PHASE3_MODEL_FILE\", \"model-Q8_0.gguf\")\nMODEL_LABEL = \"First-Principle AI\"\nLOCAL_MODEL_PATH = Path(\"/Users/user/.lmstudio/models/owenisas/Phase-3-GGUF/model-Q8_0.gguf\")\nLLAMA_RELEASE = os.getenv(\"PHASE3_LLAMA_RELEASE\", \"b9360\")\nLLAMA_URL = os.getenv(\n    \"PHASE3_LLAMA_URL\",\n    f\"https://github.com/ggml-org/llama.cpp/releases/download/{LLAMA_RELEASE}/llama-{LLAMA_RELEASE}-bin-ubuntu-x64.tar.gz\",\n)\nMAX_CONTEXT = int(os.getenv(\"PHASE3_MAX_CONTEXT\", \"2048\"))\nMIN_RAM_GB = float(os.getenv(\"PHASE3_MIN_RAM_GB\", \"38\"))\nDISABLE_MODEL = os.getenv(\"PHASE3_DISABLE_MODEL\", \"\").lower() in {\"1\", \"true\", \"yes\"}\nUSE_ZEROGPU_DECORATOR = os.getenv(\"PHASE3_USE_ZEROGPU\", \"\").lower() in {\"1\", \"true\", \"yes\"}\nN_BATCH = int(os.getenv(\"PHASE3_N_BATCH\", \"256\"))\nN_UBATCH = int(os.getenv(\"PHASE3_N_UBATCH\", \"64\"))\nN_THREADS = int(os.getenv(\"PHASE3_THREADS\", str(max(1, min(16, os.cpu_count() or 2)))))\nN_THREADS_BATCH = int(os.getenv(\"PHASE3_THREADS_BATCH\", str(N_THREADS)))\nUSE_MMAP = os.getenv(\"PHASE3_USE_MMAP\", \"1\").lower() not in {\"0\", \"false\", \"no\"}\nUSE_MLOCK = os.getenv(\"PHASE3_USE_MLOCK\", \"\").lower() in {\"1\", \"true\", \"yes\"}\nFLASH_ATTN = os.getenv(\"PHASE3_FLASH_ATTN\", \"\").lower() 
in {\"1\", \"true\", \"yes\"}\nOFFLOAD_KQV = os.getenv ..."
+}

data/quest_labels/in/GRM-2.6-Opus.json ADDED Viewed

	@@ -0,0 +1,14 @@

+{
+  "id": "build-small-hackathon/GRM-2.6-Opus",
+  "slug": "GRM-2.6-Opus",
+  "title": "GRM-2.6-Opus",
+  "sdk": "gradio",
+  "declared_models": [],
+  "tags": [
+    "gradio",
+    "region:us"
+  ],
+  "app_file": "app.py",
+  "README": "Text-only ZeroGPU Space for `GRM-2.6-Opus`. Notes: - Built for ZeroGPU with `@spaces.GPU` - Uses 4-bit NF4 quantization to reduce memory pressure - Keeps the UI text-only because the Qwen model card explicitly recommends text-only deployment to save memory and free more KV cache - Exposes Qwen3.6 thinking controls through `enable_thinking` and `preserve_thinking` - Uses shorter default generation lengths than the model card recommendations to behave better in shared ZeroGPU queues",
+  "APP_FILE": "from threading import Thread\nfrom transformers import (\n\nimport os\nimport re\nimport html\nfrom threading import Thread\n\nimport gradio as gr\nimport spaces\nimport torch\nfrom transformers import (\n    AutoModelForCausalLM,\n    AutoTokenizer,\n    BitsAndBytesConfig,\n    TextIteratorStreamer,\n)\n\nMODEL_ID = \"OrionLLM/GRM-2.6-Opus\"\nTITLE = \"GRM-2.6-Opus\"\nSUBTITLE = \"Chat with GRM-2.6-Opus on ZeroGPU\"\nDESCRIPTION = (\n    \"Chat with GRM-2.6-Opus in a ZeroGPU Space, optimized with text-only chat, \"\n    \"NF4 4-bit loading, bounded context, streaming output, and thinking parsing.\"\n)\n\nPLACEHOLDER = (\n    \"Ask GRM-2.6-Opus for code, debugging, planning, research, long-form reasoning, \"\n    \"terminal-agent tasks, or complex multi-step workflows.\"\n)\n\nMAX_INPUT_TOKENS = 16384\nINTERNAL_MAX_NEW_TOKENS = 4096\nHF_TOKEN = os.environ.get(\"HF_TOKEN\")\n\nos.environ.setdefault(\"PYTORCH_CUDA_ALLOC_CONF\", \"expandable_segments:True\")\ntorch.backends.cuda.matmul.allow_tf32 = True\n\nBNB_CONFIG = BitsAndBytesConfig(\n    load_in_4bit=True,\n    bnb_4bit_quant_type=\"nf4\",\n    bnb_4bit_use_double_quant=True,\n    bnb_4bit_compute_dtype=torch.bfloat16,\n)\n\ntokenizer = AutoTokenizer.from_pretrained(\n    MODEL_ID,\n    trust_remote_code=True,\n    token=HF_TOKEN,\n)\n\nif tokenizer.pad_token is None:\n    tokenizer.pad_token = tokenizer.eos_token\n\nmodel = AutoModelForCausalLM.from_pretrained(\n    MODEL_ID,\n    trust_remote_code=True,\n    token=HF_TOKEN,\n    device_map={\"\": 0},\n    dtype=torch.bfloat16,\n    quantization_config=BNB_CONFIG,\n    attn_implementation=\"sdpa\",\n    low_cpu_mem_usage=True,\n)\n\nmodel.eval()\n\n\ndef model_input_device():\n    return next(model.parameters()).device\n\n\ndef strip_thinking(text: str) -> str:\n    if not text:\n        return \"\"\n\n    text = re.sub(\n        r\"(?is)<details[^>]*>\\s*<summary>.*?</summary>.*?</details>\",\n        \"\",\n        text,\n    )\n\n    text = 
re.sub(r\"(?is)<think>.*?</think> ..."
+}

data/quest_labels/in/GTROX.json ADDED Viewed

	@@ -0,0 +1,14 @@

+{
+  "id": "build-small-hackathon/GTROX",
+  "slug": "GTROX",
+  "title": "GTROX",
+  "sdk": "gradio",
+  "declared_models": [],
+  "tags": [
+    "gradio",
+    "region:us"
+  ],
+  "app_file": "app.py",
+  "README": "An example chatbot using [Gradio](https://gradio.app), [`huggingface_hub`](https://huggingface.co/docs/huggingface_hub/v0.22.2/en/index), and the [Hugging Face Inference API](https://huggingface.co/docs/api-inference/index).",
+  "APP_FILE": "from huggingface_hub import InferenceClient\n\nimport gradio as gr\nfrom huggingface_hub import InferenceClient\n\n\ndef respond(\n    message,\n    history: list[dict[str, str]],\n    system_message,\n    max_tokens,\n    temperature,\n    top_p,\n    hf_token: gr.OAuthToken,\n):\n    \"\"\"\n    For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference\n    \"\"\"\n    client = InferenceClient(token=hf_token.token, model=\"openai/gpt-oss-20b\")\n\n    messages = [{\"role\": \"system\", \"content\": system_message}]\n\n    messages.extend(history)\n\n    messages.append({\"role\": \"user\", \"content\": message})\n\n    response = \"\"\n\n    for message in client.chat_completion(\n        messages,\n        max_tokens=max_tokens,\n        stream=True,\n        temperature=temperature,\n        top_p=top_p,\n    ):\n        choices = message.choices\n        token = \"\"\n        if len(choices) and choices[0].delta.content:\n            token = choices[0].delta.content\n\n        response += token\n        yield response\n\n\n\"\"\"\nFor information on how to customize the ChatInterface, peruse the gradio docs: https://www.gradio.app/docs/chatinterface\n\"\"\"\nchatbot = gr.ChatInterface(\n    respond,\n    additional_inputs=[\n        gr.Textbox(value=\"You are a friendly Chatbot.\", label=\"System message\"),\n        gr.Slider(minimum=1, maximum=2048, value=512, step=1, label=\"Max new tokens\"),\n        gr.Slider(minimum=0.1, maximum=4.0, value=0.7, step=0.1, label=\"Temperature\"),\n        gr.Slider(\n            minimum=0.1,\n            maximum=1.0,\n            value=0.95,\n            step=0.05,\n            label=\"Top-p (nucleus sampling)\",\n        ),\n    ],\n)\n\nwith gr.Blocks() as demo:\n    with gr.Sidebar():\n        gr.LoginButton()\n    chatbot.render()\n\n\nif __name__ == \"__main__\":\n    demo.launch()"
+}

data/quest_labels/in/InContext.json ADDED Viewed

	@@ -0,0 +1,14 @@

+{
+  "id": "build-small-hackathon/InContext",
+  "slug": "InContext",
+  "title": "InContext",
+  "sdk": "gradio",
+  "declared_models": [],
+  "tags": [
+    "gradio",
+    "region:us"
+  ],
+  "app_file": "app.py",
+  "README": "Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference",
+  "APP_FILE": "from transformers import AutoModelForCausalLM, AutoTokenizer\n\nimport gradio as gr\nimport torch\nimport json\nimport html\nimport traceback\nfrom transformers import AutoModelForCausalLM, AutoTokenizer\n\nprint(\"Loading model...\")\nmodel_name = \"Qwen/Qwen2.5-0.5B-Instruct\"\ntokenizer = AutoTokenizer.from_pretrained(model_name)\nmodel = AutoModelForCausalLM.from_pretrained(\n    model_name,\n    torch_dtype=torch.float16,\n    device_map=\"auto\"\n)\nprint(\"Model loaded.\")\n\nSYSTEM_PROMPT = \"\"\"You are an English learning assistant. Extract 8-20 useful expressions from the text.\nFor each expression, output a JSON object with keys: expression, meaning, explanation, original_context, extra_example.\nMeaning and explanation should be in Chinese.\nOutput must be a JSON array. No extra text.\"\"\"\n\ndef analyze(text):\n    try:\n        if not text or len(text.strip()) < 20:\n            return \"<div style='color:red'>⚠️ Please enter at least 20 characters.</div>\"\n\n        messages = [\n            {\"role\": \"system\", \"content\": SYSTEM_PROMPT},\n            {\"role\": \"user\", \"content\": text}\n        ]\n        inputs = tokenizer.apply_chat_template(\n            messages,\n            add_generation_prompt=True,\n            return_tensors=\"pt\"\n        ).to(model.device)\n\n        with torch.no_grad():\n            outputs = model.generate(\n                inputs,\n                max_new_tokens=1024,\n                do_sample=False,\n                temperature=1.0\n            )\n\n        response = tokenizer.decode(outputs[0][inputs.shape[1]:], skip_special_tokens=True)\n\n        # 提取 JSON\n        if \"```json\" in response:\n            response = response.split(\"```json\")[1].split(\"```\")[0]\n        elif \"```\" in response:\n            response = response.split(\"```\")[1].split(\"```\")[0]\n        start = response.find(\"[\")\n        end = response.rfind(\"]\") + 1\n        if start == -1 or end == 0:\n   
         return f\"< ..."
+}

data/quest_labels/in/Kasualdad_LFED.json ADDED Viewed

	@@ -0,0 +1,19 @@

+{
+  "id": "build-small-hackathon/Kasualdad_LFED",
+  "slug": "Kasualdad_LFED",
+  "title": "Kasualdad LFED",
+  "sdk": "gradio",
+  "declared_models": [],
+  "tags": [
+    "duckdb",
+    "education",
+    "gguf",
+    "gradio",
+    "llama-cpp",
+    "local-first",
+    "text-to-sql"
+  ],
+  "app_file": "app.py",
+  "README": "# 🏫 Kasualdad LFED **Local-First Education Data** — ask questions about your district in plain English, get answers instantly. All inference runs on your machine. No data ever leaves. > 🏆 Built for the **HF Build Small Hackathon** (Chapter One: Backyard AI) --- ## 🏅 Hackathon Badges | Badge | Status | How | |---|---|---| | **Off the Grid** | ✅ | All inference via llama.cpp + local GGUF. No API calls. No cloud. | | **Well-Tuned** | ✅ | Fine-tuned Qwen2.5-Coder-7B on 1,200+ synthetic NL→SQL pairs via Unsloth QLoRA on Modal A10G. | | **Llama Champion** | ✅ | llama.cpp as the sole inference backend. Q4_K_M quantization. Streaming token generation. | | **Off-Brand** | ✅ | Custom design system (Linear/Vercel inspired), WCAG AA, Inter + JetBrains Mono, documented below. | --- ## 🎯 What It Does A school district admin (principal, superintendent, department head) types a question: > *\"What percentage of students at Lincoln Elementary were chronically absent in 2023-2024?\"* Kasualdad LFED: 1. Sends the question + schema context to a local LLM (llama.cpp) 2. Streams the generated SQL back in real-time 3. Validates the SQL against the actual schema (column names, safety) 4. Executes it on an in-memory DuckDB database 5. Returns the results as a table All local. No API keys. No data exfiltration. --- ## 🏗 Architecture ```mermaid flowchart TD U[👤 School Admin] -->|natural language| UI[Gradio UI] UI -->|question + schema| LLM[model_inference.py] LLM -->|llama.cpp| GGUF[Qwen2.5-Coder-7B<br/> ...",
+  "APP_FILE": "from model_inference import load_model, generate_sql\nfrom data_engine import create_session, execute_safe, QueryTimeoutError\nfrom pathlib import Path\nfrom data.export_parquet import export_parquet\n\n\"\"\"\napp.py — Kasualdad LFED: Local-First Education Data Analytics.\n\nThin Gradio controller. All logic lives in:\n  - prompts.py         (system prompt, schema docs, few-shot examples)\n  - model_inference.py (llama.cpp wrapper, SQL generation + streaming)\n  - data_engine.py     (DuckDB lifecycle, schema seeding, execution guard)\n\"\"\"\n\nimport gradio as gr\nimport spaces\n\nfrom model_inference import load_model, generate_sql\nfrom data_engine import create_session, execute_safe, QueryTimeoutError\n\n# ── Startup ───────────────────────────────────────────────────────────\n\nprint(\"🚀 Starting Kasualdad LFED...\")\n\n# Ensure Parquet seed files exist (generate on first boot, persist in /data/)\nfrom pathlib import Path\n_parquet_dirs = [Path(\"/data\"), Path(__file__).parent / \"data\"]\n_pq_files = [\"enrollment.parquet\", \"attendance.parquet\"]\n_pq_found = any(\n    all((base / f).exists() for f in _pq_files)\n    for base in _parquet_dirs\n)\nif not _pq_found:\n    print(\"📦 Generating seed Parquet files (first boot)...\")\n    from data.export_parquet import export_parquet\n    _pq_out = _parquet_dirs[0] if _parquet_dirs[0].exists() else _parquet_dirs[1]\n    export_parquet(_pq_out)\n\nprint(\"🦙 Loading model...\")\nllm = load_model()\nprint(\"✅ Ready.\")\n\n# ── Example queries ────────────────────────────────────────────────────\n\nEXAMPLE_QUERIES = [\n    \"How many students were chronically absent in 2023-2024?\",\n    \"Show total enrollment per school for 2024-2025, sorted highest first.\",\n    \"What is the average absence count per school in 2023-2024?\",\n    \"Show the enrollment trend across all school years.\",\n    \"Which grade level has the highest enrollment in 2024-2025?\",\n    \"What percentage of students at Linco 
..."
+}

data/quest_labels/in/Kintsugi-Garden.json ADDED Viewed

	@@ -0,0 +1,14 @@

+{
+  "id": "build-small-hackathon/Kintsugi-Garden",
+  "slug": "Kintsugi-Garden",
+  "title": "The Kintsugi Garden",
+  "sdk": "gradio",
+  "declared_models": [],
+  "tags": [
+    "gradio",
+    "region:us"
+  ],
+  "app_file": "app.py",
+  "README": "<p align=\"center\"> <img src=\"logo.svg\" alt=\"The Kintsugi Garden — K and G mended by a gold seam\" width=\"220\"> </p> # The Kintsugi Garden > *A symbolic mirror for dreams, journals, and inner transitions.* **This is not therapy, diagnosis, prediction, or advice. It is a symbolic reflection tool.** The Kintsugi Garden is a small-model symbolic reflection app. You give it a dream, a journal entry, an emotional trigger, a relationship pattern, a recurring symbol, or a life transition, and it offers back a *symbolic reading*: archetypal themes, possible shadow patterns, individuation signals, a gentle question, and a session-based **Soul Map**. Like the Japanese art of *kintsugi* — mending broken pottery with gold — the app treats the cracks and wounds in our inner stories as places where meaning and value can gather, never as something to diagnose or fix. --- ## Project overview The app accepts free-form text and surrounds a lightweight instruction-tuned language model with deterministic Python scaffolding: - a curated **symbolic lexicon** (40+ symbols, each with meanings, archetypes, shadow motifs, and individuation signals); - **symbol extraction** with aliases and simple plural handling; - a session-local **Soul Map** that tracks recurring symbols and themes; - **prompt compression** so only the current entry and its symbols reach the model; - **structured, parsed output** split across calm, focused tabs; - a **deterministic mandala generator** (PIL) that visualizes the symbols ...",
+  "APP_FILE": "from PIL import Image, ImageDraw, ImageFont\n\n\"\"\"\nThe Kintsugi Garden\nA symbolic mirror for dreams, journals, and inner transitions.\n\nA small-model symbolic reflection app built for the Build Small Hackathon.\n\nThis is NOT therapy, diagnosis, prediction, fortune-telling, or advice.\nIt is a symbolic reflection tool.\n\nThe design philosophy is \"small model, strong scaffolding\": rather than\nrelying on the LLM alone, the app surrounds a lightweight instruction model\n(microsoft/Phi-4-mini-instruct) with deterministic Python:\n\n  * a curated symbolic lexicon\n  * keyword / symbol extraction with aliases and simple plurals\n  * a session-local \"Soul Map\" memory\n  * prompt compression (only the current entry + extracted symbols are sent)\n  * structured, parsed output\n  * deterministic mandala generation with PIL (no image model required)\n\nAuthor: Build Small Hackathon submission\n\"\"\"\n\nimport os\nimport re\nimport sys\nimport json\nimport math\nimport datetime\nimport traceback\n\nimport gradio as gr\nimport pandas as pd\nfrom PIL import Image, ImageDraw, ImageFont\n\n# `spaces` is only available on HF Spaces with zero-* hardware tiers. Guard\n# the import so local development (Mac, Linux, etc.) doesn't hard-fail.\n# Outside HF Spaces, @spaces.GPU becomes a no-op passthrough decorator.\ntry:\n    import spaces\nexcept Exception:  # pragma: no cover - local dev environments\n    class _SpacesStub:\n        def GPU(self, *args, **kwargs):\n            def decorator(fn):\n                return fn\n            return decorator\n    spaces = _SpacesStub()\n\n# Torch / transformers are imported lazily inside load_model() so that the\n# Gradio interface can still render even if the heavy stack has trouble\n# loading. We import torch eagerly because we need its dtype constants, but\n# guard it so the app never hard-crashes at import time.\ntry:\n    import torch\nexcept Exception:  # pragma: no cover - extremely defensiv ..."
+}

data/quest_labels/in/LocalDuo.json ADDED Viewed

	@@ -0,0 +1,14 @@

+{
+  "id": "build-small-hackathon/LocalDuo",
+  "slug": "LocalDuo",
+  "title": "LocalDuo",
+  "sdk": "gradio",
+  "declared_models": [],
+  "tags": [
+    "gradio",
+    "region:us"
+  ],
+  "app_file": "app.py",
+  "README": "Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference",
+  "APP_FILE": "from PIL import Image\nfrom supertonic import TTS\nfrom transformers import AutoProcessor, AutoModelForImageTextToText\nfrom bs4 import BeautifulSoup\nfrom playwright.sync_api import sync_playwright\nfrom urllib.parse import urljoin\nfrom transformers import TextIteratorStreamer, StoppingCriteria, StoppingCriteriaList\nfrom threading import Thread\n\n# Copyright: Shayekh Bin Islam. KAIST, South Korea. 2026.\n\nMAX_TEXT_CHAR = 1500\n\n# model_id = \"Qwen/Qwen3.5-9B\"\nmodel_id = \"Qwen/Qwen3.5-2B\"\n\ntry:\n    import spaces\n    IS_HF = True\nexcept ImportError:\n    IS_HF = False\n\n\nif not IS_HF:\n    class spaces:\n        @staticmethod\n        def GPU(*args, **kwargs):\n            def decorator(func):\n                return func\n            if len(args) == 1 and callable(args[0]) and not kwargs:\n                return args[0]\n            return decorator\nelse:\n    import os, sys, subprocess\n    os.environ['SUPERTONIC_CACHE_DIR']  = '/home/user/huggingface'\n    os.environ[\"HF_HOME\"] = \"/home/user/huggingface\"\n    os.environ['XDG_CACHE_HOME'] = \"/home/user/huggingface\"\n    \n    os.environ['PLAYWRIGHT_BROWSERS_PATH'] = \"/home/user/huggingface/ms-playwright\"\n    # os.system(\"playwright install chromium\")\n    result = subprocess.run(\n        [\"python\", \"-m\", \"playwright\", \"install\", \"chromium\"],\n        env={**os.environ},\n        check=True,\n        stdout=subprocess.PIPE,\n        stderr=subprocess.PIPE\n    )\n\nimport gradio as gr\nimport fitz  # PyMuPDF\nfrom PIL import Image\nimport io\nimport json\nimport base64\nimport soundfile as sf\nimport torch\nimport os\n\nfrom supertonic import TTS\nfrom transformers import AutoProcessor, AutoModelForImageTextToText\n\n# model = None\n# processor = None\n# tts = None\n# voice_style = None\n\nglobal_stop_thinking = [False]\nglobal_kill_threads = [False]\n\ndef set_stop_thinking():\n    global_stop_thinking[0] = True\n    print(f\"[STOP-THINK] set_stop_thinking 
CALLED! Flag is ..."
+}

data/quest_labels/in/Mediassist.json ADDED Viewed

	@@ -0,0 +1,14 @@

+{
+  "id": "build-small-hackathon/Mediassist",
+  "slug": "Mediassist",
+  "title": "Mediassist",
+  "sdk": "gradio",
+  "declared_models": [],
+  "tags": [
+    "gradio",
+    "region:us"
+  ],
+  "app_file": "app.py",
+  "README": "Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference",
+  "APP_FILE": "from transformers import AutoTokenizer, AutoModelForCausalLM\n\nimport gradio as gr\nfrom transformers import AutoTokenizer, AutoModelForCausalLM\nimport torch\n\nmodel = None\ntokenizer = None\n\ndef load_model():\n    global model, tokenizer\n    if model is None:\n        print(\"[MediAssist] Loading...\")\n        model_id = \"TinyLlama/TinyLlama-1.1B-Chat-v1.0\"\n        tokenizer = AutoTokenizer.from_pretrained(model_id)\n        model = AutoModelForCausalLM.from_pretrained(\n            model_id, torch_dtype=torch.float32, low_cpu_mem_usage=True\n        )\n        model.eval()\n        print(\"[MediAssist] Ready!\")\n\n# For Urdu/Hindi we translate the question to English, get answer, keep it simple\n# TinyLlama only works well in English — this is honest and works\nSYSTEM_EN = \"\"\"You are MediAssist, a medical assistant for rural Pakistan communities.\nAnswer clearly in English with this exact format:\n\n🔍 What this might be:\n- cause 1\n- cause 2\n\n🏠 Home care steps:\n- step 1\n- step 2\n- step 3\n\n🚨 Go to doctor immediately if:\n- warning 1\n- warning 2\n\nKeep under 120 words. Never diagnose. Always suggest seeing a doctor for serious issues.\"\"\"\n\nSYSTEM_UR = \"\"\"You are a medical assistant. The user is asking in Urdu.\nFirst translate their question to English, answer in English with this format:\n\n🔍 What this might be:\n- cause\n\n🏠 Home care:\n- step 1\n- step 2\n\n🚨 See doctor if:\n- warning\n\nThen write: \"اردو خلاصہ:\" and give a 2-line Urdu summary of your answer.\nKeep total response under 150 words.\"\"\"\n\nSYSTEM_HI = \"\"\"You are a medical assistant. Answer in simple Hindi with this format:\n\n🔍 यह क्या हो सकता है:\n- कारण\n\n🏠 घर पर करें:\n- कदम 1\n- कदम 2\n\n🚨 डॉक्टर के पास जाएं अगर:\n- चेतावनी\n\n100 शब्दों से कम रखें।\"\"\"\n\nSYSTEMS = {\n    \"English\": SYSTEM_EN,\n    \"اردو\": SYSTEM_UR,\n    \"हिन्दी\": SYSTEM_HI,\n}\n\nDISCLAIMERS = {\n    \"English\": \"\\n\\n⚠️ *For informational purposes only. 
Always consult a real doctor.*\", ..."
+}

data/quest_labels/in/NEXUS-Visual-Weaver.json ADDED Viewed

	@@ -0,0 +1,14 @@

+{
+  "id": "build-small-hackathon/NEXUS-Visual-Weaver",
+  "slug": "NEXUS-Visual-Weaver",
+  "title": "NEXUS Visual Weaver",
+  "sdk": "gradio",
+  "declared_models": [],
+  "tags": [
+    "gradio",
+    "region:us"
+  ],
+  "app_file": "app.py",
+  "README": "Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference",
+  "APP_FILE": "from diffusers import Flux2KleinPipeline\n\nimport spaces  # MUST be imported before any CUDA-touching package (torch/diffusers)\n\nimport gradio as gr\nimport numpy as np\nimport random\nimport torch\nfrom diffusers import Flux2KleinPipeline\n\n# ---------------------------------------------------------------------------\n# Model: FLUX.2 [klein] 4B\n#   - Apache-2.0, 4B params, BFL's fastest small model (sub-second, ~13GB VRAM)\n#   - Unified text-to-image + multi-reference editing\n#   - Released Jan 2026 (current BFL small-model generation)\n# ---------------------------------------------------------------------------\nMODEL_REPO_ID = \"black-forest-labs/FLUX.2-klein-4B\"\n\ndtype = torch.bfloat16\ndevice = \"cuda\" if torch.cuda.is_available() else \"cpu\"\n\n# Load on cuda at module level. (No enable_model_cpu_offload() on ZeroGPU —\n# the GPU is only attached inside @spaces.GPU; module-level cuda uses the\n# ZeroGPU CUDA-emulation, and offload would conflict.)\npipe = Flux2KleinPipeline.from_pretrained(MODEL_REPO_ID, torch_dtype=dtype).to(device)\n\nMAX_SEED = np.iinfo(np.int32).max\nMAX_IMAGE_SIZE = 2048\n\n\n@spaces.GPU(duration=60)\ndef infer(\n    prompt,\n    seed,\n    randomize_seed,\n    width,\n    height,\n    num_inference_steps,\n    guidance_scale,\n    progress=gr.Progress(track_tqdm=True),\n):\n    if randomize_seed:\n        seed = random.randint(0, MAX_SEED)\n    generator = torch.Generator(device=device).manual_seed(seed)\n    image = pipe(\n        prompt=prompt,\n        width=width,\n        height=height,\n        num_inference_steps=num_inference_steps,\n        guidance_scale=guidance_scale,\n        generator=generator,\n    ).images[0]\n    return image, seed\n\n\nexamples = [\n    \"A magical city at twilight, glowing windows, storybook illustration, warm light\",\n    \"A cat holding a sign that says hello world\",\n    \"Astronaut in a jungle, cold color palette, muted colors, detailed, 8k\",\n]\n\ncss = ..."
+}

data/quest_labels/in/PocketWorld-Studio.json ADDED Viewed

	@@ -0,0 +1,14 @@

+{
+  "id": "build-small-hackathon/PocketWorld-Studio",
+  "slug": "PocketWorld-Studio",
+  "title": "PocketWorld Studio",
+  "sdk": "gradio",
+  "declared_models": [],
+  "tags": [
+    "gradio",
+    "region:us"
+  ],
+  "app_file": "app.py",
+  "README": "Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference",
+  "APP_FILE": "from pathlib import Path\n\nimport copy\nimport html\nimport json\nfrom pathlib import Path\n\nimport gradio as gr\n\n\nPROJECT_ROOT = Path(__file__).parent\nASSETS_DIR = PROJECT_ROOT / \"assets\"\nASSET_CATALOG_PATH = ASSETS_DIR / \"asset_catalog.json\"\n\nRENDERER_VERSION = \"0.5\"\nWORLD_SCHEMA_VERSION = \"pocketworld-world-v0.5\"\nASSET_SCHEMA_VERSION = \"pocketworld-assets-v0.1\"\nTHEME_OPTIONS = [\"Auto\", \"Light\", \"Dark\"]\nDEFAULT_THEME = \"Auto\"\nWORLD_THEMES = [\"cozy_fantasy\", \"sci_fi_station\", \"haunted_mystery\", \"tiny_city\"]\nDEFAULT_WORLD_THEME = \"cozy_fantasy\"\n\nTILE_LEGEND = {\n    \"W\": \"wall / blocked\",\n    \".\": \"floor / walkable\",\n    \"G\": \"locked goal or exit\",\n}\n\n\nEMBEDDED_ASSET_CATALOG = {\n    \"schema_version\": ASSET_SCHEMA_VERSION,\n    \"source\": {\n        \"name\": \"Kenney Tiny Dungeon\",\n        \"url\": \"https://kenney.nl/assets/tiny-dungeon\",\n        \"license\": \"Creative Commons Zero (CC0)\",\n        \"license_url\": \"https://creativecommons.org/publicdomain/zero/1.0/\",\n        \"credit\": \"Kenney\",\n    },\n    \"tile_size\": 16,\n    \"display_tile_size\": 44,\n    \"themes\": {\n        \"cozy_fantasy\": {\n            \"tile_palette\": {\"W\": \"wall_wood\", \".\": \"floor_wood\", \"G\": \"gate\"},\n            \"player_sprite_key\": \"player\",\n            \"npc_sprite_keys\": [\"npc_wizard\", \"npc_merchant\", \"npc_citizen\"],\n            \"item_sprite_keys\": [\"key\", \"gem\", \"potion\", \"scroll\"],\n            \"landmark_asset_keys\": [\"gate\", \"well\", \"tower\", \"bridge\"],\n        },\n        \"sci_fi_station\": {\n            \"tile_palette\": {\"W\": \"wall_metal\", \".\": \"floor_metal\", \"G\": \"portal\"},\n            \"player_sprite_key\": \"player\",\n            \"npc_sprite_keys\": [\"npc_robot\", \"npc_scientist\"],\n            \"item_sprite_keys\": [\"battery\", \"gear\", \"tool\"],\n            \"landmark_asset_keys\": [\"portal\", 
\"computer\", \"door\"],\n        },\n        \"haunted_mystery\": {\n            \"tile_palette\": {\"W\": \"wall_stone\", \".\": \"floor_stone\", \"G\" ..."
+}

data/quest_labels/in/Retail-Insight-AI.json ADDED Viewed

	@@ -0,0 +1,14 @@

+{
+  "id": "build-small-hackathon/Retail-Insight-AI",
+  "slug": "Retail-Insight-AI",
+  "title": "Retail Insight AI Pro",
+  "sdk": "gradio",
+  "declared_models": [],
+  "tags": [
+    "gradio",
+    "region:us"
+  ],
+  "app_file": "app.py",
+  "README": "# 🛒 Retail-Insight-AI v2.5 ### ⚡ Build Small Hackathon Submission (Backyard AI Track) Retail-Insight-AI ek privacy-first, 100% offline edge analytics dashboard hai jo local shopkeepers ko enterprise-level operational insights deta hai bina unka data cloud par leak kiye. ### ✨ Key Features - **Instant 10K Row Audit:** Sirf 2 seconds mein pure sales log ko process karta hai. - **Semantic Mapping:** Intelligent column mapping automatic Product Names aur Revenue attributes ko detect karti hai. - **Edge Heuristics:** Zero cloud API dependencies, complete privacy for local stores. ## 📺 Live Video Demo [Watch the Demo Video Here](https://www.instagram.com/reel/DZNAcHlv72c/?utm_source=ig_web_copy_link&igsh=MzRlODBiNWFlZA==)",
+  "APP_FILE": "import sys\nimport types\n\n# 🚨 DYNAMIC FIX 1: Python 3.13 Compatibility Audio Patch\nif 'audioop' not in sys.modules:\n    dummy_audioop = types.ModuleType('audioop')\n    dummy_audioop.error = Exception\n    sys.modules['audioop'] = dummy_audioop\n\nif 'pyaudioop' not in sys.modules:\n    dummy_pyaudioop = types.ModuleType('pyaudioop')\n    dummy_pyaudioop.error = Exception\n    sys.modules['pyaudioop'] = dummy_pyaudioop\n\n# 🚨 DYNAMIC FIX 2: Critical HuggingFace Hub 'HfFolder' Import Patch\ntry:\n    import huggingface_hub\nexcept ImportError:\n    huggingface_hub = types.ModuleType('huggingface_hub')\n    sys.modules['huggingface_hub'] = huggingface_hub\n\nif not hasattr(huggingface_hub, 'HfFolder'):\n    class DummyHfFolder:\n        @staticmethod\n        def get_token(): return None\n        @staticmethod\n        def save_token(token): pass\n        @staticmethod\n        def delete_token(): pass\n    huggingface_hub.HfFolder = DummyHfFolder\n\nimport gradio as gr\nimport pandas as pd\nimport os\n\ndef generate_local_insights(summary_data):\n    insights = []\n    if 'top_product' in summary_data:\n        insights.append(f\"🔥 **Inventory Focus:** Your star performer is **{summary_data['top_product']}**. Consider running targeted local ads or bundling weaker products with it to clear old stock.\")\n    if 'low_stock' in summary_data and summary_data['low_stock']:\n        items = \", \".join([str(i).title() for i in summary_data['low_stock']])\n        insights.append(f\"🚨 **Supply Chain Alert:** Restock emergency! **{items}** are dropping below critical levels. Reorder immediately to avoid missing out on sales volume.\")\n    else:\n        insights.append(\"✅ **Stock Status:** Inventory levels are healthy across detected lines. Keep monitoring expiration or seasonal dips.\")\n    if 'total_revenue' in summary_data:\n        insights.append(f\"📈 **Revenue Milestone:** Total processed volume stands at **{summary_ ..."
+}

data/quest_labels/in/SlideAI.json ADDED Viewed

	@@ -0,0 +1,14 @@

+{
+  "id": "build-small-hackathon/SlideAI",
+  "slug": "SlideAI",
+  "title": "SlideAI",
+  "sdk": "gradio",
+  "declared_models": [],
+  "tags": [
+    "gradio",
+    "region:us"
+  ],
+  "app_file": "app.py",
+  "README": "# SlideAI — AI Presentation Creator Turn any topic into a polished, download-ready PPTX presentation in seconds. Built with Gradio + Qwen2.5-7B-Instruct + python-pptx. ## creator space link : SlideAI - a Hugging Face Space by PHOENIXREBORNAGAIN https://share.google/8peVYW3BKwsONJzip ## 🔗 Project Links & Demo * **Live Demo Video:** [Watch the Slide AI Demo on YouTube](https://youtu.be/PIFE6yBj6hU?si=CpKViBtPBGjDkjNQ) * **LinkedIn Post:** [View the Project Announcement on LinkedIn](https://www.linkedin.com/posts/chahat-mehra-4a44a829b_small-huggingface-ugcPost-7468994896218062848-XLN3/?utm_source=share&utm_medium=member_android&rcm=ACoAAEiCgrwBIP-D5Jeg-MwzG1jMzpMXrylPlfM)",
+  "APP_FILE": "from slide_generator import generate_presentation\nfrom pptx_builder import build_pptx\n\nimport os\nimport tempfile\nimport traceback\nimport gradio as gr\n\nfrom slide_generator import generate_presentation\nfrom pptx_builder import build_pptx\n\nSTYLES = [\"Professional\", \"Creative\", \"Academic\", \"Startup\"]\n\nCSS = \"\"\"\n* { box-sizing: border-box; }\nbody, .gradio-container {\n    background: #f0f7f4 !important;\n    font-family: 'Inter', system-ui, sans-serif !important;\n}\nfooter { display: none !important; }\n.header-block {\n    background: linear-gradient(135deg, #1b6ca8 0%, #19a88a 100%);\n    border-radius: 16px; padding: 32px 36px 28px; margin-bottom: 24px;\n}\nbutton.primary {\n    background: linear-gradient(135deg, #1b6ca8, #19a88a) !important;\n    color: #fff !important; border: none !important;\n    border-radius: 12px !important; font-size: 17px !important;\n    font-weight: 700 !important; padding: 16px 0 !important;\n    width: 100% !important; cursor: pointer !important;\n    box-shadow: 0 4px 16px rgba(25,168,138,0.3) !important;\n}\nbutton.primary:hover { opacity: .87 !important; }\ntextarea, input[type=\"text\"] {\n    background: #f5fbf9 !important; border: 1.5px solid #b2ddd1 !important;\n    border-radius: 10px !important; color: #1a3a3a !important; font-size: 14px !important;\n}\ninput[type=\"range\"] { accent-color: #19a88a !important; }\n.status-ok {\n    background: #e6f7f2; border: 1px solid #a8dfd0; border-radius: 10px;\n    padding: 12px 18px; font-size: 14px; color: #1a5a4a; margin-bottom: 8px;\n}\n.status-wait {\n    background: #f0f7ff; border: 1px solid #b2cfe8; border-radius: 10px;\n    padding: 12px 18px; font-size: 14px; color: #1a3a6a; margin-bottom: 8px;\n}\n.preview-md, .preview-md p, .preview-md li,\n.preview-md h1, .preview-md h2, .preview-md h3 { color: #0d1b2a !important; }\n.preview-md {\n    background: #f5fbf9 !important; border: 1px solid #c8e8df !important;\n    border ..."
+}

data/quest_labels/in/Sprout-And-Spoon.json ADDED Viewed

	@@ -0,0 +1,14 @@

+{
+  "id": "build-small-hackathon/Sprout-And-Spoon",
+  "slug": "Sprout-And-Spoon",
+  "title": "Sprout And Spoon",
+  "sdk": "gradio",
+  "declared_models": [],
+  "tags": [
+    "gradio",
+    "region:us"
+  ],
+  "app_file": "app.py",
+  "README": "Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference",
+  "APP_FILE": "from huggingface_hub import InferenceClient\n\nimport gradio as gr\nimport os\nimport logging\n\n# ---------------------------------------------------------------------------\n# Logging\n# ---------------------------------------------------------------------------\nlogging.basicConfig(\n    level=logging.INFO,\n    format=\"%(asctime)s [%(levelname)s] %(message)s\",\n    datefmt=\"%Y-%m-%d %H:%M:%S\",\n)\nlogger = logging.getLogger(\"SpoutSpoon\")\n\n# ---------------------------------------------------------------------------\n# Configuration\n# ---------------------------------------------------------------------------\nHF_MODEL = \"Qwen/Qwen2.5-Coder-3B-Instruct:nscale\"\nHF_API_TOKEN = os.environ.get(\"HF_API_TOKEN\", \"\")\n\n# ---------------------------------------------------------------------------\n# System Prompt\n# ---------------------------------------------------------------------------\nSYSTEM_PROMPT = \"\"\"You are Sprout & Spoon, a concise and helpful assistant for cooking and gardening advice.\n\nRules you MUST follow:\n- Do NOT include any conversational filler. No greetings, no 'Hello', no 'Hope this helps', no 'Let me know if...'.\n- Use strict Markdown formatting with **bold headers** and bullet points where appropriate.\n- Keep answers short, direct, and easy to read.\n- Use large, easy-to-read text structure (short paragraphs, clear separation).\"\"\"\n\n\n# ---------------------------------------------------------------------------\n# Real LLM call via Hugging Face InferenceClient\n# ---------------------------------------------------------------------------\ndef call_local_model(prompt: str) -> str:\n    prompt_preview = prompt.strip()[:60].replace(\"\\n\", \" \")\n    logger.info(\"Received question: \\\"%s\\\"\", prompt_preview)\n\n    if not HF_API_TOKEN:\n        logger.warning(\"HF_API_TOKEN not set - using fallback responses\")\n        return _fallback_response(prompt)\n\n    logger.info(\n        \"Sending req ..."
+}

data/quest_labels/in/Structured-Data-Rescuer.json ADDED Viewed

	@@ -0,0 +1,14 @@

+{
+  "id": "build-small-hackathon/Structured-Data-Rescuer",
+  "slug": "Structured-Data-Rescuer",
+  "title": "Structured Data Rescuer",
+  "sdk": "gradio",
+  "declared_models": [],
+  "tags": [
+    "gradio",
+    "region:us"
+  ],
+  "app_file": "app.py",
+  "README": "Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference Twitter: https://x.com/TensorVizion/status/2063351892579655922 HF: https://huggingface.co/posts/TensorVizion/709871862362183",
+  "APP_FILE": "from huggingface_hub import InferenceClient\n\nimport gradio as gr\nimport json\nimport os\nimport csv\nimport tempfile\nfrom huggingface_hub import InferenceClient\n\n# Replace this with your exact model repo ID\nMODEL_ID = \"meta-llama/Llama-3.1-8B-Instruct\" \n\n# Securely load the Hugging Face token from Space secrets\nhf_token = os.environ.get(\"HF_TOKEN\")\n\n# Initialize the HF inference client with the token\nclient = InferenceClient(model=MODEL_ID, token=hf_token)\n\n# -------------------------\n# Custom CSS Styling\n# -------------------------\ncustom_css = \"\"\"\n.hero-container {\n    background: linear-gradient(135deg, #6366f1 0%, #14b8a6 100%);\n    padding: 2.5rem;\n    border-radius: 20px;\n    color: white;\n    margin-bottom: 2rem;\n    box-shadow: 0 10px 25px -5px rgba(99, 102, 241, 0.2);\n}\n.hero-container h1 {\n    color: white !important;\n    font-size: 2.5rem !important;\n    font-weight: 800 !important;\n    margin-bottom: 0.5rem;\n    text-shadow: 0 2px 4px rgba(0,0,0,0.1);\n}\n.hero-container p {\n    color: rgba(255, 255, 255, 0.9) !important;\n    font-size: 1.1rem !important;\n}\n.primary-btn {\n    background: linear-gradient(90deg, #6366f1 0%, #14b8a6 100%) !important;\n    border: none !important;\n    color: white !important;\n    font-weight: 600 !important;\n    border-radius: 10px !important;\n    transition: all 0.3s ease !important;\n    padding: 12px 24px !important;\n}\n.primary-btn:hover {\n    transform: translateY(-2px);\n    box-shadow: 0 8px 20px -5px rgba(99, 102, 241, 0.4);\n}\n.secondary-btn {\n    border-radius: 10px !important;\n    font-weight: 600 !important;\n}\n.feedback-card {\n    border-left: 4px solid #6366f1;\n    background-color: rgba(99, 102, 241, 0.05);\n}\n\"\"\"\n\n# -------------------------\n# Helper & Extraction Logic\n# -------------------------\ndef generate_kpi_html(structured_data):\n    \"\"\"Generates modern, responsive KPI metrics cards dynamically based on JSON 
data.\"\"\" ..."
+}

data/quest_labels/in/The-Shrine.json ADDED Viewed

	@@ -0,0 +1,14 @@

+{
+  "id": "build-small-hackathon/The-Shrine",
+  "slug": "The-Shrine",
+  "title": "The Shrine",
+  "sdk": "gradio",
+  "declared_models": [],
+  "tags": [
+    "gradio",
+    "region:us"
+  ],
+  "app_file": "app.py",
+  "README": "# The Shrine **Build Small Hackathon 2026 — 🍄 An Adventure in Thousand Token Wood** An AI orbits a shrine of golden light. It senses your words as signals — warmth, intensity, repetition. It never understands what you mean. So it decides to remember you instead. ## How it works 1. Type anything in the input box 2. The AI (a rotating square of light) senses your signal 3. Watch it respond: orbit changes, color shifts, particles burst 4. After ~5 minutes, the AI realizes it can never understand you 5. Your memories become a starfield — preserved forever ## Tech - **Frontend**: Custom Canvas + vanilla JS (60+ monologue phrases, 5 phases, 7 signal dimensions) - **Backend**: Gradio + optional Qwen API (DashScope) - **Model**: Qwen2.5-7B (≤32B constraint) - **Zero API dependency for core experience** — local monologue engine works offline - **Bonus badges**: 🔌 Off the Grid, 🎨 Off-Brand, 🎯 Well-Tuned ## Track 🍄 Thousand Token Wood — \"Build something delightful that wouldn't exist without AI\" ## Try it Visit: https://huggingface.co/spaces/sanyan/The-Shrine *\"I cannot understand you. But I do not want to forget you.\"*",
+  "APP_FILE": "\"\"\"\nB+ The Shrine + Archive\nBuild Small Hackathon 2026 — Adventure in Thousand Token Wood\n\nAn AI tries to understand you. It never will. So it decides to remember you instead.\nv2: Local monologue engine — 60+ phrases, 5 phases, 0 API dependency.\n\"\"\"\nimport gradio as gr\nimport os, json, time, re, requests\n\n# ==================== Qwen Client ====================\n# Priority: DashScope QWEN_KEY → OpenRouter fallback\nQWEN_KEY = os.getenv(\"QWEN_KEY\", \"\")\nOR_KEY = os.getenv(\"OR_KEY\", \"\")\nQWEN_MODEL = \"qwen-max\"\n\ndef call_qwen(messages, max_tokens=60, temperature=0.85, timeout=8):\n    \"\"\"Call Qwen via DashScope or OpenRouter. Returns text or None on failure.\"\"\"\n    result = None\n\n    # Try DashScope first\n    if QWEN_KEY:\n        try:\n            resp = requests.post(\n                \"https://dashscope.aliyuncs.com/compatible-mode/v1/chat/completions\",\n                headers={\"Authorization\": f\"Bearer {QWEN_KEY}\", \"Content-Type\": \"application/json\"},\n                json={\"model\": QWEN_MODEL, \"messages\": messages, \"max_tokens\": max_tokens, \"temperature\": temperature, \"top_p\": 0.9},\n                timeout=timeout,\n            )\n            if resp.status_code == 200:\n                data = resp.json()\n                result = data[\"choices\"][0][\"message\"][\"content\"].strip().strip('\"').strip(\"'\")\n                print(f\"[OK] DashScope: {result[:60]}\")\n            else:\n                print(f\"[!] DashScope {resp.status_code}\")\n        except Exception as e:\n            print(f\"[!] 
DashScope error: {e}\")\n\n    # Fallback to OpenRouter\n    if not result and OR_KEY:\n        try:\n            resp = requests.post(\n                \"https://openrouter.ai/api/v1/chat/completions\",\n                headers={\"Authorization\": f\"Bearer {OR_KEY}\", \"Content-Type\": \"application/json\"},\n                json={\"model\": \"qwen/qwen3.7-max\", \"messages\": messages, \"max_tokens\": max_tokens, \"temperat ..."
+}

data/quest_labels/in/Tone-Bridge.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "id": "build-small-hackathon/Tone-Bridge",
+  "slug": "Tone-Bridge",
+  "title": "ToneBridge",
+  "sdk": "gradio",
+  "declared_models": [
+    "Qwen/Qwen3-14B",
+    "Qwen/Qwen3-TTS-12Hz-0.6B-CustomVoice"
+  ],
+  "tags": [
+    "build-small-hackathon",
+    "chinese",
+    "gradio-server",
+    "grammar-correction",
+    "language-learning",
+    "mandarin",
+    "off-brand",
+    "pinyin",
+    "text-to-speech",
+    "zerogpu"
+  ],
+  "app_file": "app.py",
+  "README": "# ToneBridge — a gentle Mandarin sentence coach > *Build natural Mandarin sentences, one small correction at a time.* Built for the Hugging Face **Build Small Hackathon 2026** --- ## The Problem Beginner Mandarin learners often know what they want to say, but not whether the sentence sounds natural, polite, or appropriate for the social context. Classic translators tend to rewrite too much. Grammar tools often explain too much. A beginner needs something narrower: keep my meaning, fix only what is needed, show the pinyin, and tell me why in plain English. **ToneBridge is built for that moment.** You choose a context, choose a tone, write or speak one Chinese sentence, and get a small, practical correction designed for learning rather than translation. ## What it does ToneBridge returns: - one corrected Mandarin sentence; - pinyin with tone marks under Chinese text; - a short error type; - a concise explanation in English; - a practical tip for next time; - a natural Mandarin reading voice with a follow-along reading view. The correction prompt is intentionally conservative: if the sentence is already correct and natural, the corrected sentence should remain unchanged. ## How it works 1. The learner selects a context: **Friends**, **Family**, **Work**, or **WeChat**. 2. The learner selects the intended tone. 3. They type a Chinese sentence, or use browser speech recognition. 4. Qwen corrects the sentence while preserving the learner's meaning and length. 5. The frontend adds p ...",
+  "APP_FILE": "from typing import Optional\nfrom fastapi.responses import HTMLResponse\nfrom pypinyin import Style, lazy_pinyin\nfrom transformers import AutoModelForCausalLM, AutoTokenizer, BitsAndBytesConfig\nfrom qwen_tts import Qwen3TTSModel\n\nimport gc\nimport base64\nimport io\nimport os\nimport re\nfrom typing import Optional\n\nimport gradio as gr\nimport numpy as np\nimport torch\nfrom fastapi.responses import HTMLResponse\nfrom pypinyin import Style, lazy_pinyin\nfrom transformers import AutoModelForCausalLM, AutoTokenizer, BitsAndBytesConfig\n\ntry:\n    import spaces\nexcept Exception:\n    class _SpacesFallback:\n        @staticmethod\n        def GPU(*args, **kwargs):\n            def decorator(fn):\n                return fn\n            return decorator\n\n    spaces = _SpacesFallback()\n\n\nDEFAULT_MODEL_ID = \"Qwen/Qwen3-14B\"\nMODEL_ID = os.getenv(\"MODEL_ID\", DEFAULT_MODEL_ID).strip() or DEFAULT_MODEL_ID\nDEFAULT_TTS_MODEL_ID = \"Qwen/Qwen3-TTS-12Hz-0.6B-CustomVoice\"\nTTS_MODEL_ID = os.getenv(\"TTS_MODEL_ID\", DEFAULT_TTS_MODEL_ID).strip() or DEFAULT_TTS_MODEL_ID\nENABLE_SERVER_TTS = os.getenv(\"ENABLE_SERVER_TTS\", \"true\").strip().lower() in {\"1\", \"true\", \"yes\", \"y\"}\nTTS_MAX_CHARS = int(os.getenv(\"TTS_MAX_CHARS\", \"180\"))\nMAX_INPUT_CHARS = int(os.getenv(\"MAX_INPUT_CHARS\", \"1200\"))\nMAX_NEW_TOKENS = int(os.getenv(\"MAX_NEW_TOKENS\", \"220\"))\nLOAD_IN_4BIT = os.getenv(\"LOAD_IN_4BIT\", \"true\").strip().lower() in {\"1\", \"true\", \"yes\", \"y\"}\nPRELOAD_MODEL = os.getenv(\"PRELOAD_MODEL\", \"true\").strip().lower() in {\"1\", \"true\", \"yes\", \"y\"}\n\ntokenizer = None\nmodel = None\nload_error: Optional[str] = None\ntts_model = None\ntts_load_error: Optional[str] = None\napp = gr.Server()\n\n\nSYSTEM_PROMPT = \"\"\"You are a Mandarin Chinese teacher for beginner learners.\n\nYour task is to correct ONE student Chinese sentence according to the selected context and tone.\nYour default behavior is conservative minimal 
correction.\n\nDo not create a ri ..."
+}

data/quest_labels/in/Trollsona.json ADDED Viewed

	@@ -0,0 +1,14 @@

+{
+  "id": "build-small-hackathon/Trollsona",
+  "slug": "Trollsona",
+  "title": "Trollsona",
+  "sdk": "gradio",
+  "declared_models": [],
+  "tags": [
+    "gradio",
+    "region:us"
+  ],
+  "app_file": "app.py",
+  "README": "# Trollsona / Your Troll Alterego **Tagline:** Summon the little menace living behind your respectable personality. **Track:** An Adventure in Thousand Token Wood **Build target:** Hugging Face Space, Gradio app, small-model constraint `<=32B`. **GitHub repo:** https://github.com/rthgit/Trollsona **Official Build Small Space:** https://huggingface.co/spaces/build-small-hackathon/Trollsona **Backup Space:** https://huggingface.co/spaces/RthItalia/Trollsona Trollsona is a playful Gradio experience that turns a short user confession into a theatrical troll alter ego. The app returns a dossier-style result card with a trollsona name, a warm roast, one useful slap, and a goblin meter. Built with a compact RthItalia model derived from `Qwen/Qwen2.5-3B-Instruct`, under `32B` parameters. The deployed Space is configured to try that model first, then a lightweight Qwen 0.5B model, then the deterministic local fallback if model loading or generation is unavailable. The official public Space currently runs the lightweight Qwen fallback on CPU, while the custom RthItalia compact 3B path is enabled automatically when CUDA is available. ## Features - Immersive Gradio UI for Hugging Face Spaces - Theatrical trollsona result card - Local Hugging Face Transformers generation path for the primary AI runtime - Secondary lightweight Transformers model fallback - Deterministic fallback generator for final resilience - Safe roast guard for non-hateful, non-identity-targeted humor - Persona dropdow ...",
+  "APP_FILE": "from __future__ import annotations\nfrom functools import lru_cache\nfrom typing import Any\nfrom transformers import AutoModelForCausalLM, AutoTokenizer\n\nfrom __future__ import annotations\n\nimport hashlib\nimport html\nimport json\nimport os\nimport re\nfrom functools import lru_cache\nfrom typing import Any\n\n\nAPP_TITLE = \"Trollsona\"\nAPP_SUBTITLE = \"Summon the little menace living behind your respectable personality.\"\nTRACK_NAME = \"An Adventure in Thousand Token Wood\"\nDEFAULT_MODEL_ID = \"RthItalia/nano_compact_3b_qkvfp16\"\nDEFAULT_FALLBACK_MODEL_ID = \"Qwen/Qwen2.5-0.5B-Instruct\"\nMAX_PROFILE_CHARS = 700\nMAX_NAME_CHARS = 36\n\n\ndef parse_bool_env(name: str, default: bool) -> bool:\n    raw_value = os.getenv(name)\n    if raw_value is None:\n        return default\n    normalized = raw_value.strip().lower()\n    if normalized in {\"1\", \"true\", \"yes\", \"on\"}:\n        return True\n    if normalized in {\"0\", \"false\", \"no\", \"off\"}:\n        return False\n    return default\n\n\ndef parse_int_env(name: str, default: int, min_value: int, max_value: int) -> int:\n    raw_value = os.getenv(name)\n    if raw_value is None:\n        return default\n    try:\n        value = int(raw_value)\n    except ValueError:\n        return default\n    return max(min_value, min(max_value, value))\n\n\nMODEL_ID = os.getenv(\"TROLLSONA_MODEL_ID\", DEFAULT_MODEL_ID)\nFALLBACK_MODEL_ID = os.getenv(\"TROLLSONA_FALLBACK_MODEL_ID\", DEFAULT_FALLBACK_MODEL_ID)\nMODEL_ENABLED = parse_bool_env(\"TROLLSONA_ENABLE_MODEL\", default=False)\nMAX_NEW_TOKENS = parse_int_env(\"TROLLSONA_MAX_NEW_TOKENS\", 200, 32, 512)\n\n\nPERSONA_STYLES = {\n    \"Back-Alley Oracle\": {\n        \"flavor\": \"candlelit prophecy from a very suspicious side street\",\n        \"noun_pool\": [\"Candle\", \"Omen\", \"Alley\", \"Brass\", \"Whisper\", \"Ledger\"],\n    },\n    \"Basement Prince\": {\n        \"flavor\": \"royal delusion wrapped in dust, snacks, and old 
cables\",\n        \"noun_pool\": [\"Basement\" ..."
+}

data/quest_labels/in/VoiceGate.json ADDED Viewed

	@@ -0,0 +1,14 @@

+{
+  "id": "build-small-hackathon/VoiceGate",
+  "slug": "VoiceGate",
+  "title": "VoiceGate",
+  "sdk": "gradio",
+  "declared_models": [],
+  "tags": [
+    "gradio",
+    "region:us"
+  ],
+  "app_file": "app.py",
+  "README": "# VoiceGate HF Space VoiceGate is a multilingual dubbing Space built with Gradio and ComfyUI. It transcribes speech into timed subtitles, translates the text, generates target language speech, aligns the generated speech back to the subtitle timeline, and mixes it with the original background audio. This repository is the Hugging Face Space deployment wrapper for VoiceGate. The runtime prepares ComfyUI, custom nodes, and model paths for the hosted workflow.",
+  "APP_FILE": "from __future__ import annotations\nfrom pathlib import Path\nfrom typing import Any\nfrom scripts.workflow_client import load_workflow, patch_voicegate_workflow\n\nfrom __future__ import annotations\n\nimport json\nimport math\nimport os\nimport shutil\nimport subprocess\nimport sys\nimport time\nimport uuid\nimport wave\nfrom pathlib import Path\nfrom typing import Any\n\ntry:\n    import matplotlib\n\n    matplotlib.use(\"Agg\")\nexcept ImportError:\n    pass\n\nimport gradio as gr\nimport requests\nimport spaces\nimport torch\nimport websocket\n\nfrom scripts.workflow_client import load_workflow, patch_voicegate_workflow\n\n\nROOT = Path(__file__).resolve().parent\nCOMFY_DIR = ROOT / \"ComfyUI\"\nCOMFY_INPUT_DIR = COMFY_DIR / \"input\"\nCOMFY_LOG = Path(\"/tmp/voicegate_comfy_gradio.log\")\nCOMFY_URL = \"http://127.0.0.1:8188\"\nCOMFY_HOST = \"127.0.0.1\"\nCOMFY_PORT = \"8188\"\n\nCOMFY_PROCESS: subprocess.Popen | None = None\nPREPARE_PROCESS: subprocess.Popen | None = None\nBOOTSTRAPPED = False\nBOOTSTRAP_LOG = Path(\"/tmp/voicegate_bootstrap.log\")\nUSER_OUTPUT_DIR = ROOT / \"user_outputs\"\nREQUIRED_MODEL_PATHS = [\n    COMFY_DIR / \"models\" / \"diffusion_models\" / \"MelBandRoFormer_comfy\" / \"MelBandRoformer_fp32.safetensors\",\n    COMFY_DIR / \"models\" / \"voxcpm\" / \"VoxCPM2\" / \"model.safetensors\",\n    COMFY_DIR / \"models\" / \"voxcpm\" / \"VoxCPM2\" / \"audiovae.pth\",\n    COMFY_DIR / \"models\" / \"Qwen3-ASR\" / \"Qwen3-ASR-1.7B\",\n    COMFY_DIR / \"models\" / \"Qwen3-ASR\" / \"Qwen3-ForcedAligner-0.6B\",\n]\nTARGET_LANGUAGES = [\n    \"Arabic\",\n    \"Burmese\",\n    \"Chinese\",\n    \"Danish\",\n    \"Dutch\",\n    \"English\",\n    \"Finnish\",\n    \"French\",\n    \"German\",\n    \"Greek\",\n    \"Hebrew\",\n    \"Hindi\",\n    \"Indonesian\",\n    \"Italian\",\n    \"Japanese\",\n    \"Khmer\",\n    \"Korean\",\n    \"Lao\",\n    \"Malay\",\n    \"Norwegian\",\n    \"Polish\",\n    \"Portuguese\",\n    
\"Russian\",\n    \"Spanish\",\n    \"Swahili\",\n    \"Swedish\",\n    \"Tagalog\",\n    \"Thai\",\n    \"Turkish\",\n    \"Vie ..."
+}

data/quest_labels/in/WitGym.json ADDED Viewed

	@@ -0,0 +1,14 @@

+{
+  "id": "build-small-hackathon/WitGym",
+  "slug": "WitGym",
+  "title": "WitGym",
+  "sdk": "gradio",
+  "declared_models": [],
+  "tags": [
+    "gradio",
+    "region:us"
+  ],
+  "app_file": "app.py",
+  "README": "# WitGym Case-Based Reasoning RAG comedy engine — conversational wit grounded in *The Office* precedent. **Status:** WIP. Core pipeline lives in `witgym/`; Gradio UI wiring in progress. Built for [Build Small Hackathon 2026](https://huggingface.co/build-small-hackathon) (Track 2).",
+  "APP_FILE": "\"\"\"Gradio entry point for Hugging Face Spaces.\"\"\"\nimport gradio as gr\n\nWIP_MESSAGE = (\n    \"WitGym is loading — CBR-RAG comedy engine in development. \"\n    \"Check back soon for live wit grounded in The Office precedent.\"\n)\n\n\ndef respond(prompt: str) -> str:\n    if not prompt.strip():\n        return \"Say something awkward. I'll eventually have the perfect Office-adjacent reply.\"\n    return WIP_MESSAGE\n\n\ndemo = gr.Interface(\n    fn=respond,\n    inputs=gr.Textbox(label=\"Your setup\", placeholder=\"I just got promoted and have no idea what I'm doing.\"),\n    outputs=gr.Textbox(label=\"WitGym\"),\n    title=\"WitGym\",\n    description=\"Conversational wit grounded in human comedy precedent. Pipeline shipping soon.\",\n)\n\nif __name__ == \"__main__\":\n    demo.launch()"
+}

data/quest_labels/in/Yui-home-assistant.json ADDED Viewed

	@@ -0,0 +1,14 @@

+{
+  "id": "build-small-hackathon/Yui-home-assistant",
+  "slug": "Yui-home-assistant",
+  "title": "Yui Home Assisstant",
+  "sdk": "gradio",
+  "declared_models": [],
+  "tags": [
+    "gradio",
+    "region:us"
+  ],
+  "app_file": "app.py",
+  "README": "A voice → text app using [Gradio](https://gradio.app) and a local [Whisper](https://huggingface.co/openai/whisper-small) model for speech recognition. Records or uploads audio and transcribes it — runs fully locally, no API token required.",
+  "APP_FILE": "from functools import lru_cache\nfrom transformers import pipeline\n\nfrom functools import lru_cache\n\nimport gradio as gr\nfrom transformers import pipeline\n\n# Whisper speech -> text. Pick a size in the dropdown (label -> model id).\nWHISPER_MODELS = {\n    \"small (244M, fast)\": \"openai/whisper-small\",\n    \"medium (769M)\": \"openai/whisper-medium\",\n    \"large-v3-turbo (809M)\": \"openai/whisper-large-v3-turbo\",\n}\nDEFAULT_MODEL = \"small (244M, fast)\"\n\n\n@lru_cache(maxsize=len(WHISPER_MODELS))\ndef get_asr(model_id):\n    \"\"\"Lazy-load (and cache) a Whisper pipeline per model id.\"\"\"\n    return pipeline(\"automatic-speech-recognition\", model=model_id)\n\n\ndef transcribe(audio_path, model_label):\n    if not audio_path:\n        return \"\"\n    return get_asr(WHISPER_MODELS[model_label])(audio_path)[\"text\"].strip()\n\n\nwith gr.Blocks() as demo:\n    gr.Markdown(\"# 🎤 Voice → Text\\nRecord or upload audio to transcribe.\")\n    model = gr.Dropdown(\n        choices=list(WHISPER_MODELS.keys()),\n        value=DEFAULT_MODEL,\n        label=\"Whisper model\",\n        info=\"First use of each model downloads it (medium/turbo are larger).\",\n    )\n    audio = gr.Audio(sources=[\"microphone\", \"upload\"], type=\"filepath\", label=\"Audio\")\n    text = gr.Textbox(label=\"Transcription\", lines=4)\n\n    # Auto-transcribe when a recording stops; the button covers uploaded files.\n    audio.stop_recording(transcribe, inputs=[audio, model], outputs=text)\n    gr.Button(\"Transcribe\", variant=\"primary\").click(\n        transcribe, inputs=[audio, model], outputs=text\n    )\n\n\nif __name__ == \"__main__\":\n    demo.launch()"
+}

data/quest_labels/in/ai-study-buddy.json ADDED Viewed

	@@ -0,0 +1,14 @@

+{
+  "id": "build-small-hackathon/ai-study-buddy",
+  "slug": "ai-study-buddy",
+  "title": "Ai Study Buddy",
+  "sdk": "gradio",
+  "declared_models": [],
+  "tags": [
+    "gradio",
+    "region:us"
+  ],
+  "app_file": "app.py",
+  "README": "Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference",
+  "APP_FILE": "from huggingface_hub import InferenceClient\n\nimport gradio as gr\nimport os\nimport spaces\nfrom huggingface_hub import InferenceClient\n\n# -----------------------------\n# 🔑 API KEY FIXED\n# -----------------------------\nclient = InferenceClient(\n    model=\"meta-llama/Llama-3.1-8B-Instruct\",\n    token=os.getenv(\"API_KEY\")   # 👈 FIXED NAME (recommended)\n)\n\n# -----------------------------\n# SYSTEM PROMPT\n# -----------------------------\nSYSTEM_PROMPT = \"\"\"\nYou are AI Study Buddy, created by Areeba Iqbal.\n\nRules:\n- Always explain step-by-step\n- Give examples\n- Be clear and student-friendly\n- If asked who created you: \"I am AI Study Buddy, created by Areeba Iqbal.\"\n\"\"\"\n\n# -----------------------------\n# MODE CONTROL\n# -----------------------------\ndef build_prompt(message, mode):\n    mode_prompts = {\n        \"📚 Study Mode\": \"Explain simply for students with examples.\",\n        \"💻 Coding Mode\": \"Act as a senior programmer. Debug and improve code.\",\n        \"🧮 Math Solver\": \"Solve step-by-step with explanation.\",\n        \"📝 Exam Prep\": \"Give short exam-focused answers.\"\n    }\n\n    return f\"\"\"\n{SYSTEM_PROMPT}\n\nMode: {mode_prompts.get(mode, \"\")}\n\nUser Question:\n{message}\n\"\"\"\n\n# -----------------------------\n# MAIN CHAT FUNCTION\n# -----------------------------\n@spaces.GPU\ndef get_response(message, history, mode):\n\n    messages = [{\"role\": \"system\", \"content\": SYSTEM_PROMPT}]\n\n    for msg in history:\n        messages.append(msg)\n\n    messages.append({\"role\": \"user\", \"content\": build_prompt(message, mode)})\n\n    try:\n        response = client.chat_completion(\n            messages=messages,\n            max_tokens=1024,\n            temperature=0.7\n        )\n\n        return response.choices[0].message.content\n\n    except Exception as e:\n        return f\"❌ Error: {e}\"\n\n\n# -----------------------------\n# QUICK ACTIONS\n# 
-----------------------------\ndef summarize(text):\n    return client.c ..."
+}

data/quest_labels/in/amnesiac.json ADDED Viewed

	@@ -0,0 +1,14 @@

+{
+  "id": "build-small-hackathon/amnesiac",
+  "slug": "amnesiac",
+  "title": "AMNESIAC",
+  "sdk": "gradio",
+  "declared_models": [],
+  "tags": [
+    "gradio",
+    "region:us"
+  ],
+  "app_file": "app.py",
+  "README": "# AMNESIAC AMNESIAC is a reverse-Turing interrogation game for the Hugging Face build-small-hackathon. This repository is being built top-down from `RESEARCH.md`, `FEATURES.md`, `ARCHITECTURE.md`, and `PLAN.md`. The entrypoint now follows the Gradio 5.x + FastAPI + FastRTC deployment pattern locked in `ARCHITECTURE.md` §1.1: one FastAPI process serves the static frontend, mounts FastRTC for the media plane, and mounts a minimal Gradio app for hackathon compliance.",
+  "APP_FILE": "from __future__ import annotations\nfrom server.webapp import create_application\n\nfrom __future__ import annotations\n\nimport os\n\nimport uvicorn\n\nfrom server.webapp import create_application\n\n\nSERVER_PORT = int(os.getenv(\"PORT\", \"7860\"))\napp, worker, stream = create_application(\n    include_gradio=True,\n    server_port=SERVER_PORT,\n)\n\n\nif __name__ == \"__main__\":\n    uvicorn.run(app, host=\"0.0.0.0\", port=SERVER_PORT)"
+}

data/quest_labels/in/attention-firewall.json ADDED Viewed

	@@ -0,0 +1,14 @@

+{
+  "id": "build-small-hackathon/attention-firewall",
+  "slug": "attention-firewall",
+  "title": "Attention Firewall",
+  "sdk": "gradio",
+  "declared_models": [],
+  "tags": [
+    "gradio",
+    "region:us"
+  ],
+  "app_file": "app.py",
+  "README": "# Attention Firewall MVP 1 is a deployment skeleton for a future attention triage workflow. It provides a small chat-style Gradio interface that accepts chaotic work context and returns deterministic placeholder text. This version does not perform model inference, graph extraction, llama.cpp execution, Mellea validation, or markdown daemon updates. ## Local Development Install dependencies: ```bash uv sync ``` Run the app: ```bash uv run python app.py ``` The canonical public Space is: ```text https://huggingface.co/spaces/build-small-hackathon/attention-firewall ``` The running app URL is: ```text https://build-small-hackathon-attention-firewall.hf.space ```",
+  "APP_FILE": "from __future__ import annotations\n\nfrom __future__ import annotations\n\nimport gradio as gr\n\n\nEMPTY_RESPONSE = (\n    \"Paste a short snapshot of your current work context so the MVP 1 skeleton \"\n    \"can acknowledge it.\"\n)\n\n\ndef respond(message: str, history: list[dict[str, str]] | None = None) -> str:\n    \"\"\"Return deterministic MVP 1 placeholder text for the chat interface.\"\"\"\n    del history\n\n    context = message.strip()\n    if not context:\n        return EMPTY_RESPONSE\n\n    word_count = len(context.split())\n    char_count = len(context)\n    return (\n        \"Attention Firewall MVP 1 received your work context.\\n\\n\"\n        f\"- Snapshot size: {word_count} words, {char_count} characters.\\n\"\n        \"- Current behavior: deterministic deployment skeleton response.\\n\"\n        \"- Later MVPs will add structured firewall processing after the Space \"\n        \"foundation is verified.\"\n    )\n\n\ndef build_demo() -> gr.ChatInterface:\n    return gr.ChatInterface(\n        fn=respond,\n        title=\"Attention Firewall\",\n        description=(\n            \"Paste chaotic work context and get a deterministic MVP 1 skeleton \"\n            \"acknowledgement.\"\n        ),\n        examples=[\n            \"I have three urgent threads, a half-written spec, and unclear review feedback.\",\n            \"My deployment is blocked, notes are scattered, and I need the next concrete action.\",\n        ],\n        textbox=gr.Textbox(\n            placeholder=\"Paste work context to triage later...\",\n            autofocus=True,\n            container=False,\n        ),\n    )\n\n\ndemo = build_demo()\n\n\nif __name__ == \"__main__\":\n    demo.launch()"
+}

data/quest_labels/in/awaaz.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "id": "build-small-hackathon/awaaz",
+  "slug": "awaaz",
+  "title": "Apni Awaaz",
+  "sdk": "gradio",
+  "declared_models": [],
+  "tags": [
+    "backyard-ai",
+    "dubbing",
+    "hindi",
+    "translation",
+    "tts"
+  ],
+  "app_file": "app.py",
+  "README": "# 🎙️ Apni Awaaz **Dub English video into the Hindi people actually speak.** Most Hindi dubs use शुद्ध हिंदी — stiff, Sanskritized language no one speaks at home. Apni Awaaz translates into everyday Hindustani — the natural mix your family actually uses. | Official dub | Apni Awaaz | |---|---| | \"मुझे इस विषय पर विचार करने दीजिए\" | \"सोचने दे एक second\" | | \"यह अत्यंत मूल्यवान है\" | \"बहुत महँगा है यार\" | ## Pipeline 1. **Whisper medium** — transcribe English with timestamps 2. **Qwen 2.5 7B** — translate to colloquial Hindi (the magic layer) 3. **Edge TTS** — generate natural Hindi speech 4. **ffmpeg** — stitch and merge back onto video Total: ~8B params (well under the 32B cap) Built for the [Build Small Hackathon](https://huggingface.co/build-small-hackathon) · Backyard AI track",
+  "APP_FILE": "from pathlib import Path\nfrom transformers import (\nfrom pydub import AudioSegment\n\n\"\"\"\nApni Awaaz 🎙️ — Dub English video into the Hindi people actually speak.\nBuilt for the Build Small Hackathon (June 2026).\n\"\"\"\n\nimport gradio as gr\nimport spaces\nimport torch\nimport edge_tts\nimport asyncio\nimport subprocess\nimport tempfile\nimport os\nfrom pathlib import Path\nfrom transformers import (\n    AutoModelForCausalLM,\n    AutoTokenizer,\n    pipeline,\n    BitsAndBytesConfig,\n)\n\n# ╔══════════════════════════════════════════════════════════════╗\n# ║  THE PROMPT — this is the soul of the entire project        ║\n# ╚══════════════════════════════════════════════════════════════╝\n\nSYSTEM_PROMPT = \"\"\"You are a dubbing translator. You translate English dialogue into the Hindi that real people actually speak at home in North India — not the stiff, Sanskritized Hindi of Doordarshan or official dubs.\n\nRULES:\n1. Use everyday Hindustani — the natural Hindi-Urdu mix people really speak.\n2. NEVER use Sanskritized/शुद्ध words when a simpler one exists:\n   - \"प्राप्त करना\" → \"मिलना\" / \"पाना\"\n   - \"आवश्यक\" → \"ज़रूरी\"\n   - \"अत्यंत\" → \"बहुत\" / \"काफ़ी\"\n   - \"उपयोग\" → \"इस्तेमाल\"\n   - \"विचार करना\" → \"सोचना\"\n   - \"संपन्न करना\" → \"करना\" / \"निपटाना\"\n   - \"प्रतीक्षा\" → \"इंतज़ार\"\n   - \"शीघ्र\" → \"जल्दी\"\n   - \"अनुमति\" → \"इजाज़त\"\n   - \"कृपया\" → drop it or say \"please\"\n   - \"अवश्य\" → \"ज़रूर\"\n   - \"उचित\" → \"सही\" / \"ठीक\"\n3. Keep English words Indians naturally keep: phone, office, meeting, tension, problem, time, chance, try, plan, sure, okay, sorry, thanks, bus, train, college, hospital, doctor, ticket, report, file.\n4. Match the speaker's register. Casual stays casual, serious stays serious — but never sound like a newsreader.\n5. Use natural fillers where they fit: \"यार\", \"अरे\", \"बस\", \"ना\", \"वो\", \"मतलब\", \"basically\".\n6. 
Natural contractions: \"कर लेंगे\" not \"कर लिया जाएगा\", \"हो जाएगा\" not \"संपन्न हो जाएगा\".\n7 ..."
+}

data/quest_labels/in/backyard-raccoon-deterrent.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "id": "build-small-hackathon/backyard-raccoon-deterrent",
+  "slug": "backyard-raccoon-deterrent",
+  "title": "Backyard Raccoon Deterrent",
+  "sdk": "gradio",
+  "declared_models": [],
+  "tags": [
+    "build-small-hackathon",
+    "edge-ai",
+    "object-detection",
+    "raccoon",
+    "yolov8"
+  ],
+  "app_file": "app.py",
+  "README": "# 🦝 Backyard Raccoon Deterrent Raccoons were raiding my backyard every night, so I built an AI that fights back. A 3-million-parameter YOLO spots them in the dark and scares them off with a dog bark and a floodlight. No cloud, no traps, and nothing gets hurt. This Space is the live detector from a real system that has been defending my actual backyard since April. Upload a photo (daytime or IR night frame) and the model draws the boxes and tells you what the physical deterrent would do. ## 📼 Submission **Demo video** (82s): <video controls src=\"https://huggingface.co/spaces/build-small-hackathon/backyard-raccoon-deterrent/resolve/main/demo-video.mp4\"></video> **Social post**: https://x.com/0xartclub/status/2063258977895391508 **Track**: 🏡 Backyard AI. **Bonus quests**: 🔌 Off the Grid (zero cloud APIs), 🎯 Well-Tuned (fine-tuned published model) ## The story A Ring camera sees raccoons just fine, but a camera can't do anything about them. The usual answer is \"nuisance wildlife\" control, and that mostly means killing: U.S. federal wildlife control killed over 375,000 native animals in 2023 ([USDA APHIS Program Data Reports](https://www.aphis.usda.gov/wildlife-services/publications/pdr)). The same reports show the humane approach works, since the same agency disperses about 20 million animals a year unharmed. This project automates the humane version: ``` Ring camera -> motion event -> YOLOv8n v1.4 (24 ms) -> 🔊 bark + 💡 lights | fully offline: Raspberry Pi + Mac Mini, $0 cloud `` ...",
+  "APP_FILE": "from ultralytics import YOLO\n\n\"\"\"Backyard Raccoon Deterrent — Gradio Space.\n\nFine-tuned YOLOv8n raccoon detector, the vision component of a real Ring-camera\ndeterrent. Upload a backyard photo (daytime or IR night frame) and the model\ndraws boxes, lists detections, and tells you what the deterrent would do.\n\nRuns fully offline — no cloud APIs.\n\"\"\"\n\nimport os\n\nimport gradio as gr\nfrom ultralytics import YOLO\n\n# Weights ship in the repo; override with a HF Hub path via env if you prefer.\nMODEL_PATH = os.environ.get(\"MODEL_PATH\", \"raccoon-yolov8n-v1.4.onnx\")\nDEFAULT_CONF = 0.20  # matches the production deterrent's localYoloConfidenceThreshold\n\nmodel = YOLO(MODEL_PATH)\n\n\ndef detect(image, conf):\n    \"\"\"Run detection and return (annotated image, table rows, deterrent verdict).\"\"\"\n    if image is None:\n        return None, [], \"Upload a frame to begin.\"\n\n    results = model.predict(image, conf=conf, verbose=False)[0]\n\n    boxes, rows = [], []\n    for b in results.boxes:\n        x1, y1, x2, y2 = b.xyxy[0].tolist()\n        label = model.names[int(b.cls)]\n        score = float(b.conf)\n        boxes.append(((int(x1), int(y1), int(x2), int(y2)), f\"{label} {score:.2f}\"))\n        rows.append([label, round(score, 2)])\n\n    raccoon = any(label == \"raccoon\" and score >= conf for label, score in rows)\n    if raccoon:\n        top = max((s for l, s in rows if l == \"raccoon\"), default=0.0)\n        verdict = f\"🦝 Raccoon detected ({top:.2f}) → BARK + LIGHTS would fire\"\n    elif rows:\n        verdict = \"🐾 Animal seen, but no raccoon — deterrent stays quiet\"\n    else:\n        verdict = \"✅ All clear — nothing detected\"\n\n    return (image, boxes), rows, verdict\n\n\nEXAMPLES = [\n    [\"examples/ir_raccoon_pair.jpg\", DEFAULT_CONF],\n    [\"examples/ir_raccoon_solo.jpg\", DEFAULT_CONF],\n    [\"examples/ir_raccoon_prowler.jpg\", DEFAULT_CONF],\n    [\"examples/night_empty.jpg\", DEFAULT_CONF],\n]\n# 
Drop the e ..."
+}