""" Hugging Face Spaces entrypoint (Gradio). Uses the same backend as the Reflex UI via `reflex_ui.backend_bridge.run_prediction`. """ from __future__ import annotations import os import sys from pathlib import Path import gradio as gr import pandas as pd REPO_ROOT = Path(__file__).resolve().parent os.chdir(REPO_ROOT) if str(REPO_ROOT) not in sys.path: sys.path.insert(0, str(REPO_ROOT)) _reflex_pkg_parent = REPO_ROOT / "reflex_ui" if str(_reflex_pkg_parent) not in sys.path: sys.path.insert(0, str(_reflex_pkg_parent)) _reflex_pkg_nested = _reflex_pkg_parent / "reflex_ui" if str(_reflex_pkg_nested) not in sys.path: sys.path.insert(0, str(_reflex_pkg_nested)) from backend_bridge import run_prediction # noqa: E402 def _predict(code: str, language: str, top_k: float): text = (code or "").strip() if not text: return ( "*Paste a non-empty code snippet.*", "", pd.DataFrame(), "", ) lang = (language or "python").lower() if lang not in ("python", "java"): lang = "python" k = int(top_k) if top_k else 6 k = max(1, min(30, k)) try: r = run_prediction(code=text, language=lang, top_k=k) except Exception as e: return (f"**{type(e).__name__}:** `{e}`", "", pd.DataFrame(), "") label_md = f"## Prediction: **{r.label}**\n\nP(AI) = **{r.prob_ai:.4f}**" grouped_lines = [ f"- **{name}:** {val:.4f}" for name, val in sorted(r.grouped_importance.items(), key=lambda x: -x[1]) ] grouped_md = "### Group importance\n" + ("\n".join(grouped_lines) if grouped_lines else "_n/a_") df = pd.DataFrame(r.shap_rows) if not df.empty and "impact" in df.columns: show = df.drop(columns=["impact"], errors="ignore") else: show = df return label_md, r.explanation, show, grouped_md with gr.Blocks(title="AI vs Human Code Classifier") as demo: gr.Markdown( "# AI vs Human Code Classifier\n" "Classifies snippets as **AI** or **Human** using XGBoost on statistical, AST, " "stylometry, language, and **UnixCoder** semantic features, with **SHAP** attributions." ) with gr.Row(): language = gr.Radio(choices=["python", "java"], value="python", label="Language") top_k = gr.Slider(1, 20, value=6, step=1, label="Top SHAP features") code = gr.Code(label="Code", language="python", lines=18) run_btn = gr.Button("Run prediction", variant="primary") out_head = gr.Markdown() out_grouped = gr.Markdown() out_expl = gr.Markdown(label="Narrative explanation") out_table = gr.Dataframe(label="Top feature attributions", wrap=True) run_btn.click( _predict, inputs=[code, language, top_k], outputs=[out_head, out_expl, out_table, out_grouped], ) if __name__ == "__main__": demo.launch(server_name="0.0.0.0", server_port=7860)