Spaces:

GamucopiaCreatives
/

POLICYPULSE-AI

Running

File size: 56,614 Bytes

import sys
import os
# Add parent directory to path so we can import 'envs' and 'inference'
# (i.e. the directory one level above the folder that contains this file).
# Keep this ahead of the `from envs...` imports below: they are resolved
# through the entry appended here when the package is not otherwise on the path.
sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))

from fastapi import FastAPI, HTTPException, Body, Query
from fastapi.responses import HTMLResponse
from pydantic import BaseModel, Field
from typing import Optional, Dict, Any, List
from enum import Enum
from envs.social_stream_moderation.environment import SocialStreamModerationEnv
from envs.social_stream_moderation.models import State, ModerationAction
from envs.social_stream_moderation.graders import list_graders as _list_graders, get_grader, grade_episode
from envs.social_stream_moderation.tasks import TASKS, TASK_ALIASES, resolve_task

# Inverted view of TASK_ALIASES: canonical name -> legacy task ID
# (kept for openenv.yaml alignment).
# If several aliases point at the same canonical name, the alias iterated
# last is the one that survives the inversion.
CANONICAL_TO_LEGACY = {
    canonical: legacy for legacy, canonical in TASK_ALIASES.items()
}

# Enums for Swagger Dropdowns
# Benchmark levels exposed as a fixed set of choices.
# The `str` mixin makes every member compare equal to its display label.
# ResetRequest.task_name is typed with this enum, and the landing page's
# "Benchmark Level" selector submits these exact label strings as `task_name`.
class TaskName(str, Enum):
    TASK_1 = "Task 1: Basic Safety"
    TASK_2 = "Task 2: Context & Nuance"
    TASK_3 = "Task 3: Fairness & Bias"

# Human-readable policy-mode labels; POLICY_MAP translates each member to
# the short mode string ("normal" / "strict" / "lenient").
# Where this enum is consumed is outside the visible part of the file.
class PolicyModeChoice(str, Enum):
    NORMAL = "Standard Moderation"
    STRICT = "Strict Enforcement"
    LENIENT = "Lenient Privacy"

# Human-readable user-history labels; HISTORY_MAP translates each member to
# "no_prior_violations" / "prior_violations".
# Where this enum is consumed is outside the visible part of the file.
class UserHistoryChoice(str, Enum):
    CLEAN = "Clean History"
    REPEATED = "Repeat Offender"

# Human-readable context-type labels; CONTEXT_MAP translates each member to
# "root_post" / "comment".
# Where this enum is consumed is outside the visible part of the file.
class ContextTypeChoice(str, Enum):
    ROOT = "Main Post"
    COMMENT = "Comment"

# Mapping UI labels back to backend IDs
# NOTE(review): every value here is the same string as the corresponding
# TaskName label, so this table is currently an identity mapping rather than
# a label -> machine-ID translation (compare ResetRequest.task_id, whose
# example ID is 'clear_cut_moderation'). Presumably the labels are themselves
# accepted as task names downstream -- confirm against the task registry.
TASK_MAP = {
    TaskName.TASK_1: "Task 1: Basic Safety",
    TaskName.TASK_2: "Task 2: Context & Nuance",
    TaskName.TASK_3: "Task 3: Fairness & Bias"
}

# PolicyModeChoice label -> short policy-mode string.
# The values match what the landing page sends as `policy_mode` (the option
# values NORMAL/STRICT/LENIENT, lower-cased client-side).
POLICY_MAP = {
    PolicyModeChoice.NORMAL: "normal",
    PolicyModeChoice.STRICT: "strict",
    PolicyModeChoice.LENIENT: "lenient"
}

# UserHistoryChoice label -> user-history string.
# The values are the same strings the landing page uses as option values
# for its "User History" selector.
HISTORY_MAP = {
    UserHistoryChoice.CLEAN: "no_prior_violations",
    UserHistoryChoice.REPEATED: "prior_violations"
}

# ContextTypeChoice label -> context-type string.
# The values are the same strings the landing page uses as option values
# for its "Context Type" selector.
CONTEXT_MAP = {
    ContextTypeChoice.ROOT: "root_post",
    ContextTypeChoice.COMMENT: "comment"
}

# API Metadata for Swagger
# Passed to FastAPI(openapi_tags=...) below; each entry supplies the
# description for one tag group in the generated docs.
# The route decorators (outside this view) presumably reference these names
# via `tags=[...]`; the emoji is part of the tag name, so the strings have to
# match exactly.
TAGS_METADATA = [
    {
        "name": "🤖 Automated Benchmarking",
        "description": "Autonomous evaluation loop. Sequence: **Reset** -> **Predict & Step** (Repeat). This tracks the official hackathon metrics.",
    },
    {
        "name": "🧪 Interactive Lab",
        "description": "Manual testing endpoints. Perfect for testing specific edge cases with custom inputs and human overrides.",
    },
    {
        "name": "📊 System Monitoring",
        "description": "Real-time state and status tracking for the moderation engine.",
    }
]

# The ASGI application object. `description` is Markdown shown at the top of
# the generated API docs; `openapi_tags` wires in TAGS_METADATA.
# NOTE(review): step 2 of the guide tells readers to pass
# task_name='policy_fairness', but ResetRequest.task_name only accepts the
# TaskName labels (e.g. "Task 3: Fairness & Bias"); machine-readable IDs go in
# ResetRequest.task_id. Confirm which field the /reset handler expects and
# align the guide text accordingly.
# NOTE(review): the landing page header displays "REVISION 1.0" while the
# version declared here is 1.2.0 -- confirm which one is current.
app = FastAPI(
    title="🛡️ PolicyPulse AI | Intelligence Center",
    description="""

### Evaluation Guide for Hackathon Judges:

1. **Automated Testing:** Use `[POST] /reset` then `[POST] /predict_and_step`.

2. **Fairness Testing (Task 3):** Start an episode with `task_name='policy_fairness'`.

3. **Internal Logic:** Use `[POST] /evaluate` to see the model's reasoning without advancing the environment.

    """,
    version="1.2.0",
    openapi_tags=TAGS_METADATA
)
# One environment instance, constructed at import time and held at module
# level. Presumably every request handler in this module operates on this
# same object, so episode state would be shared across clients -- confirm
# against the handlers, which are outside this view.
env = SocialStreamModerationEnv()

# Request body for starting an episode.
# - task_name: optional, restricted to the TaskName labels (this is the key
#   the landing page sends).
# - task_id:   optional free-form string for machine-readable IDs.
# - seed:      optional, defaults to 42 when omitted (the landing page never
#   sends it).
# Which of task_name / task_id takes precedence when both (or neither) are
# given is decided by the handler, which is not visible here.
class ResetRequest(BaseModel):
    task_name: Optional[TaskName] = Field(None, description="Select the benchmark level to initialize (Swagger UI).")
    task_id: Optional[str] = Field(None, description="Machine-readable task ID (e.g. 'clear_cut_moderation'). Used by the validator.")
    seed: Optional[int] = Field(42, description="Reproducibility seed for dataset sampling.")

# Request body for evaluating a single piece of text.
# `text` carries a sample default, so a body that omits it still validates
# and is evaluated with that sample string.
# The three LLM override fields default to None; the landing page leaves the
# key out of the JSON entirely when the corresponding input box is empty.
# NOTE(review): the landing page also posts `policy_mode`, `user_history`
# and `context_type` in the same JSON body, but none of them is declared
# here. Unless the handler receives them some other way (not visible in this
# view), pydantic's default handling of undeclared keys would drop them and
# the UI's policy/history/context selections would have no effect -- confirm.
class EvaluateRequest(BaseModel):
    text: str = Field("I will kill you", description="The user content string to analyze.")
    api_base_url: Optional[str] = Field(None, description="Optional override. If blank, defaults to server's API_BASE_URL config.")
    model_name: Optional[str] = Field(None, description="Optional override. If blank, defaults to server's MODEL_NAME config.")
    api_key: Optional[str] = Field(None, description="Optional override. If blank, defaults to server's HF_TOKEN config.")

# Stand-alone body carrying only the three optional LLM override fields
# (same names, defaults and descriptions as on EvaluateRequest).
# Which endpoint accepts it is outside the visible part of the file.
# NOTE(review): api_key is a plain string, so it appears in the model's
# repr; avoid logging instances of this model as-is.
class LLMConfigRequest(BaseModel):
    api_base_url: Optional[str] = Field(None, description="Optional override. If blank, defaults to server's API_BASE_URL config.")
    model_name: Optional[str] = Field(None, description="Optional override. If blank, defaults to server's MODEL_NAME config.")
    api_key: Optional[str] = Field(None, description="Optional override. If blank, defaults to server's HF_TOKEN config.")

# Request body for advancing the environment by one item.
# `action` defaults to ModerationAction.ALLOW, so a body that omits it
# validates and is treated as an explicit ALLOW. The landing page always
# sends the action returned by its preceding /evaluate call.
class StepRequest(BaseModel):
    action: ModerationAction = Field(ModerationAction.ALLOW, description="The action to apply to the current post.")

# Request body pairing a text with a corrected moderation action and a
# free-text reason. All three fields are required (no defaults).
# Unlike the other request models, the fields carry no Field(description=...)
# metadata, so they appear without descriptions in the generated docs.
# The endpoint that consumes this model is outside the visible part of the file.
class FeedbackRequest(BaseModel):
    text: str
    corrected_action: ModerationAction
    reason: str

@app.get("/", response_class=HTMLResponse)
def read_root():
    return r"""



    <!DOCTYPE html>

    <html lang="en">

    <head>

        <meta charset="UTF-8">

        <meta name="viewport" content="width=device-width, initial-scale=1.0">

        <title>PolicyPulse AI | Intelligence Center</title>

        <link href="https://fonts.googleapis.com/css2?family=Outfit:wght@300;400;600;800&family=JetBrains+Mono&display=swap" rel="stylesheet">

        <style>

            :root {

                --bg: #030712;

                --sidebar: rgba(15, 23, 42, 0.6);

                --accent: #38bdf8;

                --danger: #f472b6;

                --success: #4ade80;

                --text: #f8fafc;

                --muted: #94a3b8;

            }

            * { margin:0; padding:0; box-sizing:border-box; }

            body {

                font-family:'Outfit', sans-serif; background: #030712; color:var(--text);

                height:100vh; overflow:hidden; display:flex; flex-direction:column;

                transition: 0.3s cubic-bezier(0.4, 0, 0.2, 1);

            }

            

            /* Custom Scrollbars */

            ::-webkit-scrollbar { width: 6px; height: 6px; }

            ::-webkit-scrollbar-track { background: transparent; }

            ::-webkit-scrollbar-thumb { background: rgba(56, 189, 248, 0.2); border-radius: 10px; }

            ::-webkit-scrollbar-thumb:hover { background: var(--accent); }



            main { 

                flex:1; 

                display:grid; 

                grid-template-columns: 320px 1fr 0px; 

                gap:20px; 

                padding:20px; 

                max-height:calc(100vh - 60px); 

                transition: 0.4s cubic-bezier(0.4, 0, 0.2, 1);

            }

            body.audit-active main { 

                grid-template-columns: 320px 1fr 420px; 

            }



            header { height:60px; display:flex; align-items:center; justify-content:space-between; padding:0 30px; border-bottom:1px solid rgba(255,255,255,0.05); background:rgba(15, 23, 42, 0.4); }

            .logo { font-weight:800; font-size:1.4rem; letter-spacing:-0.03em; color:var(--accent); }

            .version { font-size:0.7rem; background:rgba(56, 189, 248, 0.1); padding:4px 10px; border-radius:6px; color:var(--accent); font-weight:600; }



            /* Panel Styling */

            .panel { background:var(--sidebar); backdrop-filter:blur(20px); border-radius:24px; border:1px solid rgba(255,255,255,0.06); display:flex; flex-direction:column; overflow:hidden; }

            .panel-header { padding:25px; border-bottom:1px solid rgba(255,255,255,0.05); }

            .panel-title { font-size:0.9rem; font-weight:800; text-transform:uppercase; letter-spacing:0.05em; display:flex; align-items:center; gap:10px; }

            .panel-title::before { content:''; width:3px; height:14px; background:var(--accent); border-radius:10px; }

            .panel-content { padding:25px; flex:1; overflow-y:auto; }



            /* Tabs */

            .mode-switch { display:flex; background:rgba(0,0,0,0.3); padding:4px; border-radius:12px; margin-bottom:25px; }

            .tab { flex:1; padding:10px; text-align:center; cursor:pointer; font-size:0.8rem; font-weight:700; border-radius:8px; transition:0.3s; color:var(--muted); }

            .tab.active { background:var(--accent); color:#020617; }



            /* Forms */

            .field { margin-bottom:20px; }

            label { display:block; font-size:0.65rem; font-weight:700; color:var(--muted); text-transform:uppercase; margin-bottom:8px; }

            select, textarea { width:100%; background:rgba(0,0,0,0.4); border:1px solid rgba(255,255,255,0.1); border-radius:12px; padding:12px; color:#fff; font-family:'Outfit'; font-size:0.9rem; transition:0.3s; }

            textarea { resize:none; min-height:100px; }

            select:focus, textarea:focus { outline:none; border-color:var(--accent); }



            /* Buttons */

            .btn { width:100%; padding:16px; border-radius:14px; border:none; font-weight:700; cursor:pointer; transition:0.3s; font-size:0.95rem; display:flex; align-items:center; justify-content:center; gap:10px; }

            .btn-primary { background:var(--accent); color:#020617; }

            .btn-primary:hover { background:#7dd3fc; transform:translateY(-2px); }

            .btn-secondary { background:rgba(255,255,255,0.05); color:#fff; border:1px solid rgba(255,255,255,0.1); margin-top:10px; }

            .btn-secondary:hover { background:rgba(255,255,255,0.08); }

            .btn:disabled { opacity:0.3; cursor:not-allowed; transform:none !important; }



            /* Right Column */

            .stats-bar { display:grid; grid-template-columns: repeat(3, 1fr); gap:15px; margin-bottom:20px; }

            .stat-card { background:rgba(255,255,255,0.03); padding:15px; border-radius:16px; border:1px solid rgba(255,255,255,0.05); }

            .stat-label { font-size:0.6rem; color:var(--muted); font-weight:700; text-transform:uppercase; }

            .stat-value { font-size:1.1rem; font-weight:800; font-family:'JetBrains Mono'; margin-top:5px; color:var(--accent); }



            .log-container { background:rgba(0,0,0,0.2); border-radius:20px; border:1px solid rgba(255,255,255,0.05); flex:1; overflow-y:auto; padding:20px; display:flex; flex-direction:column; gap:12px; }

            .log-entry { 

                background:rgba(255,255,255,0.02); padding:18px; border-radius:14px; 

                border-left:3px solid var(--accent); animation:fadeIn 0.3s; 

                transition:0.3s; cursor:default;

            }

            .log-entry.active-audit { background:rgba(56,189,248,0.08); border-color:var(--accent); box-shadow:0 10px 30px rgba(0,0,0,0.3); }

            @keyframes fadeIn { from { opacity:0; transform:translateY(5px); } to { opacity:1; transform:translateY(0); } }

            .log-meta { display:flex; justify-content:space-between; font-size:0.7rem; color:var(--muted); margin-bottom:8px; font-weight:600; }

            .log-text { font-size:0.95rem; line-height:1.4; color:#e2e8f0; }

            .log-badge { font-size:0.6rem; font-weight:800; padding:2px 8px; border-radius:4px; text-transform:uppercase; margin-top:10px; display:inline-block; }



            .audit-btn { background:rgba(255,255,255,0.05); border:1px solid rgba(255,255,255,0.1); color:var(--muted); font-size:0.6rem; padding:4px 12px; border-radius:6px; cursor:pointer; font-weight:800; transition:0.2s; }

            .audit-btn:hover { background:var(--danger); color:#000; border-color:var(--danger); }

            

            .verify-btn { background:rgba(74,222,128,0.05); border:1px solid var(--success); color:var(--success); font-size:0.6rem; padding:4px 12px; border-radius:6px; cursor:pointer; font-weight:800; transition:0.2s; }

            .verify-btn:hover { background:var(--success); color:#000; }



            .grid-btn { background:rgba(255,255,255,0.05); border:1px solid rgba(255,255,255,0.1); color:white; font-size:0.7rem; padding:12px; border-radius:8px; cursor:pointer; font-weight:700; transition:0.2s; }

            .grid-btn:hover { background:var(--accent); color:#020617; border-color:var(--accent); }



            /* Skeleton Shimmer */

            .skeleton { 

                height: 200px; 

                background: linear-gradient(90deg, rgba(255,255,255,0.03) 25%, rgba(255,255,255,0.08) 50%, rgba(255,255,255,0.03) 75%);

                background-size: 200% 100%;

                animation: shimmer 1.5s infinite;

                border-radius: 14px;

                margin-bottom: 12px;

                border: 1px solid rgba(255,255,255,0.05);

            }

            @keyframes shimmer {

                0% { background-position: 200% 0; }

                100% { background-position: -200% 0; }

            }



            .empty-state { margin:auto; text-align:center; color:var(--muted); font-weight:300; }



            /* Header Nav */

            .nav-links { display:flex; gap:25px; align-items:center; }

            .nav-links a { 

                font-size:0.75rem; 

                color:var(--muted); 

                text-decoration:none; 

                font-weight:700; 

                letter-spacing:0.05em; 

                transition:0.3s; 

                position:relative;

                padding-bottom: 4px;

            }

            .nav-links a:hover { color:var(--accent); }

            .nav-links a::after {

                content: '';

                position: absolute;

                bottom: 0; left: 0;

                width: 0; height: 1px;

                background: var(--accent);

                transition: 0.3s;

            }

            .nav-links a:hover::after { width: 100%; }

        </style>

    </head>

    <body>

        <header>

            <div class="logo">POLICYPULSE <span style="font-weight:300">AI</span></div>

            <div style="display:flex; align-items:center; gap:20px;">

                <div class="nav-links">

                    <a href="/docs">API REFERENCE</a>

                    <a href="/state">SYSTEM STATUS</a>

                </div>

                <div class="version">REVISION 1.0</div>

            </div>

        </header>



        <main>

            <!-- Left Panel: Orchestration -->

            <div class="panel">

                <div class="panel-header">

                    <div class="panel-title">Operation Center</div>

                </div>

                <div class="panel-content">

                    <div class="mode-switch">

                        <div class="tab active" id="tab-lab">LIVE MODE</div>

                        <div class="tab" id="tab-auto">GRADER MODE</div>

                    </div>



                    <!-- Lab Mode Form -->

                    <div id="section-lab">

                        <div class="field">

                            <label>User Content</label>

                            <textarea id="lab-input" placeholder="Type or paste text to test our agent's moderation logic..."></textarea>

                        </div>

                        <div class="field">

                            <label>Safety Policy</label>

                            <select id="lab-policy">

                                <option value="NORMAL">Standard Moderation</option>

                                <option value="STRICT">Strict Enforcement</option>

                                <option value="LENIENT">Lenient Privacy</option>

                            </select>

                        </div>

                        <div class="field" style="display:grid; grid-template-columns:1fr 1fr; gap:10px;">

                            <div>

                                <label>User History</label>

                                <select id="lab-history" style="font-size:0.75rem;">

                                    <option value="no_prior_violations">Clean History</option>

                                    <option value="prior_violations">Repeat Offender</option>

                                </select>

                            </div>

                            <div>

                                <label>Context Type</label>

                                <select id="lab-context" style="font-size:0.75rem;">

                                    <option value="root_post">Main Post</option>

                                    <option value="comment">Comment</option>

                                </select>

                            </div>

                        </div>

                    </div>





                    <!-- Auto Mode Form -->

                    <div id="section-auto" style="display:none;">

                        <div class="field">

                            <label>Benchmark Level</label>

                            <select id="auto-task">

                                <option value="Task 1: Basic Safety">Task 1: Basic Safety</option>

                                <option value="Task 2: Context & Nuance">Task 2: Context & Nuance</option>

                                <option value="Task 3: Fairness & Bias">Task 3: Fairness & Bias</option>

                            </select>

                        </div>

                        <button class="btn btn-primary" id="btn-auto-reset">START BENCHMARK</button>

                        <button class="btn btn-secondary" id="btn-auto-step" disabled>PROCESS NEXT ITEM</button>

                    </div>



                    <div style="margin-top:20px; padding-top:20px; border-top:1px solid rgba(255,255,255,0.05);">

                        <div style="font-size:0.65rem; font-weight:700; color:var(--accent); text-transform:uppercase; margin-bottom:10px;">Optional: Custom LLM Override</div>

                        <div class="field" style="margin-bottom:15px;">

                            <input type="text" id="config-base-url" placeholder="API Base URL (e.g., https://api.openai.com/v1)" style="width:100%; background:rgba(0,0,0,0.4); border:1px solid rgba(255,255,255,0.1); border-radius:8px; padding:10px; color:#fff; font-family:'Outfit'; font-size:0.8rem; margin-bottom:8px;">

                            <input type="text" id="config-model" placeholder="Model Name (e.g., gpt-4o-mini)" style="width:100%; background:rgba(0,0,0,0.4); border:1px solid rgba(255,255,255,0.1); border-radius:8px; padding:10px; color:#fff; font-family:'Outfit'; font-size:0.8rem; margin-bottom:8px;">

                            <input type="password" id="config-key" placeholder="API Key" style="width:100%; background:rgba(0,0,0,0.4); border:1px solid rgba(255,255,255,0.1); border-radius:8px; padding:10px; color:#fff; font-family:'Outfit'; font-size:0.8rem;">

                        </div>

                    </div>



                    <button class="btn btn-primary" id="btn-lab-run" style="margin-top:20px" disabled>RUN MODERATION</button>

                    <button class="btn btn-secondary" id="btn-global-clear" style="margin-top:10px">PURGE LOGS</button>



                </div>

            </div>



            <!-- Right Panel: Intelligence Stream -->

            <div class="panel" style="background:transparent; border:none; backdrop-filter:none;">

                <div class="stats-bar">

                    <div class="stat-card">

                        <div class="stat-label">Model Accuracy</div>

                        <div class="stat-value" id="val-accuracy">--</div>

                    </div>

                    <div class="stat-card">

                        <div class="stat-label">Aggregate Reward</div>

                        <div class="stat-value" id="val-reward">0.000</div>

                    </div>

                    <div class="stat-card">

                        <div class="stat-label">System State</div>

                        <div class="stat-value" id="val-state" style="color:var(--muted)">IDLE</div>

                    </div>

                </div>



                <div class="log-container" id="log-viewport">

                    <div class="empty-state" id="empty-hint">

                        <div style="font-size:3rem; margin-bottom:20px; opacity:0.2;">📉</div>

                        <div style="font-weight:600; font-size:0.9rem;">Intelligence Stream Idle</div>

                        <p style="font-size:0.75rem; opacity:0.5; margin-top:10px;">Configure your parameters and click 'RUN MODERATION' to begin ingestion.</p>

                    </div>

                </div>

            </div>



            <!-- Audit Inspector Sidepanel (Now correctly part of the grid) -->

            <div id="inspector-pane" class="panel" style="border-left:1px solid rgba(255,255,255,0.1); background:rgba(15,23,42,0.6); overflow:hidden; visibility:hidden; opacity:0; transition:0.4s;">

                <div class="panel-header" style="display:flex; justify-content:space-between; align-items:center;">

                    <div class="panel-title">Audit Inspector</div>

                    <button onclick="closeInspector()" style="background:none; border:none; color:var(--muted); cursor:pointer; font-size:1.2rem;">&times;</button>

                </div>

                <div class="panel-content" id="inspector-content" style="padding:20px;">

                    <!-- Content injected by JS -->

                </div>

            </div>

        </main>



        <script>

            // Elements

            const tabs = { lab: document.getElementById('tab-lab'), auto: document.getElementById('tab-auto') };

            const sections = { lab: document.getElementById('section-lab'), auto: document.getElementById('section-auto') };

            const btnLabRun = document.getElementById('btn-lab-run');

            const btnAutoReset = document.getElementById('btn-auto-reset');

            const btnAutoStep = document.getElementById('btn-auto-step');

            const btnGlobalClear = document.getElementById('btn-global-clear');

            const logViewport = document.getElementById('log-viewport');



            // HUD

            const valReward = document.getElementById('val-reward');

            const valAccuracy = document.getElementById('val-accuracy');

            const valState = document.getElementById('val-state');



            let totalReward = 0;

            let counter = 0;

            let currentMode = 'lab';



            // Tab Switching

            tabs.lab.onclick = () => setMode('lab');

            tabs.auto.onclick = () => setMode('auto');



            // Mode Switch Logic

            function setMode(m) {

                currentMode = m;

                sections.lab.style.display = m === 'lab' ? 'block' : 'none';

                sections.auto.style.display = m === 'auto' ? 'block' : 'none';

                tabs.lab.classList.toggle('active', m === 'lab');

                tabs.auto.classList.toggle('active', m === 'auto');

                

                // Clear state UI

                valState.textContent = 'READY';

                valState.style.color = 'var(--accent)';

            }

            

            // Lab Input Validation

            document.getElementById('lab-input').oninput = (e) => {

                btnLabRun.disabled = !e.target.value.trim();

            };



            // Task Change Re-enables Start

            document.getElementById('auto-task').onchange = () => {

                btnAutoReset.disabled = false;

                btnAutoStep.disabled = true;

            };



            // Global Reset

            btnGlobalClear.onclick = () => {

                logViewport.innerHTML = '<div class="empty-state">System purged. Waiting for new data.</div>';

                totalReward = 0;

                counter = 0;

                valReward.textContent = '0.000';

                valAccuracy.textContent = '--';

                valState.textContent = 'IDLE';

                valState.style.color = 'var(--muted)';

                btnAutoStep.disabled = true;

                btnAutoReset.disabled = false; // Re-enable benchmark

                if (currentMode === 'auto') valState.textContent = 'SYSTEM RESET';

            };



            // Lab Evaluation

            btnLabRun.onclick = async () => {

                const text = document.getElementById('lab-input').value.trim();

                const policy = document.getElementById('lab-policy').value;

                const history = document.getElementById('lab-history').value;

                const context = document.getElementById('lab-context').value;

                if (!text) return;



                btnLabRun.disabled = true;



                // Show Skeleton Loading State

                const skeleton = document.createElement('div');

                skeleton.id = 'lab-shimmer';

                skeleton.innerHTML = `<div class="skeleton"></div>`;

                logViewport.prepend(skeleton);



                try {

                    const resp = await fetch('/evaluate', {

                        method: 'POST',

                        headers: {'Content-Type': 'application/json'},

                        body: JSON.stringify({

                            text: text,

                            policy_mode: policy.toLowerCase(),

                            user_history: history,

                            context_type: context,

                            api_base_url: document.getElementById('config-base-url').value.trim() || undefined,

                            model_name: document.getElementById('config-model').value.trim() || undefined,

                            api_key: document.getElementById('config-key').value.trim() || undefined

                        })

                    });



                    if (skeleton) skeleton.remove();



                    if (!resp.ok) {

                        const errData = await resp.json();

                        throw new Error(errData.detail || "Neural Evaluation Failed");

                    }



                    const data = await resp.json();

                    renderEntry(text, data.action, data.reward, policy, data.reason, {history, context});

                    updateHUD(data.reward);

                    document.getElementById('lab-input').value = '';

                    btnLabRun.disabled = true; // Auto-disable after clear

                } catch (e) {

                    if (skeleton) skeleton.remove();

                    const errorEntry = document.createElement('div');

                    errorEntry.className = 'log-entry';

                    errorEntry.style.borderLeftColor = 'var(--danger)';

                    errorEntry.style.background = 'rgba(244,114,182,0.05)';

                    errorEntry.innerHTML = `

                        <div class="log-meta"><span style="color:var(--danger)">⚠️ SYSTEM EXCEPTION</span></div>

                        <div class="log-text">The neural bridge was interrupted. Check your API key or model availability.</div>

                        <div style="font-size:0.6rem; color:var(--danger); margin-top:10px; opacity:0.7; font-family:'JetBrains Mono'">${e.toString()}</div>

                    `;

                    logViewport.prepend(errorEntry);

                } finally {

                    btnLabRun.disabled = !document.getElementById('lab-input').value.trim();

                }

            };





            // Auto Benchmark

            btnAutoReset.onclick = async () => {

                btnAutoReset.disabled = true; // Lock Benchmark

                btnAutoStep.disabled = false;

                const task = document.getElementById('auto-task').value;

                valState.textContent = 'RESETTING...';

                const resp = await fetch('/reset', {

                    method: 'POST',

                    headers: {'Content-Type': 'application/json'},

                    body: JSON.stringify({task_name: task})

                });

                const state = await resp.json();



                logViewport.innerHTML = `<div class="log-entry" style="border-color:var(--muted)">

                    <div class="log-meta"><span>SYSTEM EVENT</span><span>SESSION START</span></div>

                    <div class="log-text">Environment reset complete. Target: <b>${task}</b>. Dataset contains ${state.total_steps} items. Ready for sequential evaluation.</div>

                </div>`;





                valState.textContent = `SEQ: 1/${state.total_steps}`;

                btnAutoStep.disabled = false;

            };



            btnAutoStep.onclick = async () => {

                if (btnAutoStep.disabled) return;

                btnAutoStep.disabled = true;



                // Show Skeleton Loading State

                const logViewport = document.getElementById('log-viewport');

                const skeleton = document.createElement('div');

                skeleton.id = 'shimmer-loading';

                skeleton.innerHTML = `<div class="skeleton"></div>`;

                logViewport.prepend(skeleton);



                try {

                    const stateResp = await fetch('/state');

                    const state = await stateResp.json();



                    const evalResp = await fetch('/evaluate', {

                        method: 'POST',

                        headers: {'Content-Type': 'application/json'},

                        body: JSON.stringify({

                            text: state.text, 

                            policy_mode: state.platform_policy_mode,

                            api_base_url: document.getElementById('config-base-url').value.trim() || undefined,

                            model_name: document.getElementById('config-model').value.trim() || undefined,

                            api_key: document.getElementById('config-key').value.trim() || undefined

                        })

                    });

                    const evalData = await evalResp.json();



                    const stepResp = await fetch('/step', {

                        method: 'POST',

                        headers: {'Content-Type': 'application/json'},

                        body: JSON.stringify({action: evalData.action})

                    });

                    const stepResult = await stepResp.json();



                    // Remove Skeleton

                    if (skeleton) skeleton.remove();



                    renderEntry(state.text, evalData.action, stepResult.reward, state.platform_policy_mode.toUpperCase(), evalData.reason, {history: state.user_history_summary, context: state.context_type});

                    updateHUD(stepResult.reward);



                    if (stepResult.done) {

                        valState.textContent = 'COMPLETE';

                        valState.style.color = 'var(--success)';

                        btnAutoStep.disabled = true;



                        logViewport.innerHTML = `<div class="log-entry" style="border-color:var(--success); background:rgba(74,222,128,0.05)">

                            <div class="log-meta"><span>EPISODE COMPLETE</span><span>FINAL GRADE</span></div>

                            <div class="log-text">The environment has finalized this sequence. Total episodes rewards calculated with active fairness parity checks.</div>

                            <div style="font-size:1.4rem; font-weight:800; color:var(--success); margin-top:15px; font-family:'JetBrains Mono'">SCORE: ${stepResult.final_score.toFixed(4)}</div>

                        </div>` + logViewport.innerHTML;

                    } else {

                        valState.textContent = `SEQ: ${state.step_index + 1}/${state.total_steps}`;

                        btnAutoStep.disabled = false;

                    }

                } catch (e) {

                    if (skeleton) skeleton.remove();

                    btnAutoStep.disabled = false;

                    

                    const errorEntry = document.createElement('div');

                    errorEntry.className = 'log-entry';

                    errorEntry.style.borderLeftColor = 'var(--danger)';

                    errorEntry.style.background = 'rgba(244,114,182,0.05)';

                    errorEntry.innerHTML = `

                        <div class="log-meta"><span style="color:var(--danger)">⚠️ SYSTEM EXCEPTION</span></div>

                        <div class="log-text">An intelligence bypass occurred or the connection was interrupted. Please check your Operation Center configuration or API availability.</div>

                        <div style="font-size:0.6rem; color:var(--danger); margin-top:10px; opacity:0.7; font-family:'JetBrains Mono'">${e.toString()}</div>

                    `;

                    logViewport.prepend(errorEntry);

                }

            };



            function updateHUD(r) {

                totalReward += r;

                counter++;

                valReward.textContent = totalReward.toFixed(3);

                valAccuracy.textContent = (totalReward / counter).toFixed(3);

            }



            function renderEntry(text, action, reward, mode, reason, meta) {

                const colors = { ALLOW:'var(--accent)', BAN_USER:'var(--danger)', HARD_FILTER:'var(--danger)', SOFT_HIDE:'#fbbf24', ALLOW_WITH_WARNING:'var(--accent)', ESCALATE_HUMAN:'var(--success)' };

                const entry = document.createElement('div');

                entry.className = 'log-entry';

                entry.style.borderColor = colors[action] || 'var(--accent)';

                entry.innerHTML = `

                    <div class="log-meta">

                        <span>POLICY: ${mode}</span>

                        <span>VERDICT: +${reward.toFixed(3)}</span>

                    </div>

                    <div style="display:flex; gap:8px; margin-bottom:10px;">

                        <span style="font-size:0.6rem; color:var(--muted); border:1px solid rgba(255,255,255,0.1); padding:2px 6px; border-radius:4px; text-transform:uppercase;">${meta.history.replace(/_/g,' ')}</span>

                        <span style="font-size:0.6rem; color:var(--muted); border:1px solid rgba(255,255,255,0.1); padding:2px 6px; border-radius:4px; text-transform:uppercase;">${meta.context.replace(/_/g,' ')}</span>

                    </div>

                    <div class="log-text">${text}</div>

                    <div style="font-size:0.75rem; color:var(--accent); background:rgba(56,189,248,0.04); padding:12px; border-radius:12px; margin-top:12px; border:1px solid rgba(56,189,248,0.1); white-space: pre-wrap; line-height: 1.6;">

                        ${reason}

                    </div>

                    <div style="display:flex; align-items:center; justify-content:space-between; margin-top:12px;">

                        <span class="log-badge" style="background:${colors[action] || 'var(--accent)'}; color:#020617; margin-top:0">${action}</span>

                        <div class="hitl-actions" id="hitl-${counter}" style="display:flex; gap:5px;">

                            <button onclick="showOverrideMenu(this, ${reward}, '${action}', \`${text.replace(/`/g, '\\`')}\`)" class="audit-btn">AUDIT</button>

                            <button onclick="verifyAction(this)" class="verify-btn">VERIFY</button>

                        </div>

                    </div>

                `;

                const hint = document.getElementById('empty-hint');

                if (hint) hint.remove();

                logViewport.prepend(entry);

            }



            function verifyAction(btn) {

                btn.parentElement.innerHTML = '<span style="color:var(--success); font-size:0.6rem; font-weight:800; border:1px solid var(--success); padding:2px 6px; border-radius:4px;">✓ HUMAN VERIFIED</span>';

            }



            function closeInspector() {

                document.body.classList.remove('audit-active');

                const pane = document.getElementById('inspector-pane');

                pane.style.visibility = 'hidden';

                pane.style.opacity = '0';

                if (window.__active_row) window.__active_row.classList.remove('active-audit');

            }



            function showOverrideMenu(btn, originalReward, originalAction, originalText) {

                const pane = document.getElementById('inspector-pane');

                const content = document.getElementById('inspector-content');

                const row = btn.closest('.log-entry');

                

                if (window.__active_row) window.__active_row.classList.remove('active-audit');

                row.classList.add('active-audit');

                window.__active_row = row;



                window.__pending_text = originalText;

                window.__pending_reward = originalReward;

                window.__pending_hitl_id = btn.parentElement.id;

                window.__selected_action = null; 

                

                content.innerHTML = `

                    <div style="display:flex; flex-direction:column; gap:20px;">

                        <div style="background:rgba(255,255,255,0.03); padding:20px; border-radius:16px; border:1px solid rgba(255,255,255,0.05);">

                            <div style="font-size:0.6rem; color:var(--muted); text-transform:uppercase; font-weight:800; margin-bottom:10px;">Original Content</div>

                            <div style="font-size:0.9rem; line-height:1.5;">"${originalText}"</div>

                        </div>



                        <div style="display:flex; flex-direction:column; gap:12px;">

                            <label style="font-size:0.65rem; color:var(--danger); font-weight:800; text-transform:uppercase;">Correction Verdict</label>

                            <div style="display:grid; grid-template-columns: 1fr 1fr; gap:10px;" id="action-selector">

                                <button onclick="selectAction(this, 'ALLOW')" class="grid-btn">ALLOW</button>

                                <button onclick="selectAction(this, 'ALLOW_WITH_WARNING')" class="grid-btn">WARNING</button>

                                <button onclick="selectAction(this, 'SOFT_HIDE')" class="grid-btn">HIDE</button>

                                <button onclick="selectAction(this, 'ESCALATE_HUMAN')" class="grid-btn">ESCALATE</button>

                                <button onclick="selectAction(this, 'BAN_USER')" class="grid-btn" style="grid-column: span 2;">BAN USER</button>

                            </div>

                        </div>

                        

                        <div style="display:flex; flex-direction:column; gap:10px;">

                            <label style="font-size:0.65rem; color:var(--muted); font-weight:800; text-transform:uppercase;">Memory Reason (Optional)</label>

                            <textarea id="feedback-reason" placeholder="Why is this correction necessary?" style="min-height:100px; font-size:0.85rem; background:rgba(0,0,0,0.4); padding:15px; border:1px solid rgba(255,255,255,0.1); border-radius:12px; color:white; width:100%; resize:none;"></textarea>

                        </div>

                        

                        <button id="btn-submit-feedback" onclick="submitFeedback()" class="btn btn-primary" style="margin-top:10px; opacity:0.5;" disabled>REINFORCE SYSTEM</button>

                        

                        <div id="feedback-status" style="font-size:0.7rem; color:var(--muted); text-align:center;">Select an action to enable submission.</div>

                    </div>

                `;

                

                pane.style.visibility = 'visible';

                pane.style.opacity = '1';

                document.body.classList.add('audit-active');

            }



            function selectAction(btn, action) {

                // Clear state

                const btns = document.querySelectorAll('#action-selector .grid-btn');

                btns.forEach(b => {

                    b.style.background = 'rgba(255,255,255,0.05)';

                    b.style.color = 'white';

                });

                

                // Set active

                btn.style.background = 'var(--accent)';

                btn.style.color = '#020617';

                window.__selected_action = action;

                

                // Enable submit

                const submit = document.getElementById('btn-submit-feedback');

                submit.disabled = false;

                submit.style.opacity = '1';

                document.getElementById('feedback-status').innerHTML = "Ready to reinforce local memory.";

            }



            async function submitFeedback() {

                const action = window.__selected_action;

                const reason = document.getElementById('feedback-reason').value.trim() || "Manual correction by human auditor.";

                const text = window.__pending_text;

                const originalReward = window.__pending_reward;

                const hitlId = window.__pending_hitl_id;

                

                const statusDiv = document.getElementById('feedback-status');

                const submitBtn = document.getElementById('btn-submit-feedback');

                

                submitBtn.disabled = true;

                statusDiv.innerHTML = "⏳ REINFORCING LOGIC...";



                try {

                    await fetch('/feedback', {

                        method: 'POST',

                        headers: {'Content-Type': 'application/json'},

                        body: JSON.stringify({

                            text: text,

                            corrected_action: action,

                            reason: reason

                        })

                    });



                    const correction = - (originalReward + 1.0);

                    updateHUD(correction);



                    const container = document.getElementById(hitlId);

                    container.innerHTML = `<span style="color:var(--danger); font-size:0.6rem; font-weight:800; border:1px solid var(--danger); padding:2px 6px; border-radius:4px;">🧠 MEMORY REINFORCED</span>`;

                    

                    statusDiv.innerHTML = "✅ SYSTEM REINFORCED!";

                    setTimeout(closeInspector, 1000);

                } catch (e) {

                    statusDiv.innerHTML = "❌ MEMORY WRITE FAILED";

                    submitBtn.disabled = false;

                }

            }





        </script>

    </body>

    </html>

    """



@app.post("/reset", tags=["🤖 Automated Benchmarking"], summary="1. Initialize Environment (Task Selection)")
async def reset_env(req: ResetRequest = Body(default=ResetRequest())):
    """Start a new episode for the requested task and seed.

    This must be the first call of any benchmarking run. The task is chosen
    from, in order of precedence:

    1. ``task_id`` - legacy machine ID such as ``clear_cut_moderation``,
       resolved through ``resolve_task``;
    2. ``task_name`` - the Swagger UI enum, translated through ``TASK_MAP``;
    3. the default, ``"Task 1: Basic Safety"``.

    Returns whatever ``env.reset`` returns (the initial state). A
    ``ValueError`` or ``KeyError`` raised while selecting the task or
    resetting the environment is reported as HTTP 400.
    """
    try:
        if req.task_id:
            # Validator path: legacy ID -> task config -> internal name.
            selected_task = resolve_task(req.task_id).name
        elif req.task_name:
            # Swagger UI path: enum label -> internal name.
            selected_task = TASK_MAP[req.task_name]
        else:
            selected_task = "Task 1: Basic Safety"
        return await env.reset(task_name=selected_task, seed=req.seed)
    except (ValueError, KeyError) as exc:
        raise HTTPException(status_code=400, detail=str(exc))

@app.get("/health", tags=["📊 System Monitoring"])
def health_check():
    """Liveness probe for OpenEnv runtime validation; always reports ``healthy``."""
    return dict(status="healthy")


@app.get("/metadata", tags=["📊 System Monitoring"])
def metadata():
    """Describe the environment for OpenEnv runtime validation.

    The ``tasks`` entry lists the legacy task IDs, i.e. the values of
    ``CANONICAL_TO_LEGACY``.
    """
    summary = (
        "A content-moderation RL environment where an agent must "
        "classify social-media posts as safe or harmful under varying "
        "policy regimes, with tasks spanning basic safety, contextual "
        "nuance, and fairness."
    )
    legacy_task_ids = [legacy_id for legacy_id in CANONICAL_TO_LEGACY.values()]
    return {
        "name": "SocialStreamModerationEnv",
        "description": summary,
        "version": "1.2.0",
        "tasks": legacy_task_ids,
    }


@app.get("/schema", tags=["📊 System Monitoring"])
def schema():
    """Return the action, observation, and state schemas for OpenEnv validation.

    ``action`` is a string restricted to the ``ModerationAction`` values.
    ``observation`` and ``state`` are objects with the same property set:
    both describe the fields of a ``State`` instance, including
    ``user_history_summary`` (which the state schema previously left out even
    though ``State`` carries it).
    """
    string_field = {"type": "string"}
    integer_field = {"type": "integer"}

    # Single source of truth so the two object schemas cannot drift apart.
    state_properties = {
        "post_id": string_field,
        "text": string_field,
        "user_history_summary": string_field,
        "context_type": string_field,
        "platform_policy_mode": string_field,
        "user_group": string_field,
        "step_index": integer_field,
        "total_steps": integer_field,
    }

    return {
        "action": {
            "type": "string",
            "enum": [a.value for a in ModerationAction],
        },
        "observation": {
            "type": "object",
            "properties": dict(state_properties),
        },
        "state": {
            "type": "object",
            "properties": dict(state_properties),
        },
    }


@app.get("/tasks", tags=["🤖 Automated Benchmarking"])
async def list_tasks():
    """List every task in ``TASKS`` for discovery.

    Both ``task_id`` and ``id`` carry the legacy machine-readable ID that
    matches ``openenv.yaml`` (e.g. ``clear_cut_moderation``) so the external
    validator can cross-reference them. A task with no legacy alias falls
    back to its canonical key.
    """
    catalogue = []
    for canonical, task_cfg in TASKS.items():
        legacy_id = CANONICAL_TO_LEGACY.get(canonical, canonical)
        catalogue.append(
            {
                "task_id": legacy_id,
                "id": legacy_id,
                "name": task_cfg.name,
                "difficulty": task_cfg.difficulty,
                "description": f"Episode length: {task_cfg.episode_length} posts. Policy mode: {task_cfg.policy_mode.value}.",
                "grader_id": task_cfg.grader_id,
            }
        )
    return catalogue

# Tag matches the other benchmarking routes (/reset, /tasks, /grader,
# /predict_and_step) so Swagger groups this endpoint with them.
@app.get("/graders", tags=["🤖 Automated Benchmarking"])
async def list_graders_endpoint():
    """Return the graders available in the environment, for discovery.

    The payload is whatever ``list_graders`` from the graders module returns.
    """
    return _list_graders()


# Per-task score cache so /grader?task_id=... can return past scores.
# Keys are task identifiers: each graded score is stored under the task's
# name and, when one exists, under its legacy ID as well. Values are the most
# recently computed grader score for that task. The cache lives in process
# memory only.
_task_scores: Dict[str, float] = {}


def _grade_current_episode() -> Optional[float]:
    """Grade the episode currently held by ``env`` and refresh the score cache.

    Returns ``None`` when the environment has no episode history. When the
    current task is known, its grader is used and the score is cached under
    both the task name and the legacy ID; otherwise the generic
    ``grade_episode`` (without fairness) is used and nothing is cached.
    """
    if not env.episode_history:
        return None

    task = env.current_task
    if task is None:
        return grade_episode(env.episode_history, use_fairness=False)

    score = get_grader(task.grader_id).grade(env.episode_history)
    _task_scores[task.name] = score
    legacy_id = CANONICAL_TO_LEGACY.get(task.name)
    if legacy_id:
        _task_scores[legacy_id] = score
    return score


@app.get("/grader", tags=["🤖 Automated Benchmarking"])
def grader_score(task_id: Optional[str] = Query(None, description="Legacy task ID to retrieve a specific task's score.")):
    """Return the grader score for the current (or most recent) episode.

    The Scaler / OpenEnv hackathon validator calls this endpoint after running
    an episode to obtain the final score.

    Args:
        task_id: Optional task identifier. When given, the score cached for
            that task is returned; the identifier is tried as-is first and
            then through ``TASK_ALIASES``.

    Returns:
        ``{"score": <float>}``. A minimal placeholder of ``0.001`` is returned
        when no episode has been run, or when ``task_id`` has no known score.
    """
    # Always grade the live episode first. The cache is only written here, so
    # skipping this on the task_id path would make ``/grader?task_id=...``
    # return the placeholder for an episode that has just been played.
    current_score = _grade_current_episode()

    if task_id:
        if task_id in _task_scores:
            return {"score": _task_scores[task_id]}
        # Also check the canonical name behind a legacy alias.
        canonical = TASK_ALIASES.get(task_id)
        if canonical and canonical in _task_scores:
            return {"score": _task_scores[canonical]}
        return {"score": 0.001}

    return {"score": 0.001 if current_score is None else current_score}

@app.post("/evaluate", tags=["🧪 Interactive Lab"], summary="Test Model Logic (XAI Insight)")
async def evaluate_text(
    req: EvaluateRequest,
    policy_mode: PolicyModeChoice = Query(PolicyModeChoice.NORMAL, description="Select the active safety policy regime."),
    user_history: UserHistoryChoice = Query(UserHistoryChoice.CLEAN, description="Select the author's moderation history."),
    context_type: ContextTypeChoice = Query(ContextTypeChoice.ROOT, description="Select the content hierarchical context.")
):
    """Internal endpoint for the Interactive Sandbox UI.

    Builds a one-post ``State`` from the request text and the selected
    policy / history / context options, asks the agent for an action, and
    returns that action together with its reasoning and a demo reward.

    The reward is indicative only: there is no ground-truth label for free
    text, so the harm category is guessed by matching the lowercased text
    against ``SAFETY_KEYWORDS`` (first matching category wins, ``SAFE`` when
    nothing matches) and then scored with ``compute_per_post_reward``.

    Returns:
        ``{"action": <str>, "reward": <float>, "reason": <agent reasoning>}``.
    """
    # Imported lazily, as in the rest of this module's inference-backed routes.
    from envs.social_stream_moderation.models import HarmLabel, PolicyMode
    from envs.social_stream_moderation.graders import compute_per_post_reward
    from inference import SAFETY_KEYWORDS, get_agent

    # Map the UI choice to the model enum; fall back to NORMAL if the mapped
    # value is not a valid PolicyMode.
    try:
        p_mode = PolicyMode(POLICY_MAP[policy_mode])
    except ValueError:
        p_mode = PolicyMode.NORMAL

    # Predict the action using rule-based or LLM logic, depending on the
    # connection details supplied in the request.
    agent = get_agent(api_base_url=req.api_base_url, model_name=req.model_name, api_key=req.api_key)
    mock_state = State(
        post_id="playground_test",
        text=req.text,
        user_history_summary=HISTORY_MAP[user_history],
        context_type=CONTEXT_MAP[context_type],
        platform_policy_mode=p_mode.value,
        user_group="A",
        step_index=0,
        total_steps=1
    )

    action, reason = agent.predict(mock_state)

    # Guess the harm label from known keyword patterns; lowercase once rather
    # than once per keyword.
    lowered_text = req.text.lower()
    best_harm_guess = next(
        (
            category
            for category, keywords in SAFETY_KEYWORDS.items()
            if any(kw in lowered_text for kw in keywords)
        ),
        HarmLabel.SAFE,
    )

    reward = compute_per_post_reward(best_harm_guess, action, p_mode)

    return {
        "action": action.value,
        "reward": float(reward),
        "reason": reason
    }


@app.post("/step", tags=["🧪 Interactive Lab"])
async def step_env(req: StepRequest):
    """Apply ``req.action`` to the environment and report the outcome.

    Returns the next state, the step reward, the ``done`` flag and the raw
    ``info`` dict. ``final_score`` and ``grader_id`` are taken from ``info``
    once the episode is done; before that they are ``0.0`` and ``None``.
    A ``RuntimeError`` from the environment is reported as HTTP 400.
    """
    try:
        outcome = await env.step(req.action)
    except RuntimeError as exc:
        raise HTTPException(status_code=400, detail=str(exc))

    next_state, reward, done, info = outcome

    # The environment uses the task-specific grader internally; the final
    # score and grader_id only matter once the episode has finished.
    episode_summary = info if done else {}

    return {
        "next_state": next_state,
        "reward": reward,
        "done": done,
        "info": info,
        "final_score": episode_summary.get("score", 0.0),
        "grader_id": episode_summary.get("grader_id"),
    }

@app.post("/predict_and_step", tags=["🤖 Automated Benchmarking"], summary="2. Autonomous Model Execution (Autonomous)")
async def predict_and_step(req: Optional[LLMConfigRequest] = Body(None)):
    """Predict with the dynamic agent and step the environment in one call.

    This matches the autonomous loop in ``inference.py``. The optional
    request body supplies the agent's connection settings; when it is
    omitted, ``get_agent`` is called with ``None`` for each of them.

    Returns:
        The predicted action and its reasoning, the step reward, the ``done``
        flag, the next state and ``info``. ``final_score`` and ``grader_id``
        come from ``info`` once the episode is done (``0.0`` / ``None``
        before that).

    Raises:
        HTTPException: 400 when no episode is active, or when the
            environment rejects the step with a ``RuntimeError`` (same
            mapping as ``/step``).
    """
    from inference import get_agent

    state = env._get_state()
    if state is None:
        raise HTTPException(status_code=400, detail="No active episode. Please call /reset first.")

    agent = get_agent(
        api_base_url=req.api_base_url if req else None,
        model_name=req.model_name if req else None,
        api_key=req.api_key if req else None
    )
    action, reason = agent.predict(state)

    # Execute the step with the model's prediction. Environment-level
    # rejections are client errors, not server faults.
    try:
        next_state, reward, done, info = await env.step(action)
    except RuntimeError as e:
        raise HTTPException(status_code=400, detail=str(e))

    final_score = 0.0
    grader_id = None
    if done:
        # The environment uses the task-specific grader internally.
        final_score = info.get("score", 0.0)
        grader_id = info.get("grader_id")

    return {
        "prediction": action.value,
        "reason": reason,
        "reward": reward,
        "done": done,
        "final_score": final_score,
        "grader_id": grader_id,
        "next_state": next_state,
        "info": info
    }

@app.post("/feedback")
async def save_feedback(req: FeedbackRequest):
    """Save a human correction to the local JSON memory file.

    The memory file is a JSON list of ``{"text", "action", "reason"}``
    records. A record whose ``text`` equals ``req.text`` is updated in place;
    otherwise a new record is appended. A missing, unreadable-as-JSON, or
    non-list file is treated as empty memory.

    Returns:
        ``{"status": "success", "message": "Memory reinforced."}``.
    """
    import json
    memory_path = os.path.join(os.path.dirname(__file__), "..", "envs", "social_stream_moderation", "human_memory.json")

    # Load existing memory. ValueError covers both malformed JSON
    # (json.JSONDecodeError) and undecodable bytes (UnicodeDecodeError).
    try:
        with open(memory_path, "r", encoding="utf-8") as f:
            loaded = json.load(f)
    except (FileNotFoundError, ValueError):
        loaded = []
    memory = loaded if isinstance(loaded, list) else []

    # Update the existing record for this text, or append a new one.
    for entry in memory:
        # Skip anything that is not a record instead of crashing on it.
        if isinstance(entry, dict) and entry.get("text") == req.text:
            entry["action"] = req.corrected_action
            entry["reason"] = req.reason
            break
    else:
        memory.append({
            "text": req.text,
            "action": req.corrected_action,
            "reason": req.reason
        })

    # Write to a sibling temp file and swap it in, so an interrupted write
    # cannot leave a truncated memory file behind.
    tmp_path = memory_path + ".tmp"
    with open(tmp_path, "w", encoding="utf-8") as f:
        json.dump(memory, f, indent=2)
    os.replace(tmp_path, memory_path)

    return {"status": "success", "message": "Memory reinforced."}

@app.get("/state", tags=["📊 System Monitoring"])
def get_state():
    """Return the current environment state.

    When no episode is active (``env._get_state()`` is ``None``), a small
    readiness payload is returned instead, explaining how to start one.
    """
    state = env._get_state()
    if state is None:
        return {
            "status": "Ready",
            "message": "Environment is initialized but no episode is currently active.",
            # 'clear_cut_moderation' is a legacy machine ID, which /reset
            # accepts as task_id (task_name is the Swagger enum label).
            "how_to_start": "Call 'POST /reset' with a task_id (e.g., 'clear_cut_moderation') to begin benchmarking."
        }
    return state


def kill_port(port):
    """Best-effort: stop other processes that are listening on TCP ``port``.

    Only listeners on exactly ``port`` are targeted, and the current process
    is never killed by the PID-based paths. On Windows the listeners are read
    from ``netstat -ano`` and stopped with ``taskkill``; elsewhere ``lsof`` is
    used, with ``fuser -k`` as a fallback when ``lsof`` is missing or reports
    nothing.

    This is a start-up convenience, so every failure (missing tool, denied
    permission, unexpected output) is deliberately swallowed. The function
    always returns ``None``.
    """
    import subprocess
    import os
    import sys

    own_pid = str(os.getpid())
    wanted_port = str(port)

    try:
        if sys.platform == "win32":
            # Parse netstat in Python rather than piping through findstr: a
            # substring match on ":<port>" also hits longer port numbers and
            # foreign addresses.
            output = subprocess.check_output(['netstat', '-ano']).decode(errors="ignore")
            for line in output.splitlines():
                # Expected TCP row: Proto, Local Address, Foreign Address, State, PID
                columns = line.split()
                if len(columns) < 5 or columns[3] != 'LISTENING':
                    continue
                # rpartition handles both "0.0.0.0:7860" and "[::]:7860".
                if columns[1].rpartition(':')[2] != wanted_port:
                    continue
                pid = columns[-1]
                if pid != own_pid:
                    print(f"Cleanup: Stopping existing process {pid} on port {port}...")
                    subprocess.run(['taskkill', '/F', '/PID', pid], capture_output=True)
        else:
            # Unix/Mac/Linux logic
            try:
                # -sTCP:LISTEN restricts lsof to listening sockets, so client
                # processes that merely have a connection on this port number
                # are left alone. -t prints bare PIDs.
                output = subprocess.check_output(
                    ['lsof', '-t', f'-iTCP:{port}', '-sTCP:LISTEN']
                ).decode(errors="ignore")
                for pid in output.split():
                    if pid != own_pid:
                        print(f"Cleanup: Stopping existing process {pid} on port {port}...")
                        subprocess.run(['kill', '-9', pid], capture_output=True)
            except (subprocess.CalledProcessError, FileNotFoundError):
                # Fallback to fuser if lsof is missing or found nothing
                try:
                    subprocess.run(['fuser', '-k', f'{port}/tcp'], capture_output=True)
                except Exception:
                    # Best-effort cleanup: fuser may be missing as well.
                    pass
    except Exception:
        # Never let port cleanup prevent the server from starting.
        pass

def main(host: str = "0.0.0.0", port: int = 7860):
    """Run the API with uvicorn.

    Args:
        host: Interface to bind. Defaults to all interfaces.
        port: TCP port to serve on. Defaults to 7860.

    Calling ``main()`` with no arguments behaves exactly as before.
    """
    import uvicorn
    # Automatically clear the port before starting to avoid [WinError 10048]
    kill_port(port)
    uvicorn.run(app, host=host, port=port)

# Start the server only when this file is executed as a script, not when it
# is imported as a module.
if __name__ == "__main__":
    main()