Spaces:

minato1718
/

Corp_AI

Sleeping

App Files Files Community

Corp_AI / app.py

minato1718

feat: add Gradio playground UI on port 7860 for HuggingFace Spaces

9ff0fa2 about 2 months ago

raw

history blame contribute delete

9.86 kB

	"""
	AuditEnv OpenEnv Playground UI
	Gradio frontend that wraps the FastAPI backend server.
	"""
	import json
	import subprocess
	import time
	import gradio as gr
	import requests

	API_BASE = "http://127.0.0.1:8000"

	# ──────────────────────────────────────────────
	# Boot the FastAPI server in the background
	# ──────────────────────────────────────────────
	def _start_api_server():
	    """Launch the FastAPI backend under uvicorn as a background child process.

	    The child serves ``auditenv.server:app`` from the ``src`` app directory on
	    127.0.0.1:8000, with its stdout and stderr discarded.

	    Returns:
	        The ``subprocess.Popen`` handle of the child, or ``None`` when the
	        process could not be spawned (e.g. the ``uvicorn`` executable is
	        missing).
	    """
	    import logging  # local import: only needed on the failure path

	    command = [
	        "uvicorn", "auditenv.server:app",
	        "--host", "127.0.0.1", "--port", "8000", "--app-dir", "src",
	    ]
	    try:
	        return subprocess.Popen(
	            command,
	            stdout=subprocess.DEVNULL,
	            stderr=subprocess.DEVNULL,
	        )
	    except OSError:
	        # A spawn failure must not abort module import; report it and let the
	        # caller carry on without a backend.
	        logging.getLogger(__name__).exception("could not start the API server")
	        return None

	def _wait_for_api(max_retries: int = 40) -> bool:
	for _ in range(max_retries):
	try:
	r = requests.get(f"{API_BASE}/health", timeout=2)
	if r.status_code == 200:
	return True
	except Exception:
	pass
	time.sleep(1)
	return False

	# Spawn the backend and block until it reports healthy or the probes run out.
	# Both calls execute at import time; the outcome is stored once in `_api_ready`
	# and is what the API helper functions below consult before sending requests.
	_start_api_server()
	_api_ready = _wait_for_api()

	# ──────────────────────────────────────────────
	# API helpers
	# ──────────────────────────────────────────────
	def _fmt(response: requests.Response) -> str:
	    """Render a response body for display.

	    Returns the body re-serialised as 2-space-indented JSON when it can be
	    decoded and dumped, and the raw response text otherwise.
	    """
	    try:
	        decoded = response.json()
	        pretty = json.dumps(decoded, indent=2)
	    except Exception:
	        # Not JSON (or not serialisable): show the body verbatim.
	        pretty = response.text
	    return pretty

	def api_reset(task_id: str) -> str:
	    """Start a new episode by POSTing ``task_id`` to the backend's ``/reset``.

	    Returns:
	        The backend response formatted by ``_fmt``, or a JSON object with an
	        ``error`` key when the backend never became ready or the request
	        raised.
	    """
	    if _api_ready:
	        try:
	            reply = requests.post(
	                f"{API_BASE}/reset",
	                json={"task_id": task_id},
	                timeout=15,
	            )
	            return _fmt(reply)
	        except Exception as exc:
	            return json.dumps({"error": str(exc)})
	    return '{"error": "API server failed to start"}'

	def api_step(action_type: str, task_id: str, note: str,
	             invoice_id: str, vendor_name: str, amount: float,
	             violation_type: str, confidence: float) -> str:
	    """Submit one action to the backend's ``/step`` endpoint.

	    A ``finding`` object is attached only when ``action_type`` is
	    ``"submit_finding"``; its falsy fields (empty strings, a zero or missing
	    amount) are sent as ``None``. For any other action ``finding`` is ``None``.

	    Returns:
	        The backend response formatted by ``_fmt``, or a JSON object with an
	        ``error`` key when the backend never became ready or the request
	        raised.
	    """
	    if not _api_ready:
	        return '{"error": "API server failed to start"}'

	    if action_type == "submit_finding":
	        details = {
	            "invoice_id": invoice_id or None,
	            "vendor_name": vendor_name or None,
	            "amount": amount or None,
	            "violation_type": violation_type or None,
	            "confidence": confidence,
	        }
	    else:
	        details = None

	    body = {
	        "action_type": action_type,
	        "task_id": task_id,
	        "note": note or "",
	        "finding": details,
	    }
	    try:
	        reply = requests.post(f"{API_BASE}/step", json=body, timeout=15)
	        return _fmt(reply)
	    except Exception as exc:
	        return json.dumps({"error": str(exc)})

	def api_get_state() -> str:
	    """Fetch the backend's ``/state`` endpoint.

	    Returns:
	        The backend response formatted by ``_fmt``, or a JSON object with an
	        ``error`` key when the backend never became ready or the request
	        raised.
	    """
	    if _api_ready:
	        try:
	            reply = requests.get(f"{API_BASE}/state", timeout=15)
	            return _fmt(reply)
	        except Exception as exc:
	            return json.dumps({"error": str(exc)})
	    return '{"error": "API server failed to start"}'

	def api_health() -> str:
	    """Probe the backend's ``/health`` endpoint with a 5-second timeout.

	    Unlike the other helpers, this one always sends the request, whatever the
	    value of ``_api_ready``.

	    Returns:
	        The backend response formatted by ``_fmt``, or a JSON object with an
	        ``error`` key when the request raised.
	    """
	    health_url = f"{API_BASE}/health"
	    try:
	        reply = requests.get(health_url, timeout=5)
	        return _fmt(reply)
	    except Exception as exc:
	        return json.dumps({"error": str(exc)})

	# ──────────────────────────────────────────────
	# Gradio UI
	# ──────────────────────────────────────────────
	# Custom stylesheet handed to gr.Blocks. The selectors target the elem_id /
	# elem_classes values assigned to components in the layout below
	# (title, subtitle, action-btn, json-out).
	CSS = """
	#title { text-align: center; margin-bottom: 0.5rem; }
	#subtitle { text-align: center; color: #6b7280; margin-bottom: 1.5rem; }
	.action-btn { min-width: 110px; }
	#json-out { font-family: monospace; font-size: 0.82rem; }
	"""

	# Markdown shown in the "Quick Start" sidebar accordion.
	# Table pipes are written unescaped: a backslash before "|" is not a valid
	# Python string escape and would leave a literal backslash in the rendered text.
	QUICK_START_MD = """
	## Quick Start

	1. Choose a task (Easy / Medium / Hard)
	2. Click Reset to start a new episode
	3. Click Get State to see the documents your agent must audit
	4. Build a finding and click Step to submit it
	5. The environment returns a reward from 0.0 → 1.0

	---

	### Action types
	| Action | Description |
	|---|---|
	| `submit_finding` | Flag a specific document as violating policy |
	| `flag_human_review` | Escalate an ambiguous item |
	| `noop` | Do nothing this step |

	---

	### Scoring
	| Event | Reward |
	|---|---|
	| True positive (correct flag) | +0.2 |
	| Full evidence chain | +0.3 |
	| False positive | −0.5 |
	| False negative | −0.2 |
	"""

	# Markdown shown in the "README" sidebar accordion and in the "About" tab.
	# Table pipes are written unescaped: a backslash before "|" is not a valid
	# Python string escape and would leave a literal backslash in the rendered text.
	README_MD = """
	## AuditEnv

	AuditEnv is an OpenEnv-compatible reinforcement-learning environment
	for autonomous compliance auditing.

	Instead of eating pac-dots, the AI learns to be a corporate compliance
	auditor — finding fraud, policy violations, and access anomalies.

	### Difficulty Levels
	| Level | Task | Max Steps |
	|---|---|---|
	| Easy | Expense Report Audit | 12 |
	| Medium | Access Control Review | 20 |
	| Hard | Multi-System Fraud Detection | 28 |

	### API Endpoints
	| Method | Path | Purpose |
	|---|---|---|
	| `POST` | `/reset` | Start new episode |
	| `POST` | `/step` | Submit action |
	| `GET` | `/state` | Read current state |
	| `GET` | `/health` | Health check |
	| `GET` | `/docs` | Swagger UI |
	"""

	# Declarative Gradio layout: a page header, a sidebar column with the help
	# text, and a main column holding three tabs (Playground, Custom / API, About).
	# The resulting Blocks app is bound to `demo`.
	with gr.Blocks(css=CSS, title="OpenEnv Agentic Environment: AuditEnv") as demo:

	# Page header; the elem_id values are the hooks used by the CSS rules.
	gr.Markdown("# 🏢 OpenEnv Agentic Environment: AuditEnv", elem_id="title")
	gr.Markdown(
	"Autonomous compliance auditing — powered by reinforcement learning",
	elem_id="subtitle",
	)

	with gr.Row():
	# ── Left sidebar ──────────────────────────────
	with gr.Column(scale=1, min_width=220):
	gr.Markdown("### Navigation")
	with gr.Accordion("Quick Start", open=True):
	gr.Markdown(QUICK_START_MD)
	with gr.Accordion("README", open=False):
	gr.Markdown(README_MD)

	# ── Main area ─────────────────────────────────
	with gr.Column(scale=3):
	with gr.Tab("🎮 Playground"):
	gr.Markdown("### Playground\nClick Reset to start a new episode.")

	# Episode controls: which task to run and which action to send.
	with gr.Row():
	task_dd = gr.Dropdown(
	choices=["easy", "medium", "hard"],
	value="easy",
	label="Task Difficulty",
	scale=1,
	)
	action_radio = gr.Radio(
	choices=["submit_finding", "flag_human_review", "noop"],
	value="noop",
	label="Action Type",
	scale=2,
	)

	note_box = gr.Textbox(
	label="Note / Message",
	placeholder="Optional note to attach to this action…",
	)

	# Inputs that api_step packs into the `finding` object; api_step only
	# attaches them when the action type is "submit_finding".
	with gr.Accordion("Finding Details (only for submit_finding)", open=False):
	with gr.Row():
	invoice_id_box = gr.Textbox(label="Invoice ID", placeholder="e.g. INV-0042")
	vendor_box = gr.Textbox(label="Vendor Name", placeholder="e.g. Acme Corp")
	with gr.Row():
	# The 0.0 default is falsy, so api_step sends it as None (no amount).
	amount_box = gr.Number(label="Amount (USD)", value=0.0)
	violation_dd = gr.Dropdown(
	choices=["duplicate_receipt", "alcohol_over_limit",
	"late_submission", "sod_conflict",
	"dormant_account", "shell_company",
	"invoice_splitting", "round_tripping"],
	label="Violation Type",
	)
	confidence_slider = gr.Slider(0.0, 1.0, value=0.8, step=0.05, label="Confidence")

	# Action buttons; "action-btn" picks up the min-width rule from CSS.
	with gr.Row():
	step_btn = gr.Button("▶ Step", variant="primary", elem_classes="action-btn")
	reset_btn = gr.Button("🔄 Reset", variant="secondary", elem_classes="action-btn")
	state_btn = gr.Button("📊 Get State", variant="secondary", elem_classes="action-btn")

	# Single output pane shared by all three playground buttons.
	gr.Markdown("#### Status — Raw JSON Response")
	json_out = gr.Code(language="json", label="", elem_id="json-out", lines=20)

	# Wire buttons
	reset_btn.click(
	fn=api_reset,
	inputs=[task_dd],
	outputs=json_out,
	)
	# The inputs are listed in the same order as api_step's parameters.
	step_btn.click(
	fn=api_step,
	inputs=[action_radio, task_dd, note_box,
	invoice_id_box, vendor_box, amount_box,
	violation_dd, confidence_slider],
	outputs=json_out,
	)
	state_btn.click(
	fn=api_get_state,
	inputs=[],
	outputs=json_out,
	)

	# NOTE(review): the backend is started on 127.0.0.1:8000 while this UI is
	# launched on port 7860 — confirm the `/docs` page advertised below is
	# actually reachable by users of the hosted app.
	with gr.Tab("🔧 Custom / API"):
	gr.Markdown("""
	### Direct API Access

	Your AuditEnv server is also available at the `/docs` endpoint for full
	Swagger UI access, or hit the endpoints directly:

	```
	POST /reset — start a new episode
	POST /step — submit an action
	GET /state — read current state
	GET /health — health check
	```
	""")
	# Manual health probe with its own, smaller output pane.
	health_btn = gr.Button("🩺 Ping Health Check", variant="primary")
	health_out = gr.Code(language="json", label="Response", lines=5)
	health_btn.click(fn=api_health, inputs=[], outputs=health_out)

	# Same Markdown as the sidebar "README" accordion.
	with gr.Tab("📖 About"):
	gr.Markdown(README_MD)

	if __name__ == "__main__":
	    # When run as a script, serve the UI on every interface at port 7860.
	    launch_options = {"server_name": "0.0.0.0", "server_port": 7860}
	    demo.launch(**launch_options)