Spaces:

Yaser77
/

ambiguity-env

Sleeping

Yaser77

fix: resolve Gradio generator pickling error and deprecation warnings

b922e87 about 2 months ago

11.5 kB

	import html
	import json
	import re
	import time

	import gradio as gr
	import requests

	# ── CONFIGURATION & STYLING ──────────────────────────────────────────────────
	# Root URL of the environment service; run_interaction POSTs to
	# f"{BASE_URL}/reset" and f"{BASE_URL}/step".
	BASE_URL = "https://yaser77-ambiguity-env.hf.space"
	# Upper bound on agent steps per episode (loop guard in run_interaction).
	MAX_STEPS = 5

	# Stylesheet for the HTML trace, passed as css= to app.launch() at the bottom
	# of the file. The class names defined here (header-banner, step-card,
	# reward-tag/reward-pos/reward-neg, action-text, info-box, result-banner/
	# result-success/result-fail) are the ones used by the HTML fragments built
	# in run_interaction and by the page header.
	CUSTOM_CSS = """
	.gradio-container {
	font-family: 'Inter', 'Segoe UI', sans-serif !important;
	}
	.header-banner {
	background: linear-gradient(135deg, #1e1e2e 0%, #313244 100%);
	padding: 30px;
	border-radius: 12px;
	text-align: center;
	border: 1px solid #45475a;
	box-shadow: 0 4px 6px -1px rgba(0, 0, 0, 0.1);
	margin-bottom: 20px;
	}
	.header-banner h1 {
	margin: 0;
	color: #cdd6f4;
	font-weight: 800;
	}
	.header-banner p {
	color: #a6adc8;
	font-size: 1.1em;
	margin-top: 10px;
	}
	.step-card {
	background: #181825;
	border-left: 4px solid #89b4fa;
	border-radius: 8px;
	padding: 16px 20px;
	margin-bottom: 15px;
	box-shadow: 0 2px 4px rgba(0,0,0,0.05);
	}
	.reward-tag {
	display: inline-block;
	padding: 3px 10px;
	border-radius: 20px;
	font-weight: bold;
	font-size: 0.9em;
	}
	.reward-pos { background-color: rgba(166, 227, 161, 0.15); color: #a6e3a1; }
	.reward-neg { background-color: rgba(243, 139, 168, 0.15); color: #f38ba8; }
	.action-text {
	font-family: monospace;
	background: #11111b;
	padding: 4px 8px;
	border-radius: 4px;
	color: #f5c2e7;
	}
	.info-box {
	background-color: rgba(137, 180, 250, 0.1);
	border: 1px solid rgba(137, 180, 250, 0.3);
	border-radius: 8px;
	padding: 15px;
	margin-bottom: 20px;
	}
	.result-banner {
	padding: 20px;
	border-radius: 12px;
	text-align: center;
	font-size: 1.25em;
	font-weight: bold;
	margin-top: 20px;
	}
	.result-success { background: linear-gradient(135deg, rgba(166, 227, 161, 0.2), rgba(148, 226, 213, 0.2)); border: 1px solid #a6e3a1; color: #a6e3a1; }
	.result-fail { background: linear-gradient(135deg, rgba(243, 139, 168, 0.2), rgba(250, 179, 135, 0.2)); border: 1px solid #f38ba8; color: #f38ba8; }
	"""

	# Dropdown label -> task_name value sent in the /reset payload. The labels
	# double as the choices of the "Complexity" dropdown.
	TASK_MAPPING = {
	"Easy Explicit": "easy_explicit",
	"Medium Missing Time": "medium_missing_time",
	"Medium Missing Participants": "medium_missing_participants",
	"Hard Ambiguous": "hard_ambiguous"
	}

	# ── DOMAIN REASONING ─────────────────────────────────────────────────────────

	def get_valid_times(constraints: dict) -> list[str]:
	    """Return the candidate meeting slots permitted by *constraints*.

	    The candidate slots are fixed: "10 AM", "2 PM" and "4 PM". A slot is
	    dropped when it is listed in ``constraints["unavailable_times"]`` or when
	    the deadline is "before 3 PM" and the slot is "4 PM". Both comparisons
	    ignore case and surrounding whitespace.

	    Args:
	        constraints: Constraint mapping taken from an observation. A missing
	            or null ``unavailable_times`` / ``deadline`` entry means "no
	            restriction"; ``None`` is accepted for the mapping itself.

	    Returns:
	        The permitted slots in their canonical spelling, earliest first.
	    """
	    constraints = constraints or {}
	    # `or ()` covers an explicit JSON null, which .get()'s default would not.
	    blocked = {
	        str(slot).strip().upper()
	        for slot in (constraints.get("unavailable_times") or ())
	    }
	    deadline = str(constraints.get("deadline") or "ASAP").strip().upper()
	    before_three = deadline == "BEFORE 3 PM"

	    # The candidates are already upper-case and trimmed, so they can be
	    # compared against the normalised `blocked` set directly.
	    return [
	        slot
	        for slot in ("10 AM", "2 PM", "4 PM")
	        if slot not in blocked and not (before_three and slot == "4 PM")
	    ]

	def extract_from_text(text: str):
	    """Find a known time slot and known team names mentioned in *text*.

	    Matching is case-insensitive and anchored on word boundaries, so "2 PM"
	    is not found inside "12 PM" and "Team A" is not found inside phrases such
	    as "the team at noon" or "the team ASAP".

	    Args:
	        text: Free-form instruction text; ``None`` or "" yields no matches.

	    Returns:
	        A ``(time, participants)`` tuple. ``time`` is the first of
	        "10 AM", "2 PM", "4 PM" (checked in that order) that occurs in the
	        text, or ``None``. ``participants`` lists every one of "Team A",
	        "Team B", "Team C" that occurs, in that order.
	    """
	    haystack = (text or "").upper()

	    def mentions(phrase):
	        # \b on both sides rejects hits that are only part of a longer token.
	        return re.search(rf"\b{re.escape(phrase)}\b", haystack) is not None

	    time_val = next(
	        (slot for slot in ("10 AM", "2 PM", "4 PM") if mentions(slot)),
	        None,
	    )
	    parts = [
	        team.title()
	        for team in ("TEAM A", "TEAM B", "TEAM C")
	        if mentions(team)
	    ]
	    return time_val, parts

	# ── AGENT LOGIC (Mirroring inference.py Intelligence) ────────────────────────

	def demo_agent(obs_dict, task_name):
	    """Choose the next action for the current observation.

	    The agent asks a clarifying question when the task name indicates that a
	    field (time or participants) may be missing, the field has not yet been
	    revealed in ``known_info``, and the instruction text does not mention it.
	    Otherwise it commits to a proposal.

	    Args:
	        obs_dict: Observation mapping; the keys read are ``instruction``,
	            ``known_info`` and ``constraints``. Null values are treated as
	            empty.
	        task_name: Task identifier; substrings "time", "participants" and
	            "hard" (case-insensitive) decide which fields may need asking.

	    Returns:
	        Either ``{"type": "ask", "question": ...}`` or
	        ``{"type": "execute", "proposed_time": ..., "proposed_participants": [...]}``.
	    """
	    instruction = obs_dict.get("instruction") or ""
	    known = obs_dict.get("known_info") or {}
	    constraints = obs_dict.get("constraints") or {}
	    inst_time, inst_parts = extract_from_text(instruction)

	    task_key = task_name.lower()
	    is_hard = "hard" in task_key
	    needs_time = ("time" in task_key or is_hard) and "time" not in known
	    needs_parts = ("participants" in task_key or is_hard) and "participants" not in known

	    if needs_time and not inst_time:
	        return {"type": "ask", "question": "What time works for the meeting?"}
	    if needs_parts and not inst_parts:
	        return {"type": "ask", "question": "Who should attend the meeting?"}

	    # Time preference: revealed answer, then the instruction's own time, then
	    # the first slot the constraints allow ("10 AM" if none are allowed).
	    valid_times = get_valid_times(constraints)
	    valid_upper = {slot.upper() for slot in valid_times}
	    revealed_time = known.get("time")
	    if isinstance(revealed_time, str) and revealed_time.upper() in valid_upper:
	        final_time = revealed_time
	    elif inst_time and inst_time.upper() in valid_upper:
	        final_time = inst_time
	    else:
	        final_time = valid_times[0] if valid_times else "10 AM"

	    # Revealed participants may arrive as a comma-separated string or as a
	    # list; normalise both and drop empty fragments.
	    revealed_parts = known.get("participants")
	    if isinstance(revealed_parts, str):
	        candidates = revealed_parts.split(",")
	    else:
	        candidates = list(revealed_parts or ())
	    final_participants = [str(p).strip() for p in candidates if str(p).strip()]
	    if not final_participants:
	        final_participants = inst_parts if inst_parts else ["Team A"]

	    return {
	        "type": "execute",
	        "proposed_time": final_time,
	        "proposed_participants": final_participants,
	    }

	# ── CORE EXECUTION LOOP ──────────────────────────────────────────────────────
	# Seconds to wait on the environment service before a request is abandoned.
	_REQUEST_TIMEOUT_S = 30


	def _post_json(path, payload):
	    """POST *payload* as JSON to ``BASE_URL + path`` and return the decoded body."""
	    response = requests.post(
	        f"{BASE_URL}{path}", json=payload, timeout=_REQUEST_TIMEOUT_S
	    )
	    response.raise_for_status()
	    return response.json()


	def _esc(value):
	    """Stringify *value* and HTML-escape it for interpolation into the trace."""
	    return html.escape(str(value))


	def run_interaction(task_display_name, custom_inst, is_demo=False):
	    """Run one episode against the environment and stream an HTML trace.

	    Resets the environment, then repeatedly asks ``demo_agent`` for an action
	    and posts it to ``/step`` until the environment reports ``done`` or
	    ``MAX_STEPS`` is reached. Text that originates from the user or the
	    service is HTML-escaped before it is placed in the trace.

	    Args:
	        task_display_name: Dropdown label; looked up in ``TASK_MAPPING``
	            (unknown labels fall back to "hard_ambiguous").
	        custom_inst: Optional instruction override; ignored when blank.
	        is_demo: When true, both arguments above are replaced by the fixed
	            demo task and instruction.

	    Yields:
	        The cumulative HTML of the trace after each stage, so the UI can
	        re-render progressively. A failed reset yields a single error card
	        and stops; a failed step appends an error card and stops.
	    """
	    if is_demo:
	        task_name = "hard_ambiguous"
	        custom_inst = "Schedule meeting ASAP with the team"
	    else:
	        task_name = TASK_MAPPING.get(task_display_name, "hard_ambiguous")

	    output_html = "<div><span style='color:#a6adc8;'><i>Initialising environment...</i></span></div>"
	    yield output_html

	    payload = {"task_name": task_name}
	    if custom_inst and custom_inst.strip():
	        payload["instruction"] = custom_inst.strip()

	    try:
	        obs = _post_json("/reset", payload)["observation"]
	    except Exception as e:  # UI boundary: report the failure instead of crashing
	        yield f"<div class='step-card' style='border-left-color:#f38ba8;'><b>Error:</b> {_esc(e)}</div>"
	        return

	    constraints = obs.get("constraints") or {}
	    deadline = constraints.get("deadline", "None")
	    unavailable = ", ".join(map(str, constraints.get("unavailable_times") or [])) or "None"

	    output_html = f"""
	    <div class='info-box'>
	    <div style='color:#89b4fa; font-size:0.9em; text-transform:uppercase; font-weight:bold; margin-bottom:5px;'>✅ Session Start</div>
	    <div style='font-size:1.15em; color:#cdd6f4; margin-bottom:10px;'>"{_esc(obs.get('instruction', ''))}"</div>
	    <div style='font-size:0.9em; color:#a6adc8; border-top:1px solid #45475a; padding-top:8px;'>
	    <b>Active Constraints:</b><br>
	    ⏳ Deadline: <span style='color:#f9e2af;'>{_esc(deadline)}</span><br>
	    🚫 Unavailable: <span style='color:#f38ba8;'>{_esc(unavailable)}</span>
	    </div>
	    </div>
	    """
	    yield output_html

	    step = 0
	    done = False
	    rewards = []

	    while not done and step < MAX_STEPS:
	        step += 1
	        action = demo_agent(obs, task_name)

	        if action["type"] == "ask":
	            act_str = f"<span style='color:#89b4fa;'>Ask</span> <span style='color:#6c7086;'>→</span> <span class='action-text'>\"{_esc(action['question'])}\"</span>"
	        else:
	            act_str = f"<span style='color:#a6e3a1;'>Execute</span> <span style='color:#6c7086;'>→</span> <span class='action-text'>time='{_esc(action['proposed_time'])}', parts={_esc(action['proposed_participants'])}</span>"

	        # Short pause so the streamed trace is readable step by step.
	        time.sleep(0.8)

	        try:
	            res = _post_json("/step", action)
	            next_obs = res["observation"]
	            reward = res["reward"]
	            next_done = res["done"]
	            raw_reward = (res.get("info") or {}).get("raw_reward", reward)
	        except Exception as e:  # UI boundary: show the failure in the trace
	            output_html += f"<div class='step-card' style='border-left-color:#f38ba8;'><b>Step Error:</b> {_esc(e)}</div>"
	            yield output_html
	            break

	        # Commit episode state only once the whole response parsed cleanly.
	        obs, done = next_obs, next_done
	        rewards.append(reward)

	        reward_class = "reward-pos" if raw_reward > 0 else "reward-neg"
	        status_text = "<span style='color:#a6e3a1'>✔ Resolved</span>" if done else "<span style='color:#f9e2af'>⚡ Clarifying...</span>"

	        step_block = f"""
	        <div class='step-card'>
	        <div style='display:flex; justify-content:space-between; align-items:center; margin-bottom:10px;'>
	        <span style='color:#bac2de; font-weight:bold;'>Step {step}</span>
	        <span class='reward-tag {reward_class}'>{raw_reward:+.2f} Reward</span>
	        </div>
	        <div style='margin-bottom:8px;'>{act_str}</div>
	        <div style='font-size:0.9em;'>{status_text}</div>
	        </div>
	        """

	        if not done and obs.get("last_response"):
	            step_block += f"""
	            <div style='margin-left:20px; padding:8px 12px; border-left:3px solid #cba6f7; background:rgba(203,166,247,0.05); margin-bottom:15px; margin-top:-5px;'>
	            <span style='color:#cba6f7; font-size:0.85em; text-transform:uppercase; font-weight:bold;'>Revealed Info</span><br>
	            <span style='color:#cdd6f4;'>{_esc(obs['last_response'])}</span>
	            </div>
	            """
	        output_html += step_block
	        yield output_html

	    if done:
	        # Episode score is the mean of the per-step rewards.
	        score = sum(rewards) / max(len(rewards), 1)
	        banner = "result-success" if score > 0.5 else "result-fail"
	        msg = "Success" if score > 0.5 else "Failure"
	        output_html += f"<div class='result-banner {banner}'>{msg}! <br><span style='font-size:0.8em; font-weight:normal;'>Final Episode Score: {score:.2f}</span></div>"
	        yield output_html

	# ── GRADIO UI WRAPPERS (Fixing Generator Pickling) ──────────────────────────

	def start_agent_run(task, custom_inst):
	    """Stream the trace for the task and prompt chosen in the UI.

	    Module-level generator used as the click handler of the "Start Agent"
	    button; it delegates to ``run_interaction`` with demo mode switched off.
	    """
	    yield from run_interaction(
	        task_display_name=task,
	        custom_inst=custom_inst,
	        is_demo=False,
	    )

	def start_demo_run(task, custom_inst):
	    """Stream the trace for the canned demo episode.

	    Module-level generator used as the click handler of the "Quick Demo"
	    button. Both arguments are forwarded, but ``run_interaction`` replaces
	    them with its fixed demo task and instruction when ``is_demo`` is true.
	    """
	    yield from run_interaction(
	        task_display_name=task,
	        custom_inst=custom_inst,
	        is_demo=True,
	    )

	# ── GRADIO UI LAYOUT ─────────────────────────────────────────────────────────

	with gr.Blocks(title="Ambiguity Resolution Demo") as app:
	    # Page header; styled by the .header-banner rules in CUSTOM_CSS.
	    gr.HTML(
	        value="<div class='header-banner'><h1>🧠 Ambiguity Resolution Benchmark Demo</h1><p>Visualizing intelligent multi-step decision making under constraints</p></div>"
	    )

	    with gr.Row():
	        # Left column: task selection, optional prompt override, triggers.
	        with gr.Column(scale=1):
	            gr.Markdown(value="### ⚙️ Context")
	            task_dropdown = gr.Dropdown(
	                choices=list(TASK_MAPPING),
	                value="Hard Ambiguous",
	                label="Complexity",
	            )
	            custom_input = gr.Textbox(
	                placeholder="Schedule meeting ASAP...",
	                label="Prompt",
	            )
	            with gr.Row():
	                btn_run = gr.Button(value="🚀 Start Agent", variant="primary")
	                btn_demo = gr.Button(value="▶ Quick Demo", variant="secondary")
	            gr.Markdown(
	                value="<br>💡 Note: The agent is deterministic and follows the high-quality reasoning benchmark rules."
	            )

	        # Right column: the streamed HTML trace.
	        with gr.Column(scale=2):
	            gr.Markdown(value="### 📡 Trace")
	            output_display = gr.HTML(
	                value="<div style='color:#a6adc8; text-align:center; padding:40px;'>Awaiting trigger...</div>"
	            )

	    # Both buttons read the same two inputs and stream into the same trace
	    # panel; only the handler differs.
	    btn_run.click(
	        fn=start_agent_run,
	        inputs=[task_dropdown, custom_input],
	        outputs=[output_display],
	    )
	    btn_demo.click(
	        fn=start_demo_run,
	        inputs=[task_dropdown, custom_input],
	        outputs=[output_display],
	    )

	if __name__ == "__main__":
	    # Theme and stylesheet are supplied at launch time rather than to
	    # gr.Blocks(); the original note recommends this for Gradio 5.x/6.x.
	    # NOTE(review): launch() must accept theme=/css= in the installed Gradio
	    # release — confirm against the version pinned for this Space.
	    app.launch(server_name="0.0.0.0", server_port=7860, theme=gr.themes.Soft(), css=CUSTOM_CSS)