Spaces:

MCP-1st-Birthday
/

MCP-Blockly

Running

App Files Files Community

MCP-Blockly / project /test.py

owenkaplinsky

Update project/test.py

599c773 verified 20 days ago

raw

history blame contribute delete

17.7 kB

	from fastapi import FastAPI, Request, HTTPException
	from fastapi.middleware.cors import CORSMiddleware
	import gradio as gr
	import os
	import ast
	import inspect
	import pandas as pd
	import multiprocessing
	import time
	from collections import defaultdict
	import uuid
	import logging

	app = FastAPI()

	app.add_middleware(
	CORSMiddleware,
	allow_origins=["*"],
	allow_credentials=True,
	allow_methods=["*"],
	allow_headers=["*"],
	)

	# Per-session storage for the latest Blockly-generated code
	latest_blockly_code = defaultdict(str)

	logging.basicConfig(level=logging.INFO)
	logger = logging.getLogger("test_app")

	# ---------------------------------------------------------------------------
	# Session helpers
	# ---------------------------------------------------------------------------

	def require_session_id(data_or_query):
	"""
	Ensure every request carries a session_id; otherwise reject.
	"""
	session_id = None
	if isinstance(data_or_query, dict):
	session_id = data_or_query.get("session_id")
	else:
	session_id = data_or_query

	if not session_id:
	raise HTTPException(status_code=400, detail="session_id is required")
	return session_id


	# ---------------------------------------------------------------------------
	# Safe execution helpers (protect against infinite loops and crashes)
	# ---------------------------------------------------------------------------

	def _worker_exec(code_str, inputs, queue, openai_key=None, hf_key=None):
	"""
	Execute user-generated code in an isolated process.
	Returns output through a queue to avoid sharing state.
	"""
	try:
	# Inject keys into environment for this process only (not persisted outside)
	if openai_key:
	os.environ["OPENAI_API_KEY"] = openai_key
	if hf_key:
	os.environ["HF_TOKEN"] = hf_key

	result = ""

	def capture_result(msg):
	nonlocal result
	result = msg

	# Execution environment
	env = {
	"reply": capture_result,
	"__builtins__": __builtins__,
	}

	# Minimal imports that Blockly outputs may rely on
	exec("import os\nimport pandas as pd\nimport ast\nimport inspect", env)

	exec(code_str, env)
	if "create_mcp" in env:
	func = env["create_mcp"]
	sig = inspect.signature(func)
	params = list(sig.parameters.values())
	in_types = getattr(func, "in_types", [])

	typed_args = []
	for i, arg in enumerate(inputs):
	if i >= len(params):
	break
	if arg is None or arg == "":
	typed_args.append(None)
	continue

	target_type = in_types[i] if i < len(in_types) else params[i].annotation
	try:
	if target_type in (int, "int", "integer"):
	typed_args.append(int(arg))
	elif target_type in (float, "float"):
	typed_args.append(float(arg))
	elif target_type in (bool, "bool", "boolean"):
	typed_args.append(bool(arg) if isinstance(arg, bool) else str(arg).lower() in ("true", "1", "yes"))
	elif target_type in (list, "list"):
	if isinstance(arg, list):
	typed_args.append(arg)
	else:
	try:
	typed_args.append(ast.literal_eval(arg))
	except Exception:
	typed_args.append([arg])
	elif target_type in ("any", "Any"):
	typed_args.append(arg)
	elif target_type == inspect._empty:
	typed_args.append(str(arg))
	else:
	typed_args.append(str(arg))
	except Exception:
	typed_args.append(arg)

	if len(typed_args) > 0 and isinstance(typed_args[0], list):
	typed_args[0] = pd.DataFrame(typed_args[0])

	result = env["create_mcp"](*typed_args)
	elif "process_input" in env:
	env["process_input"](inputs)

	queue.put({"ok": True, "result": result if result not in (None, "") else "No output generated"})
	except Exception as e:
	queue.put({"ok": False, "result": f"Error: {str(e)}"})


	# ---------------------------------------------------------------------------
	# API endpoints
	# ---------------------------------------------------------------------------

	# Gets REAL Python code, not the LLM DSL
	@app.post("/update_code")
	async def update_code(request: Request):
	data = await request.json()
	session_id = require_session_id(data)
	latest_blockly_code[session_id] = data.get("code", "")
	logger.info(f"[update_code] Stored code; length={len(latest_blockly_code[session_id])}")
	return {"ok": True}

	# Sends the latest code to chat.py so that the agent will be able to use the MCP
	@app.get("/get_latest_code")
	async def get_latest_code(request: Request):
	session_id = require_session_id(dict(session_id=request.query_params.get("session_id")))
	logger.info(f"[get_latest_code] Returning code; length={len(latest_blockly_code.get(session_id, ''))}")
	return {"code": latest_blockly_code.get(session_id, "")}

	def execute_blockly_logic(user_inputs, session_id, openai_key=None, hf_key=None):
	"""
	Execute the Blockly-generated code for a specific session in an isolated, timed subprocess.
	"""
	if not session_id:
	return "No session_id provided to execute code."
	logger.info(f"[execute_blockly_logic] executing; inputs={user_inputs}")
	code_for_session = latest_blockly_code.get(session_id, "")
	if not code_for_session.strip():
	return "No Blockly code available"

	# Strip Gradio scaffolding before execution
	lines = code_for_session.split('\n')
	filtered_lines = []
	skip_mode = False
	in_demo_block = False

	for line in lines:
	# Skip import gradio line
	if 'import gradio' in line:
	continue

	# Skip Gradio interface creation and any demo-related lines
	if 'demo = gr.Interface' in line:
	in_demo_block = True
	skip_mode = True
	continue
	elif 'demo.launch' in line:
	skip_mode = False
	in_demo_block = False
	continue
	elif in_demo_block:
	# Skip everything in the demo block (multi-line Interface declaration)
	continue

	# Skip any standalone gr. calls
	if 'gr.' in line:
	continue

	if not skip_mode:
	filtered_lines.append(line)

	code_to_run = '\n'.join(filtered_lines)
	# Launch in isolated subprocess
	q = multiprocessing.Queue()
	p = multiprocessing.Process(target=_worker_exec, args=(code_to_run, user_inputs, q, openai_key, hf_key), daemon=True)
	p.start()
	p.join(timeout=8)

	if p.is_alive():
	p.terminate()
	p.join()
	logger.error("[execute_blockly_logic] timeout")
	return "Error: Execution timed out"

	if q.empty():
	return "No output generated"

	msg = q.get()
	return msg.get("result", "No output generated")


	def build_interface():
	with gr.Blocks(title="Test MCP Server") as demo:
	session_state = gr.State()

	def init_session(req: gr.Request):
	sid = None
	q_sid = None
	c_sid = None
	try:
	q_sid = req.query_params.get("session_id")
	except Exception:
	q_sid = None
	try:
	c_sid = req.cookies.get("mcp_blockly_session_id")
	except Exception:
	c_sid = None

	sid = q_sid or c_sid
	logger.info("[init_session] session resolved")
	if not sid:
	logger.error("Gradio test interface loaded without session_id (neither query param nor cookie); refresh/process will be no-ops.")
	return sid

	demo.load(init_session, inputs=None, outputs=[session_state], queue=False)

	def hide_all_fields():
	# Hide everything after initial mount so they don't flash visible
	return [gr.update(visible=False, value="") for _ in input_fields + output_fields]

	# Create a fixed number of potential input fields (max 10)
	input_fields = []
	input_labels = []
	input_group_items = []

	with gr.Accordion("MCP Inputs", open=True):
	for i in range(10):
	# Create inputs that can be shown/hidden
	# Gradio 6 lazy-renders hidden components; start visible so they mount, then hide via refresh updates
	txt = gr.Textbox(label=f"Input {i+1}", visible=True)
	input_fields.append(txt)
	input_group_items.append(txt)

	output_fields = []

	with gr.Accordion("MCP Outputs", open=True):
	for i in range(10):
	# Start visible to force mount; refresh updates will hide/show appropriately
	out = gr.Textbox(label=f"Output {i+1}", visible=True, interactive=False)
	output_fields.append(out)

	with gr.Row():
	submit_btn = gr.Button("Test")
	refresh_btn = gr.Button("Refresh")

	def refresh_inputs(session_id):
	if not session_id:
	logger.error("refresh_inputs called without session_id; no data will be returned.")
	return [gr.update(visible=False, value="") for _ in input_fields + output_fields]
	import re
	code_str = latest_blockly_code.get(session_id, "")
	logger.info(f"[refresh_inputs] code length={len(code_str)}")

	def normalize_type_name(type_name):
	if not type_name:
	return "string"
	if isinstance(type_name, str):
	type_name_lower = type_name.lower()
	if "int" in type_name_lower:
	return "integer"
	if "float" in type_name_lower:
	return "float"
	if "list" in type_name_lower:
	return "list"
	if "bool" in type_name_lower:
	return "boolean"
	if "any" in type_name_lower:
	return "any"
	return "string"

	# Look for the create_mcp function definition
	# Allow multiline function signatures
	pattern = r'def\s+create_mcp\s\((.?)\)\s*:'
	match = re.search(pattern, code_str, re.DOTALL)

	params = []
	# Prefer explicit in_types if present
	in_types_match = re.search(r'in_types\s=\s(\[.*?\])', code_str, re.DOTALL)
	in_types = []
	if in_types_match:
	try:
	in_types = ast.literal_eval(in_types_match.group(1))
	except Exception:
	in_types = []

	if match:
	params_str = match.group(1)
	if params_str.strip():
	# Parse parameters to extract names and types
	for idx, param in enumerate(params_str.split(',')):
	param = param.strip()
	name = param.split(':')[0].strip() if param else param
	# Prefer in_types entry, fall back to annotation parsing
	display_type = normalize_type_name(in_types[idx] if idx < len(in_types) else None)
	if ':' in param and (not in_types or idx >= len(in_types)):
	_, type_hint = param.split(':')
	display_type = normalize_type_name(type_hint.strip())

	params.append({
	'name': name,
	'type': display_type
	})

	# Detect output count (out_amt = N)
	out_amt_match = re.search(r'out_amt\s=\s(\d+)', code_str)
	out_amt = int(out_amt_match.group(1)) if out_amt_match else 0

	out_names_match = re.search(r'out_names\s=\s(\[.*?\])', code_str, re.DOTALL)
	if out_names_match:
	try:
	out_names = ast.literal_eval(out_names_match.group(1))
	except Exception:
	out_names = []
	else:
	out_names = []

	out_types_match = re.search(r'out_types\s=\s(\[.*?\])', code_str, re.DOTALL)
	if out_types_match:
	try:
	out_types = ast.literal_eval(out_types_match.group(1))
	except Exception:
	out_types = []
	else:
	out_types = []
	# Convert output types: handle string, integer, float, list, boolean, any
	out_types = [
	"string" if t == "str" else
	"integer" if t == "int" else
	"float" if t == "float" else
	"list" if t == "list" else
	"boolean" if t == "bool" else
	"any" if t == "Any" else t
	for t in out_types
	]

	# Update visibility + clear output fields
	output_updates = []
	for i, field in enumerate(output_fields):
	if i < out_amt:
	output_updates.append(gr.update(visible=True, label=f"{out_names[i]} ({out_types[i]})", value=""))
	else:
	output_updates.append(gr.update(visible=False, value=""))

	# Update visibility + clear input fields
	updates = []
	for i, field in enumerate(input_fields):
	if i < len(params):
	param = params[i]
	note = ""
	if param["type"] == "list":
	note = "- (use like: [\"a\", \"b\", ...])"

	updates.append(gr.update(
	visible=True,
	label=f"{param['name']} ({param['type']}) {note}",
	value=""
	))
	else:
	updates.append(gr.update(visible=False, value=""))

	return updates + output_updates

	def process_input(*args, request: gr.Request = None):
	*inputs, session_id = args
	if not session_id:
	logger.error("process_input called without session_id; aborting.")
	return [""] * 10

	openai_key = None
	hf_key = None
	if request:
	openai_key = request.headers.get("x-openai-key") or request.cookies.get("mcp_openai_key")
	hf_key = request.headers.get("x-hf-key") or request.cookies.get("mcp_hf_key")

	result = execute_blockly_logic(inputs, session_id, openai_key=openai_key, hf_key=hf_key)

	# Get output types to determine how to format the result
	import re
	code_str = latest_blockly_code.get(session_id, "")
	out_types_match = re.search(r'out_types\s=\s(\[.*?\])', code_str, re.DOTALL)
	out_types = []
	if out_types_match:
	try:
	out_types = ast.literal_eval(out_types_match.group(1))
	# Convert Python type strings to display names
	out_types = [
	"string" if t == "str" else
	"integer" if t == "int" else
	"float" if t == "float" else
	"list" if t == "list" else
	"boolean" if t == "bool" else
	"any" if t == "Any" else t
	for t in out_types
	]
	except Exception:
	out_types = []

	# If result is a tuple or list
	if isinstance(result, (tuple, list)):
	# Check if the first output type is "list" or "any" - if so, convert to string representation
	if out_types and out_types[0] in ("list", "any"):
	return [str(result)] + [""] * 9
	else:
	# Multiple outputs - each item is a separate output
	return list(result) + [""] * (10 - len(result))

	# If it's a single value, put it in the first slot and pad the rest
	return [result] + [""] * 9

	# When refresh is clicked, update input field visibility and labels
	refresh_btn.click(
	refresh_inputs,
	inputs=[session_state],
	outputs=input_fields + output_fields,
	queue=False
	)

	submit_btn.click(
	process_input,
	inputs=input_fields + [session_state],
	outputs=output_fields,
	queue=False
	)

	# After mount, hide all fields so they don't stay visible until refreshed
	demo.load(
	hide_all_fields,
	inputs=None,
	outputs=input_fields + output_fields,
	queue=False
	)

	return demo


	def get_gradio_interface():
	return build_interface()


	if __name__ == "__main__":
	demo = build_interface()
	app = gr.mount_gradio_app(app, demo, path="/")