Spaces:

AhmedSamir1598
/

QThink

Sleeping

QThink / app.py

Ahmed Samir Nagy Mohammed

Fix Python 3.9 compatibility - use Optional instead of union operator for type hints

ff85a59 4 months ago

13.3 kB

	import gradio as gr
	from fastapi import FastAPI, Body, HTTPException
	from pydantic import BaseModel, Field
	from typing import List, Dict, Any, Optional
	import time
	import numpy as np
	import random

	# --- Import All Project Logic ---
	from mock_k2_api import call_mock_planner, call_mock_reasoner, call_mock_verifier
	from quyaml_parser import parse_quyaml_to_qiskit
	from qiskit.qasm2 import dumps as to_qasm2_str

	# Reference state vector used by the automated evaluation: QFT applied to |101⟩.
	# All eight amplitudes have magnitude 1/sqrt(8) ≈ 0.35355339.
	# NOTE(review): the entries match (1/sqrt(8))·exp(2πi·5k/8) listed for
	# k = 0, 4, 2, 6, 1, 5, 3, 7 (bit-reversed order) — confirm this is the
	# ordering the verifier's preview uses.
	GROUND_TRUTH_QFT_101_VECTOR = np.array(
	    [
	        complex(0.35355339, 0.0),
	        complex(-0.35355339, 0.0),
	        complex(0.0, 0.35355339),
	        complex(0.0, -0.35355339),
	        complex(-0.25, -0.25),
	        complex(0.25, 0.25),
	        complex(0.25, -0.25),
	        complex(-0.25, 0.25),
	    ]
	)

	# === 1. BACKEND LOGIC (FastAPI) ===
	# This is our existing FastAPI app. Gradio will wrap around it.
	# Application object the route decorators below register against.
	app = FastAPI(
	    version="0.3.0",
	    title="QThink Agentic POC API",
	    description="This API powers the QThink Gradio Demo.",
	)

	# --- Pydantic Models ---
	class SimulationPrompt(BaseModel):
	    # Request body of POST /solve/agentic-trace.
	    # The free-text prompt that is handed to the planner.
	    prompt: str

	class AgentStep(BaseModel):
	    # One entry of the trace returned by POST /solve/agentic-trace.
	    # Name of the agent that produced the step: "Planner", "Reasoner" or "Verifier".
	    agent: str
	    # Human-readable narration attached to the step.
	    thought: str
	    # Whatever the agent call returned (plan, task result or verification).
	    output: Any

	# --- API Endpoints ---
	@app.post("/tools/parse-quyaml-to-qasm")
	async def parse_quyaml_endpoint(quyaml_body: str = Body(...)):
	    """Convert a QuYAML circuit description into OpenQASM 2.0.

	    Args:
	        quyaml_body: Raw QuYAML text taken from the request body.

	    Returns:
	        A dict with ``status`` set to ``"success"``, the exported QASM under
	        ``qasm_2_0_output`` and ``str(circuit)`` under ``text_diagram``.

	    Raises:
	        HTTPException: Status 400 when parsing, QASM export or rendering of
	            the circuit fails for any reason.
	    """
	    try:
	        quantum_circuit = parse_quyaml_to_qiskit(quyaml_body)
	        qasm_output = to_qasm2_str(quantum_circuit)
	        return {
	            "status": "success",
	            "qasm_2_0_output": qasm_output,
	            "text_diagram": str(quantum_circuit),
	        }
	    except Exception as e:
	        # Chain the original error so its traceback is kept alongside the
	        # HTTP error instead of being reported as a secondary failure.
	        raise HTTPException(
	            status_code=400, detail=f"Error parsing QuYAML: {e}"
	        ) from e

	@app.post("/solve/agentic-trace")
	async def agentic_trace_endpoint(body: SimulationPrompt):
	    """Run the mock planner, reasoner and verifier and return the full trace.

	    Args:
	        body: Request payload carrying the user prompt.

	    Returns:
	        ``{"agent_trace": [...]}`` where each element is one serialized
	        ``AgentStep``: the planner step, one reasoner step per planned task,
	        and finally the verifier step.

	    Raises:
	        HTTPException: Status 500 when any stage of the workflow raises.
	    """
	    try:
	        agent_trace: List[AgentStep] = []

	        plan = call_mock_planner(body.prompt)
	        agent_trace.append(AgentStep(agent="Planner", thought="I have analyzed the prompt and created a step-by-step plan.", output=plan))

	        for task in plan:
	            result = call_mock_reasoner(task)
	            agent_trace.append(AgentStep(agent="Reasoner", thought=f"I have completed task: {task}", output=result))

	        # The verifier receives the AgentStep objects collected so far.
	        verification = call_mock_verifier(agent_trace)
	        agent_trace.append(AgentStep(agent="Verifier", thought="I have analyzed the full trace for correctness.", output=verification))

	        # Pydantic v2 renamed .dict() to .model_dump(); use whichever the
	        # installed version offers so no deprecation warning is emitted.
	        serialized = [
	            step.model_dump() if hasattr(step, "model_dump") else step.dict()
	            for step in agent_trace
	        ]
	        return {"agent_trace": serialized}
	    except Exception as e:
	        # Keep the root cause attached to the HTTP error.
	        raise HTTPException(status_code=500, detail=str(e)) from e

	# === 2. FRONTEND LOGIC (Gradio UI) ===
	# These functions will call our backend logic.

	# --- Function for the QuYAML Parser Tab ---
	def parse_quyaml_interface(quyaml_string):
	    """Gradio callback for the QuYAML tab.

	    Returns a ``(qasm_text, circuit_diagram)`` pair on success. If anything
	    goes wrong the pair is ``("Error: <message>", "")`` instead, so the
	    failure is shown in the first output component.
	    """
	    try:
	        parsed = parse_quyaml_to_qiskit(quyaml_string)
	        outputs = (to_qasm2_str(parsed), str(parsed))
	    except Exception as e:
	        outputs = (f"Error: {str(e)}", "")
	    return outputs

	# --- Function for the Agentic Trace Tab ---
	def agent_trace_interface(prompt):
	    """Gradio callback that runs the mock planner → reasoner → verifier flow.

	    Args:
	        prompt: Text entered by the user.

	    Returns:
	        A ``(verification, trace_log)`` pair. The click handler in this file
	        sends the first element to the JSON output and the second to the log
	        textbox. For an empty prompt the pair is
	        ``(None, "Please enter a prompt.")``.
	    """
	    if not prompt:
	        # The first slot feeds a JSON component, so the hint has to go to the
	        # log textbox (second slot); None leaves the JSON output empty.
	        return None, "Please enter a prompt."

	    plan = call_mock_planner(prompt)
	    log_parts = [
	        "Simulating agentic workflow...\n\n",
	        "--- Planner Agent ---\n",
	        "Plan:\n" + "\n".join(f"- {p}" for p in plan) + "\n\n",
	        "--- Reasoner Agent ---\n",
	    ]

	    all_results = []
	    for task in plan:
	        result = call_mock_reasoner(task)
	        all_results.append(result)
	        log_parts.append(f"Executing Task: {task}\nResult: {result}\n")

	    # Here the verifier is given the bare reasoner results.
	    verification = call_mock_verifier(all_results)
	    log_parts.append("\n--- Verifier Agent ---\n")
	    log_parts.append(f"Verification Status: {verification['status']}\nDetails: {verification}\n")

	    # Final verification dictionary first, full text log second.
	    return verification, "".join(log_parts)

	# === DGM HELPER FUNCTIONS ===

	def call_mock_dgm_self_improve(current_prompt: str, failure_analysis: str) -> str:
	    """Return the current prompt extended with one randomly picked hint.

	    The result is the original prompt, a blank line, one of three canned
	    "# DGM Suggestion" comments, and a "# Justification" line quoting the
	    failure analysis.
	    """
	    candidate_hints = (
	        "# DGM Suggestion: Add a directive to show mathematical derivations for each step.",
	        "# DGM Suggestion: Rephrase to request complex numbers in 'a + bi' format explicitly.",
	        "# DGM Suggestion: Instruct the model to double-check phase calculations before proceeding.",
	    )
	    chosen_hint = random.choice(candidate_hints)
	    return f"{current_prompt}\n\n{chosen_hint}\n# Justification: {failure_analysis}"

	def _parse_amplitude(token: str) -> complex:
	    """Turn one textual amplitude into a complex number without using eval.

	    Accepts plain literals such as "0.353", "0.353j" or "1+j", and the scaled
	    form "-0.353(1+j)" / "-0.353*(1+j)". Raises ValueError for anything else.
	    """
	    text = token.replace(" ", "")
	    if text.endswith(")") and "(" in text:
	        scale_text, _, inner = text[:-1].partition("(")
	        scale_text = scale_text.rstrip("*")
	        if scale_text in ("", "+"):
	            scale = 1.0
	        elif scale_text == "-":
	            scale = -1.0
	        else:
	            scale = float(scale_text)
	        return scale * complex(inner)
	    return complex(text)


	def extract_final_vector_from_trace(agent_trace: list) -> Optional[np.ndarray]:
	    """Parse the final state vector out of a mock agent trace.

	    The last step whose ``agent`` is ``'Verifier'`` is located and the string
	    at ``output['final_state_preview']`` is parsed. Two element formats are
	    understood: plain complex literals ("[0.353, -0.353, 0.353i, ...]") and a
	    real factor times a bracketed complex ("-0.353(1+j)"). ``i`` is accepted
	    as the imaginary unit and empty elements (e.g. a trailing comma) are
	    skipped.

	    Args:
	        agent_trace: Sequence of step dicts with ``'agent'`` and ``'output'``.

	    Returns:
	        A complex NumPy array, or ``None`` when there is no verifier step, the
	        preview is missing or not a string, no amplitudes are present, or any
	        element cannot be parsed.
	    """
	    try:
	        verifier_step = next(
	            step for step in reversed(agent_trace) if step['agent'] == 'Verifier'
	        )
	        vector_str = verifier_step['output']['final_state_preview']
	        cleaned = vector_str.strip().strip('[]').replace('i', 'j')
	        # Parsed explicitly instead of eval(): the text comes from agent output.
	        parts = [_parse_amplitude(p) for p in cleaned.split(',') if p.strip()]
	    except (StopIteration, KeyError, IndexError, ValueError, TypeError, AttributeError):
	        return None  # Failed to locate or parse the vector

	    if not parts:
	        return None
	    return np.array(parts, dtype=complex)

	def run_automated_evaluation(new_prompt_set: dict) -> dict:
	    """Run the mock simulation and score its final vector against ground truth.

	    Args:
	        new_prompt_set: Candidate prompts to evaluate. The mocked pipeline
	            below does not read it; it is accepted so callers already pass
	            what a real implementation would need.

	    Returns:
	        On success a dict with ``status`` ``'Completed'``, ``test_case``,
	        ``mse`` (formatted to six decimals), ``threshold`` and ``result``
	        (``'PASSED'`` when the MSE is below the threshold, else ``'FAILED'``).
	        When the final vector cannot be parsed or compared, a dict with
	        ``status`` ``'Error'`` and a ``message``.
	    """
	    # Simulate the agentic trace using the new prompt logic (mocked)
	    prompt_for_test_case = "Simulate a 3-qubit Quantum Fourier Transform on the state |101⟩."
	    plan = call_mock_planner(prompt_for_test_case)
	    trace = [{'agent': 'Reasoner', 'output': call_mock_reasoner(task)} for task in plan]
	    verification = call_mock_verifier(trace)
	    trace.append({'agent': 'Verifier', 'output': verification})

	    # Extract the final vector from this simulated trace
	    predicted_vector = extract_final_vector_from_trace(trace)
	    if predicted_vector is None:
	        return {'status': 'Error', 'message': 'Evaluation failed: Could not parse final vector from agent output.'}

	    try:
	        predicted_vector = np.asarray(predicted_vector, dtype=complex)
	    except (TypeError, ValueError):
	        return {'status': 'Error', 'message': 'Evaluation failed: Final vector contains non-numeric entries.'}

	    # A length mismatch would otherwise surface as a broadcasting error.
	    if predicted_vector.shape != GROUND_TRUTH_QFT_101_VECTOR.shape:
	        return {
	            'status': 'Error',
	            'message': (
	                'Evaluation failed: Expected '
	                f'{GROUND_TRUTH_QFT_101_VECTOR.size} amplitudes, got {predicted_vector.size}.'
	            ),
	        }

	    # Normalize the prediction for a fair comparison; a zero or non-finite
	    # norm cannot be normalized and would only yield NaN scores.
	    norm = np.linalg.norm(predicted_vector)
	    if not np.isfinite(norm) or norm == 0:
	        return {'status': 'Error', 'message': 'Evaluation failed: Final vector has zero or non-finite norm.'}
	    # Out-of-place division: does not mutate the parser's array and does not
	    # depend on its original dtype.
	    predicted_vector = predicted_vector / norm

	    # Calculate Mean Squared Error
	    mse = np.mean(np.abs(GROUND_TRUTH_QFT_101_VECTOR - predicted_vector) ** 2)
	    threshold = 0.01
	    result = "PASSED" if mse < threshold else "FAILED"

	    return {
	        'status': 'Completed',
	        'test_case': 'QFT(|101⟩)',
	        'mse': f"{mse:.6f}",
	        'threshold': threshold,
	        'result': result,
	    }

	# --- Function for the DGM Tab ---
	def dgm_interface(current_prompt, failure_analysis):
	    """Gradio callback for one DGM cycle: suggest a prompt, then evaluate it.

	    Args:
	        current_prompt: The reasoner prompt to improve.
	        failure_analysis: Description of what went wrong; required.

	    Returns:
	        A text report containing the suggested prompt, the benchmark figures
	        and a conclusion. If ``failure_analysis`` is empty, a short request
	        to provide one is returned instead.
	    """
	    if not failure_analysis:
	        return "Please provide a failure analysis to guide the improvement."

	    # Step 1: Self-Modification (Suggest a new prompt)
	    suggested_prompt = call_mock_dgm_self_improve(current_prompt, failure_analysis)

	    # Step 2: Automated Evaluation (Test the new prompt)
	    new_prompt_set = {'reasoner': suggested_prompt}  # In a real app, this would be a full set
	    evaluation_result = run_automated_evaluation(new_prompt_set)

	    # Step 3: Format the output for the UI
	    report = [
	        "--- DGM SELF-MODIFICATION ---\n",
	        "Generated a new candidate prompt based on failure analysis:\n",
	        f'"""{suggested_prompt}"""\n\n',
	        "--- AUTOMATED EVALUATION ---\n",
	        f"Running benchmark test: {evaluation_result.get('test_case', 'N/A')}\n",
	        f"Mean Squared Error (MSE): {evaluation_result.get('mse', 'N/A')}\n",
	        f"Success Threshold: MSE < {evaluation_result.get('threshold', 'N/A')}\n",
	        "--------------------------------\n",
	        f"EVALUATION RESULT: {evaluation_result.get('result', 'ERROR')}\n",
	        "--------------------------------\n",
	    ]

	    if evaluation_result.get('status') == 'Error':
	        # The benchmark never produced a score; show why rather than
	        # reporting it as a failed benchmark.
	        report.append(f"Evaluation Error: {evaluation_result.get('message', 'no details provided')}\n")
	        report.append("Conclusion: The suggested prompt could not be evaluated and will be discarded.")
	    elif evaluation_result.get('result') == 'PASSED':
	        report.append("Conclusion: The suggested prompt is an improvement and will be added to the agent archive.")
	    else:
	        report.append("Conclusion: The suggested prompt did not pass the benchmark and will be discarded.")

	    return "".join(report)

	# --- Define the Gradio Interface ---
	# Builds the three-tab Blocks UI bound to `demo` and wires each button to its
	# callback at the end of the block.
	# NOTE(review): indentation was lost in this copy of the file; the nesting of
	# components under Tabs/TabItem/Row/Column has to be restored before this
	# block can run — confirm the intended layout against the deployed app.
	with gr.Blocks(theme=gr.themes.Soft(), title="QThink Demo") as demo:
	gr.Markdown("# ⚛️ QThink: Agentic Quantum Co-Pilot")
	# NOTE(review): the text below says "two core features" while three tabs
	# are defined further down.
	gr.Markdown("This interface demonstrates the two core features of our hackathon project. Use the tabs below to explore.")

	with gr.Tabs():
	# Tab 1: prompt in, verifier JSON and full text log out.
	with gr.TabItem("Agentic Workflow Demo"):
	gr.Markdown("### Simulate the full agentic workflow.")
	with gr.Row():
	prompt_input = gr.Textbox(lines=5, label="User Prompt", placeholder="Enter your prompt here...")
	execute_button = gr.Button("Execute Workflow", variant="primary")
	gr.Markdown("### Agent Trace Log")
	trace_output_log = gr.Textbox(lines=20, label="Full Agent Conversation Log", interactive=False)
	gr.Markdown("### Final Verification Output")
	trace_output_final = gr.JSON(label="Final Output from Verifier Agent")

	# NOTE(review): the "\|" in the example prompt looks like a stray escape;
	# presumably it should read |101⟩ — confirm.
	example_prompt = gr.Examples(
	examples=["Simulate a 3-qubit Quantum Fourier Transform on the state \|101⟩."],
	inputs=prompt_input
	)

	# Tab 2: QuYAML text in, QASM text and circuit diagram out.
	with gr.TabItem("QuYAML Parser Tool"):
	gr.Markdown("### Test our novel, token-efficient QuYAML format.")
	with gr.Row():
	quyaml_input = gr.Textbox(lines=15, label="QuYAML Input", placeholder="Enter your QuYAML circuit definition here...")
	with gr.Column():
	# NOTE(review): the QASM output is displayed with language="python" —
	# presumably just for highlighting; confirm.
	qasm_output = gr.Code(label="Generated QASM 2.0", language="python")
	diagram_output = gr.Textbox(label="Text Circuit Diagram", interactive=False)

	parse_button = gr.Button("Parse QuYAML", variant="primary")

	# Single Bell-state example offered for the QuYAML input box.
	example_quyaml = gr.Examples(
	examples=[
	["""# QYAML v0.1: Bell State
	circuit: BellState
	qreg: q[2]
	creg: c[2]
	instructions:
	- h q[0]
	- cx q[0], q[1]
	- measure q, c"""]
	],
	inputs=quyaml_input
	)

	# Tab 3: current prompt and failure analysis in, DGM cycle report out.
	with gr.TabItem("DGM Self-Improvement Cycle"):
	gr.Markdown("### Simulate the Darwin Gödel Machine Loop on Prompts")
	gr.Markdown("This tab demonstrates how QThink can self-improve. It takes a 'failure analysis' of a previous run, uses an LLM to suggest a new prompt, and then automatically evaluates if the new prompt produces a better result on a benchmark task.")

	with gr.Row():
	with gr.Column(scale=1):
	dgm_current_prompt = gr.Textbox(
	value="You are a powerful mathematical and logical reasoning engine. Your task is to solve the following step precisely and show your work.",
	lines=5,
	label="Current 'Reasoner' Prompt (Version 0)"
	)
	dgm_failure_input = gr.Textbox(
	lines=3,
	label="Failure Analysis / Improvement Goal",
	placeholder="e.g., The mathematical explanation for complex number steps was unclear."
	)
	dgm_improve_button = gr.Button("Run DGM Improvement Cycle", variant="primary")

	with gr.Column(scale=2):
	dgm_output_log = gr.Textbox(
	lines=15,
	label="DGM Cycle Result (Suggested Prompt & Automated Evaluation)",
	interactive=False,
	placeholder="Results of the self-improvement cycle will appear here..."
	)

	# --- Connect functions to interfaces ---
	# Output order must match each callback's return order:
	# parse_quyaml_interface -> (qasm, diagram);
	# agent_trace_interface -> (verification, trace_log).
	parse_button.click(fn=parse_quyaml_interface, inputs=quyaml_input, outputs=[qasm_output, diagram_output])
	execute_button.click(fn=agent_trace_interface, inputs=prompt_input, outputs=[trace_output_final, trace_output_log])
	dgm_improve_button.click(fn=dgm_interface, inputs=[dgm_current_prompt, dgm_failure_input], outputs=dgm_output_log)

	# === 3. MOUNTING & LAUNCHING ===
	# Serve the Gradio UI from the root path of the FastAPI app; `app` is rebound
	# to the object returned by the mount call.
	app = gr.mount_gradio_app(app=app, blocks=demo, path="/")

	# If you want to run this file locally, you can add this:
	# if __name__ == "__main__":
	# import uvicorn
	# uvicorn.run(app, host="0.0.0.0", port=7860)