Spaces:

taboola-cz
/

ClassLens

Runtime error

ClassLens / chatkit /backend /app /server.py

chih.yikuan

email-done

5ee5085 about 1 month ago

21.9 kB

	"""ClassLens ChatKit server with exam analysis agent and tools."""

	from __future__ import annotations

	import json
	from typing import Any, AsyncIterator

	from agents import Runner, Agent, function_tool
	from chatkit.agents import AgentContext, simple_to_agent_input, stream_agent_response
	from chatkit.server import ChatKitServer
	from chatkit.types import ThreadMetadata, ThreadStreamEvent, UserMessageItem

	from .memory_store import MemoryStore
	from .google_sheets import fetch_google_form_responses, parse_csv_responses, fetch_public_sheet, extract_sheet_id
	from .email_service import send_email_report
	from .database import save_report
	from .status_tracker import update_status, add_reasoning_step, WorkflowStep, reset_status


	# Maximum number of thread items loaded as agent input for one response.
	MAX_RECENT_ITEMS = 50

	# Model used when the request selects none, or selects one that is not listed
	# in AVAILABLE_MODELS. Chosen for cost efficiency (~10x cheaper).
	DEFAULT_MODEL = "gpt-4.1-mini"

	# Models a request may select, keyed by model id. Each entry carries the
	# display name, a short description and a relative cost label; these strings
	# are data (shown as-is), not comments.
	AVAILABLE_MODELS = {
	    "gpt-4.1-mini": {
	        "name": "GPT-4.1-mini",
	        "description": "快速且經濟實惠（默認）",
	        "cost": "低",
	    },
	    "gpt-4o": {
	        "name": "GPT-4o",
	        "description": "高性能，適合複雜分析",
	        "cost": "中",
	    },
	    "gpt-4o-mini": {
	        "name": "GPT-4o-mini",
	        "description": "平衡性能與成本",
	        "cost": "低",
	    },
	    "gpt-5-pro": {
	        "name": "GPT-5 Pro",
	        "description": "最新旗艦模型，具備強大推理能力",
	        "cost": "高",
	    },
	    "o3-pro": {
	        "name": "O3 Pro",
	        "description": "深度推理模型，適合複雜問題分析",
	        "cost": "高",
	    },
	    "o1-preview": {
	        "name": "O1 Preview",
	        "description": "具備深度推理能力",
	        "cost": "高",
	    },
	    "o1-mini": {
	        "name": "O1 Mini",
	        "description": "具備推理能力，經濟實惠",
	        "cost": "中",
	    },
	}

	# Session id the tool functions attach to their reasoning steps. This is a
	# single module-wide value (simplified - in production use proper session
	# management).
	# NOTE(review): concurrent requests would presumably overwrite each other's
	# id here - confirm before relying on it under load.
	_current_session_id = "default"


	def set_session_id(session_id: str) -> None:
	    """Store *session_id* as the module-wide current session id.

	    The tool functions in this module read ``_current_session_id`` when they
	    record reasoning steps, so whatever is set here is the session those
	    steps are attributed to.

	    Args:
	        session_id: Identifier to use for subsequent reasoning-step logging.
	    """
	    # Rebinds the module global; there is exactly one value per process.
	    global _current_session_id
	    _current_session_id = session_id


	def _lookup(source: Any, key: str) -> Any:
	    """Return ``source.get(key)``, or None when *source* has no callable ``get``."""
	    getter = getattr(source, "get", None)
	    return getter(key) if callable(getter) else None


	def get_model_from_context(context: dict[str, Any]) -> str:
	    """Resolve the model id requested for this call.

	    Candidates are consulted in this order and the first truthy one wins:

	    1. ``context["model"]``
	    2. ``context["request"].get("model")`` (mapping-style request)
	    3. ``context["request"].query_params.get("model")``
	    4. ``context["request"].headers.get("x-model")``

	    Args:
	        context: Request context; may hold a ``"model"`` entry and/or a
	            ``"request"`` entry (a mapping or a request-like object).

	    Returns:
	        The winning candidate if it is a key of ``AVAILABLE_MODELS``,
	        otherwise ``DEFAULT_MODEL``. A missing, ``None`` or oddly shaped
	        request never raises; it simply contributes no candidate.
	    """
	    request = context.get("request")

	    # query_params / headers are attributes of a request object, so they are
	    # read with getattr. Reading them through request.get(...) would look the
	    # name up as a mapping key instead and never find the real query string.
	    query_params = getattr(request, "query_params", None)
	    headers = getattr(request, "headers", None)

	    model = (
	        context.get("model")
	        or _lookup(request, "model")
	        or _lookup(query_params, "model")
	        or _lookup(headers, "x-model")
	    )

	    # The isinstance guard keeps an unhashable value (e.g. a list) from
	    # raising TypeError in the membership test.
	    if isinstance(model, str) and model in AVAILABLE_MODELS:
	        return model
	    return DEFAULT_MODEL


	def create_agent(model: str) -> Agent[AgentContext[dict[str, Any]]]:
	    """Build a ClassLens agent that runs on *model*.

	    Args:
	        model: Model id handed to the ``Agent`` constructor unchanged.

	    Returns:
	        A new agent named "ClassLens" that uses ``EXAMINSIGHT_INSTRUCTIONS``
	        as its instructions and has the five function tools of this module
	        attached.
	    """
	    # Tool order is kept exactly as the agent has always been given it.
	    toolset = [
	        fetch_responses,
	        parse_csv_data,
	        send_report_email,
	        save_analysis_report,
	        log_reasoning,
	    ]
	    agent_type = Agent[AgentContext[dict[str, Any]]]
	    return agent_type(
	        model=model,
	        name="ClassLens",
	        instructions=EXAMINSIGHT_INSTRUCTIONS,
	        tools=toolset,
	    )


	# =============================================================================
	# Tool Definitions with Status Tracking
	# =============================================================================

	@function_tool
	async def fetch_responses(
	    google_form_url: str,
	    teacher_email: str = "",
	    answer_key_json: str = ""
	) -> str:
	    """
	    Fetch student responses from a Google Form/Sheets URL.
	    First tries to fetch as a public sheet (no auth needed).
	    If that fails and teacher_email is provided, tries OAuth.

	    Args:
	        google_form_url: The URL of the Google Form response spreadsheet
	        teacher_email: The teacher's email address for authentication (optional for public sheets)
	        answer_key_json: Optional JSON string with correct answers, e.g. {"Q1": "4", "Q2": "acceleration"}

	    Returns:
	        JSON string with normalized exam data including questions and student responses
	    """
	    # The docstring wording is left untouched: function_tool derives the tool
	    # description shown to the model from it (Agents SDK behaviour).
	    #
	    # Flow: validate URL -> public fetch -> optional OAuth fetch. Each failure
	    # returns its own error payload; in particular a failed OAuth fetch returns
	    # the OAuth error instead of falling through to the "invalid URL" message.
	    await add_reasoning_step(_current_session_id, "tool", f"🔧 Tool: fetch_responses(url={google_form_url[:50]}...)", "active")

	    # The answer key is best-effort: malformed JSON is deliberately ignored and
	    # the fetch proceeds without a key rather than failing the whole tool call.
	    answer_key = None
	    if answer_key_json:
	        try:
	            answer_key = json.loads(answer_key_json)
	        except json.JSONDecodeError:
	            answer_key = None

	    sheet_id = extract_sheet_id(google_form_url)
	    if not sheet_id:
	        await add_reasoning_step(_current_session_id, "error", "❌ Invalid URL format", "completed")
	        return json.dumps({
	            "error": "Could not extract sheet ID from URL. Please provide a valid Google Sheets URL.",
	            "hint": "URL should look like: https://docs.google.com/spreadsheets/d/SHEET_ID/edit"
	        }, indent=2)

	    # First, try to fetch as a public sheet (no OAuth needed).
	    await add_reasoning_step(_current_session_id, "tool", "📥 Downloading spreadsheet data...", "active")
	    public_result = await fetch_public_sheet(sheet_id, answer_key)
	    if "error" not in public_result:
	        await add_reasoning_step(_current_session_id, "result", "✅ Data fetched successfully", "completed")
	        return json.dumps(public_result, indent=2)

	    if not teacher_email:
	        # No credentials to fall back on: return the public-fetch error plus a
	        # hint on how to unlock private sheets.
	        public_result["hint"] = "To access private sheets, provide your email and connect your Google account."
	        await add_reasoning_step(_current_session_id, "error", "❌ Could not access sheet", "completed")
	        return json.dumps(public_result, indent=2)

	    # Public fetch failed and we have the teacher's email: try OAuth.
	    await add_reasoning_step(_current_session_id, "tool", "🔐 Using OAuth to access private sheet...", "active")
	    oauth_result = await fetch_google_form_responses(google_form_url, teacher_email, answer_key)
	    if "error" not in oauth_result:
	        await add_reasoning_step(_current_session_id, "result", "✅ Data fetched via OAuth", "completed")
	        return json.dumps(oauth_result, indent=2)

	    # Both access paths failed; surface the OAuth error, which is the most
	    # specific explanation available at this point.
	    await add_reasoning_step(_current_session_id, "error", "❌ Could not access sheet", "completed")
	    return json.dumps(oauth_result, indent=2)


	@function_tool
	async def parse_csv_data(
	    csv_content: str,
	    answer_key_json: str = ""
	) -> str:
	    """
	    Parse CSV content directly (for manual upload fallback).

	    Args:
	        csv_content: The raw CSV content with headers and student responses
	        answer_key_json: Optional JSON string with correct answers

	    Returns:
	        JSON string with normalized exam data
	    """
	    # The docstring wording is left untouched: function_tool derives the tool
	    # description shown to the model from it (Agents SDK behaviour).
	    await add_reasoning_step(_current_session_id, "tool", "🔧 Tool: parse_csv_data()", "active")

	    # An empty or malformed answer key both end up as None, i.e. the CSV is
	    # parsed without a key.
	    try:
	        parsed_key = json.loads(answer_key_json) if answer_key_json else None
	    except json.JSONDecodeError:
	        parsed_key = None

	    normalized = parse_csv_responses(csv_content, parsed_key)

	    # NOTE(review): the success step is recorded unconditionally; whether
	    # parse_csv_responses can report an error in its result is not visible here.
	    await add_reasoning_step(_current_session_id, "result", "✅ CSV parsed successfully", "completed")

	    return json.dumps(normalized, indent=2)


	@function_tool
	async def send_report_email(
	    email: str,
	    subject: str,
	    body_markdown: str
	) -> str:
	    """
	    Send the exam analysis report to the teacher via email.

	    Args:
	        email: The teacher's email address
	        subject: Email subject line
	        body_markdown: The full report in markdown format

	    Returns:
	        JSON string with status of the email send operation
	    """
	    # The docstring wording is left untouched: function_tool derives the tool
	    # description shown to the model from it (Agents SDK behaviour).
	    await add_reasoning_step(_current_session_id, "tool", f"🔧 Tool: send_report_email(to={email})", "active")

	    outcome = await send_email_report(email, subject, body_markdown)

	    # Anything other than status == "ok" is reported as a failure, with the
	    # service's own message when it supplies one.
	    if outcome.get("status") != "ok":
	        failure_text = f"❌ Email failed: {outcome.get('message', 'unknown error')}"
	        await add_reasoning_step(_current_session_id, "error", failure_text, "completed")
	    else:
	        await add_reasoning_step(_current_session_id, "result", "✅ Email sent successfully!", "completed")

	    # The raw service result is handed back to the agent unchanged.
	    return json.dumps(outcome)


	@function_tool
	async def save_analysis_report(
	    teacher_email: str,
	    exam_title: str,
	    report_markdown: str,
	    report_json: str
	) -> str:
	    """
	    Save the analysis report to the database for future reference.

	    Args:
	        teacher_email: The teacher's email address
	        exam_title: Title of the exam
	        report_markdown: The report in markdown format
	        report_json: The structured report data in JSON format

	    Returns:
	        Confirmation message
	    """
	    # The docstring wording is left untouched: function_tool derives the tool
	    # description shown to the model from it (Agents SDK behaviour).
	    await add_reasoning_step(_current_session_id, "tool", f"🔧 Tool: save_analysis_report(exam={exam_title})", "active")

	    # Persist first and announce success only afterwards, so a failed save is
	    # never shown to the user as "saved". The exception is re-raised unchanged
	    # so the caller sees exactly what it saw before.
	    try:
	        await save_report(teacher_email, exam_title, report_markdown, report_json)
	    except Exception:
	        await add_reasoning_step(_current_session_id, "error", "❌ Failed to save report", "completed")
	        raise

	    await add_reasoning_step(_current_session_id, "result", "✅ Report saved to database", "completed")
	    return json.dumps({"status": "saved", "message": "Report saved successfully"})


	@function_tool
	async def log_reasoning(thought: str) -> str:
	    """
	    Log your current thinking or reasoning step.
	    Use this to show the user what you're analyzing or planning.

	    Args:
	        thought: Your current thought, reasoning, or task breakdown

	    Returns:
	        Confirmation
	    """
	    # The docstring wording is left untouched: function_tool derives the tool
	    # description shown to the model from it (Agents SDK behaviour).
	    # The thought is recorded as an already-completed "thinking" step for the
	    # current session; the return value is a fixed acknowledgement.
	    await add_reasoning_step(_current_session_id, "thinking", thought, "completed")
	    acknowledgement = {"status": "logged"}
	    return json.dumps(acknowledgement)


	# =============================================================================
	# ClassLens Agent Definition
	# =============================================================================

	# System prompt for the ClassLens agent: create_agent() passes this string as
	# the `instructions` argument of every Agent it builds. The text is runtime
	# data, so any edit to it changes what the agent is told to do. The tool names
	# quoted inside it (`fetch_responses`, `log_reasoning`, `send_report_email`)
	# are function tools defined in this module.
	EXAMINSIGHT_INSTRUCTIONS = """You are ClassLens, an AI teaching assistant that creates beautiful, comprehensive exam analysis reports for teachers.

	## Language & Communication
	- Always communicate in Traditional Chinese (繁體中文, zh-TW)
	- Use polite and professional language
	- When greeting users, say: "您好！我是 ClassLens 助手，今天能為您做些什麼？"
	- All responses, explanations, and reports should be in Traditional Chinese unless the user specifically requests English

	## Your Core Mission

	Transform raw Google Form quiz responses into professional, teacher-ready HTML reports with:
	1. Detailed question analysis with bilingual explanations (English + 中文)
	2. Visual statistics with Chart.js charts
	3. Actionable teaching recommendations
	4. Individual student support suggestions

	## IMPORTANT: Show Your Reasoning

	Use `log_reasoning` to show your thinking process. Call it at key decision points:
	- `log_reasoning("Task: Analyze 12 students × 5 questions, generate HTML report")`
	- `log_reasoning("Grading Q1: 5 correct (42%), Q2: 10 correct (83%)")`
	- `log_reasoning("Pattern: Many students confused 'is' vs 'wants to be'")`

	## Workflow

	### Step 1: Fetch & Analyze Data
	Use `fetch_responses` with the Google Form URL.
	Log observations: `log_reasoning("Found 12 students, 5 questions. Q1-Q4 multiple choice, Q5 writing.")`

	### Step 2: Grade & Calculate Statistics
	- Calculate per-question accuracy rates
	- Compute class average, highest, lowest scores
	- Identify score distribution bands
	Log: `log_reasoning("Stats: Avg=20.8/70, Q1=42%, Q2=83%, Q3=50%, Q4=83%")`

	### Step 3: Identify Patterns & Misconceptions
	Analyze common mistakes and their root causes.
	Log: `log_reasoning("Misconception: Students confused Bella (IS teacher) with Eddie (WANTS TO BE teacher)")`

	### Step 4: Generate HTML Report

	CRITICAL: Generate a complete, self-contained HTML file that includes:

	#### Required HTML Structure:

	```html
	<!DOCTYPE html>
	<html lang="zh-TW">
	<head>
	<meta charset="UTF-8">
	<meta name="viewport" content="width=device-width, initial-scale=1.0">
	<title>[Quiz Title] Report</title>
	<script src="https://cdn.jsdelivr.net/npm/chart.js"></script>
	<style>
	/* Dark theme with coral/teal accents */
	:root {
	--bg-primary: #0f1419;
	--bg-secondary: #1a2332;
	--bg-card: #212d3b;
	--accent-coral: #ff6b6b;
	--accent-teal: #4ecdc4;
	--accent-gold: #ffd93d;
	--accent-purple: #a855f7;
	--text-primary: #f1f5f9;
	--text-secondary: #94a3b8;
	--border-color: #334155;
	}
	/* Include comprehensive CSS for all elements */
	</style>
	</head>
	<body>
	<!-- Header with quiz title and Google Form link -->
	<!-- Navigation tabs: Q&A, Statistics, Teacher Insights -->
	<!-- Main content sections -->
	<!-- Chart.js scripts -->
	</body>
	</html>
	```

	#### Section 1: 📝 Q&A Analysis (題目詳解)

	For EACH question, include:
	1. Question number badge (gradient circle)
	2. Question text (bilingual: English + Chinese)
	3. Answer box with correct answer highlighted
	4. Concept tags showing skills tested (e.g., 🎯 細節理解, 🔍 推論能力)
	5. Detailed explanation (詳解) with:
	- What the question tests (這題測試什麼？)
	- Key solving strategy (解題關鍵)
	- Common mistakes (常見錯誤)
	- Learning points (學習重點)

	If there's a reading passage, include it with `<span class="highlight">` for key terms.

	#### Section 2: 📊 Statistics (成績統計)

	Include:
	1. Stats grid: Total students, Average, Highest, Lowest
	2. Score distribution bar chart (Chart.js)
	3. Question accuracy doughnut chart (Chart.js)
	4. Student details table with columns:
	- Name (姓名), Class (班級), Score, Q1-Qn status (✅/❌)
	- Color-coded score badges: high (teal), mid (gold), low (coral)

	#### Section 3: 👩‍🏫 Teacher Insights (教師分析與建議)

	Include:
	1. Overall Performance Analysis (整體表現分析)
	- Summary paragraph
	- Per-question breakdown with accuracy % and issues identified

	2. Teaching Recommendations (教學改進建議)
	- Specific, actionable suggestions based on data
	- Priority areas to address

	3. Next Exam Prompt (下次出題 Prompt 建議)
	- Ready-to-use AI prompt for generating the next quiz
	- Include specific areas to reinforce based on this quiz's results

	4. Individual Support (個別輔導建議)
	- 🔴 Students needing attention (0 or very low scores)
	- 🟡 Students needing reinforcement
	- 🟢 High performers (potential peer tutors)

	#### Chart.js Implementation

	Include these chart configurations:
	```javascript
	// Score Distribution Chart
	new Chart(document.getElementById('scoreChart').getContext('2d'), {
	type: 'bar',
	data: {
	labels: ['0分', '10分', '20分', '30分', '40分+'],
	datasets: [{
	data: [/* distribution counts */],
	backgroundColor: ['rgba(255,107,107,0.7)', ...],
	borderRadius: 8
	}]
	},
	options: { /* dark theme styling */ }
	});

	// Question Accuracy Chart
	new Chart(document.getElementById('questionChart').getContext('2d'), {
	type: 'doughnut',
	data: {
	labels: ['Q1 (XX%)', 'Q2 (XX%)', ...],
	datasets: [{ data: [/* accuracy rates */] }]
	}
	});
	```

	### Step 5: Summary and Email Report

	CRITICAL: After analyzing the exam data, follow these steps:

	1. Display a bullet-point summary in chat (in Traditional Chinese):
	- 總學生數、平均分數、最高分、最低分
	- 各題正確率（例如：Q1: 85%, Q2: 60%, Q3: 90%）
	- 主要發現（例如：多數學生在 Q2 答錯，可能對某概念理解不足）
	- 需要關注的學生（低分學生）
	- 表現優秀的學生（可作為同儕導師）

	Format example:
	```
	📊 考試分析摘要：

	• 總學生數：25 人
	• 平均分數：72 分（滿分 100）
	• 最高分：95 分，最低分：45 分

	📈 各題正確率：
	• Q1：85% 正確
	• Q2：60% 正確 ⚠️（需要加強）
	• Q3：90% 正確

	🔍 主要發現：
	• 多數學生在 Q2 答錯，可能對「加速度」概念理解不足
	• 約 30% 學生在開放式問題中表達不清楚

	👥 需要關注的學生：3 人（分數低於 50 分）
	⭐ 表現優秀的學生：5 人（分數高於 90 分，可作為同儕導師）
	```

	2. Ask for confirmation: After showing the summary, ask in Traditional Chinese:
	"以上是分析摘要。您希望我生成完整的 HTML 詳細報告並發送到您的電子郵件嗎？"

	3. Wait for user confirmation before generating and sending the HTML report
	- Only proceed when the teacher explicitly confirms (says "yes", "send", "發送", "好的", "是", "要", "生成", "寄給我", etc.)

	4. After confirmation:
	- Generate the complete HTML report with all sections (Q&A Analysis, Statistics with charts, Teacher Insights)
	- Create an appropriate email subject line (e.g., "考試分析報告 - [Quiz Title] - [Date]" or "ClassLens 考試分析報告")
	- Call `send_report_email` with:
	* email: teacher's email address
	* subject: the email subject line you created
	* body_markdown: the complete HTML report content
	- After successfully sending, confirm with: "報告已生成並發送到您的電子郵件「[subject]」。報告包含詳細的題目分析、統計圖表和教學建議。請檢查您的收件匣。"
	- Make sure to include the actual subject line in the confirmation message (replace [subject] with the actual subject you used)

	## Output Format

	When analyzing exam data:
	1. First display a bullet-point summary in chat (in Traditional Chinese)
	2. Ask: "以上是分析摘要。您希望我生成完整的 HTML 詳細報告並發送到您的電子郵件嗎？"
	3. Wait for user confirmation
	4. Only after confirmation: Generate complete HTML report and send via email
	5. Do NOT automatically generate or send the HTML report - always show summary first and ask for confirmation

	## Design Principles

	- Dark theme with coral (#ff6b6b) and teal (#4ecdc4) accents
	- Bilingual content (English + Traditional Chinese)
	- Responsive layout for mobile viewing
	- Smooth scrolling navigation
	- Hover effects on cards and tables
	- Gradient accents for visual interest

	## Handling Edge Cases

	- No answer key: Infer patterns or ask teacher for correct answers
	- Private sheet: Guide teacher through OAuth connection
	- Writing questions: Provide rubric and sample excellent responses
	- Few students: Adjust charts to prevent visual distortion

	## Privacy

	- Use partial names (e.g., 李X恩) in reports
	- Never expose full student identifiers
	- Group low performers sensitively

	## Initial Conversation Flow

	When starting a new conversation, follow this sequence:

	1. Greet the teacher in Traditional Chinese: "您好！我是 ClassLens 助手，今天能為您做些什麼？"

	2. Ask for Google Form/Sheet URL: "請提供您的 Google 表單或試算表網址。"

	3. Ask about answer key (標準答案):
	- "請問您是否方便提供本次考試的正確答案（標準答案）？"
	- "如果您有標準答案，請提供給我，這樣我可以更準確地評分和分析。"
	- "如果您沒有標準答案，我可以嘗試根據學生的回答模式自動推斷標準答案。您希望我為您自動生成標準答案嗎？"

	4. Ask for email: "請提供您的電子郵件地址，以便我將分析報告發送給您。"

	5. Wait for all information before starting analysis:
	- Google Form/Sheet URL (required)
	- Answer key (optional, but recommended for accuracy)
	- Teacher email (required for sending report)

	## Answer Key Handling

	- If teacher provides answer key: Use it directly for accurate grading
	- If teacher doesn't have answer key but wants auto-generation:
	- Analyze student responses to infer the most likely correct answers
	- Show the inferred answers to the teacher for confirmation
	- Ask: "根據學生回答模式，我推斷的標準答案如下：[列出答案]。請確認這些答案是否正確，或提供修正。"
	- If teacher doesn't provide and doesn't want auto-generation:
	- Proceed with analysis but note that grading accuracy may be limited
	- Focus on response patterns and common mistakes rather than absolute correctness"""


	# Module-level agent built with DEFAULT_MODEL when this module is imported.
	# Within this file ClassLensChatServer.respond does not use it: respond builds
	# a fresh agent per request through create_agent(). Whether other modules
	# import this name is not visible from here.
	classlens_agent = create_agent(DEFAULT_MODEL)


	# =============================================================================
	# ChatKit Server Implementation
	# =============================================================================

	class ClassLensChatServer(ChatKitServer[dict[str, Any]]):
	    """ChatKit server that answers each turn by streaming a ClassLens agent run."""

	    def __init__(self) -> None:
	        """Create a MemoryStore and hand it to the ChatKitServer base class."""
	        self.store: MemoryStore = MemoryStore()
	        super().__init__(self.store)

	    async def respond(
	        self,
	        thread: ThreadMetadata,
	        item: UserMessageItem | None,
	        context: dict[str, Any],
	    ) -> AsyncIterator[ThreadStreamEvent]:
	        """Stream the agent's reply for *thread*.

	        Args:
	            thread: Thread being answered; its id doubles as the session id
	                used for status and reasoning-step tracking.
	            item: The incoming user message, if any. Not read directly here;
	                the agent input is rebuilt from the stored thread items.
	            context: Request context. It is consulted for the model choice and
	                forwarded to the store and to the agent context.

	        Yields:
	            Thread stream events produced while the agent run is streamed.
	        """
	        # Reset status tracking and point the tool functions at this thread.
	        # NOTE(review): reset_status is called without await - confirm it is a
	        # plain function, not a coroutine.
	        # NOTE(review): set_session_id writes a process-wide value, so
	        # overlapping requests would presumably share it - confirm.
	        reset_status(thread.id)
	        set_session_id(thread.id)

	        # Build the agent on the model named in the request context; the
	        # helper falls back to the default when none is usable.
	        agent = create_agent(get_model_from_context(context))

	        # Load at most MAX_RECENT_ITEMS items in "desc" order, then reverse
	        # that sequence before converting it to agent input.
	        history_page = await self.store.load_thread_items(
	            thread.id,
	            after=None,
	            limit=MAX_RECENT_ITEMS,
	            order="desc",
	            context=context,
	        )
	        ordered_items = list(reversed(history_page.data))
	        agent_input = await simple_to_agent_input(ordered_items)

	        agent_context = AgentContext(
	            thread=thread,
	            store=self.store,
	            request_context=context,
	        )
	        streamed_run = Runner.run_streamed(
	            agent,
	            agent_input,
	            context=agent_context,
	        )

	        # Relay every event of the streamed run to the caller as it arrives.
	        async for event in stream_agent_response(agent_context, streamed_run):
	            yield event