Spaces:

nuojohnchen
/

review_annotation

Runtime error

App Files Files Community

review_annotation / app /tab_analytics.py

nuocuhz

Switch checklist from Checkbox to Radio (Yes/No/Unsure)

24112e5 about 2 months ago

raw

history blame contribute delete

10.7 kB

	"""tab_analytics.py — Analytics Dashboard with detailed analysis."""

	import gradio as gr
	import pandas as pd
	import plotly.express as px
	import plotly.graph_objects as go
	import tempfile
	import os
	from data_loader import DataStore
	from db import (CHECKLIST_ITEMS, DIMENSIONS, get_all_annotations_df,
	get_stats, export_csv, _int_to_radio)


	def _empty_fig(msg="No annotation data yet"):
	fig = go.Figure()
	fig.add_annotation(text=msg, xref="paper", yref="paper",
	x=0.5, y=0.5, showarrow=False, font_size=18)
	fig.update_layout(height=350, xaxis_visible=False, yaxis_visible=False)
	return fig


	def build_analytics_tab(store: DataStore):
	"""Build the Analytics Dashboard tab."""

	gr.Markdown("## Analytics Dashboard")

	refresh_btn = gr.Button("🔄 Refresh Analytics", variant="primary")

	# --- Summary Stats ---
	summary_md = gr.Markdown("Click Refresh to load analytics")

	# --- Row 1: Score distribution + Per-item check rates ---
	with gr.Row():
	score_hist = gr.Plot(label="System-2 Score Distribution")
	item_rates_plot = gr.Plot(label="Per-Item Check Rate")

	# --- Row 2: Per-conference stats ---
	with gr.Row():
	conf_count_plot = gr.Plot(label="Annotations by Conference")
	conf_score_plot = gr.Plot(label="Avg System-2 Score by Conference")

	# --- Row 3: Score change correlation + Per-dimension ---
	with gr.Row():
	correlation_plot = gr.Plot(label="Review Score Change vs System-2 Score")
	dimension_plot = gr.Plot(label="Per-Dimension Check Rate")

	# --- Row 4: Annotation table + Export ---
	gr.Markdown("### All Annotations")
	ann_table = gr.Dataframe(
	label="Annotation Records",
	interactive=False,
	wrap=True,
	)
	with gr.Row():
	export_btn = gr.Button("📥 Export CSV", scale=1)
	export_file = gr.File(label="Download", visible=False, scale=2)

	# ========== Callbacks ==========

	def refresh_all():
	df = get_all_annotations_df()
	stats = get_stats()

	# --- Summary ---
	if stats["total"] == 0:
	summary = ("No annotations yet. Go to the Annotation tab to start.\n\n"
	f"Dataset: {len(store.reviews_all):,} papers available for annotation.")
	empty = _empty_fig()
	return (summary, empty, empty, empty, empty, empty, empty, pd.DataFrame())

	summary_lines = [
	"\| Metric \| Value \|",
	"\|--------\|-------\|",
	f"\| Total annotations \| {stats['total']} \|",
	f"\| Unique papers annotated \| {stats['unique_papers']} \|",
	f"\| Average System-2 Score \| {stats['avg_score']:.2f} / 8 \|",
	f"\| Score range \| {stats['min_score']} – {stats['max_score']} \|",
	f"\| Dataset coverage \| {stats['unique_papers']}/{len(store.reviews_all):,} "
	f"({stats['unique_papers']/max(len(store.reviews_all),1)*100:.1f}%) \|",
	]
	summary = "\n".join(summary_lines)

	# --- Score Distribution Histogram ---
	score_data = []
	for s in range(9):
	score_data.append({"score": s, "count": stats["score_dist"].get(s, 0)})
	score_df = pd.DataFrame(score_data)
	fig_hist = px.bar(
	score_df, x="score", y="count",
	title="System-2 Score Distribution",
	labels={"score": "Score (0-8)", "count": "Count"},
	color="count", color_continuous_scale="Blues",
	)
	fig_hist.update_layout(height=380, xaxis=dict(dtick=1))
	fig_hist.update_coloraxes(showscale=False)

	# --- Per-Item Check Rates ---
	item_data = []
	total = max(stats["total"], 1)
	for item_id, text in CHECKLIST_ITEMS.items():
	rate = stats.get(f"rate_{item_id}", 0) / total * 100
	dim = item_id[0]
	item_data.append({
	"item": item_id,
	"label": f"{item_id}: {text[:15]}...",
	"rate": round(rate, 1),
	"dimension": DIMENSIONS[dim],
	})
	item_df = pd.DataFrame(item_data)
	fig_items = px.bar(
	item_df, x="item", y="rate", color="dimension",
	title="Per-Checklist-Item Check Rate (%)",
	labels={"item": "Item", "rate": "Check Rate (%)"},
	hover_data=["label"],
	)
	fig_items.update_layout(height=380, yaxis=dict(range=[0, 100]))

	# --- Per-Conference Count ---
	if stats["per_conference"]:
	conf_df = pd.DataFrame(stats["per_conference"])
	# Parse conference name from full string
	conf_df["conf_short"] = conf_df["conference"].apply(
	lambda x: " ".join(str(x).split()[:2]) if pd.notna(x) else "Unknown"
	)
	# Top 20 by count
	conf_df = conf_df.nlargest(20, "count")

	fig_conf_count = px.bar(
	conf_df, x="conf_short", y="count",
	title="Annotations by Conference (Top 20)",
	labels={"conf_short": "Conference", "count": "Annotations"},
	color="count", color_continuous_scale="Viridis",
	)
	fig_conf_count.update_layout(height=380, xaxis_tickangle=-45)
	fig_conf_count.update_coloraxes(showscale=False)

	fig_conf_score = px.bar(
	conf_df, x="conf_short", y="avg_score",
	title="Avg System-2 Score by Conference",
	labels={"conf_short": "Conference", "avg_score": "Avg Score"},
	color="avg_score", color_continuous_scale="RdYlGn",
	range_color=[0, 8],
	)
	fig_conf_score.update_layout(height=380, xaxis_tickangle=-45,
	yaxis=dict(range=[0, 8]))
	fig_conf_score.update_coloraxes(showscale=False)
	else:
	fig_conf_count = _empty_fig("No conference data")
	fig_conf_score = _empty_fig("No conference data")

	# --- Score Change Correlation ---
	fig_corr = _build_correlation_plot(df, store)

	# --- Per-Dimension Check Rate ---
	dim_data = []
	for dim_key, dim_label in DIMENSIONS.items():
	k1, k2 = f"{dim_key}1", f"{dim_key}2"
	r1 = stats.get(f"rate_{k1}", 0) / total * 100
	r2 = stats.get(f"rate_{k2}", 0) / total * 100
	avg_rate = (r1 + r2) / 2
	dim_data.append({"dimension": dim_label, "avg_rate": round(avg_rate, 1)})
	dim_df = pd.DataFrame(dim_data)
	fig_dim = px.bar(
	dim_df, x="dimension", y="avg_rate",
	title="Average Check Rate by Dimension (%)",
	labels={"dimension": "Dimension", "avg_rate": "Avg Check Rate (%)"},
	color="avg_rate", color_continuous_scale="Sunset",
	range_color=[0, 100],
	)
	fig_dim.update_layout(height=380, yaxis=dict(range=[0, 100]))
	fig_dim.update_coloraxes(showscale=False)

	# --- Annotation Table ---
	display_cols = ["paper_id", "reviewer_id", "conference",
	"A1", "A2", "B1", "B2", "C1", "C2", "D1", "D2",
	"score", "notes", "updated_at"]
	table_df = df[display_cols] if not df.empty else pd.DataFrame()
	# Convert integer codes to readable labels in table
	if not table_df.empty:
	for col in ["A1", "A2", "B1", "B2", "C1", "C2", "D1", "D2"]:
	table_df[col] = table_df[col].apply(_int_to_radio)

	return (summary, fig_hist, fig_items, fig_conf_count, fig_conf_score,
	fig_corr, fig_dim, table_df)

	def _build_correlation_plot(df, store):
	"""Scatter plot: review score change vs System-2 annotation score."""
	if df.empty:
	return _empty_fig("No data for correlation")

	points = []
	for _, row in df.iterrows():
	pid = row["paper_id"]
	rid = row["reviewer_id"]
	paper = store.review_by_paper_id.get(pid)
	if not paper:
	continue

	review_obj = None
	for r in paper["reviews"]:
	if r["reviewer_id"] == rid:
	review_obj = r
	break
	if not review_obj:
	continue

	try:
	init_r = int(str(review_obj.get("initial_score_unified", {})
	.get("rating", "")).split()[0])
	final_r = int(str(review_obj.get("final_score_unified", {})
	.get("rating", "")).split()[0])
	change = final_r - init_r
	except (ValueError, IndexError, AttributeError):
	continue

	points.append({
	"score_change": change,
	"system2_score": row["score"],
	"paper_id": pid,
	"reviewer_id": rid,
	})

	if not points:
	return _empty_fig("No matching review data")

	pts_df = pd.DataFrame(points)
	fig = px.scatter(
	pts_df, x="system2_score", y="score_change",
	title="Review Score Change vs System-2 Score",
	labels={"system2_score": "System-2 Score (0-8)",
	"score_change": "Review Score Change"},
	hover_data=["paper_id", "reviewer_id"],
	opacity=0.6,
	)
	# Add trend line
	if len(pts_df) > 2:
	fig.update_traces(marker=dict(size=8))
	fig = px.scatter(
	pts_df, x="system2_score", y="score_change",
	title="Review Score Change vs System-2 Score",
	labels={"system2_score": "System-2 Score (0-8)",
	"score_change": "Review Score Change"},
	hover_data=["paper_id", "reviewer_id"],
	opacity=0.6, trendline="ols",
	)
	fig.update_layout(height=380)
	return fig

	def do_export():
	csv_str = export_csv()
	if not csv_str:
	return gr.update(visible=False)
	tmp = tempfile.NamedTemporaryFile(
	mode="w", suffix=".csv", prefix="annotations_",
	delete=False, dir=tempfile.gettempdir(),
	)
	tmp.write(csv_str)
	tmp.close()
	return gr.update(value=tmp.name, visible=True)

	# ========== Wire Events ==========

	refresh_btn.click(
	fn=refresh_all,
	outputs=[summary_md, score_hist, item_rates_plot,
	conf_count_plot, conf_score_plot,
	correlation_plot, dimension_plot, ann_table],
	)

	export_btn.click(fn=do_export, outputs=[export_file])