Spaces:

banao-tech
/

intern-updates

Paused

App Files Files Community

intern-updates / app.py

banao-tech

Update app.py

f135dbb verified 14 days ago

raw

history blame contribute delete

21.1 kB

	"""
	AI Vidya — Daily Report Evaluation Agent
	=========================================
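	Reads #ai-vidya on Slack, checks which registered interns posted an EOD report
	today (IST), evaluates report quality with Claude, and posts a summary plus
	missed-report @mentions back to #ai-vidya. (ALERT_CHANNEL_ID for #intern-updates
	is configured, but run_evaluation currently posts to REPORT_CHANNEL_ID only.)

	Deploy on HuggingFace Spaces (Gradio SDK) — runs as a persistent web app.
	Trigger manually via the UI, or on a schedule by having an external cron job
	call the hidden "trigger" API endpoint.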
	"""

	import os
	import json
	import time
	import datetime
	from zoneinfo import ZoneInfo

	import anthropic
	import gradio as gr
	from slack_sdk import WebClient
	from slack_sdk.errors import SlackApiError

	# ─── CONFIG ───────────────────────────────────────────────────────────────────
	# Both values below are Slack channel IDs (not channel names); the trailing
	# comment on each line gives the human-readable channel it refers to.
	REPORT_CHANNEL_ID = "C08L1CFEF40" # #ai-vidya
	ALERT_CHANNEL_ID = "C0B2L4FTW4E" # #intern-updates
	# All "today" calculations in this file are done in Indian Standard Time.
	IST = ZoneInfo("Asia/Kolkata")
	# NOTE(review): not referenced by the code visible in this file — the
	# "11:00 PM IST" deadline text in the Slack messages is hard-coded separately.
	DEADLINE_HOUR = 23 # 11 PM IST

	# Intern registry — add/remove interns here
	# Format: { "slack_user_id": "Full Name" }
	# Only users listed here are reported on; other posters are ignored unless
	# the registry is empty.
	INTERN_REGISTRY = {
	    "U084C0HQLKS": "Khushi Mishra",
	    "U0AFNM2H88G": "Roshesh Shah",
	    "U0AEQV8F7LM": "Rishikesh Brahma",
	    "U0AEN15QY0K": "Vishwajeet Jadhav",
	}

	# ─── CLIENTS (lazy-init from env) ─────────────────────────────────────────────
	def get_slack():
	    """Build a Slack WebClient from the SLACK_BOT_TOKEN environment secret.

	    Raises:
	        ValueError: if the variable is unset or empty.
	    """
	    bot_token = os.environ.get("SLACK_BOT_TOKEN")
	    if bot_token:
	        return WebClient(token=bot_token)
	    raise ValueError("SLACK_BOT_TOKEN not set in environment secrets.")

	def get_anthropic():
	    """Build an Anthropic client from the ANTHROPIC_API_KEY environment secret.

	    Raises:
	        ValueError: if the variable is unset or empty.
	    """
	    api_key = os.environ.get("ANTHROPIC_API_KEY")
	    if api_key:
	        return anthropic.Anthropic(api_key=api_key)
	    raise ValueError("ANTHROPIC_API_KEY not set in environment secrets.")


	# ─── STEP 1: FETCH TODAY'S MESSAGES ───────────────────────────────────────────
	def fetch_todays_messages(slack: WebClient, log: list) -> list:
	    """Collect today's (IST) human-authored messages from the report channel.

	    Pages through conversations.history starting at IST midnight and drops
	    every message that carries a ``bot_id`` or a ``subtype``. Progress lines
	    are appended to ``log``.
	    """
	    midnight_ist = datetime.datetime.now(IST).replace(hour=0, minute=0, second=0, microsecond=0)

	    log.append(f"📥 Fetching messages from #ai-vidya since {midnight_ist.strftime('%d %b %Y %I:%M %p IST')}...")

	    # One request dict is reused across pages; only the cursor changes.
	    request = {
	        "channel": REPORT_CHANNEL_ID,
	        "oldest": str(midnight_ist.timestamp()),
	        "limit": 200,
	    }
	    human_messages = []
	    while True:
	        page = slack.conversations_history(**request)
	        for item in page.get("messages", []):
	            if item.get("bot_id") or item.get("subtype"):
	                continue
	            human_messages.append(item)

	        # Truthy only when Slack reports more data AND supplies a cursor.
	        following = page.get("has_more") and page.get("response_metadata", {}).get("next_cursor")
	        if not following:
	            break
	        request["cursor"] = following

	    log.append(f" → Found {len(human_messages)} human messages today.")
	    return human_messages


	# ─── STEP 2B: CHECK LEAVE STATUS VIA SLACK PROFILE ──────────────────────────
	def is_on_leave_today(name: str, full_status: str, claude_client) -> bool:
	    """Ask Claude whether a Slack status string means the intern is on leave today.

	    Returns False without calling the model when the status is empty or
	    whitespace, and also False when the model call fails for any reason
	    (best-effort: an unreadable status is treated as "not on leave").
	    ``name`` is accepted for call-site symmetry but is not used in the prompt.
	    """
	    if not (full_status and full_status.strip()):
	        return False

	    today = datetime.datetime.now(IST).strftime("%d-%m-%Y")

	    question = f"""Today is {today}.

	Intern Slack status: "{full_status}"

	Is this intern on leave TODAY?
	Consider: date ranges, "on leave", "off", "absent", :red_circle: emoji, away messages.
	Reply ONLY with "yes" or "no"."""

	    try:
	        reply = claude_client.messages.create(
	            model="claude-sonnet-4-20250514",
	            max_tokens=5,
	            messages=[{"role": "user", "content": question}]
	        )
	        verdict = reply.content[0].text.strip().lower()
	        return verdict.startswith("yes")
	    except Exception:
	        return False


	def get_interns_on_leave(slack: WebClient, claude_client, interns: list, log: list) -> set:
	    """Return the set of user IDs whose Slack status indicates leave today.

	    For each ``{"userId", "name"}`` entry the status is read from users.info,
	    falling back to users.profile.get when that yields nothing, and then
	    interpreted by ``is_on_leave_today``. Any failure for one intern is logged
	    and that intern is simply not added to the set.
	    """
	    def _status_of(profile):
	        # Combine emoji and text the same way for both API responses.
	        text = profile.get("status_text", "")
	        emoji = profile.get("status_emoji", "")
	        return f"{emoji} {text}".strip()

	    absent = set()
	    date_label = datetime.datetime.now(IST).strftime("%d %b %Y")
	    log.append(f" Checking leave status for {date_label}...")

	    for person in interns:
	        try:
	            # Primary source: users.info
	            info = slack.users_info(user=person["userId"])
	            status = _status_of(info.get("user", {}).get("profile", {}))

	            # Secondary source when the first lookup shows no status
	            if not status:
	                fallback = slack.users_profile_get(user=person["userId"])
	                status = _status_of(fallback.get("profile", {}))

	            log.append(f" {person['name']} status: '{status}'")

	            if not status:
	                log.append(f" {person['name']} — no status set, treating as active")
	                continue

	            if is_on_leave_today(person["name"], status, claude_client):
	                absent.add(person["userId"])
	                log.append(f" {person['name']} — MARKED ON LEAVE")
	            else:
	                log.append(f" {person['name']} — active")
	        except Exception as e:
	            log.append(f" Could not check {person['name']}: {e}")

	    return absent


	# ─── STEP 2: MATCH MESSAGES TO INTERNS ────────────────────────────────────────
	def match_reports(messages: list, log: list, on_leave: set = None, registry: dict = None) -> dict:
	    """Match today's channel messages against the intern registry.

	    Args:
	        messages: Slack message dicts; only the "user" and "text" keys are read.
	            The first message seen for each user is the one kept.
	        log: list that human-readable progress lines are appended to.
	        on_leave: user IDs to mark as on leave (optional).
	        registry: ``{slack_user_id: full_name}`` mapping to check. Defaults to
	            the module-level INTERN_REGISTRY when omitted.

	    Returns:
	        Dict keyed by user_id:
	        {
	            "U123": {
	                "name": "Priya Sharma",
	                "submitted": True/False,
	                "message": "..." or None,
	                "on_leave": True/False,
	            }
	        }
	        Interns on leave are recorded with submitted=True and message=None so
	        they are never counted as missed. When the registry is empty, every
	        poster is returned instead, named by their user ID.
	    """
	    # First message per user wins.
	    posted_today = {}
	    for msg in messages:
	        uid = msg.get("user")
	        if uid and uid not in posted_today:
	            posted_today[uid] = msg.get("text", "")

	    if registry is None:
	        registry = INTERN_REGISTRY

	    if not registry:
	        # Auto-detect from today's posters if registry is empty (fallback)
	        log.append("⚠️ INTERN_REGISTRY is empty — showing all posters instead.")
	        return {
	            uid: {
	                "name": uid,
	                "submitted": True,
	                "message": text,
	                # Same row shape as the registry path below.
	                "on_leave": False,
	            }
	            for uid, text in posted_today.items()
	        }

	    on_leave = on_leave or set()
	    results = {}
	    for uid, name in registry.items():
	        if uid in on_leave:
	            results[uid] = {
	                "name": name,
	                "submitted": True,
	                "message": None,
	                "on_leave": True,
	            }
	            log.append(f" {name} — on leave (skipped)")
	        elif uid in posted_today:
	            results[uid] = {
	                "name": name,
	                "submitted": True,
	                "message": posted_today[uid],
	                "on_leave": False,
	            }
	            log.append(f" {name} — submitted")
	        else:
	            results[uid] = {
	                "name": name,
	                "submitted": False,
	                "message": None,
	                "on_leave": False,
	            }
	            log.append(f" {name} — MISSED")

	    return results


	# ─── STEP 3: EVALUATE REPORT QUALITY WITH CLAUDE ─────────────────────────────
	# System prompt for the report grader. It asks for a bare JSON object with
	# "quality", "score", "reason" and "flags".
	# The alternatives in the "quality" line are separated by a plain "|": the
	# previous "\|" was an invalid escape sequence in a normal string literal and
	# put literal backslashes into the prompt.
	EVAL_SYSTEM = """You evaluate daily EOD reports from AI developer interns.
	A valid report must contain ALL three:
	1. What they actually worked on — specific and technical
	2. What they got stuck on — an honest blocker, not vague
	3. What they tried to resolve it

	Return ONLY a JSON object (no markdown, no preamble):
	{
	"quality": "good" | "weak" | "invalid",
	"score": 1-10,
	"reason": "one sentence max",
	"flags": []
	}

	Quality:
	- "good" → specific technical content, real blocker, shows thinking (score 7-10)
	- "weak" → too vague, missing blocker, just a status update (score 4-6)
	- "invalid" → one liner, no content, "done", "working on it", link only (score 1-3)

	Flags (add any that apply):
	"no_blocker", "vague_progress", "no_technical_detail", "link_only", "too_short"
	"""

	def evaluate_report(client: "anthropic.Anthropic", name: str, text: str, log: list) -> dict:
	    """Grade one EOD report with Claude and return a normalised evaluation.

	    Args:
	        client: Anthropic client used for the messages.create call.
	        name: intern's display name (included in the prompt and in log lines).
	        text: raw report text; anything under 20 non-blank characters is
	            rejected locally without calling the model.
	        log: list that a warning line is appended to when evaluation fails.

	    Returns:
	        A dict that always contains "quality" ("good" | "weak" | "invalid"),
	        "score" (int, clamped to 1-10), "reason" (str) and "flags" (list of
	        str), so callers can index those keys directly. Any API, parsing or
	        validation failure yields the fixed "Evaluation error." fallback
	        instead of raising.
	    """
	    if not text or len(text.strip()) < 20:
	        return {"quality": "invalid", "score": 1, "reason": "Report is empty or too short.", "flags": ["too_short"]}

	    try:
	        response = client.messages.create(
	            model="claude-sonnet-4-20250514",
	            max_tokens=300,
	            system=EVAL_SYSTEM,
	            messages=[{"role": "user", "content": f"Intern: {name}\n\nReport:\n{text}"}],
	        )
	        raw = response.content[0].text
	        # Take the outermost {...} so code fences or stray prose around the
	        # JSON do not break parsing.
	        start, end = raw.find("{"), raw.rfind("}")
	        if start == -1 or end < start:
	            raise ValueError("no JSON object in model reply")
	        parsed = json.loads(raw[start:end + 1])
	        if not isinstance(parsed, dict):
	            raise ValueError("model reply is not a JSON object")
	        quality = parsed.get("quality")
	        if quality not in ("good", "weak", "invalid"):
	            raise ValueError(f"unexpected quality {quality!r}")
	        # A missing or non-numeric score raises here and falls through to the
	        # fallback below.
	        score = max(1, min(10, int(parsed["score"])))
	    except Exception as e:
	        log.append(f" ⚠️ Claude eval failed for {name}: {e}")
	        return {"quality": "weak", "score": 3, "reason": "Evaluation error.", "flags": []}

	    flags = parsed.get("flags")
	    if not isinstance(flags, list):
	        flags = []
	    return {
	        **parsed,
	        "quality": quality,
	        "score": score,
	        "reason": str(parsed.get("reason") or ""),
	        "flags": [str(flag) for flag in flags],
	    }


	# ─── STEP 4: GET OR CREATE ALERT CHANNEL ─────────────────────────────────────
	def get_alert_channel_id(slack: WebClient, log: list) -> "str | None":
	    """Look up the alert channel among the channels the bot can see.

	    Pages through conversations.list (public and private channels) and
	    returns the ID of the first channel whose ID or name equals
	    ALERT_CHANNEL_ID. The constant holds a channel ID, so comparing it with
	    channel names alone (as this function used to) could never match; names
	    are still accepted in case the constant is set to one.

	    Returns:
	        The channel ID, or None when no visible channel matches. In that
	        case the visible channel names and an invite hint are logged.
	    """
	    wanted = ALERT_CHANNEL_ID.lstrip("#")
	    visible_names = []
	    cursor = None
	    while True:
	        kwargs = {"types": "public_channel,private_channel", "limit": 200}
	        if cursor:
	            kwargs["cursor"] = cursor
	        resp = slack.conversations_list(**kwargs)
	        for ch in resp.get("channels", []):
	            visible_names.append(ch["name"])
	            if wanted in (ch["id"], ch["name"]):
	                log.append(f" Found #{ch['name']} (ID: {ch['id']})")
	                return ch["id"]
	        # An empty or missing cursor means this was the last page.
	        cursor = resp.get("response_metadata", {}).get("next_cursor")
	        if not cursor:
	            break
	    log.append(f"Channel #{ALERT_CHANNEL_ID} not found. Bot can see: {visible_names}")
	    log.append(" Run in #intern-updates: /invite @intern-eod")
	    return None


	# ─── STEP 5: BUILD SLACK MESSAGE ──────────────────────────────────────────────
	def build_slack_message(results: dict, evals: dict, run_time: str) -> str:
	    """Render the daily summary as one Slack message string.

	    ``results`` is the per-intern status dict and ``evals`` the per-intern
	    evaluation dict, both keyed by user ID. Interns on leave are listed in
	    their own section and excluded from the submitted/missed counts.
	    ``run_time`` is accepted but does not appear in the output.
	    """
	    # Split the roster into active interns and those on leave.
	    active = {}
	    away = []
	    for uid, row in results.items():
	        if row.get("on_leave"):
	            away.append(row)
	        else:
	            active[uid] = row

	    received = [(uid, row) for uid, row in active.items() if row["submitted"]]
	    missed = [row for row in active.values() if not row["submitted"]]

	    def tally(label):
	        # Number of received reports graded with the given quality.
	        return sum(1 for uid, _ in received if evals.get(uid, {}).get("quality") == label)

	    good_n, weak_n, invalid_n = tally("good"), tally("weak"), tally("invalid")

	    total = len(results)
	    active_count = len(active)
	    date_str = datetime.datetime.now(IST).strftime("%d %b %Y")
	    rule = "─" * 32
	    icons = {"good": ":large_green_circle:", "weak": ":large_yellow_circle:", "invalid": ":red_circle:"}

	    out = [
	        "<!channel>",
	        f"Daily Report Check — {date_str}",
	        rule,
	        f":busts_in_silhouette: {active_count} active · :spiral_calendar_pad: Deadline 11:00 PM IST",
	        "",
	    ]

	    # Submitted
	    if received:
	        out.append(f":notepad_spiral: Reports Received — {len(received)}/{active_count}")
	        for uid, row in received:
	            ev = evals.get(uid, {})
	            quality = ev.get("quality", "?")
	            score = ev.get("score", "?")
	            icon = icons.get(quality, ":white_circle:")
	            flags = ev.get("flags", [])
	            entry = f" {icon} {row['name']} · {score}/10 · {ev.get('reason', '')}"
	            if flags:
	                entry = entry + "\n _flags: " + ", ".join(flags) + "_"
	            out.append(entry)
	        out.append("")

	    # Missed
	    if missed:
	        out.append(f":x: No Report — {len(missed)}/{active_count}")
	        out.extend(f" :red_circle: {row['name']}" for row in missed)
	        out.append("")

	    # On Leave
	    if away:
	        out.append(f":palm_tree: On Leave — {len(away)}/{total}")
	        out.extend(f" :white_circle: {row['name']}" for row in away)
	        out.append("")

	    # Footer
	    out.append(rule)
	    out.append(f":large_green_circle: {good_n} :large_yellow_circle: {weak_n} :red_circle: {invalid_n} :x: {len(missed)} :palm_tree: {len(away)}")

	    return "\n".join(out)


	# ─── STEP 6: SEND MISSED ALERTS ───────────────────────────────────────────────
	def send_missed_alerts(slack: WebClient, alert_channel_id: str, results: dict, log: list):
	    """Post one @mention reminder per intern who has not submitted and is not on leave.

	    Messages go to ``alert_channel_id``. A Slack API error for one intern is
	    logged and does not stop the remaining alerts.
	    """
	    for uid, row in results.items():
	        needs_alert = not row["submitted"] and not row.get("on_leave")
	        if not needs_alert:
	            continue

	        reminder = "".join([
	            f"<@{uid}> Your EOD report for today has not been received.\n\n",
	            "Reports are expected daily by 11:00 PM IST. ",
	            "If you are blocked, submit what you have worked on and state the blocker — that is a valid submission.",
	        ])
	        try:
	            slack.chat_postMessage(channel=alert_channel_id, text=reminder)
	        except SlackApiError as e:
	            log.append(f" Could not send alert for {row['name']}: {e.response['error']}")
	        else:
	            log.append(f" Alert sent for {row['name']}")


	# ─── MAIN EVALUATION RUNNER ───────────────────────────────────────────────────
	def _parse_custom_registry(custom_interns_json: str, log: list):
	    """Parse the UI-supplied registry override; return None to keep the default."""
	    if not custom_interns_json or not custom_interns_json.strip():
	        return None
	    try:
	        parsed = json.loads(custom_interns_json)
	    except json.JSONDecodeError:
	        log.append("⚠️ Invalid JSON for intern list — using default INTERN_REGISTRY.")
	        return None
	    # Valid JSON that is not a {str: str} object (a list, a number, nested
	    # values) would crash further down, so reject it here.
	    well_formed = isinstance(parsed, dict) and all(
	        isinstance(uid, str) and isinstance(name, str) for uid, name in parsed.items()
	    )
	    if not well_formed:
	        log.append("⚠️ Intern list must be a JSON object of {slack_user_id: name} — using default INTERN_REGISTRY.")
	        return None
	    log.append(f"👥 Using custom intern list: {list(parsed.values())}")
	    return parsed


	def run_evaluation(custom_interns_json: str = "") -> str:
	    """
	    Full pipeline. Returns a log string for display in Gradio.

	    Steps: fetch today's messages, check leave status, match messages to
	    interns, grade each submitted report with Claude, post the summary, then
	    post @mention alerts for missed reports.

	    custom_interns_json: optional JSON override for INTERN_REGISTRY, e.g.
	    {"U06T83LP86P": "Mann Vishnoi", "U084C0HQLKS": "Khushi Mishra"}
	    The override applies to this run only; the module-level registry is
	    restored before returning, so a later run with an empty argument uses the
	    configured default again.
	    """
	    global INTERN_REGISTRY

	    log = []
	    now_ist = datetime.datetime.now(IST)
	    run_time = now_ist.strftime("%d %b %Y %I:%M %p IST")
	    log.append(f"🚀 Evaluation started at {run_time}")
	    log.append("=" * 55)

	    # Override intern registry if provided via UI. match_reports reads the
	    # module-level name, so swap it for the duration of this run and put the
	    # original back in the finally block below.
	    # NOTE(review): the swap is not safe against two runs executing at once.
	    default_registry = INTERN_REGISTRY
	    override = _parse_custom_registry(custom_interns_json, log)
	    if override is not None:
	        INTERN_REGISTRY = override

	    try:
	        try:
	            slack_client = get_slack()
	            claude_client = get_anthropic()
	        except ValueError as e:
	            log.append(f"❌ {e}")
	            return "\n".join(log)

	        # 1. Fetch messages
	        try:
	            messages = fetch_todays_messages(slack_client, log)
	        except SlackApiError as e:
	            log.append(f"❌ Slack error: {e.response['error']}")
	            return "\n".join(log)

	        # 2. Check who is on leave via Slack status
	        log.append("\nChecking Slack status for leave...")
	        intern_list = [{"userId": uid, "name": name} for uid, name in INTERN_REGISTRY.items()]
	        on_leave = get_interns_on_leave(slack_client, claude_client, intern_list, log)
	        if not on_leave:
	            log.append(" No interns on leave today.")

	        # 3. Match to interns
	        results = match_reports(messages, log, on_leave)
	        if not results:
	            log.append("⚠️ No interns to evaluate.")
	            return "\n".join(log)

	        # 4. Evaluate quality with Claude
	        log.append("\n🤖 Evaluating report quality with Claude...")
	        evals = {}
	        for uid, r in results.items():
	            if r["submitted"] and not r.get("on_leave"):
	                ev = evaluate_report(claude_client, r["name"], r["message"], log)
	                evals[uid] = ev
	                # .get with the same "?" placeholders the Slack summary uses,
	                # so an incomplete evaluation dict cannot abort the run.
	                quality = ev.get("quality", "?")
	                q_icon = {"good": "🟢", "weak": "🟡", "invalid": "🔴"}.get(quality, "⚪")
	                log.append(f" {q_icon} {r['name']} → {quality} (score {ev.get('score', '?')}/10): {ev.get('reason', '')}")

	        # 5. Alert channel is hardcoded - no API call needed
	        # NOTE(review): this line announces #intern-updates, but both posts
	        # below go to REPORT_CHANNEL_ID (#ai-vidya). Confirm which is intended.
	        log.append(f" Using #intern-updates ({ALERT_CHANNEL_ID})")

	        # 6. Build and post full message to #ai-vidya only
	        summary_msg = build_slack_message(results, evals, run_time)
	        try:
	            slack_client.chat_postMessage(channel=REPORT_CHANNEL_ID, text=summary_msg)
	            log.append(" Summary posted to #ai-vidya.")
	        except SlackApiError as e:
	            log.append(f" Could not post to #ai-vidya: {e.response['error']}")

	        # 7. Send @mention alerts to #ai-vidya
	        missed_count = sum(1 for r in results.values() if not r["submitted"] and not r.get("on_leave"))
	        if missed_count:
	            log.append(f"\nSending {missed_count} missed report alert(s) to #ai-vidya...")
	            send_missed_alerts(slack_client, REPORT_CHANNEL_ID, results, log)
	        else:
	            log.append("\nAll interns submitted — no missed alerts needed.")

	        log.append("\n" + "=" * 55)
	        log.append("✅ Evaluation complete.")
	        return "\n".join(log)
	    finally:
	        # Runs on every exit path, including the early returns above.
	        INTERN_REGISTRY = default_registry


	# ─── GRADIO UI ────────────────────────────────────────────────────────────────
	# Sample registry JSON used as the initial value of the intern-list textbox.
	# NOTE(review): this sample differs from INTERN_REGISTRY, and run_evaluation
	# treats any non-empty textbox content as an override — so pressing Run with
	# the untouched default evaluates this list, not the configured registry.
	# Confirm that is intended.
	INTERN_REGISTRY_EXAMPLE = json.dumps({
	    "U06T83LP86P": "Mann Vishnoi",
	    "U084C0HQLKS": "Khushi Mishra",
	    "U0AFNM2H88G": "Roshesh Shah",
	}, indent=2)

	# Page layout: intro text, then a two-column row (registry input + run button
	# on the left, read-only log on the right), then scheduling notes.
	with gr.Blocks(title="AI Vidya — Daily Report Agent", theme=gr.themes.Soft()) as demo:
	    # NOTE(review): the intro says results go to #intern-updates, while
	    # run_evaluation posts to REPORT_CHANNEL_ID (#ai-vidya).
	    gr.Markdown("""
	# 📋 AI Vidya — Daily Report Evaluation Agent
	Reads #ai-vidya, checks who submitted their EOD report today,
	evaluates quality with Claude, and posts results to #intern-updates.

	---
	Before running: Add `SLACK_BOT_TOKEN` and `ANTHROPIC_API_KEY` in
	Settings → Secrets of this HuggingFace Space.
	""")

	    with gr.Row():
	        # Left column: registry override and the manual trigger.
	        with gr.Column(scale=1):
	            gr.Markdown("### 👥 Intern Registry")
	            intern_input = gr.Textbox(
	                label="Intern list (JSON: {slack_user_id: name})",
	                value=INTERN_REGISTRY_EXAMPLE,
	                lines=10,
	                placeholder='{"U06T83LP86P": "Mann Vishnoi"}',
	                info="Get Slack user IDs from: Slack profile → ⋮ menu → Copy member ID"
	            )
	            run_btn = gr.Button("▶️ Run Evaluation Now", variant="primary", size="lg")

	        # Right column: the log string returned by run_evaluation.
	        with gr.Column(scale=2):
	            gr.Markdown("### 📄 Evaluation Log")
	            output = gr.Textbox(
	                label="",
	                lines=28,
	                interactive=False,
	                show_copy_button=True,
	            )

	    # NOTE(review): the workflow example below posts an empty JSON body to
	    # /run/predict, whereas the hidden cron button further down in this file
	    # is registered with api_name="trigger". Confirm the endpoint path and
	    # payload for the Gradio version in use.
	    gr.Markdown("""
	---
	### 🕐 Auto-scheduling on HuggingFace
	HuggingFace Spaces don't have built-in cron. Two options:

	Option A — GitHub Actions (recommended, free)
	Create `.github/workflows/trigger.yml` in your HF Space repo:
	```yaml
	on:
	schedule:
	- cron: '30 17 * * *' # 11:00 PM IST = 17:30 UTC
	jobs:
	trigger:
	runs-on: ubuntu-latest
	steps:
	- run: curl -X POST ${{ secrets.HF_SPACE_URL }}/run/predict -H "Content-Type: application/json" -d '{}'
	```

	Option B — External cron service
	Use [cron-job.org](https://cron-job.org) (free) to POST to your Space URL daily at 11 PM IST.
	""")

	    # Manual run: the textbox content is passed as custom_interns_json.
	    run_btn.click(fn=run_evaluation, inputs=[intern_input], outputs=[output])

	# ─── CRON TRIGGER — runs evaluation synchronously and returns result ──────────
	import threading

	def trigger_evaluation():
	    """Handler for the hidden cron endpoint.

	    Runs the whole evaluation synchronously with no registry override and
	    returns the resulting log text.
	    """
	    evaluation_log = run_evaluation(custom_interns_json="")
	    return evaluation_log

	# Expose as a hidden Gradio endpoint so cron can call it
	# Re-entering the existing Blocks context adds two invisible components: a
	# button whose click event carries api_name="trigger", and a textbox that
	# receives the log string returned by trigger_evaluation.
	with demo:
	    cron_output = gr.Textbox(visible=False, label="cron_result")
	    cron_btn = gr.Button(visible=False, elem_id="cron_trigger")
	    cron_btn.click(fn=trigger_evaluation, inputs=[], outputs=[cron_output],
	                   api_name="trigger")

	# Start the web app only when this file is executed directly.
	if __name__ == "__main__":
	    demo.launch()