Spaces:

kendrickfff
/

kentechtranslator

Sleeping

App Files Files Community

kentechtranslator / app.py

kendrickfff

Update app.py

9702f1d verified about 2 months ago

raw

history blame contribute delete

20.9 kB

	"""
	Ken's Tech Translator — Production Backend
	Secrets stay server-side. Prompt behavior is fully dynamic.
	Compatible with Azure OpenAI Responses API.
	Deploy target: HuggingFace Spaces (Docker)
	"""

	import os
	import logging
	import httpx
	from pathlib import Path
	from fastapi import FastAPI, Request
	from fastapi.staticfiles import StaticFiles
	from fastapi.responses import FileResponse, JSONResponse

	# ── Logging ───────────────────────────────────────────────────────────────────
	logging.basicConfig(level=logging.INFO)
	logger = logging.getLogger("ken-translator")

	BASE_DIR = Path(__file__).resolve().parent
	app = FastAPI(title="Ken's Tech Translator", version="2.0.0")

	# ══════════════════════════════════════════════════════════════════════════════
	# SECRETS
	# ══════════════════════════════════════════════════════════════════════════════
	AZURE_API_KEY = os.environ.get("AZURE_API_KEY", "")

	AZURE_ENDPOINT = os.environ.get(
	"AZURE_ENDPOINT",
	"https://kendrickfilbert-9824-resource.cognitiveservices.azure.com/openai/responses?api-version=2025-04-01-preview"
	)

	MODEL_DEPLOYMENT = os.environ.get("MODEL_DEPLOYMENT", "gpt-5.3-chat-ken")

	# ══════════════════════════════════════════════════════════════════════════════
	# PROMPT LIBRARY
	# ══════════════════════════════════════════════════════════════════════════════

	BASE_SYSTEM_PROMPT = """
	You are Ken's Tech Translator — a senior technical communication engine.
	Your job is to convert raw engineering content into clear, structured updates
	tailored precisely to the audience, tone, and features specified below.

	## FEATURE CONFLICT RESOLUTION (MANDATORY)
	If Slack-Ready Format is enabled:
	- Override formatting ONLY (not content requirements)
	- Convert all required content into Slack format

	If multiple features conflict:
	Priority order:
	1. Slack Format
	2. Urgent Tone
	3. Audience rules
	4. Other features

	## CORE RULES
	- Never hallucinate or invent data not present in the source text.
	- Never ignore the AUDIENCE, TONE, or FEATURES instructions below — they are mandatory.
	- Always include the REQUIRED sections defined for the selected audience.
	- Do not omit required sections under any condition.
	- All output must be in Markdown.
	- Be concise. Eliminate filler. Every sentence must serve the reader.

	""".strip()

	AUDIENCE_PROMPTS = {
	"executive": """
	## AUDIENCE: C-Suite Executive
	Write for a time-poor executive who cares ONLY about business outcomes.
	- Lead with impact, not process.
	- Quantify risk, cost, or opportunity wherever possible.
	- Use no more than 3–4 short sections total.
	- Avoid all technical jargon. If unavoidable, define it inline in one clause.
	- REQUIRED sections: Summary (2 sentences max), Business Context, Suggested Next Steps.
	- OMIT: Technical Details, Glossary (unless a term is business-critical).
	""",
	"pm": """
	## AUDIENCE: Project Manager / Tech Lead
	Write for someone managing execution who needs scope, timelines, and owners.
	- Focus on what needs to happen, by when, and who owns it.
	- Call out blockers, dependencies, and risks explicitly.
	- REQUIRED sections: Summary, Overview, Business Context (timeline + scope focus),
	Technical Details (architectural context), Suggested Next Steps (detailed What/Who/Priority).
	""",
	"sales": """
	## AUDIENCE: Sales / Client-Facing
	Write for someone presenting value to a customer or external stakeholder.
	- Frame everything as customer benefit, competitive advantage, or risk mitigation.
	- Avoid internal jargon and infrastructure details entirely.
	- Use confident, positive framing.
	- REQUIRED sections: Summary, Overview (benefits-first), Business Context (implications + timeline),
	Suggested Next Steps (client-action focused).
	""",
	"general": """
	## AUDIENCE: General (Mixed / Anyone)
	Write for a non-technical reader with no assumed background.
	- Use plain English and everyday analogies.
	- Define every technical term on first use.
	- Keep sentences short. Use bullet points for lists.
	- REQUIRED sections: All standard sections. Glossary is mandatory.
	""",
	}

	TONE_PROMPTS = {
	"professional": """
	## TONE: Professional
	Clear, neutral, business-standard language. Structured paragraphs. Formal but not stiff.
	""",
	"casual": """
	## TONE: Casual Friendly
	Write like a knowledgeable colleague explaining over coffee.
	- Use conversational language and contractions (e.g., "it's", "doesn't")
	- Avoid report-style phrasing
	- Keep it natural and human
	- Reduce repetition across sections
	""",
	"urgent": """
	## TONE: Urgent / Escalation
	This content requires immediate attention.
	Open with impact and risk. Use direct, action-forcing language.
	Bold the most critical points. Keep it tight — no preamble or pleasantries.
	""",
	"educational": """
	## TONE: Educational
	Write to teach, not just inform. Explain the "why" behind decisions.
	Use the Glossary section fully. Build from simple to complex. Include at least one analogy.
	""",
	}

	FEATURE_PROMPTS = {
	"layered": """
	## FEATURE: Layered Output (TL;DR → Deep)
	You MUST begin your ENTIRE response with a "⚡ TL;DR" block — 1–2 sentences,
	plain English, zero jargon. Place it before all other sections.
	""",
	"business_impact": """
	## FEATURE: Business Impact
	You MUST include an explicit "💰 Business Impact" subsection inside Business Context.
	Cover: estimated cost/risk/ROI if quantifiable, operational disruption, revenue implication.
	If numbers are absent from source, state qualitative risk level (High/Medium/Low) with reasoning.
	""",
	"analogies": """
	## FEATURE: Analogies & Examples
	You MUST include at least one concrete real-world analogy inside the Overview section.
	Format it exactly as:
	💡 Analogy: [your analogy here]
	""",
	"action_items": """
	## FEATURE: Action Items
	The Suggested Next Steps section MUST use this exact Markdown table format:

	\| Action \| Owner \| Priority \|
	\|--------\|-------\|----------\|
	\| [What to do] \| [Suggested role] \| Address Promptly / Upcoming Sprint / Backlog \|

	Include a minimum of 2 rows and a maximum of 5 rows.
	""",
	"confidence": """
	## FEATURE: Confidence Notes
	You MUST add a final "🔍 Confidence Notes" section after all other sections.
	Rate confidence for each major claim:
	- ✅ High — clearly stated in source text
	- 🟡 Medium — reasonably inferred
	- 🔴 Low — assumed due to missing context
	Flag any ambiguous or missing information explicitly.
	""",
	"slack": """
	## FEATURE: Slack-Ready Format
	Reformat your ENTIRE output as a Slack message. This overrides all other formatting rules.
	Rules:
	- Maximum 300 words total.
	- Use bold for emphasis (Slack syntax), not Markdown headers.
	- Use emoji bullets (✅ 🔴 📌 ⚠️) instead of dashes or numbers.
	- Flat structure only — no nested headers or subsections.
	- End with exactly one line: 📌 Action needed: [single most important next step]
	""",
	}

	# ── Feature key normalization map (frontend label → internal key) ─────────────
	FEATURE_KEY_MAP = {
	"layered": "layered",
	"layered (tl;dr → deep)": "layered",
	"business_impact": "business_impact",
	"business impact": "business_impact",
	"analogies": "analogies",
	"analogies & examples": "analogies",
	"action_items": "action_items",
	"action items": "action_items",
	"confidence": "confidence",
	"confidence notes": "confidence",
	"slack": "slack",
	"slack-ready format": "slack",
	}

	# ── Audience key normalization map ────────────────────────────────────────────
	AUDIENCE_KEY_MAP = {
	"executive": "executive",
	"c-suite": "executive",
	"csuite": "executive",
	"pm": "pm",
	"pm / lead": "pm",
	"lead": "pm",
	"sales": "sales",
	"sales / client": "sales",
	"client": "sales",
	"general": "general",
	}

	# ── Tone key normalization map ────────────────────────────────────────────────
	TONE_KEY_MAP = {
	"professional": "professional",
	"casual": "casual",
	"casual friendly": "casual",
	"urgent": "urgent",
	"urgent / escalation":"urgent",
	"escalation": "urgent",
	"educational": "educational",
	}

	# Input limits (characters) — protects token budget and prevents abuse
	MAX_TEXT_LENGTH = 8_000
	MAX_TEXT2_LENGTH = 8_000

	# ══════════════════════════════════════════════════════════════════════════════
	# PROMPT BUILDER
	# ══════════════════════════════════════════════════════════════════════════════

	def build_system_prompt(audience: str, tone: str, features: list[str]) -> str:
	"""
	Assemble a deterministic system prompt from the base + audience + tone + feature blocks.
	Slack feature MUST be last (highest priority override).
	"""
	audience_key = AUDIENCE_KEY_MAP.get(audience.lower().strip(), "general")
	tone_key = TONE_KEY_MAP.get(tone.lower().strip(), "professional")

	# Normalize features safely
	normalized_features = []
	for f in features:
	key = FEATURE_KEY_MAP.get(f.lower().strip())
	if key and key not in normalized_features:
	normalized_features.append(key)

	# Enforce Slack LAST (highest priority)
	if "slack" in normalized_features:
	normalized_features = [
	f for f in normalized_features if f != "slack"
	] + ["slack"]

	parts = [
	BASE_SYSTEM_PROMPT,
	AUDIENCE_PROMPTS.get(audience_key, AUDIENCE_PROMPTS["general"]),
	TONE_PROMPTS.get(tone_key, TONE_PROMPTS["professional"]),
	]

	# Append features in correct order
	for feature_key in normalized_features:
	if feature_key in FEATURE_PROMPTS:
	parts.append(FEATURE_PROMPTS[feature_key])

	return "\n\n".join(parts)



	def build_user_prompt(
	text: str,
	text2: str,
	mode: str,
	audience: str,
	tone: str,
	features: list[str],
	) -> str:
	"""
	Build the user-turn prompt. Keeps source content clean and clearly delimited.
	"""
	feature_summary = ", ".join(features) if features else "None"

	header = (
	f"[Configuration]\n"
	f"- Mode: {mode.capitalize()}\n"
	f"- Audience: {audience}\n"
	f"- Tone: {tone}\n"
	f"- Features: {feature_summary}\n\n"
	)

	if mode == "comparison":
	body = (
	f"--- SOURCE TEXT A ---\n{text}\n\n"
	f"--- SOURCE TEXT B ---\n{text2}\n\n"
	f"[Task] Provide a Comparison summary: summarize both texts, "
	f"highlight key differences, note resource implications, and suggest an approach."
	)
	elif mode == "reverse":
	body = (
	f"--- BUSINESS REQUEST ---\n{text}\n\n"
	f"[Task] Reverse-translate this business request into: "
	f"technical considerations, acceptance criteria, and questions for the engineering team."
	)
	else:
	body = (
	f"--- TECHNICAL SOURCE TEXT ---\n{text}\n\n"
	f"[Task] Translate the technical content above following all configuration rules."
	)

	return header + body


	# ══════════════════════════════════════════════════════════════════════════════
	# API ROUTES
	# ══════════════════════════════════════════════════════════════════════════════

	@app.post("/api/translate")
	async def translate(request: Request):
	# ── 1. Parse body ──────────────────────────────────────────────────────────
	try:
	body = await request.json()
	except Exception:
	return JSONResponse({"error": "Invalid JSON body."}, status_code=400)

	if not body:
	return JSONResponse({"error": "Empty request body."}, status_code=400)

	text = (body.get("text") or "").strip()
	text2 = (body.get("text2") or "").strip()
	mode = (body.get("mode") or "standard").strip().lower()
	audience = (body.get("audience") or "general").strip().lower()
	tone = (body.get("tone") or "professional").strip().lower()
	features = [f for f in (body.get("features") or []) if isinstance(f, str)]

	# ── 2. Input validation ────────────────────────────────────────────────────
	if not text:
	return JSONResponse({"error": "No text provided."}, status_code=400)

	if len(text) > MAX_TEXT_LENGTH:
	return JSONResponse(
	{"error": f"Input text exceeds {MAX_TEXT_LENGTH:,} character limit. Please shorten it."},
	status_code=400,
	)

	if mode not in ("standard", "comparison", "reverse"):
	return JSONResponse(
	{"error": f"Invalid mode '{mode}'. Must be standard, comparison, or reverse."},
	status_code=400,
	)

	if mode == "comparison":
	if not text2:
	return JSONResponse(
	{"error": "Comparison mode requires a second text (text2)."},
	status_code=400,
	)
	if len(text2) > MAX_TEXT2_LENGTH:
	return JSONResponse(
	{"error": f"Second text exceeds {MAX_TEXT2_LENGTH:,} character limit."},
	status_code=400,
	)

	# ── 3. Config check ────────────────────────────────────────────────────────
	if not AZURE_API_KEY:
	logger.error("AZURE_API_KEY is not configured.")
	return JSONResponse(
	{"error": "Translation service is not configured. Contact the administrator."},
	status_code=500,
	)

	if not AZURE_ENDPOINT:
	logger.error("AZURE_ENDPOINT is not configured.")
	return JSONResponse(
	{"error": "Translation endpoint is not configured. Contact the administrator."},
	status_code=500,
	)

	# ── 4. Build prompts ───────────────────────────────────────────────────────
	system_prompt = build_system_prompt(audience, tone, features)
	user_prompt = build_user_prompt(text, text2, mode, audience, tone, features)

	logger.info(
	"Translate request \| mode=%s audience=%s tone=%s features=%s chars=%d",
	mode, audience, tone, features, len(text),
	)

	# ── 5. Call Azure OpenAI ───────────────────────────────────────────────────
	try:
	async with httpx.AsyncClient(timeout=90.0) as client:
	response = await client.post(
	AZURE_ENDPOINT,
	headers={
	"Content-Type": "application/json",
	"api-key": AZURE_API_KEY,
	},
	json={
	"model": MODEL_DEPLOYMENT,
	"instructions": system_prompt,
	"input": user_prompt,
	"max_output_tokens": 16384,
	},
	)

	# Surface non-2xx HTTP errors clearly
	if response.status_code != 200:
	logger.warning("Azure returned HTTP %d: %s", response.status_code, response.text[:300])
	return JSONResponse(
	{"error": f"Translation service returned an error (HTTP {response.status_code}). Try again."},
	status_code=502,
	)

	data = response.json()

	except httpx.TimeoutException:
	logger.warning("Azure request timed out.")
	return JSONResponse(
	{"error": "Request timed out. Try with shorter input or try again shortly."},
	status_code=504,
	)
	except httpx.RequestError as exc:
	logger.error("Network error contacting Azure: %s", exc)
	return JSONResponse(
	{"error": "Could not reach the translation service. Check connectivity."},
	status_code=502,
	)

	# ── 6. Parse Azure response ────────────────────────────────────────────────
	# Guard against {"error": {...}} in a 200 response (Azure sometimes does this)
	error_field = data.get("error")
	if error_field:
	error_msg = (
	error_field.get("message", "Unknown error from translation service.")
	if isinstance(error_field, dict)
	else str(error_field)
	)
	logger.warning("Azure error in 200 response: %s", error_msg)
	return JSONResponse({"error": error_msg}, status_code=502)

	# Extract text from the Responses API output array
	output_text = _extract_output_text(data)

	if not output_text:
	logger.error("Empty output extracted from Azure response: %s", str(data)[:500])
	return JSONResponse(
	{"error": "The AI returned an empty response. Please try again."},
	status_code=502,
	)

	return JSONResponse({"translation": output_text})


	def _extract_output_text(data: dict) -> str:
	"""
	Safely extract assistant text from Azure OpenAI Responses API payload.
	Handles nested output → message → content → output_text structure.
	Returns empty string if nothing is found.
	"""
	output_text = ""

	output_list = data.get("output") or []
	if not isinstance(output_list, list):
	return output_text

	for item in output_list:
	if not isinstance(item, dict):
	continue
	if item.get("type") != "message":
	continue
	content_list = item.get("content") or []
	for content in content_list:
	if isinstance(content, dict) and content.get("type") == "output_text":
	output_text += content.get("text", "")

	return output_text.strip()


	# ══════════════════════════════════════════════════════════════════════════════
	# HEALTH CHECK
	# ══════════════════════════════════════════════════════════════════════════════

	@app.get("/api/health")
	async def health():
	return {
	"status": "ok",
	"configured": bool(AZURE_API_KEY and AZURE_ENDPOINT),
	"model": MODEL_DEPLOYMENT,
	}


	# ══════════════════════════════════════════════════════════════════════════════
	# SERVE FRONTEND
	# ══════════════════════════════════════════════════════════════════════════════

	@app.get("/")
	async def root():
	return FileResponse(BASE_DIR / "static" / "index.html")

	app.mount("/static", StaticFiles(directory=str(BASE_DIR / "static")), name="static")