Spaces:

MCP-1st-Birthday
/

HR-Assistant

Running

App Files Files Community

HR-Assistant / src /frontend /streamlit /voice_screening_ui /app.py

owenkaplinsky

websocket url conversion fix (#8)

d864cc1 verified 17 days ago

raw

history blame contribute delete

15.6 kB

	"""
	Voice Screening MVP - Streamlit UI for browser-based voice interviews.
	"""
	import os
	import streamlit as st
	from datetime import datetime
	from pathlib import Path
	import uuid

	import sys
	from pathlib import Path

	# Load environment variables from a .env file when python-dotenv is installed;
	# otherwise fall back to whatever is already present in the process environment.
	try:
	    from dotenv import load_dotenv
	    load_dotenv()
	except ImportError:
	    pass  # dotenv not installed, will try to get from environment

	# Make the directory two levels above this file importable.
	# NOTE(review): the previous comment called this the "src" directory; confirm
	# that `parent.parent` is really the intended root for this repo layout.
	sys.path.insert(0, str(Path(__file__).parent.parent))

	# `requests` is a hard requirement: every proxy/backend call below uses it,
	# so fail loudly at import time instead of carrying on without it.
	try:
	    import requests
	except ImportError as exc:
	    raise ImportError("requests library is required for voice screening") from exc

	# Kept for the `if HAS_REQUESTS:` guards further down; it is always True once
	# execution reaches this line because a missing library raises above.
	HAS_REQUESTS = True

	# Helper function to get proxy URL
	def get_proxy_url(for_client: bool = False) -> str:
	    """Return the WebSocket proxy URL.

	    The URL is read from the ``WEBSOCKET_PROXY_URL`` environment variable.
	    When the variable is unset, empty or whitespace-only, the default
	    ``ws://localhost:8000/ws/realtime`` is used instead, so callers never
	    receive an empty string.

	    Args:
	        for_client: If True, every occurrence of the Docker service name
	            ``websocket_proxy`` in the URL is replaced with ``localhost`` so
	            the URL can be reached from a browser. If False, the configured
	            URL is returned unchanged.

	    Returns:
	        The proxy URL as a string.
	    """
	    default_url = "ws://localhost:8000/ws/realtime"
	    # `os.getenv(name, default)` only applies the default when the variable
	    # is missing; an empty value must be treated as "not configured" too.
	    proxy_url = (os.getenv("WEBSOCKET_PROXY_URL") or "").strip() or default_url

	    if for_client:
	        # str.replace is a no-op when the service name is absent, so no
	        # membership test is needed first.
	        proxy_url = proxy_url.replace("websocket_proxy", "localhost")

	    return proxy_url

	def get_proxy_base_url(for_client: bool = False) -> str:
	    """Return the HTTP base URL used for proxy API calls.

	    The value is derived from ``get_proxy_url``: the WebSocket scheme is
	    mapped to its HTTP counterpart (``ws`` -> ``http``, ``wss`` -> ``https``),
	    the ``/ws/realtime`` path is removed, ``http://`` is prepended when no
	    HTTP scheme is present, and any trailing slash is dropped so callers can
	    append paths such as ``/health`` without producing ``//``.

	    Args:
	        for_client: Passed through to ``get_proxy_url``; if True the URL is
	            the browser-accessible (localhost) variant, otherwise the
	            configured URL is used as-is.

	    Returns:
	        The base URL, always starting with ``http://`` or ``https://`` and
	        never ending with ``/``.
	    """
	    proxy_url = get_proxy_url(for_client=for_client)

	    # Rewrite only the leading scheme rather than every matching substring.
	    if proxy_url.startswith("wss://"):
	        base_url = "https://" + proxy_url[len("wss://"):]
	    elif proxy_url.startswith("ws://"):
	        base_url = "http://" + proxy_url[len("ws://"):]
	    else:
	        base_url = proxy_url

	    base_url = base_url.replace("/ws/realtime", "")

	    # Ensure we have a protocol
	    if not base_url.startswith(("http://", "https://")):
	        base_url = f"http://{base_url}"

	    # Trim trailing slashes from the part after the scheme only, so the
	    # "://" separator itself can never be eaten.
	    scheme, _, remainder = base_url.partition("://")
	    return f"{scheme}://{remainder.rstrip('/')}"

	def get_backend_url() -> str:
	    """Return the backend API base URL.

	    Reads ``BACKEND_API_URL`` from the environment. Surrounding whitespace
	    and trailing slashes are removed so callers can append ``/api/...``
	    directly. When the variable is unset or empty after that clean-up,
	    ``http://localhost:8000`` is returned.

	    Returns:
	        The backend base URL without a trailing slash.
	    """
	    configured = (os.getenv("BACKEND_API_URL") or "").strip().rstrip("/")
	    return configured or "http://localhost:8000"

	# Page configuration
	st.set_page_config(page_title="Voice Screening Interview", page_icon="🎙️", layout="centered")

	# Seed every session-state key this page reads. A key is only written when it
	# is missing, so values that are already present are left untouched.
	_session_defaults = {
	    "session_id": None,
	    "transcript": [],
	    "is_interview_active": False,
	    "candidate_id": None,
	    "session_token": None,
	    "user_email": None,
	    "auth_code": None,
	    "audio_file_path": None,
	}
	for _state_key, _state_default in _session_defaults.items():
	    if _state_key not in st.session_state:
	        st.session_state[_state_key] = _state_default

	st.title("🎙️ Voice Screening Interview")

	# Authentication screen: shown until a session token is stored. The script is
	# stopped at the end of this branch so nothing below renders unauthenticated.
	if not st.session_state.session_token:
	    st.markdown("### 🔐 Authentication")
	    st.markdown("Please enter your email and authentication code to start.")

	    with st.form("auth_form"):
	        user_email = st.text_input("Email", placeholder="your.email@example.com", value=st.session_state.user_email or "")
	        auth_code = st.text_input("Authentication Code", placeholder="Enter your code", value=st.session_state.auth_code or "")

	        verify_submitted = st.form_submit_button("✅ Verify & Login", use_container_width=True, type="primary")

	        if verify_submitted:
	            if not (user_email and auth_code):
	                st.warning("⚠️ Please enter both email and code.")
	            else:
	                # get_proxy_base_url already guarantees an http(s):// prefix.
	                # NOTE(review): for_client=True yields the localhost variant even
	                # though this request is sent from the Streamlit process; confirm
	                # that is intended when the app itself runs inside Docker.
	                auth_url = f"{get_proxy_base_url(for_client=True)}/auth/verify"
	                try:
	                    response = requests.post(
	                        auth_url,
	                        json={"email": user_email, "code": auth_code},
	                        timeout=5,
	                    )
	                except requests.RequestException as e:
	                    # Only genuine transport failures are reported as connection errors.
	                    st.error(f"❌ Error connecting to proxy: {e}")
	                    st.info("💡 Make sure the WebSocket proxy service is running.")
	                else:
	                    # The body may be empty or not JSON (e.g. an HTML error page);
	                    # treat anything that is not a JSON object as "no data".
	                    try:
	                        data = response.json() if response.content else {}
	                    except ValueError:
	                        data = {}
	                    if not isinstance(data, dict):
	                        data = {}

	                    if response.status_code != 200:
	                        st.error(f"❌ Authentication failed: {data.get('detail', response.text)}")
	                    elif not data.get("session_token"):
	                        st.error("❌ Authentication failed: proxy response did not include a session token")
	                    else:
	                        st.session_state.session_token = data["session_token"]
	                        st.session_state.user_email = user_email

	                        # Auto-set candidate ID if returned
	                        if data.get("candidate_id"):
	                            st.session_state.candidate_id = data["candidate_id"]

	                        st.success("✅ Authentication successful!")
	                        st.rerun()

	    st.markdown("---")
	    st.info("💡 Note: Enter your email and authentication code to proceed.")
	    st.stop()

	# Main interview interface (only shown after authentication)
	col_header1, col_header2 = st.columns([3, 1])
	with col_header1:
	    st.markdown(
	        f"""
	        Welcome, {st.session_state.user_email}!
	        Click Start Interview to begin, then use the toggle button to speak.
	        """
	    )
	with col_header2:
	    if st.button("🚪 Logout", use_container_width=True):
	        # Clear the credentials.
	        st.session_state.session_token = None
	        st.session_state.user_email = None
	        st.session_state.auth_code = None
	        # Also clear all interview data, so the next person who logs in from
	        # the same browser session does not inherit the previous candidate ID,
	        # session ID, transcript or audio path.
	        st.session_state.is_interview_active = False
	        st.session_state.candidate_id = None
	        st.session_state.session_id = None
	        st.session_state.transcript = []
	        st.session_state.audio_file_path = None
	        st.rerun()

	# Candidate selection
	with st.expander("Candidate Information", expanded=True):
	    # Adopt a candidate_id from the page URL, but only while none is stored yet.
	    if not st.session_state.candidate_id and "candidate_id" in st.query_params:
	        st.session_state.candidate_id = st.query_params["candidate_id"]
	        st.success(f"✅ Candidate ID loaded from URL: {st.session_state.candidate_id}")

	    stored_candidate_id = st.session_state.candidate_id
	    if not stored_candidate_id:
	        st.warning("⚠️ No candidate selected. Please provide a Candidate ID.")
	    else:
	        st.info(f"Current Candidate ID: `{stored_candidate_id}`")

	    # Whitespace around the typed value is ignored.
	    typed_candidate_id = (st.text_input("Enter Candidate ID", value=stored_candidate_id or "") or "").strip()

	    # Only a non-empty value that differs from the stored one replaces it.
	    if typed_candidate_id and typed_candidate_id != stored_candidate_id:
	        st.session_state.candidate_id = typed_candidate_id
	        st.success(f"✅ Candidate ID set to: {typed_candidate_id}")

	# Interview controls
	col1, col2 = st.columns(2)

	with col1:
	    if not st.session_state.is_interview_active:
	        if st.button("🚀 Start Interview", type="primary", use_container_width=True):
	            # A new interview gets a fresh session ID and a transcript that
	            # contains only the "Interview started" system entry.
	            st.session_state.is_interview_active = True
	            st.session_state.session_id = str(uuid.uuid4())
	            st.session_state.transcript = [{
	                "speaker": "system",
	                "text": "Interview started",
	                "timestamp": datetime.now().isoformat(),
	            }]
	            st.rerun()
	    elif st.button("⏹️ End Interview", type="secondary", use_container_width=True):
	        # Save audio recording and transcript via backend API
	        if st.session_state.session_id and st.session_state.session_token and st.session_state.candidate_id and HAS_REQUESTS:
	            # Build transcript text; only agent and candidate lines are sent.
	            transcript_text = "\n".join(
	                f"{entry.get('speaker', 'unknown')}: {entry.get('text', '')}"
	                for entry in st.session_state.transcript
	                if entry.get("speaker") in ["agent", "candidate"]
	            )

	            # Build the URL once so the debug line and the request cannot drift apart.
	            save_url = f"{get_backend_url()}/api/v1/voice-screener/session/{st.session_state.session_id}/save"
	            st.info(f"🔍 Debug: Attempting to save to {save_url}")

	            try:
	                response = requests.post(
	                    save_url,
	                    json={
	                        "session_id": st.session_state.session_id,
	                        "candidate_id": st.session_state.candidate_id,
	                        "transcript_text": transcript_text,
	                        "proxy_token": st.session_state.session_token,
	                    },
	                    timeout=30,
	                )
	            except requests.RequestException as e:
	                st.error(f"❌ Connection Error: {e}")
	                st.code(f"Backend URL: {get_backend_url()}\nError Type: {type(e).__name__}")
	            else:
	                st.info(f"🔍 Debug: Response Status: {response.status_code}")

	                if response.status_code == 200:
	                    # A 200 with a missing or non-JSON body still means the save
	                    # succeeded; there is simply no audio path to show.
	                    try:
	                        data = response.json()
	                    except ValueError:
	                        data = {}
	                    if not isinstance(data, dict):
	                        data = {}
	                    st.session_state.audio_file_path = data.get("audio_file_path")
	                    st.success("✅ Session saved successfully!")
	                    if st.session_state.audio_file_path:
	                        st.info(f"Audio: {st.session_state.audio_file_path}")
	                else:
	                    st.error(f"❌ Backend Error ({response.status_code}): {response.text}")
	        else:
	            st.error("❌ Missing session state for saving!")
	            st.write(f"Session ID: {st.session_state.session_id}")
	            st.write(f"Token: {bool(st.session_state.session_token)}")
	            st.write(f"Candidate ID: {st.session_state.candidate_id}")

	        st.session_state.is_interview_active = False
	        # Deliberately no st.rerun() here: a rerun would wipe the status and
	        # debug messages above before they can be read.

	with col2:
	    if st.session_state.is_interview_active:
	        st.info("🟢 Interview Active")

	# Voice interface component
	if st.session_state.is_interview_active:
	    # Imported here because this section is the only place that needs it.
	    from urllib.parse import quote

	    st.markdown("---")
	    st.subheader("Voice Interface")

	    # Load HTML component with WebSocket and audio handling
	    html_file = Path(__file__).parent / "components" / "voice_interface.html"
	    if html_file.exists():
	        html_content = html_file.read_text(encoding="utf-8")

	        # Get proxy URL and session token
	        proxy_url = get_proxy_url(for_client=True)
	        session_token = st.session_state.session_token

	        if not session_token:
	            st.error("⚠️ No session token. Please authenticate first.")
	            st.stop()

	        # Show connection debug info
	        with st.expander("🔍 Connection Debug Info", expanded=False):
	            st.success(f"✅ Authenticated as: `{st.session_state.user_email}`")
	            st.info(f"WebSocket Proxy: `{proxy_url}`")
	            st.info("Note: The connection uses a WebSocket proxy to handle authentication. "
	                    "Browsers cannot set custom headers in WebSocket connections, so we proxy through the backend.")
	            if "localhost" in proxy_url or "127.0.0.1" in proxy_url:
	                st.warning("⚠️ Make sure the WebSocket proxy service is running! Check docker-compose logs.")

	            # Proxy health check (best effort: failures only produce a warning)
	            if HAS_REQUESTS:
	                # get_proxy_base_url already guarantees an http(s):// prefix.
	                health_url = f"{get_proxy_base_url(for_client=True)}/health"
	                try:
	                    response = requests.get(health_url, timeout=2)
	                    health_data = response.json() if response.status_code == 200 else {}
	                except (requests.RequestException, ValueError) as e:
	                    st.warning(f"⚠️ Could not check proxy health: {e}")
	                    st.info("💡 To view proxy logs: `docker compose logs -f websocket_proxy`")
	                else:
	                    if response.status_code == 200:
	                        if not isinstance(health_data, dict):
	                            health_data = {}
	                        st.success(f"✅ Proxy is healthy: {health_data.get('status', 'unknown')}")
	                        if health_data.get('openai_api_key_configured'):
	                            st.success("✅ OpenAI API key is configured in proxy")
	                        else:
	                            st.error("❌ OpenAI API key NOT configured in proxy")
	                        st.info(f"Active sessions: {health_data.get('active_sessions', 0)}")
	                    else:
	                        st.warning(f"⚠️ Proxy health check returned: {response.status_code}")
	            else:
	                st.info("💡 To check proxy status: `docker compose logs websocket_proxy`")
	                st.info("💡 To view live logs: `docker compose logs -f websocket_proxy`")

	        # Build WebSocket URL with session token. The token is percent-encoded
	        # so characters such as "+", "&" or "=" cannot corrupt the query
	        # string, and "&" is used when the proxy URL already carries a query.
	        query_separator = "&" if "?" in proxy_url else "?"
	        ws_url = f"{proxy_url}{query_separator}token={quote(session_token, safe='')}"

	        # Fill the template placeholders.
	        html_content = html_content.replace("{{SESSION_ID}}", st.session_state.session_id)
	        html_content = html_content.replace("{{SESSION_TOKEN}}", session_token)
	        html_content = html_content.replace("{{PROXY_URL}}", ws_url)

	        st.components.v1.html(html_content, height=500)  # Increased height for error messages
	    else:
	        st.warning("Voice interface component not found. Please ensure voice_interface.html exists.")

	# Transcript display
	st.markdown("---")
	st.subheader("Live Transcript")

	# Label shown in front of each line, keyed by speaker; any other speaker
	# (e.g. "system") is rendered without a label.
	_speaker_labels = {"agent": "🤖 Agent: ", "candidate": "👤 You: "}
	for _line in st.session_state.transcript or ():
	    _label = _speaker_labels.get(_line.get("speaker", "unknown"), "")
	    st.markdown(f"{_label}{_line.get('text', '')}")

	# Manual transcript update (for testing - in real app, JS updates this)
	with st.expander("Add Transcript Entry (Testing)"):
	    text_column, speaker_column = st.columns([3, 1])
	    test_text = text_column.text_input("Text", key="test_transcript")
	    test_speaker = speaker_column.selectbox("Speaker", ["candidate", "agent"], key="test_speaker")

	    # Append only when the button was pressed and some text was entered.
	    if st.button("Add Entry") and test_text:
	        st.session_state.transcript.append({
	            "speaker": test_speaker,
	            "text": test_text,
	            "timestamp": datetime.now().isoformat()
	        })
	        st.rerun()