Spaces:

MCP-1st-Birthday
/

HR-Assistant

Running

File size: 15,610 Bytes

"""
Voice Screening MVP - Streamlit UI for browser-based voice interviews.
"""
import os
import streamlit as st
from datetime import datetime
from pathlib import Path
import uuid

import sys
from pathlib import Path

# Load environment variables
try:
    from dotenv import load_dotenv
    load_dotenv()
except ImportError:
    pass  # dotenv not installed, will try to get from environment

# Add src directory to path so imports work
sys.path.insert(0, str(Path(__file__).parent.parent))

# Try to import requests for API calls (required)
try:
    import requests
    HAS_REQUESTS = True
except ImportError:
    HAS_REQUESTS = False
    raise ImportError("requests library is required for voice screening")

# Helper function to get proxy URL
def get_proxy_url(for_client=False):
    """
    Get WebSocket proxy URL from environment or default.

    Reads ``WEBSOCKET_PROXY_URL``. When the variable is unset, empty, or only
    whitespace, ``ws://localhost:8000/ws/realtime`` is used, so a blank
    variable never produces an unusable empty URL.

    Args:
        for_client (bool): If True, every occurrence of ``websocket_proxy``
            in the URL is replaced with ``localhost`` so the result is
            reachable from the browser. If False, the configured URL is
            returned as-is (the internal Docker URL).

    Returns:
        str: The WebSocket proxy URL.
    """
    default_url = "ws://localhost:8000/ws/realtime"
    # os.getenv's default only applies when the variable is missing; the
    # trailing `or` also covers a variable that is present but blank.
    proxy_url = (os.getenv("WEBSOCKET_PROXY_URL") or "").strip() or default_url

    if for_client:
        # Convert Docker internal URL to browser-accessible URL
        # (str.replace is a no-op when the internal host name is absent)
        proxy_url = proxy_url.replace("websocket_proxy", "localhost")

    return proxy_url

def get_proxy_base_url(for_client: bool = False):
    """Derive the HTTP(S) base URL of the proxy from its WebSocket URL.

    The WebSocket URL comes from ``get_proxy_url``; its ``ws``/``wss`` scheme
    is mapped to ``http``/``https`` and the ``/ws/realtime`` path is removed.

    Args:
        for_client: Forwarded unchanged to ``get_proxy_url``. True selects the
                   browser-accessible (localhost) URL, False the internal
                   Docker URL (websocket_proxy).

    Returns:
        The base URL, always starting with ``http://`` or ``https://``.
    """
    http_endpoint = get_proxy_url(for_client=for_client)

    # Swap the WebSocket scheme for its HTTP counterpart
    http_endpoint = http_endpoint.replace("ws://", "http://")
    http_endpoint = http_endpoint.replace("wss://", "https://")

    # Drop the realtime endpoint path so only the service root is left
    http_endpoint = http_endpoint.replace("/ws/realtime", "")

    if http_endpoint.startswith(("http://", "https://")):
        return http_endpoint

    # No recognised scheme was configured: assume plain HTTP
    return f"http://{http_endpoint}"

def get_backend_url():
    """Get backend API URL from environment or default.

    Reads ``BACKEND_API_URL``. When the variable is unset or blank,
    ``http://localhost:8000`` is used. Trailing slashes are removed so that
    callers can append a path starting with ``/`` without producing ``//``.

    Returns:
        str: The backend base URL without a trailing slash.
    """
    default_url = "http://localhost:8000"
    # os.getenv's default only applies when the variable is missing, so a
    # present-but-blank value is handled explicitly here.
    backend_url = (os.getenv("BACKEND_API_URL") or "").strip().rstrip("/")
    return backend_url or default_url

# Page configuration
st.set_page_config(page_title="Voice Screening Interview", page_icon="🎙️", layout="centered")

# Initialize session state: every key this page reads gets a starting value,
# and values already present from an earlier run are left untouched.
_session_defaults = {
    "session_id": None,
    "transcript": [],
    "is_interview_active": False,
    "candidate_id": None,
    "session_token": None,
    "user_email": None,
    "auth_code": None,
    "audio_file_path": None,
}
for _state_key, _state_default in _session_defaults.items():
    if _state_key not in st.session_state:
        st.session_state[_state_key] = _state_default

st.title("🎙️ Voice Screening Interview")

# Authentication screen
# Shown while no session token is stored. The form posts the email and code to
# the proxy's /auth/verify endpoint; on success the token (and candidate ID,
# if the proxy returns one) is stored and the script reruns. The script stops
# at the end of this section so nothing below renders before login.
if not st.session_state.session_token:
    st.markdown("### 🔐 Authentication")
    st.markdown("Please enter your email and authentication code to start.")
    
    with st.form("auth_form"):
        user_email = st.text_input("Email", placeholder="your.email@example.com", value=st.session_state.user_email or "")
        auth_code = st.text_input("Authentication Code", placeholder="Enter your code", value=st.session_state.auth_code or "")
        
        verify_submitted = st.form_submit_button("✅ Verify & Login", use_container_width=True, type="primary")
        
        if verify_submitted:
            if not (user_email and auth_code):
                st.warning("⚠️ Please enter both email and code.")
            else:
                # Use for_client=True to get localhost URL when running outside Docker.
                # get_proxy_base_url already returns a URL with an http(s) scheme,
                # so no further scheme check is needed here.
                auth_url = f"{get_proxy_base_url(for_client=True)}/auth/verify"
                try:
                    response = requests.post(
                        auth_url,
                        json={"email": user_email, "code": auth_code},
                        timeout=5
                    )
                except requests.RequestException as e:
                    # Only genuine transport failures are reported as connection errors
                    st.error(f"❌ Error connecting to proxy: {e}")
                    st.info("💡 Make sure the WebSocket proxy service is running.")
                else:
                    # The body may be empty, not JSON, or JSON that is not an object;
                    # all of those are treated as "no structured payload".
                    try:
                        payload = response.json() if response.content else {}
                    except ValueError:
                        payload = {}
                    if not isinstance(payload, dict):
                        payload = {}
                    
                    if response.status_code == 200:
                        issued_token = payload.get("session_token")
                        if issued_token:
                            st.session_state.session_token = issued_token
                            st.session_state.user_email = user_email
                            
                            # Auto-set candidate ID if returned
                            if payload.get("candidate_id"):
                                st.session_state.candidate_id = payload["candidate_id"]
                            
                            st.success("✅ Authentication successful!")
                            st.rerun()
                        else:
                            # A 200 without a token cannot log the user in
                            st.error("❌ Authentication failed: the proxy response did not include a session token.")
                    else:
                        st.error(f"❌ Authentication failed: {payload.get('detail', response.text)}")
    
    st.markdown("---")
    st.info("💡 **Note:** Enter your email and authentication code to proceed.")
    st.stop()

# Main interview interface (only shown after authentication)
# Header row: a welcome message on the left and a logout button on the right.
col_header1, col_header2 = st.columns([3, 1])
with col_header1:
    st.markdown(
        f"""
        Welcome, **{st.session_state.user_email}**!  
        Click **Start Interview** to begin, then use the toggle button to speak.
        """
    )
with col_header2:
    if st.button("🚪 Logout", use_container_width=True):
        # Drop the credentials ...
        st.session_state.session_token = None
        st.session_state.user_email = None
        st.session_state.auth_code = None
        # ... and everything tied to the interview of the user who is leaving,
        # so none of it is carried over into the next login in this browser
        # session.
        st.session_state.is_interview_active = False
        st.session_state.candidate_id = None
        st.session_state.session_id = None
        st.session_state.transcript = []
        st.session_state.audio_file_path = None
        st.rerun()

# Candidate selection
# The candidate ID can come from the page URL or be typed in; a typed value
# replaces the stored one whenever it is non-empty and different.
with st.expander("Candidate Information", expanded=True):
    # Adopt a candidate_id query parameter only while no candidate is stored
    if not st.session_state.candidate_id and "candidate_id" in st.query_params:
        st.session_state.candidate_id = st.query_params["candidate_id"]
        st.success(f"✅ Candidate ID loaded from URL: {st.session_state.candidate_id}")
    
    if not st.session_state.candidate_id:
        st.warning("⚠️ No candidate selected. Please provide a Candidate ID.")
    else:
        st.info(f"Current Candidate ID: `{st.session_state.candidate_id}`")
    
    typed_candidate_id = st.text_input("Enter Candidate ID", value=st.session_state.candidate_id or "")
    
    # Surrounding whitespace is not part of the ID
    cleaned_candidate_id = typed_candidate_id.strip() if typed_candidate_id else typed_candidate_id
    
    is_new_candidate = bool(cleaned_candidate_id) and cleaned_candidate_id != st.session_state.candidate_id
    if is_new_candidate:
        st.session_state.candidate_id = cleaned_candidate_id
        st.success(f"✅ Candidate ID set to: {cleaned_candidate_id}")

# Interview controls
# Left column: Start button while idle, End button while an interview runs.
# Right column: a status badge while the interview is active.
controls_col, status_col = st.columns(2)

with controls_col:
    if st.session_state.is_interview_active:
        if st.button("⏹️ End Interview", type="secondary", use_container_width=True):
            # Save audio recording and transcript via backend API
            can_save = (
                st.session_state.session_id
                and st.session_state.session_token
                and st.session_state.candidate_id
                and HAS_REQUESTS
            )
            if not can_save:
                st.error("❌ Missing session state for saving!")
                st.write(f"Session ID: {st.session_state.session_id}")
                st.write(f"Token: {bool(st.session_state.session_token)}")
                st.write(f"Candidate ID: {st.session_state.candidate_id}")
            else:
                try:
                    # Only agent and candidate lines go into the saved transcript
                    spoken_lines = (
                        f"{entry.get('speaker', 'unknown')}: {entry.get('text', '')}"
                        for entry in st.session_state.transcript
                        if entry.get("speaker") in ["agent", "candidate"]
                    )
                    transcript_text = "\n".join(spoken_lines)
                    
                    backend_url = get_backend_url()
                    save_url = f"{backend_url}/api/v1/voice-screener/session/{st.session_state.session_id}/save"
                    st.info(f"🔍 Debug: Attempting to save to {save_url}")
                    
                    save_payload = {
                        "session_id": st.session_state.session_id,
                        "candidate_id": st.session_state.candidate_id,
                        "transcript_text": transcript_text,
                        "proxy_token": st.session_state.session_token
                    }
                    response = requests.post(save_url, json=save_payload, timeout=30)
                    st.info(f"🔍 Debug: Response Status: {response.status_code}")
                    
                    if response.status_code != 200:
                        st.error(f"❌ Backend Error ({response.status_code}): {response.text}")
                    else:
                        data = response.json()
                        st.session_state.audio_file_path = data.get("audio_file_path")
                        st.success("✅ Session saved successfully!")
                        if st.session_state.audio_file_path:
                            st.info(f"Audio: {st.session_state.audio_file_path}")
                except Exception as e:
                    st.error(f"❌ Connection Error: {e}")
                    st.code(f"Backend URL: {get_backend_url()}\nError Type: {type(e).__name__}")
            
            # The interview ends whether or not the save succeeded
            st.session_state.is_interview_active = False
            # No rerun here, so the debug messages above stay visible
    elif st.button("🚀 Start Interview", type="primary", use_container_width=True):
        st.session_state.is_interview_active = True
        st.session_state.session_id = str(uuid.uuid4())
        # A new interview starts from a transcript holding only the start marker
        st.session_state.transcript = [{
            "speaker": "system",
            "text": "Interview started",
            "timestamp": datetime.now().isoformat()
        }]
        st.rerun()

with status_col:
    if st.session_state.is_interview_active:
        st.info("🟢 Interview Active")

# Voice interface component
# While an interview is active this section renders, in order: the embedded
# HTML voice component (with a collapsible connection-debug panel), the live
# transcript, and a manual transcript-entry form for testing.
from urllib.parse import quote  # used only for the WebSocket URL built below

if st.session_state.is_interview_active:
    st.markdown("---")
    st.subheader("Voice Interface")
    
    # Load HTML component with WebSocket and audio handling
    html_file = Path(__file__).parent / "components" / "voice_interface.html"
    if html_file.exists():
        html_content = html_file.read_text(encoding="utf-8")
        
        # Get proxy URL and session token
        proxy_url = get_proxy_url(for_client=True)
        session_token = st.session_state.session_token
        
        if not session_token:
            st.error("⚠️ No session token. Please authenticate first.")
            st.stop()
        
        # Show connection debug info
        with st.expander("🔍 Connection Debug Info", expanded=False):
            st.success(f"✅ Authenticated as: `{st.session_state.user_email}`")
            st.info(f"**WebSocket Proxy:** `{proxy_url}`")
            st.info("**Note:** The connection uses a WebSocket proxy to handle authentication. "
                   "Browsers cannot set custom headers in WebSocket connections, so we proxy through the backend.")
            if "localhost" in proxy_url or "127.0.0.1" in proxy_url:
                st.warning("⚠️ Make sure the WebSocket proxy service is running! Check docker-compose logs.")
            
            # Proxy health check
            if HAS_REQUESTS:
                # Best-effort diagnostics: any failure is shown as a warning
                # inside the debug panel instead of breaking the page.
                try:
                    # Use for_client=True to get localhost URL when running outside Docker.
                    # get_proxy_base_url already returns a URL with an http(s) scheme.
                    health_url = f"{get_proxy_base_url(for_client=True)}/health"
                    response = requests.get(health_url, timeout=2)
                    if response.status_code == 200:
                        health_data = response.json()
                        st.success(f"✅ Proxy is healthy: {health_data.get('status', 'unknown')}")
                        if health_data.get('openai_api_key_configured'):
                            st.success("✅ OpenAI API key is configured in proxy")
                        else:
                            st.error("❌ OpenAI API key NOT configured in proxy")
                        st.info(f"Active sessions: {health_data.get('active_sessions', 0)}")
                    else:
                        st.warning(f"⚠️ Proxy health check returned: {response.status_code}")
                except Exception as e:
                    st.warning(f"⚠️ Could not check proxy health: {e}")
                    st.info("💡 **To view proxy logs:** `docker compose logs -f websocket_proxy`")
            else:
                st.info("💡 **To check proxy status:** `docker compose logs websocket_proxy`")
                st.info("💡 **To view live logs:** `docker compose logs -f websocket_proxy`")
        
        # Build WebSocket URL with session token. The token is percent-encoded
        # so characters such as "+", "&" or "=" survive as part of the value,
        # and "&" is used when the proxy URL already carries a query string.
        separator = "&" if "?" in proxy_url else "?"
        ws_url = f"{proxy_url}{separator}token={quote(session_token, safe='')}"
        
        # Fill the placeholders of the HTML template
        html_content = html_content.replace("{{SESSION_ID}}", st.session_state.session_id)
        html_content = html_content.replace("{{SESSION_TOKEN}}", session_token)
        html_content = html_content.replace("{{PROXY_URL}}", ws_url)
        
        st.components.v1.html(html_content, height=500)  # Increased height for error messages
    else:
        st.warning("Voice interface component not found. Please ensure voice_interface.html exists.")
    
    # Transcript display
    st.markdown("---")
    st.subheader("Live Transcript")
    
    if st.session_state.transcript:
        for entry in st.session_state.transcript:
            speaker = entry.get("speaker", "unknown")
            text = entry.get("text", "")
            
            if speaker == "agent":
                st.markdown(f"**🤖 Agent:** {text}")
            elif speaker == "candidate":
                st.markdown(f"**👤 You:** {text}")
            else:
                # Any other speaker (e.g. "system") is shown in italics
                st.markdown(f"*{text}*")
    
    # Manual transcript update (for testing - in real app, JS updates this)
    with st.expander("Add Transcript Entry (Testing)"):
        text_col, speaker_col = st.columns([3, 1])
        with text_col:
            test_text = st.text_input("Text", key="test_transcript")
        with speaker_col:
            test_speaker = st.selectbox("Speaker", ["candidate", "agent"], key="test_speaker")
        
        if st.button("Add Entry"):
            if test_text:
                st.session_state.transcript.append({
                    "speaker": test_speaker,
                    "text": test_text,
                    "timestamp": datetime.now().isoformat()
                })
                st.rerun()