# Spaces: themehmi/Drive-Safe-Assistant (status: Runtime error; file size: 48,572 bytes)

"""
main.py — Self-Contained, Fully Integrated Safe Driving Assistant
Consolidates all system configuration, custom non-blocking sound synthesizer, dlib Eye Landmark processor,
Ollama SLM action voice-assistant parser, Flask SSE Telemetry Dashboard, and main drowsiness timer logic
into one unified, ultra-premium script.
"""

import os
import sys
import time
import json
import queue
import collections
import threading
import logging
import urllib.request
import urllib.parse
import webbrowser
import re

# Force dummy audio driver for headless container environments.
# This is set here, ahead of the pygame import below.
# NOTE(review): the value is assigned unconditionally, so it also applies on
# machines that do have audio hardware — confirm the pygame alert beeps are
# still expected to be audible there.
os.environ["SDL_AUDIODRIVER"] = "dummy"

import numpy as np
import scipy.io.wavfile as wavfile
import pygame
import pyttsx3
import cv2
import face_recognition
import speech_recognition as sr
from flask import Flask, render_template, Response, jsonify, request


#  1. DriveSafe Assistant — Configuration Settings
# --- Camera capture (overridable through environment variables) ---
CAMERA_ID = int(os.getenv("CAMERA_ID", 0))            # webcam index, usually 0
FRAME_WIDTH = int(os.getenv("FRAME_WIDTH", 640))      # capture width
FRAME_HEIGHT = int(os.getenv("FRAME_HEIGHT", 480))    # capture height

# --- Drowsiness detection thresholds ---
# An Eye Aspect Ratio under EAR_THRESHOLD counts as "eyes closed".
EAR_THRESHOLD = 0.23
# Consecutive below-threshold frames needed to trigger the eye-closed timer.
EAR_CONSEC_FRAMES = 3

# --- Alert severity levels (closed-eye durations, in seconds) ---
ALERT_LEVEL1_MIN = 3.0     # Level 1 ("stay focused") starts here
ALERT_LEVEL1_MAX = 5.0     # upper bound of Level 1
ALERT_LEVEL2_MIN = 5.0     # Level 2 ("wake up stay focus on road", louder) starts here

# --- Frequent drowsiness pattern tracking ---
FREQUENT_DROWSY_WINDOW = 60.0  # sliding window, in seconds, for counting drowsiness events
FREQUENT_DROWSY_LIMIT = 2      # warnings allowed in the window before advising a break (Level 3)

# --- Voice assistant & SLM settings ---
OLLAMA_MODEL = os.getenv("OLLAMA_MODEL", "drivesafe")    # custom local Ollama model
OLLAMA_API_URL = os.getenv(                               # Ollama generation endpoint
    "OLLAMA_API_URL", "http://localhost:11434/api/generate"
)
SPEECH_RECOGNITION_TIMEOUT = 10     # timeout for the speech recognizer
WAKE_WORD = "assistant"             # wake word for general conversations

# --- Web HUD dashboard server ---
FLASK_HOST = os.getenv("FLASK_HOST", "127.0.0.1")
FLASK_PORT = int(os.getenv("FLASK_PORT", 5000))

# --- High-energy music link ---
ENERGETIC_MUSIC_URL = "https://music.youtube.com/playlist?list=PLYBSqm--lNVt1H63PlRvigxvPU_unQe8m"

#  2. Flask Web HUD Server & Shared DashboardState

# Initialize Flask app.
# Module-level application object: the @app.route decorators below register
# their handlers on it. Templates are looked up in 'templates' and static
# assets in 'static'.
app = Flask(__name__, template_folder='templates', static_folder='static')

# Thread-safe global state for Flask-main loop communication
class DashboardState:
    """Mutable telemetry snapshot shared between the main loop and Flask.

    The code in this file reads and writes the fields while holding ``lock``.
    """

    def __init__(self):
        # Guard for every field below.
        self.lock = threading.Lock()

        # Video / detection telemetry
        self.latest_frame = None
        self.fps = 0
        self.ear = 0.0
        self.detection_active = True

        # Alert status
        self.state = "NORMAL"
        self.alert_message = ""
        self.drowsiness_count = 0

        # Conversation log shown on the dashboard
        self.chat_history = []

# Single shared instance; the Flask route handlers and stream generators
# below read and update it under dashboard_state.lock.
dashboard_state = DashboardState()

@app.route('/')
def index():
    """Serve the HUD dashboard page rendered from the ``index.html`` template."""
    page = render_template('index.html')
    return page

def gen_video_feed():
    """Yield an endless multipart stream of JPEG-encoded dashboard frames."""
    frame_interval = 1.0 / 30.0  # cap the web stream at 30 FPS to keep networking light
    part_header = b'--frame\r\nContent-Type: image/jpeg\r\n\r\n'

    while True:
        # Take a private copy under the lock so encoding happens outside it.
        with dashboard_state.lock:
            latest = dashboard_state.latest_frame
            snapshot = latest.copy() if latest is not None else None

        if snapshot is not None:
            # BGR OpenCV frame -> JPEG bytes
            ok, encoded = cv2.imencode('.jpg', snapshot)
            if ok:
                yield part_header + encoded.tobytes() + b'\r\n\r\n'

        time.sleep(frame_interval)

@app.route('/video_feed')
def video_feed():
    """Expose the frame generator as a multipart stream usable from an HTML img tag."""
    stream = gen_video_feed()
    return Response(stream, mimetype='multipart/x-mixed-replace; boundary=frame')

def gen_telemetry_stream():
    """Yield dashboard telemetry as Server-Sent Events, forever.

    Each event is one ``data: <json>\\n\\n`` frame holding a snapshot of
    ``dashboard_state``. Events are emitted no more often than once every
    0.06 seconds; the loop polls every 0.01 seconds in between.
    """
    min_interval = 0.06  # seconds between events (roughly 16 events/second at most)
    last_sent_time = 0
    while True:
        current_time = time.time()
        if current_time - last_sent_time >= min_interval:
            with dashboard_state.lock:
                data = {
                    "ear": round(dashboard_state.ear, 3),
                    "state": dashboard_state.state,
                    "drowsiness_count": dashboard_state.drowsiness_count,
                    "fps": dashboard_state.fps,
                    "alert_message": dashboard_state.alert_message,
                    # Copy the list while the lock is held: the payload is
                    # serialised after the lock is released, so handing out
                    # the live list would let another thread mutate it in the
                    # middle of json.dumps().
                    "chat_history": list(dashboard_state.chat_history),
                    "detection_active": dashboard_state.detection_active
                }

            # SSE data format: "data: <json>\n\n"
            yield f"data: {json.dumps(data)}\n\n"
            last_sent_time = current_time

        time.sleep(0.01)

@app.route('/telemetry')
def telemetry():
    """Expose the telemetry generator as a ``text/event-stream`` (SSE) response."""
    events = gen_telemetry_stream()
    return Response(events, mimetype='text/event-stream')

# Interactive Control APIs

@app.route('/api/toggle_detection', methods=['POST'])
def toggle_detection():
    """Flip the ``detection_active`` flag and report its new value."""
    with dashboard_state.lock:
        now_active = not dashboard_state.detection_active
        dashboard_state.detection_active = now_active
    return jsonify({"status": "success", "detection_active": now_active})

@app.route('/api/reset', methods=['POST'])
def api_reset():
    """Run the reset callback attached to ``app``, if one has been attached."""
    callback = getattr(app, 'reset_callback', None)
    if not callback:
        return jsonify({"status": "error", "message": "Reset callback not configured."})

    callback()
    return jsonify({"status": "success", "message": "System alerts and warning log reset."})

@app.route('/api/trigger_music', methods=['POST'])
def api_trigger_music():
    """Run the music callback attached to ``app``, if one has been attached."""
    callback = getattr(app, 'play_music_callback', None)
    if not callback:
        return jsonify({"status": "error", "message": "Music callback not configured."})

    callback()
    return jsonify({"status": "success", "message": "Playing energetic synthwave music!"})

def start_server_async():
    """Start the Flask development server on a daemon thread and return immediately."""
    # Only show werkzeug errors so the terminal stays readable.
    logging.getLogger('werkzeug').setLevel(logging.ERROR)

    def _serve():
        app.run(host=FLASK_HOST, port=FLASK_PORT, debug=False, use_reloader=False)

    threading.Thread(target=_serve, daemon=True).start()
    print(f"[Flask Server] Running in background at http://{FLASK_HOST}:{FLASK_PORT}")

# 3. AlertManager — Programmatic Sound Synthesis & Multi-Threaded Audio
class AlertManager:
    """Synthesises alert sounds and serialises spoken warnings on a worker thread.

    Sound effects are WAV files generated at start-up and played through the
    pygame mixer. Speech requests are queued by ``speak`` and consumed one at a
    time by a daemon thread that shells out to PowerShell's
    ``System.Speech`` synthesizer. ``is_speaking`` is True while an utterance
    is being processed; the voice assistant polls it to avoid listening to the
    system's own voice.
    """

    # Name of the environment variable used to hand the utterance to the
    # PowerShell child process (see _speech_worker).
    _TTS_TEXT_ENV = "DRIVESAFE_TTS_TEXT"

    def __init__(self):
        """Create audio assets, initialise the mixer and start the speech worker."""
        # Ensure directories exist
        os.makedirs("audio", exist_ok=True)

        # Programmatically synthesize our warning and chime audio files
        self._synthesize_audio_assets()

        # Initialize Pygame Mixer for non-blocking SFX playback
        pygame.mixer.init()

        # Audio file paths
        self.calm_beep_path = os.path.join("audio", "calm_beep.wav")
        self.urgent_beep_path = os.path.join("audio", "urgent_beep.wav")

        # Thread-safe speech queue & worker setup
        self.speech_queue = queue.Queue()
        self.is_speaking = False
        self.speech_thread = threading.Thread(target=self._speech_worker, daemon=True)
        self.speech_thread.start()

    def _synthesize_audio_assets(self):
        """Write ``audio/calm_beep.wav`` and ``audio/urgent_beep.wav`` (16-bit, 44.1 kHz)."""
        sample_rate = 44100

        # 1. Calm chime: a 550 Hz sine wave with an exponential decay envelope.
        duration = 0.4
        t = np.linspace(0, duration, int(sample_rate * duration), False)
        tone = np.sin(2 * np.pi * 550 * t) * np.exp(-5 * t)
        calm_data = (tone * 20000).astype(np.int16)
        wavfile.write(os.path.join("audio", "calm_beep.wav"), sample_rate, calm_data)

        # 2. Urgent beep: three 1200 Hz bursts, each followed by a short silence.
        burst_duration = 0.08
        gap_duration = 0.05
        t_burst = np.linspace(0, burst_duration, int(sample_rate * burst_duration), False)
        burst = np.sin(2 * np.pi * 1200 * t_burst) * 32000
        gap = np.zeros(int(sample_rate * gap_duration))

        # Assemble in NumPy rather than extending a Python list sample by sample.
        urgent_np = np.concatenate([burst, gap] * 3).astype(np.int16)
        wavfile.write(os.path.join("audio", "urgent_beep.wav"), sample_rate, urgent_np)

    @staticmethod
    def _build_speech_command(volume, rate):
        """Return the PowerShell script that speaks the text held in the environment.

        Args:
            volume: Loudness from 0.0 to 1.0; mapped to 0-100 and clamped to
                that range.
            rate: Words-per-minute style rate; above 180 maps to PowerShell
                rate 2, below 150 to -2, anything else to 0.

        The utterance itself is deliberately NOT part of the script: it is
        read from ``$env:DRIVESAFE_TTS_TEXT`` so that recognised speech or
        model output can never be interpreted as PowerShell code.
        """
        if rate > 180:
            ps_rate = 2
        elif rate < 150:
            ps_rate = -2
        else:
            ps_rate = 0

        ps_volume = max(0, min(100, int(volume * 100)))

        return (
            "Add-Type -AssemblyName System.Speech; "
            "$speak = New-Object System.Speech.Synthesis.SpeechSynthesizer; "
            f"$speak.Rate = {ps_rate}; "
            f"$speak.Volume = {ps_volume}; "
            "$speak.Speak($env:DRIVESAFE_TTS_TEXT)"
        )

    def _speech_worker(self):
        """Consume the speech queue forever, speaking one utterance at a time.

        Each utterance runs synchronously in a PowerShell child process so
        that speech stays sequential. Failures are logged and the worker keeps
        going; ``task_done`` is always called so ``Queue.join`` cannot hang.
        """
        print("[AlertManager] Speech worker thread active.")
        import subprocess
        while True:
            # Blocks until an item is available
            item = self.speech_queue.get()
            self.is_speaking = True
            try:
                text, volume, rate = item
                ps_command = self._build_speech_command(volume, rate)

                # Pass the text out-of-band instead of splicing it into the script.
                child_env = dict(os.environ)
                child_env[self._TTS_TEXT_ENV] = str(text)

                subprocess.run(
                    ["powershell", "-NoProfile", "-ExecutionPolicy", "Bypass", "-Command", ps_command],
                    stdout=subprocess.DEVNULL,
                    stderr=subprocess.DEVNULL,
                    env=child_env
                )
            except Exception as e:
                # Best-effort: a failed utterance must not kill the worker.
                print(f"[AlertManager] Speech worker exception: {e}")
                time.sleep(0.5)
            finally:
                self.is_speaking = False
                self.speech_queue.task_done()

    def speak(self, text, volume=0.8, rate=170):
        """Enqueues a text string to be spoken in the background thread."""
        self.speech_queue.put((text, volume, rate))

    def trigger_level1(self):
        """Level 1 Alert (3-5s closed): Soft chime, then calm voice."""
        print("[AlertManager] Triggering Level 1 Alert: Calm Stay Focused")
        pygame.mixer.Sound(self.calm_beep_path).play()
        self.speak("Stay focused on the road", volume=0.7, rate=160)

    def trigger_level2(self):
        """Level 2 Alert (>5s closed): Loud siren beep, then loud voice."""
        print("[AlertManager] Triggering Level 2 Alert: Loud WAKE UP!")
        pygame.mixer.Sound(self.urgent_beep_path).play()
        self.speak("Wake up! Stay focused on the road!", volume=1.0, rate=190)

    def trigger_level3_advisory(self):
        """Level 3 Alert (Frequent drowsiness): Ask to take a rest break on the side."""
        print("[AlertManager] Triggering Level 3 Alert: Rest break advisory")
        pygame.mixer.Sound(self.urgent_beep_path).play()
        self.speak("You are getting drowsy frequently. Please pull over on the side and take a rest.", volume=0.9, rate=170)

    def ask_energetic_song(self):
        """Ask the driver if they want to listen to an energetic song."""
        print("[AlertManager] Querying driver for energetic song")
        self.speak("Alright. Would you like to listen to an energetic song to help you stay awake?", volume=0.85, rate=170)

    def play_energetic_music(self):
        """Announce the playlist and open ENERGETIC_MUSIC_URL in the web browser."""
        print("[AlertManager] Playing energetic music")
        self.speak("Playing some high energy synthwave beats. Turn it up and stay alert!", volume=0.9, rate=170)
        webbrowser.open(ENERGETIC_MUSIC_URL)


# 4. EyeDetector — 2x Downsampling dlib Eye Landmark Processor with Fallback

class EyeDetector:
    """Finds eye landmarks in camera frames and derives the Eye Aspect Ratio."""

    def __init__(self):
        # Frames are shrunk by this factor before the first detection attempt.
        self.scale_factor = 2
        # Timestamp of the last "no face" console warning (for throttling).
        self.last_warning_time = 0

    def _calculate_ear(self, eye_points):
        """Return the Eye Aspect Ratio for one eye given its first six (x, y) points.

        EAR = (|p2 - p6| + |p3 - p5|) / (2 * |p1 - p4|); 0.0 when the eye has
        zero horizontal extent.
        """
        p1, p2, p3, p4, p5, p6 = (np.array(eye_points[i]) for i in range(6))

        eye_width = np.linalg.norm(p1 - p4)
        if eye_width == 0:
            return 0.0

        lid_gaps = np.linalg.norm(p2 - p6) + np.linalg.norm(p3 - p5)
        return lid_gaps / (2.0 * eye_width)

    def process_frame(self, frame):
        """Detect the first face in a BGR frame and measure its average EAR.

        Detection is tried on a downscaled copy first and repeated on the
        full-resolution frame when that finds nothing.

        Returns:
            ``(avg_ear, landmarks, debug_frame)`` — ``avg_ear`` is None when no
            face or no complete pair of eyes was found, ``landmarks`` is the
            first face's landmark dict or None, and ``debug_frame`` is an
            annotated copy of the input.
        """
        height, width, _ = frame.shape
        debug_frame = frame.copy()

        # Fast path: run the landmark detector on a shrunken RGB copy.
        shrink = 1.0 / self.scale_factor
        small_frame = cv2.resize(frame, (0, 0), fx=shrink, fy=shrink)
        faces = face_recognition.face_landmarks(cv2.cvtColor(small_frame, cv2.COLOR_BGR2RGB))
        scale = self.scale_factor

        # Slow path: nothing found, retry at full resolution.
        if not faces:
            faces = face_recognition.face_landmarks(cv2.cvtColor(frame, cv2.COLOR_BGR2RGB))
            scale = 1

        if not faces:
            # Throttled console warning plus an on-screen notice.
            now = time.time()
            if now - self.last_warning_time > 2.5:
                print("[EyeDetector] WARNING: No face detected in camera stream! Adjust position or lighting.")
                self.last_warning_time = now

            cv2.putText(debug_frame, "NO FACE DETECTED", (width // 2 - 120, height // 2),
                        cv2.FONT_HERSHEY_SIMPLEX, 0.7, (0, 0, 255), 2)
            cv2.putText(debug_frame, "Adjust Camera / Lighting", (width // 2 - 140, height // 2 + 30),
                        cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 165, 255), 1)
            return None, None, debug_frame

        landmarks = faces[0]
        left_raw = landmarks.get('left_eye', [])
        right_raw = landmarks.get('right_eye', [])
        if len(left_raw) != 6 or len(right_raw) != 6:
            return None, landmarks, debug_frame

        # Map landmark coordinates back onto the original frame.
        left_eye = [(int(x * scale), int(y * scale)) for (x, y) in left_raw]
        right_eye = [(int(x * scale), int(y * scale)) for (x, y) in right_raw]

        avg_ear = (self._calculate_ear(left_eye) + self._calculate_ear(right_eye)) / 2.0
        self._draw_eye_hud(debug_frame, left_eye, right_eye, avg_ear)
        return avg_ear, landmarks, debug_frame

    def _draw_eye_hud(self, frame, left_eye, right_eye, ear):
        """Outline both eyes on ``frame`` and print the EAR value when available."""
        eyes_closed = ear is not None and ear < EAR_THRESHOLD
        if eyes_closed:
            color, thickness = (0, 0, 255), 2   # red: closed / drowsy
        else:
            color, thickness = (0, 255, 0), 1   # green: open / safe

        for eye in (left_eye, right_eye):
            outline = np.array(eye, np.int32)
            cv2.polylines(frame, [outline], True, color, thickness)

        for (x, y) in left_eye + right_eye:
            cv2.circle(frame, (x, y), 2, (255, 255, 0), -1)

        if ear is not None:
            cv2.putText(frame, f"EAR: {ear:.2f}", (30, 40), cv2.FONT_HERSHEY_SIMPLEX, 0.7, color, 2)


# 5. VoiceAssistant — Dynamic Action Router & Background Speech Recognition

class VoiceAssistant:
    """Background microphone listener that routes recognised speech to actions.

    Recognised text is handled in this order:
      1. replies to a pending rest / song prompt (depends on the system state),
      2. local commands (reset, play music, stop music),
      3. the local Ollama model, whose reply may carry a ``[PLAY]``, ``[STOP]``
         or ``[RESET]`` action tag.

    ``state_callbacks`` is a dict providing ``get_system_state``,
    ``set_system_state``, ``reset_warnings`` and ``add_chat_log``.
    """

    # Reply vocabularies. They are matched as whole words/phrases so that
    # "no" does not fire on "know" and "hi" does not fire on "this".
    _STRONG_REFUSALS = ("no", "nope", "not", "never", "can't", "wont", "won't", "refuse",
                        "impossible", "no thanks", "no rest", "keep driving")
    # "I'm fine" / "I'm good" decline a rest, but only when nothing in the
    # sentence says yes ("good idea, I'll pull over" must count as acceptance).
    _WEAK_REFUSALS = ("fine", "good")
    _REST_ACCEPTS = ("yes", "yeah", "ok", "okay", "fine i will", "sure", "pulling over")
    _SONG_ACCEPTS = ("yes", "yeah", "sure", "ok", "okay", "play", "song", "songs", "music", "please")
    _SONG_DECLINES = ("no", "nope", "not", "never", "don't", "nah")

    # "listen to" is listed before "listen" so the longer phrase wins.
    _PLAY_PATTERN = re.compile(r"\b(?:play|start|turn on|listen to|listen|put on|launch)\b")
    _QUERY_FILLERS = frozenset({"some", "a", "the", "music", "song", "track", "musc"})
    _GENERIC_QUERIES = frozenset({"music", "song", "beat", "tune", "track", "musc", "melody"})
    _MUSIC_KEYWORDS = ("music", "song", "beat", "tune", "track", "musc", "melody", "audio", "lofi")
    _STOP_PHRASES = ("stop", "pause", "turn off", "mute", "quiet", "halt", "shut up")

    def __init__(self, alert_manager, state_callbacks):
        """Configure the recognizer and start the listening thread."""
        self.alert_manager = alert_manager
        self.callbacks = state_callbacks

        self.recognizer = sr.Recognizer()
        self.recognizer.energy_threshold = 4000
        self.recognizer.dynamic_energy_threshold = True

        self.running = True
        self.thread = threading.Thread(target=self._assistant_loop, daemon=True)
        self.thread.start()

    # ------------------------------------------------------------------
    # Pure text helpers
    # ------------------------------------------------------------------

    @staticmethod
    def _mentions(text, phrases):
        """Return True when any of ``phrases`` occurs in ``text`` as whole word(s)."""
        return any(
            re.search(r"\b" + re.escape(phrase) + r"\b", text) is not None
            for phrase in phrases
        )

    @classmethod
    def _classify_rest_reply(cls, cleaned_text):
        """Classify a reply to the rest advisory.

        Returns ``"refused"``, ``"accepted"`` or ``None`` (no decision). An
        explicit negative always wins; "fine"/"good" only count as a refusal
        when the sentence contains no acceptance.
        """
        if cls._mentions(cleaned_text, cls._STRONG_REFUSALS):
            return "refused"
        # "pull" is kept as a stem on purpose ("pull over", "pulling in").
        if cls._mentions(cleaned_text, cls._REST_ACCEPTS) or "pull" in cleaned_text:
            return "accepted"
        if cls._mentions(cleaned_text, cls._WEAK_REFUSALS):
            return "refused"
        return None

    @classmethod
    def _extract_music_query(cls, cleaned_text):
        """Return what the driver asked to play.

        Returns ``None`` when the text holds no play command, otherwise the
        words following the first play keyword with leading/trailing filler
        words removed (possibly an empty string for "play some music").
        Fillers are removed as whole words, so "play adele" stays "adele".
        """
        match = cls._PLAY_PATTERN.search(cleaned_text)
        if match is None:
            return None

        words = [w.strip(".,!?;:") for w in cleaned_text[match.end():].split()]
        words = [w for w in words if w]
        while words and words[0] in cls._QUERY_FILLERS:
            words.pop(0)
        while words and words[-1] in cls._QUERY_FILLERS:
            words.pop()
        return " ".join(words)

    # ------------------------------------------------------------------
    # Side-effect helpers shared by the local and SLM-driven paths
    # ------------------------------------------------------------------

    def _autoplay_youtube(self, music_query):
        """Open the first YouTube search hit for ``music_query`` in the browser.

        Falls back to opening the search results page when no video id is
        found or the lookup fails.
        """
        search_url = f"https://www.youtube.com/results?search_query={urllib.parse.quote(music_query)}"
        headers = {'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64)'}
        try:
            req = urllib.request.Request(search_url, headers=headers)
            with urllib.request.urlopen(req, timeout=5) as res:
                html = res.read().decode('utf-8')
                # Search for video watch paths
                video_ids = re.findall(r'/watch\?v=([a-zA-Z0-9_-]{11})', html)
                if video_ids:
                    first_video_id = video_ids[0]
                    direct_url = f"https://www.youtube.com/watch?v={first_video_id}&autoplay=1"
                    print(f"[VoiceAssistant] Auto-playing first matching YouTube video: {direct_url}")
                    webbrowser.open(direct_url)
                else:
                    webbrowser.open(search_url)
        except Exception as e:
            print(f"[VoiceAssistant] Autoplay scraper failed: {e}. Falling back to search page.")
            webbrowser.open(search_url)

    @staticmethod
    def _press_media_play_pause():
        """Simulate the media play/pause key through the Windows user32 API.

        Any failure (for example when ``ctypes.windll`` is unavailable) is
        logged and ignored.
        """
        import ctypes
        VK_MEDIA_PLAY_PAUSE = 0xB3
        try:
            ctypes.windll.user32.keybd_event(VK_MEDIA_PLAY_PAUSE, 0, 0, 0)
            ctypes.windll.user32.keybd_event(VK_MEDIA_PLAY_PAUSE, 0, 2, 0)
        except Exception as e:
            print(f"[VoiceAssistant] Failed simulating media key: {e}")

    def _play_specific(self, text, music_query):
        """Announce and start playback of a specific song request."""
        confirm_msg = f"Sure thing! Autoplay in progress for {music_query}."
        self.callbacks['add_chat_log'](text, confirm_msg)
        self.alert_manager.speak(confirm_msg)
        self._autoplay_youtube(music_query)
        self.callbacks['set_system_state']("PLAYING_MUSIC")

    def _play_playlist(self, text):
        """Start the default energetic playlist."""
        self.callbacks['add_chat_log'](text, "Requested general music playback")
        self.alert_manager.play_energetic_music()
        self.callbacks['set_system_state']("PLAYING_MUSIC")

    # ------------------------------------------------------------------
    # Ollama
    # ------------------------------------------------------------------

    def query_ollama_slm(self, prompt):
        """Send ``prompt`` to the local Ollama model and return its cleaned reply.

        Double quotes and asterisks are removed from the reply. When the
        request fails for any reason a canned fallback sentence is returned
        instead, so this method does not raise for network errors.
        """
        payload = {
            "model": OLLAMA_MODEL,
            "prompt": prompt,
            "stream": False
        }
        headers = {"Content-Type": "application/json"}

        try:
            req = urllib.request.Request(
                OLLAMA_API_URL,
                data=json.dumps(payload).encode("utf-8"),
                headers=headers,
                method="POST"
            )
            # Use a 10-second timeout to accommodate initial Ollama cold start weight loading
            with urllib.request.urlopen(req, timeout=10) as response:
                res_data = json.loads(response.read().decode("utf-8"))
                reply = res_data.get("response", "").strip()
                # Clean up any quotes or markdown from the SLM
                reply = reply.replace('"', '').replace('*', '').strip()
                return reply
        except Exception as e:
            # Deliberate best-effort boundary: the assistant must keep talking
            # even when the model is unreachable.
            print(f"[Ollama SLM] Error or timeout querying local model: {e}")
            lower_prompt = prompt.lower()
            # Whole-word match: a plain substring test for "hi" also fires on
            # "this", "which", "something", ...
            if self._mentions(lower_prompt, ("hello", "hi")):
                return "Hello! I am here. Eyes on the road, friend."
            elif "joke" in lower_prompt:
                return "Why did the scarecrow win an award? Because he was outstanding in his field. Stay alert!"
            else:
                return "Understood. Keep driving safely, stay focused on the road."

    # ------------------------------------------------------------------
    # Listening loop
    # ------------------------------------------------------------------

    def _assistant_loop(self):
        """Listen on the microphone until ``stop`` is called.

        Capture is skipped while the alert manager is speaking. Each captured
        phrase is recognised on its own daemon thread so the microphone loop
        is not blocked by recognition.
        """
        print("[VoiceAssistant] Speech recognizer thread started.")

        try:
            mic = sr.Microphone()
        except Exception as e:
            print(f"[VoiceAssistant] Error accessing microphone: {e}. Voice controls disabled.")
            return

        with mic as source:
            print("[VoiceAssistant] Calibrating microphone for driving background noise...")
            self.recognizer.adjust_for_ambient_noise(source, duration=2)
            print("[VoiceAssistant] Calibration complete. Ready for voice interaction.")

            while self.running:
                if self.alert_manager.is_speaking:
                    time.sleep(0.3)
                    continue

                try:
                    audio = self.recognizer.listen(source, timeout=1.5, phrase_time_limit=4.0)
                except sr.WaitTimeoutError:
                    continue
                except Exception as e:
                    print(f"[VoiceAssistant] Microphone capture error: {e}")
                    time.sleep(0.5)
                    continue

                # Discard audio captured while the system itself started talking.
                if self.alert_manager.is_speaking:
                    continue

                # Run speech recognition in a separate thread to keep mic pipeline responsive
                threading.Thread(target=self._process_audio, args=(audio,), daemon=True).start()

    # ------------------------------------------------------------------
    # Routing
    # ------------------------------------------------------------------

    def _process_audio(self, audio):
        """Recognise ``audio`` and dispatch the resulting text.

        Google recognition is tried first; on a request error the local
        Whisper model is used. Unintelligible or empty audio is dropped.
        """
        try:
            text = self.recognizer.recognize_google(audio)
            print(f"[Driver Heard] {text}")
        except sr.UnknownValueError:
            return
        except sr.RequestError:
            try:
                print("[VoiceAssistant] Cloud Speech API unavailable. Attempting local Whisper...")
                text = self.recognizer.recognize_whisper(audio, model="base.en")
                print(f"[Driver Heard (Whisper)] {text}")
            except Exception as e:
                print(f"[VoiceAssistant] Offline recognition failed: {e}")
                return

        cleaned_text = text.strip().lower()
        if not cleaned_text:
            return

        current_state = self.callbacks['get_system_state']()
        if self._handle_prompt_reply(text, cleaned_text, current_state):
            return
        if self._handle_local_command(text, cleaned_text):
            return
        self._handle_slm_reply(text)

    def _handle_prompt_reply(self, text, cleaned_text, current_state):
        """Handle a reply to a pending rest/song prompt; return True if consumed."""
        # 1. State: Driver has been warned of frequent drowsiness (Level 3 Advisory)
        if current_state == "WAITING_REST_RESPONSE":
            decision = self._classify_rest_reply(cleaned_text)

            if decision == "refused":
                print("[VoiceAssistant] Driver refused rest. Prompting for energetic song.")
                self.callbacks['set_system_state']("WAITING_SONG_RESPONSE")
                self.callbacks['add_chat_log'](text, "No, I'm fine. I won't stop.")

                time.sleep(0.5)
                self.alert_manager.ask_energetic_song()
                self.callbacks['add_chat_log']("System", "Alright. Would you like to listen to an energetic song to help you stay awake?")
                return True

            if decision == "accepted":
                print("[VoiceAssistant] Driver accepted rest.")
                self.callbacks['reset_warnings']()
                self.callbacks['add_chat_log'](text, "Okay, pulling over.")
                self.alert_manager.speak("Good decision. Pull over safely and take some rest.")
                self.callbacks['add_chat_log']("System", "Good decision. Pull over safely and take some rest.")
                return True

            # No clear answer: let the normal command routing have the text.
            return False

        # 2. State: Driver refused rest, now confirming if they want a song
        if current_state == "WAITING_SONG_RESPONSE":
            # A negative anywhere in the sentence wins ("don't play music").
            wants_song = (
                self._mentions(cleaned_text, self._SONG_ACCEPTS)
                and not self._mentions(cleaned_text, self._SONG_DECLINES)
            )
            if wants_song:
                print("[VoiceAssistant] Driver accepted song.")
                self.callbacks['add_chat_log'](text, "Yes, play some music.")
                self.alert_manager.play_energetic_music()
                self.callbacks['add_chat_log']("System", "Playing energetic synthwave beats! Stay awake!")
                self.callbacks['set_system_state']("PLAYING_MUSIC")
            else:
                print("[VoiceAssistant] Driver declined song.")
                self.callbacks['add_chat_log'](text, "No, I'm okay.")
                self.alert_manager.speak("Understood. Keep your eyes on the road. Stay focused.")
                self.callbacks['add_chat_log']("System", "Understood. Keep your eyes on the road. Stay focused.")
                self.callbacks['reset_warnings']()
            return True

        return False

    def _handle_local_command(self, text, cleaned_text):
        """Handle reset / play / stop commands locally; return True if consumed."""
        # Reset keywords are matched as stems ("resetting", "cleared").
        if "reset" in cleaned_text or "clear" in cleaned_text or "awake" in cleaned_text or "focused" in cleaned_text:
            print("[VoiceAssistant] Safe state reset command received.")
            self.callbacks['reset_warnings']()
            self.callbacks['add_chat_log'](text, "Reset assistant")
            self.alert_manager.speak("System reset. Let's keep driving safely.")
            self.callbacks['add_chat_log']("System", "System reset. Let's keep driving safely.")
            return True

        music_query = self._extract_music_query(cleaned_text)
        if music_query is not None:
            # If the remaining query is empty or generic, play the custom playlist
            if not music_query or music_query in self._GENERIC_QUERIES:
                print("[VoiceAssistant] General music command recognized locally. Playing playlist.")
                self._play_playlist(text)
            else:
                print(f"[VoiceAssistant] Specific song command recognized locally: {music_query}")
                self._play_specific(text, music_query)
            return True

        has_music_kw = any(kw in cleaned_text for kw in self._MUSIC_KEYWORDS)
        has_stop = any(s in cleaned_text for s in self._STOP_PHRASES)
        if has_stop and (has_music_kw or "sound" in cleaned_text or "radio" in cleaned_text):
            print("[VoiceAssistant] Flexible stop music command recognized.")
            self._press_media_play_pause()

            self.callbacks['set_system_state']("NORMAL")
            self.callbacks['add_chat_log'](text, "Stop the music")
            self.alert_manager.speak("Stopping the music. Keep your eyes on the road.")
            self.callbacks['add_chat_log']("System", "Music stopped.")
            return True

        return False

    def _handle_slm_reply(self, text):
        """Ask the local model about ``text`` and act on its reply or action tag."""
        print(f"[Ollama Query] {text}")
        reply = self.query_ollama_slm(text)
        print(f"[SLM Reply] {reply}")
        lowered_reply = reply.lower()

        # Dynamic PLAY action tag (e.g. "[PLAY] paint it black")
        if "[play]" in lowered_reply:
            match = re.search(r'\[play\]\s*(.*)', reply, re.IGNORECASE)
            if match:
                music_query = match.group(1).strip()
                music_query = music_query.replace('"', '').replace('[', '').replace(']', '').strip()
                if music_query:
                    self._play_specific(text, music_query)
                else:
                    # Tag without a title: play the default playlist rather
                    # than searching for an empty string.
                    self._play_playlist(text)
                return

        # Dynamic STOP action tag (e.g. "[STOP]")
        if "[stop]" in lowered_reply:
            match = re.search(r'\[stop\]\s*(.*)', reply, re.IGNORECASE)
            clean_reply = match.group(1) if match else ""
            clean_reply = clean_reply.replace('[', '').replace(']', '').strip()
            # A bare tag carries no sentence; speak the default instead of "".
            clean_reply = clean_reply or "Stopping the music. Keep your eyes on the road!"

            print("[VoiceAssistant] Action STOP triggered dynamically by Ollama.")
            self._press_media_play_pause()

            self.callbacks['set_system_state']("NORMAL")
            self.callbacks['add_chat_log'](text, clean_reply)
            self.alert_manager.speak(clean_reply)
            return

        # Dynamic RESET action tag (e.g. "[RESET]")
        if "[reset]" in lowered_reply:
            match = re.search(r'\[reset\]\s*(.*)', reply, re.IGNORECASE)
            clean_reply = match.group(1) if match else ""
            clean_reply = clean_reply.replace('[', '').replace(']', '').strip()
            clean_reply = clean_reply or "System warnings cleared. Drive safely!"

            print("[VoiceAssistant] Action RESET triggered dynamically by Ollama.")
            self.callbacks['reset_warnings']()
            self.callbacks['add_chat_log'](text, clean_reply)
            self.alert_manager.speak(clean_reply)
            return

        # General conversational response
        self.callbacks['add_chat_log'](text, reply)
        self.alert_manager.speak(reply)

    def stop(self):
        """Ask the listening loop to exit after its current iteration."""
        self.running = False


# 6. SafeDrivingAssistant Core Engine & Orchestrator Coordinator

class SafeDrivingAssistant:
    """Coordinator that turns camera frames into drowsiness alerts and telemetry.

    Per-frame flow (see run()): grab or synthesize a frame, obtain an Eye
    Aspect Ratio (EAR), feed it to the eye-closure timer, then publish the
    annotated frame, EAR and FPS to the shared ``dashboard_state``.

    Alert ladder, driven by how long the eyes stay closed:
      * Level 1 -- closed for ALERT_LEVEL1_MIN up to ALERT_LEVEL1_MAX seconds.
      * Level 2 -- closed for ALERT_LEVEL2_MIN seconds or more.
      * Level 3 -- on reopening, at least FREQUENT_DROWSY_LIMIT alerts were
        recorded within the last FREQUENT_DROWSY_WINDOW seconds.
    """

    # Dashboard banner text applied by set_system_state(). States missing
    # from this table (e.g. "CLOSED_3S") leave the current banner untouched.
    _STATE_ALERT_MESSAGES = {
        "NORMAL": "",
        "WAITING_REST_RESPONSE": "ADVISING REST BREAK",
        "WAITING_SONG_RESPONSE": "OFFERING ENERGETIC MUSIC",
        "PLAYING_MUSIC": "PLAYING HIGH ENERGY BEATS",
    }

    # States that eye reopening must not overwrite with "NORMAL"
    # (presumably a driver reply is still pending -- confirm against VoiceAssistant).
    _AWAITING_REPLY_STATES = ("WAITING_REST_RESPONSE", "WAITING_SONG_RESPONSE")

    def __init__(self):
        """Build every subsystem and kick off the background services.

        Side effects visible here: constructs AlertManager, EyeDetector and
        VoiceAssistant, registers two callbacks on the module-level ``app``
        object, and calls start_server_async().
        """
        print("[CoreEngine] Initializing Safe Driving Assistant...")

        # Audio alerts and spoken output.
        self.alert_manager = AlertManager()

        # Eye landmark processor that yields the EAR for each frame.
        self.detector = EyeDetector()

        # Eye-closure tracking for the current episode.
        self.consec_closed_frames = 0
        self.eyes_closed_start_time = None
        self.active_alert_level = 0  # 0: None, 1: Stay Focused, 2: Wake Up Loud

        # Timestamps of Level 1/2 alerts, pruned to FREQUENT_DROWSY_WINDOW.
        self.drowsiness_events = collections.deque()

        # Keyboard reset helper (not read anywhere inside this class).
        self.last_key_press = None

        # Hooks handed to the voice assistant so it can read and drive system state.
        self.callbacks = {
            'get_system_state': self.get_system_state,
            'set_system_state': self.set_system_state,
            'reset_warnings': self.reset_warnings,
            'add_chat_log': self.add_chat_log
        }

        # Expose reset / music actions to the web layer through attributes on ``app``.
        app.reset_callback = self.reset_warnings
        app.play_music_callback = self.play_energetic_music

        # Speech listener.
        self.assistant = VoiceAssistant(self.alert_manager, self.callbacks)

        # Web dashboard server.
        start_server_async()

    # Coordinator Callback Handlers

    def get_system_state(self):
        """Return ``dashboard_state.state``, read while holding its lock."""
        with dashboard_state.lock:
            return dashboard_state.state

    def set_system_state(self, new_state):
        """Store ``new_state`` on the dashboard and refresh the alert banner.

        The banner is only rewritten for states listed in
        ``_STATE_ALERT_MESSAGES``; any other state keeps the previous text.
        Both writes happen under ``dashboard_state.lock``.
        """
        with dashboard_state.lock:
            dashboard_state.state = new_state
            if new_state in self._STATE_ALERT_MESSAGES:
                dashboard_state.alert_message = self._STATE_ALERT_MESSAGES[new_state]

    def reset_warnings(self):
        """Clear every alarm, timer and counter and return the state to NORMAL."""
        print("[CoreEngine] Performing comprehensive system alert reset.")
        with dashboard_state.lock:
            dashboard_state.state = "NORMAL"
            dashboard_state.alert_message = ""
            dashboard_state.drowsiness_count = 0
        self.consec_closed_frames = 0
        self.eyes_closed_start_time = None
        self.active_alert_level = 0
        self.drowsiness_events.clear()

        # Leave a trace of the reset in the dashboard log.
        self.add_chat_log("System", "System alerts and warnings reset to NORMAL.")

    def add_chat_log(self, user_query, slm_reply=""):
        """Append one entry to ``dashboard_state.chat_history``.

        Args:
            user_query: The driver's transcript, or the literal "System" to
                record a system notice instead of a driver exchange.
            slm_reply: Reply text (or, for system notices, the notice itself).
        """
        if user_query == "System":
            entry = {
                "speaker": "System",
                "message": slm_reply
            }
        else:
            entry = {
                "speaker": "Driver",
                "query": user_query,
                "message": slm_reply
            }
        with dashboard_state.lock:
            dashboard_state.chat_history.append(entry)

    def play_energetic_music(self):
        """Switch to PLAYING_MUSIC, start playback and log the event."""
        self.set_system_state("PLAYING_MUSIC")
        self.alert_manager.play_energetic_music()
        self.add_chat_log("System", "Energetic synthwave music started. Stay alert!")

    # Simulation helpers (used when no physical camera can be opened)

    @staticmethod
    def _render_simulation_frame(current_time):
        """Return a synthetic black frame with a scrolling scan line and caption."""
        frame = np.zeros((FRAME_HEIGHT, FRAME_WIDTH, 3), dtype=np.uint8)
        # The scan line position is derived from wall-clock time, so it scrolls.
        scan_y = int(current_time * 120) % FRAME_HEIGHT
        cv2.line(frame, (0, scan_y), (FRAME_WIDTH, scan_y), (40, 40, 40), 2)
        cv2.putText(frame, "CLOUD SIMULATION FEED (NO PHYSICAL CAM)", (20, FRAME_HEIGHT - 20),
                    cv2.FONT_HERSHEY_SIMPLEX, 0.4, (0, 255, 0), 1)
        return frame

    @staticmethod
    def _simulate_detection(frame, current_time):
        """Fake an EAR reading and draw placeholder eye markers.

        Within every 25-second cycle, seconds 19-24 (six seconds) report a
        closed-eye EAR of 0.16; the rest report an open-eye EAR of 0.28.

        Returns:
            (ear, annotated_frame)
        """
        cycle = int(current_time) % 25
        if cycle > 18:
            ear = 0.16
            cv2.putText(frame, "SIMULATING DROWSINESS (EYES CLOSED)", (FRAME_WIDTH // 2 - 180, FRAME_HEIGHT // 2),
                        cv2.FONT_HERSHEY_SIMPLEX, 0.6, (0, 0, 255), 2)
        else:
            ear = 0.28

        annotated = frame.copy()
        # Green while the simulated eyes count as open, red otherwise.
        color = (0, 255, 0) if ear > EAR_THRESHOLD else (0, 0, 255)
        eye_y = int(FRAME_HEIGHT * 0.45)
        for x_ratio in (0.4, 0.6):
            cv2.circle(annotated, (int(FRAME_WIDTH * x_ratio), eye_y), 8, color, -1)
        cv2.putText(annotated, f"EAR: {ear:.2f}", (30, 40), cv2.FONT_HERSHEY_SIMPLEX, 0.7, color, 2)
        return ear, annotated

    # Core Drowsiness Evaluation & Loop

    def _raise_closure_alert(self, level, state, trigger, log_message, current_time):
        """Fire one Level 1/2 alert and record it for the frequency check."""
        self.active_alert_level = level
        self.set_system_state(state)
        trigger()

        # Record the timestamp in the sliding frequency tracker.
        self.drowsiness_events.append(current_time)
        with dashboard_state.lock:
            dashboard_state.drowsiness_count += 1

        self.add_chat_log("System", log_message)

    def _update_drowsiness_state(self, ear, current_time):
        """Advance the eye-closure timer with one EAR sample.

        Args:
            ear: Eye Aspect Ratio for the current frame (must not be None).
            current_time: ``time.time()`` value captured for this frame.
        """
        if ear < EAR_THRESHOLD:
            self.consec_closed_frames += 1

            # Ignore closures shorter than the noise filter.
            if self.consec_closed_frames < EAR_CONSEC_FRAMES:
                return

            if self.eyes_closed_start_time is None:
                self.eyes_closed_start_time = current_time
                return

            closed_duration = current_time - self.eyes_closed_start_time

            # LEVEL 1: eyes closed for the Level 1 duration band.
            if ALERT_LEVEL1_MIN <= closed_duration < ALERT_LEVEL1_MAX:
                if self.active_alert_level < 1:
                    self._raise_closure_alert(
                        1, "CLOSED_3S", self.alert_manager.trigger_level1,
                        "WARNING: Eyes closed for 3 seconds! Stay focused!",
                        current_time)
            # LEVEL 2: eyes closed beyond the Level 2 threshold (louder warning).
            elif closed_duration >= ALERT_LEVEL2_MIN:
                if self.active_alert_level < 2:
                    self._raise_closure_alert(
                        2, "CLOSED_5S", self.alert_manager.trigger_level2,
                        "CRITICAL ALARM: Eyes closed for 5+ seconds! WAKE UP!",
                        current_time)
            return

        # Eyes are open: reset the noise filter.
        self.consec_closed_frames = 0

        if self.eyes_closed_start_time is None:
            return  # No closure episode was in progress.

        # A closure episode just ended.
        self.eyes_closed_start_time = None
        # Always re-arm the Level 1/2 alarms for the next episode. Previously
        # the level was only cleared on the "normal recovery" path, so after a
        # Level 3 escalation (or while a WAITING_* state was pending) the next
        # closure raised no alarm at all.
        self.active_alert_level = 0

        # Drop alerts that have aged out of the sliding window.
        while self.drowsiness_events and (current_time - self.drowsiness_events[0] > FREQUENT_DROWSY_WINDOW):
            self.drowsiness_events.popleft()

        # LEVEL 3: too many alerts inside the window -> advise a break.
        if len(self.drowsiness_events) >= FREQUENT_DROWSY_LIMIT:
            print(f"[CoreEngine] Frequent drowsiness detected ({len(self.drowsiness_events)} events in 60s). Escalating to Level 3.")
            self.set_system_state("WAITING_REST_RESPONSE")
            self.alert_manager.trigger_level3_advisory()
            self.add_chat_log("System", "FREQUENT DROWSINESS DETECTED. Prompting driver to pull over.")
        elif self.get_system_state() not in self._AWAITING_REPLY_STATES:
            # Normal recovery.
            self.set_system_state("NORMAL")

    def run(self):
        """Run the blocking capture / detection / publish loop.

        Falls back to a synthetic feed when the camera cannot be opened.
        The loop ends on ``q`` / Esc in the OpenCV window or on
        KeyboardInterrupt; both paths release resources and then exit the
        interpreter with status 0. Any other exception also triggers the
        cleanup but is then propagated, so failures are no longer hidden
        behind a successful exit code.

        Raises:
            SystemExit: with code 0 after a clean shutdown.
        """
        print("[CoreEngine] Accessing camera stream...")
        cap = cv2.VideoCapture(CAMERA_ID)

        # Apply the configured capture size.
        cap.set(cv2.CAP_PROP_FRAME_WIDTH, FRAME_WIDTH)
        cap.set(cv2.CAP_PROP_FRAME_HEIGHT, FRAME_HEIGHT)

        # No usable camera (e.g. headless host) -> drive the dashboard from a simulation.
        use_simulation = not cap.isOpened()
        if use_simulation:
            print("[CoreEngine] WARNING: Could not access physical web camera.")
            print("[CoreEngine] Pivoting to Cloud Simulation Mode to keep web HUD alive...")
        else:
            print("[CoreEngine] Camera stream operational. System fully active.")

        print("[CoreEngine] System loop running. Use the Web Dashboard to monitor telemetry.")

        prev_time = time.time()

        try:
            while True:
                current_time = time.time()

                if use_simulation:
                    frame = self._render_simulation_frame(current_time)
                else:
                    ok, frame = cap.read()
                    if not ok:
                        # Failed grab: back off briefly and retry.
                        time.sleep(0.01)
                        continue
                    # Mirror the frame so the overlay matches the driver's view.
                    frame = cv2.flip(frame, 1)

                # Tracking can be toggled from the dashboard.
                with dashboard_state.lock:
                    active = dashboard_state.detection_active

                if not active:
                    processed_frame = frame.copy()
                    cv2.putText(processed_frame, "TRACKING PAUSED", (50, 50),
                                cv2.FONT_HERSHEY_SIMPLEX, 0.8, (0, 165, 255), 2)
                    ear = None
                elif use_simulation:
                    ear, processed_frame = self._simulate_detection(frame, current_time)
                else:
                    # The landmarks element of the result is not needed here.
                    ear, _landmarks, processed_frame = self.detector.process_frame(frame)

                # Loop rate; falls back to 30 when the timestamps coincide.
                elapsed = current_time - prev_time
                fps = int(1.0 / elapsed) if elapsed > 0 else 30
                prev_time = current_time

                if ear is not None and active:
                    self._update_drowsiness_state(ear, current_time)
                else:
                    # No EAR this frame (paused or none returned): restart the closure timer.
                    self.consec_closed_frames = 0
                    self.eyes_closed_start_time = None

                # Publish telemetry for the web server.
                with dashboard_state.lock:
                    dashboard_state.latest_frame = processed_frame.copy()
                    if ear is not None:
                        dashboard_state.ear = ear
                    else:
                        dashboard_state.ear = 0.30  # Default baseline when no face present
                    dashboard_state.fps = fps

                # Local preview window; best effort because headless hosts cannot open one.
                try:
                    cv2.imshow("DriveSafe HUD AI Console", processed_frame)
                    key = cv2.waitKey(1) & 0xFF
                    if key == ord('q') or key == 27:
                        print("[CoreEngine] Exit key received. Terminating system.")
                        break
                    elif key == ord('r'):
                        self.reset_warnings()
                except Exception:
                    # No display available: sleep instead so the loop stays paced.
                    time.sleep(0.03)

        except KeyboardInterrupt:
            print("[CoreEngine] Keyboard interrupt. Shutting down.")
        finally:
            print("[CoreEngine] Releasing resources...")
            cap.release()
            try:
                cv2.destroyAllWindows()
            except Exception:
                pass
            self.assistant.stop()

        # Deliberately outside ``finally``: raising SystemExit there would
        # replace any in-flight exception and report success on a crash.
        sys.exit(0)
                 

if __name__ == "__main__":
    # Script entry point. Constructing SafeDrivingAssistant wires up the alert
    # manager, eye detector, voice assistant and dashboard server; run() then
    # blocks in the camera loop until the user quits.
    assistant_app = SafeDrivingAssistant()
    assistant_app.run()