Spaces:

Gagan0141
/

MindSync_AI

Sleeping

File size: 14,750 Bytes

e7afd1c

# _virtual_chat.py
import queue
emotion_queue = queue.Queue()

from fer.fer import FER

# GPU optional – FER runs on CPU by default
emotion_detector = FER(mtcnn=True)

import streamlit as st
import cv2, time, os, tempfile, threading, datetime, glob, base64
import speech_recognition as sr
# from deepface import DeepFace
from db import get_db

import numpy as np

DEEPFACE_AVAILABLE = True
try:
    import deepface
except:
    DEEPFACE_AVAILABLE = False


def smooth_emotion_ema(emotion: str, confidence: float, alpha: float = 0.3):
    ema = st.session_state.emotion_ema

    if emotion not in ema:
        ema[emotion] = confidence
    else:
        ema[emotion] = alpha * confidence + (1 - alpha) * ema[emotion]

    # Decay other emotions
    for e in list(ema.keys()):
        if e != emotion:
            ema[e] *= (1 - alpha)

    # Pick strongest
    smoothed_emotion = max(ema, key=ema.get)
    return smoothed_emotion, ema[smoothed_emotion]


# ==================== Virtual Chat Mode ====================
def virtual_chat_mode(username=None, detect_text_emotion_func=None, retrieve_answer_func=None):
    if username is None:
        username = "Guest"
    
    if detect_text_emotion_func is None:
        def detect_text_emotion_func(text):
            return "neutral", 0.5
    
    if retrieve_answer_func is None:
        def retrieve_answer_func(query, emotion):
            return "I'm here to help. Please connect the RAG system."

    st.title("🎥 Virtual Chat - Live Face Emotion Detection")

    if not DEEPFACE_AVAILABLE:
        st.error("⚠️ DeepFace library not installed. Please install it: `pip install deepface`")
        return

    st.info("📸 Camera stays open! Chat freely with text or voice - bot speaks back!")

    EMOJI_MAP = {
        "happy": "😄", "sad": "😢", "angry": "😠", "fear": "😨",
        "neutral": "😐", "surprise": "😲", "disgust": "🤢"
    }

    # ==================== SESSION STATE ====================
    for key, val in {
        "live_emotion": "neutral",
        "live_confidence": 0.0,
        "camera_active": False,
        "frame_counter": 0,
        "cap": None,
        "emotion_ema": {},
        "virtual_chat_history": [],
        "emotion_timeline": [],
        "last_frame": None,
        "detecting_emotion": False,  # Flag to prevent multiple detections
    }.items():
        if key not in st.session_state:
            st.session_state[key] = val

    # ==================== TTS ====================
    try:
        import pyttsx3
        tts_engine = pyttsx3.init()
        tts_engine.setProperty('rate', 150)
        tts_engine.available = True
    except:
        tts_engine = type('', (), {"available": False})()

    def speak_async(text):
        if not tts_engine.available:
            return
        def speak():
            try:
                tts_engine.say(text)
                tts_engine.runAndWait()
            except:
                pass
        threading.Thread(target=speak, daemon=True).start()

    # ==================== ASYNC EMOTION DETECTION ====================
    def detect_emotion_async(frame_copy):
        if st.session_state.detecting_emotion:
            return

        st.session_state.detecting_emotion = True

        def _detect():
            try:
                # FER expects RGB
                rgb_frame = cv2.cvtColor(frame_copy, cv2.COLOR_BGR2RGB)

                result = emotion_detector.detect_emotions(rgb_frame)

                if not result:
                    return

                # pick largest face
                face = max(result, key=lambda r: r["box"][2] * r["box"][3])

                emotions = face["emotions"]
                emotion = max(emotions, key=emotions.get)
                confidence = emotions[emotion]

                emotion_queue.put((emotion, confidence))

            except Exception:
                pass
            finally:
                st.session_state.detecting_emotion = False

        threading.Thread(target=_detect, daemon=True).start()

    # ==================== CRISIS KEYWORDS ====================
    CRISIS_KEYWORDS = ["suicide", "kill myself", "end my life", "i want to die", "harm myself"]

    # ==================== LAYOUT ====================
    col1, col2 = st.columns([1, 1])

    # ==================== CAMERA ====================
    with col1:
        st.subheader("📹 Live Camera Feed")
        st.metric(
            "Your Current Emotion",
            f"{EMOJI_MAP.get(st.session_state.live_emotion, '😐')} {st.session_state.live_emotion.title()}",
            f"{st.session_state.live_confidence:.0%}"
        )

        btn_col1, btn_col2, btn_col3 = st.columns(3)
        
        with btn_col1:
            if not st.session_state.camera_active:
                if st.button("📷 Start Camera", use_container_width=True):
                    try:
                        # Release any existing camera
                        if st.session_state.cap is not None:
                            st.session_state.cap.release()
                        
                        # Open new camera
                        st.session_state.cap = cv2.VideoCapture(0)
                        st.session_state.cap.set(cv2.CAP_PROP_FRAME_WIDTH, 640)
                        st.session_state.cap.set(cv2.CAP_PROP_FRAME_HEIGHT, 480)
                        st.session_state.cap.set(cv2.CAP_PROP_FPS, 30)
                        st.session_state.cap.set(cv2.CAP_PROP_BUFFERSIZE, 1)
                        
                        if st.session_state.cap.isOpened():
                            st.session_state.camera_active = True
                            st.session_state.frame_counter = 0
                            st.success("✅ Camera started!")
                        else:
                            st.error("❌ Failed to open camera")
                    except Exception as e:
                        st.error(f"Camera error: {str(e)}")
                    st.rerun()
            else:
                if st.button("⏹ Stop Camera", use_container_width=True):
                    st.session_state.camera_active = False
                    if st.session_state.cap:
                        st.session_state.cap.release()
                        st.session_state.cap = None
                    save_session_to_mongo(username)
                    st.success("Camera stopped and session saved!")
                    st.rerun()

        with btn_col2:
            if st.button("📸 Snapshot", use_container_width=True, disabled=not st.session_state.camera_active):
                if st.session_state.last_frame is not None:
                    os.makedirs("snapshots", exist_ok=True)
                    fname = f"snapshots/snap_{int(time.time())}.jpg"
                    cv2.imwrite(fname, st.session_state.last_frame)
                    st.success(f"📷 Saved!")
        
        with btn_col3:
            if st.button("🔄 Detect Now", use_container_width=True, disabled=not st.session_state.camera_active):
                if st.session_state.last_frame is not None and not st.session_state.detecting_emotion:
                    detect_emotion_async(st.session_state.last_frame.copy())
                    st.info("🔍 Detecting...")

        video_placeholder = st.empty()

        # ==================== CAMERA LOOP ====================
        if st.session_state.camera_active:

            # ✅ Process emotion results from background thread
            while not emotion_queue.empty():
                emotion, confidence = emotion_queue.get()

                smooth_e, smooth_c = smooth_emotion_ema(emotion, confidence)

                st.session_state.live_emotion = smooth_e
                st.session_state.live_confidence = smooth_c

                st.session_state.emotion_timeline.append({
                    "timestamp": datetime.datetime.utcnow().isoformat(),
                    "raw_emotion": emotion,
                    "raw_confidence": confidence,
                    "smoothed_emotion": smooth_e,
                    "smoothed_confidence": smooth_c
                })

                st.session_state.detecting_emotion = False

            # Ensure camera is open
            if st.session_state.cap is None or not st.session_state.cap.isOpened():
                st.session_state.cap = cv2.VideoCapture(0)
                st.session_state.cap.set(cv2.CAP_PROP_FRAME_WIDTH, 640)
                st.session_state.cap.set(cv2.CAP_PROP_FRAME_HEIGHT, 480)

            ret, frame = st.session_state.cap.read()

            if ret:
                frame = cv2.flip(frame, 1)
                st.session_state.last_frame = frame.copy()
                st.session_state.frame_counter += 1

                # 🔍 Emotion detection every ~5 seconds (stable)
                if (
                    st.session_state.frame_counter % 150 == 0
                    and not st.session_state.detecting_emotion
                ):
                    detect_emotion_async(frame.copy())

                # Overlay emotion
                emotion_text = st.session_state.live_emotion.upper()
                confidence_text = f"{st.session_state.live_confidence:.0%}"

                cv2.rectangle(frame, (5, 5), (300, 70), (0, 0, 0), -1)
                cv2.rectangle(frame, (5, 5), (300, 70), (0, 255, 0), 2)

                cv2.putText(
                    frame, emotion_text, (15, 35),
                    cv2.FONT_HERSHEY_SIMPLEX, 0.8, (0, 255, 0), 2
                )
                cv2.putText(
                    frame, confidence_text, (15, 60),
                    cv2.FONT_HERSHEY_SIMPLEX, 0.6, (255, 255, 255), 2
                )

                video_placeholder.image(frame.copy(), channels="BGR")
            else:
                video_placeholder.error("❌ Cannot read from camera")

                # 🔁 Controlled rerun (ONLY when camera is active)
                time.sleep(0.05)   # ~20 FPS (CPU-safe)
                st.rerun()


    # ==================== CHAT ====================
    with col2:
        st.subheader("💬 Chat Interface")
        
        # Display chat history in a scrollable container
        chat_container = st.container()
        with chat_container:
            for m in st.session_state.virtual_chat_history:
                with st.chat_message(m["role"]):
                    st.markdown(m["content"])

        # Input mode selection (stays inside column)
        input_mode = st.radio("Choose Input Mode:", ["💬 Type", "🎤 Speak"], horizontal=True)
    
    # ==================== INPUT SECTION (OUTSIDE COLUMNS) ====================
    user_input = ""
    
    if input_mode == "💬 Type":
        user_input = st.chat_input("Type your message here...")
    else:
        if st.button("🎤 Press & Speak", use_container_width=True):
            recognizer = sr.Recognizer()
            with st.spinner("🎤 Listening..."):
                try:
                    with sr.Microphone() as source:
                        st.info("Speak now...")
                        recognizer.adjust_for_ambient_noise(source, duration=0.5)
                        audio = recognizer.listen(source, timeout=5, phrase_time_limit=10)
                    user_input = recognizer.recognize_google(audio)
                    st.success(f"✅ You said: {user_input}")
                except sr.WaitTimeoutError:
                    st.error("⏱️ No speech detected")
                except sr.UnknownValueError:
                    st.error("❌ Could not understand audio")
                except Exception as e:
                    st.error(f"❌ Error: {str(e)}")

    # ==================== PROCESS USER INPUT ====================
    if user_input:
        # Get emotions
        face_emotion = st.session_state.live_emotion
        face_confidence = st.session_state.live_confidence
        text_emotion, text_confidence = detect_text_emotion_func(user_input)

        # Choose emotion based on confidence
        final_emotion = face_emotion if face_confidence > 0.5 else text_emotion

        # Check for crisis keywords
        is_crisis = any(keyword in user_input.lower() for keyword in CRISIS_KEYWORDS)

        if is_crisis:
            bot_reply = (
                "⚠️ I'm very concerned about what you're sharing. Please reach out for help immediately:\n\n"
                "🇮🇳 India Helplines:\n"
                "• AASRA: 91-22-27546669\n"
                "• Vandrevala Foundation: 1860-2662-345\n\n"
                "You are not alone. Please talk to someone who can help."
            )
        else:
            # Retrieve answer from RAG system
            bot_reply = retrieve_answer_func(user_input, final_emotion)

        # Add to chat history
        st.session_state.virtual_chat_history.append({
            "role": "user",
            "content": user_input
        })
        st.session_state.virtual_chat_history.append({
            "role": "assistant",
            "content": bot_reply
        })

        # Speak the reply
        speak_async(bot_reply)
        
        st.rerun()

# ==================== SAVE TO MONGODB ====================
def save_session_to_mongo(username: str):
    try:
        db = get_db()
        col = db["virtual_chat_sessions"]

        # Read all snapshots
        snapshot_data = []
        if os.path.exists("snapshots"):
            for f in glob.glob("snapshots/*.jpg"):
                try:
                    with open(f, "rb") as img_file:
                        snapshot_data.append(
                            base64.b64encode(img_file.read()).decode("utf-8")
                        )
                except Exception:
                    pass

        doc = {
            "username": username,
            "timestamp": datetime.datetime.utcnow(),
            "chat_history": st.session_state.virtual_chat_history,
            "emotion_timeline": st.session_state.emotion_timeline,
            "snapshots": snapshot_data,
            "total_messages": len(st.session_state.virtual_chat_history),
            "session_duration_emotions": len(st.session_state.emotion_timeline),
        }

        col.insert_one(doc)
        st.success("✅ Virtual Chat Session saved to MongoDB")

    except Exception as e:
        st.warning("⚠️ Could not save session to database.")