Spaces:

MaroofTechSorcerer
/

Voice_Based_Sentiment_Analysis_with_Sarcasm_Detection

Sleeping

App Files Files Community

MaroofTechSorcerer commited on Apr 30, 2025

Commit

6d401a4

verified ·

1 Parent(s): 0879e44

Update app.py

Browse files

Files changed (1) hide show

app.py +426 -103

app.py CHANGED Viewed

@@ -1,53 +1,76 @@
 import os
 import streamlit as st
 import tempfile
-import whisper
-from transformers import pipeline
-import plotly.express as px
 import torch
 import logging
 import warnings
-import shutil
 # Suppress warnings for a clean console
 logging.getLogger("torch").setLevel(logging.CRITICAL)
 logging.getLogger("transformers").setLevel(logging.CRITICAL)
 warnings.filterwarnings("ignore")
 os.environ["TOKENIZERS_PARALLELISM"] = "false"
-torch.device("cpu")
 # Set Streamlit app layout
 st.set_page_config(layout="wide", page_title="Voice Based Sentiment Analysis")
 # Interface design
 st.title("🎙️ Voice Based Sentiment Analysis")
-st.write("Detect emotions, sentiment, and sarcasm from your voice with high accuracy.")
-# Sidebar for file upload
-st.sidebar.title("Audio Input")
-st.sidebar.write("Upload a WAV file for transcription and detailed analysis.")
-audio_file = st.sidebar.file_uploader("Choose an audio file", type=["wav"], help="Supports WAV format only.")
-upload_button = st.sidebar.button("Analyze", help="Click to process the uploaded audio.")
-# Check if FFmpeg is available
-def check_ffmpeg():
-    return shutil.which("ffmpeg") is not None
 # Emotion Detection Function
 @st.cache_resource
 def get_emotion_classifier():
-    emotion_model = "bhadresh-savani/distilbert-base-uncased-emotion"
-    return pipeline("text-classification", model=emotion_model, top_k=None, device=-1)
 def perform_emotion_detection(text):
     try:
         emotion_classifier = get_emotion_classifier()
         emotion_results = emotion_classifier(text)[0]
-        emotion_map = {"anger": "😡", "fear": "😨", "joy": "😊", "love": "❤️", "sadness": "😢", "surprise": "😲"}
         emotions_dict = {result['label']: result['score'] for result in emotion_results}
         top_emotion = max(emotions_dict, key=emotions_dict.get)
-        sentiment_map = {"joy": "POSITIVE", "love": "POSITIVE", "anger": "NEGATIVE", "fear": "NEGATIVE", "sadness": "NEGATIVE", "surprise": "NEUTRAL"}
-        sentiment = sentiment_map.get(top_emotion, "NEUTRAL")
         return emotions_dict, top_emotion, emotion_map, sentiment
     except Exception as e:
         st.error(f"Emotion detection failed: {str(e)}")
@@ -56,8 +79,10 @@ def perform_emotion_detection(text):
 # Sarcasm Detection Function
 @st.cache_resource
 def get_sarcasm_classifier():
-    sarcasm_model = "cardiffnlp/twitter-roberta-base-irony"
-    return pipeline("text-classification", model=sarcasm_model, device=-1)
 def perform_sarcasm_detection(text):
     try:
@@ -70,98 +95,396 @@ def perform_sarcasm_detection(text):
         st.error(f"Sarcasm detection failed: {str(e)}")
         return False, 0.0
-# Transcription Function with Whisper
 @st.cache_resource
-def get_whisper_model():
-    return whisper.load_model("base")
-def transcribe_audio(audio_file):
-    if not check_ffmpeg():
-        st.error("FFmpeg is not installed or not found in PATH. Please install FFmpeg and add it to your system PATH.")
-        st.markdown("**Instructions to install FFmpeg on Windows:**\n"
-                    "1. Download FFmpeg from [https://www.gyan.dev/ffmpeg/builds/](https://www.gyan.dev/ffmpeg/builds/) (e.g., `ffmpeg-release-essentials.zip`).\n"
-                    "2. Extract the ZIP to a folder (e.g., `C:\\ffmpeg`).\n"
-                    "3. Add `C:\\ffmpeg\\bin` to your system PATH:\n"
-                    "   - Right-click 'This PC' > 'Properties' > 'Advanced system settings' > 'Environment Variables'.\n"
-                    "   - Under 'System variables', edit 'Path' and add the new path.\n"
-                    "4. Restart your terminal and rerun the app.")
-        return ""
     try:
-        model = get_whisper_model()
-        # Save uploaded file to a temporary location
         temp_dir = tempfile.gettempdir()
-        temp_file_path = os.path.join(temp_dir, "temp_audio.wav")
         with open(temp_file_path, "wb") as f:
             f.write(audio_file.getvalue())
-        # Verify file exists
-        if not os.path.exists(temp_file_path):
-            st.error(f"Temporary file not created at {temp_file_path}. Check write permissions.")
-            return ""
-        # Transcribe using Whisper
-        result = model.transcribe(temp_file_path)
-        # Clean up temporary file
-        if os.path.exists(temp_file_path):
-            os.remove(temp_file_path)
-        return result["text"]
     except Exception as e:
-        st.error(f"Transcription failed: {str(e)}")
-        return ""
 # Main App Logic
 def main():
-    if audio_file and upload_button:
-        st.audio(audio_file.getvalue(), format='audio/wav')
-        st.caption("🎧 Uploaded Audio Playback")
-        with st.spinner('Analyzing audio with advanced precision...'):
-            transcribed_text = transcribe_audio(audio_file)
-            if not transcribed_text:
-                return
-            emotions_dict, top_emotion, emotion_map, sentiment = perform_emotion_detection(transcribed_text)
-            is_sarcastic, sarcasm_score = perform_sarcasm_detection(transcribed_text)
-        st.header("Transcribed Text")
-        st.text_area("Text", transcribed_text, height=150, disabled=True, help="The audio converted to text.")
-        st.header("Analysis Results")
-        col1, col2 = st.columns([1, 2])
-        with col1:
-            st.subheader("Sentiment")
-            sentiment_icon = "👍" if sentiment == "POSITIVE" else "👎" if sentiment == "NEGATIVE" else "😐"
-            st.markdown(f"**{sentiment_icon} {sentiment.capitalize()}** (Based on {top_emotion})")
-            st.info("Sentiment reflects the dominant emotion’s tone.")
-            st.subheader("Sarcasm")
-            sarcasm_icon = "😏" if is_sarcastic else "😐"
-            sarcasm_text = "Detected" if is_sarcastic else "Not Detected"
-            st.markdown(f"**{sarcasm_icon} {sarcasm_text}** (Score: {sarcasm_score:.3f})")
-            st.info("Score indicates sarcasm confidence (0 to 1).")
-        with col2:
-            st.subheader("Emotions")
-            if emotions_dict:
-                st.markdown(f"**Dominant:** {emotion_map.get(top_emotion, '❓')} {top_emotion.capitalize()} (Score: {emotions_dict[top_emotion]:.3f})")
-                sorted_emotions = sorted(emotions_dict.items(), key=lambda x: x[1], reverse=True)
-                emotions = [e[0] for e in sorted_emotions]
-                scores = [e[1] for e in sorted_emotions]
-                fig = px.bar(x=emotions, y=scores, labels={'x': 'Emotion', 'y': 'Score'},
-                             title="Emotion Distribution", color=emotions,
-                             color_discrete_sequence=px.colors.qualitative.Pastel1)
-                fig.update_layout(yaxis_range=[0, 1], showlegend=False, title_font_size=14)
-                st.plotly_chart(fig, use_container_width=True)
-            else:
-                st.write("No emotions detected.")
-        st.info("Emotions drive sentiment here. Sarcasm is analyzed separately for accuracy.")
-    elif upload_button and not audio_file:
-        st.sidebar.error("Please upload an audio file first!")
 if __name__ == "__main__":
-    main()

 import os
 import streamlit as st
 import tempfile
 import torch
+import transformers
+from transformers import pipeline, AutoModelForSequenceClassification, AutoTokenizer
+import plotly.express as px
 import logging
 import warnings
+import whisper
+from pydub import AudioSegment
+import time
+import base64
+import io
+import streamlit.components.v1 as components
 # Suppress warnings for a clean console
 logging.getLogger("torch").setLevel(logging.CRITICAL)
 logging.getLogger("transformers").setLevel(logging.CRITICAL)
 warnings.filterwarnings("ignore")
 os.environ["TOKENIZERS_PARALLELISM"] = "false"
+# Check if CUDA is available, otherwise use CPU
+device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+print(f"Using device: {device}")
 # Set Streamlit app layout
 st.set_page_config(layout="wide", page_title="Voice Based Sentiment Analysis")
 # Interface design
 st.title("🎙️ Voice Based Sentiment Analysis")
+st.write("Detect emotions, sentiment, and sarcasm from your voice with state-of-the-art accuracy using OpenAI Whisper.")
 # Emotion Detection Function
 @st.cache_resource
 def get_emotion_classifier():
+    tokenizer = AutoTokenizer.from_pretrained("SamLowe/roberta-base-go_emotions", use_fast=True)
+    model = AutoModelForSequenceClassification.from_pretrained("SamLowe/roberta-base-go_emotions")
+    model = model.to(device)
+    return pipeline("text-classification", model=model, tokenizer=tokenizer, top_k=None, device=-1 if device.type == "cpu" else 0)
 def perform_emotion_detection(text):
     try:
         emotion_classifier = get_emotion_classifier()
         emotion_results = emotion_classifier(text)[0]
+        emotion_map = {
+            "admiration": "🤩", "amusement": "😄", "anger": "😡", "annoyance": "😒",
+            "approval": "👍", "caring": "🤗", "confusion": "😕", "curiosity": "🧐",
+            "desire": "😍", "disappointment": "😞", "disapproval": "👎", "disgust": "🤢",
+            "embarrassment": "😳", "excitement": "🤩", "fear": "😨", "gratitude": "🙏",
+            "grief": "😢", "joy": "😊", "love": "❤️", "nervousness": "😰",
+            "optimism": "🌈", "pride": "😌", "realization": "💡", "relief": "😌",
+            "remorse": "😔", "sadness": "😭", "surprise": "😲", "neutral": "😐"
+        }
+        positive_emotions = ["admiration", "amusement", "approval", "caring", "desire",
+                            "excitement", "gratitude", "joy", "love", "optimism", "pride", "relief"]
+        negative_emotions = ["anger", "annoyance", "disappointment", "disapproval", "disgust",
+                            "embarrassment", "fear", "grief", "nervousness", "remorse", "sadness"]
+        neutral_emotions = ["confusion", "curiosity", "realization", "surprise", "neutral"]
         emotions_dict = {result['label']: result['score'] for result in emotion_results}
         top_emotion = max(emotions_dict, key=emotions_dict.get)
+        if top_emotion in positive_emotions:
+            sentiment = "POSITIVE"
+        elif top_emotion in negative_emotions:
+            sentiment = "NEGATIVE"
+        else:
+            sentiment = "NEUTRAL"
         return emotions_dict, top_emotion, emotion_map, sentiment
     except Exception as e:
         st.error(f"Emotion detection failed: {str(e)}")
 # Sarcasm Detection Function
 @st.cache_resource
 def get_sarcasm_classifier():
+    tokenizer = AutoTokenizer.from_pretrained("cardiffnlp/twitter-roberta-base-irony", use_fast=True)
+    model = AutoModelForSequenceClassification.from_pretrained("cardiffnlp/twitter-roberta-base-irony")
+    model = model.to(device)
+    return pipeline("text-classification", model=model, tokenizer=tokenizer, device=-1 if device.type == "cpu" else 0)
 def perform_sarcasm_detection(text):
     try:
         st.error(f"Sarcasm detection failed: {str(e)}")
         return False, 0.0
+# Validate audio quality
+def validate_audio(audio_path):
+    try:
+        sound = AudioSegment.from_file(audio_path)
+        if sound.dBFS < -50:
+            st.warning("Audio volume is too low. Please record or upload a louder audio.")
+            return False
+        if len(sound) < 1000:  # Less than 1 second
+            st.warning("Audio is too short. Please record a longer audio.")
+            return False
+        return True
+    except:
+        st.error("Invalid or corrupted audio file.")
+        return False
+# Speech Recognition with Whisper
 @st.cache_resource
+def load_whisper_model():
+    # Use 'large-v3' for maximum accuracy
+    model = whisper.load_model("large-v3")
+    return model
+def transcribe_audio(audio_path, show_alternative=False):
+    try:
+        st.write(f"Processing audio file: {audio_path}")
+        sound = AudioSegment.from_file(audio_path)
+        st.write(f"Audio duration: {len(sound)/1000:.2f}s, Sample rate: {sound.frame_rate}, Channels: {sound.channels}")
+        # Convert to WAV format (16kHz, mono) for Whisper
+        temp_wav_path = os.path.join(tempfile.gettempdir(), "temp_converted.wav")
+        sound = sound.set_frame_rate(16000)
+        sound = sound.set_channels(1)
+        sound.export(temp_wav_path, format="wav")
+        # Load Whisper model
+        model = load_whisper_model()
+        # Transcribe audio
+        result = model.transcribe(temp_wav_path, language="en")
+        main_text = result["text"].strip()
+        # Clean up
+        if os.path.exists(temp_wav_path):
+            os.remove(temp_wav_path)
+        # Whisper doesn't provide alternatives, so return empty list
+        if show_alternative:
+            return main_text, []
+        return main_text
+    except Exception as e:
+        st.error(f"Transcription failed: {str(e)}")
+        return "", [] if show_alternative else ""
+# Function to handle uploaded audio files
+def process_uploaded_audio(audio_file):
+    if not audio_file:
+        return None
     try:
         temp_dir = tempfile.gettempdir()
+        temp_file_path = os.path.join(temp_dir, f"uploaded_audio_{int(time.time())}.wav")
         with open(temp_file_path, "wb") as f:
             f.write(audio_file.getvalue())
+        if not validate_audio(temp_file_path):
+            return None
+        return temp_file_path
+    except Exception as e:
+        st.error(f"Error processing uploaded audio: {str(e)}")
+        return None
+# Show model information
+def show_model_info():
+    st.sidebar.header("🧠 About the Models")
+    model_tabs = st.sidebar.tabs(["Emotion", "Sarcasm", "Speech"])
+    with model_tabs[0]:
+        st.markdown("""
+        **Emotion Model**: SamLowe/roberta-base-go_emotions
+        - Fine-tuned on GoEmotions dataset (58k Reddit comments, 27 emotions)
+        - Architecture: RoBERTa base
+        - Micro-F1: 0.46
+        [🔍 Model Hub](https://huggingface.co/SamLowe/roberta-base-go_emotions)
+        """)
+    with model_tabs[1]:
+        st.markdown("""
+        **Sarcasm Model**: cardiffnlp/twitter-roberta-base-irony
+        - Trained on SemEval-2018 Task 3 (Twitter irony dataset)
+        - Architecture: RoBERTa base
+        - F1-score: 0.705
+        [🔍 Model Hub](https://huggingface.co/cardiffnlp/twitter-roberta-base-irony)
+        """)
+    with model_tabs[2]:
+        st.markdown("""
+        **Speech Recognition**: OpenAI Whisper (large-v3)
+        - State-of-the-art model for speech-to-text
+        - Accuracy: ~5-10% WER on clean English audio
+        - Robust to noise, accents, and varied conditions
+        - Runs locally, no internet required
+        **Tips**: Use good mic, reduce noise, speak clearly
+        [🔍 Model Details](https://github.com/openai/whisper)
+        """)
+# Custom audio recorder using HTML/JS
+def custom_audio_recorder():
+    audio_recorder_html = """
+    <script>
+    var audioRecorder = {
+        audioBlobs: [],
+        mediaRecorder: null,
+        streamBeingCaptured: null,
+        start: function() {
+            if (!(navigator.mediaDevices && navigator.mediaDevices.getUserMedia)) {
+                return Promise.reject(new Error('mediaDevices API or getUserMedia method is not supported in this browser.'));
+            }
+            else {
+                return navigator.mediaDevices.getUserMedia({ audio: true })
+                    .then(stream => {
+                        audioRecorder.streamBeingCaptured = stream;
+                        audioRecorder.mediaRecorder = new MediaRecorder(stream);
+                        audioRecorder.audioBlobs = [];
+                        audioRecorder.mediaRecorder.addEventListener("dataavailable", event => {
+                            audioRecorder.audioBlobs.push(event.data);
+                        });
+                        audioRecorder.mediaRecorder.start();
+                    });
+            }
+        },
+        stop: function() {
+            return new Promise(resolve => {
+                let mimeType = audioRecorder.mediaRecorder.mimeType;
+                audioRecorder.mediaRecorder.addEventListener("stop", () => {
+                    let audioBlob = new Blob(audioRecorder.audioBlobs, { type: mimeType });
+                    resolve(audioBlob);
+                });
+                audioRecorder.mediaRecorder.stop();
+                audioRecorder.stopStream();
+                audioRecorder.resetRecordingProperties();
+            });
+        },
+        stopStream: function() {
+            audioRecorder.streamBeingCaptured.getTracks()
+                .forEach(track => track.stop());
+        },
+        resetRecordingProperties: function() {
+            audioRecorder.mediaRecorder = null;
+            audioRecorder.streamBeingCaptured = null;
+        }
+    }
+    var isRecording = false;
+    var recordButton = document.getElementById('record-button');
+    var audioElement = document.getElementById('audio-playback');
+    var audioData = document.getElementById('audio-data');
+    function toggleRecording() {
+        if (!isRecording) {
+            audioRecorder.start()
+                .then(() => {
+                    isRecording = true;
+                    recordButton.textContent = 'Stop Recording';
+                    recordButton.classList.add('recording');
+                })
+                .catch(error => {
+                    alert('Error starting recording: ' + error.message);
+                });
+        } else {
+            audioRecorder.stop()
+                .then(audioBlob => {
+                    const audioUrl = URL.createObjectURL(audioBlob);
+                    audioElement.src = audioUrl;
+                    const reader = new FileReader();
+                    reader.readAsDataURL(audioBlob);
+                    reader.onloadend = function() {
+                        const base64data = reader.result;
+                        audioData.value = base64data;
+                        const streamlitMessage = {type: "streamlit:setComponentValue", value: base64data};
+                        window.parent.postMessage(streamlitMessage, "*");
+                    }
+                    isRecording = false;
+                    recordButton.textContent = 'Start Recording';
+                    recordButton.classList.remove('recording');
+                });
+        }
+    }
+    document.addEventListener('DOMContentLoaded', function() {
+        recordButton = document.getElementById('record-button');
+        audioElement = document.getElementById('audio-playback');
+        audioData = document.getElementById('audio-data');
+        recordButton.addEventListener('click', toggleRecording);
+    });
+    </script>
+    <div class="audio-recorder-container">
+        <button id="record-button" class="record-button">Start Recording</button>
+        <audio id="audio-playback" controls style="display:block; margin-top:10px;"></audio>
+        <input type="hidden" id="audio-data" name="audio-data">
+    </div>
+    <style>
+    .audio-recorder-container {
+        display: flex;
+        flex-direction: column;
+        align-items: center;
+        padding: 20px;
+    }
+    .record-button {
+        background-color: #f63366;
+        color: white;
+        border: none;
+        padding: 10px 20px;
+        border-radius: 5px;
+        cursor: pointer;
+        font-size: 16px;
+    }
+    .record-button.recording {
+        background-color: #ff0000;
+        animation: pulse 1.5s infinite;
+    }
+    @keyframes pulse {
+        0% { opacity: 1; }
+        50% { opacity: 0.7; }
+        100% { opacity: 1; }
+    }
+    </style>
+    """
+    return components.html(audio_recorder_html, height=150)
+# Function to display analysis results
+def display_analysis_results(transcribed_text):
+    emotions_dict, top_emotion, emotion_map, sentiment = perform_emotion_detection(transcribed_text)
+    is_sarcastic, sarcasm_score = perform_sarcasm_detection(transcribed_text)
+    st.header("Transcribed Text")
+    st.text_area("Text", transcribed_text, height=150, disabled=True, help="The audio converted to text.")
+    confidence_score = min(0.95, max(0.70, len(transcribed_text.split()) / 50))
+    st.caption(f"Transcription confidence: {confidence_score:.2f}")
+    st.header("Analysis Results")
+    col1, col2 = st.columns([1, 2])
+    with col1:
+        st.subheader("Sentiment")
+        sentiment_icon = "👍" if sentiment == "POSITIVE" else "👎" if sentiment == "NEGATIVE" else "😐"
+        st.markdown(f"**{sentiment_icon} {sentiment.capitalize()}** (Based on {top_emotion})")
+        st.info("Sentiment reflects the dominant emotion's tone.")
+        st.subheader("Sarcasm")
+        sarcasm_icon = "😏" if is_sarcastic else "😐"
+        sarcasm_text = "Detected" if is_sarcastic else "Not Detected"
+        st.markdown(f"**{sarcasm_icon} {sarcasm_text}** (Score: {sarcasm_score:.3f})")
+        st.info("Score indicates sarcasm confidence (0 to 1).")
+    with col2:
+        st.subheader("Emotions")
+        if emotions_dict:
+            st.markdown(f"**Dominant:** {emotion_map.get(top_emotion, '❓')} {top_emotion.capitalize()} (Score: {emotions_dict[top_emotion]:.3f})")
+            sorted_emotions = sorted(emotions_dict.items(), key=lambda x: x[1], reverse=True)
+            top_emotions = sorted_emotions[:8]
+            emotions = [e[0] for e in top_emotions]
+            scores = [e[1] for e in top_emotions]
+            fig = px.bar(x=emotions, y=scores, labels={'x': 'Emotion', 'y': 'Score'},
+                         title="Top Emotions Distribution", color=emotions,
+                         color_discrete_sequence=px.colors.qualitative.Bold)
+            fig.update_layout(yaxis_range=[0, 1], showlegend=False, title_font_size=14)
+            st.plotly_chart(fig, use_container_width=True)
+        else:
+            st.write("No emotions detected.")
+    with st.expander("Analysis Details", expanded=False):
+        st.write("""
+        **How this works:**
+        1. **Speech Recognition**: Audio transcribed using OpenAI Whisper (large-v3)
+        2. **Emotion Analysis**: RoBERTa model trained on GoEmotions (27 emotions)
+        3. **Sentiment Analysis**: Derived from dominant emotion
+        4. **Sarcasm Detection**: RoBERTa model for irony detection
+        **Accuracy depends on**:
+        - Audio quality
+        - Speech clarity
+        - Background noise
+        - Speech patterns
+        """)
+# Process base64 audio data
+def process_base64_audio(base64_data):
+    try:
+        base64_binary = base64_data.split(',')[1]
+        binary_data = base64.b64decode(base64_binary)
+        temp_dir = tempfile.gettempdir()
+        temp_file_path = os.path.join(temp_dir, f"recording_{int(time.time())}.wav")
+        with open(temp_file_path, "wb") as f:
+            f.write(binary_data)
+        if not validate_audio(temp_file_path):
+            return None
+        return temp_file_path
     except Exception as e:
+        st.error(f"Error processing audio data: {str(e)}")
+        return None
 # Main App Logic
 def main():
+    tab1, tab2 = st.tabs(["📁 Upload Audio", "🎙️ Record Audio"])
+    with tab1:
+        st.header("Upload an Audio File")
+        audio_file = st.file_uploader("Choose an audio file", type=["wav", "mp3", "ogg"],
+                                     help="Upload an audio file for analysis")
+        if audio_file:
+            st.audio(audio_file.getvalue())
+            st.caption("🎧 Uploaded Audio Playback")
+            upload_button = st.button("Analyze Upload", key="analyze_upload")
+            if upload_button:
+                with st.spinner('Analyzing audio with advanced precision...'):
+                    temp_audio_path = process_uploaded_audio(audio_file)
+                    if temp_audio_path:
+                        main_text, alternatives = transcribe_audio(temp_audio_path, show_alternative=True)
+                        if main_text:
+                            if alternatives:
+                                with st.expander("Alternative transcriptions detected", expanded=False):
+                                    for i, alt in enumerate(alternatives[:3], 1):
+                                        st.write(f"{i}. {alt}")
+                            display_analysis_results(main_text)
+                        else:
+                            st.error("Could not transcribe the audio. Please try again with clearer audio.")
+                        if os.path.exists(temp_audio_path):
+                            os.remove(temp_audio_path)
+    with tab2:
+        st.header("Record Your Voice")
+        st.write("Use the recorder below to analyze your speech in real-time.")
+        st.subheader("Browser-Based Recorder")
+        st.write("Click the button below to start/stop recording.")
+        audio_data = custom_audio_recorder()
+        if audio_data:
+            analyze_rec_button = st.button("Analyze Recording", key="analyze_rec")
+            if analyze_rec_button:
+                with st.spinner("Processing your recording..."):
+                    temp_audio_path = process_base64_audio(audio_data)
+                    if temp_audio_path:
+                        transcribed_text = transcribe_audio(temp_audio_path)
+                        if transcribed_text:
+                            display_analysis_results(transcribed_text)
+                        else:
+                            st.error("Could not transcribe the audio. Please try speaking more clearly.")
+                        if os.path.exists(temp_audio_path):
+                            os.remove(temp_audio_path)
+        st.subheader("Manual Text Input")
+        st.write("If recording doesn't work, you can type your text here:")
+        manual_text = st.text_area("Enter text to analyze:", placeholder="Type what you want to analyze...")
+        analyze_text_button = st.button("Analyze Text", key="analyze_manual")
+        if analyze_text_button and manual_text:
+            display_analysis_results(manual_text)
+    show_model_info()
 if __name__ == "__main__":
+    main()