Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -61,15 +61,21 @@ def extract_health_features(audio, sr):
|
|
| 61 |
raise ValueError("No voiced segments detected")
|
| 62 |
voiced_audio = np.concatenate(voiced_frames)
|
| 63 |
|
| 64 |
-
# Pitch (F0)
|
| 65 |
-
pitches, magnitudes = librosa.piptrack(y=voiced_audio, sr=sr, fmin=
|
| 66 |
-
valid_pitches = [p for p in pitches[magnitudes > 0] if p
|
| 67 |
pitch = np.mean(valid_pitches) if valid_pitches else 0
|
| 68 |
jitter = np.std(valid_pitches) / pitch if pitch and valid_pitches else 0
|
|
|
|
|
|
|
|
|
|
| 69 |
|
| 70 |
# Shimmer (amplitude variation)
|
| 71 |
amplitudes = librosa.feature.rms(y=voiced_audio, frame_length=2048, hop_length=512)[0]
|
| 72 |
shimmer = np.std(amplitudes) / np.mean(amplitudes) if np.mean(amplitudes) else 0
|
|
|
|
|
|
|
|
|
|
| 73 |
|
| 74 |
# Energy
|
| 75 |
energy = np.mean(librosa.feature.rms(y=voiced_audio, frame_length=2048, hop_length=512)[0])
|
|
@@ -102,11 +108,11 @@ def analyze_symptoms(text):
|
|
| 102 |
text = text.lower()
|
| 103 |
feedback = []
|
| 104 |
if "cough" in text or "difficulty breathing" in text:
|
| 105 |
-
feedback.append("
|
| 106 |
-
|
| 107 |
-
feedback.append("
|
| 108 |
-
|
| 109 |
-
feedback.append("
|
| 110 |
return "\n".join(feedback)
|
| 111 |
|
| 112 |
def analyze_voice(audio_file=None):
|
|
@@ -126,7 +132,7 @@ def analyze_voice(audio_file=None):
|
|
| 126 |
|
| 127 |
# Transcribe audio for symptom analysis
|
| 128 |
transcription = transcribe_audio(audio)
|
| 129 |
-
symptom_feedback = analyze_symptoms(transcription) if transcription else "No transcription available
|
| 130 |
|
| 131 |
# Analyze voice features for health indicators
|
| 132 |
feedback = []
|
|
@@ -135,17 +141,17 @@ def analyze_voice(audio_file=None):
|
|
| 135 |
|
| 136 |
# Rule-based analysis (thresholds from voice pathology studies)
|
| 137 |
if respiratory_score > 1.0:
|
| 138 |
-
feedback.append(f"
|
| 139 |
if mental_health_score > 5.0:
|
| 140 |
-
feedback.append(f"
|
| 141 |
if features["energy"] < 0.01:
|
| 142 |
-
feedback.append(f"
|
| 143 |
|
| 144 |
-
if not feedback:
|
| 145 |
-
feedback.append("
|
| 146 |
|
| 147 |
# Combine voice and symptom feedback
|
| 148 |
-
feedback.append("\n**Symptom
|
| 149 |
feedback.append(symptom_feedback)
|
| 150 |
feedback.append("\n**Voice Analysis Details**:")
|
| 151 |
feedback.append(f"Pitch: {features['pitch']:.2f} Hz (average fundamental frequency)")
|
|
@@ -191,9 +197,9 @@ iface = gr.Interface(
|
|
| 191 |
inputs=gr.Audio(type="filepath", label="Record or Upload Your Voice (WAV, MP3, FLAC, 1+ sec)", format="wav"),
|
| 192 |
outputs=gr.Textbox(label="Health Assessment Results"),
|
| 193 |
title="Voice Health Analyzer",
|
| 194 |
-
description="Record or upload your voice (minimum 1 second) to receive preliminary health insights. Speak clearly in English about your symptoms."
|
| 195 |
)
|
| 196 |
|
| 197 |
if __name__ == "__main__":
|
| 198 |
-
logger.info("Starting Voice Health Analyzer at 12:
|
| 199 |
iface.launch(server_name="0.0.0.0", server_port=7860)
|
|
|
|
| 61 |
raise ValueError("No voiced segments detected")
|
| 62 |
voiced_audio = np.concatenate(voiced_frames)
|
| 63 |
|
| 64 |
+
# Pitch (F0) with range validation
|
| 65 |
+
pitches, magnitudes = librosa.piptrack(y=voiced_audio, sr=sr, fmin=75, fmax=300) # Adult pitch range
|
| 66 |
+
valid_pitches = [p for p in pitches[magnitudes > 0] if 75 <= p <= 300]
|
| 67 |
pitch = np.mean(valid_pitches) if valid_pitches else 0
|
| 68 |
jitter = np.std(valid_pitches) / pitch if pitch and valid_pitches else 0
|
| 69 |
+
if jitter > 10: # Cap extreme jitter (possible noise)
|
| 70 |
+
jitter = 10
|
| 71 |
+
logger.warning("Jitter exceeds 10%, likely due to noise or distortion")
|
| 72 |
|
| 73 |
# Shimmer (amplitude variation)
|
| 74 |
amplitudes = librosa.feature.rms(y=voiced_audio, frame_length=2048, hop_length=512)[0]
|
| 75 |
shimmer = np.std(amplitudes) / np.mean(amplitudes) if np.mean(amplitudes) else 0
|
| 76 |
+
if shimmer > 10: # Cap extreme shimmer (possible noise)
|
| 77 |
+
shimmer = 10
|
| 78 |
+
logger.warning("Shimmer exceeds 10%, likely due to noise or distortion")
|
| 79 |
|
| 80 |
# Energy
|
| 81 |
energy = np.mean(librosa.feature.rms(y=voiced_audio, frame_length=2048, hop_length=512)[0])
|
|
|
|
| 108 |
text = text.lower()
|
| 109 |
feedback = []
|
| 110 |
if "cough" in text or "difficulty breathing" in text:
|
| 111 |
+
feedback.append("Your voice suggests possible respiratory issues, such as bronchitis or asthma. Please consult a doctor.")
|
| 112 |
+
elif "stressed" in text or "stress" in text or "tired" in text or "fatigue" in text:
|
| 113 |
+
feedback.append("Your voice and words indicate possible stress or fatigue, which may relate to anxiety or exhaustion. Consider seeking medical advice.")
|
| 114 |
+
else:
|
| 115 |
+
feedback.append("Your input didn’t specify clear symptoms. For a comprehensive health check, please describe any issues (e.g., cough, stress) and consult a healthcare provider.")
|
| 116 |
return "\n".join(feedback)
|
| 117 |
|
| 118 |
def analyze_voice(audio_file=None):
|
|
|
|
| 132 |
|
| 133 |
# Transcribe audio for symptom analysis
|
| 134 |
transcription = transcribe_audio(audio)
|
| 135 |
+
symptom_feedback = analyze_symptoms(transcription) if transcription else "No transcription available. Please record again with clear speech."
|
| 136 |
|
| 137 |
# Analyze voice features for health indicators
|
| 138 |
feedback = []
|
|
|
|
| 141 |
|
| 142 |
# Rule-based analysis (thresholds from voice pathology studies)
|
| 143 |
if respiratory_score > 1.0:
|
| 144 |
+
feedback.append(f"Your voice shows elevated jitter ({respiratory_score:.2f}%), which may indicate respiratory issues like vocal cord irregularities. Consult a doctor.")
|
| 145 |
if mental_health_score > 5.0:
|
| 146 |
+
feedback.append(f"Your voice exhibits elevated shimmer ({mental_health_score:.2f}%), suggesting possible stress or emotional strain. Consider a health check.")
|
| 147 |
if features["energy"] < 0.01:
|
| 148 |
+
feedback.append(f"Your vocal energy is low ({features['energy']:.4f}), which might suggest fatigue. Seek medical advice if persistent.")
|
| 149 |
|
| 150 |
+
if not feedback and not symptom_feedback.startswith("No transcription"):
|
| 151 |
+
feedback.append("Your voice shows no significant health indicators based on current analysis.")
|
| 152 |
|
| 153 |
# Combine voice and symptom feedback
|
| 154 |
+
feedback.append("\n**Symptom Feedback (from your words)**:")
|
| 155 |
feedback.append(symptom_feedback)
|
| 156 |
feedback.append("\n**Voice Analysis Details**:")
|
| 157 |
feedback.append(f"Pitch: {features['pitch']:.2f} Hz (average fundamental frequency)")
|
|
|
|
| 197 |
inputs=gr.Audio(type="filepath", label="Record or Upload Your Voice (WAV, MP3, FLAC, 1+ sec)", format="wav"),
|
| 198 |
outputs=gr.Textbox(label="Health Assessment Results"),
|
| 199 |
title="Voice Health Analyzer",
|
| 200 |
+
description="Record or upload your voice (minimum 1 second) to receive preliminary health insights. Speak clearly in English about your symptoms (e.g., 'I have a cough' or 'I feel stressed')."
|
| 201 |
)
|
| 202 |
|
| 203 |
if __name__ == "__main__":
    from datetime import datetime

    # Log the real launch time instead of the hard-coded "12:21 PM IST,
    # June 23, 2025" string, which is wrong on every run after that date.
    # Lazy %-style args keep formatting out of the hot path per logging docs.
    logger.info("Starting Voice Health Analyzer at %s", datetime.now().isoformat())
    # Bind on all interfaces for containerized (Spaces) deployment; 7860 is
    # Gradio's conventional port.
    iface.launch(server_name="0.0.0.0", server_port=7860)
|