Spaces:

dawit45
/

Pulse-scribe-ai

Sleeping

App Files Community

dawit45 committed on Dec 30, 2025

Commit

c843ad4

verified ·

1 Parent(s): b593057

Update app.py

Browse files

Files changed (1) hide show

app.py +89 -77

app.py CHANGED Viewed

@@ -5,89 +5,82 @@ import pandas as pd
 from datetime import datetime
 from huggingface_hub import InferenceClient
 from pypdf import PdfReader
-from PIL import Image
 import re
-# --- 1. CONFIGURATION & MODELS ---
 RAW_TOKEN = os.getenv("HF_TOKEN")
 HF_TOKEN = RAW_TOKEN.strip() if RAW_TOKEN else None
-# State-of-the-art Models
 audio_client = InferenceClient("openai/whisper-large-v3-turbo", token=HF_TOKEN)
-# Qwen 2.5 7B is the most reliable model for free-tier medical reasoning right now
 text_client = InferenceClient("Qwen/Qwen2.5-7B-Instruct", token=HF_TOKEN)
-image_client = InferenceClient("stabilityai/stable-diffusion-3.5-large", token=HF_TOKEN)
-# --- 2. ADVANCED LOGIC FUNCTIONS ---
-def parse_pdf_history(file):
     if file is None: return ""
     try:
         if file.name.endswith('.pdf'):
             reader = PdfReader(file.name)
-            return " ".join([p.extract_text() for p in reader.pages if p.extract_text()])[:1500]
-        return open(file.name, 'r').read()[:1500]
     except: return ""
 def extract_vitals(text):
-    """Zero-delay vitals extraction."""
-    prompt = f"Extract vitals as JSON list [{{'Metric': '...', 'Value': '...', 'Status': '...'}}]. Text: {text}"
     try:
         res = text_client.chat_completion([{"role": "user", "content": prompt}], max_tokens=200)
-        content = res.choices[0].message.content
-        match = re.search(r'\[.*\]', content, re.DOTALL)
         if match: return pd.DataFrame(json.loads(match.group()))
     except: pass
     return pd.DataFrame(columns=["Metric", "Value", "Status"])
-# --- 3. THE "NEVER-FAIL" WORKFLOW ---
-def clinical_master_engine(audio, history_file):
     v_df = pd.DataFrame(columns=["Metric", "Value", "Status"])
-    transcript = ""
-    analysis = ""
     if audio is None:
-        yield "", "### ❌ Status: No audio detected.", v_df, None, "{}"
         return
     try:
-        # STEP A: TRANSCRIPTION
-        yield "", "🎙️ **Whisper Ear Active:** Transcribing consultation...", v_df, None, "{}"
-        transcript_res = audio_client.automatic_speech_recognition(audio)
-        transcript = transcript_res.text
         if not transcript:
-            yield "", "### ❌ Status: Transcription failed. Please speak louder.", v_df, None, "{}"
             return
-        # STEP B: VITALS & HISTORY
-        yield transcript, "🧠 **AI Brain Processing:** Extracting metrics...", v_df, None, "{}"
         v_df = extract_vitals(transcript)
-        hist_text = parse_pdf_history(history_file)
-        # STEP C: STABLE SOAP GENERATION
-        master_prompt = f"""
-        System: Act as an Elite Medical Scribe.
-        Current Consultation: {transcript}
-        Patient History: {hist_text}
-        Format the output perfectly using Markdown:
-        # 📋 Professional SOAP Note
-        (Subjective, Objective, Assessment, Plan)
-        # ⚖️ Evidence Engine
-        (Cite 2025 Clinical Guidelines)
-        # 🏠 Patient Home-Care
-        (Friendly summary in Patient's native language)
         """
         analysis = ""
-        # Streaming the generation
         stream = text_client.chat_completion(
-            messages=[{"role": "user", "content": master_prompt}],
-            max_tokens=1500,
             stream=True,
             temperature=0.1
         )
@@ -96,74 +89,93 @@ def clinical_master_engine(audio, history_file):
             token = chunk.choices[0].delta.content
             if token:
                 analysis += token
-                # Yielding ALL fields to keep UI consistent
-                yield transcript, analysis, v_df, None, "{}"
-        # STEP D: INTEROPERABILITY
-        fhir = json.dumps({"resourceType": "Bundle", "timestamp": datetime.now().isoformat(), "clinical_status": "Processed"}, indent=2)
-        yield transcript, analysis, v_df, None, fhir
     except Exception as e:
-        yield "Error", f"### ❌ Engine Error\n{str(e)}", v_df, None, "{}"
-# --- 4. WORLD-CLASS BEAUTIFUL UI ---
 css = """
-.gradio-container { background: linear-gradient(135deg, #f5f7fa 0%, #c3cfe2 100%); }
-.main-card { border-radius: 25px !important; box-shadow: 0 10px 30px rgba(0,0,0,0.1) !important; background: rgba(255, 255, 255, 0.8) !important; backdrop-filter: blur(10px); padding: 20px; }
-.plus-btn { border: 3px dashed #6366f1 !important; border-radius: 20px !important; background: rgba(99, 102, 241, 0.05) !important; transition: all 0.3s; font-size: 30px !important; color: #6366f1 !important; }
-.plus-btn:hover { background: rgba(99, 102, 241, 0.1) !important; border-color: #4338ca !important; }
-.header-box { text-align: center; background: #6366f1; color: white; padding: 30px; border-radius: 20px; margin-bottom: 20px; box-shadow: 0 4px 15px rgba(99, 102, 241, 0.3); }
-.st-button { border-radius: 12px !important; height: 50px !important; font-weight: bold !important; font-size: 16px !important; }
 """
-with gr.Blocks(theme=gr.themes.Soft(primary_hue="indigo", font="Inter"), css=css) as demo:
     with gr.Column(elem_classes="header-box"):
-        gr.Markdown("# 🌎 Pulse-Scribe Elite: Global Medical Intelligence")
-        gr.Markdown("### State-of-the-Art Clinical Documentation & Decision Support")
     current_transcript = gr.State("")
     with gr.Row():
-        # LEFT COLUMN (Inputs)
         with gr.Column(scale=1, elem_classes="main-card"):
-            gr.Markdown("### 🎙️ 1. Audio Session")
-            audio_in = gr.Audio(label="Record Consultation", type="filepath")
-            gr.Markdown("### 📂 2. Clinical History")
-            history_in = gr.File(label="+", elem_classes="plus-btn") # THE PLUS SIGN
-            run_btn = gr.Button("🧠 EXECUTE INTELLIGENCE", variant="primary", elem_classes="st-button")
-            with gr.Accordion("🔍 Case Memory Q&A", open=False):
-                q_in = gr.Textbox(label="Ask AI about this patient...")
-                q_btn = gr.Button("Query Agent")
                 q_out = gr.Markdown()
-        # RIGHT COLUMN (Outputs)
         with gr.Column(scale=2, elem_classes="main-card"):
             with gr.Tabs():
-                with gr.TabItem("📋 Clinical Command Center"):
-                    analysis_out = gr.Markdown("### *Waiting for clinician input...*")
-                with gr.TabItem("📊 Dashboard & Vitals"):
                     vitals_out = gr.Dataframe(headers=["Metric", "Value", "Status"], interactive=False)
                     gr.Markdown("---")
-                    gr.Info("Visual analysis helps track patient trends in real-time.")
-                with gr.TabItem("⚙️ FHIR Interop"):
-                    fhir_out = gr.Code(label="Machine-Readable HL7-FHIR", language="json")
-    # --- BINDINGS ---
     run_btn.click(
-        fn=clinical_master_engine,
         inputs=[audio_in, history_in],
-        outputs=[current_transcript, analysis_out, vitals_out, gr.State(), fhir_out]
     )
     q_btn.click(
-        fn=lambda t, q: text_client.chat_completion([{"role": "user", "content": f"Context: {t}\nQuestion: {q}"}]).choices[0].message.content if t else "No consultation in memory.",
         inputs=[current_transcript, q_in],
         outputs=q_out
     )

 from datetime import datetime
 from huggingface_hub import InferenceClient
 from pypdf import PdfReader
 import re
+# --- 1. CONFIGURATION ---
 RAW_TOKEN = os.getenv("HF_TOKEN")
 HF_TOKEN = RAW_TOKEN.strip() if RAW_TOKEN else None
+# Hosted inference clients: Whisper for speech-to-text, Qwen for chat completion
 audio_client = InferenceClient("openai/whisper-large-v3-turbo", token=HF_TOKEN)
+# Qwen2.5-7B-Instruct (same model as before) handles vitals extraction, SOAP generation, and case Q&A
 text_client = InferenceClient("Qwen/Qwen2.5-7B-Instruct", token=HF_TOKEN)
+# --- 2. LOGIC ENGINE ---
+def parse_history(file):
     if file is None: return ""
     try:
         if file.name.endswith('.pdf'):
             reader = PdfReader(file.name)
+            return " ".join([p.extract_text() for p in reader.pages if p.extract_text()])[:1000]
+        return open(file.name, 'r').read()[:1000]
     except: return ""
 def extract_vitals(text):
+    prompt = f"Extract clinical vitals from: '{text}'. Return ONLY a JSON list: [{{'Metric': 'BP', 'Value': '120/80', 'Status': 'Normal'}}]. If none, return []."
     try:
         res = text_client.chat_completion([{"role": "user", "content": prompt}], max_tokens=200)
+        match = re.search(r'\[.*\]', res.choices[0].message.content, re.DOTALL)
         if match: return pd.DataFrame(json.loads(match.group()))
     except: pass
     return pd.DataFrame(columns=["Metric", "Value", "Status"])
+# --- 3. THE COMMAND CENTER WORKFLOW ---
+def pulse_scribe_engine(audio, history_file):
     v_df = pd.DataFrame(columns=["Metric", "Value", "Status"])
     if audio is None:
+        yield "", "## ⚠️ System Ready: Please record audio.", v_df, "{}"
         return
     try:
+        # STEP 1: TRANSCRIPTION
+        yield "", "## 🎙️ Listening to Consultation...", v_df, "{}"
+        transcript = audio_client.automatic_speech_recognition(audio).text
         if not transcript:
+            yield "", "## ❌ Error: Audio too quiet or unreadable.", v_df, "{}"
             return
+        # STEP 2: VITALS EXTRACTION
+        yield transcript, "## 🧠 Analyzing Vitals & History...", v_df, "{}"
         v_df = extract_vitals(transcript)
+        hist_text = parse_history(history_file)
+        # STEP 3: SOAP GENERATION (High-Intelligence Prompt)
+        system_msg = "You are an Elite Medical Intelligence Agent. Provide high-fidelity clinical documentation."
+        user_msg = f"""
+        TRANSCRIPT: {transcript}
+        PAST RECORDS: {hist_text}
+        Generate a professional report in Markdown:
+        # 📋 Clinical SOAP Note
+        (Detailed technical Subjective, Objective, Assessment, Plan)
+        # ⚖️ Global Evidence Engine
+        (Cite WHO/AHA 2025 Standards)
+        # 🏠 Patient Care Plan
+        (Simple, compassionate summary in patient's native tongue)
         """
         analysis = ""
+        # Stream the report token by token, re-yielding the accumulated text so the UI updates as it grows
         stream = text_client.chat_completion(
+            messages=[{"role": "system", "content": system_msg}, {"role": "user", "content": user_msg}],
+            max_tokens=2000,
             stream=True,
             temperature=0.1
         )
             token = chunk.choices[0].delta.content
             if token:
                 analysis += token
+                yield transcript, analysis, v_df, "{}"
+        # STEP 4: FHIR EXPORT
+        fhir = json.dumps({"resourceType": "Bundle", "timestamp": datetime.now().isoformat(), "status": "verified"}, indent=2)
+        yield transcript, analysis, v_df, fhir
     except Exception as e:
+        yield "Error", f"## ❌ Engine Timeout\n{str(e)}\n\n*Solution: Check HF_TOKEN and try again.*", v_df, "{}"
+# --- 4. ADVANCED MIDNIGHT UI DESIGN ---
 css = """
+/* Deep Black Background */
+body, .gradio-container { background-color: #050505 !important; color: #ffffff !important; }
+/* Glassmorphism Cards */
+.main-card {
+    background: rgba(20, 20, 20, 0.8) !important;
+    border: 1px solid #333 !important;
+    border-radius: 20px !important;
+    padding: 20px;
+    box-shadow: 0 0 20px rgba(59, 130, 246, 0.1);
+}
+/* Neon Blue Accents */
+.header-box { text-align: center; border-bottom: 2px solid #3b82f6; padding-bottom: 20px; margin-bottom: 30px; }
+h1 { color: #ffffff !important; font-weight: 900 !important; }
+h2, h3 { color: #3b82f6 !important; }
+/* The Advanced "+" Button */
+.plus-upload {
+    border: 2px dashed #3b82f6 !important;
+    border-radius: 15px !important;
+    background: #0f172a !important;
+    text-align: center;
+    font-size: 40px !important;
+}
+/* Table Styling */
+table { color: white !important; background: #111 !important; }
+/* White Text in all textboxes */
+textarea, input { background-color: #111 !important; color: white !important; border: 1px solid #444 !important; }
 """
+with gr.Blocks(theme=gr.themes.Default(), css=css) as demo:
     with gr.Column(elem_classes="header-box"):
+        gr.Markdown("# 🌎 PULSE-SCRIBE ELITE")
+        gr.Markdown("### GLOBAL CLINICAL INTELLIGENCE COMMAND CENTER • v5.5")
     current_transcript = gr.State("")
     with gr.Row():
+        # LEFT: INPUTS
         with gr.Column(scale=1, elem_classes="main-card"):
+            gr.Markdown("### 🎙️ SENSOR INTAKE")
+            audio_in = gr.Audio(label="Record Audio", type="filepath")
+            gr.Markdown("### 📂 PAST RECORDS")
+            history_in = gr.File(label="+", elem_classes="plus-upload")
+            run_btn = gr.Button("🧠 START CLINICAL REASONING", variant="primary")
+            with gr.Accordion("🔍 INTERACTIVE Q&A", open=False):
+                q_in = gr.Textbox(label="Query the Case Memory")
+                q_btn = gr.Button("Ask Assistant")
                 q_out = gr.Markdown()
+        # RIGHT: OUTPUTS
         with gr.Column(scale=2, elem_classes="main-card"):
             with gr.Tabs():
+                with gr.TabItem("📋 CLINICAL RECORD"):
+                    analysis_out = gr.Markdown("### *Awaiting Input...*")
+                with gr.TabItem("📈 VITALS DASHBOARD"):
                     vitals_out = gr.Dataframe(headers=["Metric", "Value", "Status"], interactive=False)
                     gr.Markdown("---")
+                    gr.Info("Real-time extraction of physiological markers.")
+                with gr.TabItem("⚙️ INTEROPERABILITY"):
+                    fhir_out = gr.Code(label="HL7-FHIR JSON", language="json")
+    # BINDINGS
     run_btn.click(
+        fn=pulse_scribe_engine,
         inputs=[audio_in, history_in],
+        outputs=[current_transcript, analysis_out, vitals_out, fhir_out]
     )
     q_btn.click(
+        fn=lambda t, q: text_client.chat_completion([{"role": "user", "content": f"Context: {t}\nQuestion: {q}"}]).choices[0].message.content if t else "Memory is empty.",
         inputs=[current_transcript, q_in],
         outputs=q_out
     )