Spaces:

VEDAGI1
/

Medica_DecisionSupportAI

Sleeping

App Files Files Community

Rajan Sharma committed on Oct 13

Commit

99d5da9

verified ·

1 Parent(s): 3d2ccd6

Update app.py

Browse files

Files changed (1) hide show

app.py +174 -99

app.py CHANGED Viewed

@@ -1,15 +1,8 @@
-# app_phi.py
-#
-# HIPAA-aware wrapper of the existing app. This keeps the analysis and assessment
-# capabilities intact while adding PHI safeguards:
-# - PHI_MODE flags with opt-in persistence
-# - Redaction before sending content to any external LLM
-# - Safer logging (no raw PHI)
-# - Optional banner and history controls
 #
-# NOTE: This file is designed to be a drop-in alternative to app.py.
-#       It preserves existing analysis logic and UI while adding HIPAA toggles.
 from __future__ import annotations
@@ -46,6 +39,8 @@ from privacy import safety_filter, refusal_reply
 from llm_router import cohere_chat, _co_client, cohere_embed
 def load_markdown_text(filepath: str) -> str:
     try:
         with open(filepath, "r", encoding="utf-8") as f:
@@ -57,21 +52,18 @@ def load_markdown_text(filepath: str) -> str:
 def _sanitize_text(s: str) -> str:
     if not isinstance(s, str):
         return s
-    # Remove control characters (except newline and tab)
     return re2.sub(r"[\p{C}--[\n\t]]+", "", s)
-# ---------------------- HIPAA helpers ----------------------
-# Very conservative redaction (risk reduction; not a full de-identification program).
 PHI_PATTERNS = [
-    (re.compile(r"\b\d{3}-\d{2}-\d{4}\b"), "[REDACTED_SSN]"),           # US SSN
-    (re.compile(r"\b\d{9}\b"), "[REDACTED_MRN]"),                         # 9-digit MRN (example)
     (re.compile(r"\b\d{3}[-.\s]?\d{3}[-.\s]?\d{4}\b"), "[REDACTED_PHONE]"),
     (re.compile(r"[A-Za-z0-9._%+-]+@[A-Za-z0-9.-]+\.[A-Za-z]{2,}"), "[REDACTED_EMAIL]"),
-    (re.compile(r"\b(19|20)\d{2}-\d{2}-\d{2}\b"), "[REDACTED_DOB]"),    # YYYY-MM-DD
-    (re.compile(r"\b\d{2}/\d{2}/(19|20)\d{2}\b"), "[REDACTED_DOB]"),    # MM/DD/YYYY
-    (re.compile(r"\b\d{5}(-\d{4})?\b"), "[REDACTED_ZIP]"),               # ZIP (US)
 ]
 def redact_phi(text: str) -> str:
@@ -83,18 +75,14 @@ def redact_phi(text: str) -> str:
     return t
 def safe_log(event_name: str, meta: dict | None = None):
-    # Avoid logging raw PHI or payloads
     try:
         meta = (meta or {}).copy()
         meta.pop("raw", None)
         log_event(event_name, None, meta)
     except Exception:
-        # Never raise from logging in PHI context
         pass
-# ---------------------- Original analysis helpers (unchanged) ----------------------
 def _create_python_script(user_scenario: str, schema_context: str) -> str:
     EXPERT_ANALYTICAL_GUIDELINES = """
 --- EXPERT ANALYTICAL GUIDELINES ---
@@ -195,13 +183,11 @@ def ping_cohere() -> str:
 def handle(user_msg: str, files: list, yield_update) -> str:
     try:
-        # Run app safety filter
         safe_in, blocked_in, reason_in = safety_filter(user_msg, mode="input")
         if blocked_in:
             return refusal_reply(reason_in)
-        # If PHI mode is enabled and we are not permitted to send PHI externally,
-        # redact the content before any LLM calls.
         redacted_in = safe_in
         if PHI_MODE and REDACT_BEFORE_LLM:
             redacted_in = redact_phi(safe_in)
@@ -209,8 +195,6 @@ def handle(user_msg: str, files: list, yield_update) -> str:
         file_paths: List[str] = [getattr(f, "name", None) or f for f in (files or [])]
         if file_paths:
-            # CSV analysis path preserved; we only use redacted_in in PROMPTS sent to the LLM.
-            # CSV data itself is processed locally as before.
             dataframes, schema_parts = [], []
             for i, p in enumerate(file_paths):
                 if p.endswith(".csv"):
@@ -227,8 +211,6 @@ def handle(user_msg: str, files: list, yield_update) -> str:
                 return "Please upload at least one CSV file."
             schema_context = "\n".join(schema_parts)
-            # If PHI is not allowed externally and PHI_MODE is on, we will use the redacted prompt.
             prompt_for_code = redacted_in if (PHI_MODE and not ALLOW_EXTERNAL_PHI) else safe_in
             yield_update("""```
@@ -255,12 +237,10 @@ def handle(user_msg: str, files: list, yield_update) -> str:
             yield_update("""```
 ✍️ Synthesizing final comprehensive report...
 ```""")
-            # For the final narrative, also route based on PHI policy
             writer_input = redacted_in if (PHI_MODE and not ALLOW_EXTERNAL_PHI) else safe_in
             final_report = _generate_final_report(writer_input, raw_data_output)
             return _sanitize_text(final_report)
         else:
-            # Pure chat path: redact if PHI_MODE and external is not allowed
             chat_input = redacted_in if (PHI_MODE and not ALLOW_EXTERNAL_PHI) else safe_in
             prompt = f"{GENERAL_CONVERSATION_PROMPT}\n\nUser: {chat_input}\nAssistant:"
             return _sanitize_text(cohere_chat(prompt) or "How can I help further?")
@@ -268,43 +248,119 @@ def handle(user_msg: str, files: list, yield_update) -> str:
     except Exception as e:
         tb = traceback.format_exc()
         safe_log("app_error", {"err": str(e)})
-        # Do not leak stack traces to UI in PHI mode
         return "A critical error occurred. Please contact your administrator." if PHI_MODE else f"A critical error occurred: {e}"
 PRIVACY_POLICY_TEXT = load_markdown_text("privacy_policy.md")
 TERMS_OF_SERVICE_TEXT = load_markdown_text("terms_of_service.md")
-with gr.Blocks(theme="soft", css="style.css") as demo:
-    # Persistent history state (in-memory). PHI mode defaults to no persistence.
-    assessment_history = gr.State([])
-    # Optional PHI banner
-    if PHI_MODE:
-        gr.Markdown(
-            "⚠️ **PHI Mode Enabled**: Protected Health Information safeguards are active. "
-            "History persistence is disabled by default. Avoid unnecessary identifiers."
-        )
-    # Modals
-    with gr.Group(visible=False) as privacy_modal:
-        with gr.Blocks():
-            gr.Markdown(PRIVACY_POLICY_TEXT)
-            close_privacy_btn = gr.Button("Close")
-    with gr.Group(visible=False) as terms_modal:
-        with gr.Blocks():
-            gr.Markdown(TERMS_OF_SERVICE_TEXT)
-            close_terms_btn = gr.Button("Close")
-    # UI
-    gr.Markdown("# Universal AI Data Analyst")
-    with gr.Row(variant="panel"):
-        with gr.Column(scale=1):
-            gr.Markdown("## New Assessment")
-            gr.Markdown(
-                "<p style='font-size:0.9rem; color: #6C757D;'>Upload CSVs for data analysis, or just enter a prompt to chat.</p>"
-            )
             files_input = gr.Files(
                 label="Upload Data Files (.csv)",
                 file_count="multiple",
@@ -312,34 +368,54 @@ with gr.Blocks(theme="soft", css="style.css") as demo:
                 file_types=[".csv"],
             )
             prompt_input = gr.Textbox(
-                label="Prompt", placeholder="Paste your scenario or question here.", lines=15
             )
-            with gr.Row():
-                send_btn = gr.Button("▶️ Send / Run Analysis", variant="primary", scale=2)
-                clear_btn = gr.Button("🗑️ Clear")
-            ping_btn = gr.Button("Ping Cohere")
             ping_out = gr.Markdown()
-        with gr.Column(scale=2):
-            with gr.Tabs():
-                with gr.TabItem("Current Assessment", id=0):
-                    chat_history_output = gr.Chatbot(
-                        label="Analysis Output", type="messages", height=600
-                    )
-                with gr.TabItem("Assessment History", id=1):
-                    gr.Markdown("## Review Past Assessments")
                     history_dropdown = gr.Dropdown(
                         label="Select an assessment to review", choices=[]
                     )
                     history_display = gr.Markdown(label="Selected Assessment Details")
-    with gr.Row():
-        gr.Markdown("---")
-    with gr.Row():
-        privacy_link = gr.Button("Privacy Policy", variant="link")
-        terms_link = gr.Button("Terms of Service", variant="link")
-    # Logic
     def run_analysis_wrapper(prompt, files, chat_history_list, history_state_list):
         if not prompt:
@@ -347,14 +423,11 @@ with gr.Blocks(theme="soft", css="style.css") as demo:
             yield chat_history_list, history_state_list, gr.update()
             return
-        # Append user message
         chat_with_user_msg = _append_msg(chat_history_list, "user", prompt)
-        # Placeholder for streamed updates (unused)
         def dummy_update(message: str):
             pass
-        # Thinking message
         thinking_message = _append_msg(
             chat_with_user_msg,
             "assistant",
@@ -364,21 +437,17 @@ with gr.Blocks(theme="soft", css="style.css") as demo:
         )
         yield thinking_message, history_state_list, gr.update()
-        # Run analysis/chat
         ai_response_text = handle(prompt, files, dummy_update)
-        # Append assistant response
         final_chat = _append_msg(chat_with_user_msg, "assistant", ai_response_text)
         timestamp = datetime.now().strftime("%Y-%m-%d %H:%M:%S")
-        # Filenames
         file_names: List[str] = []
         if files:
             file_names = [
                 os.path.basename(f.name if hasattr(f, "name") else f) for f in files
             ]
-        # Construct history entry
         new_entry = {
             "id": timestamp,
             "prompt": prompt,
@@ -387,7 +456,7 @@ with gr.Blocks(theme="soft", css="style.css") as demo:
             "chat_history": final_chat,
         }
-        # Persist only if allowed
         if PERSIST_HISTORY and (not PHI_MODE or (PHI_MODE and HISTORY_TTL_DAYS > 0)):
             updated_history: List[Dict[str, Any]] = (history_state_list or []) + [new_entry]
         else:
@@ -439,24 +508,30 @@ with gr.Blocks(theme="soft", css="style.css") as demo:
 {chat_md}
 """
-    # Wire up UI
     send_btn.click(
         run_analysis_wrapper,
-        inputs=[prompt_input, files_input, chat_history_output, assessment_history],
-        outputs=[chat_history_output, assessment_history, history_dropdown],
     )
     history_dropdown.change(
-        view_history, inputs=[history_dropdown, assessment_history], outputs=[history_display]
     )
     clear_btn.click(
-        lambda: (None, None, []),  # clear prompt, files, and chat
         outputs=[prompt_input, files_input, chat_history_output],
     )
     ping_btn.click(ping_cohere, outputs=[ping_out])
-    privacy_link.click(lambda: gr.update(visible=True), outputs=[privacy_modal])
-    close_privacy_btn.click(lambda: gr.update(visible=False), outputs=[privacy_modal])
-    terms_link.click(lambda: gr.update(visible=True), outputs=[terms_modal])
-    close_terms_btn.click(lambda: gr.update(visible=False), outputs=[terms_modal])
 if __name__ == "__main__":
     if not os.getenv("COHERE_API_KEY"):

+# app_phi_sleek.py
 #
+# Sleek UI + Voice-to-Text for the HIPAA-aware app.
+# IMPORTANT: All analysis/assessment logic is preserved exactly.
+# Changes are limited to the UI layout, CSS, and a client-side STT helper.
 from __future__ import annotations
 from llm_router import cohere_chat, _co_client, cohere_embed
+# ---------------------- helpers (unchanged logic) ----------------------
 def load_markdown_text(filepath: str) -> str:
     try:
         with open(filepath, "r", encoding="utf-8") as f:
 def _sanitize_text(s: str) -> str:
     """Remove control characters (except newline and tab) from ``s``.

     Values that are not ``str`` instances are returned unchanged, so callers
     may pass through ``None`` or other objects without a type check.
     """
     if not isinstance(s, str):
         return s
     # NOTE(review): `re2` is bound outside this view. The `--` set-difference
     # syntax presumably relies on the third-party `regex` module — confirm the
     # import and that set operations are enabled for this pattern.
     return re2.sub(r"[\p{C}--[\n\t]]+", "", s)
+# Very conservative PHI redaction (unchanged idea)
 PHI_PATTERNS = [
+    (re.compile(r"\b\d{3}-\d{2}-\d{4}\b"), "[REDACTED_SSN]"),
+    (re.compile(r"\b\d{9}\b"), "[REDACTED_MRN]"),
     (re.compile(r"\b\d{3}[-.\s]?\d{3}[-.\s]?\d{4}\b"), "[REDACTED_PHONE]"),
     (re.compile(r"[A-Za-z0-9._%+-]+@[A-Za-z0-9.-]+\.[A-Za-z]{2,}"), "[REDACTED_EMAIL]"),
+    (re.compile(r"\b(19|20)\d{2}-\d{2}-\d{2}\b"), "[REDACTED_DOB]"),
+    (re.compile(r"\b\d{2}/\d{2}/(19|20)\d{2}\b"), "[REDACTED_DOB]"),
+    (re.compile(r"\b\d{5}(-\d{4})?\b"), "[REDACTED_ZIP]"),
 ]
 def redact_phi(text: str) -> str:
     return t
 def safe_log(event_name: str, meta: dict | None = None) -> None:
     """Log an event on a best-effort basis without ever raising.

     Args:
         event_name: Name passed as the first argument to ``log_event``.
         meta: Optional metadata mapping; ``None`` is treated as an empty dict.
             Any ``"raw"`` entry is dropped before logging.
     """
     try:
         # Work on a shallow copy so the caller's dict is not modified by pop().
         meta = (meta or {}).copy()
         # Avoid logging raw PHI or payloads.
         meta.pop("raw", None)
         log_event(event_name, None, meta)
     except Exception:
         # Never raise from logging in a PHI context; failures are ignored.
         pass
 def _create_python_script(user_scenario: str, schema_context: str) -> str:
     EXPERT_ANALYTICAL_GUIDELINES = """
 --- EXPERT ANALYTICAL GUIDELINES ---
 def handle(user_msg: str, files: list, yield_update) -> str:
     try:
         safe_in, blocked_in, reason_in = safety_filter(user_msg, mode="input")
         if blocked_in:
             return refusal_reply(reason_in)
+        # Pre-compute a redacted prompt when PHI_MODE and REDACT_BEFORE_LLM are set; it is only used below when external PHI is not allowed
         redacted_in = safe_in
         if PHI_MODE and REDACT_BEFORE_LLM:
             redacted_in = redact_phi(safe_in)
         file_paths: List[str] = [getattr(f, "name", None) or f for f in (files or [])]
         if file_paths:
             dataframes, schema_parts = [], []
             for i, p in enumerate(file_paths):
                 if p.endswith(".csv"):
                 return "Please upload at least one CSV file."
             schema_context = "\n".join(schema_parts)
             prompt_for_code = redacted_in if (PHI_MODE and not ALLOW_EXTERNAL_PHI) else safe_in
             yield_update("""```
             yield_update("""```
 ✍️ Synthesizing final comprehensive report...
 ```""")
             writer_input = redacted_in if (PHI_MODE and not ALLOW_EXTERNAL_PHI) else safe_in
             final_report = _generate_final_report(writer_input, raw_data_output)
             return _sanitize_text(final_report)
         else:
             chat_input = redacted_in if (PHI_MODE and not ALLOW_EXTERNAL_PHI) else safe_in
             prompt = f"{GENERAL_CONVERSATION_PROMPT}\n\nUser: {chat_input}\nAssistant:"
             return _sanitize_text(cohere_chat(prompt) or "How can I help further?")
     except Exception as e:
         tb = traceback.format_exc()
         safe_log("app_error", {"err": str(e)})
         return "A critical error occurred. Please contact your administrator." if PHI_MODE else f"A critical error occurred: {e}"
 PRIVACY_POLICY_TEXT = load_markdown_text("privacy_policy.md")
 TERMS_OF_SERVICE_TEXT = load_markdown_text("terms_of_service.md")
+# ---------------------- Sleek UI Layer only ----------------------
+SLEEK_CSS = """
+/* Full-bleed, modern look */
+:root, body, #root, .gradio-container { height: 100%; }
+.gradio-container { padding: 0 !important; }
+.block { padding: 0 !important; }
+/* Header */
+.header {
+  padding: 20px 28px;
+  background: linear-gradient(135deg, #0e1726, #1d2a44 60%, #243a5e);
+  color: #fff;
+  display: flex; align-items: center; justify-content: space-between;
+  gap: 16px;
+}
+.header h1 { margin: 0; font-size: 22px; letter-spacing: 0.3px; font-weight: 600; }
+.header .badge { font-size: 12px; opacity: 0.9; background:#ffffff22; padding:6px 10px; border-radius: 999px; }
+/* Main layout */
+.main {
+  display: grid;
+  grid-template-columns: 420px 1fr;
+  gap: 16px;
+  padding: 16px;
+  height: calc(100vh - 72px);
+  box-sizing: border-box;
+}
+.left, .right {
+  background: #0b1020;
+  color: #e9edf3;
+  border-radius: 16px;
+  border: 1px solid #1c2642;
+}
+.left { padding: 16px; display: flex; flex-direction: column; gap: 12px; }
+.right { padding: 0; display: flex; flex-direction: column; }
+/* Panels */
+.panel-title { font-size: 14px; font-weight: 600; color: #aeb8cc; margin-bottom: 6px; }
+.helper { font-size: 12px; color: #97a3bb; margin-bottom: 8px; }
+/* Sticky actions */
+.actions {
+  display: flex; gap: 8px; align-items: center; justify-content: stretch;
+}
+.actions .gr-button { flex: 1; }
+/* Tabs full height */
+.right .tabs { height: 100%; display: flex; flex-direction: column; }
+.right .tabitem { flex: 1; display: flex; flex-direction: column; }
+#chatbot_container { flex: 1; }
+#chatbot_container .gr-chatbot { height: 100%; }
+/* Tiny separators */
+.hr { height: 1px; background: #16203b; margin: 10px 0; }
+/* Voice hint */
+.voice-hint { font-size: 12px; color:#9fb0cc; margin-top: 4px; }
+"""
+VOICE_STT_HTML = """
+<script>
+let __rs_rec = null;
+function rs_toggle_stt(elemId){
+  const SpeechRecognition = window.SpeechRecognition || window.webkitSpeechRecognition;
+  if (!SpeechRecognition){
+    alert("This browser does not support Speech Recognition. Try Chrome or Edge.");
+    return;
+  }
+  if (__rs_rec){ __rs_rec.stop(); __rs_rec = null; return; }
+  __rs_rec = new SpeechRecognition();
+  __rs_rec.lang = "en-US";
+  __rs_rec.interimResults = true;
+  __rs_rec.continuous = true;
+  const box = document.querySelector(`#${elemId} textarea`);
+  if (!box){ alert("Prompt box not found."); return; }
+  let base = box.value || "";
+  __rs_rec.onresult = (ev) => {
+    let t = "";
+    for (let i = ev.resultIndex; i < ev.results.length; i++){
+      t += ev.results[i][0].transcript;
+    }
+    box.value = (base + " " + t).trim();
+    box.dispatchEvent(new Event("input", { bubbles: true }));
+  };
+  __rs_rec.onend = () => { __rs_rec = null; };
+  __rs_rec.start();
+}
+</script>
+"""
+with gr.Blocks(theme=gr.themes.Soft(), css=SLEEK_CSS, fill_width=True) as demo:
+    # Header
+    with gr.Row(elem_classes=["header"]):
+        gr.Markdown("<h1>Universal AI Data Analyst</h1>")
+        pill = "PHI Mode ON · history off" if (PHI_MODE and not PERSIST_HISTORY) else \
+               "PHI Mode ON" if PHI_MODE else "PHI Mode OFF"
+        gr.Markdown(f"<span class='badge'>{pill}</span>")
+    # Main
+    with gr.Row(elem_classes=["main"]):
+        # Left panel
+        with gr.Column(elem_classes=["left"]):
+            gr.Markdown("<div class='panel-title'>New Assessment</div>")
+            gr.Markdown("<div class='helper'>Upload CSVs for analysis, or enter a prompt. Voice works in modern browsers.</div>")
             files_input = gr.Files(
                 label="Upload Data Files (.csv)",
                 file_count="multiple",
                 file_types=[".csv"],
             )
             prompt_input = gr.Textbox(
+                label="Prompt",
+                placeholder="Paste your scenario or question here...",
+                lines=12,
+                elem_id="prompt_box",
+                autofocus=True,
             )
+            with gr.Row(elem_classes=["actions"]):
+                send_btn = gr.Button("▶️ Run Analysis", variant="primary")
+                clear_btn = gr.Button("🧹 Clear")
+                voice_btn = gr.Button("🎙️ Voice")
+            gr.Markdown("<div class='voice-hint'>Click Voice to start/stop dictation into the prompt box.</div>")
+            ping_btn = gr.Button("🔌 Ping Cohere")
             ping_out = gr.Markdown()
+            gr.Markdown("<div class='hr'></div>")
+            if PHI_MODE:
+                gr.Markdown(
+                    "⚠️ **PHI Mode:** History persistence is disabled by default. Avoid unnecessary identifiers.",
+                )
+            with gr.Accordion("Privacy & Terms", open=False):
+                PRIVACY_POLICY_TEXT = load_markdown_text("privacy_policy.md")
+                TERMS_OF_SERVICE_TEXT = load_markdown_text("terms_of_service.md")
+                gr.Markdown(PRIVACY_POLICY_TEXT)
+                gr.Markdown("<div class='hr'></div>")
+                gr.Markdown(TERMS_OF_SERVICE_TEXT)
+        # Right panel
+        with gr.Column(elem_classes=["right"]):
+            with gr.Tabs(elem_classes=["tabs"]):
+                with gr.TabItem("Current Assessment", id=0, elem_classes=["tabitem"]):
+                    with gr.Column(elem_id="chatbot_container"):
+                        chat_history_output = gr.Chatbot(
+                            label="Analysis Output", type="messages"
+                        )
+                with gr.TabItem("Assessment History", id=1, elem_classes=["tabitem"]):
+                    gr.Markdown("### Review Past Assessments")
                     history_dropdown = gr.Dropdown(
                         label="Select an assessment to review", choices=[]
                     )
                     history_display = gr.Markdown(label="Selected Assessment Details")
+    # Inject STT helper
+    gr.HTML(VOICE_STT_HTML)
+    # --------- Logic (unchanged analysis flow) ----------
     def run_analysis_wrapper(prompt, files, chat_history_list, history_state_list):
         if not prompt:
             yield chat_history_list, history_state_list, gr.update()
             return
         chat_with_user_msg = _append_msg(chat_history_list, "user", prompt)
         def dummy_update(message: str):
             pass
         thinking_message = _append_msg(
             chat_with_user_msg,
             "assistant",
         )
         yield thinking_message, history_state_list, gr.update()
         ai_response_text = handle(prompt, files, dummy_update)
         final_chat = _append_msg(chat_with_user_msg, "assistant", ai_response_text)
         timestamp = datetime.now().strftime("%Y-%m-%d %H:%M:%S")
         file_names: List[str] = []
         if files:
             file_names = [
                 os.path.basename(f.name if hasattr(f, "name") else f) for f in files
             ]
         new_entry = {
             "id": timestamp,
             "prompt": prompt,
             "chat_history": final_chat,
         }
+        # Respect PHI history rules exactly as before
         if PERSIST_HISTORY and (not PHI_MODE or (PHI_MODE and HISTORY_TTL_DAYS > 0)):
             updated_history: List[Dict[str, Any]] = (history_state_list or []) + [new_entry]
         else:
 {chat_md}
 """
+    # Wire events
     send_btn.click(
         run_analysis_wrapper,
+        inputs=[prompt_input, files_input, chat_history_output, []],  # local state
+        outputs=[chat_history_output, [], history_dropdown],
     )
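+    # NOTE(review): the bare [] entries in inputs/outputs here are placeholders, not Gradio components; event wiring presumably fails or drops history with them in place.
+    # To keep the logic unchanged and persist history in memory between runs, replace each [] with one shared gr.State([]) (or your existing State variable) created inside this Blocks context.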
     history_dropdown.change(
+        view_history, inputs=[history_dropdown, []], outputs=[history_display]
     )
     clear_btn.click(
+        lambda: (None, None, []),
         outputs=[prompt_input, files_input, chat_history_output],
     )
     ping_btn.click(ping_cohere, outputs=[ping_out])
+    # Voice button (client-side only)
+    voice_btn.click(
+        None, [], [], js="rs_toggle_stt('prompt_box')"
+    )
 if __name__ == "__main__":
     if not os.getenv("COHERE_API_KEY"):